parse.pl 417 B

123456789101112131415161718192021222324
  #!/usr/bin/perl
  use strict;
  use warnings;

  # Scratch pad for parsing webpages for lists of different words/names,
  # for the seed file.
  #
  # Usage: parse.pl [FILE]
  #
  # Reads FILE (saints.html when no argument is given) and prints, one per
  # line, the value of every title="..." attribute that is immediately
  # followed by the closing '>' of its tag. Values containing "ctx" are
  # skipped. Dies with a message if FILE cannot be opened.

  my $file = @ARGV ? $ARGV[0] : 'saints.html';

  # Read the file directly rather than shelling out to `cat`, so a missing or
  # unreadable file is reported instead of silently producing no output.
  open my $fh, '<', $file or die "Cannot open $file: $!\n";

  while ( my $line = <$fh> ) {
      chomp $line;

      # [^"]* stops at the attribute's own closing quote; a greedy .* would
      # run on to the last "> on the line and swallow the markup between two
      # tags. /g picks up every matching title when a line holds several.
      while ( $line =~ m/title="([^"]*)">/g ) {
          my $title = $1;

          next if $title =~ m/ctx/;
          print "$title\n";

          # Disabled alternative: print only the leading run of letters,
          # digits, spaces, commas and hyphens of the title.
          #if ( $title =~ m/^([a-zA-Z0-9\ ,-]{1,})/ ) {
          #    print "$1\n";
          #}
      }
  }

  close $fh;