parse.pl 368 B

123456789101112131415161718
  #!/usr/bin/perl
  use strict;
  use warnings;

  # Scratch pad for parsing webpages for lists
  # of different words/names, for the seed file.
  #
  # Usage: parse.pl [FILE]
  #   FILE defaults to saints.html. For every input line that contains a
  #   <td data-sort-value=...> cell followed by a link carrying a title="..."
  #   attribute, one line is printed to STDOUT: the leading part of that
  #   title made up of ASCII letters, digits, spaces, commas and hyphens.

  # Extract the name from one line of HTML.
  #
  # Parameters:
  #   $line - a single line of HTML text (without its trailing newline).
  # Returns:
  #   The leading run of allowed characters of the link title, unmodified
  #   (so a title such as "Agnes (saint)" yields "Agnes " including the
  #   trailing space), or undef when the line has no matching cell/link or
  #   the title does not start with an allowed character.
  sub extract_name {
      my ($line) = @_;

      # Non-greedy gaps plus a negated class keep the match on the first
      # title="..." after the cell, instead of running on to the last
      # title and the last quote on the line.
      my ($title)
          = $line =~ m/<td data-sort-value=.*?<a href=.*?title="([^"]*)"/
          or return;

      # The range is A-Z on purpose: A-z would also admit the punctuation
      # that sits between 'Z' and 'a' in ASCII ([ \ ] ^ _ and backtick).
      my ($name) = $title =~ m/\A([a-zA-Z0-9 ,-]+)/
          or return;

      return $name;
  }

  # Read the HTML file line by line and print every extracted name.
  #
  # Parameters:
  #   $path - file to read; optional, defaults to 'saints.html'.
  # Dies with a message naming the file if it cannot be opened or closed.
  sub main {
      my ($path) = @_;
      $path = 'saints.html' unless defined $path;

      # Read the file directly rather than shelling out to `cat`, so a
      # missing or unreadable file is reported instead of silently
      # producing no output.
      open my $fh, '<', $path or die "Cannot open $path: $!\n";
      while ( my $line = <$fh> ) {
          chomp $line;
          my $name = extract_name($line);
          print "$name\n" if defined $name;
      }
      close $fh or die "Cannot close $path: $!\n";

      return;
  }

  # Run only when executed as a script, so the file can also be loaded
  # (e.g. by a test) without touching the filesystem.
  main(@ARGV) unless caller;