From: Fredrik Tolf
Date: Sat, 30 Nov 2013 04:06:37 +0000 (+0100)
Subject: ANN: Updated HTML patterns.
X-Git-Url: http://git.dolda2000.com/gitweb/?a=commitdiff_plain;ds=sidebyside;h=a8823c2f505b1ae3d86cf3610a80d538a28859ed;p=utils.git

ANN: Updated HTML patterns.
---

diff --git a/ANN.pm b/ANN.pm
index f10e869..6dd02e9 100644
--- a/ANN.pm
+++ b/ANN.pm
@@ -58,7 +58,7 @@ sub getlist
 
     # The only way to recognize entries that seems sure is to look
     # after the "HOVERLINE" class.
-    while($html =~ /]*>(]*>)?(\.*\<\/small\>)?\s*([^<]+)<\//ig) {
+    while($html =~ /]*>(]*>)?([^<]*<\/small>)?\s*([^<]+)<\//ig) {
         if((substr "" . lc $4 , 0, length $name) eq lc $name) {
             push @ret, $4;
         }
@@ -83,7 +83,7 @@ sub getid
 
     # The only way to recognize entries that seems sure is to look
     # after the "HOVERLINE" class.
-    while($html =~ /]*>(]*>)?(\.*\<\/small\>)?\s*([^<]+)<\//ig) {
+    while($html =~ /]*>(]*>)?([^<]*<\/small>)?\s*([^<]+)<\//ig) {
         if((substr "" . lc $4 , 0, length $name) eq lc $name) {
             return ($1 =~ /id=(\d+)$/)[0];
         }