remove %nn (and \nn) escape strings from the dup checks of announces and spots
[spider.git] / perl / AnnTalk.pm
index a74c0e250495bfdd7c1ae0603a285ddbeb8f45ed..5a387d219ff30946138c720d92ce36ac058c68b0 100644 (file)
@@ -44,6 +44,7 @@ sub dup
 
        chomp $text;
        unpad($text);
+       $text =~ s/[\\\%]\d+//g;
        $text =~ s/[^a-zA-Z0-9]//g;
        $text = substr($text, 0, $duplth) if length $text > $duplth; 
        my $dupkey = "A$to|\L$text";