new-words

diff grep-sentences.pl @ 28:7db7bbf96fad

temporary file names
author Igor Chubin <igor@chub.in>
date Tue Jun 15 05:46:50 2010 +0300 (2010-06-15)
parents 416394a87d9f
children c631833fa2be
line diff
     1.1 --- a/grep-sentences.pl	Tue Apr 20 21:15:19 2010 +0400
     1.2 +++ b/grep-sentences.pl	Tue Jun 15 05:46:50 2010 +0300
     1.3 @@ -9,10 +9,14 @@
     1.4      $text=<PAGE>;
     1.5      $text =~ s@http://[a-zA-Z&_.:/0-9%?=,\#+()\[\]~-]*@@g;
     1.6      $text =~ s@\n@@g;
     1.7 -    $text =~ s@(Mr|Mrs)\.@\1POINT@g;
     1.8 +    $text =~ s@(Mr|Mrs|viz)\.@\1POINT@g;
     1.9 +    $text =~ s@e\.g\.@ePOINTgPOINT@g;
    1.10 +    $text =~ s@i\.e\.@iPOINTePOINT@g;
    1.11      @sentences=split /[.!?]/, $text;
    1.12      for (@sentences) {
    1.13 -         s@(Mr|Mrs)POINT@\1.@g;
    1.14 +        s@iPOINTePOINT@i\.e\.@g;
    1.15 +        s@ePOINTgPOINT@e\.g\.@g;
    1.16 +        s@(Mr|Mrs|viz)POINT@\1.@g;
    1.17          s/^\s*//;
    1.18          s/\s*$//;
    1.19          s/\[[0-9]+\]//g;