voxforge.org
VoxForge Dev
Show
Ignore:
Timestamp:
05/27/08 12:38:46 (6 months ago)
Author:
kmaclean
Message:

AudioSegmentation scripts -snapshot

Files:

Legend:

Unmodified
Added
Removed
Modified
Copied
Moved
  • Trunk/Scripts/Audio_scripts/AudioSegmentation/AudioBook/Text.pm

    r2594 r2595  
       46    46                $line =~ s/\.\"//g; # period followed by double quote
       47    47                $line =~ s/\,\"//g; # comma followed by double quote
             48                $line =~ s/\;\"//g; # semi-colon followed by double quote
       48    49                $line =~ s/\?\"//g; # question mark followed by double quote
       49    50                $line =~ s/\!\"//g; # exclamation mark followed by double quote
       50    51                $line =~ s/\.\'//g; # period followed by single quote
       51    52                $line =~ s/\,\'//g; # comma followed by single quote
             53                $line =~ s/\;\'//g; # semi-colon followed by single quote
       52    54                $line =~ s/\?\'//g; # question mark followed by single quote
       53    55                $line =~ s/\!\'//g; # exclamation mark followed by single quote
     
       96    98                $line =~ s/\.\"//g; # period followed by double quote
       97    99                $line =~ s/\,\"//g; # comma followed by double quote
            100                $line =~ s/\;\"//g; # semi-colon followed by double quote
       98   101                $line =~ s/\?\"//g; # question mark followed by double quote
       99   102                $line =~ s/\!\"//g; # exclamation mark followed by double quote
      100   103                $line =~ s/\.\'//g; # period followed by single quote
      101   104                $line =~ s/\,\'//g; # comma followed by single quote
            105                $line =~ s/\;\'//g; # semi-colon followed by single quote
      102   106                $line =~ s/\?\'//g; # question mark followed by single quote
      103   107                $line =~ s/\!\'//g; # exclamation mark followed by single quote
     
      198   202                $$word =~ s/^\'+//;
      199   203                push (@$quotelog, "changed:$tempword to:$$word\n");
            204        } elsif ($$word  =~ /\'+$/) { # one or more single quote(s) from end of word
            205                my $tempword = $$word;
            206                $$word =~ s/\'+$//;
            207                push (@$quotelog, "changed:$tempword to:$$word\n");
      200   208        } else {
      201                       # don;t remove single quote(s) from end of word - further manual processing might be required
            209                # don;t remove single quote(s) from body of word - further manual processing might be required
      202   210                #$word =~ s/\'+$//; # single quote(s) from end of word ... but some contractions use a single quote at the end of the word
      203   211                push (@$quotelog, "$$word\n") if $log_single_quotes;