# File-viewer header residue: 26 lines, 655 B, Perl
# Build a corpus list from a transcription file.
#
# Arguments (positional):
#   transcription_file  text file read line by line
#   path_prefix         prepended to every audio file name; a trailing "/"
#                       is added when it is missing
#   output_file         corpus list; entries are APPENDED, never truncated
#
# Every input line is split into its first token and the text after the
# following whitespace:
#   * token ends in ".info" -> the marker line "new_speaker" is written
#   * anything else         -> "<path_prefix><token>.ulaw<TAB><text>"
use strict;
use warnings;

# Show the help text only when arguments are missing, and stop instead of
# carrying on with undefined file names.
if (@ARGV < 3) {
    print STDERR "Usage: perl $0 transcription_file path_prefix output_file\n";
    print STDERR "Example: perl $0 /direct/datadigest/en_sg/ives/000.txt /direct/datadigest/en_sg/ives/calls/ ~/ives.list\n";
    exit 1;
}

my ($tran_path, $path_prefix, $corpus_path) = @ARGV;

# Three-argument open: the mode can no longer be altered by odd characters
# in a file name.
open my $tran_fh, '<', $tran_path
    or die "Cannot open transcription file $tran_path for read: $!\n";
open my $corpus_fh, '>>', $corpus_path
    or die "Cannot open corpus file $corpus_path for write: $!\n";

# Make sure the prefix ends with exactly the separator the output expects.
my $prefix = $path_prefix =~ m|/$| ? $path_prefix : "$path_prefix/";

while (my $line = <$tran_fh>) {
    chomp $line;

    # Blank lines carry no entry.
    next if $line !~ /\S/;

    # Without this check a non-matching line would reuse the captures of
    # the previous successful match and emit a duplicate, wrong entry.
    unless ($line =~ m|([^ ]+)\s+(.*)|) {
        warn "Skipping malformed line $. of $tran_path: $line\n";
        next;
    }
    my ($name, $text) = ($1, $2);

    if ($name =~ m|\.info$|) {
        print {$corpus_fh} "new_speaker\n";
        next;
    }

    print {$corpus_fh} "$prefix$name.ulaw\t$text\n";
}

close $tran_fh;

# Buffered write errors (e.g. disk full) only surface at close time.
close $corpus_fh
    or die "Cannot close corpus file $corpus_path: $!\n";