# Copyright (c) 2009 by Grzegorz Kondrak
# purpose: recover lexical stress from the encoded file eow_loe
# usage: cut -d'\' -f2 LDC96L14/english/eow/eow.cd | paste - eow_loe | perl <this-script>.p
#
# Input:  one record per line, "<word>\t<code>", where <code> holds one
#         character per letter of the word (after diacritics are removed):
#         '1' marks primary stress, '2' secondary stress; any other
#         character adds no mark.
# Output: one line per record: the word with a stress mark inserted in
#         front of every stressed letter, or an empty line when the record
#         has no code.

use strict;
use warnings;

my $s1 = "'";     # primary stress
my $s2 = "\"";    # secondary stress

# Return $symb with diacritics stripped and stress marks inserted according
# to $code. Returns the empty string when $code is undefined or empty.
sub recover_stress {
    my ($symb, $code) = @_;

    # Test for presence, not truth: the code "0" (a one-letter unstressed
    # word) is a valid code and must not be mistaken for a missing one.
    return '' unless defined $code && length $code;

    $symb =~ s/[`#^",~]//g;    # diacritics removed

    my @letters = split //, $symb;
    my @marks   = split //, $code;

    my $out = '';
    for my $i (0 .. $#letters) {
        # The code may be shorter than the word; treat missing positions
        # as unstressed instead of comparing undef.
        my $mark = defined $marks[$i] ? $marks[$i] : '';
        $out .= $s1 if $mark eq '1';
        $out .= $s2 if $mark eq '2';
        $out .= $letters[$i];
    }
    return $out;
}

# Read records from the files named on the command line (or STDIN) and print
# the stress-marked form of each word. Dies on a record with no word field.
sub main {
    while (my $line = <>) {
        chomp $line;
        my ($symb, $code) = split /\t/, $line;
        die "input line $.: missing word field\n"
            unless defined $symb && length $symb;
        print recover_stress($symb, $code), "\n";
    }
    return;
}

# Run the filter only when executed as a script, so that the helper can be
# loaded (e.g. by a test) without consuming STDIN.
main() unless caller;

1;