#!/usr/local/bin/perl

# Split the structural training corpus into two line-aligned text files.
#
# Every "SL: <text>" line of the input is written to heb-struct-ref.txt and
# also remembered in @engsents (used further down when extending the
# reference SGM file). Every "TL: <text>" line is written to heb-struct.txt.
# All other lines are ignored.
my $struct_path =
    "/afs/cs.cmu.edu/project/avenue-1/Avenue/Hebrew-MT/Data/RLTrainingData/Struct-EC/AlonStruct.rl";
my $heb_path = "heb-struct.txt";
my $eng_path = "heb-struct-ref.txt";

# Three-argument open with lexical handles: the mode can never be
# misinterpreted from the file name, and the handles are not package globals.
open(my $struct_fh, '<', $struct_path)
    or die "Cannot open $struct_path for reading: $!";
open(my $heb_fh, '>', $heb_path)
    or die "Cannot open $heb_path for writing: $!";
open(my $eng_fh, '>', $eng_path)
    or die "Cannot open $eng_path for writing: $!";

# SL sentences in input order; read again by the code that follows.
my @engsents;

while (my $line = <$struct_fh>) {
    # Strip any trailing CR/LF combination (handles DOS and Unix line ends).
    $line =~ s/[\r\n]*$//;
    if ($line =~ m/^SL: (.*)$/) {
        my $sent = $1;
        print {$eng_fh} "$sent\n";
        push @engsents, $sent;
    } elsif ($line =~ m/^TL: (.*)$/) {
        my $sent = $1;
        print {$heb_fh} "$sent\n";
    }
}

# Buffered write errors (e.g. disk full) only surface at close time, so the
# output handles are checked explicitly.
close($heb_fh) or die "Error closing $heb_path: $!";
close($eng_fh) or die "Error closing $eng_path: $!";
close($struct_fh);

# Build h1_struct.txt by concatenating the existing h1.txt test input with
# the heb-struct.txt file in the current directory.
# system() replaces the original void-context backticks so that the exit
# status can be checked; a failed cat (missing input, unwritable output)
# now aborts the script instead of being silently ignored.
my $cat_cmd =
    "cat /avenue/usr2/shared/Hebrew-MT/Tests/h1.txt heb-struct.txt > h1_struct.txt";
system($cat_cmd) == 0
    or die "Command failed (wait status $?): $cat_cmd\n";

# Copy the reference SGM file to e1_struct.ref.sgm, inserting one extra
# <seg> line per entry of @engsents immediately before every </DOC> line.
# The inserted segments continue numbering from the most recent
# "<seg id=N>" seen in the input.
my $ref_path    = "/avenue/usr2/shared/Hebrew-MT/Tests/e1.ref.sgm";
my $newref_path = "e1_struct.ref.sgm";

open(my $ref_fh, '<', $ref_path)
    or die "Cannot open $ref_path for reading: $!";
open(my $newref_fh, '>', $newref_path)
    or die "Cannot open $newref_path for writing: $!";

# Id of the last segment seen or emitted; starts at 0 so that the first
# inserted segment is numbered 1 when no <seg> has been read yet.
my $segcount = 0;

while (my $line = <$ref_fh>) {
    # Strip any trailing CR/LF combination.
    $line =~ s/[\r\n]*$//;
    if ($line =~ m/<\/DOC>/i) {
        # Emit the additional segments before the closing tag is copied.
        foreach my $engsent (@engsents) {
            $segcount++;
            print {$newref_fh} "<seg id=$segcount>$engsent</seg>\n";
        }
    }
    print {$newref_fh} "$line\n";
    # Track the highest-so-far id; note this only matches unquoted ids.
    if ($line =~ m/<seg id=(\d+)>/) { $segcount = $1; }
}

close($ref_fh);
# Check close on the output handle so buffered write failures are reported.
close($newref_fh) or die "Error closing $newref_path: $!";
