".$word[$from]; } else { $color = coverage_color($coverage[$from][$to]); $phrase = ""; $highlightwords = ""; $lowlightwords = ""; for($j=$from;$j<=$to;$j++) { if ($j>$from) { $phrase .= " "; } $phrase .= $word[$j]; $highlightwords .= " document.getElementById('inputword-$i-$j').style.backgroundColor='#ffff80';"; $lowlightwords .= " document.getElementById('inputword-$i-$j').style.backgroundColor='".coverage_color($coverage[$j][$j])."';"; } print "

"; } print "

"; $from += $size-1; } else { print "

"; } } print "\n"; } # display input words print "

"; for($j=$sep_start;$j<$sep_end;$j++) { if ($segmentation && array_key_exists($j,$segmentation["input_start"])) { $id = $segmentation["input_start"][$j]; print ""; } if (array_key_exists($j,$coverage)) { $color = coverage_color($coverage[$j][$j]); $cc = $coverage[$j][$j]["corpus_count"]; $tc = $coverage[$j][$j]["ttable_count"]; $te = $coverage[$j][$j]["ttable_entropy"]; } else { # unknown words $color = '#ffffff'; $cc = 0; $tc = 0; $te = 0; } print ""; if ($word[$j] == $filter) { print "".$word[$j].""; } else { print $word[$j]; } print ""; if ($segmentation && array_key_exists($j,$segmentation["input_end"])) { print ""; } print " "; } print "

\n"; print "\n"; $sep_start = $sep_end; } } print "
"; } // color-coded coverage stats (corpus count, ttable count, entropy) function coverage_color($phrase) { $corpus_count = 255 - 10 * log(1 + $phrase["corpus_count"]); if ($corpus_count < 128) { $corpus_count = 128; } $cc_color = dechex($corpus_count / 16) . dechex($corpus_count % 16); $ttable_count = 255 - 20 * log(1 + $phrase["ttable_count"]); if ($ttable_count < 128) { $ttable_count = 128; } $tc_color = dechex($ttable_count / 16) . dechex($ttable_count % 16); $ttable_entropy = 255 - 32 * $phrase["ttable_entropy"]; if ($ttable_entropy < 128) { $ttable_entropy = 128; } $te_color = dechex($ttable_entropy / 16) . dechex($ttable_entropy % 16); // $color = "#". $cc_color . $te_color . $tc_color; # reddish browns with some green // $color = "#". $cc_color . $tc_color . $te_color; # reddish brown with some blueish purple $color = "#". $te_color . $cc_color . $tc_color; # pale green towards red // $color = "#". $te_color . $tc_color . $cc_color; # pale purple towards red // $color = "#". $tc_color . $te_color . $cc_color; // # blue-grey towards green // $color = "#". $tc_color . $cc_color . $te_color; // # green-grey towards blue return $color; } // annotate an output sentence function output_annotation($sentence,$system,$segmentation) { #$color = array("#FFC0C0","#FFC0FF","#C0C0FF","#C0FFFF","#C0FFC0"); $color = array("#c0c0c0","#e0e0ff","#b0b0ff","#8080ff","#4040ff"); $word = split(" ",$system); for($j=0;$j"; } print "$surface"; if ($segmentation && array_key_exists($j,$segmentation["output_end"])) { print ""; } print " "; } } function annotation_hierarchical($sentence,$segmentation,$segmentation_out,$node) { print "\n"; } function sentence_annotation_hierarchical($info,$sentence,$sequence,$segmentation,$in_out) { $In_Out = $in_out == "out" ? "Out" : "In"; #list($words,$coverage_vector) = split("\t",$input); $coverage = coverage($sequence); $word = preg_split("/\s/",$sequence); $color = array("#ffe0e0","#f0e0ff","#e0e0ff","#c0c0ff","#a0a0ff"); #$color = array("#FFC0C0","#FFC0FF","#C0C0FF","#C0FFFF","#C0FFC0"); #$color = array("#c0c0c0","#e0e0ff","#b0b0ff","#8080ff","#4040ff"); print "

\n"; print "

[$info]

"; $word_count = 0; for($span=0;$span"; for($depth=0;$depth"; } $words = $segmentation[$span]["words"]; # non terminal if (array_key_exists("nt",$segmentation[$span]) && $segmentation[$span]["nt"] != "") { print $segmentation[$span]["nt"].": "; } # no nonterminal and no words => invisible bar else if($words == "") { print "|"; } $span_word = array(); if ($words != "") { $span_word = split(" ",$words); } for($w=0;$w 0) { print " "; } if ($in_out == "in") { #print ""; print $word[$word_count]; #print ""; } else { list($surface,$correct) = split("\|", $word[$word_count]); print "$surface"; } $word_count++; } for($depth=0;$depth"; } print ""; # enclosing } print "

\n"; } function biconcor($query) { global $set,$id,$dir; $sentence = $_GET['sentence']; $biconcor = get_biconcor_version($dir,$set,$id); print "

"; $cmd = "./biconcor -l $dir/model/biconcor.$biconcor -Q ".base64_encode($query)." 2>/dev/null"; #print $cmd."

"; system($cmd); # print "

done."; print "

"; }

Count	Precision		Delete		Length
$word	%.1f%s	%.1f/%d	%.1f%s	%d/%d	%.3f

Count	Precision		Delete		Length
$i	%.1f%s	%.1f/%d	%.1f%s	%d/%d	%.3f	Ⓘ

(loading...)	(loading...)	(loading...)	(loading...)
(loading...)	(loading...)	(loading...)	(loading...)

$type	1-gram	2-gram	3-gram	4-gram
correct	%d	%d	%d	%d
	%.1f%s	%.1f%s	%.1f%s	%.1f%s
wrong	%d	%d	%d	%d

$order-gram	ok	x	ratio
".$line["ngram"]."	".$line["correct"]."	".($line["total"]-$line["correct"])."	%.3f

By log₂-count in the training corpus

By factor ".factor_name("input",$factor_id)."

For each factor, by log₂-count in the corpus

	model	corpus
$range	%d (%.1f%s)

	1	2	3	4+
$in".($in==4?"+":"")." to	%d (%.1f%s)

By log2-count in the training corpus

By factor ".factor_name("input",$factor_id)."

For each factor, by log2-count in the corpus

By log₂-count in the training corpus

For each factor, by log₂-count in the corpus