From 536c7bdbcc9d349dbe229bca6cc3b3898eb1c462 Mon Sep 17 00:00:00 2001 From: bojar Date: Tue, 26 Jan 2010 17:01:12 +0000 Subject: commiting a script by Loic Barrault to display moses search graph (-output-search-graph) using graphviz dot git-svn-id: https://mosesdecoder.svn.sourceforge.net/svnroot/mosesdecoder/trunk@2672 1f5c12ca-751b-0410-a591-d2e778427230 --- scripts/analysis/sg2dot.pl | 101 +++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 101 insertions(+) create mode 100755 scripts/analysis/sg2dot.pl (limited to 'scripts/analysis') diff --git a/scripts/analysis/sg2dot.pl b/scripts/analysis/sg2dot.pl new file mode 100755 index 000000000..adf84dcc2 --- /dev/null +++ b/scripts/analysis/sg2dot.pl @@ -0,0 +1,101 @@ +#!/usr/bin/perl -w +# +# Author : Loic BARRAULT +# Script to convert MOSES searchgraph to DOT format +# + +use strict; +use File::Path; +use File::Basename; +use File::Copy; + +if ($#ARGV+1 != 1) +{ + print "\n\n INPUT:"; + print "\n 1) Search graph file "; + print "\n"; + exit(-1); +} + +my $searchgraph = $ARGV[0]; +print STDERR "searchgraph = $searchgraph\n"; + +my %stacks = (); +$stacks{0}{0} = 0; + +print STDOUT "digraph searchgraph\n{\nrankdir=LR\n"; + + +my($line, $cpt, $from, $to, $label, $recombined, $transition, $o, $stack, $state); +$cpt = 0; + +open(LISTFD, "<$searchgraph") or die "Cannot read input file $searchgraph, Erreur: $!\n"; +$line=; #skip first line ... + +while(($line=) ) +{ + $from = ""; + $to = ""; + $label = ""; + $recombined = ""; + chomp($line); + #print STDERR "$line\n"; + + #Three kinds of lines in searchgraph + #0 hyp=0 stack=0 forward=1 fscore=-205.192 + #0 hyp=5 stack=1 back=0 score=-0.53862 transition=-0.53862 forward=181 fscore=-205.36 covered=0-0 out=I am , pC=-0.401291, c=-0.98555 + #256 hyp=6566 stack=2 back=23 score=-2.15644 transition=-0.921959 recombined=6302 forward=15519 fscore=-112.807 covered=2-2 out=countries , , pC=-0.640574, c=-1.07215 + + if($line =~ /hyp=(\d+).+stack=(\d+).+back=(\d+).+transition=([^ ]*).+recombined=(\d+).+out=(.*), pC/) + { + #print STDERR "hyp=$1, stack=$2, from=$3, transition=$4, recombined=$5, out=$6\n"; + $to = $1; + $stack = $2; + $from = $3; + $transition=$4; + $recombined = $5; + $o = $6; + $label = "[color=blue label="; + + $to = $recombined; + $stacks{$stack}{$recombined} = $recombined; + #$stack++; + #$stacks{$stack}{$recombined} = $recombined; + } + elsif($line =~ /hyp=(\d+).+stack=(\d+).+back=(\d+).+transition=([^ ]*).+out=(.*), pC/) + { + #print STDERR "hyp=$1, stack=$2, from=$3, transition=$4, out=$5\n"; + $to = $1; + $stack = $2; + $from = $3; + $transition=$4; + $o = $5; + $label = "[label="; + $stacks{$stack}{$to} = $to; + #$stack++; + #$stacks{$stack}{$to} = $to; + } + else{ print STDERR "Bad file format ..."; exit(); } + + $o =~ s/\"/\\"/g ; + #print STDERR "out = $o after regexp\n"; + $label .= "\"$o p=$transition\"]\n"; + #$label .= " p=$transition\"]\n"; + + print STDOUT "$from -> $to $label"; + + $cpt++; +} + + +foreach $stack (sort (keys(%stacks))) +{ + print STDOUT "{ rank=same; "; + foreach $state (sort keys %{ $stacks{$stack} } ) + { + print STDOUT "$stacks{$stack}{$state} "; + } + print STDOUT "}\n"; +} + +print STDOUT "\n}\n"; -- cgit v1.2.3