X-Git-Url: http://git.shadowcat.co.uk/gitweb/gitweb.cgi?a=blobdiff_plain;f=t%2Fgraph.t;h=c65f516833a839c71f02da648f59c74d865da72c;hb=e4b0f4643062d1654a512ab882b9e0798d40248e;hp=de42d5028581c39763e88c3a8dacdbd94d20ba97;hpb=3265b0ce233468b116be19a3bfcc80a0fa3e3af9;p=scpubgit%2Fstemmatology.git diff --git a/t/graph.t b/t/graph.t index de42d50..c65f516 100644 --- a/t/graph.t +++ b/t/graph.t @@ -1,7 +1,7 @@ #!/usr/bin/perl use strict; use warnings; -use Test::More; +use Test::More skip_all => "lemmatization disabled for now"; use lib 'lib'; use Text::Tradition; use XML::LibXML; @@ -9,10 +9,11 @@ use XML::LibXML::XPathContext; my $datafile = 't/data/Collatex-16.xml'; -open( GRAPHFILE, $datafile ) or die "Could not open $datafile"; -my @lines = ; -close GRAPHFILE; -my $tradition = Text::Tradition->new( 'GraphML' => join( '', @lines ) ); +my $tradition = Text::Tradition->new( + 'name' => 'inline', + 'input' => 'CollateX', + 'file' => $datafile, + ); my $collation = $tradition->collation; # Test the svg creation @@ -32,8 +33,9 @@ my @svg_edges = $svg_xpc->findnodes( '//svg:g[@class="edge"]' ); is( scalar @svg_edges, 32, "Correct number of edges in the graph" ); # Test for the correct common nodes -my @expected_nodes = map { [ $_, 1 ] } qw/ #START# n1 n5 n6 n7 n12 - n16 n19 n20 n27 /; +my @common_nodes = ( '#START#' ); +push( @common_nodes, qw/ n1 n5 n6 n7 n12 n16 n19 n20 n27 / ); +my @expected_nodes = map { [ $_, 1 ] } @common_nodes; foreach my $idx ( qw/2 3 4 8 10 11 13 16 17 18/ ) { splice( @expected_nodes, $idx, 0, [ "node_null", undef ] ); } @@ -61,7 +63,7 @@ sub make_text { my @words; foreach my $n ( @_ ) { if( $n->[1] ) { - push( @words, $collation->reading( $n->[0] )->label ); + push( @words, $collation->reading( $n->[0] )->text ); } elsif ( !defined $n->[1] ) { push( @words, '...' ); } @@ -69,6 +71,11 @@ sub make_text { return join( ' ', @words ); } +# Test that the common nodes are marked common +foreach my $cn ( @common_nodes ) { + ok( $collation->reading( $cn )->is_common, "Node $cn is marked common" ); +} + # Test the manuscript paths my $wit_a = '# when april with his showers sweet with fruit the drought of march has pierced unto the root #'; my $wit_b = '# when showers sweet with april fruit the march of drought has pierced to the root #'; @@ -113,7 +120,6 @@ $string = '# when ... ... ... showers sweet with ... fruit ... ... of ... has pi is( make_text( @active_nodes ), $string, "Got the right text" ); # Test the toggling effects of transposition - @off = $collation->toggle_reading( 'n14' ); # Add the turned on node $expected_nodes[ 11 ] = [ "n14", 1 ]; @@ -177,4 +183,121 @@ subtest 'Turned on another node after singleton switchoff' => \&compare_active; $string = '# when ... ... showers sweet with ... fruit ... march of ... has pierced unto ... ... #'; is( make_text( @active_nodes ), $string, "Got the right text" ); +# Now start testing some position identifiers +# 2. 'april with his' have no colocated +# 3. 'april' 2 has no colocated +# 4. 'teh' and 'the' +# 5. 'drought' & 'march' +# 6. 'march' & 'drought' +# 7. 'unto' 'the' 'root'... +# 'unto can match 'to' or 'teh' +# 'the' can match 'teh' or 'rood' +# 'root' can mach 'rood' + +foreach my $cn ( @common_nodes ) { + my $cnr = $collation->reading( $cn ); + is( scalar( $collation->same_position_as( $cnr ) ), 0, "Node $cn has no colocations" ); +} + +my %expected_colocations = ( + 'n2' => [], # april + 'n3' => [], # with + 'n4' => [], # his + 'n11' => [], # april + 'n8' => [ 'n13' ], # teh -> the + 'n13' => [ 'n8' ], # the -> teh + 'n14' => [ 'n15' ], # drought -> march + 'n18' => [ 'n17' ], # drought -> march + 'n17' => [ 'n18' ], # march -> drought + 'n15' => [ 'n14' ], # march -> drought + 'n21' => [ 'n22', 'n9' ], # unto -> to, teh + 'n22' => [ 'n21', 'n9' ], # to -> unto, teh + 'n9' => [ 'n21', 'n22', 'n23' ], # teh -> unto, to, the + 'n23' => [ 'n25', 'n9' ], # the -> teh, rood + 'n25' => [ 'n23', 'n26' ], # rood -> the, root + 'n26' => [ 'n25' ], # root -> rood +); + +foreach my $n ( keys %expected_colocations ) { + my $nr = $collation->reading( $n ); + my @colocated = sort( map { $_->name } $collation->same_position_as( $nr ) ); + is_deeply( \@colocated, $expected_colocations{$n}, "Colocated nodes for $n correct" ); +} + +# Test strict colocations +$expected_colocations{'n9'} = []; +$expected_colocations{'n21'} = ['n22']; +$expected_colocations{'n22'} = ['n21']; +$expected_colocations{'n23'} = []; +$expected_colocations{'n25'} = []; +$expected_colocations{'n26'} = []; + +foreach my $n ( keys %expected_colocations ) { + my $nr = $collation->reading( $n ); + my @colocated = sort( map { $_->name } $collation->same_position_as( $nr, 1 ) ); + is_deeply( \@colocated, $expected_colocations{$n}, "Strictly colocated nodes for $n correct" ); +} + +# Test turning on, then off, an annoyingly overlapping node + +@off = $collation->toggle_reading( 'n9' ); +# Remove the old toggle-off +splice( @expected_nodes, 16, 1 ); +splice( @expected_nodes, 17, 0, [ "n9", 1 ] ); +@active_nodes = $collation->lemma_readings( @off ); +subtest 'Turned on a node without fixed position' => \&compare_active; +$string = '# when ... ... showers sweet with ... fruit ... march of ... has pierced unto teh ... ... #'; +is( make_text( @active_nodes ), $string, "Got the right text" ); + +@off = $collation->toggle_reading( 'n23' ); +splice( @expected_nodes, 18, 1, [ "n23", 1 ] ); +@active_nodes = $collation->lemma_readings( @off ); +subtest 'Turned on a node colocated to one without fixed position' => \&compare_active; +$string = '# when ... ... showers sweet with ... fruit ... march of ... has pierced unto teh the ... #'; +is( make_text( @active_nodes ), $string, "Got the right text" ); + +@off = $collation->toggle_reading( 'n9' ); +splice( @expected_nodes, 17, 1, [ "n9", 0 ] ); +@active_nodes = $collation->lemma_readings( @off ); +subtest 'Turned on a node colocated to one without fixed position' => \&compare_active; +$string = '# when ... ... showers sweet with ... fruit ... march of ... has pierced unto the ... #'; +is( make_text( @active_nodes ), $string, "Got the right text" ); + +### Now test relationship madness. + +my( $result, @relations ) = $collation->add_relationship( 'n25', 'n23', {'type' => 'lexical'} ); # rood -> the +ok( $result, "Added relationship between nodes" ); +is( scalar @relations, 1, "Returned only the one collapse" ); +is_deeply( $relations[0], [ 'n25', 'n23' ], "Returned the correct collapse" ); +is( $collation->reading( 'n25' )->position->reference, '9,3', "Harmonized position for n25 correct" ); +is( $collation->reading( 'n23' )->position->reference, '9,3', "Harmonized position for n23 correct" ); +is( $collation->reading( 'n9' )->position->reference, '9,2', "Adjusted position for n9 correct" ); + +# Do some yucky hardcoded cleanup to undo this relationship. +$collation->reading('n25')->position->max( 4 ); +$collation->reading('n9')->position->max( 3 ); +$collation->graph->del_edge( $collation->reading('n25')->edges_to( $collation->reading('n23')) ); + +( $result, @relations ) = $collation->add_relationship( 'n26', 'n25', {'type' => 'spelling'} ); # root -> rood +ok( $result, "Added relationship between nodes" ); +is( scalar @relations, 1, "Returned only the one collapse" ); +is_deeply( $relations[0], [ 'n26', 'n25' ], "Returned the correct collapse" ); +is( $collation->reading( 'n26' )->position->reference, '9,4', "Harmonized position for n26 correct" ); +is( $collation->reading( 'n25' )->position->reference, '9,4', "Harmonized position for n25 correct" ); +is( $collation->reading( 'n9' )->position->reference, '9,2-3', "Adjusted position for n9 correct" ); + +( $result, @relations ) = $collation->add_relationship( 'n15', 'n9', {'type' => 'lexical'} ); # bogus march -> teh +ok( !$result, "Refused to add skewed relationship: " . $relations[0] ); + +( $result, @relations ) = $collation->add_relationship( 'n25', 'n26', {'type' => 'spelling'} ); # root -> rood +ok( !$result, "Refused to add dupe relationship: " . $relations[0] ); + +( $result, @relations ) = $collation->add_relationship( 'n8', 'n13', {'type' => 'spelling', 'global' => 1 } ); # teh -> the +ok( $result, "Added global relationship between nodes" ); +is( scalar @relations, 2, "Returned two relationship creations" ); +is_deeply( $relations[0], [ 'n8', 'n13' ], "Returned the original collapse" ); +is_deeply( $relations[1], [ 'n9', 'n23' ], "Returned the other collapse" ); +is( $collation->reading( 'n8' )->position->reference, '6,2', "Harmonized position for n8 correct" ); +is( $collation->reading( 'n9' )->position->reference, '9,3', "Harmonized position for n9 correct" ); + done_testing();