save Ternary data type to graphml too

[scpubgit/stemmatology.git] / base / lib / Text / Tradition / Collation.pm
diff --git a/base/lib/Text/Tradition/Collation.pm b/base/lib/Text/Tradition/Collation.pm

index bf9832a..1573eb1 100644 (file)
--- a/base/lib/Text/Tradition/Collation.pm
+++ b/base/lib/Text/Tradition/Collation.pm
@@ -159,15 +159,6 @@ See L<Text::Tradition::Collation::Reading> for the available arguments.
 Removes the given reading from the collation, implicitly removing its
 paths and relationships.
 
-=head2 merge_readings( $main, $second, $concatenate, $with_str )
-
-Merges the $second reading into the $main one. If $concatenate is true, then
-the merged node will carry the text of both readings, concatenated with either
-$with_str (if specified) or a sensible default (the empty string if the
-appropriate 'join_*' flag is set on either reading, or else $self->wordsep.)
-
-The first two arguments may be either readings or reading IDs.
-
 =head2 has_reading( $id )
 
 Predicate to see whether a given reading ID is in the graph.
@@ -233,6 +224,21 @@ sub BUILD {
        { 'collation' => $self, 'is_end' => 1, 'init' => 1 } ) );
 }
 
+sub register_relationship_type {
+       my $self = shift;
+       my %args = @_ == 1 ? %{$_[0]} : @_;
+       if( $self->relations->has_type( $args{name} ) ) {
+               throw( 'Relationship type ' . $args{name} . ' already registered' );
+       }
+       $self->relations->add_type( %args );
+}
+
+sub get_relationship_type {
+       my( $self, $name ) = @_;
+               return $self->relations->has_type( $name ) 
+                       ? $self->relations->type( $name ) : undef;
+}
+
 ### Reading construct/destruct functions
 
 sub add_reading {
@@ -243,7 +249,8 @@ sub add_reading {
                        # If we are initializing an empty collation, don't assume that we
                        # have set a tradition.
                        delete $args{'init'};
-               } elsif( $self->tradition->has_language && !exists $args{'language'} ) {
+               } elsif( $self->tradition->can('language') && $self->tradition->has_language
+                       && !exists $args{'language'} ) {
                        $args{'language'} = $self->tradition->language;
                }
                $reading = Text::Tradition::Collation::Reading->new( 
@@ -280,9 +287,19 @@ around del_reading => sub {
        $self->$orig( $arg );
 };
 
+=head2 merge_readings( $main, $second, $concatenate, $with_str )
+
+Merges the $second reading into the $main one. If $concatenate is true, then
+the merged node will carry the text of both readings, concatenated with either
+$with_str (if specified) or a sensible default (the empty string if the
+appropriate 'join_*' flag is set on either reading, or else $self->wordsep.)
+
+The first two arguments may be either readings or reading IDs.
+
 =begin testing
 
 use Text::Tradition;
+use TryCatch;
 
 my $cxfile = 't/data/Collatex-16.xml';
 my $t = Text::Tradition->new( 
@@ -293,13 +310,14 @@ my $t = Text::Tradition->new(
 my $c = $t->collation;
 
 my $rno = scalar $c->readings;
-# Split n21 for testing purposes
+# Split n21 ('unto') for testing purposes
 my $new_r = $c->add_reading( { 'id' => 'n21p0', 'text' => 'un', 'join_next' => 1 } );
 my $old_r = $c->reading( 'n21' );
 $old_r->alter_text( 'to' );
 $c->del_path( 'n20', 'n21', 'A' );
 $c->add_path( 'n20', 'n21p0', 'A' );
 $c->add_path( 'n21p0', 'n21', 'A' );
+$c->add_relationship( 'n21', 'n22', { type => 'collated', scope => 'local' } );
 $c->flatten_ranks();
 ok( $c->reading( 'n21p0' ), "New reading exists" );
 is( scalar $c->readings, $rno, "Reading add offset by flatten_ranks" );
@@ -314,12 +332,24 @@ $c->merge_readings( 'n9', 'n10' );
 ok( !$c->reading('n10'), "Reading n10 is gone" );
 is( $c->reading('n9')->text, 'rood', "Reading n9 has an unchanged word" );
 
-# Combine n21 and n21p0
+# Try to combine n21 and n21p0. This should break.
 my $remaining = $c->reading('n21');
 $remaining ||= $c->reading('n22');  # one of these should still exist
-$c->merge_readings( 'n21p0', $remaining, 1 );
-ok( !$c->reading('n21'), "Reading $remaining is gone" );
-is( $c->reading('n21p0')->text, 'unto', "Reading n21p0 merged correctly" );
+try {
+       $c->merge_readings( 'n21p0', $remaining, 1 );
+       ok( 0, "Bad reading merge changed the graph" );
+} catch( Text::Tradition::Error $e ) {
+       like( $e->message, qr/neither concatenated nor collated/, "Expected exception from bad concatenation" );
+} catch {
+       ok( 0, "Unexpected error on bad reading merge: $@" );
+}
+
+try {
+       $c->calculate_ranks();
+       ok( 1, "Graph is still evidently whole" );
+} catch( Text::Tradition::Error $e ) {
+       ok( 0, "Caught a rank exception: " . $e->message );
+}
 
 =end testing
 
@@ -340,6 +370,22 @@ sub merge_readings {
                                || $del_obj eq $self->start || $del_obj eq $self->end );
                throw( "Cannot combine text of meta readings" ) if $combine;
        }
+       # We can only merge readings in a linear graph if:
+       # - they are contiguous with only one edge between them, OR
+       # - they are at equivalent ranks in the graph.
+       if( $self->linear ) {
+               my @delpred = $del_obj->predecessors;
+               my @keptsuc = $kept_obj->successors;
+               unless ( @delpred == 1 && $delpred[0] eq $kept_obj 
+                       && @keptsuc == 1 && $keptsuc[0] eq $del_obj ) {
+                       my( $is_ok, $msg ) = $self->relations->relationship_valid( 
+                               $kept_obj, $del_obj, 'collated' );
+                       unless( $is_ok ) {
+                               throw( "Readings $kept_obj and $del_obj can be neither concatenated nor collated" );
+                       } 
+               }
+       }
+       
        # We only need the IDs for adding paths to the graph, not the reading
        # objects themselves.
        my $kept = $kept_obj->id;
@@ -374,6 +420,97 @@ sub merge_readings {
        $self->del_reading( $deleted );
 }
 
+=head2 merge_related( @relationship_types )
+
+Merge all readings linked with the relationship types given. If any of the selected type(s) is not a colocation, the graph will no longer be linear. The majority/plurality reading in each case will be the one kept. 
+
+WARNING: This operation cannot be undone.
+
+=cut
+
+=begin testing
+
+use Test::Warn;
+use Text::Tradition;
+use TryCatch;
+
+my $t;
+warnings_exist {
+       $t = Text::Tradition->new( 'input' => 'Self', 'file' => 't/data/legendfrag.xml' );
+} [qr/Cannot set relationship on a meta reading/],
+       "Got expected relationship drop warning on parse";
+
+my $c = $t->collation;
+
+my %rdg_ids;
+map { $rdg_ids{$_} = 1 } $c->readings;
+$c->merge_related( 'orthographic' );
+is( scalar( $c->readings ), keys( %rdg_ids ) - 8, 
+       "Successfully collapsed orthographic variation" );
+map { $rdg_ids{$_} = undef } qw/ r13.3 r11.4 r8.5 r8.2 r7.7 r7.5 r7.4 r7.1 /;
+foreach my $rid ( keys %rdg_ids ) {
+       my $exp = $rdg_ids{$rid};
+       is( !$c->reading( $rid ), !$exp, "Reading $rid correctly " . 
+               ( $exp ? "retained" : "removed" ) );
+}
+ok( $c->linear, "Graph is still linear" );
+try {
+       $c->calculate_ranks; # This should succeed
+       ok( 1, "Can still calculate ranks on the new graph" );
+} catch {
+       ok( 0, "Rank calculation on merged graph failed: $@" );
+}
+
+# Now add some transpositions
+$c->add_relationship( 'r8.4', 'r10.4', { type => 'transposition' } );
+$c->merge_related( 'transposition' );
+is( scalar( $c->readings ), keys( %rdg_ids ) - 9, 
+       "Transposed relationship is merged away" );
+ok( !$c->reading('r8.4'), "Correct transposed reading removed" );
+ok( !$c->linear, "Graph is no longer linear" );
+try {
+       $c->calculate_ranks; # This should fail
+       ok( 0, "Rank calculation happened on nonlinear graph?!" );
+} catch ( Text::Tradition::Error $e ) {
+       is( $e->message, 'Cannot calculate ranks on a non-linear graph', 
+               "Rank calculation on merged graph threw an error" );
+}
+
+=end testing
+
+=cut
+
+# TODO: there should be a way to display merged without affecting the underlying data!
+
+sub merge_related {
+       my $self = shift;
+       my %reltypehash;
+       map { $reltypehash{$_} = 1 } @_;
+       
+       # Set up the filter for finding related readings
+       my $filter = sub {
+               exists $reltypehash{$_[0]->type};
+       };
+       
+       # Go through all readings looking for related ones
+       foreach my $r ( $self->readings ) {
+               next unless $self->reading( "$r" ); # might have been deleted meanwhile
+               my @related = $self->related_readings( $r, $filter );
+               if( @related ) {
+                       push( @related, $r );
+                       @related = sort { 
+                                       scalar $b->witnesses <=> scalar $a->witnesses
+                               } @related;
+                       my $keep = shift @related;
+                       foreach my $delr ( @related ) {
+                               $self->linear( 0 )
+                                       unless( $self->get_relationship( $keep, $delr )->colocated );
+                               $self->merge_readings( $keep, $delr );
+                       }
+               }
+       }
+}
+
 =head2 compress_readings
 
 Where possible in the graph, compresses plain sequences of readings into a
@@ -442,6 +579,188 @@ sub _objectify_args {
         unless ref( $second ) eq 'Text::Tradition::Collation::Reading';        
     return( $first, $second, $arg );
 }
+
+=head2 duplicate_reading( $reading, @witlist )
+
+Split the given reading into two, so that the new reading is in the path for
+the witnesses given in @witlist. If the result is that certain non-colocated
+relationships (e.g. transpositions) are no longer valid, these will be removed.
+Returns the newly-created reading.
+
+=begin testing
+
+use Test::More::UTF8;
+use Text::Tradition;
+use TryCatch;
+
+my $st = Text::Tradition->new( 'input' => 'Self', 'file' => 't/data/collatecorr.xml' );
+is( ref( $st ), 'Text::Tradition', "Got a tradition from test file" );
+ok( $st->has_witness('Ba96'), "Tradition has the affected witness" );
+
+my $sc = $st->collation;
+my $numr = 17;
+ok( $sc->reading('n131'), "Tradition has the affected reading" );
+is( scalar( $sc->readings ), $numr, "There are $numr readings in the graph" );
+is( $sc->end->rank, 14, "There are fourteen ranks in the graph" );
+
+# Detach the erroneously collated reading
+my( $newr, @del_rdgs ) = $sc->duplicate_reading( 'n131', 'Ba96' );
+ok( $newr, "New reading was created" );
+ok( $sc->reading('n131_0'), "Detached the bad collation with a new reading" );
+is( scalar( $sc->readings ), $numr + 1, "A reading was added to the graph" );
+is( $sc->end->rank, 10, "There are now only ten ranks in the graph" );
+my $csucc = $sc->common_successor( 'n131', 'n131_0' );
+is( $csucc->id, 'n136', "Found correct common successor to duped reading" ); 
+
+# Check that the bad transposition is gone
+is( scalar @del_rdgs, 1, "Deleted reading was returned by API call" );
+is( $sc->get_relationship( 'n130', 'n135' ), undef, "Bad transposition relationship is gone" );
+
+# The collation should not be fixed
+my @pairs = $sc->identical_readings();
+is( scalar @pairs, 0, "Not re-collated yet" );
+# Fix the collation
+ok( $sc->merge_readings( 'n124', 'n131_0' ), "Collated the readings correctly" );
+@pairs = $sc->identical_readings( start => 'n124', end => $csucc->id );
+is( scalar @pairs, 3, "Found three more identical readings" );
+is( $sc->end->rank, 11, "The ranks shifted appropriately" );
+$sc->flatten_ranks();
+is( scalar( $sc->readings ), $numr - 3, "Now we are collated correctly" );
+
+# Check that we can't "duplicate" a reading with no wits or with all wits
+try {
+       my( $badr, @del_rdgs ) = $sc->duplicate_reading( 'n124' );
+       ok( 0, "Reading duplication without witnesses throws an error" );
+} catch( Text::Tradition::Error $e ) {
+       like( $e->message, qr/Must specify one or more witnesses/, 
+               "Reading duplication without witnesses throws the expected error" );
+} catch {
+       ok( 0, "Reading duplication without witnesses threw the wrong error" );
+}
+
+try {
+       my( $badr, @del_rdgs ) = $sc->duplicate_reading( 'n124', 'Ba96', 'Mü11475' );
+       ok( 0, "Reading duplication with all witnesses throws an error" );
+} catch( Text::Tradition::Error $e ) {
+       like( $e->message, qr/Cannot join all witnesses/, 
+               "Reading duplication with all witnesses throws the expected error" );
+} catch {
+       ok( 0, "Reading duplication with all witnesses threw the wrong error" );
+}
+
+try {
+       $sc->calculate_ranks();
+       ok( 1, "Graph is still evidently whole" );
+} catch( Text::Tradition::Error $e ) {
+       ok( 0, "Caught a rank exception: " . $e->message );
+}
+
+=end testing
+
+=cut
+
+sub duplicate_reading {
+       my( $self, $r, @wits ) = @_;
+       # Check that we are not doing anything unwise.
+       throw( "Must specify one or more witnesses for the duplicated reading" )
+               unless @wits;
+       unless( ref( $r ) eq 'Text::Tradition::Collation::Reading' ) {
+               $r = $self->reading( $r );
+       }
+       throw( "Cannot duplicate a meta-reading" )
+               if $r->is_meta;
+       throw( "Cannot join all witnesses to the new reading" )
+               if scalar( @wits ) == scalar( $r->witnesses );
+
+       # Get all the reading attributes and duplicate them.    
+       my $rmeta = Text::Tradition::Collation::Reading->meta;
+       my %args;
+    foreach my $attr( $rmeta->get_all_attributes ) {
+               next if $attr->name =~ /^_/;
+               my $acc = $attr->get_read_method;
+               if( !$acc && $attr->has_applied_traits ) {
+                       my $tr = $attr->applied_traits;
+                       if( $tr->[0] =~ /::(Array|Hash)$/ ) {
+                               my $which = $1;
+                               my %methods = reverse %{$attr->handles};
+                               $acc = $methods{elements};
+                               $args{$attr->name} = $which eq 'Array' 
+                                       ? [ $r->$acc ] : { $r->$acc };
+                       } 
+               } else {
+                       $args{$attr->name} = $r->$acc if $acc;
+               }
+       }
+       # By definition the new reading will no longer be common.
+       $args{is_common} = 0;
+       # The new reading also needs its own ID.
+       $args{id} = $self->_generate_dup_id( $r->id );
+
+       # Try to make the new reading.
+       my $newr = $self->add_reading( \%args );
+       # The old reading is also no longer common.
+       $r->is_common( 0 );
+       
+       # For each of the witnesses, dissociate from the old reading and
+       # associate with the new.
+       foreach my $wit ( @wits ) {
+               my $prior = $self->prior_reading( $r, $wit );
+               my $next = $self->next_reading( $r, $wit );
+               $self->del_path( $prior, $r, $wit );
+               $self->add_path( $prior, $newr, $wit );
+               $self->del_path( $r, $next, $wit );
+               $self->add_path( $newr, $next, $wit );
+       }
+       
+       # If the graph is ranked, we need to look for relationships that are now
+       # invalid (i.e. 'non-colocation' types that might now be colocated) and
+       # remove them. If not, we can skip it.
+       my $succ;
+       my %rrk;
+       my @deleted_relations;
+       if( $self->end->has_rank ) {
+               # Find the point where we can stop checking
+               $succ = $self->common_successor( $r, $newr );
+               
+               # Hash the existing ranks
+               foreach my $rdg ( $self->readings ) {
+                       $rrk{$rdg->id} = $rdg->rank;
+               }
+               # Calculate the new ranks       
+               $self->calculate_ranks();
+       
+               # Check for invalid non-colocated relationships among changed-rank readings
+               # from where the ranks start changing up to $succ
+               my $lastrank = $succ->rank;
+               foreach my $rdg ( $self->readings ) {
+                       next if $rdg->rank > $lastrank;
+                       next if $rdg->rank == $rrk{$rdg->id};
+                       my @noncolo = $rdg->related_readings( sub { !$_[0]->colocated } );
+                       next unless @noncolo;
+                       foreach my $nc ( @noncolo ) {
+                               unless( $self->relations->verify_or_delete( $rdg, $nc ) ) {
+                                       push( @deleted_relations, [ $rdg->id, $nc->id ] );
+                               }
+                       }
+               }
+       }
+       return ( $newr, @deleted_relations );
+}
+
+sub _generate_dup_id {
+       my( $self, $rid ) = @_;
+       my $newid;
+       my $i = 0;
+       while( !$newid ) {
+               $newid = $rid."_$i";
+               if( $self->has_reading( $newid ) ) {
+                       $newid = '';
+                       $i++;
+               }
+       }
+       return $newid;
+}
+
 ### Path logic
 
 sub add_path {
@@ -471,7 +790,7 @@ sub del_path {
                @args = @_;
        }
 
-       # We only need the IDs for adding paths to the graph, not the reading
+       # We only need the IDs for removing paths from the graph, not the reading
        # objects themselves.
     my( $source, $target, $wit ) = $self->_stringify_args( @args );
 
@@ -479,7 +798,7 @@ sub del_path {
        if( $self->sequence->has_edge_attribute( $source, $target, $wit ) ) {
                $self->sequence->delete_edge_attribute( $source, $target, $wit );
        }
-       unless( keys %{$self->sequence->get_edge_attributes( $source, $target )} ) {
+       unless( $self->sequence->has_edge_attributes( $source, $target ) ) {
                $self->sequence->delete_edge( $source, $target );
                $self->relations->delete_equivalence_edge( $source, $target );
        }
@@ -525,7 +844,15 @@ sub add_relationship {
        my $self = shift;
     my( $source, $target, $opts ) = $self->_stringify_args( @_ );
     my( @vectors ) = $self->relations->add_relationship( $source, $target, $opts );
-       $self->_graphcalc_done(0);
+    foreach my $v ( @vectors ) {
+       next unless $self->get_relationship( $v )->colocated;
+       if( $self->reading( $v->[0] )->has_rank && $self->reading( $v->[1] )->has_rank
+               && $self->reading( $v->[0] )->rank ne $self->reading( $v->[1] )->rank ) {
+                       $self->_graphcalc_done(0);
+                       $self->_clear_cache;
+                       last;
+       }
+    }
     return @vectors;
 }
 
@@ -536,8 +863,8 @@ around qw/ get_relationship del_relationship / => sub {
        if( @args == 1 && ref( $args[0] ) eq 'ARRAY' ) {
                @args = @{$_[0]};
        }
-       my( $source, $target ) = $self->_stringify_args( @args );
-       $self->$orig( $source, $target );
+       my @stringargs = $self->_stringify_args( @args );
+       $self->$orig( @stringargs );
 };
 
 =head2 reading_witnesses( $reading )
@@ -551,7 +878,7 @@ sub reading_witnesses {
        # We need only check either the incoming or the outgoing edges; I have
        # arbitrarily chosen "incoming".  Thus, special-case the start node.
        if( $reading eq $self->start ) {
-               return map { $_->sigil } $self->tradition->witnesses;
+               return map { $_->sigil } grep { $_->is_collated } $self->tradition->witnesses;
        }
        my %all_witnesses;
        foreach my $e ( $self->sequence->edges_to( $reading ) ) {
@@ -700,7 +1027,8 @@ sub as_dot {
     foreach my $edge ( @edges ) {
        # Do we need to output this edge?
        if( $used{$edge->[0]} && $used{$edge->[1]} ) {
-               my $label = $self->_path_display_label( $self->path_witnesses( $edge ) );
+               my $label = $self->_path_display_label( $opts,
+                       $self->path_witnesses( $edge ) );
                        my $variables = { %edge_attrs, 'label' => $label };
                        
                        # Account for the rank gap if necessary
@@ -732,9 +1060,45 @@ sub as_dot {
                $substart{$edge->[1]} = $edge->[0];
         }
     }
+    
+    # If we are asked to, add relationship links
+    if( exists $opts->{show_relations} ) {
+       my $filter = $opts->{show_relations}; # can be 'transposition' or 'all'
+       if( $filter eq 'transposition' ) {
+               $filter =~ qr/^transposition$/;
+       }
+       my %typecolors;
+       my @types = sort( map { $_->name } $self->relations->types );
+       if( exists $opts->{graphcolors} ) {
+               foreach my $tdx ( 0 .. $#types ) {
+                       $typecolors{$types[$tdx]} = $opts->{graphcolors}->[$tdx];
+               }
+       } else {
+               map { $typecolors{$_} = '#FFA14F' } @types;
+       }
+       foreach my $redge ( $self->relationships ) {
+               if( $used{$redge->[0]} && $used{$redge->[1]} ) {
+                               my $rel = $self->get_relationship( $redge );
+                               next unless $filter eq 'all' || $rel->type =~ /$filter/;
+                               my $variables = { 
+                                       arrowhead => 'none',
+                                       color => $typecolors{$rel->type},
+                                       constraint => 'false',
+                                       penwidth => '3',
+                               };
+                               unless( exists $opts->{graphcolors} ) {
+                                       $variables->{label} = uc( substr( $rel->type, 0, 4 ) ), 
+                               }
+                               $dot .= sprintf( "\t\"%s\" -> \"%s\" %s;\n",
+                                       $redge->[0], $redge->[1], _dot_attr_string( $variables ) );
+               }
+       }
+    }
+    
     # Add substitute start and end edges if necessary
     foreach my $node ( keys %substart ) {
-       my $witstr = $self->_path_display_label ( $self->path_witnesses( $substart{$node}, $node ) );
+       my $witstr = $self->_path_display_label( $opts, 
+               $self->path_witnesses( $substart{$node}, $node ) );
        my $variables = { %edge_attrs, 'label' => $witstr };
        my $nrdg = $self->reading( $node );
        if( $nrdg->has_rank && $nrdg->rank > $startrank ) {
@@ -745,7 +1109,8 @@ sub as_dot {
         $dot .= "\t\"__SUBSTART__\" -> \"$node\" $varopts;\n";
        }
     foreach my $node ( keys %subend ) {
-       my $witstr = $self->_path_display_label ( $self->path_witnesses( $node, $subend{$node} ) );
+       my $witstr = $self->_path_display_label( $opts,
+               $self->path_witnesses( $node, $subend{$node} ) );
        my $variables = { %edge_attrs, 'label' => $witstr };
         my $varopts = _dot_attr_string( $variables );
         $dot .= "\t\"$node\" -> \"__SUBEND__\" $varopts;\n";
@@ -818,6 +1183,7 @@ sub path_witnesses {
 # witnesses only where the main witness is not also in the list.
 sub _path_display_label {
        my $self = shift;
+       my $opts = shift;
        my %wits;
        map { $wits{$_} = 1 } @_;
 
@@ -835,14 +1201,18 @@ sub _path_display_label {
                }
        }
        
-       # See if we are in a majority situation.
-       my $maj = scalar( $self->tradition->witnesses ) * 0.6;
-       $maj = $maj > 5 ? $maj : 5;
-       if( scalar keys %wits > $maj ) {
-               unshift( @disp_ac, 'majority' );
-               return join( ', ', @disp_ac );
-       } else {
+       if( $opts->{'explicit_wits'} ) {
                return join( ', ', sort keys %wits );
+       } else {
+               # See if we are in a majority situation.
+               my $maj = scalar( $self->tradition->witnesses ) * 0.6;
+               $maj = $maj > 5 ? $maj : 5;
+               if( scalar keys %wits > $maj ) {
+                       unshift( @disp_ac, 'majority' );
+                       return join( ', ', @disp_ac );
+               } else {
+                       return join( ', ', sort keys %wits );
+               }
        }
 }
 
@@ -899,7 +1269,8 @@ is( scalar $c->relationships, 0, "Collation has all relationships" );
 # Add a few relationships
 $c->add_relationship( 'w123', 'w125', { 'type' => 'collated' } );
 $c->add_relationship( 'w193', 'w196', { 'type' => 'collated' } );
-$c->add_relationship( 'w257', 'w262', { 'type' => 'transposition' } );
+$c->add_relationship( 'w257', 'w262', { 'type' => 'transposition', 
+                                         'is_significant' => 'yes' } );
 
 # Now write it to GraphML and parse it again.
 
@@ -908,16 +1279,12 @@ my $st = Text::Tradition->new( 'input' => 'Self', 'string' => $graphml );
 is( scalar $st->collation->readings, $READINGS, "Reparsed collation has all readings" );
 is( scalar $st->collation->paths, $PATHS, "Reparsed collation has all paths" );
 is( scalar $st->collation->relationships, 3, "Reparsed collation has new relationships" );
+my $sigrel = $st->collation->get_relationship( 'w257', 'w262' );
+is( $sigrel->is_significant, 'yes', "Ternary attribute value was restored" );
 
 # Now add a stemma, write to GraphML, and look at the output.
-my $SKIP_STEMMA;
-try {
-       $tradition->enable_stemmata;
-} catch {
-       $SKIP_STEMMA = 1;
-}
 SKIP: {
-       skip "Analysis module not present", 3 if $SKIP_STEMMA;
+       skip "Analysis module not present", 3 unless $tradition->can( 'add_stemma' );
        my $stemma = $tradition->add_stemma( 'dotfile' => 't/data/florilegium.dot' );
        is( ref( $stemma ), 'Text::Tradition::Stemma', "Parsed dotfile into stemma" );
        is( $tradition->stemmata, 1, "Tradition now has the stemma" );
@@ -925,16 +1292,6 @@ SKIP: {
        like( $graphml, qr/digraph/, "Digraph declaration exists in GraphML" );
 }
 
-# Now add a user, write to GraphML, and look at the output.
-unlike( $graphml, qr/testuser/, "Test user name does not exist in GraphML yet" );
-my $testuser = Text::Tradition::User->new( 
-       id => 'testuser', password => 'testpass' );
-is( ref( $testuser ), 'Text::Tradition::User', "Created test user object" );
-$testuser->add_tradition( $tradition );
-is( $tradition->user->id, $testuser->id, "Tradition assigned to test user" );
-$graphml = $c->as_graphml;
-like( $graphml, qr/testuser/, "Test user name now exists in GraphML" );
-
 =end testing
 
 =cut
@@ -983,6 +1340,7 @@ sub as_graphml {
        'ReadingID' => 'string',
        'RelationshipType' => 'string',
        'RelationshipScope' => 'string',
+       'Ternary' => 'string',
     );
     
     # Add the data keys for the graph. Include an extra key 'version' for the
@@ -992,6 +1350,8 @@ sub as_graphml {
     my %graph_attributes = ( 'version' => 'string' );
        # Graph attributes include those of Tradition and those of Collation.
        my %gattr_from;
+       # TODO Use meta introspection method from duplicate_reading to do this
+       # instead of naming custom keys.
        my $tmeta = $self->tradition->meta;
        my $cmeta = $self->meta;
        map { $gattr_from{$_->name} = 'Tradition' } $tmeta->get_all_attributes;
@@ -1012,9 +1372,11 @@ sub as_graphml {
                };
        }
        
-    $graph_attributes{'user'} = sub { 
-       $self->tradition->user ? $self->tradition->user->id : undef 
-    };
+       if( $tmeta->has_method('user') ) {
+               $graph_attributes{'user'} = sub { 
+                       $self->tradition->user ? $self->tradition->user->id : undef 
+               };
+       }
        
     foreach my $datum ( sort keys %graph_attributes ) {
        $graph_data_keys{$datum} = 'dg'.$gdi++;
@@ -1200,27 +1562,113 @@ sub _add_graphml_data {
 Returns a CSV alignment table representation of the collation graph, one
 row per witness (or witness uncorrected.) 
 
+=head2 as_tsv
+
+Returns a tab-separated alignment table representation of the collation graph, 
+one row per witness (or witness uncorrected.) 
+
+=begin testing
+
+use Text::Tradition;
+use Text::CSV;
+
+my $READINGS = 311;
+my $PATHS = 361;
+my $WITS = 13;
+my $WITAC = 4;
+
+my $datafile = 't/data/florilegium_tei_ps.xml';
+my $tradition = Text::Tradition->new( 'input' => 'TEI',
+                                      'name' => 'test0',
+                                      'file' => $datafile,
+                                      'linear' => 1 );
+
+my $c = $tradition->collation;
+# Export the thing to CSV
+my $csvstr = $c->as_csv();
+# Count the columns
+my $csv = Text::CSV->new({ sep_char => ',', binary => 1 });
+my @lines = split(/\n/, $csvstr );
+ok( $csv->parse( $lines[0] ), "Successfully parsed first line of CSV" );
+is( scalar( $csv->fields ), $WITS + $WITAC, "CSV has correct number of witness columns" );
+my @q_ac = grep { $_ eq 'Q'.$c->ac_label } $csv->fields;
+ok( @q_ac, "Found a layered witness" );
+
+my $t2 = Text::Tradition->new( input => 'Tabular',
+                                                          name => 'test2',
+                                                          string => $csvstr,
+                                                          sep_char => ',' );
+is( scalar $t2->collation->readings, $READINGS, "Reparsed CSV collation has all readings" );
+is( scalar $t2->collation->paths, $PATHS, "Reparsed CSV collation has all paths" );
+
+# Now do it with TSV
+my $tsvstr = $c->as_tsv();
+my $t3 = Text::Tradition->new( input => 'Tabular',
+                                                          name => 'test3',
+                                                          string => $tsvstr,
+                                                          sep_char => "\t" );
+is( scalar $t3->collation->readings, $READINGS, "Reparsed TSV collation has all readings" );
+is( scalar $t3->collation->paths, $PATHS, "Reparsed TSV collation has all paths" );
+
+my $table = $c->alignment_table;
+my $noaccsv = $c->as_csv({ noac => 1 });
+my @noaclines = split(/\n/, $noaccsv );
+ok( $csv->parse( $noaclines[0] ), "Successfully parsed first line of no-ac CSV" );
+is( scalar( $csv->fields ), $WITS, "CSV has correct number of witness columns" );
+is( $c->alignment_table, $table, "Request for CSV did not alter the alignment table" );
+
+my $safecsv = $c->as_csv({ safe_ac => 1});
+my @safelines = split(/\n/, $safecsv );
+ok( $csv->parse( $safelines[0] ), "Successfully parsed first line of safe CSV" );
+is( scalar( $csv->fields ), $WITS + $WITAC, "CSV has correct number of witness columns" );
+@q_ac = grep { $_ eq 'Q__L' } $csv->fields;
+ok( @q_ac, "Found a sanitized layered witness" );
+is( $c->alignment_table, $table, "Request for CSV did not alter the alignment table" );
+
+=end testing
+
 =cut
 
-sub as_csv {
-    my( $self ) = @_;
-    my $table = $self->alignment_table;
-    my $csv = Text::CSV->new( { binary => 1, quote_null => 0 } );    
+sub _tabular {
+    my( $self, $opts ) = @_;
+    my $table = $self->alignment_table( $opts );
+       my $csv_options = { binary => 1, quote_null => 0 };
+       $csv_options->{'sep_char'} = $opts->{fieldsep};
+       if( $opts->{fieldsep} eq "\t" ) {
+               # If it is really tab separated, nothing is an escape char.
+               $csv_options->{'quote_char'} = undef;
+               $csv_options->{'escape_char'} = '';
+       }
+    my $csv = Text::CSV->new( $csv_options );    
     my @result;
     # Make the header row
     $csv->combine( map { $_->{'witness'} } @{$table->{'alignment'}} );
-       push( @result, decode_utf8( $csv->string ) );
+       push( @result, $csv->string );
     # Make the rest of the rows
     foreach my $idx ( 0 .. $table->{'length'} - 1 ) {
        my @rowobjs = map { $_->{'tokens'}->[$idx] } @{$table->{'alignment'}};
        my @row = map { $_ ? $_->{'t'}->text : $_ } @rowobjs;
         $csv->combine( @row );
-        push( @result, decode_utf8( $csv->string ) );
+        push( @result, $csv->string );
     }
     return join( "\n", @result );
 }
 
-=head2 alignment_table( $use_refs, $include_witnesses )
+sub as_csv {
+       my $self = shift;
+       my $opts = shift || {};
+       $opts->{fieldsep} = ',';
+       return $self->_tabular( $opts );
+}
+
+sub as_tsv {
+       my $self = shift;
+       my $opts = shift || {};
+       $opts->{fieldsep} = "\t";
+       return $self->_tabular( $opts );
+}
+
+=head2 alignment_table
 
 Return a reference to an alignment table, in a slightly enhanced CollateX
 format which looks like this:
@@ -1232,41 +1680,45 @@ format which looks like this:
                            ... ],
             length => TEXTLEN };
 
-If $use_refs is set to 1, the reading object is returned in the table 
-instead of READINGTEXT; if not, the text of the reading is returned.
-
-If $include_witnesses is set to a hashref, only the witnesses whose sigil
-keys have a true hash value will be included.
-
 =cut
 
 sub alignment_table {
-    my( $self ) = @_;
-    $self->calculate_ranks() unless $self->_graphcalc_done;
-    return $self->cached_table if $self->has_cached_table;
+    my( $self, $opts ) = @_;
+    if( $self->has_cached_table ) {
+               return $self->cached_table
+                       unless $opts->{noac} || $opts->{safe_ac};
+    }
     
     # Make sure we can do this
        throw( "Need a linear graph in order to make an alignment table" )
                unless $self->linear;
-       $self->calculate_ranks unless $self->end->has_rank;
-       
+    $self->calculate_ranks() 
+       unless $self->_graphcalc_done && $self->end->has_rank;
+
     my $table = { 'alignment' => [], 'length' => $self->end->rank - 1 };
     my @all_pos = ( 1 .. $self->end->rank - 1 );
     foreach my $wit ( sort { $a->sigil cmp $b->sigil } $self->tradition->witnesses ) {
         # say STDERR "Making witness row(s) for " . $wit->sigil;
         my @wit_path = $self->reading_sequence( $self->start, $self->end, $wit->sigil );
         my @row = _make_witness_row( \@wit_path, \@all_pos );
-        push( @{$table->{'alignment'}}, 
-               { 'witness' => $wit->sigil, 'tokens' => \@row } );
-        if( $wit->is_layered ) {
+        my $witobj = { 'witness' => $wit->sigil, 'tokens' => \@row };
+        $witobj->{'identifier'} = $wit->identifier if $wit->identifier;
+        push( @{$table->{'alignment'}}, $witobj );
+        if( $wit->is_layered && !$opts->{noac} ) {
                my @wit_ac_path = $self->reading_sequence( $self->start, $self->end, 
                        $wit->sigil.$self->ac_label );
             my @ac_row = _make_witness_row( \@wit_ac_path, \@all_pos );
-                       push( @{$table->{'alignment'}},
-                               { 'witness' => $wit->sigil.$self->ac_label, 'tokens' => \@ac_row } );
+            my $witlabel = $opts->{safe_ac} 
+               ? $wit->sigil . '__L' : $wit->sigil.$self->ac_label;
+            my $witacobj = { 'witness' => $witlabel, 
+               'tokens' => \@ac_row };
+            $witacobj->{'identifier'} = $wit->identifier if $wit->identifier;
+                       push( @{$table->{'alignment'}}, $witacobj );
         }           
     }
-    $self->cached_table( $table );
+    unless( $opts->{noac} || $opts->{safe_ac} ) {
+           $self->cached_table( $table );
+       }
     return $table;
 }
 
@@ -1296,6 +1748,7 @@ sub _make_witness_row {
     return @filled_row;
 }
 
+
 =head1 NAVIGATION METHODS
 
 =head2 reading_sequence( $first, $last, $sigil, $backup )
@@ -1554,8 +2007,10 @@ ok( $c->has_cached_table, "Alignment table was cached" );
 is( $c->alignment_table, $table, "Cached table returned upon second call" );
 $c->calculate_ranks;
 is( $c->alignment_table, $table, "Cached table retained with no rank change" );
-$c->add_relationship( 'n24', 'n23', { 'type' => 'spelling' } );
-isnt( $c->alignment_table, $table, "Alignment table changed after relationship add" );
+$c->add_relationship( 'n13', 'n23', { type => 'repetition' } );
+is( $c->alignment_table, $table, "Alignment table unchanged after non-colo relationship add" );
+$c->add_relationship( 'n24', 'n23', { type => 'spelling' } );
+isnt( $c->alignment_table, $table, "Alignment table changed after colo relationship add" );
 
 =end testing
 
@@ -1564,6 +2019,8 @@ isnt( $c->alignment_table, $table, "Alignment table changed after relationship a
 sub calculate_ranks {
     my $self = shift;
     # Save the existing ranks, in case we need to invalidate the cached SVG.
+    throw( "Cannot calculate ranks on a non-linear graph" ) 
+       unless $self->linear;
     my %existing_ranks;
     map { $existing_ranks{$_} = $_->rank } $self->readings;
 
@@ -1614,29 +2071,71 @@ with the same text at the same rank, and merges any that are found.
 =cut
 
 sub flatten_ranks {
-    my $self = shift;
+    my ( $self, %args ) = shift;
     my %unique_rank_rdg;
     my $changed;
+    foreach my $p ( $self->identical_readings( %args ) ) {
+               # say STDERR "Combining readings at same rank: @$p";
+               $changed = 1;
+               $self->merge_readings( @$p );
+               # TODO see if this now makes a common point.
+    }
+    # If we merged readings, the ranks are still fine but the alignment
+    # table is wrong. Wipe it.
+    $self->wipe_table() if $changed;
+}
+
+=head2 identical_readings
+=head2 identical_readings( start => $startnode, end => $endnode )
+=head2 identical_readings( startrank => $startrank, endrank => $endrank )
+
+Goes through the graph identifying all pairs of readings that appear to be
+identical, and therefore able to be merged into a single reading. Returns the 
+relevant identical pairs. Can be restricted to run over only a part of the 
+graph, specified either by node or by rank.
+
+=cut
+
+sub identical_readings {
+       my ( $self, %args ) = @_;
+    # Find where we should start and end.
+    my $startrank = $args{startrank} || 0;
+    if( $args{start} ) {
+       throw( "Starting reading has no rank" ) unless $self->reading( $args{start} ) 
+               && $self->reading( $args{start} )->has_rank;
+       $startrank = $self->reading( $args{start} )->rank;
+    }
+    my $endrank = $args{endrank} || $self->end->rank;
+    if( $args{end} ) {
+       throw( "Ending reading has no rank" ) unless $self->reading( $args{end} ) 
+               && $self->reading( $args{end} )->has_rank;
+       $endrank = $self->reading( $args{end} )->rank;
+    }
+    
+    # Make sure the ranks are correct.
+    unless( $self->_graphcalc_done ) {
+       $self->calculate_ranks;
+    }
+    # Go through the readings looking for duplicates.
+    my %unique_rank_rdg;
+    my @pairs;
     foreach my $rdg ( $self->readings ) {
         next unless $rdg->has_rank;
-        my $key = $rdg->rank . "||" . $rdg->text;
+        my $rk = $rdg->rank;
+        next if $rk > $endrank || $rk < $startrank;
+        my $key = $rk . "||" . $rdg->text;
         if( exists $unique_rank_rdg{$key} ) {
                # Make sure they don't have different grammatical forms
                        my $ur = $unique_rank_rdg{$key};
                if( $rdg->is_identical( $ur ) ) {
-                               # Combine!
-                               #say STDERR "Combining readings at same rank: $key";
-                               $changed = 1;
-                               $self->merge_readings( $unique_rank_rdg{$key}, $rdg );
-                               # TODO see if this now makes a common point.
+                               push( @pairs, [ $ur, $rdg ] );
                        }
         } else {
             $unique_rank_rdg{$key} = $rdg;
         }
-    }
-    # If we merged readings, the ranks are still fine but the alignment
-    # table is wrong. Wipe it.
-    $self->wipe_table() if $changed;
+    }  
+    
+    return @pairs;
 }