is( ref( $t ), 'Text::Tradition', "Parsed our own GraphML" );
if( $t ) {
is( scalar $t->collation->readings, 319, "Collation has all readings" );
- is( scalar $t->collation->paths, 2854, "Collation has all paths" );
+ is( scalar $t->collation->paths, 376, "Collation has all paths" );
is( scalar $t->witnesses, 13, "Collation has all witnesses" );
}
=cut
my( $IDKEY, $TOKENKEY, $TRANSPOS_KEY, $RANK_KEY, $CLASS_KEY,
- $SOURCE_KEY, $TARGET_KEY, $WITNESS_KEY, $EXTRA_KEY, $RELATIONSHIP_KEY )
- = qw/ name reading identical rank class
- source target witness extra relationship/;
+ $START_KEY, $END_KEY, $LACUNA_KEY,
+ $SOURCE_KEY, $TARGET_KEY, $WITNESS_KEY, $EXTRA_KEY, $RELATIONSHIP_KEY,
+ $COLO_KEY, $CORRECT_KEY, $INDEP_KEY )
+ = qw/ name reading identical rank class
+ is_start is_end is_lacuna
+ source target witness extra relationship
+ equal_rank non_correctable non_independent /;
sub parse {
my( $tradition, $opts ) = @_;
# Set up the graph-global attributes. They will appear in the
# hash under their accessor names.
+ my $use_version;
print STDERR "Setting graph globals\n";
$tradition->name( $graph_data->{'name'} );
- foreach my $gkey ( keys %{$graph_data->{'attr'}} ) {
- my $val = $graph_data->{'attr'}->{$gkey};
- $collation->$gkey( $val );
+ $DB::single = 1;
+ foreach my $gkey ( keys %{$graph_data->{'global'}} ) {
+ my $val = $graph_data->{'global'}->{$gkey};
+ if( $gkey eq 'version' ) {
+ $use_version = $val;
+ } else {
+ $collation->$gkey( $val );
+ }
+ }
+ if( $use_version ) {
+ # Many of our tags changed.
+ $IDKEY = 'id';
+ $TOKENKEY = 'text';
+ $COLO_KEY = 'colocated';
}
# Add the nodes to the graph.
# after the nodes & edges are created.
print STDERR "Adding graph nodes\n";
foreach my $n ( @{$graph_data->{'nodes'}} ) {
+ # If it is the start or end node, we already have one, so skip it.
+ next if defined $n->{$START_KEY} || defined $n->{$END_KEY};
+
# First extract the data that we can use without reference to
# anything else.
my %node_data = %$n; # Need $n itself untouched for edge processing
- my $nodeid = delete $node_data{$IDKEY};
- my $reading = delete $node_data{$TOKENKEY};
- my $class = delete $node_data{$CLASS_KEY} || '';
- my $rank = delete $node_data{$RANK_KEY};
- # Create the node. Current valid classes are common and meta.
- # Everything else is a normal reading.
- my $gnode = $collation->add_reading( $nodeid );
- $gnode->text( $reading );
- $gnode->make_common if $class eq 'common';
- $gnode->is_meta( 1 ) if $class eq 'meta';
- # This is a horrible hack.
- $gnode->is_lacuna( $reading =~ /^\#LACUNA/ );
- $gnode->rank( $rank ) if defined $rank;
+ # Create the node.
+ my $reading_options = {
+ 'id' => delete $node_data{$IDKEY},
+ 'is_lacuna' => delete $node_data{$LACUNA_KEY},
+ };
+ my $rank = delete $node_data{$RANK_KEY};
+ $reading_options->{'rank'} = $rank if $rank;
+ my $text = delete $node_data{$TOKENKEY};
+ $reading_options->{'text'} = $text if $text;
+
+ # This is a horrible hack for backwards compatibility.
+ unless( $use_version ) {
+ $reading_options->{'is_lacuna'} = 1
+ if $reading_options->{'text'} =~ /^\#LACUNA/;
+ }
+
+ delete $node_data{$CLASS_KEY}; # Not actually used
+ my $gnode = $collation->add_reading( $reading_options );
# Now save the data that we need for post-processing,
- # if it exists.
+ # if it exists. TODO this is unneeded after conversion
if ( keys %node_data ) {
- $extra_data->{$nodeid} = \%node_data
+ $extra_data->{$gnode->id} = \%node_data
}
}
} elsif( $class eq 'relationship' ) {
# We need the metadata about the relationship.
my $opts = { 'type' => $e->{$RELATIONSHIP_KEY} };
- $opts->{'equal_rank'} = $e->{'equal_rank'}
- if exists $e->{'equal_rank'};
- $opts->{'non_correctable'} = $e->{'non_correctable'}
- if exists $e->{'non_correctable'};
- $opts->{'non_independent'} = $e->{'non_independent'}
- if exists $e->{'non_independent'};
+ $opts->{$COLO_KEY} = $e->{$COLO_KEY}
+ if exists $e->{$COLO_KEY};
+ $opts->{$CORRECT_KEY} = $e->{$CORRECT_KEY}
+ if exists $e->{$CORRECT_KEY};
+ $opts->{$INDEP_KEY} = $e->{$INDEP_KEY}
+ if exists $e->{$INDEP_KEY};
warn "No relationship type for relationship edge!" unless $opts->{'type'};
my( $ok, @result ) = $collation->add_relationship( $from->{$IDKEY}, $to->{$IDKEY}, $opts );
unless( $ok ) {
## Deal with node information (transposition, relationships, etc.) that
## needs to be processed after all the nodes are created.
- print STDERR "Adding second-pass node data\n";
- foreach my $nkey ( keys %$extra_data ) {
- foreach my $edkey ( keys %{$extra_data->{$nkey}} ) {
- my $this_reading = $collation->reading( $nkey );
- if( $edkey eq $TRANSPOS_KEY ) {
- my $other_reading = $collation->reading( $extra_data->{$nkey}->{$edkey} );
- $this_reading->set_identical( $other_reading );
- } else {
- warn "Unfamiliar reading node data $edkey for $nkey";
- }
- }
+ ## TODO unneeded after conversion
+ unless( $use_version ) {
+ print STDERR "Adding second-pass node data\n";
+ foreach my $nkey ( keys %$extra_data ) {
+ foreach my $edkey ( keys %{$extra_data->{$nkey}} ) {
+ my $this_reading = $collation->reading( $nkey );
+ if( $edkey eq $TRANSPOS_KEY ) {
+ my $other_reading = $collation->reading( $extra_data->{$nkey}->{$edkey} );
+ $this_reading->set_identical( $other_reading );
+ } else {
+ warn "Unfamiliar reading node data $edkey for $nkey";
+ }
+ }
+ }
}
}