make the first couple of tests pass
[scpubgit/stemmatology.git] / lib / Text / Tradition / Witness.pm
CommitLineData
dd3b58b0 1package Text::Tradition::Witness;
2use Moose;
3
784877d9 4# Sigil. Required identifier for a witness.
dd3b58b0 5has 'sigil' => (
d047cd52 6 is => 'ro',
7 isa => 'Str',
8 required => 1,
9 );
dd3b58b0 10
d047cd52 11# Text. This is an array of strings (i.e. word tokens).
12# TODO Think about how to handle this for the case of pre-prepared
13# collations, where the tokens are in the graph already.
dd3b58b0 14has 'text' => (
d047cd52 15 is => 'rw',
16 isa => 'ArrayRef[Str]',
17 );
dd3b58b0 18
d047cd52 19# Source. This is where we read in the witness, if not from a
20# pre-prepared collation. It is probably a filename.
21has 'source' => (
22 is => 'ro',
23 isa => 'Str',
8e1394aa 24 predicate => 'has_source',
d047cd52 25 );
784877d9 26
27sub BUILD {
28 my $self = shift;
d047cd52 29 if( $self->has_source ) {
784877d9 30 # Read the file and initialize the text.
d047cd52 31 open( WITNESS, $self->source ) or die "Could not open "
784877d9 32 . $self->file . "for reading";
33 # TODO support TEI as well as plaintext, sometime
34 my @words;
35 while(<WITNESS>) {
36 chomp;
37 push( @words, split( /\s+/, $_ ) );
38 }
39 close WITNESS;
d047cd52 40 $self->text( \@words );
784877d9 41 }
42}
43
dd3b58b0 44no Moose;
45__PACKAGE__->meta->make_immutable;