Attempting clean up something.
[dbsrgits/SQL-Translator.git] / lib / SQL / Translator.pm
CommitLineData
16dc9970 1package SQL::Translator;
2
b346d8f1 3# ----------------------------------------------------------------------
8a990c91 4# $Id: Translator.pm,v 1.34 2003-06-25 19:15:19 kycl4rk Exp $
b346d8f1 5# ----------------------------------------------------------------------
abfa405a 6# Copyright (C) 2003 Ken Y. Clark <kclark@cpan.org>,
7# darren chamberlain <darren@cpan.org>,
8# Chris Mungall <cjm@fruitfly.org>
1fd8c91f 9#
077ebf34 10# This program is free software; you can redistribute it and/or
11# modify it under the terms of the GNU General Public License as
12# published by the Free Software Foundation; version 2.
ca10f295 13#
077ebf34 14# This program is distributed in the hope that it will be useful, but
15# WITHOUT ANY WARRANTY; without even the implied warranty of
16# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
17# General Public License for more details.
ca10f295 18#
077ebf34 19# You should have received a copy of the GNU General Public License
20# along with this program; if not, write to the Free Software
21# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
22# 02111-1307 USA
ca10f295 23# -------------------------------------------------------------------
24
use strict;
use base 'Class::Base';

use Carp qw(carp);
use File::Basename qw(dirname);
use File::Spec::Functions qw(catfile);
use IO::Dir;
use SQL::Translator::Schema;

# Package globals.  $DEBUG is only given a default when nothing has
# defined it yet; $ERROR starts out as the empty string.
our ( $VERSION, $REVISION, $DEFAULT_SUB, $DEBUG, $ERROR );

$VERSION  = '0.02';
$REVISION = sprintf "%d.%02d", q$Revision: 1.34 $ =~ /(\d+)\.(\d+)/;
$ERROR    = "";
$DEBUG    = 0 unless defined $DEBUG;
# ----------------------------------------------------------------------
# Default callback used by init() for both the parser and the producer
# when none is configured.  It ignores everything except its first
# argument ($_[0], the SQL::Translator instance) and returns that
# instance's schema object.  A $DEFAULT_SUB that is already defined is
# left untouched.
# ----------------------------------------------------------------------
unless ( defined $DEFAULT_SUB ) {
    $DEFAULT_SUB = sub {
        my $translator = $_[0];
        return $translator->schema;
    };
}
16dc9970 47
# ----------------------------------------------------------------------
# init(\%config)
#
# Initializes a freshly constructed object from the configuration hash
# reference and returns the object.  (Presumably invoked by the
# constructor inherited from Class::Base -- confirm against that
# module.)
#
# Recognized keys:
#   parser / from, producer / to   handed to parser() and producer();
#                                  both fall back to $DEFAULT_SUB
#   format_table_name, format_package_name,
#   format_fk_name, format_pk_name handed to the same-named methods
#   parser_args, producer_args     handed on only when defined
#   filename / file                handed to filename() when true
#   data                           handed to data() when true
#   debug                          stored directly; defaults to $DEBUG
#   add_drop_table, no_comments, show_warnings, trace, validate
#                                  handed to the same-named methods
#
# The caller's hash is only read, never modified.
# ----------------------------------------------------------------------
sub init {
    my ( $self, $config ) = @_;

    #
    # Parser and producer.  See the respective methods for the kinds of
    # values they accept.
    #
    $self->parser  ( $config->{'parser'}   || $config->{'from'} || $DEFAULT_SUB );
    $self->producer( $config->{'producer'} || $config->{'to'}   || $DEFAULT_SUB );

    #
    # Callbacks for formatting pk, fk, table and package names in the
    # producer.
    #
    for my $formatter ( qw[
        format_table_name format_package_name format_fk_name format_pk_name
    ] ) {
        $self->$formatter( $config->{$formatter} );
    }

    #
    # parser_args and producer_args, when supplied.
    #
    for my $pargs ( qw[ parser_args producer_args ] ) {
        $self->$pargs( $config->{$pargs} ) if defined $config->{$pargs};
    }

    #
    # Data source: 'filename' wins over 'file'.  The value is kept in a
    # local variable so that the caller's configuration hash is not
    # altered as a side effect.
    #
    my $filename = $config->{'filename'} || $config->{'file'} || "";
    $self->filename($filename) if $filename;

    #
    # A 'data' parameter is applied last, after any filename.
    #
    if ( my $data = $config->{'data'} ) {
        $self->data($data);
    }

    #
    # Remaining options.
    #
    $self->{'debug'} = defined $config->{'debug'} ? $config->{'debug'} : $DEBUG;

    $self->add_drop_table( $config->{'add_drop_table'} );
    $self->no_comments( $config->{'no_comments'} );
    $self->show_warnings( $config->{'show_warnings'} );
    $self->trace( $config->{'trace'} );
    $self->validate( $config->{'validate'} );

    return $self;
}
1fd8c91f 120
# ----------------------------------------------------------------------
# add_drop_table([$bool])
#
# Boolean accessor/mutator.  A defined argument is normalized to 1 or 0
# and stored; an undefined or missing argument leaves the setting alone.
# Returns the current setting, or 0 when it was never set.
# ----------------------------------------------------------------------
sub add_drop_table {
    my ( $self, $flag ) = @_;
    $self->{'add_drop_table'} = ( $flag ? 1 : 0 ) if defined $flag;
    return $self->{'add_drop_table'} || 0;
}
131
# ----------------------------------------------------------------------
# no_comments([$bool])
#
# Boolean accessor/mutator.  A defined argument is normalized to 1 or 0
# and stored; otherwise the setting is left alone.  Returns the current
# setting, or 0 when it was never set.
# ----------------------------------------------------------------------
sub no_comments {
    my ( $self, $flag ) = @_;

    if ( defined $flag ) {
        $self->{'no_comments'} = $flag ? 1 : 0;
    }

    return $self->{'no_comments'} || 0;
}
143
e2158c40 144
# ----------------------------------------------------------------------
# producer([$producer_spec [, @producer_args]])
#
# Get or set the producer for the current translator.  Without
# arguments the stored code reference is returned.  With arguments,
# $producer_spec may be:
#
#   - a string containing "::": first tried as a module name (using
#     that module's "produce" function); if that module cannot be
#     loaded, the last component is taken as the function name and the
#     rest as the module name.  Dies if that module cannot be loaded
#     either.
#   - a code reference: stored as is; producer_type becomes "CODE".
#   - any other string: a module name relative to
#     SQL::Translator::Producer, using its "produce" function.  Dies
#     if the module cannot be loaded.
#
# Any further arguments are passed on to producer_args().
# Returns the stored code reference.
# ----------------------------------------------------------------------
sub producer {
    my $self = shift;

    # producer as a mutator
    if (@_) {
        my $producer = shift;

        # Passed a module name (string containing "::")
        if ($producer =~ /::/) {
            my $func_name;

            # Module name was passed directly.
            # We try to load the name; if it doesn't load, there's
            # a possibility that it has a function name attached to
            # it.
            if (load($producer)) {
                $func_name = "produce";
            }

            # Module::function was passed
            else {
                # Passed Module::Name::function; try to recover
                my @func_parts = split /::/, $producer;
                $func_name = pop @func_parts;
                $producer  = join "::", @func_parts;

                # If this doesn't work, then we have a legitimate
                # problem.
                load($producer) or die "Can't load $producer: $@";
            }

            # get code reference and assign
            $self->{'producer'}      = \&{ "$producer\::$func_name" };
            $self->{'producer_type'} = $producer;
            $self->debug("Got producer: $producer\::$func_name\n");
        }

        # passed an anonymous subroutine reference
        elsif (isa($producer, 'CODE')) {
            $self->{'producer'}      = $producer;
            $self->{'producer_type'} = "CODE";
            $self->debug("Got producer: code ref\n");
        }

        # passed a string containing no "::"; relative package name
        else {
            # Plain interpolation: the name must not be used as a
            # sprintf format, or a "%" in it would be mangled.
            my $Pp = "SQL::Translator::Producer::$producer";
            load($Pp) or die "Can't load $Pp: $@";
            $self->{'producer'}      = \&{ "$Pp\::produce" };
            $self->{'producer_type'} = $Pp;
            $self->debug("Got producer: $Pp\n");
        }

        # At this point, $self->{'producer'} contains a subroutine
        # reference that is ready to run

        # Anything left?  If so, it's producer_args
        $self->producer_args(@_) if (@_);
    }

    return $self->{'producer'};
}
077ebf34 212
# ----------------------------------------------------------------------
# producer_type()
#
# Read-only accessor for the origin recorded by producer(): the name
# of the package the producer sub was taken from, or the string "CODE"
# when a code reference was supplied.  This is potentially important:
# since all producer subs are called as subroutine references, a
# producer otherwise has no way to find out which package it
# originally lives in.
# ----------------------------------------------------------------------
sub producer_type {
    my $self = shift;
    return $self->{'producer_type'};
}
e2158c40 223
# ----------------------------------------------------------------------
# producer_args([\%args | %args])
#
# Arbitrary name => value pairs of parameters can be passed to a
# producer using this method.  All of the work is delegated to
# _args("producer", ...), whose result is returned.
#
# If the first argument passed in is undef, then the hash of arguments
# is cleared; all subsequent elements are added to the hash of name,
# value pairs stored as producer_args.
# ----------------------------------------------------------------------
sub producer_args {
    my ( $self, @args ) = @_;
    return $self->_args( "producer", @args );
}
ca10f295 238
# ----------------------------------------------------------------------
# parser([$parser_spec [, @parser_args]])
#
# Get or set the parser for the current translator.  Without arguments
# the stored code reference is returned.  $parser_spec is resolved in
# this order:
#
#   - a string containing "::" is tried as a module name (function
#     "parse"); failing that, its last component is taken as the
#     function name and the rest as the module name;
#   - a code reference is stored as is, with parser_type "CODE";
#   - any other string names a module below SQL::Translator::Parser,
#     whose "parse" function is used.
#
# Dies when the module finally chosen cannot be loaded.  Remaining
# arguments are handed to parser_args().
# ----------------------------------------------------------------------
sub parser {
    my $self = shift;

    # Pure accessor call: nothing to resolve.
    return $self->{'parser'} unless @_;

    my $spec = shift;
    my ( $package, $function );

    if ( $spec =~ /::/ ) {

        # Either Module::Name or Module::Name::function.  Try the whole
        # string as a module first.
        if ( load($spec) ) {
            ( $package, $function ) = ( $spec, "parse" );
        }
        else {
            # Split off the last component as the function name; if
            # the remainder does not load either, give up.
            my @parts = split /::/, $spec;
            $function = pop @parts;
            $package  = join "::", @parts;
            load($package) or die "Can't load $package: $@";
        }

        $self->{'parser'}      = \&{ "$package\::$function" };
        $self->{'parser_type'} = $package;
        $self->debug("Got parser: $package\::$function\n");
    }
    elsif ( isa( $spec, 'CODE' ) ) {

        # A ready-made subroutine reference.
        $self->{'parser'}      = $spec;
        $self->{'parser_type'} = "CODE";
        $self->debug("Got parser: code ref\n");
    }
    else {

        # Short name, relative to the standard parser namespace.
        $package = "SQL::Translator::Parser::$spec";
        load($package) or die "Can't load $package: $@";
        $self->{'parser'}      = \&{ "$package\::parse" };
        $self->{'parser_type'} = $package;
        $self->debug("Got parser: $package\n");
    }

    # Whatever is left over belongs to parser_args.
    $self->parser_args(@_) if @_;

    return $self->{'parser'};
}
1fd8c91f 304
# ----------------------------------------------------------------------
# parser_type()
#
# Read-only accessor for the origin recorded by parser(): a package
# name, or the string "CODE" for a code reference.
# ----------------------------------------------------------------------
sub parser_type {
    my $self = shift;
    return $self->{'parser_type'};
}
e2158c40 307
# ----------------------------------------------------------------------
# parser_args([\%args | %args])
#
# Gets or sets the parser arguments by delegating to
# _args("parser", ...), whose result is returned.
# ----------------------------------------------------------------------
sub parser_args {
    my ( $self, @args ) = @_;
    return $self->_args( "parser", @args );
}
96844cae 312
# ----------------------------------------------------------------------
# show_warnings([$bool])
#
# Boolean accessor/mutator.  A defined argument is normalized to 1 or 0
# and stored.  Returns the current setting, or 0 when never set.
# ----------------------------------------------------------------------
sub show_warnings {
    my ( $self, $flag ) = @_;
    $self->{'show_warnings'} = ( $flag ? 1 : 0 ) if defined $flag;
    return $self->{'show_warnings'} || 0;
}
321
ca10f295 322
# ----------------------------------------------------------------------
# filename([$filename | \@filenames])
#
# Get or set the input file name(s).  When setting:
#   - a directory is rejected through $self->error;
#   - an array reference is stored without checking its elements;
#   - a plain, readable file is stored;
#   - anything else is rejected through $self->error.
# On rejection the result of $self->error is returned; otherwise the
# stored value is returned.
# ----------------------------------------------------------------------
sub filename {
    my $self = shift;

    # Accessor call.
    return $self->{'filename'} unless @_;

    my $source = shift;

    # This -d test also fills the stat buffer that "-f _ && -r _"
    # below relies on, so it has to stay first.
    if ( -d $source ) {
        return $self->error("Cannot use directory '$source' as input source");
    }

    if ( ref($source) eq 'ARRAY' ) {
        $self->{'filename'} = $source;
        $self->debug( "Got array of files: " . join( ', ', @$source ) . "\n" );
    }
    elsif ( -f _ && -r _ ) {
        $self->{'filename'} = $source;
        $self->debug("Got filename: '$self->{'filename'}'\n");
    }
    else {
        return $self->error( "Cannot use '$source' as input source: "
              . "file does not exist or is not readable." );
    }

    return $self->{'filename'};
}
ca10f295 346
# ----------------------------------------------------------------------
# data([$data, ...])
#
# Get or set the data to be translated.  Returns a reference to a
# scalar holding the data (or undef when there is none).
#
# When setting, $data may be:
#   - a scalar reference: stored as is;
#   - an array reference: its elements are joined into one string;
#   - a glob reference: the handle is read to the end;
#   - a plain string: concatenated with any further arguments.
#
# If no data is set but $self->filename is, the file (or each file of
# an array reference, in order) is read and the concatenated contents
# become the data.  Read and close failures are reported through
# $self->error, whose result is then returned.
# ----------------------------------------------------------------------
sub data {
    my $self = shift;

    # Set $self->{'data'} based on what was passed in.  We will
    # accept a number of things; do our best to get it right.
    if (@_) {
        my $data = shift;
        if (isa($data, "SCALAR")) {
            $self->{'data'} = $data;
        }
        else {
            if (isa($data, 'ARRAY')) {
                $data = join '', @$data;
            }
            elsif (isa($data, 'GLOB')) {
                local $/;
                $data = <$data>;
            }
            elsif (! ref $data && @_) {
                $data = join '', $data, @_;
            }
            $self->{'data'} = \$data;
        }
    }

    # If we have a filename but no data yet, populate.
    if (not $self->{'data'} and my $filename = $self->filename) {
        $self->debug("Opening '$filename' to get contents.\n");
        local $/;    # slurp each file in one read
        my $data;

        my @files = ref($filename) eq 'ARRAY' ? @$filename : ($filename);

        foreach my $file (@files) {
            # Three-argument open: the name is used literally, so it
            # can neither select a mode or pipe nor lose leading
            # whitespace.  The lexical handle is private to this loop.
            open my $fh, '<', $file
                or return $self->error("Can't read file '$file': $!");

            $data .= <$fh>;

            close $fh
                or return $self->error("Can't close file '$file': $!");
        }

        $self->{'data'} = \$data;
    }

    return $self->{'data'};
}
9398955f 405
# ----------------------------------------------------------------------
# schema()
#
# Returns the SQL::Translator::Schema object of this translator,
# creating it with SQL::Translator::Schema->new on first use.
# ----------------------------------------------------------------------
sub schema {
    my $self = shift;

    $self->{'schema'} = SQL::Translator::Schema->new
        unless defined $self->{'schema'};

    return $self->{'schema'};
}
419
# ----------------------------------------------------------------------
# trace([$bool])
#
# Boolean accessor/mutator.  A defined argument is normalized to 1 or 0
# and stored.  Returns the current setting, or 0 when never set.
# ----------------------------------------------------------------------
sub trace {
    my ( $self, $flag ) = @_;
    $self->{'trace'} = ( $flag ? 1 : 0 ) if defined $flag;
    return $self->{'trace'} || 0;
}
429
# ----------------------------------------------------------------------
# translate([source] | [\%args] | [%args])
#
# translate does the actual translation: it runs the parser over the
# data and then runs the producer.
#
# A single argument may be a hash reference of arguments, a glob
# reference or scalar reference holding the data, or a plain string,
# which is taken as a filename.  Any other number of arguments is
# treated as a list of name => value pairs.  Recognized names are
# filename / file, data / datasource, parser / from and producer / to;
# this is the application's last chance to set these.
#
# Returns the producer's output.  Returns "" for an odd-sized argument
# list, or for an unsupported single reference while data, producer or
# parser is unset.  Every other failure returns the result of
# $self->error.
# ----------------------------------------------------------------------
sub translate {
    my $self = shift;
    my $args;

    # ------------------------------------------------------------------
    # Work out what we were given.
    # ------------------------------------------------------------------
    if ( @_ == 1 ) {
        my $source = $_[0];

        if ( isa( $source, 'HASH' ) ) {
            $self->debug("translate: Got a hashref\n");
            $args = $source;
        }
        elsif ( isa( $source, 'GLOB' ) ) {
            # A filehandle to read the data from.
            $self->debug("translate: Got a GLOB reference\n");
            $self->data($source);
        }
        elsif ( isa( $source, 'SCALAR' ) ) {
            # A reference to a string containing the data.
            $self->debug("translate: Got a SCALAR reference (string)\n");
            $self->data($source);
        }
        elsif ( !ref $source ) {
            # Not a reference at all: a filename.
            $self->debug("translate: Got a filename\n");
            $self->filename($source);
        }
        else {
            # Some other kind of reference.  It is ignored, which is
            # fine as long as data, producer and parser are all set
            # already.
            return ""
                unless ( $self->data && $self->producer && $self->parser );
        }
    }
    else {
        # A key/value list; an odd number of elements gets nothing.
        return "" if @_ % 2;
        $args = {@_};
    }

    # ------------------------------------------------------------------
    # The data source may be given as "filename", "file", "data" or
    # "datasource".
    # ------------------------------------------------------------------
    if ( my $filename = ( $args->{'filename'} || $args->{'file'} ) ) {
        $self->filename($filename);
    }

    if ( my $given = ( $args->{'data'} || $args->{'datasource'} ) ) {
        $self->data($given);
    }

    # ------------------------------------------------------------------
    # Get the data; it must be a reference to a non-empty string.
    # ------------------------------------------------------------------
    my $data = $self->data;
    return $self->error("Empty data file!")
        unless ref($data) eq 'SCALAR' and length $$data;

    # ------------------------------------------------------------------
    # Parser and producer: apply late overrides, then fetch the code
    # references and their types.
    # ------------------------------------------------------------------
    if ( my $requested = ( $args->{'parser'} || $args->{'from'} ) ) {
        $self->parser($requested);
    }
    my $parser      = $self->parser;
    my $parser_type = $self->parser_type;

    if ( my $requested = ( $args->{'producer'} || $args->{'to'} ) ) {
        $self->producer($requested);
    }
    my $producer      = $self->producer;
    my $producer_type = $self->producer_type;

    # ------------------------------------------------------------------
    # Execute the parser, then the producer.  Each call is wrapped in
    # an eval because the referenced subroutines could be almost
    # anything and may die.  A false result counts as a failure too.
    # ------------------------------------------------------------------
    my $parser_output;
    eval { $parser_output = $parser->( $self, $$data ) };
    if ( $@ || !$parser_output ) {
        my $msg = sprintf "translate: Error with parser '%s': %s",
            $parser_type, ($@) ? $@ : " no results";
        return $self->error($msg);
    }

    # Optional validation of the schema between the two steps.
    if ( $self->validate ) {
        my $schema = $self->schema;
        return $self->error('Invalid schema') unless $schema->is_valid;
    }

    my $producer_output;
    eval { $producer_output = $producer->($self) };
    if ( $@ || !$producer_output ) {
        my $msg = sprintf "translate: Error with producer '%s': %s",
            $producer_type, ($@) ? $@ : " no results";
        return $self->error($msg);
    }

    return $producer_output;
}
ca10f295 564
# ----------------------------------------------------------------------
# list_parsers()
#
# Hacky sort of method to list all available parsers; simply returns
# what _list("parser") finds.  This has several problems:
#
#   - Only finds things in the SQL::Translator::Parser namespace
#
#   - Only finds things that are located in a directory named
#     SQL/Translator/Parser below an @INC entry.  Yeck.
#
# This method will fail in several very likely cases:
#
#   - Parser modules in different namespaces
#
#   - Parser modules in the SQL::Translator::Parser namespace that
#     have any XS components will be installed in
#     arch_lib/SQL/Translator.
#
# ----------------------------------------------------------------------
sub list_parsers {
    my $self = shift;
    return $self->_list("parser");
}
588
# ----------------------------------------------------------------------
# list_producers()
#
# Returns what _list("producer") finds.  See the notes for
# list_parsers(); all the problems apply to list_producers as well.
# ----------------------------------------------------------------------
sub list_producers {
    my $self = shift;
    return $self->_list("producer");
}
598
c0c4aef9 599
0f3778d0 600# ======================================================================
601# Private Methods
602# ======================================================================
c0c4aef9 603
# ----------------------------------------------------------------------
# _args($type [, undef] [, \%args | %args])
#
# Gets or sets ${type}_args.  Called by parser_args and producer_args.
# $type may be given with or without the "_args" suffix.
#
# A leading undef clears the stored hash.  What follows (a hash
# reference, or a list of name => value pairs) is merged into the
# stored hash, new values replacing old ones.  Returns the stored hash
# reference.
# ----------------------------------------------------------------------
sub _args {
    my ( $self, $type, @new ) = @_;
    my $slot = $type =~ /_args$/ ? $type : "${type}_args";

    # Make sure there is a hash to work on.
    $self->{$slot} = {}
        unless defined $self->{$slot}
            && UNIVERSAL::isa( $self->{$slot}, 'HASH' );

    if (@new) {

        # An explicit leading undef empties the stored hash first.
        if ( !defined $new[0] ) {
            shift @new;
            %{ $self->{$slot} } = ();
        }

        my $extra = UNIVERSAL::isa( $new[0], 'HASH' ) ? shift @new : +{@new};
        @{ $self->{$slot} }{ keys %$extra } = values %$extra;
    }

    return $self->{$slot};
}
633
# ----------------------------------------------------------------------
# _list($type)
#
# Returns the names of all modules found in a directory named
# SQL/Translator/<Type> below any @INC entry, as package names of the
# form SQL::Translator::<Type>::<Name>.  <Type> is $type lower-cased
# with its first letter capitalized.
#
# Returns an empty list when $type is false or SQL::Translator::<Type>
# itself cannot be loaded.  Directories that cannot be opened are
# skipped.
# ----------------------------------------------------------------------
sub _list {
    my $self   = shift;
    my $type   = shift || return ();
    my $uctype = ucfirst lc $type;
    my %found;

    load("SQL::Translator::$uctype") or return ();
    my $path = catfile "SQL", "Translator", $uctype;
    for my $inc (@INC) {
        my $dir = catfile $inc, $path;
        $self->debug("_list_${type}s searching $dir");
        next unless -d $dir;

        # IO::Dir->new returns undef when the directory cannot be
        # opened (e.g. no read permission); skip it rather than die.
        my $dh = IO::Dir->new($dir) or next;
        for my $entry ( grep /\.pm$/, $dh->read ) {
            ( my $name = $entry ) =~ s/\.pm$//;
            $found{ join "::", "SQL::Translator::$uctype", $name } = 1;
        }
    }

    return keys %found;
}
659
# ----------------------------------------------------------------------
# load($module)
#
# Loads a Perl module given its package name.  Short circuits if the
# module is already recorded in %INC.
#
# Returns 1 on success.  On failure the error is handed to
# __PACKAGE__->error and that call's result is returned; $@ is left
# set, since callers use it in their own messages.
#
# The earlier version additionally called import() on the *file path*
# ("Foo/Bar.pm") rather than on the package.  That never reached the
# loaded module, so the call has been removed instead of redirected:
# nothing is imported, exactly as before.
# ----------------------------------------------------------------------
sub load {
    my $name = shift;

    # Foo::Bar -> Foo/Bar.pm, the form used by require and %INC.
    ( my $file = $name ) =~ s[::][/]g;
    $file = "$file.pm";

    return 1 if $INC{$file};

    eval { require $file };

    return __PACKAGE__->error($@) if ($@);
    return 1;
}
16dc9970 677
# ----------------------------------------------------------------------
# format_table_name([\&formatter] [, $name, ...])
#
# Get or set the table-name formatter, or apply it.
#
#   - A leading code reference is stored as the formatter.
#   - With further arguments, returns the formatter's result for them,
#     or the first argument unchanged when no formatter is stored.
#   - Without further arguments, returns the stored formatter (undef
#     when there is none).
#
# Earlier, installing a formatter immediately called it with the code
# reference itself as the "name"; that no longer happens.
# ----------------------------------------------------------------------
sub format_table_name {
    my $self = shift;

    # Remove the code reference from the argument list so that it is
    # never fed to the formatter.
    if ( ref( $_[0] ) eq 'CODE' ) {
        $self->{'_format_table_name'} = shift;
    }

    my $formatter = $self->{'_format_table_name'};
    return $formatter unless @_;
    return defined $formatter ? $formatter->(@_) : $_[0];
}
687
# ----------------------------------------------------------------------
# format_package_name([\&formatter] [, $name, ...])
#
# Get or set the package-name formatter, or apply it.
#
#   - A leading code reference is stored as the formatter.
#   - With further arguments, returns the formatter's result for them,
#     or the first argument unchanged when no formatter is stored.
#   - Without further arguments, returns the stored formatter (undef
#     when there is none).
#
# Earlier, installing a formatter immediately called it with the code
# reference itself as the "name"; that no longer happens.
# ----------------------------------------------------------------------
sub format_package_name {
    my $self = shift;

    # Remove the code reference from the argument list so that it is
    # never fed to the formatter.
    if ( ref( $_[0] ) eq 'CODE' ) {
        $self->{'_format_package_name'} = shift;
    }

    my $formatter = $self->{'_format_package_name'};
    return $formatter unless @_;
    return defined $formatter ? $formatter->(@_) : $_[0];
}
697
# ----------------------------------------------------------------------
# format_fk_name([\&formatter] [, $name, ...])
#
# Get or set the foreign-key-name formatter, or apply it.
#
#   - A leading code reference is stored as the formatter.
#   - With further arguments, returns the formatter's result for them,
#     or the first argument unchanged when no formatter is stored.
#   - Without further arguments, returns the stored formatter (undef
#     when there is none).
#
# Earlier, installing a formatter immediately called it with the code
# reference itself as the "name"; that no longer happens.
# ----------------------------------------------------------------------
sub format_fk_name {
    my $self = shift;

    # Remove the code reference from the argument list so that it is
    # never fed to the formatter.
    if ( ref( $_[0] ) eq 'CODE' ) {
        $self->{'_format_fk_name'} = shift;
    }

    my $formatter = $self->{'_format_fk_name'};
    return $formatter unless @_;
    return defined $formatter ? $formatter->(@_) : $_[0];
}
707
# ----------------------------------------------------------------------
# format_pk_name([\&formatter] [, @args])
#
# Get or set the primary-key-name formatter, or apply it.
#
#   - A leading code reference is stored as the formatter.
#   - With further arguments, returns the formatter's result for them,
#     or the empty string when no formatter is stored.
#   - Without further arguments, returns the stored formatter (undef
#     when there is none).
# ----------------------------------------------------------------------
sub format_pk_name {
    my $self = shift;

    $self->{'_format_pk_name'} = shift if ref( $_[0] ) eq 'CODE';

    my $formatter = $self->{'_format_pk_name'};
    return $formatter unless @_;
    return defined $formatter ? $formatter->(@_) : '';
}
727
# ----------------------------------------------------------------------
# isa($ref, $type)
#
# Thin wrapper that returns UNIVERSAL::isa($ref, $type), giving the
# rest of this file a shorter spelling for that check.  The ($$)
# prototype is kept as is.
# ----------------------------------------------------------------------
sub isa($$) {
    return UNIVERSAL::isa( $_[0], $_[1] );
}
c2d3a526 738
# ----------------------------------------------------------------------
# validate([$bool])
#
# Boolean accessor/mutator.  A defined argument is normalized to 1 or 0
# and stored.  Returns the current setting, or 0 when never set.
# ----------------------------------------------------------------------
sub validate {
    my $self = shift;
    my $flag = shift;

    $self->{'validate'} = ( $flag ? 1 : 0 ) if defined $flag;

    return $self->{'validate'} || 0;
}
747
16dc9970 7481;
16dc9970 749
389b318c 750# ----------------------------------------------------------------------
751# Who killed the pork chops?
752# What price bananas?
753# Are you my Angel?
754# Allen Ginsberg
755# ----------------------------------------------------------------------
756
757=pod
0f3778d0 758
759=head1 NAME
760
954f31f1 761SQL::Translator - manipulate structured data definitions (SQL and more)
0f3778d0 762
763=head1 SYNOPSIS
764
765 use SQL::Translator;
766
67e5ff53 767 my $translator = SQL::Translator->new(
768 # Print debug info
769 debug => 1,
770 # Print Parse::RecDescent trace
771 trace => 0,
772 # Don't include comments in output
773 no_comments => 0,
774 # Print name mutations, conflicts
775 show_warnings => 0,
776 # Add "drop table" statements
777 add_drop_table => 1,
778 # Validate schema object
779 validate => 1,
f9a0c3b5 780 # Make all table names CAPS in producers which support this option
67e5ff53 781 format_table_name => sub {my $tablename = shift; return uc($tablename)},
f9a0c3b5 782 # Null-op formatting, only here for documentation's sake
7d5bcab8 783 format_package_name => sub {return shift},
784 format_fk_name => sub {return shift},
785 format_pk_name => sub {return shift},
0f3778d0 786 );
787
788 my $output = $translator->translate(
389b318c 789 from => 'MySQL',
790 to => 'Oracle',
f9a0c3b5 791 # Or an arrayref of filenames, i.e. [ $file1, $file2, $file3 ]
792 filename => $file,
0f3778d0 793 ) or die $translator->error;
794
795 print $output;
796
797=head1 DESCRIPTION
798
29efc9fd 799SQL::Translator is a group of Perl modules that converts
800vendor-specific SQL table definitions into other formats, such as
801other vendor-specific SQL, ER diagrams, documentation (POD and HTML),
802XML, and Class::DBI classes. The main focus of SQL::Translator is
803SQL, but parsers exist for other structured data formats, including
804Excel spreadsheets and arbitrarily delimited text files. Through the
805separation of the code into parsers and producers with an object model
806in between, it's possible to combine any parser with any producer, to
807plug in custom parsers or producers, or to manipulate the parsed data
808via the built-in object model. Presently only the definition parts of
809SQL are handled (CREATE, ALTER), not the manipulation of data (INSERT,
810UPDATE, DELETE).
0f3778d0 811
812=head1 CONSTRUCTOR
813
The constructor is called C<new>, and accepts an optional hash of options.
Valid options are:
816
817=over 4
818
ca251f03 819=item *
820
821parser / from
822
823=item *
824
825parser_args
0f3778d0 826
ca251f03 827=item *
0f3778d0 828
ca251f03 829producer / to
0f3778d0 830
ca251f03 831=item *
0f3778d0 832
ca251f03 833producer_args
0f3778d0 834
ca251f03 835=item *
836
837filename / file
838
839=item *
840
841data
842
843=item *
0f3778d0 844
ca251f03 845debug
0f3778d0 846
389b318c 847=item *
848
849add_drop_table
850
851=item *
852
853no_comments
854
855=item *
856
857trace
858
859=item *
860
861validate
862
0f3778d0 863=back
864
865All options are, well, optional; these attributes can be set via
866instance methods. Internally, they are; no (non-syntactical)
867advantage is gained by passing options to the constructor.
868
869=head1 METHODS
870
5760246d 871=head2 add_drop_table
0f3778d0 872
873Toggles whether or not to add "DROP TABLE" statements just before the
874create definitions.
875
5760246d 876=head2 no_comments
0f3778d0 877
878Toggles whether to print comments in the output. Accepts a true or false
879value, returns the current value.
880
5760246d 881=head2 producer
0f3778d0 882
The C<producer> method is an accessor/mutator, used to retrieve or
define what subroutine is called to produce the output.  A subroutine
defined as a producer will be invoked as a function (I<not a method>)
and passed 2 parameters: its container C<SQL::Translator> instance and a
data structure.  It is expected that the function transform the data
structure to a string.  The C<SQL::Translator> instance is provided for
informational purposes; for example, the type of the parser can be
retrieved using the C<parser_type> method, and the C<error> and
C<debug> methods can be called when needed.
0f3778d0 892
ca251f03 893When defining a producer, one of several things can be passed in: A
5760246d 894module name (e.g., C<My::Groovy::Producer>), a module name relative to
895the C<SQL::Translator::Producer> namespace (e.g., C<MySQL>), a module
ca251f03 896name and function combination (C<My::Groovy::Producer::transmogrify>),
0f3778d0 897or a reference to an anonymous subroutine. If a full module name is
898passed in (for the purposes of this method, a string containing "::"
899is considered to be a module name), it is treated as a package, and a
ca251f03 900function called "produce" will be invoked: C<$modulename::produce>.
901If $modulename cannot be loaded, the final portion is stripped off and
0f3778d0 902treated as a function. In other words, if there is no file named
ca251f03 903F<My/Groovy/Producer/transmogrify.pm>, C<SQL::Translator> will attempt
5760246d 904to load F<My/Groovy/Producer.pm> and use C<transmogrify> as the name of
905the function, instead of the default C<produce>.
0f3778d0 906
907 my $tr = SQL::Translator->new;
908
909 # This will invoke My::Groovy::Producer::produce($tr, $data)
910 $tr->producer("My::Groovy::Producer");
911
912 # This will invoke SQL::Translator::Producer::Sybase::produce($tr, $data)
913 $tr->producer("Sybase");
914
915 # This will invoke My::Groovy::Producer::transmogrify($tr, $data),
916 # assuming that My::Groovy::Producer::transmogrify is not a module
917 # on disk.
918 $tr->producer("My::Groovy::Producer::transmogrify");
919
920 # This will invoke the referenced subroutine directly, as
921 # $subref->($tr, $data);
922 $tr->producer(\&my_producer);
923
5760246d 924There is also a method named C<producer_type>, which is a string
925containing the classname to which the above C<produce> function
0f3778d0 926belongs. In the case of anonymous subroutines, this method returns
927the string "CODE".
928
5760246d 929Finally, there is a method named C<producer_args>, which is both an
0f3778d0 930accessor and a mutator. Arbitrary data may be stored in name => value
931pairs for the producer subroutine to access:
932
933 sub My::Random::producer {
934 my ($tr, $data) = @_;
935 my $pr_args = $tr->producer_args();
936
937 # $pr_args is a hashref.
938
5760246d 939Extra data passed to the C<producer> method is passed to
940C<producer_args>:
0f3778d0 941
942 $tr->producer("xSV", delimiter => ',\s*');
943
944 # In SQL::Translator::Producer::xSV:
945 my $args = $tr->producer_args;
946 my $delimiter = $args->{'delimiter'}; # value is ,\s*
947
5760246d 948=head2 parser
0f3778d0 949
5760246d 950The C<parser> method defines or retrieves a subroutine that will be
0f3778d0 951called to perform the parsing. The basic idea is the same as that of
5760246d 952C<producer> (see above), except the default subroutine name is
ca251f03 953"parse", and will be invoked as C<$module_name::parse($tr, $data)>.
0f3778d0 954Also, the parser subroutine will be passed a string containing the
955entirety of the data to be parsed.
956
957 # Invokes SQL::Translator::Parser::MySQL::parse()
958 $tr->parser("MySQL");
959
960 # Invokes My::Groovy::Parser::parse()
961 $tr->parser("My::Groovy::Parser");
962
963 # Invoke an anonymous subroutine directly
964 $tr->parser(sub {
965 my $dumper = Data::Dumper->new([ $_[1] ], [ "SQL" ]);
966 $dumper->Purity(1)->Terse(1)->Deepcopy(1);
967 return $dumper->Dump;
968 });
969
5760246d 970There are also C<parser_type> and C<parser_args>, which perform
971analogously to C<producer_type> and C<producer_args>.
0f3778d0 972
5760246d 973=head2 show_warnings
0f3778d0 974
975Toggles whether to print warnings of name conflicts, identifier
976mutations, etc. Probably only generated by producers to let the user
977know when something won't translate very smoothly (e.g., MySQL "enum"
978fields into Oracle). Accepts a true or false value, returns the
979current value.
980
5760246d 981=head2 translate
0f3778d0 982
5760246d 983The C<translate> method calls the subroutines referenced by the
984C<parser> and C<producer> data members (described above). It accepts
0f3778d0 985as arguments a number of things, in key => value format, including
986(potentially) a parser and a producer (they are passed directly to the
5760246d 987C<parser> and C<producer> methods).
0f3778d0 988
5760246d 989Here is how the parameter list to C<translate> is parsed:
0f3778d0 990
991=over
992
993=item *
994
9951 argument means it's the data to be parsed, which could be a string
ca251f03 996(filename) or a reference to a scalar (a string stored in memory), or a
0f3778d0 997reference to a hash, which is parsed as being more than one argument
998(see next section).
999
1000 # Parse the file /path/to/datafile
1001 my $output = $tr->translate("/path/to/datafile");
1002
1003 # Parse the data contained in the string $data
1004 my $output = $tr->translate(\$data);
1005
1006=item *
1007
1008More than 1 argument means it's a hash of things, and it might be
1009setting a parser, producer, or datasource (this key is named
1010"filename" or "file" if it's a file, or "data" for a SCALAR reference).
1011
1012 # As above, parse /path/to/datafile, but with different producers
1013 for my $prod ("MySQL", "XML", "Sybase") {
1014 print $tr->translate(
1015 producer => $prod,
1016 filename => "/path/to/datafile",
1017 );
1018 }
1019
1020 # The filename hash key could also be:
1021 datasource => \$data,
1022
1023You get the idea.
1024
1025=back
1026
5760246d 1027=head2 filename, data
0f3778d0 1028
5760246d 1029Using the C<filename> method, the filename of the data to be parsed
1030can be set. This method can be used in conjunction with the C<data>
1031method, below. If both the C<filename> and C<data> methods are
1032invoked as mutators, the data set in the C<data> method is used.
0f3778d0 1033
1034 $tr->filename("/my/data/files/create.sql");
1035
1036or:
1037
1038 my $create_script = do {
1039 local $/;
1040 open CREATE, "/my/data/files/create.sql" or die $!;
1041 <CREATE>;
1042 };
1043 $tr->data(\$create_script);
1044
5760246d 1045C<filename> takes a string, which is interpreted as a filename.
1046C<data> takes a reference to a string, which is used as the data to be
0f3778d0 1047parsed. If a filename is set, then that file is opened and read when
5760246d 1048the C<translate> method is called, as long as the data instance
0f3778d0 1049variable is not set.
1050
45ee6be0 1051=head2 schema
1052
1053Returns the SQL::Translator::Schema object.
1054
5760246d 1055=head2 trace
0f3778d0 1056
1057Turns on/off the tracing option of Parse::RecDescent.
1058
389b318c 1059=head2 validate
1060
1061Whether or not to validate the schema object after parsing and before
1062producing.
1063
7a8e1f51 1064=head1 AUTHORS
16dc9970 1065
ca251f03 1066Ken Y. Clark, E<lt>kclark@cpan.orgE<gt>,
1067darren chamberlain E<lt>darren@cpan.orgE<gt>,
1068Chris Mungall E<lt>cjm@fruitfly.orgE<gt>,
389b318c 1069Allen Day E<lt>allenday@users.sourceforge.netE<gt>,
1070Sam Angiuoli E<lt>angiuoli@users.sourceforge.netE<gt>,
1071Ying Zhang E<lt>zyolive@yahoo.comE<gt>,
1072Mike Mellilo E<lt>mmelillo@users.sourceforge.netE<gt>.
dfb4c915 1073
ca10f295 1074=head1 COPYRIGHT
16dc9970 1075
ca10f295 1076This program is free software; you can redistribute it and/or modify
1077it under the terms of the GNU General Public License as published by
1078the Free Software Foundation; version 2.
dfb4c915 1079
ca10f295 1080This program is distributed in the hope that it will be useful, but
1081WITHOUT ANY WARRANTY; without even the implied warranty of
1082MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
1083General Public License for more details.
16dc9970 1084
ca10f295 1085You should have received a copy of the GNU General Public License
1086along with this program; if not, write to the Free Software
1087Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307
1088USA
16dc9970 1089
87bf8a3a 1090=head1 BUGS
1091
1092Please use http://rt.cpan.org/ for reporting bugs.
1093
16dc9970 1094=head1 SEE ALSO
1095
abfa405a 1096L<perl>,
1097L<SQL::Translator::Parser>,
1098L<SQL::Translator::Producer>,
389b318c 1099L<Parse::RecDescent>,
1100L<GD>,
1101L<GraphViz>,
1102L<Text::RecordParser>,
1103L<Class::DBI>,
1104L<XML::Writer>.