Cleaning up the project description.
[dbsrgits/SQL-Translator.git] / lib / SQL / Translator.pm
CommitLineData
16dc9970 1package SQL::Translator;
2
b346d8f1 3# ----------------------------------------------------------------------
67e5ff53 4# $Id: Translator.pm,v 1.31 2003-06-16 20:58:10 kycl4rk Exp $
b346d8f1 5# ----------------------------------------------------------------------
abfa405a 6# Copyright (C) 2003 Ken Y. Clark <kclark@cpan.org>,
7# darren chamberlain <darren@cpan.org>,
8# Chris Mungall <cjm@fruitfly.org>
1fd8c91f 9#
077ebf34 10# This program is free software; you can redistribute it and/or
11# modify it under the terms of the GNU General Public License as
12# published by the Free Software Foundation; version 2.
ca10f295 13#
077ebf34 14# This program is distributed in the hope that it will be useful, but
15# WITHOUT ANY WARRANTY; without even the implied warranty of
16# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
17# General Public License for more details.
ca10f295 18#
077ebf34 19# You should have received a copy of the GNU General Public License
20# along with this program; if not, write to the Free Software
21# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
22# 02111-1307 USA
ca10f295 23# -------------------------------------------------------------------
24
16dc9970 25use strict;
d529894e 26use vars qw( $VERSION $REVISION $DEFAULT_SUB $DEBUG $ERROR );
49e1eb70 27use base 'Class::Base';
c2d3a526 28
389b318c 29$VERSION = '0.02';
67e5ff53 30$REVISION = sprintf "%d.%02d", q$Revision: 1.31 $ =~ /(\d+)\.(\d+)/;
d529894e 31$DEBUG = 0 unless defined $DEBUG;
32$ERROR = "";
c2d3a526 33
34use Carp qw(carp);
16dc9970 35
c0c4aef9 36use File::Spec::Functions qw(catfile);
37use File::Basename qw(dirname);
38use IO::Dir;
45ee6be0 39use SQL::Translator::Schema;
c0c4aef9 40
b346d8f1 41# ----------------------------------------------------------------------
42# The default behavior is to "pass through" values (note that the
43# SQL::Translator instance is the first value ($_[0]), and the stuff
44# to be parsed is the second value ($_[1])
45# ----------------------------------------------------------------------
46$DEFAULT_SUB = sub { $_[1] } unless defined $DEFAULT_SUB;
16dc9970 47
b346d8f1 48# ----------------------------------------------------------------------
c2d3a526 49# init([ARGS])
b346d8f1 50# The constructor.
dfb4c915 51#
b346d8f1 52# new takes an optional hash of arguments. These arguments may
53# include a parser, specified with the keys "parser" or "from",
54# and a producer, specified with the keys "producer" or "to".
dfb4c915 55#
b346d8f1 56# The values that can be passed as the parser or producer are
57# given directly to the parser or producer methods, respectively.
58# See the appropriate method description below for details about
59# what each expects/accepts.
b346d8f1 60# ----------------------------------------------------------------------
# Populate a translator object from the $config hashref and return $self.
# Recognised keys: parser/from, producer/to, the four format_*_name
# callbacks, parser_args, producer_args, filename/file, data, debug,
# add_drop_table, no_comments, show_warnings, trace and validate.
sub init {
    my ( $self, $config ) = @_;

    #
    # Parser and producer: 'parser' beats 'from', 'producer' beats 'to';
    # when neither is supplied the pass-through $DEFAULT_SUB is used.
    #
    my $parser_spec   = $config->{'parser'}   || $config->{'from'} || $DEFAULT_SUB;
    my $producer_spec = $config->{'producer'} || $config->{'to'}   || $DEFAULT_SUB;
    $self->parser($parser_spec);
    $self->producer($producer_spec);

    #
    # Name-formatting callbacks (table, package, fk, pk) for producers.
    #
    for my $formatter (
        qw[ format_table_name format_package_name format_fk_name format_pk_name ]
    ) {
        $self->$formatter( $config->{$formatter} );
    }

    #
    # parser_args / producer_args are only touched when actually given.
    #
    for my $pargs ( qw[ parser_args producer_args ] ) {
        next unless defined $config->{$pargs};
        $self->$pargs( $config->{$pargs} );
    }

    #
    # Data source: 'filename' wins over 'file'.  Note that the resolved
    # value is written back into the caller's $config hash.
    #
    $config->{'filename'} ||= $config->{'file'} || "";
    if ( $config->{'filename'} ) {
        $self->filename( $config->{'filename'} );
    }

    #
    # A true 'data' value is applied last, so it takes preference over
    # filename/file.
    #
    my $data = $config->{'data'};
    $self->data($data) if $data;

    #
    # Remaining options.  'debug' falls back to the package-level $DEBUG.
    #
    $self->{'debug'} = defined $config->{'debug'} ? $config->{'debug'} : $DEBUG;

    for my $flag ( qw[ add_drop_table no_comments show_warnings trace validate ] ) {
        $self->$flag( $config->{$flag} );
    }

    return $self;
}
1fd8c91f 120
0f3778d0 121# ----------------------------------------------------------------------
122# add_drop_table([$bool])
123# ----------------------------------------------------------------------
# Get or set the "add DROP TABLE statements" flag.  A defined argument is
# normalised to 1 or 0 and stored; undef (or no argument) leaves the
# stored value alone.  Always returns the current flag as 1 or 0.
sub add_drop_table {
    my ( $self, $flag ) = @_;
    $self->{'add_drop_table'} = ( $flag ? 1 : 0 ) if defined $flag;
    return $self->{'add_drop_table'} || 0;
}
131
0f3778d0 132# ----------------------------------------------------------------------
133# no_comments([$bool])
134# ----------------------------------------------------------------------
# Get or set the "suppress comments in output" flag.  A defined argument
# is stored as 1 or 0; the current value (1 or 0) is always returned.
sub no_comments {
    my ( $self, $flag ) = @_;

    # Accessor call (or explicit undef): report the stored value only.
    return $self->{'no_comments'} || 0 unless defined $flag;

    # Mutator call: normalise, store and hand back the new value.
    return $self->{'no_comments'} = $flag ? 1 : 0;
}
143
e2158c40 144
0f3778d0 145# ----------------------------------------------------------------------
146# producer([$producer_spec])
147#
148# Get or set the producer for the current translator.
149# ----------------------------------------------------------------------
# Get or set the producer subroutine.
#
# With no arguments, returns the stored code reference.  With arguments,
# the first one selects the producer and may be:
#   - a string containing "::"  : a module name (its "produce" function is
#                                 used) or, if that module cannot be
#                                 loaded, Module::Name::function;
#   - a code reference          : used as is, producer_type becomes "CODE";
#   - any other string          : a module name relative to
#                                 SQL::Translator::Producer.
# Any remaining arguments are handed to producer_args().  Dies if the
# selected module cannot be loaded.
sub producer {
    my $self = shift;

    # producer as a mutator
    if (@_) {
        my $producer = shift;

        # Passed a module name (string containing "::")
        if ($producer =~ /::/) {
            my $func_name;

            # Module name was passed directly.
            # We try to load the name; if it doesn't load, there's
            # a possibility that it has a function name attached to
            # it.
            if (load($producer)) {
                $func_name = "produce";
            }

            # Module::function was passed
            else {
                # Passed Module::Name::function; try to recover
                my @func_parts = split /::/, $producer;
                $func_name = pop @func_parts;
                $producer  = join "::", @func_parts;

                # If this doesn't work, then we have a legitimate
                # problem.
                load($producer) or die "Can't load $producer: $@";
            }

            # get code reference and assign
            $self->{'producer'}      = \&{ "$producer\::$func_name" };
            $self->{'producer_type'} = $producer;
            $self->debug("Got producer: $producer\::$func_name\n");
        }

        # passed an anonymous subroutine reference
        elsif (isa($producer, 'CODE')) {
            $self->{'producer'}      = $producer;
            $self->{'producer_type'} = "CODE";
            $self->debug("Got producer: code ref\n");
        }

        # passed a string containing no "::"; relative package name
        else {
            # Plain interpolation, not sprintf: the name must never be
            # interpreted as a format string (a '%' in it would corrupt
            # the module name).
            my $Pp = "SQL::Translator::Producer::$producer";
            load($Pp) or die "Can't load $Pp: $@";
            $self->{'producer'}      = \&{ "$Pp\::produce" };
            $self->{'producer_type'} = $Pp;
            $self->debug("Got producer: $Pp\n");
        }

        # At this point, $self->{'producer'} contains a subroutine
        # reference that is ready to run

        # Anything left?  If so, it's producer_args
        $self->producer_args(@_) if (@_);
    }

    return $self->{'producer'};
}
077ebf34 212
7a8e1f51 213# ----------------------------------------------------------------------
0f3778d0 214# producer_type()
7a8e1f51 215#
e2158c40 216# producer_type is an accessor that allows producer subs to get
217# information about their origin. This is potentially important;
ca251f03 218# since all producer subs are called as subroutine references, there is
e2158c40 219# no way for a producer to find out which package the sub lives in
220# originally, for example.
7a8e1f51 221# ----------------------------------------------------------------------
# Read-only accessor: the value recorded under 'producer_type' by
# producer() (a package name, or the string "CODE" for a code ref).
sub producer_type {
    my ($self) = @_;
    return $self->{'producer_type'};
}
e2158c40 223
7a8e1f51 224# ----------------------------------------------------------------------
0f3778d0 225# producer_args([\%args])
7a8e1f51 226#
e2158c40 227# Arbitrary name => value pairs of parameters can be passed to a
228# producer using this method.
52b828e8 229#
0f3778d0 230# If the first argument passed in is undef, then the hash of arguments
231# is cleared; all subsequent elements are added to the hash of name,
232# value pairs stored as producer_args.
7a8e1f51 233# ----------------------------------------------------------------------
# Get or set the producer argument hash; thin wrapper that forwards all
# of its arguments to _args() with the type "producer".
sub producer_args {
    my ( $self, @settings ) = @_;
    return $self->_args( "producer", @settings );
}
ca10f295 238
0f3778d0 239# ----------------------------------------------------------------------
240# parser([$parser_spec])
241# ----------------------------------------------------------------------
# Get or set the parser subroutine.
#
# Without arguments the stored code reference is returned.  Otherwise the
# first argument selects the parser: a string containing "::" (a module
# whose "parse" function is used, or Module::Name::function when the full
# name is not loadable), a code reference, or a bare name resolved
# relative to SQL::Translator::Parser.  Remaining arguments go to
# parser_args().  Dies if the selected module cannot be loaded.
sub parser {
    my $self = shift;

    # Plain accessor call: nothing to install.
    return $self->{'parser'} unless @_;

    my $spec = shift;

    if ( $spec =~ /::/ ) {
        # Assume a module name first; its entry point is "parse".
        my $sub_name = "parse";

        unless ( load($spec) ) {
            # Not loadable as given, so treat the last component as the
            # function name and the rest as the module.
            my @pieces = split /::/, $spec;
            $sub_name = pop @pieces;
            $spec     = join "::", @pieces;

            # A second failure is a genuine error.
            load($spec) or die "Can't load $spec: $@";
        }

        $self->{'parser'}      = \&{ "$spec\::$sub_name" };
        $self->{'parser_type'} = $spec;
        $self->debug("Got parser: $spec\::$sub_name\n");
    }
    elsif ( isa( $spec, 'CODE' ) ) {
        # Caller supplied the subroutine itself.
        $self->{'parser'}      = $spec;
        $self->{'parser_type'} = "CODE";
        $self->debug("Got parser: code ref\n");
    }
    else {
        # Bare name: look it up under SQL::Translator::Parser.
        my $module = "SQL::Translator::Parser::$spec";
        load($module) or die "Can't load $module: $@";
        $self->{'parser'}      = \&{ "$module\::parse" };
        $self->{'parser_type'} = $module;
        $self->debug("Got parser: $module\n");
    }

    # $self->{'parser'} now holds a callable; leftovers are parser args.
    $self->parser_args(@_) if @_;

    return $self->{'parser'};
}
1fd8c91f 304
d529894e 305# ----------------------------------------------------------------------
# Read-only accessor: the value recorded under 'parser_type' by parser()
# (a package name, or the string "CODE" for a code ref).
sub parser_type {
    my ($self) = @_;
    return $self->{'parser_type'};
}
e2158c40 307
# Get or set the parser argument hash; thin wrapper that forwards all of
# its arguments to _args() with the type "parser".
sub parser_args {
    my ( $self, @settings ) = @_;
    return $self->_args( "parser", @settings );
}
96844cae 312
# Get or set the show_warnings flag.  A defined argument is stored as
# 1 or 0; the current value (1 or 0) is always returned.
sub show_warnings {
    my $self = shift;

    if ( @_ && defined $_[0] ) {
        $self->{'show_warnings'} = $_[0] ? 1 : 0;
    }

    return $self->{'show_warnings'} || 0;
}
321
ca10f295 322
0f3778d0 323# filename - get or set the filename
# Get or set the input file name(s).
#
# Accepts either a single path or an array reference of paths.  A single
# path must name a readable plain file; directories and missing or
# unreadable files are rejected through $self->error (whose return value
# is passed back).  Array references are stored as given; their elements
# are not checked here.  Returns the stored value.
sub filename {
    my $self = shift;

    if (@_) {
        my $filename = shift;

        # Check for a list of files first, so that file tests are never
        # run against a stringified array reference.
        if (ref($filename) eq 'ARRAY') {
            $self->{'filename'} = $filename;
            $self->debug("Got array of files: ".join(', ',@$filename)."\n");
        }
        elsif (-d $filename) {
            my $msg = "Cannot use directory '$filename' as input source";
            return $self->error($msg);
        }
        # "_" reuses the stat buffer filled by the -d test above.
        elsif (-f _ && -r _) {
            $self->{'filename'} = $filename;
            $self->debug("Got filename: '$self->{'filename'}'\n");
        }
        else {
            my $msg = "Cannot use '$filename' as input source: ".
                      "file does not exist or is not readable.";
            return $self->error($msg);
        }
    }

    return $self->{'filename'};
}
ca10f295 346
0f3778d0 347# ----------------------------------------------------------------------
348# data([$data])
349#
350# if $self->{'data'} is not set, but $self->{'filename'} is, then
351# $self->{'filename'} is opened and read, with the results put into
352# $self->{'data'}.
353# ----------------------------------------------------------------------
# Get or set the data to be translated; always returns a reference to a
# scalar holding the data (or whatever $self->error returns on failure).
#
# As a mutator it accepts a scalar reference (stored as is), an array
# reference (elements are joined), a glob reference (the handle is
# slurped) or one or more plain strings (concatenated).
#
# If no data has been set but a filename has, the file (or each file of
# an array reference, in order) is read and the contents are cached.
sub data {
    my $self = shift;

    # Set $self->{'data'} based on what was passed in.  We will
    # accept a number of things; do our best to get it right.
    if (@_) {
        my $data = shift;
        if (isa($data, "SCALAR")) {
            $self->{'data'} = $data;
        }
        else {
            if (isa($data, 'ARRAY')) {
                $data = join '', @$data;
            }
            elsif (isa($data, 'GLOB')) {
                local $/;    # slurp the whole handle
                $data = <$data>;
            }
            elsif (! ref $data && @_) {
                $data = join '', $data, @_;
            }
            $self->{'data'} = \$data;
        }
    }

    # If we have a filename but no data yet, populate.
    if (not $self->{'data'} and my $filename = $self->filename) {
        $self->debug("Opening '$filename' to get contents.\n");
        local $/;            # slurp mode for the reads below
        my $data;

        my @files = ref($filename) eq 'ARRAY' ? @$filename : ($filename);

        foreach my $file (@files) {
            # Three-argument open with a lexical handle: the name is
            # always treated as a file to read, never as a mode or a
            # command to run.
            open my $fh, '<', $file
                or return $self->error("Can't read file '$file': $!");

            $data .= <$fh>;

            close $fh
                or return $self->error("Can't close file '$file': $!");
        }

        $self->{'data'} = \$data;
    }

    return $self->{'data'};
}
9398955f 405
45ee6be0 406# ----------------------------------------------------------------------
# Return the SQL::Translator::Schema object for this translator,
# creating and caching a new one on first use.
sub schema {
    my ($self) = @_;

    $self->{'schema'} = SQL::Translator::Schema->new
        unless defined $self->{'schema'};

    return $self->{'schema'};
}
419
420# ----------------------------------------------------------------------
# Get or set the trace flag.  A defined argument is stored as 1 or 0;
# the current value (1 or 0) is always returned.
sub trace {
    my ( $self, $enable ) = @_;

    defined $enable
        and $self->{'trace'} = $enable ? 1 : 0;

    return $self->{'trace'} || 0;
}
429
430# ----------------------------------------------------------------------
0f3778d0 431# translate([source], [\%args])
432#
433# translate does the actual translation. The main argument is the
434# source of the data to be translated, which can be a filename, scalar
435# reference, or glob reference.
436#
437# Alternatively, translate takes optional arguments, which are passed
438# to the appropriate places. Most notable of these arguments are
439# parser and producer, which can be used to set the parser and
440# producer, respectively. This is the application's last chance to set
441# these.
442#
443# translate returns a string.
444# ----------------------------------------------------------------------
# Run the translation: obtain the data, run the parser over it, optionally
# validate the schema, then run the producer and return its output.
#
# Arguments are either a single value (hashref of options, glob ref,
# scalar ref holding the data, or a plain string taken as a file name)
# or a flat list of option name/value pairs.  Recognised options:
# filename/file, data/datasource, parser/from, producer/to.
#
# Returns the producer output, "" for unusable arguments, or the return
# value of $self->error for empty data, parser/producer failure or an
# invalid schema.
sub translate {
    my $self = shift;
    my $args;

    # ------------------------------------------------------------------
    # Work out what we were given.
    # ------------------------------------------------------------------
    if ( @_ == 1 ) {
        my $source = $_[0];

        if ( isa( $source, 'HASH' ) ) {
            # A hashref of options
            $self->debug("translate: Got a hashref\n");
            $args = $source;
        }
        elsif ( isa( $source, 'GLOB' ) ) {
            # A filehandle
            $self->debug("translate: Got a GLOB reference\n");
            $self->data($source);
        }
        elsif ( isa( $source, 'SCALAR' ) ) {
            # A reference to a string containing the data
            $self->debug("translate: Got a SCALAR reference (string)\n");
            $self->data($source);
        }
        elsif ( !ref $source ) {
            # Not a reference at all; treat it as a file name
            $self->debug("translate: Got a filename\n");
            $self->filename($source);
        }
        else {
            # Some other kind of reference.  We can only carry on if
            # data, producer and parser have all been set already.
            my $ready = $self->data && $self->producer && $self->parser;
            return "" unless $ready;
        }
    }
    else {
        # Must be name => value pairs; an odd count gets nothing.
        return "" if @_ % 2;
        $args = { @_ };
    }

    # ------------------------------------------------------------------
    # The data source may be named by "filename", "file", "data" or
    # "datasource".
    # ------------------------------------------------------------------
    my $file_arg = $args->{'filename'} || $args->{'file'};
    $self->filename($file_arg) if $file_arg;

    my $data_arg = $args->{'data'} || $args->{'datasource'};
    $self->data($data_arg) if $data_arg;

    # ------------------------------------------------------------------
    # Fetch the data; it must be a reference to a non-empty string.
    # ------------------------------------------------------------------
    my $data = $self->data;
    return $self->error("Empty data file!")
        unless ref($data) eq 'SCALAR' and length $$data;

    # ------------------------------------------------------------------
    # Resolve the parser; an explicit argument overrides the stored one.
    # ------------------------------------------------------------------
    my $parser_arg = $args->{'parser'} || $args->{'from'};
    $self->parser($parser_arg) if $parser_arg;
    my $parser      = $self->parser;
    my $parser_type = $self->parser_type;

    # ------------------------------------------------------------------
    # Same again for the producer.
    # ------------------------------------------------------------------
    my $producer_arg = $args->{'producer'} || $args->{'to'};
    $self->producer($producer_arg) if $producer_arg;
    my $producer      = $self->producer;
    my $producer_type = $self->producer_type;

    # ------------------------------------------------------------------
    # Run the parser, then the producer.  Each call is wrapped in eval
    # because the referenced subroutines could be almost anything and
    # may die; a false result is treated as a failure too.
    # ------------------------------------------------------------------
    my $parser_output;
    eval { $parser_output = $parser->( $self, $$data ) };
    if ( $@ || !$parser_output ) {
        my $reason = ($@) ? $@ : " no results";
        my $msg    = sprintf "translate: Error with parser '%s': %s",
            $parser_type, $reason;
        return $self->error($msg);
    }

    # Optional schema validation between the two stages.
    if ( $self->validate ) {
        my $schema = $self->schema;
        return $self->error('Invalid schema') unless $schema->is_valid;
    }

    my $producer_output;
    eval { $producer_output = $producer->($self) };
    if ( $@ || !$producer_output ) {
        my $reason = ($@) ? $@ : " no results";
        my $msg    = sprintf "translate: Error with producer '%s': %s",
            $producer_type, $reason;
        return $self->error($msg);
    }

    return $producer_output;
}
ca10f295 564
d529894e 565# ----------------------------------------------------------------------
0f3778d0 566# list_parsers()
567#
568# Hacky sort of method to list all available parsers. This has
569# several problems:
570#
571# - Only finds things in the SQL::Translator::Parser namespace
572#
573# - Only finds things that are located in the same directory
574# as SQL::Translator::Parser. Yeck.
575#
576# This method will fail in several very likely cases:
577#
578# - Parser modules in different namespaces
579#
580# - Parser modules in the SQL::Translator::Parser namespace that
581# have any XS components will be installed in
582# arch_lib/SQL/Translator.
583#
584# ----------------------------------------------------------------------
# Return whatever _list() reports for the "parser" type.  Arguments
# beyond the invocant are ignored.
sub list_parsers {
    my ($self) = @_;
    return $self->_list("parser");
}
588
589# ----------------------------------------------------------------------
590# list_producers()
591#
592# See notes for list_parsers(), above; all the problems apply to
593# list_producers as well.
594# ----------------------------------------------------------------------
# Return whatever _list() reports for the "producer" type.  Arguments
# beyond the invocant are ignored.
sub list_producers {
    my ($self) = @_;
    return $self->_list("producer");
}
598
c0c4aef9 599
0f3778d0 600# ======================================================================
601# Private Methods
602# ======================================================================
c0c4aef9 603
0f3778d0 604# ----------------------------------------------------------------------
605# _args($type, \%args);
606#
607# Gets or sets ${type}_args. Called by parser_args and producer_args.
608# ----------------------------------------------------------------------
# Shared implementation behind parser_args and producer_args.
#
# $type is "parser" or "producer" (an "_args" suffix is appended unless
# already present) and names the slot in $self that holds the hash.
# Further arguments update that hash: a leading undef empties it first,
# then either a hashref or a flat name/value list is merged in.  Returns
# the hashref stored in the slot.
sub _args {
    my ( $self, $type, @settings ) = @_;

    $type .= "_args" unless $type =~ /_args$/;

    # Make sure the slot holds a hash before anything touches it.
    my $current = $self->{$type};
    $self->{$type} = { }
        unless defined $current && isa($current, 'HASH');

    if (@settings) {
        # An explicit leading undef means "start from scratch".
        unless ( defined $settings[0] ) {
            shift @settings;
            %{ $self->{$type} } = ();
        }

        # Either one hashref or a flat list of pairs; new values win.
        my $incoming = isa($settings[0], 'HASH') ? shift @settings : { @settings };
        %{ $self->{$type} } = ( %{ $self->{$type} }, %$incoming );
    }

    return $self->{$type};
}
633
d529894e 634# ----------------------------------------------------------------------
0f3778d0 635# _list($type)
636# ----------------------------------------------------------------------
# List the modules of the given type ("parser" or "producer") found on
# disk.  For every @INC entry that has an SQL/Translator/<Type> directory,
# each *.pm file in it is reported as SQL::Translator::<Type>::<Name>.
# Returns the (unordered, de-duplicated) list of names, or an empty list
# when no type is given or the base module cannot be loaded.
sub _list {
    my $self   = shift;
    my $type   = shift || return ();
    my $uctype = ucfirst lc $type;
    my %found;

    load("SQL::Translator::$uctype") or return ();
    my $path = catfile "SQL", "Translator", $uctype;

    for my $inc (@INC) {
        my $dir = catfile $inc, $path;
        $self->debug("_list_${type}s searching $dir");
        next unless -d $dir;

        # The directory may exist yet not be readable; skip it rather
        # than calling a method on undef.
        my $dh = IO::Dir->new($dir) or next;

        for my $file (grep /\.pm$/, $dh->read) {
            (my $name = $file) =~ s/\.pm$//;
            $found{ join "::", "SQL::Translator::$uctype", $name } = 1;
        }
    }

    return keys %found;
}
659
d529894e 660# ----------------------------------------------------------------------
0f3778d0 661# load($module)
662#
663# Loads a Perl module. Short circuits if a module is already loaded.
664# ----------------------------------------------------------------------
# Load a Perl module given its package name.  Returns 1 when the module
# is already in %INC or loads cleanly; otherwise records $@ through the
# class-level error() and returns its result.
sub load {
    my $package = shift;

    # Foo::Bar -> Foo/Bar.pm, the form used for %INC keys and require.
    ( my $file = $package ) =~ s[::][/]g;
    $file .= ".pm";

    # Short circuit: nothing to do for a module that is already loaded.
    return 1 if $INC{$file};

    eval {
        require $file;

        # NOTE(review): the invocant here is the file path string, not
        # the package name, so this looks like it never reaches the
        # module's own import() -- confirm before relying on it.
        $file->import(@_);
    };

    return __PACKAGE__->error($@) if $@;
    return 1;
}
16dc9970 677
67e5ff53 678# ----------------------------------------------------------------------
# Install or apply the table-name formatting callback.
#
#   format_table_name(\&code)         installs the callback and returns it
#   format_table_name(\&code, @names) installs it, then formats @names
#   format_table_name($name, ...)     returns the callback's result for
#                                     the arguments, or $name unchanged
#                                     when no callback is installed
sub format_table_name {
    my $self = shift;
    my $sub  = shift;

    if ( ref $sub eq 'CODE' ) {
        # Installing a formatter must not run it on the code ref itself.
        $self->{'_format_table_name'} = $sub;
        return @_ ? $sub->(@_) : $sub;
    }

    return $self->{'_format_table_name'}->( $sub, @_ )
        if defined $self->{'_format_table_name'};
    return $sub;
}
687
67e5ff53 688# ----------------------------------------------------------------------
# Install or apply the package-name formatting callback.
#
#   format_package_name(\&code)         installs the callback and returns it
#   format_package_name(\&code, @names) installs it, then formats @names
#   format_package_name($name, ...)     returns the callback's result for
#                                       the arguments, or $name unchanged
#                                       when no callback is installed
sub format_package_name {
    my $self = shift;
    my $sub  = shift;

    if ( ref $sub eq 'CODE' ) {
        # Installing a formatter must not run it on the code ref itself.
        $self->{'_format_package_name'} = $sub;
        return @_ ? $sub->(@_) : $sub;
    }

    return $self->{'_format_package_name'}->( $sub, @_ )
        if defined $self->{'_format_package_name'};
    return $sub;
}
697
67e5ff53 698# ----------------------------------------------------------------------
# Install or apply the foreign-key-name formatting callback.
#
#   format_fk_name(\&code)         installs the callback and returns it
#   format_fk_name(\&code, @names) installs it, then formats @names
#   format_fk_name($name, ...)     returns the callback's result for the
#                                  arguments, or $name unchanged when no
#                                  callback is installed
sub format_fk_name {
    my $self = shift;
    my $sub  = shift;

    if ( ref $sub eq 'CODE' ) {
        # Installing a formatter must not run it on the code ref itself.
        $self->{'_format_fk_name'} = $sub;
        return @_ ? $sub->(@_) : $sub;
    }

    return $self->{'_format_fk_name'}->( $sub, @_ )
        if defined $self->{'_format_fk_name'};
    return $sub;
}
707
67e5ff53 708# ----------------------------------------------------------------------
# Install or apply the primary-key-name formatting callback.
#
#   format_pk_name(\&code)         installs the callback and returns it
#   format_pk_name(\&code, @names) installs it, then formats @names
#   format_pk_name($name, ...)     returns the callback's result for the
#                                  arguments, or $name unchanged when no
#                                  callback is installed
sub format_pk_name {
    my $self = shift;
    my $sub  = shift;

    if ( ref $sub eq 'CODE' ) {
        # Installing a formatter must not run it on the code ref itself.
        $self->{'_format_pk_name'} = $sub;
        return @_ ? $sub->(@_) : $sub;
    }

    return $self->{'_format_pk_name'}->( $sub, @_ )
        if defined $self->{'_format_pk_name'};
    return $sub;
}
717
d529894e 718# ----------------------------------------------------------------------
0f3778d0 719# isa($ref, $type)
720#
721# Calls UNIVERSAL::isa($ref, $type). I think UNIVERSAL::isa is ugly,
722# but I like function overhead.
723# ----------------------------------------------------------------------
# Function-style shorthand for UNIVERSAL::isa($ref, $type); returns its
# result unchanged.
sub isa($$) {
    return UNIVERSAL::isa( $_[0], $_[1] );
}
c2d3a526 728
3f4af30d 729# ----------------------------------------------------------------------
# Get or set the "validate the schema before producing" flag.  A defined
# argument is stored as 1 or 0; the current value (1 or 0) is always
# returned.
sub validate {
    my $self = shift;
    my $flag = shift;

    if ( defined $flag ) {
        $self->{'validate'} = $flag ? 1 : 0;
    }

    return $self->{'validate'} || 0;
}
737
16dc9970 7381;
16dc9970 739
389b318c 740# ----------------------------------------------------------------------
741# Who killed the pork chops?
742# What price bananas?
743# Are you my Angel?
744# Allen Ginsberg
745# ----------------------------------------------------------------------
746
747=pod
0f3778d0 748
749=head1 NAME
750
954f31f1 751SQL::Translator - manipulate structured data definitions (SQL and more)
0f3778d0 752
753=head1 SYNOPSIS
754
755 use SQL::Translator;
756
67e5ff53 757 my $translator = SQL::Translator->new(
758 # Print debug info
759 debug => 1,
760 # Print Parse::RecDescent trace
761 trace => 0,
762 # Don't include comments in output
763 no_comments => 0,
764 # Print name mutations, conflicts
765 show_warnings => 0,
766 # Add "drop table" statements
767 add_drop_table => 1,
768 # Validate schema object
769 validate => 1,
f9a0c3b5 770 # Make all table names CAPS in producers which support this option
67e5ff53 771 format_table_name => sub {my $tablename = shift; return uc($tablename)},
f9a0c3b5 772 # Null-op formatting, only here for documentation's sake
7d5bcab8 773 format_package_name => sub {return shift},
774 format_fk_name => sub {return shift},
775 format_pk_name => sub {return shift},
0f3778d0 776 );
777
778 my $output = $translator->translate(
389b318c 779 from => 'MySQL',
780 to => 'Oracle',
f9a0c3b5 781 # Or an arrayref of filenames, i.e. [ $file1, $file2, $file3 ]
782 filename => $file,
0f3778d0 783 ) or die $translator->error;
784
785 print $output;
786
787=head1 DESCRIPTION
788
954f31f1 789The SQLFairy project began with the idea of simplifying the task of
790converting one database create syntax to another through the use of
791Parsers (which understand the source format) and Producers (which
792understand the destination format). The idea is that any Parser can
793be used with any Producer in the conversion process, so, if you
794wanted Postgres-to-Oracle, you would use the Postgres parser and the
795Oracle producer. The project has since grown to include parsing
796structured data files like Excel spreadsheets and delimited text files
797and the production of various documentation aids, such as images,
798graphs, POD, and HTML descriptions of the schema, as well as automatic
799code generators through the use of Class::DBI. Presently only the
800definition parts of SQL are handled (CREATE, ALTER), not the
801manipulation of data (INSERT, UPDATE, DELETE).
0f3778d0 802
803=head1 CONSTRUCTOR
804
5760246d 805The constructor is called C<new>, and accepts an optional hash of options.
0f3778d0 806Valid options are:
807
808=over 4
809
ca251f03 810=item *
811
812parser / from
813
814=item *
815
816parser_args
0f3778d0 817
ca251f03 818=item *
0f3778d0 819
ca251f03 820producer / to
0f3778d0 821
ca251f03 822=item *
0f3778d0 823
ca251f03 824producer_args
0f3778d0 825
ca251f03 826=item *
827
828filename / file
829
830=item *
831
832data
833
834=item *
0f3778d0 835
ca251f03 836debug
0f3778d0 837
389b318c 838=item *
839
840add_drop_table
841
842=item *
843
844no_comments
845
846=item *
847
848trace
849
850=item *
851
852validate
853
0f3778d0 854=back
855
856All options are, well, optional; these attributes can be set via
857instance methods. Internally, they are; no (non-syntactical)
858advantage is gained by passing options to the constructor.
859
860=head1 METHODS
861
5760246d 862=head2 add_drop_table
0f3778d0 863
864Toggles whether or not to add "DROP TABLE" statements just before the
865create definitions.
866
5760246d 867=head2 no_comments
0f3778d0 868
869Toggles whether to print comments in the output. Accepts a true or false
870value, returns the current value.
871
5760246d 872=head2 producer
0f3778d0 873
5760246d 874The C<producer> method is an accessor/mutator, used to retrieve or
0f3778d0 875define what subroutine is called to produce the output. A subroutine
876defined as a producer will be invoked as a function (I<not a method>)
ca251f03 877and passed 2 parameters: its container C<SQL::Translator> instance and a
0f3778d0 878data structure. It is expected that the function transform the data
ca251f03 879structure to a string. The C<SQL::Translator> instance is provided for
0f3778d0 880informational purposes; for example, the type of the parser can be
5760246d 881retrieved using the C<parser_type> method, and the C<error> and
882C<debug> methods can be called when needed.
0f3778d0 883
ca251f03 884When defining a producer, one of several things can be passed in: A
5760246d 885module name (e.g., C<My::Groovy::Producer>), a module name relative to
886the C<SQL::Translator::Producer> namespace (e.g., C<MySQL>), a module
ca251f03 887name and function combination (C<My::Groovy::Producer::transmogrify>),
0f3778d0 888or a reference to an anonymous subroutine. If a full module name is
889passed in (for the purposes of this method, a string containing "::"
890is considered to be a module name), it is treated as a package, and a
ca251f03 891function called "produce" will be invoked: C<$modulename::produce>.
892If $modulename cannot be loaded, the final portion is stripped off and
0f3778d0 893treated as a function. In other words, if there is no file named
ca251f03 894F<My/Groovy/Producer/transmogrify.pm>, C<SQL::Translator> will attempt
5760246d 895to load F<My/Groovy/Producer.pm> and use C<transmogrify> as the name of
896the function, instead of the default C<produce>.
0f3778d0 897
898 my $tr = SQL::Translator->new;
899
900 # This will invoke My::Groovy::Producer::produce($tr, $data)
901 $tr->producer("My::Groovy::Producer");
902
903 # This will invoke SQL::Translator::Producer::Sybase::produce($tr, $data)
904 $tr->producer("Sybase");
905
906 # This will invoke My::Groovy::Producer::transmogrify($tr, $data),
907 # assuming that My::Groovy::Producer::transmogrify is not a module
908 # on disk.
909 $tr->producer("My::Groovy::Producer::transmogrify");
910
911 # This will invoke the referenced subroutine directly, as
912 # $subref->($tr, $data);
913 $tr->producer(\&my_producer);
914
5760246d 915There is also a method named C<producer_type>, which returns a string
916containing the classname to which the above C<produce> function
0f3778d0 917belongs. In the case of anonymous subroutines, this method returns
918the string "CODE".
919
5760246d 920Finally, there is a method named C<producer_args>, which is both an
0f3778d0 921accessor and a mutator. Arbitrary data may be stored in name => value
922pairs for the producer subroutine to access:
923
924 sub My::Random::producer {
925 my ($tr, $data) = @_;
926 my $pr_args = $tr->producer_args();
927
928 # $pr_args is a hashref.
929
5760246d 930Extra data passed to the C<producer> method is passed to
931C<producer_args>:
0f3778d0 932
933 $tr->producer("xSV", delimiter => ',\s*');
934
935 # In SQL::Translator::Producer::xSV:
936 my $args = $tr->producer_args;
937 my $delimiter = $args->{'delimiter'}; # value is ,\s*
938
5760246d 939=head2 parser
0f3778d0 940
5760246d 941The C<parser> method defines or retrieves a subroutine that will be
0f3778d0 942called to perform the parsing. The basic idea is the same as that of
5760246d 943C<producer> (see above), except the default subroutine name is
ca251f03 944"parse", and will be invoked as C<$module_name::parse($tr, $data)>.
0f3778d0 945Also, the parser subroutine will be passed a string containing the
946entirety of the data to be parsed.
947
948 # Invokes SQL::Translator::Parser::MySQL::parse()
949 $tr->parser("MySQL");
950
951 # Invokes My::Groovy::Parser::parse()
952 $tr->parser("My::Groovy::Parser");
953
954 # Invoke an anonymous subroutine directly
955 $tr->parser(sub {
956 my $dumper = Data::Dumper->new([ $_[1] ], [ "SQL" ]);
957 $dumper->Purity(1)->Terse(1)->Deepcopy(1);
958 return $dumper->Dump;
959 });
960
5760246d 961There are also C<parser_type> and C<parser_args>, which perform
962analogously to C<producer_type> and C<producer_args>.
0f3778d0 963
5760246d 964=head2 show_warnings
0f3778d0 965
966Toggles whether to print warnings of name conflicts, identifier
967mutations, etc. Probably only generated by producers to let the user
968know when something won't translate very smoothly (e.g., MySQL "enum"
969fields into Oracle). Accepts a true or false value, returns the
970current value.
971
5760246d 972=head2 translate
0f3778d0 973
5760246d 974The C<translate> method calls the subroutines referenced by the
975C<parser> and C<producer> data members (described above). It accepts
0f3778d0 976as arguments a number of things, in key => value format, including
977(potentially) a parser and a producer (they are passed directly to the
5760246d 978C<parser> and C<producer> methods).
0f3778d0 979
5760246d 980Here is how the parameter list to C<translate> is parsed:
0f3778d0 981
982=over
983
984=item *
985
9861 argument means it's the data to be parsed, which could be a string
ca251f03 987(filename) or a reference to a scalar (a string stored in memory), or a
0f3778d0 988reference to a hash, which is parsed as being more than one argument
989(see next section).
990
991 # Parse the file /path/to/datafile
992 my $output = $tr->translate("/path/to/datafile");
993
994 # Parse the data contained in the string $data
995 my $output = $tr->translate(\$data);
996
997=item *
998
999More than 1 argument means it's a hash of things, and it might be
1000setting a parser, producer, or datasource (this key is named
1001"filename" or "file" if it's a file, or "data" for a SCALAR reference).
1002
1003 # As above, parse /path/to/datafile, but with different producers
1004 for my $prod ("MySQL", "XML", "Sybase") {
1005 print $tr->translate(
1006 producer => $prod,
1007 filename => "/path/to/datafile",
1008 );
1009 }
1010
1011 # The filename hash key could also be:
1012 datasource => \$data,
1013
1014You get the idea.
1015
1016=back
1017
5760246d 1018=head2 filename, data
0f3778d0 1019
5760246d 1020Using the C<filename> method, the filename of the data to be parsed
1021can be set. This method can be used in conjunction with the C<data>
1022method, below. If both the C<filename> and C<data> methods are
1023invoked as mutators, the data set in the C<data> method is used.
0f3778d0 1024
1025 $tr->filename("/my/data/files/create.sql");
1026
1027or:
1028
1029 my $create_script = do {
1030 local $/;
1031 open CREATE, "/my/data/files/create.sql" or die $!;
1032 <CREATE>;
1033 };
1034 $tr->data(\$create_script);
1035
5760246d 1036C<filename> takes a string, which is interpreted as a filename.
1037C<data> takes a reference to a string, which is used as the data to be
0f3778d0 1038parsed. If a filename is set, then that file is opened and read when
5760246d 1039the C<translate> method is called, as long as the data instance
0f3778d0 1040variable is not set.
1041
45ee6be0 1042=head2 schema
1043
1044Returns the SQL::Translator::Schema object.
1045
5760246d 1046=head2 trace
0f3778d0 1047
1048Turns on/off the tracing option of Parse::RecDescent.
1049
389b318c 1050=head2 validate
1051
1052Whether or not to validate the schema object after parsing and before
1053producing.
1054
7a8e1f51 1055=head1 AUTHORS
16dc9970 1056
ca251f03 1057Ken Y. Clark, E<lt>kclark@cpan.orgE<gt>,
1058darren chamberlain E<lt>darren@cpan.orgE<gt>,
1059Chris Mungall E<lt>cjm@fruitfly.orgE<gt>,
389b318c 1060Allen Day E<lt>allenday@users.sourceforge.netE<gt>,
1061Sam Angiuoli E<lt>angiuoli@users.sourceforge.netE<gt>,
1062Ying Zhang E<lt>zyolive@yahoo.comE<gt>,
1063Mike Mellilo E<lt>mmelillo@users.sourceforge.netE<gt>.
dfb4c915 1064
ca10f295 1065=head1 COPYRIGHT
16dc9970 1066
ca10f295 1067This program is free software; you can redistribute it and/or modify
1068it under the terms of the GNU General Public License as published by
1069the Free Software Foundation; version 2.
dfb4c915 1070
ca10f295 1071This program is distributed in the hope that it will be useful, but
1072WITHOUT ANY WARRANTY; without even the implied warranty of
1073MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
1074General Public License for more details.
16dc9970 1075
ca10f295 1076You should have received a copy of the GNU General Public License
1077along with this program; if not, write to the Free Software
1078Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307
1079USA
16dc9970 1080
87bf8a3a 1081=head1 BUGS
1082
1083Please use http://rt.cpan.org/ for reporting bugs.
1084
16dc9970 1085=head1 SEE ALSO
1086
abfa405a 1087L<perl>,
1088L<SQL::Translator::Parser>,
1089L<SQL::Translator::Producer>,
389b318c 1090L<Parse::RecDescent>,
1091L<GD>,
1092L<GraphViz>,
1093L<Text::RecordParser>,
1094L<Class::DBI>,
1095L<XML::Writer>.