X-Git-Url: http://git.shadowcat.co.uk/gitweb/gitweb.cgi?a=blobdiff_plain;f=lib%2FSQL%2FTranslator.pm;h=3847b5a43c4802bbb04cccd3ea12560a3049a747;hb=a37acd3a937cb798d3b0811c995bec3c9fb0a334;hp=899483970b57edd4aba74ded55013e566280c0ca;hpb=d529894ef96e6c243cecd566e1b6b6d3325b8127;p=dbsrgits%2FSQL-Translator.git

diff --git a/lib/SQL/Translator.pm b/lib/SQL/Translator.pm
index 8994839..3847b5a 100644
--- a/lib/SQL/Translator.pm
+++ b/lib/SQL/Translator.pm
@@ -1,44 +1,746 @@
 package SQL::Translator;

+use Moo;
+our ( $DEFAULT_SUB, $DEBUG, $ERROR );
+
+our $VERSION = '0.11016';
+$DEBUG = 0 unless defined $DEBUG;
+$ERROR = "";
+
+use Carp qw(carp croak);
+
+use Data::Dumper;
+use File::Find;
+use File::Spec::Functions qw(catfile);
+use File::Basename qw(dirname);
+use IO::Dir;
+use Sub::Quote qw(quote_sub);
+use SQL::Translator::Producer;
+use SQL::Translator::Schema;
+use SQL::Translator::Utils qw(throw ex2err carp_ro);
+
+# Default parser/producer: simply hands back the translator's schema object.
+$DEFAULT_SUB = sub { $_[0]->schema } unless defined $DEFAULT_SUB;
+
+with qw(
+    SQL::Translator::Role::Debug
+    SQL::Translator::Role::Error
+    SQL::Translator::Role::BuildArgs
+);
+
+# ----------------------------------------------------------------------
+# Normalise constructor arguments: map the 'from' / 'to' / 'file'
+# aliases onto 'parser' / 'producer' / 'filename', and fold the
+# deprecated quote_table_names / quote_field_names options into
+# quote_identifiers.
+# ----------------------------------------------------------------------
+around BUILDARGS => sub {
+    my $orig = shift;
+    my $self = shift;
+    my $config = $self->$orig(@_);
+
+    # If a 'parser' or 'from' parameter is passed in, use that as the
+    # parser; if a 'producer' or 'to' parameter is passed in, use that
+    # as the producer; both default to $DEFAULT_SUB.
+    $config->{parser} ||= $config->{from} if defined $config->{from};
+    $config->{producer} ||= $config->{to} if defined $config->{to};
+
+    $config->{filename} ||= $config->{file} if defined $config->{file};
+
+    my $quote;
+    if (defined $config->{quote_identifiers}) {
+        $quote = $config->{quote_identifiers};
+
+        for (qw/quote_table_names quote_field_names/) {
+            carp "Ignoring deprecated parameter '$_', since 'quote_identifiers' is supplied"
+                if defined $config->{$_}
+        }
+    }
+    # Legacy: exactly one of the two deprecated options is set
+    elsif (
+        defined $config->{'quote_table_names'}
+            xor
+        defined $config->{'quote_field_names'}
+    ) {
+        if (defined $config->{'quote_table_names'}) {
+            carp "Explicitly disabling the deprecated 'quote_table_names' implies disabling 'quote_identifiers' which in turn implies disabling 'quote_field_names'"
+                unless $config->{'quote_table_names'};
+            $quote = $config->{'quote_table_names'} ? 1 : 0;
+        }
+        else {
+            carp "Explicitly disabling the deprecated 'quote_field_names' implies disabling 'quote_identifiers' which in turn implies disabling 'quote_table_names'"
+                unless $config->{'quote_field_names'};
+            $quote = $config->{'quote_field_names'} ? 1 : 0;
+        }
+    }
+    # Legacy: both deprecated options are set; they must agree
+    elsif(defined $config->{'quote_table_names'}) {
+        croak 'Setting quote_table_names and quote_field_names to conflicting values is no longer supported'
+            if ($config->{'quote_table_names'} xor $config->{'quote_field_names'});
+
+        $quote = $config->{'quote_table_names'} ? 1 : 0;
+    }
+
+    $config->{quote_identifiers} = $quote if defined $quote;
+
+    return $config;
+};
+
+sub BUILD {
+    my ($self) = @_;
+    # Make sure all the tool-related stuff is set up: re-setting each
+    # value pushes it through the wrapped accessor (and thus _tool).
+    foreach my $tool (qw(producer parser)) {
+        $self->$tool($self->$tool);
+    }
+}
+
+# Simple boolean options; whatever is supplied is coerced to 1 or 0.
+has $_ => (
+    is => 'rw',
+    default => quote_sub(q{ 0 }),
+    coerce => quote_sub(q{ $_[0] ? 1 : 0 }),
+) foreach qw(add_drop_table no_comments show_warnings trace validate);
+
+# quote_identifiers is on by default, use a 0-but-true as indicator
+# so we can allow individual producers to change the default
+has quote_identifiers => (
+    is => 'rw',
+    default => quote_sub(q{ '0E0' }),
+    coerce => quote_sub(q{ $_[0] || 0 }),
+);
+
+# Deprecated proxies for quote_identifiers.  They return the current
+# quote_identifiers value and croak if called with an argument whose
+# truth differs from it.
+sub quote_table_names {
+    (@_ > 1 and ($_[1] xor $_[0]->quote_identifiers) )
+        ? croak 'Using quote_table_names as a setter is no longer supported'
+        : $_[0]->quote_identifiers;
+}
+
+sub quote_field_names {
+    (@_ > 1 and ($_[1] xor $_[0]->quote_identifiers) )
+        ? croak 'Using quote_field_names as a setter is no longer supported'
+        : $_[0]->quote_identifiers;
+}
+
+after quote_identifiers => sub {
+    if (@_ > 1) {
+        # synchronize for old code reaching directly into guts
+        $_[0]->{quote_table_names}
+            = $_[0]->{quote_field_names}
+            = $_[1] ? 1 : 0;
+    }
+};
+
+# producer / parser: the generated accessors are wrapped so that every
+# call is routed through _tool() with the matching namespace and
+# default sub name.
+has producer => ( is => 'rw', default => sub { $DEFAULT_SUB } );
+
+around producer => sub {
+    my $orig = shift;
+    shift->_tool({
+        orig => $orig,
+        name => 'producer',
+        path => "SQL::Translator::Producer",
+        default_sub => "produce",
+    }, @_);
+};
+
+has producer_type => ( is => 'rwp', init_arg => undef );
+
+around producer_type => carp_ro('producer_type');
+
+has producer_args => ( is => 'rw', default => quote_sub(q{ +{} }) );
+
+around producer_args => sub {
+    my $orig = shift;
+    shift->_args($orig, @_);
+};
+
+has parser => ( is => 'rw', default => sub { $DEFAULT_SUB } );
+
+around parser => sub {
+    my $orig = shift;
+    shift->_tool({
+        orig => $orig,
+        name => 'parser',
+        path => "SQL::Translator::Parser",
+        default_sub => "parse",
+    }, @_);
+};
+
+has parser_type => ( is => 'rwp', init_arg => undef );
+
+around parser_type => carp_ro('parser_type');
+
+has parser_args => ( is => 'rw', default => quote_sub(q{ +{} }) );
+
+around parser_args => sub {
+    my $orig = shift;
+    shift->_args($orig, @_);
+};
+
+# Filters are stored as an array ref of [ \&code, @args ] entries.
+# Entries that are not code refs are resolved with _load_sub(), looking
+# for a "filter" sub under the SQL::Translator::Filter base path.
+has filters => (
+    is => 'rw',
+    default => quote_sub(q{ [] }),
+    coerce => sub {
+        my @filters;
+        # Set. Convert args to list of [\&code,@args]
+        foreach (@{$_[0]||[]}) {
+            my ($filt,@args) = ref($_) eq "ARRAY" ? @$_ : $_;
+            if ( isa($filt,"CODE") ) {
+                push @filters, [$filt,@args];
+                next;
+            }
+            else {
+                __PACKAGE__->debug("Adding $filt filter. Args:".Dumper(\@args)."\n");
+                $filt = _load_sub("$filt\::filter", "SQL::Translator::Filter")
+                    || throw(__PACKAGE__->error);
+                push @filters, [$filt,@args];
+            }
+        }
+        return \@filters;
+    },
+);
+
+# With arguments: append them to the current filter list.  Always
+# returns the filters as a list (not as the stored array ref).
+around filters => sub {
+    my $orig = shift;
+    my $self = shift;
+    return @{$self->$orig([@{$self->$orig}, @_])} if @_;
+    return @{$self->$orig};
+};
+
+# Input file name, or an array ref of file names.  Each one must be a
+# readable plain file; directories are rejected explicitly.
+has filename => (
+    is => 'rw',
+    isa => sub {
+        foreach my $filename (ref($_[0]) eq 'ARRAY' ? @{$_[0]} : $_[0]) {
+            if (-d $filename) {
+                throw("Cannot use directory '$filename' as input source");
+            }
+            # "_" reuses the stat buffer filled by the -d test above
+            elsif (not -f _ && -r _) {
+                throw("Cannot use '$filename' as input source: ".
+                    "file does not exist or is not readable.");
+            }
+        }
+    },
+);
+
+around filename => \&ex2err;
+
+# The source text.  Always stored as a reference to a string; built
+# lazily from filename (see _build_data) when not set explicitly.
+has data => (
+    is => 'rw',
+    builder => 1,
+    lazy => 1,
+    coerce => sub {
+        # Set $self->data based on what was passed in. We will
+        # accept a number of things; do our best to get it right.
+        my $data = shift;
+        if (isa($data, 'ARRAY')) {
+            $data = join '', @$data;
+        }
+        elsif (isa($data, 'GLOB')) {
+            seek ($data, 0, 0) if eof ($data);
+            local $/;
+            $data = <$data>;
+        }
+        return isa($data, 'SCALAR') ? $data : \$data;
+    },
+);
+
+# Setter convenience: several plain strings are joined into one string.
+# The getter path goes through ex2err.
+around data => sub {
+    my $orig = shift;
+    my $self = shift;
+
+    if (@_ > 1 && !ref $_[0]) {
+        return $self->$orig(\join('', @_));
+    }
+    elsif (@_) {
+        return $self->$orig(@_);
+    }
+    return ex2err($orig, $self);
+};
+
+sub _build_data {
+    my $self = shift;
+    # If we have a filename but no data yet, populate.
+    if (my $filename = $self->filename) {
+        $self->debug("Opening '$filename' to get contents.\n");
+        local $/;
+        my $data;
+
+        my @files = ref($filename) eq 'ARRAY' ? @$filename : ($filename);
+
+        # The contents of all files are concatenated in the order given.
+        foreach my $file (@files) {
+            open my $fh, '<', $file
+                or throw("Can't read file '$file': $!");
+
+            $data .= <$fh>;
+
+            close $fh or throw("Can't close file '$file': $!");
+        }
+
+        return \$data;
+    }
+}
+
+# The schema object is created on first access (see _build_schema);
+# reset() clears it.
+has schema => (
+    is => 'lazy',
+    init_arg => undef,
+    clearer => 'reset',
+    predicate => '_has_schema',
+);
+
+around schema => carp_ro('schema');
+
+# reset always returns 1, whatever the generated clearer returns.
+around reset => sub {
+    my $orig = shift;
+    my $self = shift;
+    $self->$orig(@_);
+    return 1
+};
+
+sub _build_schema { SQL::Translator::Schema->new(translator => shift) }
+
+# ----------------------------------------------------------------------
+# translate(\%args | $fh | \$data | $filename | %args)
+#
+# Runs the parser (unless a schema already exists), the optional
+# validation, the filters and finally the producer.  Returns the
+# producer output (as a list in list context); on failure returns
+# whatever $self->error($msg) returns.
+# ----------------------------------------------------------------------
+sub translate {
+    my $self = shift;
+    my ($args, $parser, $parser_type, $producer, $producer_type);
+    my ($parser_output, $producer_output, @producer_output);
+
+    # Parse arguments
+    if (@_ == 1) {
+        # Passed a reference to a hash?
+        if (isa($_[0], 'HASH')) {
+            # yep, a hashref
+            $self->debug("translate: Got a hashref\n");
+            $args = $_[0];
+        }
+
+        # Passed a GLOB reference, i.e., filehandle
+        elsif (isa($_[0], 'GLOB')) {
+            $self->debug("translate: Got a GLOB reference\n");
+            $self->data($_[0]);
+        }
+
+        # Passed a reference to a string containing the data
+        elsif (isa($_[0], 'SCALAR')) {
+            # passed a ref to a string
+            $self->debug("translate: Got a SCALAR reference (string)\n");
+            $self->data($_[0]);
+        }
+
+        # Not a reference; treat it as a filename
+        elsif (! ref $_[0]) {
+            # Not a ref, it's a filename
+            $self->debug("translate: Got a filename\n");
+            $self->filename($_[0]);
+        }
+
+        # Passed something else entirely.
+        else {
+            # We're not impressed. Take your empty string and leave.
+            # return "";
+
+            # Actually, if data, parser, and producer are set, then we
+            # can continue. Too bad, because I like my comment
+            # (above)...
+            return "" unless ($self->data &&
+                              $self->producer &&
+                              $self->parser);
+        }
+    }
+    else {
+        # You must pass in a hash, or you get nothing.
+        return "" if @_ % 2;
+        $args = { @_ };
+    }
+
+    # ----------------------------------------------------------------------
+    # Can specify the data to be transformed using "filename", "file",
+    # "data", or "datasource".
+    # ----------------------------------------------------------------------
+    if (my $filename = ($args->{'filename'} || $args->{'file'})) {
+        $self->filename($filename);
+    }
+
+    if (my $data = ($args->{'data'} || $args->{'datasource'})) {
+        $self->data($data);
+    }
+
+    # ----------------------------------------------------------------
+    # Get the data.
+    # ----------------------------------------------------------------
+    my $data = $self->data;
+
+    # ----------------------------------------------------------------
+    # Local reference to the parser subroutine
+    # ----------------------------------------------------------------
+    if ($parser = ($args->{'parser'} || $args->{'from'})) {
+        $self->parser($parser);
+    }
+    $parser = $self->parser;
+    $parser_type = $self->parser_type;
+
+    # ----------------------------------------------------------------
+    # Local reference to the producer subroutine
+    # ----------------------------------------------------------------
+    if ($producer = ($args->{'producer'} || $args->{'to'})) {
+        $self->producer($producer);
+    }
+    $producer = $self->producer;
+    $producer_type = $self->producer_type;
+
+    # ----------------------------------------------------------------
+    # Execute the parser, the filters and then execute the producer.
+    # Allowances are made for each piece to die, or fail to compile,
+    # since the referenced subroutines could be almost anything. In
+    # the future, each of these might happen in a Safe environment,
+    # depending on how paranoid we want to be.
+    # ----------------------------------------------------------------
+
+    # Run parser
+    unless ( $self->_has_schema ) {
+        eval { $parser_output = $parser->($self, $$data) };
+        if ($@ || ! $parser_output) {
+            my $msg = sprintf "translate: Error with parser '%s': %s",
+                $parser_type, ($@) ? $@ : " no results";
+            return $self->error($msg);
+        }
+    }
+    $self->debug("Schema =\n", Dumper($self->schema), "\n");
+
+    # Validate the schema if asked to.
+    if ($self->validate) {
+        my $schema = $self->schema;
+        return $self->error('Invalid schema') unless $schema->is_valid;
+    }
+
+    # Run filters
+    my $filt_num = 0;
+    foreach ($self->filters) {
+        $filt_num++;
+        my ($code,@args) = @$_;
+        eval { $code->($self->schema, @args) };
+        my $err = $@ || $self->error || 0;
+        return $self->error("Error with filter $filt_num : $err") if $err;
+    }
+
+    # Run producer
+    # Calling wantarray in the eval no work, wrong scope.
+    my $wantarray = wantarray ? 1 : 0;
+    eval {
+        if ($wantarray) {
+            @producer_output = $producer->($self);
+        } else {
+            $producer_output = $producer->($self);
+        }
+    };
+    if ($@ || !( $producer_output || @producer_output)) {
+        my $err = $@ || $self->error || "no results";
+        my $msg = "translate: Error with producer '$producer_type': $err";
+        return $self->error($msg);
+    }
+
+    return wantarray ? @producer_output : $producer_output;
+}
+
+sub list_parsers {
+    return shift->_list("parser");
+}
+
+sub list_producers {
+    return shift->_list("producer");
+}
+
+
+# ======================================================================
+# Private Methods
+# ======================================================================
+
+# ----------------------------------------------------------------------
+# _args($orig, \%args);
+#
+# Gets or sets ${type}_args. Called by parser_args and producer_args,
+# which pass in their original accessor as $orig.  New values are
+# merged into the existing hash; a leading undef clears it first.
+# ----------------------------------------------------------------------
+sub _args {
+    my $self = shift;
+    my $orig = shift;
+
+    if (@_) {
+        # If the first argument is an explicit undef (remember, we
+        # don't get here unless there is stuff in @_), then we clear
+        # out the producer_args hash.
+        if (! defined $_[0]) {
+            shift @_;
+            $self->$orig({});
+        }
+
+        my $args = isa($_[0], 'HASH') ? shift : { @_ };
+        return $self->$orig({ %{$self->$orig}, %$args });
+    }
+
+    return $self->$orig;
+}
+
 # ----------------------------------------------------------------------
-# $Id: Translator.pm,v 1.12 2002-11-22 03:03:40 kycl4rk Exp $
+# Does the get/set work for parser and producer. e.g.
+# return $self->_tool({
+#   name => 'producer',
+#   path => "SQL::Translator::Producer",
+#   default_sub => "produce",
+# }, @_);
+# ----------------------------------------------------------------------
+sub _tool {
+    my ($self,$args) = (shift, shift);
+    my $name = $args->{name};
+    my $orig = $args->{orig};
+    return $self->{$name} unless @_; # get accessor
+
+    my $path = $args->{path};
+    my $default_sub = $args->{default_sub};
+    my $tool = shift;
+
+    # passed an anonymous subroutine reference
+    if (isa($tool, 'CODE')) {
+        $self->$orig($tool);
+        $self->${\"_set_${name}_type"}("CODE");
+        $self->debug("Got $name: code ref\n");
+    }
+
+    # Module name was passed directly
+    # We try to load the name; if it doesn't load, there's a
+    # possibility that it has a function name attached to it,
+    # so we give it a go.
+    else {
+        # Dashes are accepted as package separators (e.g. "Foo-Bar")
+        $tool =~ s/-/::/g if $tool !~ /::/;
+        my ($code,$sub);
+        ($code,$sub) = _load_sub("$tool\::$default_sub", $path);
+        unless ($code) {
+            if ( __PACKAGE__->error =~ m/Can't find module/ ) {
+                # Mod not found so try sub
+                ($code,$sub) = _load_sub("$tool", $path) unless $code;
+                die "Can't load $name subroutine '$tool' : ".__PACKAGE__->error
+                    unless $code;
+            }
+            else {
+                die "Can't load $name '$tool' : ".__PACKAGE__->error;
+            }
+        }
+
+        # get code reference and assign
+        my (undef,$module,undef) = $sub =~ m/((.*)::)?(\w+)$/;
+        $self->$orig($code);
+        $self->${\"_set_$name\_type"}($sub eq "CODE" ? "CODE" : $module);
+        $self->debug("Got $name: $sub\n");
+    }
+
+    # At this point, $self->{$name} contains a subroutine
+    # reference that is ready to run
+
+    # Anything left? If so, it's args
+    my $meth = "$name\_args";
+    $self->$meth(@_) if (@_);
+
+    return $self->{$name};
+}
+
+# ----------------------------------------------------------------------
+# _list($type)
+#
+# Returns the sorted names of the modules found below
+# SQL/Translator/<Type> in any @INC directory.
+# ----------------------------------------------------------------------
+sub _list {
+    my $self = shift;
+    my $type = shift || return ();
+    my $uctype = ucfirst lc $type;
+
+    #
+    # First find all the directories where SQL::Translator
+    # parsers or producers (the "type") appear to live.
+    #
+    load("SQL::Translator::$uctype") or return ();
+    my $path = catfile "SQL", "Translator", $uctype;
+    my @dirs;
+    for (@INC) {
+        my $dir = catfile $_, $path;
+        $self->debug("_list_${type}s searching $dir\n");
+        next unless -d $dir;
+        push @dirs, $dir;
+    }
+
+    #
+    # Now use File::Find::find to look recursively in those
+    # directories for all the *.pm files, then present them
+    # with the slashes turned into dashes.
+    #
+    my %found;
+    find(
+        sub {
+            if ( -f && m/\.pm$/ ) {
+                my $mod = $_;
+                $mod =~ s/\.pm$//;
+                my $cur_dir = $File::Find::dir;
+                my $base_dir = quotemeta catfile 'SQL', 'Translator', $uctype;
+
+                #
+                # See if the current directory is below the base directory.
+                #
+                if ( $cur_dir =~ m/$base_dir(.*)/ ) {
+                    $cur_dir = $1;
+                    $cur_dir =~ s!^/!!; # kill leading slash
+                    $cur_dir =~ s!/!-!g; # turn other slashes into dashes
+                }
+                else {
+                    $cur_dir = '';
+                }
+
+                $found{ join '-', map { $_ || () } $cur_dir, $mod } = 1;
+            }
+        },
+        @dirs
+    );
+
+    return sort { lc $a cmp lc $b } keys %found;
+}
+
 # ----------------------------------------------------------------------
-# Copyright (C) 2002 Ken Y. Clark ,
-# darren chamberlain
+# load(MODULE [,PATH[,PATH]...])
+#
+# Loads a Perl module. Short circuits if a module is already loaded.
+#
+# MODULE - is the name of the module to load.
 #
-# This program is free software; you can redistribute it and/or
-# modify it under the terms of the GNU General Public License as
-# published by the Free Software Foundation; version 2.
+# PATH - optional list of 'package paths' to look for the module in. e.g
+#   If you called load('Super::Foo' => 'My', 'Other') it will
+#   try to load the mod Super::Foo then My::Super::Foo then Other::Super::Foo.
 #
-# This program is distributed in the hope that it will be useful, but
-# WITHOUT ANY WARRANTY; without even the implied warranty of
-# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
-# General Public License for more details.
+# Returns package name of the module actually loaded or false and sets error.
 #
-# You should have received a copy of the GNU General Public License
-# along with this program; if not, write to the Free Software
-# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
-# 02111-1307 USA
-# -------------------------------------------------------------------
+# Note, you can't load a name from the root namespace (ie one without '::' in
+# it), therefore a single word name without a path fails.
+# ----------------------------------------------------------------------
+sub load {
+    my $name = shift;
+    my @path;
+    push @path, "" if $name =~ /::/; # Empty path to check name on its own first
+    push @path, @_ if @_;
+
+    foreach (@path) {
+        my $module = $_ ? "$_\::$name" : $name;
+        my $file = $module; $file =~ s[::][/]g; $file .= ".pm";
+        __PACKAGE__->debug("Loading $name as $file\n");
+        return $module if $INC{$file}; # Already loaded
+
+        eval { require $file };
+        # Not found under this prefix: try the next one
+        next if $@ =~ /Can't locate $file in \@INC/;
+        eval { $module->import() } unless $@;
+        return __PACKAGE__->error("Error loading $name as $module : $@")
+            if $@ && $@ !~ /"SQL::Translator::Producer" is not exported/;
+
+        return $module; # Module loaded ok
+    }
+
+    return __PACKAGE__->error("Can't find module $name. Path:".join(",",@path));
+}
+
+# ----------------------------------------------------------------------
+# Load the sub name given (including package), optionally using a base package
+# path. Returns code ref and name of sub loaded, including its package.
+# (\&code, $sub) = _load_sub( 'MySQL::produce', "SQL::Translator::Producer" );
+# (\&code, $sub) = _load_sub( 'MySQL::produce', @path );
+# In scalar context only the code ref is returned.
+# ----------------------------------------------------------------------
+sub _load_sub {
+    my ($tool, @path) = @_;
+
+    my (undef,$module,$func_name) = $tool =~ m/((.*)::)?(\w+)$/;
+    if ( my $module = load($module => @path) ) {
+        my $sub = "$module\::$func_name";
+        return wantarray ? ( \&{ $sub }, $sub ) : \&$sub;
+    }
+    return undef;
+}
+
+sub format_table_name {
+    return shift->_format_name('_format_table_name', @_);
+}
+
+sub format_package_name {
+    return shift->_format_name('_format_package_name', @_);
+}
+
+sub format_fk_name {
+    return shift->_format_name('_format_fk_name', @_);
+}
+
+sub format_pk_name {
+    return shift->_format_name('_format_pk_name', @_);
+}
+
+# ----------------------------------------------------------------------
+# The other format_*_name methods rely on this one. It optionally
+# accepts a subroutine ref as the first argument (or uses an identity
+# sub if one isn't provided or it doesn't already exist), and applies
+# it to the rest of the arguments (if any).  With no remaining
+# arguments the stored subroutine ref itself is returned.
+# ----------------------------------------------------------------------
+sub _format_name {
+    my $self = shift;
+    my $field = shift;
+    my @args = @_;
+
+    if (ref($args[0]) eq 'CODE') {
+        $self->{$field} = shift @args;
+    }
+    elsif (! exists $self->{$field}) {
+        $self->{$field} = sub { return shift };
+    }
+
+    return @args ? $self->{$field}->(@args) : $self->{$field};
+}
+
+# Function-style wrapper around UNIVERSAL::isa, used throughout this
+# file to test what kind of reference (or object) was passed in.
+sub isa($$) {
+    my ($ref, $type) = @_;
+    return UNIVERSAL::isa($ref, $type);
+}
+
+sub version {
+    my $self = shift;
+    return $VERSION;
+}
+
+# Must come after all 'has' declarations
+around new => \&ex2err;
+
+1;
+
+# ----------------------------------------------------------------------
+# Who killed the pork chops?
+# What price bananas?
+# Are you my Angel?
+# Allen Ginsberg
+# ----------------------------------------------------------------------
+
+=pod

 =head1 NAME

-SQL::Translator - convert schema from one database to another
+SQL::Translator - manipulate structured data definitions (SQL and more)

 =head1 SYNOPSIS

   use SQL::Translator;

-  my $translator = SQL::Translator->new(
-      xlate => $xlate || {}, # Overrides for field translation
-      debug => $debug, # Print debug info
-      trace => $trace, # Print Parse::RecDescent trace
-      no_comments => $no_comments, # Don't include comments in output
+  my $translator = SQL::Translator->new(
+      # Print debug info
+      debug => 1,
+      # Print Parse::RecDescent trace
+      trace => 0,
+      # Don't include comments in output
+      no_comments => 0,
+      # Print name mutations, conflicts
+      show_warnings => 0,
+      # Add "drop table" statements
+      add_drop_table => 1,
+      # to quote or not to quote, that's the question
+      quote_identifiers => 1,
+      # Validate schema object
+      validate => 1,
+      # Make all table names CAPS in producers which support this option
+      format_table_name => sub {my $tablename = shift; return uc($tablename)},
+      # Null-op formatting, only here for documentation's sake
+      format_package_name => sub {return shift},
+      format_fk_name => sub {return shift},
+      format_pk_name => sub {return shift},
   );

   my $output = $translator->translate(
-      from => "MySQL",
-      to => "Oracle",
+      from => 'MySQL',
+      to => 'Oracle',
+      # Or an arrayref of filenames, i.e. [ $file1, $file2, $file3 ]
       filename => $file,
   ) or die $translator->error;

@@ -46,189 +748,148 @@ SQL::Translator - convert schema from one database to another

 =head1 DESCRIPTION

-This module attempts to simplify the task of converting one database
-create syntax to another through the use of Parsers (which understand
-the sourced format) and Producers (which understand the destination
-format). The idea is that any Parser can be used with any Producer in
-the conversion process. So, if you wanted PostgreSQL-to-Oracle, you
-would use the PostgreSQL parser and the Oracle producer.
+This documentation covers the API for SQL::Translator. For a more general
+discussion of how to use the modules and scripts, please see
+L<SQL::Translator::Manual>.
+
+SQL::Translator is a group of Perl modules that converts
+vendor-specific SQL table definitions into other formats, such as
+other vendor-specific SQL, ER diagrams, documentation (POD and HTML),
+XML, and Class::DBI classes. The main focus of SQL::Translator is
+SQL, but parsers exist for other structured data formats, including
+Excel spreadsheets and arbitrarily delimited text files. Through the
+separation of the code into parsers and producers with an object model
+in between, it's possible to combine any parser with any producer, to
+plug in custom parsers or producers, or to manipulate the parsed data
+via the built-in object model. Presently only the definition parts of
+SQL are handled (CREATE, ALTER), not the manipulation of data (INSERT,
+UPDATE, DELETE).

-=cut
+=head1 CONSTRUCTOR

-use strict;
-use vars qw( $VERSION $REVISION $DEFAULT_SUB $DEBUG $ERROR );
-use base 'Class::Base';
+The constructor is called C<new>, and accepts an optional hash of options.
+Valid options are:

-$VERSION = '0.01';
-$REVISION = sprintf "%d.%02d", q$Revision: 1.12 $ =~ /(\d+)\.(\d+)/;
-$DEBUG = 0 unless defined $DEBUG;
-$ERROR = "";
+=over 4

-use Carp qw(carp);
+=item *

-use File::Spec::Functions qw(catfile);
-use File::Basename qw(dirname);
-use IO::Dir;
+parser / from

-# ----------------------------------------------------------------------
-# The default behavior is to "pass through" values (note that the
-# SQL::Translator instance is the first value ($_[0]), and the stuff
-# to be parsed is the second value ($_[1])
-# ----------------------------------------------------------------------
-$DEFAULT_SUB = sub { $_[1] } unless defined $DEFAULT_SUB;
+=item *

-=head1 CONSTRUCTOR
+parser_args
+
+=item *
+
+producer / to
+
+=item *
+
+producer_args
+
+=item *
+
+filters
+
+=item *
+
+filename / file
+
+=item *
+
+data
+
+=item *

-The constructor is called B<new>, and accepts a optional hash of options.
-Valid options are:
+debug

-=over 4
+=item *

-=item parser (aka from)
+add_drop_table

-=item parser_args
+=item *

-=item producer (aka to)
+quote_identifiers

-=item producer_args
+=item *

-=item filename (aka file)
+quote_table_names (DEPRECATED)

-=item data
+=item *

-=item debug
+quote_field_names (DEPRECATED)

-=back
+=item *

-All options are, well, optional; these attributes can be set via
-instance methods. Internally, they are; no (non-syntactical)
-advantage is gained by passing options to the constructor.
+no_comments

-=cut
+=item *

-# ----------------------------------------------------------------------
-# init([ARGS])
-# The constructor.
-#
-# new takes an optional hash of arguments. These arguments may
-# include a parser, specified with the keys "parser" or "from",
-# and a producer, specified with the keys "producer" or "to".
-#
-# The values that can be passed as the parser or producer are
-# given directly to the parser or producer methods, respectively.
-# See the appropriate method description below for details about
-# what each expects/accepts.
-# ----------------------------------------------------------------------
-sub init {
-    my ( $self, $config ) = @_;
+trace

-    #
-    # Set the parser and producer.
-    #
-    # If a 'parser' or 'from' parameter is passed in, use that as the
-    # parser; if a 'producer' or 'to' parameter is passed in, use that
-    # as the producer; both default to $DEFAULT_SUB.
-    #
-    $self->parser ($config->{'parser'} || $config->{'from'} || $DEFAULT_SUB);
-    $self->producer($config->{'producer'} || $config->{'to'} || $DEFAULT_SUB);
+=item *

-    #
-    # Set the parser_args and producer_args
-    #
-    for my $pargs ( qw[ parser_args producer_args ] ) {
-        $self->$pargs( $config->{$pargs} ) if defined $config->{ $pargs };
-    }
+validate

-    #
-    # Set the data source, if 'filename' or 'file' is provided.
-    #
-    $config->{'filename'} ||= $config->{'file'} || "";
-    $self->filename( $config->{'filename'} ) if $config->{'filename'};
+=back

-    #
-    # Finally, if there is a 'data' parameter, use that in
-    # preference to filename and file
-    #
-    if ( my $data = $config->{'data'} ) {
-        $self->data( $data );
-    }
+All options are, well, optional; these attributes can be set via
+instance methods. Internally, they are; no (non-syntactical)
+advantage is gained by passing options to the constructor.

-    #
-    # Set various other options.
-    #
-    $self->{'debug'} = defined $config->{'debug'} ? $config->{'debug'} : $DEBUG;
+=head1 METHODS

-    $self->trace( $config->{'trace'} );
-
-    $self->custom_translate( $config->{'xlate'} );
+=head2 add_drop_table

-    $self->no_comments( $config->{'no_comments'} );
+Toggles whether or not to add "DROP TABLE" statements just before the
+create definitions.

-    return $self;
-}
+=head2 quote_identifiers

-=head1 METHODS
+Toggles whether or not to quote identifiers (table, column, constraint, etc.)
+with a quoting mechanism suitable for the chosen Producer. The default (true)
+is to quote them.
-# ---------------------------------------------------------------------- -=head2 B +=head2 quote_table_names -Allows the user to override default translation of fields. For example, -if a MySQL "text" field would normally be converted to a "long" for Oracle, -the user could specify to change it to a "CLOB." Accepts a hashref where -keys are the "from" value and values are the "to," returns the current -value of the field. +DEPRECATED - A legacy proxy to L -=cut +=head2 quote_field_names -sub custom_translate { - my $self = shift; - $self->{'custom_translate'} = shift if @_; - return $self->{'custom_translate'} || {}; -} +DEPRECATED - A legacy proxy to L -# ---------------------------------------------------------------------- -=head2 B +=head2 no_comments Toggles whether to print comments in the output. Accepts a true or false value, returns the current value. -=cut - -sub no_comments { - my $self = shift; - my $arg = shift; - if ( defined $arg ) { - $self->{'no_comments'} = $arg ? 1 : 0; - } - return $self->{'no_comments'} || 0; -} - -# ---------------------------------------------------------------------- -=head2 B +=head2 producer -The B method is an accessor/mutator, used to retrieve or +The C method is an accessor/mutator, used to retrieve or define what subroutine is called to produce the output. A subroutine -defined as a producer will be invoked as a function (not a method) and -passed 2 parameters: its container SQL::Translator instance and a -data structure. It is expected that the function transform the data -structure to a string. The SQL::Transformer instance is provided for -informational purposes; for example, the type of the parser can be -retrieved using the B method, and the B and -B methods can be called when needed. 
-
-When defining a producer, one of several things can be passed
-in: A module name (e.g., My::Groovy::Producer), a module name
-relative to the SQL::Translator::Producer namespace (e.g., MySQL), a
-module name and function combination (My::Groovy::Producer::transmogrify),
+defined as a producer will be invoked as a function (I<not a method>)
+and passed its container C<SQL::Translator> instance, which it should
+call the C<schema> method on, to get the C<SQL::Translator::Schema>
+generated by the parser. It is expected that the function transform the
+schema structure to a string. The C<SQL::Translator> instance is also useful
+for informational purposes; for example, the type of the parser can be
+retrieved using the C<parser_type> method, and the C<error> and
+C<debug> methods can be called when needed.
+
+When defining a producer, one of several things can be passed in: A
+module name (e.g., C<My::Groovy::Producer>), a module name relative to
+the C<SQL::Translator::Producer> namespace (e.g., C<MySQL>), a module
+name and function combination (C<My::Groovy::Producer::transmogrify>),
 or a reference to an anonymous subroutine. If a full module name is
 passed in (for the purposes of this method, a string containing "::"
 is considered to be a module name), it is treated as a package, and a
-function called "produce" will be invoked: $modulename::produce. If
-$modulename cannot be loaded, the final portion is stripped off and
+function called "produce" will be invoked: C<$modulename::produce>.
+If $modulename cannot be loaded, the final portion is stripped off and
 treated as a function. In other words, if there is no file named
-My/Groovy/Producer/transmogrify.pm, SQL::Translator will attempt to load
-My/Groovy/Producer.pm and use transmogrify as the name of the function,
-instead of the default "produce".
+F<My/Groovy/Producer/transmogrify.pm>, C<SQL::Translator> will attempt
+to load F<My/Groovy/Producer.pm> and use C<transmogrify> as the name of
+the function, instead of the default C<produce>.

     my $tr = SQL::Translator->new;

@@ -247,12 +908,12 @@ instead of the default "produce".
# $subref->($tr, $data); $tr->producer(\&my_producer); -There is also a method named B, which is a string -containing the classname to which the above B function +There is also a method named C, which is a string +containing the classname to which the above C function belongs. In the case of anonymous subroutines, this method returns the string "CODE". -Finally, there is a method named B, which is both an +Finally, there is a method named C, which is both an accessor and a mutator. Arbitrary data may be stored in name => value pairs for the producer subroutine to access: @@ -262,8 +923,8 @@ pairs for the producer subroutine to access: # $pr_args is a hashref. -Extra data passed to the B method is passed to -B: +Extra data passed to the C method is passed to +C: $tr->producer("xSV", delimiter => ',\s*'); @@ -271,107 +932,14 @@ B: my $args = $tr->producer_args; my $delimiter = $args->{'delimiter'}; # value is ,\s* -=cut - -# producer and producer_type -sub producer { - my $self = shift; - - # producer as a mutator - if (@_) { - my $producer = shift; - - # Passed a module name (string containing "::") - if ($producer =~ /::/) { - my $func_name; - - # Module name was passed directly - # We try to load the name; if it doesn't load, there's - # a possibility that it has a function name attached to - # it. - if (load($producer)) { - $func_name = "produce"; - } - - # Module::function was passed - else { - # Passed Module::Name::function; try to recover - my @func_parts = split /::/, $producer; - $func_name = pop @func_parts; - $producer = join "::", @func_parts; - - # If this doesn't work, then we have a legitimate - # problem. 
- load($producer) or die "Can't load $producer: $@"; - } - - # get code reference and assign - $self->{'producer'} = \&{ "$producer\::$func_name" }; - $self->{'producer_type'} = $producer; - $self->debug("Got producer: $producer\::$func_name\n"); - } - - # passed an anonymous subroutine reference - elsif (isa($producer, 'CODE')) { - $self->{'producer'} = $producer; - $self->{'producer_type'} = "CODE"; - $self->debug("Got producer: code ref\n"); - } - - # passed a string containing no "::"; relative package name - else { - my $Pp = sprintf "SQL::Translator::Producer::$producer"; - load($Pp) or die "Can't load $Pp: $@"; - $self->{'producer'} = \&{ "$Pp\::produce" }; - $self->{'producer_type'} = $Pp; - $self->debug("Got producer: $Pp\n"); - } - - # At this point, $self->{'producer'} contains a subroutine - # reference that is ready to run - - # Anything left? If so, it's producer_args - $self->producer_args(@_) if (@_); - } - - return $self->{'producer'}; -}; - -# ---------------------------------------------------------------------- -# producer_type -# -# producer_type is an accessor that allows producer subs to get -# information about their origin. This is poptentially important; -# since all producer subs are called as subroutine refernces, there is -# no way for a producer to find out which package the sub lives in -# originally, for example. -# ---------------------------------------------------------------------- -sub producer_type { $_[0]->{'producer_type'} } - -# ---------------------------------------------------------------------- -# producer_args -# -# Arbitrary name => value pairs of paramters can be passed to a -# producer using this method. -# ---------------------------------------------------------------------- -sub producer_args { - my $self = shift; - if (@_) { - my $args = isa($_[0], 'HASH') ? 
shift : { @_ }; - $self->{'producer_args'} = $args; - } - $self->{'producer_args'}; -} - -# ---------------------------------------------------------------------- -=head2 B<parser> +=head2 parser -The B<parser> method defines or retrieves a subroutine that will be +The C<parser> method defines or retrieves a subroutine that will be called to perform the parsing. The basic idea is the same as that of -B<producer> (see above), except the default subroutine name is -"parse", and will be invoked as $module_name::parse($tr, $data). +C<producer> (see above), except the default subroutine name is +"parse", and will be invoked as C<$module_name::parse($tr, $data)>. Also, the parser subroutine will be passed a string containing the -entirety of the data to be parsed (or possibly a reference to a string?). +entirety of the data to be parsed. # Invokes SQL::Translator::Parser::MySQL::parse() $tr->parser("MySQL"); @@ -386,104 +954,84 @@ entirety of the data to be parsed (or possibly a reference to a string?). return $dumper->Dump; }); -There is also B<parser_type> and B<parser_args>, which perform -analogously to B<producer_type> and B<producer_args> - -=cut - -sub parser { - my $self = shift; - - # parser as a mutator - if (@_) { - my $parser = shift; - - # Passed a module name (string containing "::") - if ($parser =~ /::/) { - my $func_name; - - # Module name was passed directly - # We try to load the name; if it doesn't load, there's - # a possibility that it has a function name attached to - # it. - if (load($parser)) { - $func_name = "parse"; - } - - # Module::function was passed - else { - # Passed Module::Name::function; try to recover - my @func_parts = split /::/, $parser; - $func_name = pop @func_parts; - $parser = join "::", @func_parts; - - # If this doesn't work, then we have a legitimate - # problem. 
- load($parser) or die "Can't load $parser: $@"; - } - - # get code reference and assign - $self->{'parser'} = \&{ "$parser\::$func_name" }; - $self->{'parser_type'} = $parser; - $self->debug("Got parser: $parser\::$func_name\n"); - } +There is also C<parser_type> and C<parser_args>, which perform +analogously to C<producer_type> and C<producer_args> + +=head2 filters + +Set or retrieve the filters to run over the schema during the +translation, before the producer creates its output. Filters are sub +routines called, in order, with the schema object to filter as the 1st +arg and a hash of options (passed as a list) for the rest of the args. +They are free to do whatever they want to the schema object, which will be +handed to any following filters, then used by the producer. + +Filters are set as an array, which gives the order they run in. +Like parsers and producers, they can be defined by a module name, a +module name relative to the SQL::Translator::Filter namespace, a module +name and function name together or a reference to an anonymous subroutine. +When using a module name a function called C<filter> will be invoked in +that package to do the work. + +To pass args to the filter set it as an array ref with the 1st value giving +the filter (name or sub) and the rest its args. e.g. + + $tr->filters( + sub { + my $schema = shift; + # Do stuff to schema here! + }, + DropFKeys, + [ "Names", table => 'lc' ], + [ "Foo", foo => "bar", hello => "world" ], + [ "Filter5" ], + ); + +Although you normally set them in the constructor, which calls +through to filters. i.e. + + my $translator = SQL::Translator->new( + ... + filters => [ + sub { ... }, + [ "Names", table => 'lc' ], + ], + ... + ); - # passed an anonymous subroutine reference - elsif ( isa( $parser, 'CODE' ) ) { - $self->{'parser'} = $parser; - $self->{'parser_type'} = "CODE"; - $self->debug("Got parser: code ref\n"); - } +See F<t/36-filters.t> for more examples. 
- # passed a string containing no "::"; relative package name - else { - my $Pp = "SQL::Translator::Parser::$parser"; - load( $Pp ) or die "Can't load $Pp: $@"; - $self->{'parser'} = \&{ "$Pp\::parse" }; - $self->{'parser_type'} = $Pp; - $self->debug("Got parser: $Pp\n"); - } - - # - # At this point, $self->{'parser'} contains a subroutine - # reference that is ready to run - # - $self->parser_args( @_ ) if (@_); - } +Multiple set calls to filters are cumulative with new filters added to +the end of the current list. - return $self->{'parser'}; -} +Returns the filters as a list of array refs, the 1st value being a +reference to the filter sub and the rest its args. -# ---------------------------------------------------------------------- -sub parser_type { $_[0]->{'parser_type'} } +=head2 show_warnings -# ---------------------------------------------------------------------- -sub parser_args { - my $self = shift; - if (@_) { - my $args = isa($_[0], 'HASH') ? shift : { @_ }; - $self->{'parser_args'} = $args; - } - $self->{'parser_args'}; -} +Toggles whether to print warnings of name conflicts, identifier +mutations, etc. Probably only generated by producers to let the user +know when something won't translate very smoothly (e.g., MySQL "enum" +fields into Oracle). Accepts a true or false value, returns the +current value. -# ---------------------------------------------------------------------- -=head2 B<translate> +=head2 translate -The B<translate> method calls the subroutines referenced by the -B<parser> and B<producer> data members (described above). It accepts -as arguments a number of things, in key => value format, including -(potentially) a parser and a producer (they are passed directly to the -B<parser> and B<producer> methods). +The C<translate> method calls the subroutine referenced by the +C<parser> data member, then calls any C<filters> and finally calls +the C<producer> sub routine (these members are described above). 
+It accepts as arguments a number of things, in key => value format, +including (potentially) a parser and a producer (they are passed +directly to the C<parser> and C<producer> methods). -Here is how the parameter list to B<translate> is parsed: +Here is how the parameter list to C<translate> is parsed: =over =item * 1 argument means it's the data to be parsed; which could be a string -(filename) or a refernce to a scalar (a string stored in memory), or a +(filename) or a reference to a scalar (a string stored in memory), or a reference to a hash, which is parsed as being more than one argument (see next section). @@ -514,13 +1062,12 @@ You get the idea. =back -# ---------------------------------------------------------------------- -=head2 B<filename>, B<data> +=head2 filename, data -Using the B<filename> method, the filename of the data to be parsed -can be set. This method can be used in conjunction with the B<data> -method, below. If both the B<filename> and B<data> methods are -invoked as mutators, the data set in the B<data> method is used. +Using the C<filename> method, the filename of the data to be parsed +can be set. This method can be used in conjunction with the C<data> +method, below. If both the C<filename> and C<data> methods are +invoked as mutators, the data set in the C<data> method is used. $tr->filename("/my/data/files/create.sql"); @@ -533,275 +1080,69 @@ or: }; $tr->data(\$create_script); -B<filename> takes a string, which is interpreted as a filename. -B<data> takes a reference to a string, which is used as the data to be +C<filename> takes a string, which is interpreted as a filename. +C<data> takes a reference to a string, which is used as the data to be parsed. If a filename is set, then that file is opened and read when -the B<translate> method is called, as long as the data instance +the C<translate> method is called, as long as the data instance variable is not set. 
-=cut - -# filename - get or set the filename -sub filename { - my $self = shift; - if (@_) { - my $filename = shift; - if (-d $filename) { - my $msg = "Cannot use directory '$filename' as input source"; - return $self->error($msg); - } elsif (-f _ && -r _) { - $self->{'filename'} = $filename; - $self->debug("Got filename: '$self->{'filename'}'\n"); - } else { - my $msg = "Cannot use '$filename' as input source: ". - "file does not exist or is not readable."; - return $self->error($msg); - } - } - - $self->{'filename'}; -} - -# ---------------------------------------------------------------------- -# data - get or set the data -# if $self->{'data'} is not set, but $self->{'filename'} is, then -# $self->{'filename'} is opened and read, whith the results put into -# $self->{'data'}. -sub data { - my $self = shift; - - # Set $self->{'data'} to $_[0], if it is provided. - if (@_) { - my $data = shift; - if (isa($data, "SCALAR")) { - $self->{'data'} = $data; - } - elsif (! ref $data) { - $self->{'data'} = \$data; - } - } - - # If we have a filename but no data yet, populate. - if (not $self->{'data'} and my $filename = $self->filename) { - $self->debug("Opening '$filename' to get contents.\n"); - local *FH; - local $/; - my $data; - - unless (open FH, $filename) { - return $self->error("Can't read file '$filename': $!"); - } - - $data = ; - $self->{'data'} = \$data; - - unless (close FH) { - return $self->error("Can't close file '$filename': $!"); - } - } - - return $self->{'data'}; -} +=head2 schema -# ---------------------------------------------------------------------- -=pod +Returns the SQL::Translator::Schema object. -=head2 B +=head2 trace Turns on/off the tracing option of Parse::RecDescent. -=cut - -sub trace { - my $self = shift; - my $arg = shift; - if ( defined $arg ) { - $self->{'trace'} = $arg ? 
1 : 0; - } - return $self->{'trace'} || 0; -} - -# ---------------------------------------------------------------------- -sub translate { - my $self = shift; - my ($args, $parser, $parser_type, $producer, $producer_type); - my ($parser_output, $producer_output); - - # Parse arguments - if (@_ == 1) { - # Passed a reference to a hash? - if (isa($_[0], 'HASH')) { - # yep, a hashref - $self->debug("translate: Got a hashref\n"); - $args = $_[0]; - } - - # Passed a reference to a string containing the data - elsif (isa($_[0], 'SCALAR')) { - # passed a ref to a string - $self->debug("translate: Got a SCALAR reference (string)\n"); - $self->data($_[0]); - } - - # Not a reference; treat it as a filename - elsif (! ref $_[0]) { - # Not a ref, it's a filename - $self->debug("translate: Got a filename\n"); - $self->filename($_[0]); - } - - # Passed something else entirely. - else { - # We're not impressed. Take your empty string and leave. - # return ""; - - # Actually, if data, parser, and producer are set, then we - # can continue. Too bad, because I like my comment - # (above)... - return "" unless ($self->data && - $self->producer && - $self->parser); - } - } - else { - # You must pass in a hash, or you get nothing. - return "" if @_ % 2; - $args = { @_ }; - } - - # ---------------------------------------------------------------------- - # Can specify the data to be transformed using "filename", "file", - # "data", or "datasource". - # ---------------------------------------------------------------------- - if (my $filename = ($args->{'filename'} || $args->{'file'})) { - $self->filename($filename); - } - - if (my $data = ($self->{'data'} || $self->{'datasource'})) { - $self->data($data); - } - - # ---------------------------------------------------------------- - # Get the data. 
- # ---------------------------------------------------------------- - my $data = $self->data; - unless (length $$data) { - return $self->error("Empty data file!"); - } - - # ---------------------------------------------------------------- - # Local reference to the parser subroutine - # ---------------------------------------------------------------- - if ($parser = ($args->{'parser'} || $args->{'from'})) { - $self->parser($parser); - } - $parser = $self->parser; - $parser_type = $self->parser_type; - - # ---------------------------------------------------------------- - # Local reference to the producer subroutine - # ---------------------------------------------------------------- - if ($producer = ($args->{'producer'} || $args->{'to'})) { - $self->producer($producer); - } - $producer = $self->producer; - $producer_type = $self->producer_type; - - # ---------------------------------------------------------------- - # Execute the parser, then execute the producer with that output. - # Allowances are made for each piece to die, or fail to compile, - # since the referenced subroutines could be almost anything. In - # the future, each of these might happen in a Safe environment, - # depending on how paranoid we want to be. - # ---------------------------------------------------------------- - eval { $parser_output = $parser->($self, $$data) }; - if ($@ || ! $parser_output) { - my $msg = sprintf "translate: Error with parser '%s': %s", - $parser_type, ($@) ? $@ : " no results"; - return $self->error($msg); - } - - eval { $producer_output = $producer->($self, $parser_output) }; - if ($@ || ! $producer_output) { - my $msg = sprintf "translate: Error with producer '%s': %s", - $producer_type, ($@) ? 
$@ : " no results"; - return $self->error($msg); - } - - return $producer_output; -} +=head2 validate -# ---------------------------------------------------------------------- -sub list_producers { - require SQL::Translator::Producer; - my $path = catfile(dirname($INC{'SQL/Translator/Producer.pm'}), "Producer"); - my $dh = IO::Dir->new($path); +Whether or not to validate the schema object after parsing and before +producing. - my @available = map { join "::", "SQL::Translator::Producer", $_ } - grep /\.pm$/, $dh->read; +=head2 version - return @available; -} +Returns the version of the SQL::Translator release. -# ---------------------------------------------------------------------- -sub list_parsers { - require SQL::Translator::Parser; - my $path = catfile(dirname($INC{'SQL/Translator/Parser.pm'}), "Parser"); - my $dh = IO::Dir->new($path); +=head1 AUTHORS - my @available = map { join "::", "SQL::Translator::Parser", $_ } - grep /\.pm$/, $dh->read; +See the included AUTHORS file: +L - return @available; -} +If you would like to contribute to the project, you can send patches +to the developers mailing list: -# ---------------------------------------------------------------------- -sub load { - my $module = do { my $m = shift; $m =~ s[::][/]g; "$m.pm" }; - return 1 if $INC{$module}; - - eval { require $module }; - - return if ($@); - return 1; -} + sqlfairy-developers@lists.sourceforge.net -# ---------------------------------------------------------------------- -sub isa { UNIVERSAL::isa($_[0], $_[1]) } +Or send us a message (with your Sourceforge username) asking to be +added to the project and what you'd like to contribute. -1; -#----------------------------------------------------- -# Rescue the drowning and tie your shoestrings. -# Henry David Thoreau -#----------------------------------------------------- +=head1 COPYRIGHT -=pod +Copyright 2012 the SQL::Translator authors, as listed in L. -=head1 AUTHORS +=head1 LICENSE -Ken Y. 
Clark, Ekclark@cpan.org, -darren chamberlain Edarren@cpan.orgE, -Chris Mungall Ecjm@fruitfly.orgE +This library is free software and may be distributed under the same terms as +Perl 5 itself. -=head1 COPYRIGHT +=head1 BUGS -This program is free software; you can redistribute it and/or modify -it under the terms of the GNU General Public License as published by -the Free Software Foundation; version 2. +Please use L<http://rt.cpan.org/NoAuth/Bugs.html?Dist=SQL-Translator> for reporting bugs. -This program is distributed in the hope that it will be useful, but -WITHOUT ANY WARRANTY; without even the implied warranty of -MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU -General Public License for more details. +=head1 PRAISE -You should have received a copy of the GNU General Public License -along with this program; if not, write to the Free Software -Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 -USA +If you find this module useful, please use +L<http://cpanratings.perl.org/rate/?distribution=SQL-Translator> to rate it. =head1 SEE ALSO -L, L - -=cut +L<perl>, +L<SQL::Translator::Parser>, +L<SQL::Translator::Producer>, +L<Parse::RecDescent>, +L<GD>, +L<GraphViz>, +L<Text::RecordParser>, +L<Class::DBI>, +L<XML::Writer>.