diff options
author | mkanat%bugzilla.org <> | 2007-03-10 05:13:09 +0100 |
---|---|---|
committer | mkanat%bugzilla.org <> | 2007-03-10 05:13:09 +0100 |
commit | 3bc6ea42732020b00fef53a9b556e4a37e591bd7 (patch) | |
tree | 8de3ef7295c5e0345f8981fd32e08b268015e132 /Bugzilla | |
parent | 3a943fe055afe25c540698b0417854bd3f5b5ef4 (diff) | |
download | bugzilla-3bc6ea42732020b00fef53a9b556e4a37e591bd7.tar.gz bugzilla-3bc6ea42732020b00fef53a9b556e4a37e591bd7.tar.xz |
Bug 347439: Implement support for referential integrity in Bugzilla::DB::Schema and implement it on profiles_activity
Patch By Max Kanat-Alexander <mkanat@bugzilla.org> (module owner) a=mkanat
Diffstat (limited to 'Bugzilla')
-rw-r--r-- | Bugzilla/DB.pm | 5 | ||||
-rw-r--r-- | Bugzilla/DB/Schema.pm | 245 | ||||
-rw-r--r-- | Bugzilla/DB/Schema/Mysql.pm | 29 | ||||
-rw-r--r-- | Bugzilla/Install/DB.pm | 47 |
4 files changed, 297 insertions, 29 deletions
diff --git a/Bugzilla/DB.pm b/Bugzilla/DB.pm index 9f517a8e7..e4e30a8d3 100644 --- a/Bugzilla/DB.pm +++ b/Bugzilla/DB.pm @@ -515,10 +515,11 @@ sub bz_alter_column_raw { my @statements = $self->_bz_real_schema->get_alter_column_ddl( $table, $name, $new_def, defined $set_nulls_to ? $self->quote($set_nulls_to) : undef); - my $new_ddl = $self->_bz_schema->get_type_ddl($new_def); + my $new_ddl = $self->_bz_schema->get_display_ddl($table, $name, $new_def); print "Updating column $name in table $table ...\n"; if (defined $current_def) { - my $old_ddl = $self->_bz_schema->get_type_ddl($current_def); + my $old_ddl = $self->_bz_schema->get_display_ddl($table, $name, + $current_def); print "Old: $old_ddl\n"; } print "New: $new_ddl\n"; diff --git a/Bugzilla/DB/Schema.pm b/Bugzilla/DB/Schema.pm index 661677319..a97d3428b 100644 --- a/Bugzilla/DB/Schema.pm +++ b/Bugzilla/DB/Schema.pm @@ -96,7 +96,21 @@ more about how this integrates into the rest of Bugzilla. =head1 CONSTANTS -=over 4 +=over + +=item C<TABLES_FIRST> + +Because of L</"Referential Integrity">, certain tables must be created +before other tables. L</ABSTRACT_SCHEMA> can't specify this, because +it's a hash. So we specify it here. When calling C<get_table_list()>, +these tables will be returned before the other tables. + +=cut + +use constant TABLES_FIRST => qw( + fielddefs + profiles +); =item C<SCHEMA_VERSION> @@ -157,6 +171,49 @@ which can be used to specify the type of index such as UNIQUE or FULLTEXT. =back +=head2 Referential Integrity + +Bugzilla::DB::Schema supports "foreign keys", a way of saying +that "Column X may only contain values from Column Y in Table Z". +For example, in Bugzilla, bugs.resolution should only contain +values from the resolution.values field. + +It does this by adding an additional item to a column, called C<REFERENCES>. +This is a hash with the following members: + +=over + +=item C<TABLE> + +The table the foreign key points at + +=item C<COLUMN> + +The column pointed at in that table. + +=item C<DELETE> + +What to do if the row in the parent table is deleted. Choices are +C<RESTRICT> or C<CASCADE>. + +C<RESTRICT> means the deletion of the row in the parent table will +be forbidden by the database if there is a row in I<this> table that +still refers to it. This is the default, if you don't specify +C<DELETE>. + +C<CASCADE> means that this row will be deleted along with that row. + +=item C<UPDATE> + +What to do if the value in the parent table is updated. It has the +same choices as L</DELETE>, except it defaults to C<CASCADE>, which means +"also update this column in this table." + +=back + +Note that not all our supported databases actually enforce C<RESTRICT> +and C<CASCADE>, so don't depend on them. + =cut use constant SCHEMA_VERSION => '2.00'; @@ -645,10 +702,17 @@ use constant ABSTRACT_SCHEMA => { profiles_activity => { FIELDS => [ - userid => {TYPE => 'INT3', NOTNULL => 1}, - who => {TYPE => 'INT3', NOTNULL => 1}, + userid => {TYPE => 'INT3', NOTNULL => 1, + REFERENCES => {TABLE => 'profiles', + COLUMN => 'userid', + DELETE => 'CASCADE'}}, + who => {TYPE => 'INT3', NOTNULL => 1, + REFERENCES => {TABLE => 'profiles', + COLUMN => 'userid'}}, profiles_when => {TYPE => 'DATETIME', NOTNULL => 1}, - fieldid => {TYPE => 'INT3', NOTNULL => 1}, + fieldid => {TYPE => 'INT3', NOTNULL => 1, + REFERENCES => {TABLE => 'fielddefs', + COLUMN => 'id'}}, oldvalue => {TYPE => 'TINYTEXT'}, newvalue => {TYPE => 'TINYTEXT'}, ], @@ -1281,23 +1345,34 @@ sub get_type_ddl { =item C<get_type_ddl> - Description: Public method to convert abstract (database-generic) field - specifiers to database-specific data types suitable for use - in a C<CREATE TABLE> or C<ALTER TABLE> SQL statment. If no - database-specific field type has been defined for the given - field type, then it will just return the same field type. - Parameters: a hash or a reference to a hash of a field containing the - following keys: C<TYPE> (required), C<NOTNULL> (optional), - C<DEFAULT> (optional), C<PRIMARYKEY> (optional), C<REFERENCES> - (optional) - Returns: a DDL string suitable for describing a field in a - C<CREATE TABLE> or C<ALTER TABLE> SQL statement +=over + +=item B<Description> + +Public method to convert abstract (database-generic) field specifiers to +database-specific data types suitable for use in a C<CREATE TABLE> or +C<ALTER TABLE> SQL statment. If no database-specific field type has been +defined for the given field type, then it will just return the same field type. + +=item B<Parameters> + +=over + +=item C<$def> - A reference to a hash of a field containing the following keys: +C<TYPE> (required), C<NOTNULL> (optional), C<DEFAULT> (optional), +C<PRIMARYKEY> (optional), C<REFERENCES> (optional) + +=back + +-item B<Returns> + +A DDL string suitable for describing a field in a C<CREATE TABLE> or +C<ALTER TABLE> SQL statement =cut my $self = shift; my $finfo = (@_ == 1 && ref($_[0]) eq 'HASH') ? $_[0] : { @_ }; - my $type = $finfo->{TYPE}; die "A valid TYPE was not specified for this column." unless ($type); @@ -1308,19 +1383,91 @@ sub get_type_ddl { $default = $self->{db_specific}->{$default}; } - my $fkref = $self->{enable_references} ? $finfo->{REFERENCES} : undef; my $type_ddl = $self->convert_type($type); # DEFAULT attribute must appear before any column constraints # (e.g., NOT NULL), for Oracle $type_ddl .= " DEFAULT $default" if (defined($default)); $type_ddl .= " NOT NULL" if ($finfo->{NOTNULL}); $type_ddl .= " PRIMARY KEY" if ($finfo->{PRIMARYKEY}); - $type_ddl .= "\n\t\t\t\tREFERENCES $fkref" if $fkref; return($type_ddl); } #eosub--get_type_ddl + +# Used if you want to display the DDL to the user, as opposed to actually +# use it in the database. +sub get_display_ddl { + my ($self, $table, $column, $def) = @_; + my $ddl = $self->get_type_ddl($def); + if ($def->{REFERENCES}) { + $ddl .= $self->get_fk_ddl($table, $column, $def->{REFERENCES}); + } + return $ddl; +} + +sub get_fk_ddl { +=item C<_get_fk_ddl> + +=over + +=item B<Description> + +Protected method. Translates the C<REFERENCES> item of a column into SQL. + +=item B<Params> + +=over + +=item C<$table> - The name of the table the reference is from. +=item C<$column> - The name of the column the reference is from +=item C<$references> - The C<REFERENCES> hashref from a column. + +=back + +Returns: SQL for to define the foreign key, or an empty string + if C<$references> is undefined. + +=cut + + my ($self, $table, $column, $references) = @_; + return "" if !$references; + + my $update = $references->{UPDATE} || 'CASCADE'; + my $delete = $references->{DELETE} || 'RESTRICT'; + my $to_table = $references->{TABLE} || die "No table in reference"; + my $to_column = $references->{COLUMN} || die "No column in reference"; + my $fk_name = $self->_get_fk_name($table, $column, $references); + + return "\n CONSTRAINT $fk_name FOREIGN KEY ($column)\n" + . " REFERENCES $to_table($to_column)\n" + . " ON UPDATE $update ON DELETE $delete"; +} + +# Generates a name for a Foreign Key. It's separate from get_fk_ddl +# so that certain databases can override it (for shorter identifiers or +# other reasons). +sub _get_fk_name { + my ($self, $table, $column, $references) = @_; + my $to_table = $references->{TABLE}; + my $to_column = $references->{COLUMN}; + return "fk_${table}_${column}_${to_table}_${to_column}"; +} + +sub _get_add_fk_sql { + my ($self, $table, $column, $new_def) = @_; + + my $fk_string = $self->get_fk_ddl($table, $column, $new_def->{REFERENCES}); + return ("ALTER TABLE $table ADD $fk_string"); +} + +sub _get_drop_fk_sql { + my ($self, $table, $column, $old_def) = @_; + my $fk_name = $self->_get_fk_name($table, $column, $old_def->{REFERENCES}); + + return ("ALTER TABLE $table DROP CONSTRAINT $fk_name"); +} + sub convert_type { =item C<convert_type> @@ -1363,17 +1510,27 @@ sub get_table_list { Description: Public method for discovering what tables should exist in the Bugzilla database. + Parameters: none - Returns: an array of table names + + Returns: An array of table names. The tables specified + in L</TABLES_FIRST> will come first, in order. The + rest of the tables will be in random order. =cut my $self = shift; - return(sort(keys %{ $self->{schema} })); + my %schema = %{$self->{schema}}; + my @tables; + foreach my $table (TABLES_FIRST) { + push(@tables, $table); + delete $schema{$table}; + } + push(@tables, keys %schema); + return @tables; +} -} #eosub--get_table_list -#-------------------------------------------------------------------------- sub get_table_columns { =item C<get_table_columns> @@ -1440,6 +1597,14 @@ sub get_table_ddl { push(@ddl, $index_sql) if $index_sql; } + my %fields = @{$self->{schema}{$table}{FIELDS}}; + foreach my $col (keys %fields) { + my $def = $fields{$col}; + if ($def->{REFERENCES}) { + push(@ddl, $self->_get_add_fk_sql($table, $col, $def)); + } + } + push(@ddl, @{ $self->{schema}{$table}{DB_EXTRAS} }) if (ref($self->{schema}{$table}{DB_EXTRAS})); @@ -1653,6 +1818,15 @@ sub get_alter_column_ddl { push(@statements, "ALTER TABLE $table DROP PRIMARY KEY"); } + # If we went from not having an FK to having an FK + # XXX For right now, you can't change an FK's actual definition. + if (!$old_def->{REFERENCES} && $new_def->{REFERENCES}) { + push(@statements, $self->_get_add_fk_sql($table, $column, $new_def)); + } + elsif ($old_def->{REFERENCES} && !$new_def->{REFERENCES}) { + push(@statements, $self->_get_drop_fk_sql($table, $column, $old_def)); + } + return @statements; } @@ -2040,14 +2214,31 @@ sub columns_equal { $col_one->{TYPE} = uc($col_one->{TYPE}); $col_two->{TYPE} = uc($col_two->{TYPE}); - my @col_one_array = %$col_one; - my @col_two_array = %$col_two; + # It doesn't work to compare the two REFERENCES items, because + # they look like 'HASH(0xaf3c434)' to diff_arrays--they'll never + # be equal. + my %col_one_def = %$col_one; + delete $col_one_def{REFERENCES}; + my %col_two_def = %$col_two; + delete $col_two_def{REFERENCES}; + + my @col_one_array = %col_one_def; + my @col_two_array = %col_two_def; my ($removed, $added) = diff_arrays(\@col_one_array, \@col_two_array); - # If there are no differences between the arrays, - # then they are equal. - return !scalar(@$removed) && !scalar(@$added) ? 1 : 0; + # If there are no differences between the arrays, then they are equal. + my $defs_identical = !scalar(@$removed) && !scalar(@$added); + + # If the basic definitions are identical, we still want to check + # if the two foreign key definitions are different. + my @fk_array_one = %{$col_one->{REFERENCES} || {}}; + my @fk_array_two = %{$col_two->{REFERENCES} || {}}; + my ($fk_removed, $fk_added) = + diff_arrays(\@fk_array_one, \@fk_array_two); + my $fk_identical = !scalar(@$fk_removed) && !scalar(@$fk_added); + + return $defs_identical && $fk_identical ? 1 : 0; } diff --git a/Bugzilla/DB/Schema/Mysql.pm b/Bugzilla/DB/Schema/Mysql.pm index 358137ea5..eb7cd3c87 100644 --- a/Bugzilla/DB/Schema/Mysql.pm +++ b/Bugzilla/DB/Schema/Mysql.pm @@ -176,9 +176,17 @@ sub get_alter_column_ddl { # keys are not allowed. delete $new_def_copy{PRIMARYKEY}; } + # CHANGE COLUMN doesn't support REFERENCES + delete $new_def_copy{REFERENCES}; my $new_ddl = $self->get_type_ddl(\%new_def_copy); my @statements; + + # Drop the FK if the new definition doesn't have one. + if ($old_def->{REFERENCES} && !$new_def->{REFERENCES}) { + push(@statements, $self->_get_drop_fk_sql($table, $column, $old_def)); + } + push(@statements, "UPDATE $table SET $column = $set_nulls_to WHERE $column IS NULL") if defined $set_nulls_to; push(@statements, "ALTER TABLE $table CHANGE COLUMN @@ -187,9 +195,30 @@ sub get_alter_column_ddl { # Dropping a PRIMARY KEY needs an explicit DROP PRIMARY KEY push(@statements, "ALTER TABLE $table DROP PRIMARY KEY"); } + + # Add the FK if the new definition has one and the old definition doesn't. + if ($new_def->{REFERENCES} && !$old_def->{REFERENCES}) { + push(@statements, $self->_get_add_fk_sql($table, $column, $new_def)); + } return @statements; } +sub _get_drop_fk_sql { + my ($self, $table, $column, $old_def) = @_; + my $fk_name = $self->_get_fk_name($table, $column, $old_def->{REFERENCES}); + my @sql = ("ALTER TABLE $table DROP FOREIGN KEY $fk_name"); + my $dbh = Bugzilla->dbh; + + # MySQL requires, and will create, an index on any column with + # an FK. It will name it after the fk, which we never do. + # So if there's an index named after the fk, we also have to delete it. + if ($dbh->bz_index_info_real($table, $fk_name)) { + push(@sql, $self->get_drop_index_ddl($table, $fk_name)); + } + + return @sql; +} + sub get_drop_index_ddl { my ($self, $table, $name) = @_; return ("DROP INDEX \`$name\` ON $table"); diff --git a/Bugzilla/Install/DB.pm b/Bugzilla/Install/DB.pm index 00032d15b..5e6401828 100644 --- a/Bugzilla/Install/DB.pm +++ b/Bugzilla/Install/DB.pm @@ -49,6 +49,39 @@ sub indicate_progress { } } +# This is used before adding a foreign key to a column, to make sure +# that the database won't fail adding the key. +sub check_references { + my ($table, $column, $foreign_table, $foreign_column) = @_; + my $dbh = Bugzilla->dbh; + + my $bad_values = $dbh->selectcol_arrayref( + "SELECT DISTINCT $table.$column + FROM $table LEFT JOIN $foreign_table + ON $table.$column = $foreign_table.$foreign_column + WHERE $foreign_table.$foreign_column IS NULL"); + + if (@$bad_values) { + my $values = join(', ', @$bad_values); + print <<EOT; + +ERROR: There are invalid values for the $column column in the $table +table. (These values do not exist in the $foreign_table table, in the +$foreign_column column.) + +Before continuing with checksetup, you will need to fix these values, +either by deleting these rows from the database, or changing the values +of $column in $table to point to valid values in $foreign_table.$foreign_column. + +The bad values from the $table.$column column are: +$values + +EOT + # I just picked a number above 2, to be considered "abnormal exit." + exit 3; + } +} + # NOTE: This is NOT the function for general table updates. See # update_table_definitions for that. This is only for the fielddefs table. sub update_fielddefs_definition { @@ -519,6 +552,20 @@ sub update_table_definitions { $dbh->bz_add_column('milestones', 'id', {TYPE => 'MEDIUMSERIAL', NOTNULL => 1, PRIMARYKEY => 1}); + # Referential Integrity begins here + check_references('profiles_activity', 'userid', 'profiles', 'userid'); + $dbh->bz_alter_column('profiles_activity', 'userid', + {TYPE => 'INT3', NOTNULL => 1, REFERENCES => + {TABLE => 'profiles', COLUMN => 'userid', DELETE => 'CASCADE'}}); + check_references('profiles_activity', 'who', 'profiles', 'userid'); + $dbh->bz_alter_column('profiles_activity', 'who', + {TYPE => 'INT3', NOTNULL => 1, REFERENCES => + {TABLE => 'profiles', COLUMN => 'userid'}}); + check_references('profiles_activity', 'fieldid', 'fielddefs', 'id'); + $dbh->bz_alter_column('profiles_activity', 'fieldid', + {TYPE => 'INT3', NOTNULL => 1, REFERENCES => + {TABLE => 'fielddefs', COLUMN => 'id'}}); + ################################################################ # New --TABLE-- changes should go *** A B O V E *** this point # ################################################################ |