| 1 | /* Copyright (C) 2006 MySQL AB & MySQL Finland AB & TCX DataKonsult AB | 
|---|
| 2 |  | 
|---|
| 3 | This program is free software; you can redistribute it and/or modify | 
|---|
| 4 | it under the terms of the GNU General Public License as published by | 
|---|
| 5 | the Free Software Foundation; version 2 of the License. | 
|---|
| 6 |  | 
|---|
| 7 | This program is distributed in the hope that it will be useful, | 
|---|
| 8 | but WITHOUT ANY WARRANTY; without even the implied warranty of | 
|---|
| 9 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the | 
|---|
| 10 | GNU General Public License for more details. | 
|---|
| 11 |  | 
|---|
| 12 | You should have received a copy of the GNU General Public License | 
|---|
| 13 | along with this program; if not, write to the Free Software | 
|---|
| 14 | Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02111-1301 USA */ | 
|---|
| 15 |  | 
|---|
| 16 | /* Functions to check if a row is unique */ | 
|---|
| 17 |  | 
|---|
| 18 | #include "maria_def.h" | 
|---|
| 19 | #include <m_ctype.h> | 
|---|
| 20 |  | 
|---|
| 21 | /** | 
|---|
| 22 | Check if there exist a row with the same hash | 
|---|
| 23 |  | 
|---|
| 24 | @notes | 
|---|
| 25 | This function is not versioning safe. For the moment this is not a problem | 
|---|
| 26 | as it's only used for internal temporary tables in MySQL for which there | 
|---|
| 27 | isn't any versioning information. | 
|---|
| 28 | */ | 
|---|
| 29 |  | 
|---|
| 30 | my_bool _ma_check_unique(MARIA_HA *info, MARIA_UNIQUEDEF *def, | 
|---|
| 31 | const uchar *record, | 
|---|
| 32 | ha_checksum unique_hash, my_off_t disk_pos) | 
|---|
| 33 | { | 
|---|
| 34 | my_off_t lastpos=info->cur_row.lastpos; | 
|---|
| 35 | MARIA_KEYDEF *keyinfo= &info->s->keyinfo[def->key]; | 
|---|
| 36 | uchar *key_buff= info->lastkey_buff2; | 
|---|
| 37 | MARIA_KEY key; | 
|---|
| 38 | int error= 0; | 
|---|
| 39 | DBUG_ENTER( "_ma_check_unique"); | 
|---|
| 40 | DBUG_PRINT( "enter",( "unique_hash: %lu", (ulong) unique_hash)); | 
|---|
| 41 |  | 
|---|
| 42 | /* We need to store the hash value as a key in the record, breaking const */ | 
|---|
| 43 | maria_unique_store(record+keyinfo->seg->start, unique_hash); | 
|---|
| 44 | /* Can't be spatial so it's ok to call _ma_make_key directly here */ | 
|---|
| 45 | _ma_make_key(info, &key, def->key, key_buff, record, 0, 0); | 
|---|
| 46 |  | 
|---|
| 47 | /* The above changed info->lastkey_buff2. Inform maria_rnext_same(). */ | 
|---|
| 48 | info->update&= ~HA_STATE_RNEXT_SAME; | 
|---|
| 49 |  | 
|---|
| 50 | /* Setup that unique key is active key */ | 
|---|
| 51 | info->last_key.keyinfo= keyinfo; | 
|---|
| 52 |  | 
|---|
| 53 | /* any key pointer in data is destroyed */ | 
|---|
| 54 | info->lastinx= ~0; | 
|---|
| 55 |  | 
|---|
| 56 | DBUG_ASSERT(key.data_length == MARIA_UNIQUE_HASH_LENGTH); | 
|---|
| 57 | if (_ma_search(info, &key, SEARCH_FIND | SEARCH_SAVE_BUFF, | 
|---|
| 58 | info->s->state.key_root[def->key])) | 
|---|
| 59 | { | 
|---|
| 60 | info->page_changed=1;			/* Can't optimize read next */ | 
|---|
| 61 | info->cur_row.lastpos= lastpos; | 
|---|
| 62 | goto end; | 
|---|
| 63 | } | 
|---|
| 64 |  | 
|---|
| 65 | for (;;) | 
|---|
| 66 | { | 
|---|
| 67 | if (info->cur_row.lastpos != disk_pos && | 
|---|
| 68 | !(*info->s->compare_unique)(info,def,record,info->cur_row.lastpos)) | 
|---|
| 69 | { | 
|---|
| 70 | my_errno=HA_ERR_FOUND_DUPP_UNIQUE; | 
|---|
| 71 | info->errkey= (int) def->key; | 
|---|
| 72 | info->dup_key_pos= info->cur_row.lastpos; | 
|---|
| 73 | info->page_changed= 1;			/* Can't optimize read next */ | 
|---|
| 74 | info->cur_row.lastpos= lastpos; | 
|---|
| 75 | DBUG_PRINT( "info",( "Found duplicate")); | 
|---|
| 76 | error= 1;                                 /* Found identical  */ | 
|---|
| 77 | goto end; | 
|---|
| 78 | } | 
|---|
| 79 | DBUG_ASSERT(info->last_key.data_length == MARIA_UNIQUE_HASH_LENGTH); | 
|---|
| 80 | if (_ma_search_next(info, &info->last_key, SEARCH_BIGGER, | 
|---|
| 81 | info->s->state.key_root[def->key]) || | 
|---|
| 82 | bcmp(info->last_key.data, key_buff, MARIA_UNIQUE_HASH_LENGTH)) | 
|---|
| 83 | { | 
|---|
| 84 | info->page_changed= 1;			/* Can't optimize read next */ | 
|---|
| 85 | info->cur_row.lastpos= lastpos; | 
|---|
| 86 | break;                                    /* end of tree */ | 
|---|
| 87 | } | 
|---|
| 88 | } | 
|---|
| 89 |  | 
|---|
| 90 | end: | 
|---|
| 91 | DBUG_RETURN(error); | 
|---|
| 92 | } | 
|---|
| 93 |  | 
|---|
| 94 |  | 
|---|
| 95 | /* | 
|---|
| 96 | Calculate a hash for a row | 
|---|
| 97 |  | 
|---|
| 98 | TODO | 
|---|
| 99 | Add support for bit fields | 
|---|
| 100 | */ | 
|---|
| 101 |  | 
|---|
| 102 | ha_checksum _ma_unique_hash(MARIA_UNIQUEDEF *def, const uchar *record) | 
|---|
| 103 | { | 
|---|
| 104 | const uchar *pos, *end; | 
|---|
| 105 | ha_checksum crc= 0; | 
|---|
| 106 | ulong seed1=0, seed2= 4; | 
|---|
| 107 | HA_KEYSEG *keyseg; | 
|---|
| 108 |  | 
|---|
| 109 | for (keyseg=def->seg ; keyseg < def->end ; keyseg++) | 
|---|
| 110 | { | 
|---|
| 111 | enum ha_base_keytype type=(enum ha_base_keytype) keyseg->type; | 
|---|
| 112 | uint length=keyseg->length; | 
|---|
| 113 |  | 
|---|
| 114 | if (keyseg->null_bit) | 
|---|
| 115 | { | 
|---|
| 116 | if (record[keyseg->null_pos] & keyseg->null_bit) | 
|---|
| 117 | { | 
|---|
| 118 | /* | 
|---|
| 119 | Change crc in a way different from an empty string or 0. | 
|---|
| 120 | (This is an optimisation;  The code will work even if this isn't | 
|---|
| 121 | done) | 
|---|
| 122 | */ | 
|---|
| 123 | crc=((crc << 8) + 511+ | 
|---|
| 124 | (crc >> (8*sizeof(ha_checksum)-8))); | 
|---|
| 125 | continue; | 
|---|
| 126 | } | 
|---|
| 127 | } | 
|---|
| 128 | pos= record+keyseg->start; | 
|---|
| 129 | if (keyseg->flag & HA_VAR_LENGTH_PART) | 
|---|
| 130 | { | 
|---|
| 131 | uint pack_length=  keyseg->bit_start; | 
|---|
| 132 | uint tmp_length= (pack_length == 1 ? (uint) *pos : | 
|---|
| 133 | uint2korr(pos)); | 
|---|
| 134 | pos+= pack_length;			/* Skip VARCHAR length */ | 
|---|
| 135 | set_if_smaller(length,tmp_length); | 
|---|
| 136 | } | 
|---|
| 137 | else if (keyseg->flag & HA_BLOB_PART) | 
|---|
| 138 | { | 
|---|
| 139 | uint tmp_length= _ma_calc_blob_length(keyseg->bit_start,pos); | 
|---|
| 140 | memcpy((void*) &pos,pos+keyseg->bit_start,sizeof(char*)); | 
|---|
| 141 | if (!length || length > tmp_length) | 
|---|
| 142 | length=tmp_length;			/* The whole blob */ | 
|---|
| 143 | } | 
|---|
| 144 | end= pos+length; | 
|---|
| 145 | if (type == HA_KEYTYPE_TEXT || type == HA_KEYTYPE_VARTEXT1 || | 
|---|
| 146 | type == HA_KEYTYPE_VARTEXT2) | 
|---|
| 147 | { | 
|---|
| 148 | keyseg->charset->coll->hash_sort(keyseg->charset, | 
|---|
| 149 | (const uchar*) pos, length, &seed1, | 
|---|
| 150 | &seed2); | 
|---|
| 151 | crc+= seed1; | 
|---|
| 152 | } | 
|---|
| 153 | else | 
|---|
| 154 | { | 
|---|
| 155 | my_hash_sort_bin((CHARSET_INFO*) 0, pos, (size_t) (end-pos), | 
|---|
| 156 | &seed1, &seed2); | 
|---|
| 157 | crc+= seed1; | 
|---|
| 158 | } | 
|---|
| 159 | } | 
|---|
| 160 | return crc; | 
|---|
| 161 | } | 
|---|
| 162 |  | 
|---|
| 163 |  | 
|---|
| 164 | /* | 
|---|
| 165 | compare unique key for two rows | 
|---|
| 166 |  | 
|---|
| 167 | TODO | 
|---|
| 168 | Add support for bit fields | 
|---|
| 169 |  | 
|---|
| 170 | RETURN | 
|---|
| 171 | 0   if both rows have equal unique value | 
|---|
| 172 | 1   Rows are different | 
|---|
| 173 | */ | 
|---|
| 174 |  | 
|---|
| 175 | my_bool _ma_unique_comp(MARIA_UNIQUEDEF *def, const uchar *a, const uchar *b, | 
|---|
| 176 | my_bool null_are_equal) | 
|---|
| 177 | { | 
|---|
| 178 | const uchar *pos_a, *pos_b, *end; | 
|---|
| 179 | HA_KEYSEG *keyseg; | 
|---|
| 180 |  | 
|---|
| 181 | for (keyseg=def->seg ; keyseg < def->end ; keyseg++) | 
|---|
| 182 | { | 
|---|
| 183 | enum ha_base_keytype type=(enum ha_base_keytype) keyseg->type; | 
|---|
| 184 | uint a_length, b_length; | 
|---|
| 185 | a_length= b_length= keyseg->length; | 
|---|
| 186 |  | 
|---|
| 187 | /* If part is NULL it's regarded as different */ | 
|---|
| 188 | if (keyseg->null_bit) | 
|---|
| 189 | { | 
|---|
| 190 | uint tmp; | 
|---|
| 191 | if ((tmp=(a[keyseg->null_pos] & keyseg->null_bit)) != | 
|---|
| 192 | (uint) (b[keyseg->null_pos] & keyseg->null_bit)) | 
|---|
| 193 | return 1; | 
|---|
| 194 | if (tmp) | 
|---|
| 195 | { | 
|---|
| 196 | if (!null_are_equal) | 
|---|
| 197 | return 1; | 
|---|
| 198 | continue; | 
|---|
| 199 | } | 
|---|
| 200 | } | 
|---|
| 201 | pos_a= a+keyseg->start; | 
|---|
| 202 | pos_b= b+keyseg->start; | 
|---|
| 203 | if (keyseg->flag & HA_VAR_LENGTH_PART) | 
|---|
| 204 | { | 
|---|
| 205 | uint pack_length= keyseg->bit_start; | 
|---|
| 206 | if (pack_length == 1) | 
|---|
| 207 | { | 
|---|
| 208 | a_length= (uint) *pos_a++; | 
|---|
| 209 | b_length= (uint) *pos_b++; | 
|---|
| 210 | } | 
|---|
| 211 | else | 
|---|
| 212 | { | 
|---|
| 213 | a_length= uint2korr(pos_a); | 
|---|
| 214 | b_length= uint2korr(pos_b); | 
|---|
| 215 | pos_a+= 2;				/* Skip VARCHAR length */ | 
|---|
| 216 | pos_b+= 2; | 
|---|
| 217 | } | 
|---|
| 218 | set_if_smaller(a_length, keyseg->length); /* Safety */ | 
|---|
| 219 | set_if_smaller(b_length, keyseg->length); /* safety */ | 
|---|
| 220 | } | 
|---|
| 221 | else if (keyseg->flag & HA_BLOB_PART) | 
|---|
| 222 | { | 
|---|
| 223 | /* Only compare 'length' characters if length != 0 */ | 
|---|
| 224 | a_length= _ma_calc_blob_length(keyseg->bit_start,pos_a); | 
|---|
| 225 | b_length= _ma_calc_blob_length(keyseg->bit_start,pos_b); | 
|---|
| 226 | /* Check that a and b are of equal length */ | 
|---|
| 227 | if (keyseg->length) | 
|---|
| 228 | { | 
|---|
| 229 | /* | 
|---|
| 230 | This is used in some cases when we are not interested in comparing | 
|---|
| 231 | the whole length of the blob. | 
|---|
| 232 | */ | 
|---|
| 233 | set_if_smaller(a_length, keyseg->length); | 
|---|
| 234 | set_if_smaller(b_length, keyseg->length); | 
|---|
| 235 | } | 
|---|
| 236 | memcpy((void*) &pos_a, pos_a+keyseg->bit_start, sizeof(char*)); | 
|---|
| 237 | memcpy((void*) &pos_b, pos_b+keyseg->bit_start, sizeof(char*)); | 
|---|
| 238 | } | 
|---|
| 239 | if (type == HA_KEYTYPE_TEXT || type == HA_KEYTYPE_VARTEXT1 || | 
|---|
| 240 | type == HA_KEYTYPE_VARTEXT2) | 
|---|
| 241 | { | 
|---|
| 242 | if (ha_compare_text(keyseg->charset, pos_a, a_length, | 
|---|
| 243 | pos_b, b_length, 0)) | 
|---|
| 244 | return 1; | 
|---|
| 245 | } | 
|---|
| 246 | else | 
|---|
| 247 | { | 
|---|
| 248 | if (a_length != b_length) | 
|---|
| 249 | return 1; | 
|---|
| 250 | end= pos_a+a_length; | 
|---|
| 251 | while (pos_a != end) | 
|---|
| 252 | { | 
|---|
| 253 | if (*pos_a++ != *pos_b++) | 
|---|
| 254 | return 1; | 
|---|
| 255 | } | 
|---|
| 256 | } | 
|---|
| 257 | } | 
|---|
| 258 | return 0; | 
|---|
| 259 | } | 
|---|
| 260 |  | 
|---|