Changeset 782 for git/branches/dmik/diffcore-rename.c
- Timestamp:
- Jun 23, 2014, 9:45:51 PM (11 years ago)
- Location:
- git/branches/dmik
- Files:
-
- 2 edited
Legend:
- Unmodified
- Added
- Removed
-
git/branches/dmik ¶
- Property svn:mergeinfo changed
/git/vendor/2.0.0 (added) merged: 777 /git/vendor/current merged: 772,774,776
- Property svn:mergeinfo changed
-
TabularUnified git/branches/dmik/diffcore-rename.c ¶
r347 r782 5 5 #include "diff.h" 6 6 #include "diffcore.h" 7 #include "hash .h"7 #include "hashmap.h" 8 8 #include "progress.h" 9 9 … … 39 39 return NULL; 40 40 /* insert to make it at "first" */ 41 if (rename_dst_alloc <= rename_dst_nr) { 42 rename_dst_alloc = alloc_nr(rename_dst_alloc); 43 rename_dst = xrealloc(rename_dst, 44 rename_dst_alloc * sizeof(*rename_dst)); 45 } 41 ALLOC_GROW(rename_dst, rename_dst_nr + 1, rename_dst_alloc); 46 42 rename_dst_nr++; 47 43 if (first < rename_dst_nr) … … 49 45 (rename_dst_nr - first - 1) * sizeof(*rename_dst)); 50 46 rename_dst[first].two = alloc_filespec(two->path); 51 fill_filespec(rename_dst[first].two, two->sha1, two-> mode);47 fill_filespec(rename_dst[first].two, two->sha1, two->sha1_valid, two->mode); 52 48 rename_dst[first].pair = NULL; 53 49 return &(rename_dst[first]); … … 83 79 84 80 /* insert to make it at "first" */ 85 if (rename_src_alloc <= rename_src_nr) { 86 rename_src_alloc = alloc_nr(rename_src_alloc); 87 rename_src = xrealloc(rename_src, 88 rename_src_alloc * sizeof(*rename_src)); 89 } 81 ALLOC_GROW(rename_src, rename_src_nr + 1, rename_src_alloc); 90 82 rename_src_nr++; 91 83 if (first < rename_src_nr) … … 244 236 245 237 struct file_similarity { 246 int src_dst, index; 238 struct hashmap_entry entry; 239 int index; 247 240 struct diff_filespec *filespec; 248 struct file_similarity *next;249 241 }; 250 251 static int find_identical_files(struct file_similarity *src,252 struct file_similarity *dst,253 struct diff_options *options)254 {255 int renames = 0;256 257 /*258 * Walk over all the destinations ...259 */260 do {261 struct diff_filespec *target = dst->filespec;262 struct file_similarity *p, *best;263 int i = 100, best_score = -1;264 265 /*266 * .. to find the best source match267 */268 best = NULL;269 for (p = src; p; p = p->next) {270 int score;271 struct diff_filespec *source = p->filespec;272 273 /* False hash collision? */274 if (hashcmp(source->sha1, target->sha1))275 continue;276 /* Non-regular files? If so, the modes must match! */277 if (!S_ISREG(source->mode) || !S_ISREG(target->mode)) {278 if (source->mode != target->mode)279 continue;280 }281 /* Give higher scores to sources that haven't been used already */282 score = !source->rename_used;283 if (source->rename_used && options->detect_rename != DIFF_DETECT_COPY)284 continue;285 score += basename_same(source, target);286 if (score > best_score) {287 best = p;288 best_score = score;289 if (score == 2)290 break;291 }292 293 /* Too many identical alternatives? Pick one */294 if (!--i)295 break;296 }297 if (best) {298 record_rename_pair(dst->index, best->index, MAX_SCORE);299 renames++;300 }301 } while ((dst = dst->next) != NULL);302 return renames;303 }304 305 static void free_similarity_list(struct file_similarity *p)306 {307 while (p) {308 struct file_similarity *entry = p;309 p = p->next;310 free(entry);311 }312 }313 314 static int find_same_files(void *ptr, void *data)315 {316 int ret;317 struct file_similarity *p = ptr;318 struct file_similarity *src = NULL, *dst = NULL;319 struct diff_options *options = data;320 321 /* Split the hash list up into sources and destinations */322 do {323 struct file_similarity *entry = p;324 p = p->next;325 if (entry->src_dst < 0) {326 entry->next = src;327 src = entry;328 } else {329 entry->next = dst;330 dst = entry;331 }332 } while (p);333 334 /*335 * If we have both sources *and* destinations, see if336 * we can match them up337 */338 ret = (src && dst) ? find_identical_files(src, dst, options) : 0;339 340 /* Free the hashes and return the number of renames found */341 free_similarity_list(src);342 free_similarity_list(dst);343 return ret;344 }345 242 346 243 static unsigned int hash_filespec(struct diff_filespec *filespec) … … 356 253 } 357 254 358 static void insert_file_table(struct hash_table *table, int src_dst, int index, struct diff_filespec *filespec) 359 { 360 void **pos; 361 unsigned int hash; 255 static int find_identical_files(struct hashmap *srcs, 256 int dst_index, 257 struct diff_options *options) 258 { 259 int renames = 0; 260 261 struct diff_filespec *target = rename_dst[dst_index].two; 262 struct file_similarity *p, *best, dst; 263 int i = 100, best_score = -1; 264 265 /* 266 * Find the best source match for specified destination. 267 */ 268 best = NULL; 269 hashmap_entry_init(&dst, hash_filespec(target)); 270 for (p = hashmap_get(srcs, &dst, NULL); p; p = hashmap_get_next(srcs, p)) { 271 int score; 272 struct diff_filespec *source = p->filespec; 273 274 /* False hash collision? */ 275 if (hashcmp(source->sha1, target->sha1)) 276 continue; 277 /* Non-regular files? If so, the modes must match! */ 278 if (!S_ISREG(source->mode) || !S_ISREG(target->mode)) { 279 if (source->mode != target->mode) 280 continue; 281 } 282 /* Give higher scores to sources that haven't been used already */ 283 score = !source->rename_used; 284 if (source->rename_used && options->detect_rename != DIFF_DETECT_COPY) 285 continue; 286 score += basename_same(source, target); 287 if (score > best_score) { 288 best = p; 289 best_score = score; 290 if (score == 2) 291 break; 292 } 293 294 /* Too many identical alternatives? Pick one */ 295 if (!--i) 296 break; 297 } 298 if (best) { 299 record_rename_pair(dst_index, best->index, MAX_SCORE); 300 renames++; 301 } 302 return renames; 303 } 304 305 static void insert_file_table(struct hashmap *table, int index, struct diff_filespec *filespec) 306 { 362 307 struct file_similarity *entry = xmalloc(sizeof(*entry)); 363 308 364 entry->src_dst = src_dst;365 309 entry->index = index; 366 310 entry->filespec = filespec; 367 entry->next = NULL; 368 369 hash = hash_filespec(filespec); 370 pos = insert_hash(hash, entry, table); 371 372 /* We already had an entry there? */ 373 if (pos) { 374 entry->next = *pos; 375 *pos = entry; 376 } 311 312 hashmap_entry_init(entry, hash_filespec(filespec)); 313 hashmap_add(table, entry); 377 314 } 378 315 … … 386 323 static int find_exact_renames(struct diff_options *options) 387 324 { 388 int i; 389 struct hash_table file_table; 390 391 init_hash(&file_table); 325 int i, renames = 0; 326 struct hashmap file_table; 327 328 /* Add all sources to the hash table */ 329 hashmap_init(&file_table, NULL, rename_src_nr); 392 330 for (i = 0; i < rename_src_nr; i++) 393 insert_file_table(&file_table, -1, i, rename_src[i].p->one); 394 331 insert_file_table(&file_table, i, rename_src[i].p->one); 332 333 /* Walk the destinations and find best source match */ 395 334 for (i = 0; i < rename_dst_nr; i++) 396 insert_file_table(&file_table, 1, i, rename_dst[i].two); 397 398 /* Find the renames */ 399 i = for_each_hash(&file_table, find_same_files, options); 400 401 /* .. and free the hash data structure */ 402 free_hash(&file_table); 403 404 return i; 335 renames += find_identical_files(&file_table, i, options); 336 337 /* Free the hash data structure and entries */ 338 hashmap_free(&file_table, 1); 339 340 return renames; 405 341 } 406 342 … … 513 449 strcmp(options->single_follow, p->two->path)) 514 450 continue; /* not interested */ 451 else if (!DIFF_OPT_TST(options, RENAME_EMPTY) && 452 is_empty_blob_sha1(p->two->sha1)) 453 continue; 515 454 else 516 455 locate_rename_dst(p->two, 1); 517 456 } 457 else if (!DIFF_OPT_TST(options, RENAME_EMPTY) && 458 is_empty_blob_sha1(p->one->sha1)) 459 continue; 518 460 else if (!DIFF_PAIR_UNMERGED(p) && !DIFF_FILE_VALID(p->two)) { 519 461 /* … … 573 515 if (options->show_rename_progress) { 574 516 progress = start_progress_delay( 575 "Performing inexact rename detection",517 _("Performing inexact rename detection"), 576 518 rename_dst_nr * rename_src_nr, 50, 1); 577 519 }
Note:
See TracChangeset
for help on using the changeset viewer.