Merge lp:~ian-clatworthy/bzr/faster-log-file into lp:~bzr/bzr/trunk-old

Proposed by Ian Clatworthy
Status: Superseded
Proposed branch: lp:~ian-clatworthy/bzr/faster-log-file
Merge into: lp:~bzr/bzr/trunk-old
Diff against target: 180 lines (has conflicts)
Text conflict in bzrlib/log.py
To merge this branch: bzr merge lp:~ian-clatworthy/bzr/faster-log-file
Reviewer: John A Meinel
Review status: Needs Information
Review via email: mp+6805@code.launchpad.net

This proposal has been superseded by a proposal from 2009-06-17.

Ian Clatworthy (ian-clatworthy) wrote:

This patch speeds up 'bzr log FILE' on flat-ish histories, as commonly found after an import from svn, cvs and other centralized VCS tools. On OOo, it cuts the time to log a typical file from 29 seconds to 1.5 seconds.

The key to this improvement is starting with the per-file graph and searching the mainline until the revisions of interest are found. That works very well when the history of a project is flat or mostly flat, because it avoids the 27 seconds required to calculate the full revision graph. In a nutshell, the algorithm changes from O(full-history) to O(file-life).
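The idea can be sketched as follows (a hypothetical illustration with made-up names, not bzrlib's actual API): the per-file graph yields the set of revisions that modified the file, and we then walk the mainline newest-to-oldest, stopping as soon as every one of them has been matched.

```python
def match_file_revisions(file_rev_ids, mainline):
    """Return (revno, rev_id) pairs from the mainline that touched the file.

    file_rev_ids: revision ids taken from the per-file graph.
    mainline: iterable of (revno, rev_id) tuples, newest first.
    """
    missing = set(file_rev_ids)
    matched = []
    for revno, rev_id in mainline:
        if rev_id in missing:
            matched.append((revno, rev_id))
            missing.remove(rev_id)
            if not missing:
                break  # every interesting revision found; stop early
    return matched

# A toy 5-revision mainline where the file changed in r4 and r2:
mainline = [(5, 'r5'), (4, 'r4'), (3, 'r3'), (2, 'r2'), (1, 'r1')]
print(match_file_revisions({'r4', 'r2'}, mainline))  # [(4, 'r4'), (2, 'r2')]
```

Because the walk stops once the last file revision is matched, the cost tracks the life of the file rather than the depth of the whole branch history.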

There's certainly room for further smarts here, but I feel this is a useful step forward as it stands.

John A Meinel (jameinel) wrote:

So I see that you avoided "incorrect" results on non-linear ancestries by including checks for this case. However:

1) I'm not sure that the checks are complete. For example, it doesn't matter whether the per-file graph has merges or not, as to how the 'include-merges' flag should be handled. Consider the case:

  :
  A
  |\
  | B # Mod foo
  |/
  C # Merge B's changes

In that case we want to see both revisions B and C in the "bzr log foo" output. Even though the per-file graph in this case looks simply like:

 :
 B # Mod foo

2) I'm a bit concerned that we do all of this work with _linear_view_revisions which in the common case for OOo will have to walk the *entire* history (assuming 'bzr log foo' with no -r specified), which we then throw away.

At least, I'm expecting that once a project like OOo changes to a DVCS, they will actually start including merges. Which means that they'll still have 200k revisions in the mainline, but then *also* have all sorts of merge revisions after that 200k...

I guess, I'm mostly worried that while this makes some bits much faster for your OOo testing, it will actually cause regressions in a lot of other cases.

Consider 'bzr log bzrlib/builtins.py', how much time will be spent in this code, just to have it end up deciding to return None?
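To make that worry concrete, here's a hedged toy model (not bzrlib code; names are mine) of what the fast path pays when none of the file's revisions sit on the scanned mainline:

```python
def scan_cost(file_rev_ids, mainline):
    """Count mainline revisions visited before the scan gives up or finishes.

    Returns (revisions_visited, fell_back) where fell_back is True when
    some file revisions were never found on the mainline.
    """
    missing = set(file_rev_ids)
    visited = 0
    for _, rev_id in mainline:
        visited += 1
        if rev_id in missing:
            missing.remove(rev_id)
            if not missing:
                break
    return visited, bool(missing)

# File only ever modified in merged (non-mainline) revisions:
mainline = [(n, 'r%d' % n) for n in range(200000, 0, -1)]
print(scan_cost({'merged-rev'}, mainline))  # (200000, True)
```

In that case the scan walks all 200k mainline revisions, matches nothing, and the caller still has to fall back to the full-graph algorithm, so the fast-path work is pure overhead.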

review: Needs Information
4385. By Ian Clatworthy

merge bzr.dev r4446

4386. By Ian Clatworthy

avoid looking back too far for files created in merge revisions

Ian Clatworthy (ian-clatworthy) wrote:

> 1) I'm not sure that the checks are complete. For example, it doesn't matter
> whether the per-file graph has merges or not, as to how the 'include-merges'
> flag should be handled. Consider the case:
>
> :
> A
> |\
> | B # Mod foo
> |/
> C # Merge B's changes
>
> In that case we want to see both revisions B and C in the "bzr log foo"
> output. Even though the per-file graph in this case looks simply like:
>
> :
> B # Mod foo

I think the code handles this ok. If log --include-merges (or -n0) is given, it uses the old algorithm immediately. Otherwise, it will just show B.
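Roughly, the fallback check in the patch can be sketched like this (an illustrative reading of the diff, with made-up names):

```python
def use_fast_path(levels, file_graph_has_merges):
    """Decide whether the per-file fast path may be attempted.

    levels: the -n value; anything other than 1 requests merge revisions.
    file_graph_has_merges: True if the per-file graph contains merges.
    """
    include_merges = levels != 1
    # When merge revisions are requested and the file's own history
    # contains merges, the fast path could produce incomplete results,
    # so fall back to the old full-graph algorithm.
    return not (include_merges and file_graph_has_merges)

print(use_fast_path(1, True))   # True: mainline-only view wanted
print(use_fast_path(0, True))   # False: fall back to full history
```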

> 2) I'm a bit concerned that we do all of this work with _linear_view_revisions
> which in the common case for OOo will have to walk the *entire* history
> (assuming 'bzr log foo' with no -r specified), which we then throw away.
>
> At least, I'm expecting that once a project like OOo changes to a DVCS, they
> will actually start including merges. Which means that they'll still have 200k
> revisions in the mainline, but then *also* have all sorts of merge revisions
> after that 200k...
>
> I guess, I'm mostly worried that while this makes some bits much faster for
> your OOo testing, it will actually cause regressions in a lot of other cases.
>
> Consider 'bzr log bzrlib/builtins.py', how much time will be spent in this
> code, just to have it end up deciding to return None?

Good points. I ran the benchmark you suggested and it did indeed indicate a problem. I'll push an updated patch.

4387. By Ian Clatworthy

add NEWS item

Unmerged revisions

4387. By Ian Clatworthy

add NEWS item

4386. By Ian Clatworthy

avoid looking back too far for files created in merge revisions

4385. By Ian Clatworthy

merge bzr.dev r4446

4384. By Ian Clatworthy

faster log file -n0 for flat file history

4383. By Ian Clatworthy

speed up log file on flat-ish histories

4382. By Canonical.com Patch Queue Manager <email address hidden>

(vila) Fix blatant performance regression for annotate in gc repos

4381. By Canonical.com Patch Queue Manager <email address hidden>

(Jelmer) Add registry for the 'bzr serve' protocol.

4380. By Canonical.com Patch Queue Manager <email address hidden>

(igc) two simple log dotted revno tests (Marius Kruger)

4379. By Canonical.com Patch Queue Manager <email address hidden>

(tanner) merge 1.15final back to trunk

4378. By Canonical.com Patch Queue Manager <email address hidden>

(igc) faster branch in a shared repo for dev6rr format (Ian
 Clatworthy)

Preview Diff

=== modified file 'bzrlib/builtins.py'
--- bzrlib/builtins.py 2009-06-11 06:54:33 +0000
+++ bzrlib/builtins.py 2009-06-16 02:37:12 +0000
@@ -2230,16 +2230,14 @@
         # the underlying repository format is faster at generating
         # deltas or can provide everything we need from the indices.
         # The default algorithm - match-using-deltas - works for
-        # multiple files and directories and is faster for small
-        # amounts of history (200 revisions say). However, it's too
+        # multiple files and directories. However, it's too
         # slow for logging a single file in a repository with deep
         # history, i.e. > 10K revisions. In the spirit of "do no
         # evil when adding features", we continue to use the
         # original algorithm - per-file-graph - for the "single
         # file that isn't a directory without showing a delta" case.
-        partial_history = revision and b.repository._format.supports_chks
         match_using_deltas = (len(file_ids) != 1 or filter_by_dir
-            or delta_type or partial_history)
+            or delta_type)
 
         # Build the LogRequest and execute it
         if len(file_ids) == 0:
=== modified file 'bzrlib/log.py'
--- bzrlib/log.py 2009-06-10 03:56:49 +0000
+++ bzrlib/log.py 2009-06-16 02:37:12 +0000
@@ -69,7 +69,11 @@
     config,
     diff,
     errors,
+<<<<<<< TREE
     foreign,
+=======
+    graph,
+>>>>>>> MERGE-SOURCE
     repository as _mod_repository,
     revision as _mod_revision,
     revisionspec,
@@ -460,21 +464,131 @@
             direction=rqst.get('direction'))
 
     def _log_revision_iterator_using_per_file_graph(self):
-        # Get the base revisions, filtering by the revision range.
-        # Note that we always generate the merge revisions because
-        # filter_revisions_touching_file_id() requires them ...
         rqst = self.rqst
-        view_revisions = _calc_view_revisions(self.branch, self.start_rev_id,
-            self.end_rev_id, rqst.get('direction'), True)
-        if not isinstance(view_revisions, list):
-            view_revisions = list(view_revisions)
-        view_revisions = _filter_revisions_touching_file_id(self.branch,
-            rqst.get('specific_fileids')[0], view_revisions,
-            include_merges=rqst.get('levels') != 1)
+        direction = rqst.get('direction')
+        file_id = rqst.get('specific_fileids')[0]
+        multi_level = rqst.get('levels') != 1
+        try:
+            file_graph, graph_tip = _per_file_graph(self.branch, file_id,
+                self.end_rev_id)
+        except errors.NoSuchId:
+            # File doesn't exist at end of range - fall back to old algorithm
+            view_revisions = None
+        else:
+            # Try iterating over the revisions given by the per-file graph.
+            # This returns None if it fails.
+            view_revisions = _calc_view_revisions_for_file(self.branch,
+                file_graph, graph_tip, self.start_rev_id, self.end_rev_id,
+                direction, multi_level)
+
+        if view_revisions is None:
+            # Get the base revisions, filtering by the revision range.
+            # Note that we always generate the merge revisions because
+            # filter_revisions_touching_file_id() requires them ...
+            view_revisions = _calc_view_revisions(self.branch,
+                self.start_rev_id, self.end_rev_id, direction, True)
+            if not isinstance(view_revisions, list):
+                view_revisions = list(view_revisions)
+            # TODO: pass in the already calculated file graph and re-use it
+            view_revisions = _filter_revisions_touching_file_id(self.branch,
+                file_id, view_revisions, include_merges=multi_level)
         return make_log_rev_iterator(self.branch, view_revisions,
             rqst.get('delta_type'), rqst.get('message_search'))
 
 
+def _per_file_graph(branch, file_id, end_rev_id):
+    """Get the per file graph.
+
+    :param end_rev_id: the last interesting revision-id or None to use
+        the basis tree. If non-None, the file must exist in that revision
+        or NoSuchId will be raised.
+    :return: graph, tip where
+        graph is a Graph with (file_id,rev_id) tuple keys and
+        tip is the graph tip
+    """
+    # Find when the file was last modified
+    if end_rev_id is None:
+        rev_tree = branch.basis_tree()
+    else:
+        rev_tree = branch.repository.revision_tree(end_rev_id)
+    last_modified = rev_tree.inventory[file_id].revision
+
+    # Return the result
+    tip = (file_id, last_modified)
+    return graph.Graph(branch.repository.texts), tip
+
+
+def _calc_view_revisions_for_file(branch, file_graph, graph_tip, start_rev_id,
+    end_rev_id, direction, include_merges):
+    """Calculate the revisions to view for a file.
+
+    :param file_graph: the per-file graph
+    :param graph_tip: the tip of the per-file graph
+    :param include_merges: if True, include all revisions, not just the top
+        level
+    :return: An list of (revision_id, dotted_revno, merge_depth) tuples OR
+        None if the algorithm fails (and another one should be used).
+    """
+    br_revno, br_rev_id = branch.last_revision_info()
+    if br_revno == 0:
+        return []
+
+    # Find when the file was changed and merged
+    file_rev_ids = []
+    file_merges = []
+    for (_, rev_id), parents in file_graph.iter_ancestry([graph_tip]):
+        file_rev_ids.append(rev_id)
+        if len(parents) > 1:
+            file_merges.append(rev_id)
+
+    # Handle the simple cases
+    if len(file_rev_ids) == 1:
+        return _generate_one_revision(branch, file_rev_ids[0], br_rev_id,
+            br_revno)
+    elif len(file_rev_ids) == 0:
+        # Should this ever happen?
+        return []
+    elif file_merges and include_merges:
+        # Fall back to the old algorithm for now
+        return None
+
+    # Find all the revisions we can using a linear search
+    result = []
+    missing = set(file_rev_ids)
+    merges_to_search = 0
+    try:
+        candidates = _linear_view_revisions(branch, start_rev_id, end_rev_id)
+        for rev_id, revno, depth in candidates:
+            if rev_id in missing:
+                result.append((rev_id, revno, depth))
+                missing.remove(rev_id)
+                if len(missing) == 0:
+                    break
+            if _has_merges(branch, rev_id):
+                merges_to_search += 1
+    except _StartNotLinearAncestor:
+        raise errors.BzrCommandError('Start revision not found in'
+            ' left-hand history of end revision.')
+
+    # If no merges were found in the revision range, then we can be
+    # certain that we've found all the revisions we care about.
+    if missing and merges_to_search:
+        # TODO: search the deltas of the merges, splicing successful
+        # matches into their rightful spots. That should work well on
+        # chk repositories for typical histories but we need to benchmark
+        # it to confirm. There's most likely a sweet spot above which
+        # the O(history) traditional way - generating the full graph of
+        # history and post-filtering - remains the best performer.
+        trace.mutter("log file fastpath failed to find %d revisions" %
+            len(missing))
+        return None
+
+    # We came, we saw, we walked away victorious ...
+    if direction == 'forward':
+        result = reversed(result)
+    return result
+
+
 def _calc_view_revisions(branch, start_rev_id, end_rev_id, direction,
     generate_merge_revisions, delayed_graph_generation=False):
     """Calculate the revisions to view.