Don't add a separate class to iterate history

2016-07-07 17:30:49 -04:00 · 2016-07-07 17:30:49 -04:00 · 35471d3c3f
commit 35471d3c3f
parent 74452fe58f
1 changed files with 47 additions and 75 deletions
--- a/realms/modules/wiki/models.py
+++ b/realms/modules/wiki/models.py
@ -96,7 +96,7 @@ class WikiPage(object):
        if cached:
            return cached
-        info = self.get_history(limit=1)[0]
+        info = next(self.history)
        cache.set(cache_key, info)
        return info
@ -104,10 +104,54 @@ class WikiPage(object):
    def history(self):
        """Get page history.
-        :return: list -- List of dicts
+        History can take a long time to generate for repositories with many commits.
        This returns an iterator to avoid having to load them all at once.
        :return: iter -- Iterator over dicts
        """
-        return PageHistory(self, self._cache_key('history'))
+        cache_complete = False
        cached_revs = cache.get(self._cache_key('history')) or []
        start_sha = None
        if cached_revs:
            if cached_revs[-1] == 'TAIL':
                del cached_revs[-1]
                cache_complete = True
            else:
                start_sha = cached_revs[-1]['sha']
        for rev in cached_revs:
            yield rev
        if cache_complete:
            return
        if not len(self.wiki.repo.open_index()):
            # Index is empty, no commits
            return
        walker = iter(self.wiki.repo.get_walker(paths=[self.filename], include=start_sha, follow=True))
        if start_sha:
            # If we are not starting from HEAD, we already have the start commit
            next(walker)
        filename = self.filename
        try:
            for entry in walker:
                change_type = None
                for change in entry.changes():
                    if change.new.path == filename:
                        filename = change.old.path
                        change_type = change.type
                        break
                author_name, author_email = entry.commit.author.rstrip('>').split('<')
                r = dict(author=author_name.strip(),
                         author_email=author_email,
                         time=entry.commit.author_time,
                         message=entry.commit.message,
                         sha=entry.commit.id,
                         type=change_type)
                cached_revs.append(r)
                yield r
            cached_revs.append('TAIL')
        finally:
            cache.set(self._cache_key('history'), cached_revs)
    @property
    def partials(self):
@ -298,75 +342,3 @@ class WikiPage(object):
            # We'll get a KeyError if self.sha isn't in the repo, or if self.filename isn't in the tree of our commit
            return False
        return True
 class PageHistory(collections.Sequence):
    """Acts like a list, but dynamically loads and caches history revisions as requested."""
    def __init__(self, page, cache_key):
        self.page = page
        self.cache_key = cache_key
        self._store = cache.get(cache_key) or []
        if not self._store:
            self._iter_rest = self._get_rest()
        elif self._store[-1] == 'TAIL':
            self._iter_rest = None
        else:
            self._iter_rest = self._get_rest(self._store[-1]['sha'])
    def __iter__(self):
        # Iterate over the revisions already cached
        for r in self._store:
            if r == 'TAIL':
                return
            yield r
        # Iterate over the revisions yet to be discovered
        if self._iter_rest:
            try:
                for r in self._iter_rest:
                    self._store.append(r)
                    yield r
                self._store.append('TAIL')
            finally:
                # Make sure we cache the results whether or not the iteration was completed
                cache.set(self.cache_key, self._store)
    def _get_rest(self, start_sha=None):
        if not len(self.page.wiki.repo.open_index()):
            # Index is empty, no commits
            return
        walker = iter(self.page.wiki.repo.get_walker(paths=[self.page.filename], include=start_sha, follow=True))
        if start_sha:
            # If we are not starting from HEAD, we already have the start commit
            print(next(walker))
        filename = self.page.filename
        for entry in walker:
            change_type = None
            for change in entry.changes():
                if change.new.path == filename:
                    filename = change.old.path
                    change_type = change.type
                    break
            author_name, author_email = entry.commit.author.rstrip('>').split('<')
            r = dict(author=author_name.strip(),
                     author_email=author_email,
                     time=entry.commit.author_time,
                     message=entry.commit.message,
                     sha=entry.commit.id,
                     type=change_type)
            yield r
    def __getitem__(self, index):
        if isinstance(index, slice):
            return list(itertools.islice(self, index.start, index.stop, index.step))
        else:
            try:
                return next(itertools.islice(self, index, index+1))
            except StopIteration:
                raise IndexError
    def __len__(self):
        if not self._store or self._store[-1] != 'TAIL':
            # Force generation of all revisions
            list(self)
        return len(self._store) - 1  # Don't include the TAIL sentinel