diff options
Diffstat (limited to 'bzrlib/_knit_load_data_py.py')
-rw-r--r-- | bzrlib/_knit_load_data_py.py | 96 |
1 files changed, 96 insertions, 0 deletions
diff --git a/bzrlib/_knit_load_data_py.py b/bzrlib/_knit_load_data_py.py new file mode 100644 index 0000000..7e781f8 --- /dev/null +++ b/bzrlib/_knit_load_data_py.py @@ -0,0 +1,96 @@ +# Copyright (C) 2007 Canonical Ltd +# +# This program is free software; you can redistribute it and/or modify +# it under the terms of the GNU General Public License as published by +# the Free Software Foundation; either version 2 of the License, or +# (at your option) any later version. +# +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU General Public License for more details. +# +# You should have received a copy of the GNU General Public License +# along with this program; if not, write to the Free Software +# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA + +from __future__ import absolute_import + +from bzrlib import errors + + +def _load_data_py(kndx, fp): + """Read in a knit index.""" + cache = kndx._cache + history = kndx._history + + kndx.check_header(fp) + # readlines reads the whole file at once: + # bad for transports like http, good for local disk + # we save 60 ms doing this one change ( + # from calling readline each time to calling + # readlines once. + # probably what we want for nice behaviour on + # http is a incremental readlines that yields, or + # a check for local vs non local indexes, + history_top = len(history) - 1 + for line in fp.readlines(): + rec = line.split() + if len(rec) < 5 or rec[-1] != ':': + # corrupt line. + # FIXME: in the future we should determine if its a + # short write - and ignore it + # or a different failure, and raise. RBC 20060407 + continue + + try: + parents = [] + for value in rec[4:-1]: + if value[0] == '.': + # uncompressed reference + parent_id = value[1:] + else: + parent_id = history[int(value)] + parents.append(parent_id) + except (IndexError, ValueError), e: + # The parent could not be decoded to get its parent row. This + # at a minimum will cause this row to have wrong parents, or + # even to apply a delta to the wrong base and decode + # incorrectly. its therefore not usable, and because we have + # encountered a situation where a new knit index had this + # corrupt we can't asssume that no other rows referring to the + # index of this record actually mean the subsequent uncorrupt + # one, so we error. + raise errors.KnitCorrupt(kndx._filename, "line %r: %s" % (rec, e)) + + version_id, options, pos, size = rec[:4] + version_id = version_id + try: + pos = int(pos) + except ValueError, e: + raise errors.KnitCorrupt(kndx._filename, + "invalid position on line %r: %s" + % (rec, e)) + try: + size = int(size) + except ValueError, e: + raise errors.KnitCorrupt(kndx._filename, + "invalid size on line %r: %s" + % (rec, e)) + + # See kndx._cache_version + # only want the _history index to reference the 1st + # index entry for version_id + if version_id not in cache: + history_top += 1 + index = history_top + history.append(version_id) + else: + index = cache[version_id][5] + cache[version_id] = (version_id, + options.split(','), + pos, + size, + tuple(parents), + index) + # end kndx._cache_version |