2009-04-26 03:47:44 +04:00
|
|
|
# bzr.py - bzr support for the convert extension
|
|
|
|
#
|
|
|
|
# Copyright 2008, 2009 Marek Kubica <marek@xivilization.net> and others
|
|
|
|
#
|
|
|
|
# This software may be used and distributed according to the terms of the
|
2010-01-20 07:20:08 +03:00
|
|
|
# GNU General Public License version 2 or any later version.
|
2009-04-26 03:47:44 +04:00
|
|
|
|
2008-09-26 22:33:47 +04:00
|
|
|
# This module is for handling 'bzr', that was formerly known as Bazaar-NG;
|
|
|
|
# it cannot access 'bar' repositories, but they were never used very much
|
2016-03-02 19:32:52 +03:00
|
|
|
from __future__ import absolute_import
|
2008-09-26 22:33:47 +04:00
|
|
|
|
|
|
|
import os
|
2016-05-14 08:03:12 +03:00
|
|
|
|
|
|
|
from mercurial.i18n import _
|
2016-03-02 19:32:52 +03:00
|
|
|
from mercurial import (
|
|
|
|
demandimport,
|
|
|
|
error
|
|
|
|
)
|
|
|
|
from . import common
|
|
|
|
|
2008-09-26 22:33:47 +04:00
|
|
|
# These modules do not work with demandimport, so they are added to its
# ignore list before anything from bzrlib is imported.
demandimport.ignore.extend([
    'bzrlib.transactions',
    'bzrlib.urlutils',
    'ElementPath',
])

# bzrlib is optional: when it cannot be imported the short aliases below
# are simply left undefined, and bzr_source.__init__ detects that through
# a NameError on 'bzrdir'.
try:
    # bazaar imports
    import bzrlib.bzrdir
    import bzrlib.errors
    import bzrlib.revision
    import bzrlib.revisionspec
    bzrdir = bzrlib.bzrdir
    errors = bzrlib.errors
    revision = bzrlib.revision
    revisionspec = bzrlib.revisionspec
    # NOTE(review): bare attribute access, presumably to force the lazily
    # imported module to load inside this try block - confirm.
    revisionspec.RevisionSpec
except ImportError:
    pass

# Entry kinds getfile() is able to return; anything else is reported as
# a missing file.
supportedkinds = ('file', 'symlink')
|
|
|
|
|
2016-03-02 19:32:52 +03:00
|
|
|
class bzr_source(common.converter_source):
    """Conversion source reading Bazaar repositories through the Bazaar
    Python libraries (bzrlib)."""
|
|
|
|
|
2017-11-23 04:49:01 +03:00
|
|
|
def __init__(self, ui, repotype, path, revs=None):
    """Open the Bazaar repository found at ``path``.

    Raises common.NoRepo when ``path`` has no '.bzr' entry, when the
    Bazaar modules could not be imported, or when bzrlib reports that no
    repository is present at that location.
    """
    super(bzr_source, self).__init__(ui, repotype, path, revs=revs)

    # Cheap filesystem check first, before touching bzrlib at all.
    marker = os.path.join(path, '.bzr')
    if not os.path.exists(marker):
        raise common.NoRepo(_('%s does not look like a Bazaar repository')
                            % path)

    try:
        # access bzrlib stuff; the name is undefined when the module-level
        # import of bzrlib failed
        bzrdir
    except NameError:
        raise common.NoRepo(_('Bazaar modules could not be loaded'))

    # From here on only the absolute path is used, including in the
    # error message below.
    path = os.path.abspath(path)
    self._checkrepotype(path)
    try:
        controldir = bzrdir.BzrDir.open(path)
        self.sourcerepo = controldir.open_repository()
    except errors.NoRepositoryPresent:
        raise common.NoRepo(_('%s does not look like a Bazaar repository')
                            % path)

    # revision id -> parent ids, filled by getcommit()
    self._parentids = {}
|
|
|
|
|
2009-05-17 16:35:06 +04:00
|
|
|
def _checkrepotype(self, path):
    """Warn when ``path`` looks like a lightweight checkout.

    The working tree and its branch are opened through bzrlib and the
    base locations of their control directories are compared; a
    difference triggers a warning. Any exception raised along the way is
    reduced to an informational note.
    """
    # Lightweight checkouts detection is informational but probably
    # fragile at API level. It should not terminate the conversion.
    try:
        controldir = bzrdir.BzrDir.open_containing(path)[0]
        try:
            tree = controldir.open_workingtree(recommend_upgrade=False)
            branch = tree.branch
        except (errors.NoWorkingTree, errors.NotLocalUrl):
            # no usable working tree, only the branch can be inspected
            tree = None
            branch = controldir.open_branch()
        if tree is not None:
            treebase = tree.bzrdir.root_transport.base
            branchbase = branch.bzrdir.root_transport.base
            if treebase != branchbase:
                self.ui.warn(_('warning: lightweight checkouts may cause '
                               'conversion failures, try with a regular '
                               'branch instead.\n'))
    except Exception:
        self.ui.note(_('bzr source type could not be determined\n'))
|
|
|
|
|
2008-09-26 22:33:47 +04:00
|
|
|
def before(self):
    """Acquire a read lock on the source repository before converting.

    The lock is taken once for all the operations that might need it.
    Read locks don't block other reads or writes to the repository, so
    holding it should not affect other users of the source repository.

    Locking around every single operation that needs it (currently
    getting a file and getting the parent map) and releasing right
    afterwards would be the alternative, but that approach can take even
    40% longer.
    """
    repo = self.sourcerepo
    repo.lock_read()
|
|
|
|
|
|
|
|
def after(self):
    """Release the repository lock taken by before()."""
    repo = self.sourcerepo
    repo.unlock()
|
|
|
|
|
2012-02-08 20:45:10 +04:00
|
|
|
def _bzrbranches(self):
    """Return the branches found by the source repository.

    find_branches() is called with using=True to avoid nested
    repositories (see issue3254).
    """
    repo = self.sourcerepo
    return repo.find_branches(using=True)
|
|
|
|
|
2008-09-26 22:33:47 +04:00
|
|
|
def getheads(self):
    """Return the list of revision ids the conversion starts from.

    Without requested revisions (``self.revs`` is empty) this is the
    sorted list of the last revision of every branch returned by
    _bzrbranches(). Otherwise ``self.revs[0]`` is resolved as a Bazaar
    revision spec against each branch in turn; the id found in the last
    branch able to resolve it is used.

    'null:' entries are dropped from the result.

    Raises error.Abort when the requested revision cannot be resolved in
    any branch.
    """
    if not self.revs:
        heads = sorted(b.last_revision() for b in self._bzrbranches())
    else:
        revid = None
        for branch in self._bzrbranches():
            try:
                r = revisionspec.RevisionSpec.from_string(self.revs[0])
                info = r.in_history(branch)
            except errors.BzrError:
                # Not resolvable in this branch: move on to the next one
                # instead of reading an unset (or stale) 'info'.
                continue
            revid = info.rev_id
        if revid is None:
            raise error.Abort(_('%s is not a valid revision')
                              % self.revs[0])
        heads = [revid]
    # Empty repositories return 'null:', which cannot be retrieved
    heads = [h for h in heads if h != 'null:']
    return heads
|
2008-09-26 22:33:47 +04:00
|
|
|
|
|
|
|
def getfile(self, name, rev):
    """Return ``(data, mode)`` for file ``name`` at revision ``rev``.

    ``name`` is decoded with ``self.encoding`` (UTF-8 when unset) before
    being looked up in the revision tree. ``(None, None)`` is returned
    when the path is unknown in that tree or its kind is not listed in
    ``supportedkinds``. For symlinks the data is the link target.

    The mode is read from ``self._modecache``, so the entry for
    ``(name, rev)`` must already have been recorded there.

    Raises error.Abort for a symlink without a target.
    """
    revtree = self.sourcerepo.revision_tree(rev)
    fileid = revtree.path2id(name.decode(self.encoding or 'utf-8'))
    kind = revtree.kind(fileid) if fileid is not None else None
    if kind not in supportedkinds:
        # the file is not available anymore - was deleted
        return None, None

    mode = self._modecache[(name, rev)]
    if kind != 'symlink':
        sio = revtree.get_file(fileid)
        return sio.read(), mode

    target = revtree.get_symlink_target(fileid)
    if target is None:
        raise error.Abort(_('%s.%s symlink has no target')
                          % (name, rev))
    return target, mode
|
2008-09-26 22:33:47 +04:00
|
|
|
|
convert: introduce --full for converting all files
Convert will normally only process files that were changed in a source
revision, apply the filemap, and record it as a change in the target
repository. (If it ends up not really changing anything, nothing changes.)
That means that _if_ the filemap is changed before continuing an incremental
convert, the change will only kick in when the files it affects are modified in
a source revision and thus processed.
With --full, convert will make a full conversion every time and process
all files in the source repo and remove target repo files that shouldn't be
there. Filemap changes will thus kick in on the first converted revision, no
matter what is changed.
This flag should in most cases not make any difference but will make convert
significantly slower.
Other names have been considered for this feature, such as "resync", "sync",
"checkunmodified", "all" or "allfiles", but I found that they were less obvious
and required more explanation than "full" and were harder to describe
consistently.
2014-08-27 00:03:32 +04:00
|
|
|
def getchanges(self, version, full):
    """Return ``(files, copies, cleanp2)`` for revision ``version``.

    The revision tree is compared against the tree of its first parent
    only. The parent ids are taken (and removed) from the cache filled by
    getcommit(), so getcommit() must have been called for ``version``
    beforehand. The mode cache is reset and repopulated as a side effect,
    and the revision tree is kept in ``self._revtree``.

    The third element is always an empty set.

    Raises error.Abort when ``full`` is requested, which this source does
    not support.
    """
    if full:
        # The message used to name cvs, a copy-paste leftover.
        raise error.Abort(_("convert from bzr does not support --full"))
    self._modecache = {}
    self._revtree = self.sourcerepo.revision_tree(version)
    # get the parentids from the cache
    parentids = self._parentids.pop(version)
    # only diff against first parent id
    prevtree = self.sourcerepo.revision_tree(parentids[0])
    files, changes = self._gettreechanges(self._revtree, prevtree)
    return files, changes, set()
|
2008-09-26 22:33:47 +04:00
|
|
|
|
|
|
|
def getcommit(self, version):
    """Build the common.commit object describing revision ``version``.

    As a side effect the parent ids of the revision are stored in
    ``self._parentids`` for later use by getchanges() and
    getchangedfiles(). Ghost parents are filtered out; a revision without
    parents is cached with the null revision as its only parent.

    The branch name comes from the 'branch-nick' revision property
    (u'default' when absent), with 'trunk' mapped to 'default'.
    """
    rev = self.sourcerepo.get_revision(version)
    # populate parent id cache
    if rev.parent_ids:
        parents = self._filterghosts(rev.parent_ids)
        self._parentids[version] = parents
    else:
        parents = []
        self._parentids[version] = (revision.NULL_REVISION,)

    nick = rev.properties.get('branch-nick', u'default')
    branch = self.recode(nick)
    if branch == 'trunk':
        branch = 'default'

    # the timezone sign is flipped when building the date string
    date = '%d %d' % (rev.timestamp, -rev.timezone)
    return common.commit(parents=parents,
                         date=date,
                         author=self.recode(rev.committer),
                         desc=self.recode(rev.message),
                         branch=branch,
                         rev=version)
|
|
|
|
|
|
|
|
def gettags(self):
    """Return a dict mapping recoded tag names to revision ids.

    Tags are collected from every branch returned by _bzrbranches().
    Branches that do not support tags are skipped, so they no longer
    discard the tags already gathered from other branches. When the same
    tag exists in several branches the last branch wins.
    """
    bytetags = {}
    for branch in self._bzrbranches():
        if not branch.supports_tags():
            # Nothing to read here; keep what other branches provided.
            continue
        tagdict = branch.tags.get_tag_dict()
        for name, rev in tagdict.items():
            bytetags[self.recode(name)] = rev
    return bytetags
|
|
|
|
|
|
|
|
def getchangedfiles(self, rev, i):
    """Return the paths changed in ``rev`` relative to one of its parents.

    ``i`` is an index into the parent ids cached for ``rev`` by
    getcommit(); with ``i`` set to None the revision is compared against
    the null revision. The mode cache is reset as a side effect.
    """
    self._modecache = {}
    curtree = self.sourcerepo.revision_tree(rev)
    if i is None:
        # no parent id, get the empty revision
        parentid = revision.NULL_REVISION
    else:
        parentid = self._parentids[rev][i]

    prevtree = self.sourcerepo.revision_tree(parentid)
    # only the (path, revid) list is needed here, not the renames
    files = self._gettreechanges(curtree, prevtree)[0]
    return [entry[0] for entry in files]
|
|
|
|
|
|
|
|
def _gettreechanges(self, current, origin):
    """Compute the file changes between two Bazaar revision trees.

    ``current`` is the tree being converted and ``origin`` the tree it is
    compared against.

    Returns ``(changes, renames)``: ``changes`` is a list of
    ``(path, revid)`` pairs, one for every path that was touched (both
    the old and the new path for a rename), and ``renames`` maps each
    destination path to its source path. Paths are passed through
    ``self.recode``; ``revid`` is the revision id of ``current``.

    As a side effect ``self._modecache`` receives the mode ('x' for
    executables, 'l' for symlinks, '' otherwise) of every added, modified
    or renamed file, keyed by ``(path, revid)``.
    """
    revid = current._revision_id
    changes = []
    renames = {}
    seen = set()

    # Fall back to the deprecated attribute for legacy installations.
    try:
        inventory = origin.root_inventory
    except AttributeError:
        inventory = origin.inventory

    # Process the entries by reverse lexicographic name order to
    # handle nested renames correctly, most specific first.
    curchanges = sorted(current.iter_changes(origin),
                        key=lambda c: c[1][0] or c[1][1],
                        reverse=True)
    for (fileid, paths, changed_content, versioned, parent, name,
         kind, executable) in curchanges:

        if paths[0] == u'' or paths[1] == u'':
            # ignore changes to tree root
            continue

        # bazaar tracks directories, mercurial does not, so
        # we have to rename the directory contents
        if kind[1] == 'directory':
            if kind[0] not in (None, 'directory'):
                # Replacing 'something' with a directory, record it
                # so it can be removed.
                changes.append((self.recode(paths[0]), revid))

            if kind[0] == 'directory' and None not in paths:
                renaming = paths[0] != paths[1]
                # neither an add nor an delete - a move
                # rename all directory contents manually
                subdir = inventory.path2id(paths[0])
                # get all child-entries of the directory
                for childname, entry in inventory.iter_entries(subdir):
                    # hg does not track directory renames
                    if entry.kind == 'directory':
                        continue
                    frompath = self.recode(paths[0] + '/' + childname)
                    if frompath in seen:
                        # Already handled by a more specific change entry
                        # This is important when you have:
                        # a => b
                        # a/c => a/c
                        # Here a/c must not be renamed into b/c
                        continue
                    seen.add(frompath)
                    if not renaming:
                        continue
                    topath = self.recode(paths[1] + '/' + childname)
                    # register the files as changed
                    changes.append((frompath, revid))
                    changes.append((topath, revid))
                    # add to mode cache; symlinks use 'l', the same flag
                    # as the regular (non-directory) path below
                    if entry.executable:
                        mode = 'x'
                    elif entry.kind == 'symlink':
                        mode = 'l'
                    else:
                        mode = ''
                    self._modecache[(topath, revid)] = mode
                    # register the change as move
                    renames[topath] = frompath

            # no further changes, go to the next change
            continue

        # we got unicode paths, need to convert them
        path, topath = paths
        if path is not None:
            path = self.recode(path)
        if topath is not None:
            topath = self.recode(topath)
        seen.add(path or topath)

        if topath is None:
            # file deleted
            changes.append((path, revid))
            continue

        # renamed
        if path and path != topath:
            renames[topath] = path
            changes.append((path, revid))

        # populate the mode cache from the new side of the change
        newkind, newexecutable = kind[1], executable[1]
        if newexecutable:
            mode = 'x'
        elif newkind == 'symlink':
            mode = 'l'
        else:
            mode = ''
        self._modecache[(topath, revid)] = mode
        changes.append((topath, revid))

    return changes, renames
|
|
|
|
|
|
|
|
def _filterghosts(self, ids):
    """Return the revision ids from ``ids`` that are not ghosts.

    Ghost revisions are not supported by hg, see
    <http://bazaar-vcs.org/GhostRevision>. An id is kept only when it
    appears in the parent map the repository returns for ``ids``; the
    original order is preserved and the result is a tuple.
    """
    known = self.sourcerepo.get_parent_map(ids)
    return tuple(revid for revid in ids if revid in known)
|