#! /usr/bin/python

""" hg-to-git.py - A Mercurial to GIT converter

    Copyright (C)2007 Stelian Pop <stelian@popies.net>

    This program is free software; you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation; either version 2, or (at your option)
    any later version.

    This program is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You should have received a copy of the GNU General Public License
    along with this program; if not, write to the Free Software
    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
"""

import getopt
import os
import os.path
import pickle
# NOTE(review): popen2 is not referenced by the code visible in this file and
# the module only exists on Python 2; kept because other code may rely on it.
import popen2
import re
import sys
import tempfile

# Shell-quoting helper: shlex.quote where available, pipes.quote on Python 2.
try:
    from shlex import quote
except ImportError:
    from pipes import quote

# Module-level conversion state.  All revision keys are hg revision numbers
# stored as strings ("0", "1", ...).

# Maps hg version -> git version (the commit hash printed by "git show")
hgvers = {}
# List of children for each hg revision (tuple of revision strings)
hgchildren = {}
# List of parents for each hg revision: (parent, merge parent or None)
hgparents = {}
# Current branch for each hg revision ("master" or "branch-<rev>")
hgbranch = {}
# Number of new changesets converted from hg
hgnewcsets = 0
#------------------------------------------------------------------------------

def usage():
    """Print the command-line synopsis and option summary to standard output.

    The program name shown in the first line is taken from ``sys.argv[0]``.
    """
    # A single parenthesised argument prints the same text whether ``print``
    # is parsed as a statement or called as a function.
    print("""\
%s: [OPTIONS] <hgprj>

options:
    -s, --gitstate=FILE: name of the state to be saved/read
                         for incrementals
    -n, --nrepack=INT:   number of changesets that will trigger
                         a repack (default=0, -1 to deactivate)
    -v, --verbose:       be verbose

required:
    hgprj:  name of the HG project to import (directory)
""" % sys.argv[0])

#------------------------------------------------------------------------------

def getgitenv(user, date):
    """Build the shell prefix that exports git's author identity and date.

    ``user`` is split into a name and an e-mail address when it has the form
    ``Name <email>``; otherwise the whole string becomes the author name and
    the e-mail is exported empty.  ``date`` is exported as-is.

    Returns a string of ``export VAR=value ;`` statements (GIT_AUTHOR_NAME,
    GIT_AUTHOR_EMAIL, GIT_AUTHOR_DATE) meant to be prepended to a git command
    line that is run through the shell.  Only the author variables are set;
    the committer variables are not exported.
    """
    elems = re.match(r'(.*?)\s+<(.*)>', user)
    if elems:
        name, email = elems.group(1), elems.group(2)
    else:
        name, email = user, ''

    # The values come from repository metadata, so quote them for the shell:
    # a quote, "$" or backtick in an author name must not alter the command.
    return ('export GIT_AUTHOR_NAME=%s ;'
            'export GIT_AUTHOR_EMAIL=%s ;'
            'export GIT_AUTHOR_DATE=%s ;'
            % (quote(name), quote(email), quote(date)))

#------------------------------------------------------------------------------

# Command-line handling: fills in `state`, `opt_nrepack` and `verbose`, then
# changes into the hg project directory given as the single positional
# argument.
state = ''
opt_nrepack = 0
verbose = False

try:
    # -t/--tempdir is accepted (with an argument) but its value is not used
    # by the code below.
    opts, args = getopt.getopt(sys.argv[1:], 's:t:n:v',
                               ['gitstate=', 'tempdir=', 'nrepack=', 'verbose'])
    for o, a in opts:
        if o in ('-s', '--gitstate'):
            # Made absolute now because the working directory changes below.
            state = os.path.abspath(a)
        if o in ('-n', '--nrepack'):
            opt_nrepack = int(a)
        if o in ('-v', '--verbose'):
            verbose = True
except (getopt.GetoptError, ValueError):
    # Unknown option, missing option argument, or a non-integer --nrepack.
    usage()
    sys.exit(1)

# Exactly one positional argument (the hg project directory) is required.
if len(args) != 1:
    usage()
    sys.exit(1)

hgprj = args[0]
os.chdir(hgprj)

# Incremental runs: reload the hg -> git revision map saved by a previous run.
if state:
    if os.path.exists(state):
        if verbose:
            print('State does exist, reading')
        # NOTE(review): unpickling can execute arbitrary code; only point
        # --gitstate at files written by this script.
        with open(state, 'rb') as f:
            hgvers = pickle.load(f)
    else:
        print('State does not exist, first run')

# Ask hg for the revision number of the tip; `tip` stays a string here and is
# converted with int() where it is used.
sock = os.popen('hg tip --template "{rev}"')
tip = sock.read()
# close() returns a non-None exit status when the command failed.
if sock.close():
    sys.exit(1)
if verbose:
    print('tip is %s' % tip)

# Calculate the branches
#
# Fills hgchildren, hgparents and hgbranch for every revision from 0 to tip.
# Revision 0 is the root: no parents, on "master".
if verbose:
    print('analysing the branches...')
hgchildren["0"] = ()
hgparents["0"] = (None, None)
hgbranch["0"] = "master"
for cset in range(1, int(tip) + 1):
    rev = str(cset)
    hgchildren[rev] = ()
    # Each entry of the {parents} output is cut at its first ':' to keep the
    # part before it (used below as a revision number).
    prnts = os.popen('hg log -r %d --template "{parents}"' % cset).read().strip().split(' ')
    prnts = [x[:x.find(':')] for x in prnts]
    if prnts[0] != '':
        parent = prnts[0].strip()
    else:
        # hg printed no parents: fall back to the previous revision.
        parent = str(cset - 1)
    hgchildren[parent] += (rev,)
    if len(prnts) > 1:
        # A second entry is the merge parent.
        mparent = prnts[1].strip()
        hgchildren[mparent] += (rev,)
    else:
        mparent = None

    hgparents[rev] = (parent, mparent)

    if mparent:
        # For merge changesets, take either one, preferably the 'master' branch
        if hgbranch[mparent] == 'master':
            hgbranch[rev] = 'master'
        else:
            hgbranch[rev] = hgbranch[parent]
    else:
        # Normal changesets
        # For first children, take the parent branch, for the others create a new branch
        if hgchildren[parent][0] == rev:
            hgbranch[rev] = hgbranch[parent]
        else:
            hgbranch[rev] = "branch-" + rev

# Revision 0 has never been converted, so there is no git repository yet.
if "0" not in hgvers:
    print('creating repository')
    os.system('git init')

# loop through every hg changeset
#
# For each revision not yet recorded in hgvers: check out the matching git
# branch, replace the working tree with the hg revision's files, commit with
# the hg author/date/description, and record the resulting git commit.
for cset in range(int(tip) + 1):
    rev = str(cset)

    # incremental, already seen
    if rev in hgvers:
        continue
    hgnewcsets += 1
    branch = hgbranch[rev]

    # get info: the template prints tags, date and author on three lines
    # (the "\n" escapes become real newlines inside the shell's double quotes)
    log_data = os.popen('hg log -r %d --template "{tags}\n{date|date}\n{author}\n"' % cset).readlines()
    tag = log_data[0].strip()
    date = log_data[1].strip()
    user = log_data[2].strip()
    parent, mparent = hgparents[rev]

    # get comment: written to a temporary file that "git commit -F" reads
    (fdcomment, filecomment) = tempfile.mkstemp()
    csetcomment = os.popen('hg log -r %d --template "{desc}"' % cset).read().strip()
    os.write(fdcomment, csetcomment)
    os.close(fdcomment)

    print('-----------------------------------------')
    print('cset: %s' % cset)
    print('branch: %s' % branch)
    print('user: %s' % user)
    print('date: %s' % date)
    print('comment: %s' % csetcomment)
    if parent:
        print('parent: %s' % parent)
    if mparent:
        print('mparent: %s' % mparent)
    if tag:
        print('tag: %s' % tag)
    print('-----------------------------------------')

    # checkout the parent if necessary
    if cset != 0:
        if branch == "branch-" + rev:
            # First changeset of a new branch: start it at the parent's commit.
            print('creating new branch %s' % branch)
            os.system('git checkout -b %s %s' % (branch, hgvers[parent]))
        else:
            print('checking out branch %s' % branch)
            os.system('git checkout %s' % branch)

    # merge
    if mparent:
        # The "other" branch is whichever parent's branch is not this one.
        if hgbranch[parent] == branch:
            otherbranch = hgbranch[mparent]
        else:
            otherbranch = hgbranch[parent]
        print('merging %s into %s' % (otherbranch, branch))
        # "-s ours --no-commit": only the merge is recorded here; the tree
        # content is replaced from hg below and committed afterwards.
        os.system(getgitenv(user, date) + 'git merge --no-commit -s ours "" %s %s' % (branch, otherbranch))

    # remove everything except .git and .hg directories
    os.system(r'find . \( -path "./.hg" -o -path "./.git" \) -prune -o ! -name "." -print | xargs rm -rf')

    # repopulate with checkouted files
    os.system('hg update -C %d' % cset)

    # add new files
    os.system('git ls-files -x .hg --others | git update-index --add --stdin')
    # delete removed files
    os.system('git ls-files -x .hg --deleted | git update-index --remove --stdin')

    # commit
    os.system(getgitenv(user, date) + 'git commit --allow-empty -a -F %s' % quote(filecomment))
    os.unlink(filecomment)

    # tag: the tags field may hold several whitespace-separated names; create
    # one git tag per name and skip hg's 'tip'
    for tagname in tag.split():
        if tagname != 'tip':
            os.system(getgitenv(user, date) + 'git tag %s' % quote(tagname))

    # delete branch if not used anymore...
    if mparent and hgchildren[rev]:
        print("Deleting unused branch: %s" % otherbranch)
        os.system('git branch -d %s' % otherbranch)

    # retrieve and record the version
    vvv = os.popen('git show --quiet --pretty=format:%H').read()
    print('record %s -> %s' % (cset, vvv))
    hgvers[rev] = vvv

# Repack once enough new changesets were converted; -1 disables repacking.
if hgnewcsets >= opt_nrepack and opt_nrepack != -1:
    os.system('git repack -a -d')

# write the state for incrementals
if state:
    if verbose:
        print('Writing state')
    # Binary mode plus a context manager: the pickle is flushed and closed
    # before the script ends.
    with open(state, 'wb') as f:
        pickle.dump(hgvers, f)

# vim: et ts=8 sw=4 sts=4