Created
August 26, 2008 21:40
-
-
Save sr/7358 to your computer and use it in GitHub Desktop.
make a git mirror of an hg repository
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#! /usr/bin/python | |
""" hg-to-git.py - A Mercurial to GIT converter | |
Copyright (C)2007 Stelian Pop <[email protected]> | |
This program is free software; you can redistribute it and/or modify | |
it under the terms of the GNU General Public License as published by | |
the Free Software Foundation; either version 2, or (at your option) | |
any later version. | |
This program is distributed in the hope that it will be useful, | |
but WITHOUT ANY WARRANTY; without even the implied warranty of | |
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
GNU General Public License for more details. | |
You should have received a copy of the GNU General Public License | |
along with this program; if not, write to the Free Software | |
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. | |
""" | |
import os, os.path, sys | |
import tempfile, popen2, pickle, getopt | |
import re | |
# Maps hg version -> git version | |
hgvers = {} | |
# List of children for each hg revision | |
hgchildren = {} | |
# List of parents for each hg revision | |
hgparents = {} | |
# Current branch for each hg revision | |
hgbranch = {} | |
# Number of new changesets converted from hg | |
hgnewcsets = 0 | |
#------------------------------------------------------------------------------ | |
def usage(): | |
print """\ | |
%s: [OPTIONS] <hgprj> | |
options: | |
-s, --gitstate=FILE: name of the state to be saved/read | |
for incrementals | |
-n, --nrepack=INT: number of changesets that will trigger | |
a repack (default=0, -1 to deactivate) | |
-v, --verbose: be verbose | |
required: | |
hgprj: name of the HG project to import (directory) | |
""" % sys.argv[0] | |
#------------------------------------------------------------------------------ | |
def getgitenv(user, date): | |
env = '' | |
elems = re.compile('(.*?)\s+<(.*)>').match(user) | |
if elems: | |
env += 'export GIT_AUTHOR_NAME="%s" ;' % elems.group(1) | |
#env += 'export GIT_COMMITER_NAME="%s" ;' % elems.group(1) | |
env += 'export GIT_AUTHOR_EMAIL="%s" ;' % elems.group(2) | |
#env += 'export GIT_COMMITER_EMAIL="%s" ;' % elems.group(2) | |
else: | |
env += 'export GIT_AUTHOR_NAME="%s" ;' % user | |
#env += 'export GIT_COMMITER_NAME="%s" ;' % user | |
env += 'export GIT_AUTHOR_EMAIL= ;' | |
#env += 'export GIT_COMMITER_EMAIL= ;' | |
env += 'export GIT_AUTHOR_DATE="%s" ;' % date | |
#env += 'export GIT_COMMITTER_DATE="%s" ;' % date | |
return env | |
#------------------------------------------------------------------------------ | |
state = '' | |
opt_nrepack = 0 | |
verbose = False | |
try: | |
opts, args = getopt.getopt(sys.argv[1:], 's:t:n:v', ['gitstate=', 'tempdir=', 'nrepack=', 'verbose']) | |
for o, a in opts: | |
if o in ('-s', '--gitstate'): | |
state = a | |
state = os.path.abspath(state) | |
if o in ('-n', '--nrepack'): | |
opt_nrepack = int(a) | |
if o in ('-v', '--verbose'): | |
verbose = True | |
if len(args) != 1: | |
raise Exception('params') | |
except: | |
usage() | |
sys.exit(1) | |
hgprj = args[0] | |
os.chdir(hgprj) | |
if state: | |
if os.path.exists(state): | |
if verbose: | |
print 'State does exist, reading' | |
f = open(state, 'r') | |
hgvers = pickle.load(f) | |
else: | |
print 'State does not exist, first run' | |
sock = os.popen('hg tip --template "{rev}"') | |
tip = sock.read() | |
if sock.close(): | |
sys.exit(1) | |
if verbose: | |
print 'tip is', tip | |
# Calculate the branches | |
if verbose: | |
print 'analysing the branches...' | |
hgchildren["0"] = () | |
hgparents["0"] = (None, None) | |
hgbranch["0"] = "master" | |
for cset in range(1, int(tip) + 1): | |
hgchildren[str(cset)] = () | |
prnts = os.popen('hg log -r %d --template "{parents}"' % cset).read().strip().split(' ') | |
prnts = map(lambda x: x[:x.find(':')], prnts) | |
if prnts[0] != '': | |
parent = prnts[0].strip() | |
else: | |
parent = str(cset - 1) | |
hgchildren[parent] += ( str(cset), ) | |
if len(prnts) > 1: | |
mparent = prnts[1].strip() | |
hgchildren[mparent] += ( str(cset), ) | |
else: | |
mparent = None | |
hgparents[str(cset)] = (parent, mparent) | |
if mparent: | |
# For merge changesets, take either one, preferably the 'master' branch | |
if hgbranch[mparent] == 'master': | |
hgbranch[str(cset)] = 'master' | |
else: | |
hgbranch[str(cset)] = hgbranch[parent] | |
else: | |
# Normal changesets | |
# For first children, take the parent branch, for the others create a new branch | |
if hgchildren[parent][0] == str(cset): | |
hgbranch[str(cset)] = hgbranch[parent] | |
else: | |
hgbranch[str(cset)] = "branch-" + str(cset) | |
if not hgvers.has_key("0"): | |
print 'creating repository' | |
os.system('git init') | |
# loop through every hg changeset | |
for cset in range(int(tip) + 1): | |
# incremental, already seen | |
if hgvers.has_key(str(cset)): | |
continue | |
hgnewcsets += 1 | |
# get info | |
log_data = os.popen('hg log -r %d --template "{tags}\n{date|date}\n{author}\n"' % cset).readlines() | |
tag = log_data[0].strip() | |
date = log_data[1].strip() | |
user = log_data[2].strip() | |
parent = hgparents[str(cset)][0] | |
mparent = hgparents[str(cset)][1] | |
#get comment | |
(fdcomment, filecomment) = tempfile.mkstemp() | |
csetcomment = os.popen('hg log -r %d --template "{desc}"' % cset).read().strip() | |
os.write(fdcomment, csetcomment) | |
os.close(fdcomment) | |
print '-----------------------------------------' | |
print 'cset:', cset | |
print 'branch:', hgbranch[str(cset)] | |
print 'user:', user | |
print 'date:', date | |
print 'comment:', csetcomment | |
if parent: | |
print 'parent:', parent | |
if mparent: | |
print 'mparent:', mparent | |
if tag: | |
print 'tag:', tag | |
print '-----------------------------------------' | |
# checkout the parent if necessary | |
if cset != 0: | |
if hgbranch[str(cset)] == "branch-" + str(cset): | |
print 'creating new branch', hgbranch[str(cset)] | |
os.system('git checkout -b %s %s' % (hgbranch[str(cset)], hgvers[parent])) | |
else: | |
print 'checking out branch', hgbranch[str(cset)] | |
os.system('git checkout %s' % hgbranch[str(cset)]) | |
# merge | |
if mparent: | |
if hgbranch[parent] == hgbranch[str(cset)]: | |
otherbranch = hgbranch[mparent] | |
else: | |
otherbranch = hgbranch[parent] | |
print 'merging', otherbranch, 'into', hgbranch[str(cset)] | |
os.system(getgitenv(user, date) + 'git merge --no-commit -s ours "" %s %s' % (hgbranch[str(cset)], otherbranch)) | |
# remove everything except .git and .hg directories | |
os.system('find . \( -path "./.hg" -o -path "./.git" \) -prune -o ! -name "." -print | xargs rm -rf') | |
# repopulate with checkouted files | |
os.system('hg update -C %d' % cset) | |
# add new files | |
os.system('git ls-files -x .hg --others | git update-index --add --stdin') | |
# delete removed files | |
os.system('git ls-files -x .hg --deleted | git update-index --remove --stdin') | |
# commit | |
os.system(getgitenv(user, date) + 'git commit --allow-empty -a -F %s' % filecomment) | |
os.unlink(filecomment) | |
# tag | |
if tag and tag != 'tip': | |
os.system(getgitenv(user, date) + 'git tag %s' % tag) | |
# delete branch if not used anymore... | |
if mparent and len(hgchildren[str(cset)]): | |
print "Deleting unused branch:", otherbranch | |
os.system('git branch -d %s' % otherbranch) | |
# retrieve and record the version | |
vvv = os.popen('git show --quiet --pretty=format:%H').read() | |
print 'record', cset, '->', vvv | |
hgvers[str(cset)] = vvv | |
if hgnewcsets >= opt_nrepack and opt_nrepack != -1: | |
os.system('git repack -a -d') | |
# write the state for incrementals | |
if state: | |
if verbose: | |
print 'Writing state' | |
f = open(state, 'w') | |
pickle.dump(hgvers, f) | |
# vim: et ts=8 sw=4 sts=4 |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
RemoteHgRepository = 'http://code.suckless.org/hg/dwm' | |
RemoteGitRepository = '[email protected]:sr/dwm.git' | |
__DIR__ = File.dirname(__FILE__) | |
Repository = __DIR__ + '/dwm' | |
GitRepository = __DIR__ + '/dwm-git' | |
StateFile = __DIR__ + '/hg-to-git-state' | |
ImportScript = __DIR__ + '/hg-to-git.py' | |
task :default => :mirror | |
desc 'make a git mirror of an hg repo' | |
task :mirror => 'git-mirror:git:push' | |
namespace :"git-mirror" do | |
task :redo => [:wipe, 'git:push'] | |
task :wipe do | |
rm_rf Repository + '/.git' if File.directory?(Repository + '/.git') | |
rm_rf GitRepository if File.directory?(GitRepository) | |
rm_rf Repository if File.directory?(Repository) | |
rm StateFile if File.file?(StateFile) | |
end | |
namespace :git do | |
task :push => :pull do | |
Dir.chdir(GitRepository) do | |
sh "git push #{RemoteGitRepository} master" | |
end | |
end | |
task :pull => :clone do | |
Dir.chdir(GitRepository) do | |
sh 'git fetch origin' | |
sh 'git rebase origin/master' | |
end | |
end | |
task :clone => :import do | |
sh "git clone #{Repository} #{GitRepository}" unless File.directory?(GitRepository + '/.git') | |
end | |
task :import => 'hg:pull' do | |
sh "python #{ImportScript} -v --gitstate=#{StateFile} #{Repository}" | |
end | |
end | |
namespace :hg do | |
task :clone do | |
sh "hg clone #{RemoteHgRepository}" unless File.directory?(Repository + '/.hg') | |
end | |
task :pull => :clone do | |
Dir.chdir(Repository) { sh 'hg pull' } | |
end | |
end | |
end |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment