1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160
|
#!/usr/bin/python
#
# svn-fast-export.py
# ----------
# Walk through each revision of a local Subversion repository and export it
# in a stream that git-fast-import can consume.
#
# Author: Chris Lee <clee@kde.org>
# License: MIT <http://www.opensource.org/licenses/mit-license.php>
trunk_path = '/trunk/'
branches_path = '/branches/'
tags_path = '/tags/'
first_rev = 1
final_rev = 0
import sys, os.path
from optparse import OptionParser
from time import mktime, strptime
from svn.fs import svn_fs_file_length, svn_fs_file_contents, svn_fs_is_dir, svn_fs_revision_root, svn_fs_youngest_rev, svn_fs_revision_proplist, svn_fs_paths_changed
from svn.core import svn_pool_create, svn_pool_clear, svn_pool_destroy, svn_stream_for_stdout, svn_stream_copy, svn_stream_close, run_app
from svn.repos import svn_repos_open, svn_repos_fs
ct_short = ['M', 'A', 'D', 'R', 'X']
def dump_file_blob(root, full_path, pool):
stream_length = svn_fs_file_length(root, full_path, pool)
stream = svn_fs_file_contents(root, full_path, pool)
sys.stdout.write("data %s\n" % stream_length)
sys.stdout.flush()
ostream = svn_stream_for_stdout(pool)
svn_stream_copy(stream, ostream, pool)
svn_stream_close(ostream)
sys.stdout.write("\n")
def export_revision(rev, repo, fs, pool):
sys.stderr.write("Exporting revision %s... " % rev)
revpool = svn_pool_create(pool)
svn_pool_clear(revpool)
# Open a root object representing the youngest (HEAD) revision.
root = svn_fs_revision_root(fs, rev, revpool)
# And the list of what changed in this revision.
changes = svn_fs_paths_changed(root, revpool)
i = 1
marks = {}
file_changes = []
for path, change_type in changes.iteritems():
c_t = ct_short[change_type.change_kind]
if svn_fs_is_dir(root, path, revpool):
continue
if not path.startswith(trunk_path):
# We don't handle branches. Or tags. Yet.
pass
else:
if c_t == 'D':
file_changes.append("D %s" % path.replace(trunk_path, ''))
else:
marks[i] = path.replace(trunk_path, '')
file_changes.append("M 644 :%s %s" % (i, marks[i]))
sys.stdout.write("blob\nmark :%s\n" % i)
dump_file_blob(root, path, revpool)
i += 1
# Get the commit author and message
props = svn_fs_revision_proplist(fs, rev, revpool)
# Do the recursive crawl.
if props.has_key('svn:author'):
author = "%s <%s@localhost>" % (props['svn:author'], props['svn:author'])
else:
author = 'nobody <nobody@localhost>'
if len(file_changes) == 0:
svn_pool_destroy(revpool)
sys.stderr.write("skipping.\n")
return
svndate = props['svn:date'][0:-8]
commit_time = mktime(strptime(svndate, '%Y-%m-%dT%H:%M:%S'))
sys.stdout.write("commit refs/heads/master\n")
sys.stdout.write("committer %s %s -0000\n" % (author, int(commit_time)))
sys.stdout.write("data %s\n" % len(props['svn:log']))
sys.stdout.write(props['svn:log'])
sys.stdout.write("\n")
sys.stdout.write('\n'.join(file_changes))
sys.stdout.write("\n\n")
svn_pool_destroy(revpool)
sys.stderr.write("done!\n")
#if rev % 1000 == 0:
# sys.stderr.write("gc: %s objects\n" % len(gc.get_objects()))
# sleep(5)
def crawl_revisions(pool, repos_path):
"""Open the repository at REPOS_PATH, and recursively crawl all its
revisions."""
global final_rev
# Open the repository at REPOS_PATH, and get a reference to its
# versioning filesystem.
repos_obj = svn_repos_open(repos_path, pool)
fs_obj = svn_repos_fs(repos_obj)
# Query the current youngest revision.
youngest_rev = svn_fs_youngest_rev(fs_obj, pool)
first_rev = 1
if final_rev == 0:
final_rev = youngest_rev
for rev in xrange(first_rev, final_rev + 1):
export_revision(rev, repos_obj, fs_obj, pool)
if __name__ == '__main__':
usage = '%prog [options] REPOS_PATH'
parser = OptionParser()
parser.set_usage(usage)
parser.add_option('-f', '--final-rev', help='Final revision to import',
dest='final_rev', metavar='FINAL_REV', type='int')
parser.add_option('-t', '--trunk-path', help='Path in repo to /trunk',
dest='trunk_path', metavar='TRUNK_PATH')
parser.add_option('-b', '--branches-path', help='Path in repo to /branches',
dest='branches_path', metavar='BRANCHES_PATH')
parser.add_option('-T', '--tags-path', help='Path in repo to /tags',
dest='tags_path', metavar='TAGS_PATH')
(options, args) = parser.parse_args()
if options.trunk_path != None:
trunk_path = options.trunk_path
if options.branches_path != None:
branches_path = options.branches_path
if options.tags_path != None:
tags_path = options.tags_path
if options.final_rev != None:
final_rev = options.final_rev
if len(args) != 1:
parser.print_help()
sys.exit(2)
# Canonicalize (enough for Subversion, at least) the repository path.
repos_path = os.path.normpath(args[0])
if repos_path == '.':
repos_path = ''
# Call the app-wrapper, which takes care of APR initialization/shutdown
# and the creation and cleanup of our top-level memory pool.
run_app(crawl_revisions, repos_path)
|