2 Replicate (replay) changesets from one SVN repository to another.
5 from .. import base_version
, full_version
7 from .. import svnclient
8 from ..shell
import run_svn
9 from ..errors
import (ExternalCommandFailed
, UnsupportedSVNAction
, InternalError
, VerificationError
)
10 from parse
import HelpFormatter
19 from datetime
import datetime
_valid_svn_actions = "MARD"   # The list of known SVN action abbr's, from "svn log"

# Module-level variables/parameters
source_url = ""          # URL to source path in source SVN repo, e.g. 'http://server/svn/source/trunk'
source_repos_url = ""    # URL to root of source SVN repo, e.g. 'http://server/svn/source'
source_base = ""         # Relative path of source_url in source SVN repo, e.g. '/trunk'
source_repos_uuid = ""   # UUID of source SVN repo
target_url = ""          # URL to target path in target SVN repo, e.g. 'file:///svn/repo_target/trunk'
rev_map = {}             # The running mapping-table dictionary for source_url rev #'s -> target_url rev #'s

def commit_from_svn_log_entry(log_entry, options, commit_paths=None, target_revprops=None):
    """
    Given an SVN log entry and an optional list of changed paths, do an svn commit.

    'log_entry' is the source log entry; its 'date', 'message', 'author' and
      'revprops' values are used to build the commit.
    'options' supplies 'keep_author' (pass the source author via --username instead
      of appending an "Author:" line to the message) and 'dry_run' (build the
      command but don't run it).
    'commit_paths' is an optional collection of working-copy paths to commit.
    'target_revprops' is an optional list of {'name': ..., 'value': ...} dicts
      to set as extra revprops on the commit.

    Returns the revision scraped from the "svn commit" output, or None if no
    "Committed revision" line was seen (e.g. dry-run or nothing to commit).
    """
    # TODO: Run optional external shell hook here, for doing pre-commit filtering
    # Display the _wc_target "svn status" info if running in -vv (or higher) mode
    if ui.get_level() >= ui.EXTRA:
        ui.status(">> commit_from_svn_log_entry: Pre-commit _wc_target status:", level=ui.EXTRA, color='CYAN')
        ui.status(run_svn(["status"]), level=ui.EXTRA, color='CYAN')
    # This will use the local timezone for displaying commit times
    timestamp = int(log_entry['date'])
    svn_date = str(datetime.fromtimestamp(timestamp))
    # Uncomment this one if you prefer UTC commit times
    #svn_date = "%d 0" % timestamp
    args = ["commit", "--force-log"]
    if options.keep_author:
        args += ["-m", log_entry['message'] + "\nDate: " + svn_date, "--username", log_entry['author']]
    else:
        args += ["-m", log_entry['message'] + "\nDate: " + svn_date + "\nAuthor: " + log_entry['author']]
    revprops = {}
    # Carry forward any revprop's from the source revision
    for v in (log_entry['revprops'] or []):
        revprops[v['name']] = v['value']
    # Add any extra revprop's we want to set for the target repo commits.
    # These are applied last, so they win over a same-named source revprop.
    for v in (target_revprops or []):
        revprops[v['name']] = v['value']
    for key in revprops:
        args += ["--with-revprop", "%s=%s" % (key, str(revprops[key]))]
    if commit_paths and len(commit_paths) < 100:
        # If we don't have an excessive amount of individual changed paths, pass
        # those to the "svn commit" command. Else, pass nothing so we commit at
        # the root of the working-copy.
        args += list(commit_paths)
    rev = None
    if not options.dry_run:
        # Run the "svn commit" command, and screen-scrape the target_rev value (if any)
        output = run_svn(args)
        if output:
            marker = 'Committed revision '
            for line in output.strip("\n").split("\n"):
                if line.startswith(marker):
                    rev = line[len(marker):].rstrip('.')
                    break
        if rev:
            ui.status("Committed revision %s.", rev)
    return rev

def full_svn_revert():
    """
    Do an "svn revert" and proactively remove any extra files in the working copy.

    Operates on the current working directory: reverts recursively, then deletes
    every path that "svn status" still reports as unversioned ("?").
    """
    run_svn(["revert", "--recursive", "."])
    output = run_svn(["status"])
    if not output:
        return
    for line in output.strip("\n").split("\n"):
        # startswith() rather than line[0], so an empty line can't raise IndexError
        if not line.startswith("?"):
            continue
        path = line[4:].strip(" ")
        if os.path.isfile(path):
            os.remove(path)
        if os.path.isdir(path):
            shutil.rmtree(path)

def gen_tracking_revprops(source_rev):
    """
    Build an array of svn2svn-specific source-tracking revprops.

    'source_rev' is the source-repo revision being replayed. The source UUID and
    URL are taken from the module-level source_repos_uuid / source_url values.

    Returns a list of {'name': ..., 'value': ...} dicts.
    """
    revprops = [{'name':'svn2svn:source_uuid', 'value':source_repos_uuid},
                {'name':'svn2svn:source_url',  'value':source_url},
                {'name':'svn2svn:source_rev',  'value':source_rev}]
    return revprops

def in_svn(p, require_in_repo=False, prefix=""):
    """
    Check if a given file/folder is being tracked by Subversion.
    Prior to SVN 1.6, we could "cheat" and look for the existence of ".svn" directories.
    With SVN 1.7 and beyond, WC-NG means only a single top-level ".svn" at the root of the working-copy.
    Use "svn status" to check the status of the file/folder.

    'p' is the working-copy path to check.
    'require_in_repo' makes locally-added (not yet committed) paths count as untracked.
    'prefix' is prepended to the debug status message.

    Returns True if the path is considered under source-control, else False.
    """
    entries = svnclient.get_svn_status(p, no_recursive=True)
    if not entries:
        return False
    d = entries[0]
    if require_in_repo and (d['status'] == 'added' or d['revision'] is None):
        # If caller requires this path to be in the SVN repo, prevent returning True
        # for paths that are only locally-added.
        ret = False
    else:
        # Don't consider files tracked as deleted in the WC as under source-control.
        # Consider files which are locally added/copied as under source-control.
        ret = d['status'] != 'deleted' and \
              (d['type'] == 'normal' or d['status'] == 'added' or d['copied'] == 'true')
    ui.status(prefix + ">> in_svn('%s', require_in_repo=%s) --> %s", p, str(require_in_repo), str(ret), level=ui.DEBUG, color='GREEN')
    return ret

def find_svn_ancestors(svn_repos_url, base_path, source_path, source_rev, prefix = ""):
    """
    Given a source path, walk the SVN history backwards to inspect the ancestry of
    that path, seeing if it traces back to base_path.  Build an array of copyfrom_path
    and copyfrom_revision pairs for each of the "svn copies". If we find a copyfrom_path
    which base_path is a substring match of (e.g. we crawled back to the initial branch-
    copy from trunk), then return the collection of ancestor paths.  Otherwise,
    copyfrom_path has no ancestry compared to base_path.

    This is useful when comparing "trunk" vs. "branch" paths, to handle cases where a
    file/folder was renamed in a branch and then that branch was merged back to trunk.

    'svn_repos_url' is the full URL to the root of the SVN repository,
      e.g. 'file:///path/to/repo'
    'base_path' is the path in the SVN repo to the target path we're trying to
      trace ancestry back to, e.g. 'trunk'.
    'source_path' is the path in the SVN repo to the source path to start checking
      ancestry at, e.g. 'branches/fix1/projectA/file1.txt'.
      (full_path = svn_repos_url+base_path+"/"+path_offset)
    'source_rev' is the revision to start walking the history of source_path backwards from.
    'prefix' is prepended to the debug status messages.

    Returns a list of {'path': ..., 'revision': ...} dicts, starting with the
    source path itself and ending with the oldest ancestor found, or an empty
    list if no copy-from chain was found.
    """
    ui.status(prefix + ">> find_svn_ancestors: Start: (%s) source_path: %s base_path: %s",
        svn_repos_url, source_path+"@"+str(source_rev), base_path, level=ui.DEBUG, color='YELLOW')
    done = False
    working_path = base_path+"/"+source_path
    working_rev = source_rev
    first_iter_done = False
    ancestors_temp = []
    while not done:
        # Get the first "svn log" entry for this path (relative to @rev)
        ui.status(prefix + ">> find_svn_ancestors: %s", svn_repos_url + working_path+"@"+str(working_rev), level=ui.DEBUG, color='YELLOW')
        log_entry = svnclient.get_first_svn_log_entry(svn_repos_url + working_path+"@"+str(working_rev), 1, working_rev, True)
        if not log_entry:
            ui.status(prefix + ">> find_svn_ancestors: Done: no log_entry", level=ui.DEBUG, color='YELLOW')
            break
        # If we found a copy-from case which matches our base_path, we're done.
        # ...but only if we've at least tried to search for the first copy-from path.
        if first_iter_done and working_path.startswith(base_path):
            ui.status(prefix + ">> find_svn_ancestors: Done: Found working_path.startswith(base_path) and first_iter_done=True", level=ui.DEBUG, color='YELLOW')
            break
        first_iter_done = True
        # Search for any actions on our target path (or parent paths).
        changed_paths_temp = []
        for d in log_entry['changed_paths']:
            path = d['path']
            if path in working_path:
                changed_paths_temp.append({'path': path, 'data': d})
        if not changed_paths_temp:
            # If no matches, then we've hit the end of the chain and this path has no ancestry back to base_path.
            ui.status(prefix + ">> find_svn_ancestors: Done: No matching changed_paths", level=ui.DEBUG, color='YELLOW')
            break
        # Reverse-sort any matches, so that we start with the most-granular (deepest in the tree) path.
        changed_paths = sorted(changed_paths_temp, key=operator.itemgetter('path'), reverse=True)
        # Find the action for our working_path in this revision. Use a loop to check in reverse order,
        # so that we cope if the target file/folder is "M" but has a parent folder with an "A" copy-from.
        for v in changed_paths:
            d = v['data']
            path = v['path']
            # Check action-type for this file
            action = d['action']
            if action not in _valid_svn_actions:
                raise UnsupportedSVNAction("In SVN rev. %d: action '%s' not supported. Please report a bug!"
                    % (log_entry['revision'], action))
            ui.status(prefix + "> %s %s%s", action, path,
                (" (from %s)" % (d['copyfrom_path']+"@"+str(d['copyfrom_revision']))) if d['copyfrom_path'] else "",
                level=ui.DEBUG, color='YELLOW')
            if action == 'D':
                # If file/folder was deleted, it has no ancestor
                ancestors_temp = []
                ui.status(prefix + ">> find_svn_ancestors: Done: deleted", level=ui.DEBUG, color='YELLOW')
                done = True
                break
            if action in 'RA':
                # If file/folder was added/replaced but not a copy, it has no ancestor
                if not d['copyfrom_path']:
                    ancestors_temp = []
                    ui.status(prefix + ">> find_svn_ancestors: Done: %s with no copyfrom_path",
                        "Added" if action == "A" else "Replaced",
                        level=ui.DEBUG, color='YELLOW')
                    done = True
                    break
                # Else, file/folder was added/replaced and is a copy, so add an entry to our ancestors list
                # and keep checking for ancestors
                ui.status(prefix + ">> find_svn_ancestors: Found copy-from (action=%s): %s --> %s",
                    action, path, d['copyfrom_path']+"@"+str(d['copyfrom_revision']),
                    level=ui.DEBUG, color='YELLOW')
                ancestors_temp.append({'path': path, 'revision': log_entry['revision'],
                                       'copyfrom_path': d['copyfrom_path'], 'copyfrom_rev': d['copyfrom_revision']})
                working_path = working_path.replace(d['path'], d['copyfrom_path'])
                working_rev = d['copyfrom_revision']
                # Follow the copy and keep on searching
                break
    ancestors = []
    if ancestors_temp:
        # Replay the collected copy-from hops, starting from the original source path,
        # to get the full path@rev of each ancestor.
        ancestors.append({'path': base_path+"/"+source_path, 'revision': source_rev})
        working_path = base_path+"/"+source_path
        for d in ancestors_temp:
            working_path = working_path.replace(d['path'], d['copyfrom_path'])
            working_rev = d['copyfrom_rev']
            ancestors.append({'path': working_path, 'revision': working_rev})
        if ui.get_level() >= ui.DEBUG:
            max_len = 0
            for d in ancestors:
                max_len = max(max_len, len(d['path']+"@"+str(d['revision'])))
            ui.status(prefix + ">> find_svn_ancestors: Found parent ancestors:", level=ui.DEBUG, color='YELLOW_B')
            for idx in range(len(ancestors)-1):
                d = ancestors[idx]
                d_next = ancestors[idx+1]
                ui.status(prefix + " [%s] %s <-- %s", idx,
                    str(d['path']+"@"+str(d['revision'])).ljust(max_len),
                    str(d_next['path']+"@"+str(d_next['revision'])).ljust(max_len),
                    level=ui.DEBUG, color='YELLOW')
    else:
        ui.status(prefix + ">> find_svn_ancestors: No ancestor-chain found: %s",
            svn_repos_url+base_path+"/"+source_path+"@"+str(source_rev), level=ui.DEBUG, color='YELLOW')
    return ancestors

def get_rev_map(source_rev, prefix):
    """
    Find the equivalent rev # in the target repo for the given rev # from the source repo.

    'source_rev' is the source-repo revision to look up.
    'prefix' is prepended to the debug status messages.

    Returns the target rev # (int) mapped from the highest source rev # which is
    less-than-or-equal-to source_rev, or None if rev_map has no such entry.
    """
    ui.status(prefix + ">> get_rev_map(%s)", source_rev, level=ui.DEBUG, color='GREEN')
    # Find the highest entry less-than-or-equal-to source_rev
    for rev in range(int(source_rev), 0, -1):
        ui.status(prefix + ">> get_rev_map: rev=%s in_rev_map=%s", rev, str(rev in rev_map), level=ui.DEBUG, color='BLACK_B')
        if rev in rev_map:
            return int(rev_map[rev])
    # Else, we fell off the bottom of the rev_map. Ruh-roh...
    return None

def set_rev_map(source_rev, target_rev):
    """
    Record in rev_map that source_rev (source repo) was replayed as target_rev (target repo).

    Both values are stored as ints.
    """
    ui.status(">> set_rev_map: source_rev=%s target_rev=%s", source_rev, target_rev, level=ui.DEBUG, color='GREEN')
    rev_map[int(source_rev)] = int(target_rev)

def build_rev_map(target_url, source_info):
    """
    Check for any already-replayed history from source_url (source_info) and
    build the mapping-table of source_rev -> target_rev.

    'target_url' is the target URL whose log is scanned for svn2svn:* revprops.
    'source_info' supplies the 'repos_uuid' and 'url' values which a target
      revision's tracking revprops must match to be counted.
    """
    # Start from an empty table, so stale entries can't survive a rebuild.
    rev_map.clear()
    ui.status("Rebuilding rev_map...", level=ui.VERBOSE)
    it_log_entries = svnclient.iter_svn_log_entries(target_url, 1, 'HEAD', get_changed_paths=False, get_revprops=True)
    for log_entry in it_log_entries:
        if not log_entry['revprops']:
            continue
        revprops = {}
        for v in log_entry['revprops']:
            if v['name'].startswith('svn2svn:'):
                revprops[v['name']] = v['value']
        # Only trust complete tracking info; .get() means a revision carrying just
        # some of the svn2svn:* revprops is skipped rather than raising KeyError.
        if 'svn2svn:source_rev' in revprops and \
           revprops.get('svn2svn:source_uuid') == source_info['repos_uuid'] and \
           revprops.get('svn2svn:source_url') == source_info['url']:
            source_rev = revprops['svn2svn:source_rev']
            target_rev = log_entry['revision']
            set_rev_map(source_rev, target_rev)

def get_svn_dirlist(svn_path, svn_rev = ""):
    """
    Get a list of the child contents of the given folder path, via "svn list".

    'svn_path' is the working-copy path or URL to list.
    'svn_rev' is an optional revision; when given it is used both as the
      operative revision ("-r") and as the peg revision ("@rev").

    Returns a list of entry names (callers treat a trailing "/" as marking a
    directory), or an empty list if the command produced no usable output.
    """
    args = ["list"]
    path = svn_path
    if svn_rev:
        args += ["-r", svn_rev]
        path += "@"+str(svn_rev)
    args += [path]
    # no_fail: a failed listing yields an empty result rather than an exception
    # NOTE(review): exact no_fail semantics live in shell.run_svn -- confirm.
    paths = run_svn(args, no_fail=True)
    paths = paths.strip("\n").split("\n") if len(paths)>1 else []
    return paths

def path_in_list(paths, path):
    """
    Check whether 'path' is covered by any entry in 'paths'.

    An entry covers 'path' when 'path' starts with that entry (plain string
    prefix match), so a parent folder in the list covers all of its children.
    """
    return any(path.startswith(p) for p in paths)

def add_path(paths, path):
    """
    Append 'path' to the 'paths' list, unless it is already covered by an
    existing entry (see path_in_list). Modifies 'paths' in place.
    """
    if not path_in_list(paths, path):
        paths.append(path)

def do_svn_add(path_offset, source_rev, parent_copyfrom_path="", parent_copyfrom_rev="", \
               export_paths=None, is_dir = False, prefix = ""):
    """
    Given the add'd source path, replay the "svn add/copy" commands to correctly
    track renames across copy-from's.

    For example, consider a sequence of events like this:
    1. svn copy /trunk /branches/fix1
    2. (Make some changes on /branches/fix1)
    3. svn mv /branches/fix1/Proj1 /branches/fix1/Proj2  # Rename folder
    4. svn mv /branches/fix1/Proj2/file1.txt /branches/fix1/Proj2/file2.txt  # Rename file inside renamed folder
    5. svn co /trunk && svn merge /branches/fix1
    After the merge and commit, "svn log -v" will show a delete of /trunk/Proj1
    and an add of /trunk/Proj2 copy-from /branches/fix1/Proj2. If we were just
    to do a straight "svn export+add" based on the /branches/fix1/Proj2 folder,
    we'd lose the logical history that Proj2/file2.txt is really a descendant
    of Proj1/file1.txt.

    'path_offset' is the offset from source_base to the file to check ancestry for,
      e.g. 'projectA/file1.txt'. path = source_repos_url + source_base + path_offset.
    'source_rev' is the revision ("svn log") that we're processing from the source repo.
    'parent_copyfrom_path' and 'parent_copyfrom_rev' is the copy-from path of the parent
      directory, when being called recursively by do_svn_add_dir().
    'export_paths' is the list of path_offset's that we've deferred running "svn export" on.
      It is appended to in place; if omitted, a fresh list is used.
    'is_dir' is whether path_offset is a directory (rather than a file).
    'prefix' is prepended to the debug status messages.
    """
    if export_paths is None:
        # A shared mutable default would leak state between calls (and the old
        # default was a dict, which add_path() cannot append to).
        export_paths = []
    ui.status(prefix + ">> do_svn_add: %s %s", source_base+"/"+path_offset+"@"+str(source_rev),
        " (parent-copyfrom: "+parent_copyfrom_path+"@"+str(parent_copyfrom_rev)+")" if parent_copyfrom_path else "",
        level=ui.DEBUG, color='GREEN')
    # Check if the given path has ancestors which chain back to the current source_base
    found_ancestor = False
    tgt_rev = None
    ancestors = find_svn_ancestors(source_repos_url, source_base, path_offset, source_rev, prefix+" ")
    # ancestors[n] is the original (pre-branch-copy) trunk path.
    # ancestors[n-1] is the first commit on the new branch.
    copyfrom_path = ancestors[-1]['path'] if ancestors else ""
    copyfrom_rev = ancestors[-1]['revision'] if ancestors else ""
    if ancestors:
        # The copy-from path has ancestry back to source_url.
        ui.status(prefix + ">> do_svn_add: Check copy-from: Found parent: %s", copyfrom_path+"@"+str(copyfrom_rev),
            level=ui.DEBUG, color='GREEN', bold=True)
        found_ancestor = True
        # Map the copyfrom_rev (source repo) to the equivalent target repo rev #. This can
        # return None in the case where copyfrom_rev is *before* our source_start_rev.
        tgt_rev = get_rev_map(copyfrom_rev, prefix+" ")
        ui.status(prefix + ">> do_svn_add: get_rev_map: %s (source) -> %s (target)", copyfrom_rev, tgt_rev, level=ui.DEBUG, color='GREEN')
    else:
        ui.status(prefix + ">> do_svn_add: Check copy-from: No ancestor chain found.", level=ui.DEBUG, color='GREEN')
        found_ancestor = False
    if found_ancestor and tgt_rev:
        # Check if this path_offset in the target WC already has this ancestry, in which
        # case there's no need to run the "svn copy" (again).
        path_in_svn = in_svn(path_offset, prefix=prefix+" ")
        log_entry = svnclient.get_last_svn_log_entry(path_offset, 1, 'HEAD', get_changed_paths=False) if in_svn(path_offset, require_in_repo=True, prefix=prefix+" ") else []
        if (not log_entry or (log_entry['revision'] != tgt_rev)):
            copyfrom_offset = copyfrom_path[len(source_base):].strip('/')
            ui.status(prefix + ">> do_svn_add: svn_copy: Copy-from: %s", copyfrom_path+"@"+str(copyfrom_rev), level=ui.DEBUG, color='GREEN')
            ui.status(prefix + " copyfrom: %s", copyfrom_path+"@"+str(copyfrom_rev), level=ui.DEBUG, color='GREEN')
            ui.status(prefix + " p_copyfrom: %s", parent_copyfrom_path+"@"+str(parent_copyfrom_rev) if parent_copyfrom_path else "", level=ui.DEBUG, color='GREEN')
            # NOTE(review): the leading "path_in_svn" operand was missing from the
            # extracted text and is reconstructed -- confirm against upstream.
            if path_in_svn and \
               ((parent_copyfrom_path and copyfrom_path.startswith(parent_copyfrom_path)) and \
                (parent_copyfrom_rev and copyfrom_rev == parent_copyfrom_rev)):
                # When being called recursively, if this child entry has the same ancestor as
                # the parent, then no need to try to run another "svn copy".
                ui.status(prefix + ">> do_svn_add: svn_copy: Same ancestry as parent: %s",
                    parent_copyfrom_path+"@"+str(parent_copyfrom_rev),level=ui.DEBUG, color='GREEN')
            else:
                # Copy this path from the equivalent path+rev in the target repo, to create the
                # equivalent history.
                if parent_copyfrom_path:
                    # If we have a parent copy-from path, we mis-match that so display a status
                    # message describing the action we're mimic'ing. If path_in_svn, then this
                    # is logically a "replace" rather than an "add".
                    ui.status(" %s %s (from %s)", ('R' if path_in_svn else 'A'), source_base+"/"+path_offset, ancestors[1]['path']+"@"+str(copyfrom_rev), level=ui.VERBOSE)
                if path_in_svn:
                    # If local file is already under version-control, then this is a replace.
                    ui.status(prefix + ">> do_svn_add: pre-copy: local path already exists: %s", path_offset, level=ui.DEBUG, color='GREEN')
                    run_svn(["remove", "--force", path_offset])
                run_svn(["copy", "-r", tgt_rev, target_url+"/"+copyfrom_offset+"@"+str(tgt_rev), path_offset])
                # Export the final version of this file/folder from the source repo, to make
                # sure we're up-to-date.
                add_path(export_paths, path_offset)
        else:
            ui.status(prefix + ">> do_svn_add: Skipped 'svn copy': %s", path_offset, level=ui.DEBUG, color='GREEN')
    else:
        # Else, either this copy-from path has no ancestry back to source_url OR copyfrom_rev comes
        # before our initial source_start_rev (i.e. tgt_rev == None), so can't do a "svn copy".
        # Create (parent) directory if needed.
        # TODO: This is (nearly) a duplicate of code in process_svn_log_entry(). Should this be
        #       split-out to a shared tag?
        p_path = path_offset if is_dir else os.path.dirname(path_offset).strip() or '.'
        if not os.path.exists(p_path):
            run_svn(["mkdir", p_path])
        if not in_svn(path_offset, prefix=prefix+" "):
            if is_dir:
                # Export the final version of all files in this folder.
                add_path(export_paths, path_offset)
            else:
                # Export the final version of this file. We *need* to do this before running
                # the "svn add", even if we end-up re-exporting this file again via export_paths.
                run_svn(["export", "--force", "-r", source_rev,
                         source_repos_url+source_base+"/"+path_offset+"@"+str(source_rev), path_offset])
            # If not already under version-control, then "svn add" this file/folder.
            run_svn(["add", "--parents", path_offset])
        # TODO: Need to copy SVN properties from source repos
    if is_dir:
        # For any folders that we process, process any child contents, so that we correctly
        # replay copies/replaces/etc.
        do_svn_add_dir(path_offset, source_rev, copyfrom_path, copyfrom_rev, export_paths, prefix+" ")

def do_svn_add_dir(path_offset, source_rev, parent_copyfrom_path, parent_copyfrom_rev, \
                   export_paths, prefix=""):
    """
    Replay the child contents of an add'd directory.

    Compares the listing of the local working-copy folder against the listing of
    the same folder in the source repo at source_rev: each remote child is run
    through do_svn_add(), and each local child not present remotely is "svn remove"d.

    'path_offset' is the offset from source_base to the directory being processed.
    'source_rev' is the source-repo revision being replayed.
    'parent_copyfrom_path' and 'parent_copyfrom_rev' are passed through to
      do_svn_add() for each child.
    'export_paths' is the list of deferred "svn export" path_offset's.
    'prefix' is prepended to the debug status messages.
    """
    # Get the directory contents, to compare between the local WC (target_url) vs. the remote repo (source_url)
    # TODO: paths_local won't include add'd paths because "svn ls" lists the contents of the
    #       associated remote repo folder. (Is this a problem?)
    paths_local = get_svn_dirlist(path_offset)
    paths_remote = get_svn_dirlist(source_url+"/"+path_offset, source_rev)
    ui.status(prefix + ">> do_svn_add_dir: paths_local: %s", str(paths_local), level=ui.DEBUG, color='GREEN')
    ui.status(prefix + ">> do_svn_add_dir: paths_remote: %s", str(paths_remote), level=ui.DEBUG, color='GREEN')
    # Update files/folders which exist in remote but not local
    for path in paths_remote:
        # Directories have a trailing slash in the listing
        path_is_dir = path[-1] == "/"
        working_path = path_offset+"/"+(path.rstrip('/') if path_is_dir else path)
        do_svn_add(working_path, source_rev, parent_copyfrom_path, parent_copyfrom_rev,
                   export_paths, path_is_dir, prefix+" ")
    # Remove files/folders which exist in local but not remote
    for path in paths_local:
        if path not in paths_remote:
            ui.status(" %s %s", 'D', source_base+"/"+path_offset+"/"+path, level=ui.VERBOSE)
            run_svn(["remove", "--force", path_offset+"/"+path])
            # TODO: Does this handle deleted folders too? Wouldn't want to have a case
            #       where we only delete all files from folder but leave orphaned folder around.

def process_svn_log_entry(log_entry, options, commit_paths, prefix = ""):
    """
    Process SVN changes from the given log entry. Build an array (commit_paths)
    of the paths in the working-copy that were changed, i.e. the paths which
    we'll pass to "svn commit".

    'log_entry' is the source log entry; its 'revision' and 'changed_paths' are used.
    'options' is accepted for interface compatibility; it is not read here.
    'commit_paths' is appended to in place.
    'prefix' is prepended to the debug status messages.

    Raises UnsupportedSVNAction for an action outside _valid_svn_actions.
    """
    export_paths = []
    source_rev = log_entry['revision']
    ui.status(prefix + ">> process_svn_log_entry: %s", source_url+"@"+str(source_rev), level=ui.DEBUG, color='GREEN')
    for d in log_entry['changed_paths']:
        # Get the full path for this changed_path
        # e.g. '/branches/bug123/projectA/file1.txt'
        path = d['path']
        if not path.startswith(source_base + "/"):
            # Ignore changed files that are not part of this subdir
            if path != source_base:
                ui.status(prefix + ">> process_svn_log_entry: Unrelated path: %s (base: %s)", path, source_base, level=ui.DEBUG, color='GREEN')
            continue
        assert len(d['kind'])>0
        path_is_dir = d['kind'] == 'dir'
        # Calculate the offset (based on source_base) for this changed_path
        # e.g. 'projectA/file1.txt'
        # (path = source_base + "/" + path_offset)
        path_offset = path[len(source_base):].strip("/")
        # Get the action for this path
        action = d['action']
        if action not in _valid_svn_actions:
            raise UnsupportedSVNAction("In SVN rev. %d: action '%s' not supported. Please report a bug!"
                % (source_rev, action))
        ui.status(" %s %s%s", action, d['path'],
            (" (from %s)" % (d['copyfrom_path']+"@"+str(d['copyfrom_revision']))) if d['copyfrom_path'] else "",
            level=ui.VERBOSE)

        # Try to be efficient and keep track of an explicit list of paths in the
        # working copy that changed. If we commit from the root of the working copy,
        # then SVN needs to crawl the entire working copy looking for pending changes.
        add_path(commit_paths, path_offset)

        # Special-handling for replace's
        if action == 'R':
            # If file was "replaced" (deleted then re-added, all in same revision),
            # then we need to run the "svn rm" first, then change action='A'. This
            # lets the normal code below handle re-"svn add"'ing the files. This
            # should replicate the "replace".
            run_svn(["remove", "--force", path_offset])
            action = 'A'

        # Handle all the various action-types
        # (Handle "add" first, for "svn copy/move" support)
        if action == 'A':
            if d['copyfrom_revision']:
                # Handle cases where this "add" was a copy from another URL in the source repos
                do_svn_add(path_offset, source_rev, "", "", export_paths, path_is_dir, prefix+" ")
            else:
                # Else just "svn export" the files from the source repo and "svn add" them.
                # Create (parent) directory if needed
                p_path = path_offset if path_is_dir else os.path.dirname(path_offset).strip() or '.'
                if not os.path.exists(p_path):
                    run_svn(["mkdir", p_path])
                # Export the entire added tree.
                if path_is_dir:
                    # For directories, defer the (recursive) "svn export". Might have a
                    # situation in a branch merge where the entry in the svn-log is a
                    # non-copy-from'd "add" but there are child contents (that we haven't
                    # gotten to yet in log_entry) that are copy-from's.  When we try do
                    # the "svn copy" later on in do_svn_add() for those copy-from'd paths,
                    # having pre-existing (svn-add'd) contents creates some trouble.
                    # Instead, just create the stub folders ("svn mkdir" above) and defer
                    # exporting the final file-state until the end.
                    add_path(export_paths, path_offset)
                else:
                    # Export the final version of this file. We *need* to do this before running
                    # the "svn add", even if we end-up re-exporting this file again via export_paths.
                    run_svn(["export", "--force", "-r", source_rev,
                             source_url+"/"+path_offset+"@"+str(source_rev), path_offset])
                if not in_svn(path_offset, prefix=prefix+" "):
                    # Need to use in_svn here to handle cases where client committed the parent
                    # folder and each indiv sub-folder.
                    run_svn(["add", "--parents", path_offset])
                # TODO: Need to copy SVN properties from source repos

        elif action == 'D':
            run_svn(["remove", "--force", path_offset])

        elif action == 'M':
            # TODO: Is "svn merge -c" correct here, or should this be an "svn export" instead?
            run_svn(["merge", "-c", source_rev, "--non-recursive",
                     "--non-interactive", "--accept=theirs-full",
                     source_url+"/"+path_offset+"@"+str(source_rev), path_offset])

        else:
            raise InternalError("Internal Error: process_svn_log_entry: Unhandled 'action' value: '%s'"
                % action)

    # Export the final version of all add'd paths from source_url
    for path_offset in export_paths:
        run_svn(["export", "--force", "-r", source_rev,
                 source_url+"/"+path_offset+"@"+str(source_rev), path_offset])

def disp_svn_log_summary(log_entry):
    """
    Display a short "svn log"-style summary (revision, author, date, message)
    for the given log entry, followed by a separator line.

    The date is shown in the local timezone.
    """
    ui.status("")
    ui.status("r%s | %s | %s",
        log_entry['revision'],
        log_entry['author'],
        str(datetime.fromtimestamp(int(log_entry['date'])).isoformat(' ')))
    ui.status(log_entry['message'])
    ui.status("------------------------------------------------------------------------")

564 def real_main(options
, args
):
565 global source_url
, target_url
, rev_map
566 source_url
= args
.pop(0).rstrip("/") # e.g. 'http://server/svn/source/trunk'
567 target_url
= args
.pop(0).rstrip("/") # e.g. 'file:///svn/target/trunk'
568 ui
.status("options: %s", str(options
), level
=ui
.DEBUG
, color
='GREEN')
570 # Make sure that both the source and target URL's are valid
571 source_info
= svnclient
.get_svn_info(source_url
)
572 assert source_url
.startswith(source_info
['repos_url'])
573 target_info
= svnclient
.get_svn_info(target_url
)
574 assert target_url
.startswith(target_info
['repos_url'])
577 global source_repos_url
,source_base
,source_repos_uuid
578 source_repos_url
= source_info
['repos_url'] # e.g. 'http://server/svn/source'
579 source_base
= source_url
[len(source_repos_url
):] # e.g. '/trunk'
580 source_repos_uuid
= source_info
['repos_uuid']
582 source_end_rev
= source_info
['revision'] # Last revision # in the source repo
583 wc_target
= os
.path
.abspath('_wc_target')
589 # Check out a working copy of target_url if needed
590 wc_exists
= os
.path
.exists(wc_target
)
591 if wc_exists
and not options
.cont_from_break
:
592 shutil
.rmtree(wc_target
)
595 svnclient
.svn_checkout(target_url
, wc_target
)
598 if not options
.cont_from_break
:
599 # TODO: Warn user if trying to start (non-continue) into a non-empty target path?
600 # Get log entry for the SVN revision we will check out
602 # If specify a rev, get log entry just before or at rev
603 source_start_log
= svnclient
.get_last_svn_log_entry(source_url
, 1, options
.svn_rev
, False)
605 # Otherwise, get log entry of branch creation
606 # Note: Trying to use svnclient.get_first_svn_log_entry(source_url, 1, source_end_rev, False)
607 # ends-up being *VERY* time-consuming on a repo with lots of revisions. Even though
608 # the "svn log" call is passing --limit 1, it seems like that limit-filter is happening
609 # _after_ svn has fetched the full log history. Instead, search the history in chunks
610 # and write some progress to the screen.
611 ui
.status("Searching for start source revision (%s)...", source_url
, level
=ui
.VERBOSE
)
616 entries
= svnclient
.run_svn_log(source_url
, rev
, min(rev
+chunk_size
-1, target_info
['revision']), 1, get_changed_paths
=False)
618 source_start_log
= entries
[0]
621 ui
.status("...%s...", rev
)
623 if rev
> target_info
['revision']:
625 if not source_start_log
:
626 raise InternalError("Unable to find first revision for source_url: %s" % source_url
)
628 # This is the revision we will start from for source_url
629 source_start_rev
= source_rev
= int(source_start_log
['revision'])
630 ui
.status("Starting at source revision %s.", source_start_rev
, level
=ui
.VERBOSE
)
632 # For the initial commit to the target URL, export all the contents from
633 # the source URL at the start-revision.
634 paths
= run_svn(["list", "-r", source_rev
, source_url
+"@"+str(source_rev
)])
636 disp_svn_log_summary(svnclient
.get_one_svn_log_entry(source_url
, source_rev
, source_rev
))
637 ui
.status("(Initial import)", level
=ui
.VERBOSE
)
638 paths
= paths
.strip("\n").split("\n")
639 for path_raw
in paths
:
640 # For each top-level file/folder...
643 # Directories have a trailing slash in the "svn list" output
644 path_is_dir
= True if path_raw
[-1] == "/" else False
645 path
= path_raw
.rstrip('/') if path_is_dir
else path_raw
646 if path_is_dir
and not os
.path
.exists(path
):
648 ui
.status(" A %s", source_url
[len(source_repos_url
):]+"/"+path
, level
=ui
.VERBOSE
)
649 run_svn(["export", "--force", "-r" , source_rev
, source_url
+"/"+path
+"@"+str(source_rev
), path
])
650 run_svn(["add", path
])
651 num_entries_proc
+= 1
652 target_revprops
= gen_tracking_revprops(source_rev
) # Build source-tracking revprop's
653 target_rev
= commit_from_svn_log_entry(source_start_log
, options
, target_revprops
=target_revprops
)
655 # Update rev_map, mapping table of source-repo rev # -> target-repo rev #
656 set_rev_map(source_rev
, target_rev
)
657 # Update our target working-copy, to ensure everything says it's at the new HEAD revision
661 # Re-build the rev_map based on any already-replayed history in target_url
662 build_rev_map(target_url
, source_info
)
664 raise RuntimeError("Called with continue-mode, but no already-replayed history found in target repo: %s" % target_url
)
665 source_start_rev
= int(max(rev_map
, key
=rev_map
.get
))
666 assert source_start_rev
667 ui
.status("Continuing from source revision %s.", source_start_rev
, level
=ui
.VERBOSE
)
669 svn_vers_t
= svnclient
.get_svn_client_version()
670 svn_vers
= float(".".join(map(str, svn_vers_t
[0:2])))
672 # Load SVN log starting from source_start_rev + 1
673 it_log_entries
= svnclient
.iter_svn_log_entries(source_url
, source_start_rev
+1, source_end_rev
, get_revprops
=True)
677 for log_entry
in it_log_entries
:
678 if options
.entries_proc_limit
:
679 if num_entries_proc
>= options
.entries_proc_limit
:
681 # Replay this revision from source_url into target_url
682 disp_svn_log_summary(log_entry
)
683 source_rev
= log_entry
['revision']
684 # Process all the changed-paths in this log entry
686 process_svn_log_entry(log_entry
, options
, commit_paths
)
687 num_entries_proc
+= 1
688 # Commit any changes made to _wc_target
689 target_revprops
= gen_tracking_revprops(source_rev
) # Build source-tracking revprop's
690 target_rev
= commit_from_svn_log_entry(log_entry
, options
, commit_paths
, target_revprops
=target_revprops
)
692 # Update rev_map, mapping table of source-repo rev # -> target-repo rev #
693 source_rev
= log_entry
['revision']
694 set_rev_map(source_rev
, target_rev
)
695 # Update our target working-copy, to ensure everything says it's at the new HEAD revision
698 # Run "svn cleanup" every 100 commits if SVN 1.7+, to clean-up orphaned ".svn/pristines/*"
699 if svn_vers
>= 1.7 and (commit_count
% 100 == 0):
702 # If there were no new source_url revisions to process, init source_rev
703 # for the "finally" message below.
704 source_rev
= source_end_rev
706 except KeyboardInterrupt:
707 print "\nStopped by user."
708 print "\nCleaning-up..."
712 print "\nCommand failed with following error:\n"
713 traceback
.print_exc()
714 print "\nCleaning-up..."
716 print run_svn(["status"])
719 print "\nFinished at source revision %s%s." % (source_rev
, " (dry-run)" if options
.dry_run
else "")
def main():
    """Parse the command line and hand control to real_main().

    Defined as entry point. Must be callable without arguments: everything
    is read from sys.argv through optparse.

    Command-line contract (see the usage string below):
      * exactly two positional arguments, source_url and target_url;
        any other count ends the program through parser.error()
      * -v may be repeated; the resulting count is scaled by 10 before it
        is handed to ui.update_config()
      * --dry-run forces entries_proc_limit to 1

    Returns whatever real_main(options, args) returns. The __main__ guard
    passes that value to sys.exit().
    """
    usage = "Usage: %prog [OPTIONS] source_url target_url"
    description = """\
Replicate (replay) history from one SVN repository to another. Maintain
logical ancestry wherever possible, so that 'svn log' on the replayed
repo will correctly follow file/folder renames.

Examples:
  Create a copy of only /trunk from source repo, starting at r5000
  $ svnadmin create /svn/target
  $ svn mkdir -m 'Add trunk' file:///svn/target/trunk
  $ svn2svn -av -r 5000 http://server/source/trunk file:///svn/target/trunk
    1. The target_url will be checked-out to ./_wc_target
    2. The first commit to http://server/source/trunk at/after r5000 will be
       exported & added into _wc_target
    3. All revisions affecting http://server/source/trunk (starting at r5000)
       will be replayed to _wc_target. Any add/copy/move/replaces that are
       copy-from'd some path outside of /trunk (e.g. files renamed on a
       /branch and branch was merged into /trunk) will correctly maintain
       logical ancestry where possible.

  Use continue-mode (-c) to pick-up where the last run left-off
  $ svn2svn -avc http://server/source/trunk file:///svn/target/trunk
    1. The target_url will be checked-out to ./_wc_target, if not already
       checked-out
    2. All new revisions affecting http://server/source/trunk starting from
       the last replayed revision to file:///svn/target/trunk (based on the
       svn2svn:* revprops) will be replayed to _wc_target, maintaining all
       logical ancestry where possible."""
    parser = optparse.OptionParser(usage, description=description,
                                   formatter=HelpFormatter(),
                                   version="%prog "+str(full_version))
    parser.add_option("-r", "--revision", type="int", dest="svn_rev", metavar="REV",
                      help="initial SVN revision to start source_url replay")
    parser.add_option("-a", "--keep-author", action="store_true", dest="keep_author", default=False,
                      help="maintain original 'Author' info from source repo")
    parser.add_option("-c", "--continue", action="store_true", dest="cont_from_break",
                      help="continue from previous break")
    parser.add_option("-l", "--limit", type="int", dest="entries_proc_limit", metavar="NUM",
                      help="maximum number of log entries to process")
    parser.add_option("-n", "--dry-run", action="store_true", dest="dry_run", default=False,
                      help="try processing next log entry but don't commit changes to "
                           "target working-copy (forces --limit=1)")
    # "-v" counts upward from 1; "--debug" writes ui.DEBUG into the same dest.
    parser.add_option("-v", "--verbose", dest="verbosity", action="count", default=1,
                      help="enable additional output (use -vv or -vvv for more)")
    parser.add_option("--debug", dest="verbosity", const=ui.DEBUG, action="store_const",
                      help="enable debugging output (same as -vvv)")
    options, args = parser.parse_args()
    # The usage line names exactly two positionals (source_url, target_url).
    # parser.error() prints the usage message and exits, so it must only be
    # reached when the argument count is wrong.
    if len(args) != 2:
        parser.error("incorrect number of arguments")
    if options.verbosity < 10:
        # Expand multiple "-v" arguments to a real ui._level value
        # NOTE(review): presumably ui.DEBUG is >= 10 so "--debug" is left
        # unscaled -- confirm against the ui module.
        options.verbosity *= 10
    if options.dry_run:
        # When in dry-run mode, only try to process the next log_entry
        options.entries_proc_limit = 1
    ui.update_config(options)
    return real_main(options, args)
if __name__ == "__main__":
    # Script entry: run main() and use its result as the process exit
    # status, substituting 0 when main() returns a falsy value (e.g. None).
    exit_status = main() or 0
    sys.exit(exit_status)