#!/usr/bin/env python2
# -*- coding: utf-8 -*-
# Copyright (c) 2005, Giovanni Bajo
# Copyright (c) 2004-2005, Awarix, Inc.
# All rights reserved.
#
# This program is free software; you can redistribute it and/or
# modify it under the terms of the GNU General Public License
# as published by the Free Software Foundation; either version 2
# of the License, or (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA
#
# Author: Archie Cobbs <archie at awarix dot com>
# Rewritten in Python by: Giovanni Bajo <rasky at develer dot com>
#
# Acknowledgments:
#   John Belmonte <john at neggie dot net> - metadata and usability
#     improvements
#   Blair Zajac <blair at orcaware dot com> - random improvements
#   Raman Gupta <rocketraman at fastmail dot fm> - bidirectional and transitive
#     merging support
#   Dustin J. Mitchell <dustin at zmanda dot com> - support for multiple
#     location identifier formats
#
# $HeadURL$
# $LastChangedDate$
# $LastChangedBy$
# $LastChangedRevision$
#
# Requisites:
# svnmerge.py has been tested with all SVN major versions since 1.1 (both
# client and server). It is unknown if it works with previous versions.
#
# Differences from svnmerge.sh:
# - More portable: tested as working in FreeBSD and OS/2.
# - Add double-verbose mode, which shows every svn command executed (-v -v).
# - "svnmerge avail" now only shows commits in source, not also commits in
#   other parts of the repository.
# - Add "svnmerge block" to flag some revisions as blocked, so that
#   they will not show up anymore in the available list.
#   Added also the complementary "svnmerge unblock".
# - "svnmerge avail" has grown two new options:
#   -B to display a list of the blocked revisions
#   -A to display both the blocked and the available revisions.
# - Improved generated commit message to make it machine parsable even when
#   merging commits which are themselves merges.
# - Add --force option to skip working copy check
# - Add --record-only option to "svnmerge merge" to avoid performing
#   an actual merge, yet record that a merge happened.
# - Can use a variety of location-identifier formats
#
# TODO:
#  - Add "svnmerge avail -R": show logs in reverse order
#
# Information for Hackers:
#
# Identifiers for branches:
#  A branch is identified in three ways within this source:
#  - as a working copy (variable name usually includes 'dir')
#  - as a fully qualified URL
#  - as a path identifier (an opaque string indicating a particular path
#    in a particular repository; variable name includes 'pathid')
#  A "target" is generally user-specified, and may be a working copy or
#  a URL.

import sys, os, getopt, re, types, tempfile, time, locale
from bisect import bisect
from xml.dom import pulldom

NAME = "svnmerge"

if not hasattr(sys, "version_info") or sys.version_info < (2, 0):
    # error() is defined further down the module and does not exist yet when
    # this guard runs, so report the problem directly instead of calling it
    # (calling it here would die with a NameError and hide the real message).
    sys.stderr.write("%s: %s\n" % (NAME, "requires Python 2.0 or newer"))
    sys.exit(1)

# Set up the separator used to separate individual log messages from
# each revision merged into the target location.  Also, create a
# regular expression that will find this same separator in already
# committed log messages, so that the separator used for this run of
# svnmerge.py will have one more LOG_SEPARATOR appended to the longest
# separator found in all the commits.
#
# Note on the regular expression: group 1 is the whole run of separators
# found at the start of a line, group 2 is only the last single
# LOG_SEPARATOR of that run.
LOG_SEPARATOR = 8 * '.'
LOG_SEPARATOR_RE = re.compile('^((%s)+)' % re.escape(LOG_SEPARATOR),
                              re.MULTILINE)

# Each line of the embedded log messages will be prefixed by LOG_LINE_PREFIX.
LOG_LINE_PREFIX = 2 * ' '

# Set python to the default locale as per environment settings, same as svn
# TODO we should really parse config and if log-encoding is specified, set
# the locale to match that encoding
locale.setlocale(locale.LC_ALL, '')

# We want the svn output (such as svn info) to be non-localized
# Using LC_MESSAGES should not affect localized output of svn log, for example
if "LC_ALL" in os.environ:
    del os.environ["LC_ALL"]
os.environ["LC_MESSAGES"] = "C"

###############################################################################
# Support for older Python versions
###############################################################################

# NOTE: the former "True, False = 1, 0" fallback for Python < 2.2 was removed.
# This file uses a generator expression (PathIdentifier.__repr__), which
# needs Python 2.4 to parse, so the fallback branch could never execute.

def lstrip(s, ch):
    """Replacement for str.lstrip (support for arbitrary chars to strip was
    added in Python 2.2.2).

    Remove every leading occurrence of the single character CH from S and
    return the remainder ("" when S is empty or consists only of CH)."""
    start = 0
    length = len(s)
    while start < length and s[start] == ch:
        start = start + 1
    return s[start:]

def rstrip(s, ch):
    """Replacement for str.rstrip (support for arbitrary chars to strip was
    added in Python 2.2.2).

    Remove every trailing occurrence of the single character CH from S and
    return the remainder ("" when S is empty or consists only of CH)."""
    end = len(s)
    while end > 0 and s[end-1] == ch:
        end = end - 1
    return s[:end]

def strip(s, ch):
    """Replacement for str.strip (support for arbitrary chars to strip was
    added in Python 2.2.2).

    Remove the single character CH from both ends of S."""
    return lstrip(rstrip(s, ch), ch)

def rsplit(s, sep, maxsplits=0):
    """Like str.rsplit, which is Python 2.4+ only.

    Split S on SEP, keeping at most MAXSPLITS splits counted from the right.
    A MAXSPLITS of 0 (the default), or one larger than the number of pieces,
    returns the plain s.split(sep) result.

    Unlike str.rsplit, when MAXSPLITS equals the number of pieces (for
    example when SEP does not occur and MAXSPLITS is 1) the result gets a
    leading empty string: rsplit("ab", ":", 1) == ["", "ab"].  This is kept
    as is because it lets two-value unpacking of the result succeed."""
    pieces = s.split(sep)
    if not 0 < maxsplits <= len(pieces):
        return pieces
    return [sep.join(pieces[0:-maxsplits])] + pieces[-maxsplits:]

###############################################################################

def kwextract(s):
    """Extract info from a svn keyword string.

    For an expanded keyword such as "$Rev: 1234 $" return the value part
    ("1234"); for an unexpanded keyword such as "$Rev$" return "<unknown>"."""
    try:
        return strip(s, "$").strip().split(": ")[1]
    except IndexError:
        return "<unknown>"

__revision__ = kwextract('$Rev$')
__date__ = kwextract('$Date$')

# Additional options, not (yet?)
mapped to command line flags default_opts = { "svn": "svn", "prop": NAME + "-integrated", "block-prop": NAME + "-blocked", "commit-verbose": True, "verbose": 0, } logs = {} def console_width(): """Get the width of the console screen (if any).""" try: return int(os.environ["COLUMNS"]) except (KeyError, ValueError): pass try: # Call the Windows API (requires ctypes library) from ctypes import windll, create_string_buffer h = windll.kernel32.GetStdHandle(-11) csbi = create_string_buffer(22) res = windll.kernel32.GetConsoleScreenBufferInfo(h, csbi) if res: import struct (bufx, bufy, curx, cury, wattr, left, top, right, bottom, maxx, maxy) = struct.unpack("hhhhHhhhhhh", csbi.raw) return right - left + 1 except ImportError: pass # Parse the output of stty -a if os.isatty(1): out = os.popen("stty -a").read() m = re.search(r"columns (\d+);", out) if m: return int(m.group(1)) # sensible default return 80 def error(s): """Subroutine to output an error and bail.""" print >> sys.stderr, "%s: %s" % (NAME, s) sys.exit(1) def report(s): """Subroutine to output progress message, unless in quiet mode.""" if opts["verbose"]: print "%s: %s" % (NAME, s) def prefix_lines(prefix, lines): """Given a string representing one or more lines of text, insert the specified prefix at the beginning of each line, and return the result. The input must be terminated by a newline.""" assert lines[-1] == "\n" return prefix + lines[:-1].replace("\n", "\n"+prefix) + "\n" def recode_stdout_to_file(s): if locale.getdefaultlocale()[1] is None or not hasattr(sys.stdout, "encoding") \ or sys.stdout.encoding is None: return s u = s.decode(sys.stdout.encoding) return u.encode(locale.getdefaultlocale()[1]) class LaunchError(Exception): """Signal a failure in execution of an external command. Parameters are the exit code of the process, the original command line, and the output of the command.""" try: """Launch a sub-process. 
Return its output (both stdout and stderr), optionally split by lines (if split_lines is True). Raise a LaunchError exception if the exit code of the process is non-zero (failure). This function has two implementations, one based on subprocess (preferred), and one based on popen (for compatibility). """ import subprocess import shlex def launch(cmd, split_lines=True): # Requiring python 2.4 or higher, on some platforms we get # much faster performance from the subprocess module (where python # doesn't try to close an exhorbitant number of file descriptors) stdout = "" stderr = "" try: if os.name == 'nt': p = subprocess.Popen(cmd, stdout=subprocess.PIPE, \ close_fds=False, stderr=subprocess.PIPE) else: # Use shlex to break up the parameters intelligently, # respecting quotes. shlex can't handle unicode. args = shlex.split(cmd.encode('ascii')) p = subprocess.Popen(args, stdout=subprocess.PIPE, \ close_fds=False, stderr=subprocess.PIPE) stdoutAndErr = p.communicate() stdout = stdoutAndErr[0] stderr = stdoutAndErr[1] except OSError, inst: # Using 1 as failure code; should get actual number somehow? For # examples see svnmerge_test.py's TestCase_launch.test_failure and # TestCase_launch.test_failurecode. 
raise LaunchError(1, cmd, stdout + " " + stderr + ": " + str(inst)) if p.returncode == 0: if split_lines: # Setting keepends=True for compatibility with previous logic # (where file.readlines() preserves newlines) return stdout.splitlines(True) else: return stdout else: raise LaunchError(p.returncode, cmd, stdout + stderr) except ImportError: # support versions of python before 2.4 (slower on some systems) def launch(cmd, split_lines=True): if os.name not in ['nt', 'os2']: import popen2 p = popen2.Popen4(cmd) p.tochild.close() if split_lines: out = p.fromchild.readlines() else: out = p.fromchild.read() ret = p.wait() if ret == 0: ret = None else: ret >>= 8 else: i,k = os.popen4(cmd) i.close() if split_lines: out = k.readlines() else: out = k.read() ret = k.close() if ret is None: return out raise LaunchError(ret, cmd, out) def launchsvn(s, show=False, pretend=False, **kwargs): """Launch SVN and grab its output.""" username = password = configdir = "" if opts.get("username", None): username = "--username=" + opts["username"] if opts.get("password", None): password = "--password=" + opts["password"] if opts.get("config-dir", None): configdir = "--config-dir=" + opts["config-dir"] cmd = ' '.join(filter(None, [opts["svn"], "--non-interactive", username, password, configdir, s])) if show or opts["verbose"] >= 2: print cmd if pretend: return None return launch(cmd, **kwargs) def svn_command(s): """Do (or pretend to do) an SVN command.""" out = launchsvn(s, show=opts["show-changes"] or opts["dry-run"], pretend=opts["dry-run"], split_lines=False) if not opts["dry-run"]: print out def check_dir_clean(dir): """Check the current status of dir for local mods.""" if opts["force"]: report('skipping status check because of --force') return report('checking status of "%s"' % dir) # Checking with -q does not show unversioned files or external # directories. Though it displays a debug message for external # directories, after a blank line. 
So, practically, the first line # matters: if it's non-empty there is a modification. out = launchsvn("status -q %s" % dir) if out and out[0].strip(): error('"%s" has local modifications; it must be clean' % dir) class PathIdentifier: """Abstraction for a path identifier, so that we can start talking about it before we know the form that it takes in the properties (its external_form). Objects are referenced in the class variable 'locobjs', keyed by all known forms.""" # a map of UUID (or None) to repository root URL. repo_hints = {} # a map from any known string form to the corresponding PathIdentifier locobjs = {} def __init__(self, repo_relative_path, uuid=None, url=None, external_form=None): self.repo_relative_path = repo_relative_path self.uuid = uuid self.url = url self.external_form = external_form def __repr__(self): return "<PathIdentifier " + ', '.join('%s=%r' % i for i in self.__dict__.items()) + '>' def __str__(self): """Return a printable string representation""" if self.external_form: return self.external_form if self.url: return self.format('url') if self.uuid: return self.format('uuid') return self.format('path') def from_pathid(pathid_str): """convert pathid_str to a PathIdentifier""" if not PathIdentifier.locobjs.has_key(pathid_str): if is_url(pathid_str): # we can determine every form; PathIdentifier.hint knows how to do that PathIdentifier.hint(pathid_str) elif pathid_str[:7] == 'uuid://': mo = re.match('uuid://([^/]*)(.*)', pathid_str) if not mo: error("Invalid path identifier '%s'" % pathid_str) uuid, repo_relative_path = mo.groups() pathid = PathIdentifier(repo_relative_path, uuid=uuid) # we can cache this by uuid:// pathid and by repo-relative path PathIdentifier.locobjs[pathid_str] = PathIdentifier.locobjs[repo_relative_path] = pathid elif pathid_str and pathid_str[0] == '/': # strip any trailing slashes pathid_str = pathid_str.rstrip('/') pathid = PathIdentifier(repo_relative_path=pathid_str) # we can only cache this by repo-relative path 
PathIdentifier.locobjs[pathid_str] = pathid else: error("Invalid path identifier '%s'" % pathid_str) return PathIdentifier.locobjs[pathid_str] from_pathid = staticmethod(from_pathid) def from_target(target): """Convert a target (either a working copy path or an URL) into a path identifier.""" # prime the cache first if we don't know about this target yet if not PathIdentifier.locobjs.has_key(target): PathIdentifier.hint(target) try: return PathIdentifier.locobjs[target] except KeyError: error("Could not recognize path identifier '%s'" % target) from_target = staticmethod(from_target) def hint(target): """Cache some information about target, as it may be referenced by repo-relative path in subversion properties; the cache can help to expand such a relative path to a full path identifier.""" if PathIdentifier.locobjs.has_key(target): return if not is_url(target) and not is_wc(target): return url = target_to_url(target) root = get_repo_root(url) assert root[-1] != "/" assert url[:len(root)] == root, "url=%r, root=%r" % (url, root) repo_relative_path = url[len(root):] try: uuid = get_svninfo(target)['Repository UUID'] uuid_pathid = 'uuid://%s%s' % (uuid, repo_relative_path) except KeyError: uuid = None uuid_pathid = None locobj = PathIdentifier.locobjs.get(url) or \ (uuid_pathid and PathIdentifier.locobjs.get(uuid_pathid)) if not locobj: locobj = PathIdentifier(repo_relative_path, uuid=uuid, url=url) PathIdentifier.repo_hints[uuid] = root # (uuid may be None) PathIdentifier.locobjs[target] = locobj PathIdentifier.locobjs[url] = locobj if uuid_pathid: PathIdentifier.locobjs[uuid_pathid] = locobj if not PathIdentifier.locobjs.has_key(repo_relative_path): PathIdentifier.locobjs[repo_relative_path] = locobj hint = staticmethod(hint) def format(self, fmt): if fmt == 'path': return self.repo_relative_path elif fmt == 'uuid': return "uuid://%s%s" % (self.uuid, self.repo_relative_path) elif fmt == 'url': return self.url else: error("Unkonwn path type '%s'" % fmt) def 
match_substring(self, str): """Test whether str is a substring of any representation of this PathIdentifier.""" if self.repo_relative_path.find(str) >= 0: return True if self.uuid: if ("uuid://%s%s" % (self.uuid, self.repo_relative_path)).find(str) >= 0: return True if self.url: if (self.url + self.repo_relative_path).find(str) >= 0: return True return False def get_url(self): """Convert a pathid into a URL. If this is not possible, error out.""" if self.url: return self.url # if we have a uuid and happen to know the URL for it, use that elif self.uuid and PathIdentifier.repo_hints.has_key(self.uuid): self.url = PathIdentifier.repo_hints[self.uuid] + self.repo_relative_path PathIdentifier.locobjs[self.url] = self return self.url # if we've only seen one rep, use that (a guess, but an educated one) elif not self.uuid and len(PathIdentifier.repo_hints) == 1: uuid, root = PathIdentifier.repo_hints.items()[0] if uuid: self.uuid = uuid PathIdentifier.locobjs['uuid://%s%s' % (uuid, self.repo_relative_path)] = self self.url = root + self.repo_relative_path PathIdentifier.locobjs[self.url] = self report("Guessing that '%s' refers to '%s'" % (self, self.url)) return self.url else: error("Cannot determine URL for '%s'; " % self + "Explicit source argument (-S/--source) required.\n") class RevisionLog: """ A log of the revisions which affected a given URL between two revisions. """ def __init__(self, url, begin, end, find_propchanges=False): """ Create a new RevisionLog object, which stores, in self.revs, a list of the revisions which affected the specified URL between begin and end. If find_propchanges is True, self.propchange_revs will contain a list of the revisions which changed properties directly on the specified URL. URL must be the URL for a directory in the repository. 
""" self.url = url # Setup the log options (--quiet, so we don't show log messages) log_opts = '--xml --quiet -r%s:%s "%s"' % (begin, end, url) if find_propchanges: # The --verbose flag lets us grab merge tracking information # by looking at propchanges log_opts = "--verbose " + log_opts # Read the log to look for revision numbers and merge-tracking info self.revs = [] self.propchange_revs = [] repos_pathid = PathIdentifier.from_target(url) for chg in SvnLogParser(launchsvn("log %s" % log_opts, split_lines=False)): self.revs.append(chg.revision()) for p in chg.paths(): if p.action() == 'M' and p.pathid() == repos_pathid.repo_relative_path: self.propchange_revs.append(chg.revision()) # Save the range of the log self.begin = int(begin) if end == "HEAD": # If end is not provided, we do not know which is the latest # revision in the repository. So we set 'end' to the latest # known revision. self.end = self.revs[-1] else: self.end = int(end) self._merges = None self._blocks = None def merge_metadata(self): """ Return a VersionedProperty object, with a cached view of the merge metadata in the range of this log. """ # Load merge metadata if necessary if not self._merges: self._merges = VersionedProperty(self.url, opts["prop"]) self._merges.load(self) return self._merges def block_metadata(self): if not self._blocks: self._blocks = VersionedProperty(self.url, opts["block-prop"]) self._blocks.load(self) return self._blocks class VersionedProperty: """ A read-only, cached view of a versioned property. self.revs contains a list of the revisions in which the property changes. self.values stores the new values at each corresponding revision. If the value of the property is unknown, it is set to None. Initially, we set self.revs to [0] and self.values to [None]. This indicates that, as of revision zero, we know nothing about the value of the property. 
Later, if you run self.load(log), we cache the value of this property over the entire range of the log by noting each revision in which the property was changed. At the end of the range of the log, we invalidate our cache by adding the value "None" to our cache for any revisions which fall out of the range of our log. Once self.revs and self.values are filled, we can find the value of the property at any arbitrary revision using a binary search on self.revs. Once we find the last revision during which the property was changed, we can lookup the associated value in self.values. (If the associated value is None, the associated value was not cached and we have to do a full propget.) An example: We know that the 'svnmerge' property was added in r10, and changed in r21. We gathered log info up until r40. revs = [0, 10, 21, 40] values = [None, "val1", "val2", None] What these values say: - From r0 to r9, we know nothing about the property. - In r10, the property was set to "val1". This property stayed the same until r21, when it was changed to "val2". - We don't know what happened after r40. """ def __init__(self, url, name): """View the history of a versioned property at URL with name""" self.url = url self.name = name # We know nothing about the value of the property. Setup revs # and values to indicate as such. self.revs = [0] self.values = [None] # We don't have any revisions cached self._initial_value = None self._changed_revs = [] self._changed_values = [] def load(self, log): """ Load the history of property changes from the specified RevisionLog object. """ # Get the property value before the range of the log if log.begin > 1: self.revs.append(log.begin-1) try: self._initial_value = self.raw_get(log.begin-1) except LaunchError: # The specified URL might not exist before the # range of the log. If so, we can safely assume # that the property was empty at that time. 
self._initial_value = { } self.values.append(self._initial_value) else: self._initial_value = { } self.values[0] = self._initial_value # Cache the property values in the log range old_value = self._initial_value for rev in log.propchange_revs: new_value = self.raw_get(rev) if new_value != old_value: self._changed_revs.append(rev) self._changed_values.append(new_value) self.revs.append(rev) self.values.append(new_value) old_value = new_value # Indicate that we know nothing about the value of the property # after the range of the log. if log.revs: self.revs.append(log.end+1) self.values.append(None) def raw_get(self, rev=None): """ Get the property at revision REV. If rev is not specified, get the property at revision HEAD. """ return get_revlist_prop(self.url, self.name, rev) def get(self, rev=None): """ Get the property at revision REV. If rev is not specified, get the property at revision HEAD. """ if rev is not None: # Find the index using a binary search i = bisect(self.revs, rev) - 1 # Return the value of the property, if it was cached if self.values[i] is not None: return self.values[i] # Get the current value of the property return self.raw_get(rev) def changed_revs(self, key=None): """ Get a list of the revisions in which the specified dictionary key was changed in this property. If key is not specified, return a list of revisions in which any key was changed. """ if key is None: return self._changed_revs else: changed_revs = [] old_val = self._initial_value for rev, val in zip(self._changed_revs, self._changed_values): if val.get(key) != old_val.get(key): changed_revs.append(rev) old_val = val return changed_revs def initialized_revs(self): """ Get a list of the revisions in which keys were added or removed in this property. 
""" initialized_revs = [] old_len = len(self._initial_value) for rev, val in zip(self._changed_revs, self._changed_values): if len(val) != old_len: initialized_revs.append(rev) old_len = len(val) return initialized_revs class RevisionSet: """ A set of revisions, held in dictionary form for easy manipulation. If we were to rewrite this script for Python 2.3+, we would subclass this from set (or UserSet). As this class does not include branch information, it's assumed that one instance will be used per branch. """ def __init__(self, parm): """Constructs a RevisionSet from a string in property form, or from a dictionary whose keys are the revisions. Raises ValueError if the input string is invalid.""" self._revs = {} revision_range_split_re = re.compile('[-:]') if isinstance(parm, types.DictType): self._revs = parm.copy() elif isinstance(parm, types.ListType): for R in parm: self._revs[int(R)] = 1 else: parm = parm.strip() if parm: for R in parm.split(","): rev_or_revs = re.split(revision_range_split_re, R) if len(rev_or_revs) == 1: self._revs[int(rev_or_revs[0])] = 1 elif len(rev_or_revs) == 2: for rev in range(int(rev_or_revs[0]), int(rev_or_revs[1])+1): self._revs[rev] = 1 else: raise ValueError, 'Ill formatted revision range: ' + R def sorted(self): revnums = self._revs.keys() revnums.sort() return revnums def normalized(self): """Returns a normalized version of the revision set, which is an ordered list of couples (start,end), with the minimum number of intervals.""" revnums = self.sorted() revnums.reverse() ret = [] while revnums: s = e = revnums.pop() while revnums and revnums[-1] in (e, e+1): e = revnums.pop() ret.append((s, e)) return ret def __str__(self): """Convert the revision set to a string, using its normalized form.""" L = [] for s,e in self.normalized(): if s == e: L.append(str(s)) else: L.append(str(s) + "-" + str(e)) return ",".join(L) def __contains__(self, rev): return self._revs.has_key(rev) def __sub__(self, rs): """Compute subtraction as in 
sets.""" revs = {} for r in self._revs.keys(): if r not in rs: revs[r] = 1 return RevisionSet(revs) def __and__(self, rs): """Compute intersections as in sets.""" revs = {} for r in self._revs.keys(): if r in rs: revs[r] = 1 return RevisionSet(revs) def __nonzero__(self): return len(self._revs) != 0 def __len__(self): """Return the number of revisions in the set.""" return len(self._revs) def __iter__(self): return iter(self.sorted()) def __or__(self, rs): """Compute set union.""" revs = self._revs.copy() revs.update(rs._revs) return RevisionSet(revs) def merge_props_to_revision_set(merge_props, pathid): """A converter which returns a RevisionSet instance containing the revisions from PATH as known to BRANCH_PROPS. BRANCH_PROPS is a dictionary of pathid -> revision set branch integration information (as returned by get_merge_props()).""" if not merge_props.has_key(pathid): error('no integration info available for path "%s"' % pathid) return RevisionSet(merge_props[pathid]) def dict_from_revlist_prop(propvalue): """Given a property value as a string containing per-source revision lists, return a dictionary whose key is a source path identifier and whose value is the revisions for that source.""" prop = {} # Multiple sources are separated by any whitespace. for L in propvalue.split(): # We use rsplit to play safe and allow colons in pathids. pathid_str, revs = rsplit(L.strip(), ":", 1) pathid = PathIdentifier.from_pathid(pathid_str) # cache the "external" form we saw pathid.external_form = pathid_str prop[pathid] = revs return prop def get_revlist_prop(url_or_dir, propname, rev=None): """Given a repository URL or working copy path and a property name, extract the values of the property which store per-source revision lists and return a dictionary whose key is a source path identifier, and whose value is the revisions for that source.""" # Note that propget does not return an error if the property does # not exist, it simply does not output anything. 
So we do not need # to check for LaunchError here. args = '--strict "%s" "%s"' % (propname, url_or_dir) if rev: args = '-r %s %s' % (rev, args) out = launchsvn('propget %s' % args, split_lines=False) return dict_from_revlist_prop(out) def get_merge_props(dir): """Extract the merged revisions.""" return get_revlist_prop(dir, opts["prop"]) def get_block_props(dir): """Extract the blocked revisions.""" return get_revlist_prop(dir, opts["block-prop"]) def get_blocked_revs(dir, source_pathid): p = get_block_props(dir) if p.has_key(source_pathid): return RevisionSet(p[source_pathid]) return RevisionSet("") def format_merge_props(props, sep=" "): """Formats the hash PROPS as a string suitable for use as a Subversion property value.""" assert sep in ["\t", "\n", " "] # must be a whitespace props = props.items() props.sort() L = [] for h, r in props: L.append("%s:%s" % (h, r)) return sep.join(L) def _run_propset(dir, prop, value): """Set the property 'prop' of directory 'dir' to value 'value'. We go through a temporary file to not run into command line length limits.""" try: fd, fname = tempfile.mkstemp() f = os.fdopen(fd, "wb") except AttributeError: # Fallback for Python <= 2.3 which does not have mkstemp (mktemp # suffers from race conditions. Not that we care...) fname = tempfile.mktemp() f = open(fname, "wb") try: f.write(value) f.close() report("property data written to temp file: %s" % value) svn_command('propset "%s" -F "%s" "%s"' % (prop, fname, dir)) finally: os.remove(fname) def set_props(dir, name, props): props = format_merge_props(props) if props: _run_propset(dir, name, props) else: # Check if NAME exists on DIR before trying to delete it. # As of 1.6 propdel no longer supports deleting a # non-existent property. 
out = launchsvn('propget "%s" "%s"' % (name, dir)) if out: svn_command('propdel "%s" "%s"' % (name, dir)) def set_merge_props(dir, props): set_props(dir, opts["prop"], props) def set_block_props(dir, props): set_props(dir, opts["block-prop"], props) def set_blocked_revs(dir, source_pathid, revs): props = get_block_props(dir) if revs: props[source_pathid] = str(revs) elif props.has_key(source_pathid): del props[source_pathid] set_block_props(dir, props) def is_url(url): """Check if url looks like a valid url.""" return re.search(r"^[a-zA-Z][-+\.\w]*://[^\s]+$", url) is not None and url[:4] != 'uuid' def check_url(url): """Similar to is_url, but actually invoke get_svninfo to find out""" return get_svninfo(url) != {} def is_pathid(pathid): return isinstance(pathid, PathIdentifier) def is_wc(dir): """Check if a directory is a working copy.""" return os.path.isdir(os.path.join(dir, ".svn")) or \ os.path.isdir(os.path.join(dir, "_svn")) _cache_svninfo = {} def get_svninfo(target): """Extract the subversion information for a target (through 'svn info'). This function uses an internal cache to let clients query information many times.""" if _cache_svninfo.has_key(target): return _cache_svninfo[target] info = {} for L in launchsvn('info "%s"' % target): L = L.strip() if not L: continue key, value = L.split(": ", 1) info[key] = value.strip() _cache_svninfo[target] = info return info def target_to_url(target): """Convert working copy path or repos URL to a repos URL.""" if is_wc(target): info = get_svninfo(target) return info["URL"] return target _cache_reporoot = {} def get_repo_root(target): """Compute the root repos URL given a working-copy path, or a URL.""" # Try using "svn info WCDIR". 
This works only on SVN clients >= 1.3 if not is_url(target): try: info = get_svninfo(target) root = info["Repository Root"] _cache_reporoot[root] = None return root except KeyError: pass url = target_to_url(target) assert url[-1] != '/' else: url = target # Go through the cache of the repository roots. This avoids extra # server round-trips if we are asking the root of different URLs # in the same repository (the cache in get_svninfo() cannot detect # that of course and would issue a remote command). assert is_url(url) for r in _cache_reporoot: if url.startswith(r): return r # Try using "svn info URL". This works only on SVN clients >= 1.2 try: info = get_svninfo(url) # info may be {}, in which case we'll see KeyError here root = info["Repository Root"] _cache_reporoot[root] = None return root except (KeyError, LaunchError): pass # Constrained to older svn clients, we are stuck with this ugly # trial-and-error implementation. It could be made faster with a # binary search. while url: temp = os.path.dirname(url) try: launchsvn('proplist "%s"' % temp) except LaunchError: _cache_reporoot[url] = None return rstrip(url, "/") url = temp error("svn repos root of %s not found" % target) class SvnLogParser: """ Parse the "svn log", going through the XML output and using pulldom (which would even allow streaming the command output). 
""" def __init__(self, xml): self._events = pulldom.parseString(xml) def __getitem__(self, idx): for event, node in self._events: if event == pulldom.START_ELEMENT and node.tagName == "logentry": self._events.expandNode(node) return self.SvnLogRevision(node) raise IndexError, "Could not find 'logentry' tag in xml" class SvnLogRevision: def __init__(self, xmlnode): self.n = xmlnode def revision(self): return int(self.n.getAttribute("revision")) def author(self): return self.n.getElementsByTagName("author")[0].firstChild.data def paths(self): return [self.SvnLogPath(n) for n in self.n.getElementsByTagName("path")] class SvnLogPath: def __init__(self, xmlnode): self.n = xmlnode def action(self): return self.n.getAttribute("action") def pathid(self): return self.n.firstChild.data def copyfrom_rev(self): try: return self.n.getAttribute("copyfrom-rev") except KeyError: return None def copyfrom_pathid(self): try: return self.n.getAttribute("copyfrom-path") except KeyError: return None def get_copyfrom(target): """Get copyfrom info for a given target (it represents the repository-relative path from where it was branched). NOTE: repos root has no copyfrom info. In this case None is returned. Returns the: - source file or directory from which the copy was made - revision from which that source was copied - revision in which the copy was committed """ repos_path = PathIdentifier.from_target(target).repo_relative_path for chg in SvnLogParser(launchsvn('log -v --xml --stop-on-copy "%s"' % target, split_lines=False)): for p in chg.paths(): if p.action() == 'A' and p.pathid() == repos_path: # These values will be None if the corresponding elements are # not found in the log. 
return p.copyfrom_pathid(), p.copyfrom_rev(), chg.revision() return None,None,None def get_latest_rev(url): """Get the latest revision of the repository of which URL is part.""" try: info = get_svninfo(url) if not info.has_key("Revision"): error("Not a valid URL: %s" % url) return info["Revision"] except LaunchError: # Alternative method for latest revision checking (for svn < 1.2) report('checking latest revision of "%s"' % url) L = launchsvn('proplist --revprop -r HEAD "%s"' % opts["source-url"])[0] rev = re.search("revision (\d+)", L).group(1) report('latest revision of "%s" is %s' % (url, rev)) return rev def get_created_rev(url): """Lookup the revision at which the path identified by the provided URL was first created.""" oldest_rev = -1 report('determining oldest revision for URL "%s"' % url) ### TODO: Refactor this to use a modified RevisionLog class. lines = None cmd = "log -r1:HEAD --stop-on-copy -q " + url try: lines = launchsvn(cmd + " --limit=1") except LaunchError: # Assume that --limit isn't supported by the installed 'svn'. lines = launchsvn(cmd) if lines and len(lines) > 1: i = lines[1].find(" ") if i != -1: oldest_rev = int(lines[1][1:i]) if oldest_rev == -1: error('unable to determine oldest revision for URL "%s"' % url) return oldest_rev def get_commit_log(url, revnum): """Return the log message for a specific integer revision number.""" out = launchsvn("log --incremental -r%d %s" % (revnum, url)) return recode_stdout_to_file("".join(out[1:])) def construct_merged_log_message(url, revnums): """Return a commit log message containing all the commit messages in the specified revisions at the given URL. The separator used in this log message is determined by searching for the longest svnmerge separator existing in the commit log messages and extending it by one more separator. This results in a new commit log message that is clearer in describing merges that contain other merges. 
def get_default_source(branch_target, branch_props):
    """Return the default source for branch_target (given its branch_props).

    branch_props maps path identifiers to their recorded merge info. The
    entry for branch_target itself, if present, is ignored. Calls error()
    if no candidate source is left or if more than one remains (in which
    case an explicit -S/--source argument is required).
    """
    if not branch_props:
        error("no integration info available")

    # Work on a copy so the caller's mapping is left untouched.
    props = branch_props.copy()
    pathid = PathIdentifier.from_target(branch_target)

    # To make bidirectional merges easier, find the target's
    # repository local path so it can be removed from the list of
    # possible integration sources.
    if pathid in props:
        del props[pathid]

    # The target itself may have been the only entry; without this check
    # the final lookup would fail with an IndexError.
    if not props:
        error("no integration info available")

    if len(props) > 1:
        err_msg = "multiple sources found. "
        err_msg += "Explicit source argument (-S/--source) required.\n"
        err_msg += "The merge sources available are:"
        for prop in props:
            err_msg += "\n " + str(prop)
        error(err_msg)

    return list(props)[0]
def minimal_merge_intervals(revs, phantom_revs):
    """Produce the smallest number of intervals suitable for merging.

    revs is the RevisionSet which we want to merge; its normalized() method
    must return an ascending list of non-adjacent (start, end) tuples.
    phantom_revs holds phantom revisions (anything supporting "in"), which
    can be used to concatenate intervals, thus minimizing the number of
    operations: two neighbouring intervals are joined when every revision
    in the gap between them is a phantom revision.

    Returns a list of (start, end) tuples in ascending order; an empty list
    if revs contains no revisions.
    """
    # Copy, so that popping does not alter a list owned by the caller.
    pending = list(revs.normalized())
    if not pending:
        return []

    ret = []
    # Walk the intervals from the highest to the lowest.
    cur = pending.pop()
    while pending:
        prev = pending.pop()
        assert prev[1] < cur[0]      # otherwise it is not ordered
        assert cur[0] - prev[1] > 1  # otherwise it is not normalized
        for i in range(prev[1] + 1, cur[0]):
            if i not in phantom_revs:
                # A real revision sits in the gap: cur cannot be extended.
                ret.append(cur)
                cur = prev
                break
        else:
            # The gap holds only phantom revisions: join the two intervals.
            cur = (prev[0], cur[1])

    ret.append(cur)
    ret.reverse()
    return ret
def action_init(target_dir, target_props):
    """Initialize for merges.

    Records in target_props (and, through set_merge_props, on target_dir)
    which revisions of the source given by opts['source-pathid'] /
    opts['source-url'] are considered already merged. The revision range is
    taken from opts["revision"] if given; otherwise it is deduced from the
    copy history of source and target, falling back to "everything up to
    the latest revision of the source". If opts["commit-file"] is set, a
    suggested commit message is written to that file.
    """
    # Check that directory is ready for being modified
    check_dir_clean(target_dir)

    target_pathid = PathIdentifier.from_target(target_dir)
    source_pathid = opts['source-pathid']
    if source_pathid == target_pathid:
        error("cannot init integration source path '%s'\nIts path identifier does not "
              "differ from the path identifier of the current directory, '%s'."
              % (source_pathid, target_pathid))

    source_url = opts['source-url']

    # If the user hasn't specified the revisions to use, see if the
    # "source" is a copy from the current tree and if so, we can use
    # the version data obtained from it.
    revision_range = opts["revision"]
    if not revision_range:
        # If source was originally copied from target, and we are merging
        # changes from source to target (the copy target is the merge source,
        # and the copy source is the merge target), then we want to mark as
        # integrated up to the rev in which the copy was committed which
        # created the merge source:
        cf_source, cf_rev, copy_committed_in_rev = get_copyfrom(source_url)

        cf_pathid = None
        if cf_source:
            cf_url = get_repo_root(source_url) + cf_source
            if is_url(cf_url) and check_url(cf_url):
                cf_pathid = PathIdentifier.from_target(cf_url)

        if target_pathid == cf_pathid:
            report('the source "%s" was copied from "%s" in rev %s and committed in rev %s' %
                   (source_url, target_dir, cf_rev, copy_committed_in_rev))
            revision_range = "1-" + str(copy_committed_in_rev)

    if not revision_range:
        # If the reverse is true: copy source is the merge source, and
        # the copy target is the merge target, then we want to mark as
        # integrated up to the specific rev of the merge target from
        # which the merge source was copied. (Longer discussion at:
        # http://subversion.tigris.org/issues/show_bug.cgi?id=2810 )
        cf_source, cf_rev, copy_committed_in_rev = get_copyfrom(target_dir)

        cf_pathid = None
        if cf_source:
            cf_url = get_repo_root(target_dir) + cf_source
            if is_url(cf_url) and check_url(cf_url):
                cf_pathid = PathIdentifier.from_target(cf_url)

        source_pathid = PathIdentifier.from_target(source_url)
        if source_pathid == cf_pathid:
            report('the target "%s" was copied from the source "%s" in rev %s and committed in rev %s' %
                   (target_dir, source_url, cf_rev, copy_committed_in_rev))
            revision_range = "1-" + cf_rev

    # When neither the merge source nor target is a copy of the other, and
    # the user did not specify a revision range, then choose a default which is
    # the current revision; saying, in effect, "everything has been merged, so
    # mark as integrated up to the latest rev on source url).
    if not revision_range:
        revision_range = "1-" + get_latest_rev(source_url)

    revs = RevisionSet(revision_range)

    report('marking "%s" as already containing revisions "%s" of "%s"' %
           (target_dir, revs, source_url))

    # From here on only the textual form of the revision set is needed.
    revs = str(revs)

    # If the local svnmerge-integrated property already has an entry
    # for the source-pathid, simply error out.
    if not opts["force"] and target_props.has_key(source_pathid):
        error('Repository-relative path %s has already been initialized at %s\n'
              'Use --force to re-initialize' % (source_pathid, target_dir))

    # set the pathid's external_form based on the user's options
    source_pathid.external_form = source_pathid.format(opts['location-type'])

    target_props[source_pathid] = revs

    # Set property
    set_merge_props(target_dir, target_props)

    # Write out commit message if desired
    if opts["commit-file"]:
        f = open(opts["commit-file"], "w")
        try:
            print >>f, 'Initialized merge tracking via "%s" with revisions "%s" from ' \
                % (NAME, revs)
            print >>f, '%s' % source_url
        finally:
            # Release the file even if writing the message fails.
            f.close()
        report('wrote commit message to "%s"' % opts["commit-file"])
def action_merge(branch_dir, branch_props):
    """Record merge meta data, and do the actual merge (if not
    requested otherwise via --record-only).

    The revisions to merge are opts["revision"] if given, otherwise every
    source revision, minus those already merged, blocked, reflected,
    phantom or initialized. After merging, the merge property of branch_dir
    is updated through branch_props and, if opts["commit-file"] is set, a
    suggested commit message is written to that file.
    """
    # Check branch directory is ready for being modified
    check_dir_clean(branch_dir)

    source_revs, phantom_revs, reflected_revs, initialized_revs = \
        analyze_source_revs(branch_dir, opts["source-url"],
                            find_reflected=should_find_reflected(branch_dir))

    if opts["revision"]:
        revs = RevisionSet(opts["revision"])
    else:
        revs = source_revs

    blocked_revs = get_blocked_revs(branch_dir, opts["source-pathid"])
    merged_revs = opts["merged-revs"]

    # Show what we're doing
    if opts["verbose"]:  # just to avoid useless calculations
        if merged_revs & revs:
            report('"%s" already contains revisions %s' % (branch_dir,
                                                           merged_revs & revs))
        if phantom_revs:
            report('memorizing phantom revision(s): %s' % phantom_revs)
        if reflected_revs:
            report('memorizing reflected revision(s): %s' % reflected_revs)
        if blocked_revs & revs:
            report('skipping blocked revisions(s): %s' % (blocked_revs & revs))
        if initialized_revs:
            report('skipping initialized revision(s): %s' % initialized_revs)

    # Compute final merge set.
    revs = revs - merged_revs - blocked_revs - reflected_revs - \
           phantom_revs - initialized_revs
    if not revs:
        report('no revisions to merge, exiting')
        return

    # When manually marking revisions as merged, we only update the
    # integration meta data, and don't perform an actual merge.
    record_only = opts["record-only"]

    if record_only:
        report('recording merge of revision(s) %s from "%s"' %
               (revs, opts["source-url"]))
    else:
        report('merging in revision(s) %s from "%s"' %
               (revs, opts["source-url"]))

    # Do the merge(s). Note: the starting revision number to 'svn merge'
    # is NOT inclusive so we have to subtract one from start.
    # We try to keep the number of merge operations as low as possible,
    # because it is faster and reduces the number of conflicts.
    old_block_props = get_block_props(branch_dir)
    merge_metadata = logs[opts["source-url"]].merge_metadata()
    block_metadata = logs[opts["source-url"]].block_metadata()
    if not record_only:
        for start, end in minimal_merge_intervals(revs, phantom_revs):
            # Preset merge/blocked properties to the source value at
            # the start rev to avoid spurious property conflicts
            set_merge_props(branch_dir, merge_metadata.get(start - 1))
            set_block_props(branch_dir, block_metadata.get(start - 1))
            # Do the merge
            svn_command("merge --force -r %d:%d %s %s" % \
                        (start - 1, end, opts["source-url"], branch_dir))
            # TODO: to support graph merging, add logic to merge the property
            # meta-data manually

    # Update the set of merged revisions.
    merged_revs = merged_revs | revs | reflected_revs | phantom_revs | initialized_revs
    branch_props[opts["source-pathid"]] = str(merged_revs)
    set_merge_props(branch_dir, branch_props)
    # Reset the blocked revs
    set_block_props(branch_dir, old_block_props)

    # Write out commit message if desired
    if opts["commit-file"]:
        f = open(opts["commit-file"], "w")
        try:
            if record_only:
                print >>f, 'Recorded merge of revisions %s via %s from ' % \
                      (revs, NAME)
            else:
                print >>f, 'Merged revisions %s via %s from ' % \
                      (revs, NAME)
            print >>f, '%s' % opts["source-url"]
            if opts["commit-verbose"]:
                print >>f
                print >>f, construct_merged_log_message(opts["source-url"], revs),
        finally:
            # Release the file even if building or writing the message fails.
            f.close()
        report('wrote commit message to "%s"' % opts["commit-file"])
def action_rollback(branch_dir, branch_props):
    """Rollback previously integrated revisions.

    opts["revision"] is mandatory and selects which of the revisions already
    merged from opts["source-pathid"] are reverse-merged out of branch_dir
    (or, with opts["record-only"], merely recorded as rolled back). The
    merge property of branch_dir is updated accordingly and, if
    opts["commit-file"] is set, a suggested commit message is written.

    Note that the branch_props argument is replaced by the properties
    freshly read from branch_dir.
    """
    # Make sure the revision arguments are present
    if not opts["revision"]:
        error("The '-r' option is mandatory for rollback")

    # Check branch directory is ready for being modified
    check_dir_clean(branch_dir)

    # Extract the integration info for the branch_dir
    branch_props = get_merge_props(branch_dir)
    # Get the list of all revisions already merged into this source-pathid.
    merged_revs = merge_props_to_revision_set(branch_props,
                                              opts["source-pathid"])

    # At which revision was the src created?
    oldest_src_rev = get_created_rev(opts["source-url"])
    src_pre_exist_range = RevisionSet("1-%d" % oldest_src_rev)

    # Limit to revisions specified by -r (if any)
    revs = merged_revs & RevisionSet(opts["revision"])

    # make sure there's some revision to rollback
    if not revs:
        report("Nothing to rollback in revision range r%s" % opts["revision"])
        return

    # If even one specified revision lies outside the lifetime of the
    # merge source, error out.
    if revs & src_pre_exist_range:
        err_str = "Specified revision range falls out of the rollback range.\n"
        err_str += "%s was created at r%d" % (opts["source-pathid"],
                                              oldest_src_rev)
        error(err_str)

    record_only = opts["record-only"]

    if record_only:
        report('recording rollback of revision(s) %s from "%s"' %
               (revs, opts["source-url"]))
    else:
        report('rollback of revision(s) %s from "%s"' %
               (revs, opts["source-url"]))

    # Do the reverse merge(s). Note: the starting revision number
    # to 'svn merge' is NOT inclusive so we have to subtract one from start.
    # We try to keep the number of merge operations as low as possible,
    # because it is faster and reduces the number of conflicts.
    if not record_only:
        rollback_intervals = minimal_merge_intervals(revs, [])
        # rollback in the reverse order of merge
        rollback_intervals.reverse()
        for start, end in rollback_intervals:
            # Do the merge
            svn_command("merge --force -r %d:%d %s %s" % \
                        (end, start - 1, opts["source-url"], branch_dir))

    # Write out commit message if desired
    if opts["commit-file"]:
        f = open(opts["commit-file"], "w")
        try:
            if record_only:
                print >>f, 'Recorded rollback of revisions %s via %s from ' % \
                      (revs , NAME)
            else:
                print >>f, 'Rolled back revisions %s via %s from ' % \
                      (revs , NAME)
            print >>f, '%s' % opts["source-url"]
        finally:
            # Release the file even if writing the message fails.
            f.close()
        report('wrote commit message to "%s"' % opts["commit-file"])

    # Update the set of merged revisions.
    merged_revs = merged_revs - revs
    branch_props[opts["source-pathid"]] = str(merged_revs)
    set_merge_props(branch_dir, branch_props)
if not branch_props.has_key(opts["source-pathid"]): error('Repository-relative path "%s" does not contain merge ' 'tracking information for "%s"' \ % (opts["source-pathid"], branch_dir)) del branch_props[opts["source-pathid"]] # Set merge property with the selected source deleted set_merge_props(branch_dir, branch_props) # Set blocked revisions for the selected source to None set_blocked_revs(branch_dir, opts["source-pathid"], None) # Write out commit message if desired if opts["commit-file"]: f = open(opts["commit-file"], "w") print >>f, 'Removed merge tracking for "%s" for ' % NAME print >>f, '%s' % opts["source-url"] f.close() report('wrote commit message to "%s"' % opts["commit-file"]) ############################################################################### # Command line parsing -- options and commands management ############################################################################### class OptBase: def __init__(self, *args, **kwargs): self.help = kwargs["help"] del kwargs["help"] self.lflags = [] self.sflags = [] for a in args: if a.startswith("--"): self.lflags.append(a) elif a.startswith("-"): self.sflags.append(a) else: raise TypeError, "invalid flag name: %s" % a if kwargs.has_key("dest"): self.dest = kwargs["dest"] del kwargs["dest"] else: if not self.lflags: raise TypeError, "cannot deduce dest name without long options" self.dest = self.lflags[0][2:] if kwargs: raise TypeError, "invalid keyword arguments: %r" % kwargs.keys() def repr_flags(self): f = self.sflags + self.lflags r = f[0] for fl in f[1:]: r += " [%s]" % fl return r class Option(OptBase): def __init__(self, *args, **kwargs): self.default = kwargs.setdefault("default", 0) del kwargs["default"] self.value = kwargs.setdefault("value", None) del kwargs["value"] OptBase.__init__(self, *args, **kwargs) def apply(self, state, value): assert value == "" if self.value is not None: state[self.dest] = self.value else: state[self.dest] += 1 class OptionArg(OptBase): def __init__(self, 
*args, **kwargs): self.default = kwargs["default"] del kwargs["default"] self.metavar = kwargs.setdefault("metavar", None) del kwargs["metavar"] OptBase.__init__(self, *args, **kwargs) if self.metavar is None: if self.dest is not None: self.metavar = self.dest.upper() else: self.metavar = "arg" if self.default: self.help += " (default: %s)" % self.default def apply(self, state, value): assert value is not None state[self.dest] = value def repr_flags(self): r = OptBase.repr_flags(self) return r + " " + self.metavar class CommandOpts: class Cmd: def __init__(self, *args): self.name, self.func, self.usage, self.help, self.opts = args def short_help(self): return self.help.split(".")[0] def __str__(self): return self.name def __call__(self, *args, **kwargs): return self.func(*args, **kwargs) def __init__(self, global_opts, common_opts, command_table, version=None): self.progname = NAME self.version = version.replace("%prog", self.progname) self.cwidth = console_width() - 2 self.ctable = command_table.copy() self.gopts = global_opts[:] self.copts = common_opts[:] self._add_builtins() for k in self.ctable.keys(): cmd = self.Cmd(k, *self.ctable[k]) opts = [] for o in cmd.opts: if isinstance(o, types.StringType) or \ isinstance(o, types.UnicodeType): o = self._find_common(o) opts.append(o) cmd.opts = opts self.ctable[k] = cmd def _add_builtins(self): self.gopts.append( Option("-h", "--help", help="show help for this command and exit")) if self.version is not None: self.gopts.append( Option("-V", "--version", help="show version info and exit")) self.ctable["help"] = (self._cmd_help, "help [COMMAND]", "Display help for a specific command. 
If COMMAND is omitted, " "display brief command description.", []) def _cmd_help(self, cmd=None, *args): if args: self.error("wrong number of arguments", "help") if cmd is not None: cmd = self._command(cmd) self.print_command_help(cmd) else: self.print_command_list() def _paragraph(self, text, width=78): chunks = re.split("\s+", text.strip()) chunks.reverse() lines = [] while chunks: L = chunks.pop() while chunks and len(L) + len(chunks[-1]) + 1 <= width: L += " " + chunks.pop() lines.append(L) return lines def _paragraphs(self, text, *args, **kwargs): pars = text.split("\n\n") lines = self._paragraph(pars[0], *args, **kwargs) for p in pars[1:]: lines.append("") lines.extend(self._paragraph(p, *args, **kwargs)) return lines def _print_wrapped(self, text, indent=0): text = self._paragraphs(text, self.cwidth - indent) print text.pop(0) for t in text: print " " * indent + t def _find_common(self, fl): for o in self.copts: if fl in o.lflags+o.sflags: return o assert False, fl def _compute_flags(self, opts, check_conflicts=True): back = {} sfl = "" lfl = [] for o in opts: sapp = lapp = "" if isinstance(o, OptionArg): sapp, lapp = ":", "=" for s in o.sflags: if check_conflicts and back.has_key(s): raise RuntimeError, "option conflict: %s" % s back[s] = o sfl += s[1:] + sapp for l in o.lflags: if check_conflicts and back.has_key(l): raise RuntimeError, "option conflict: %s" % l back[l] = o lfl.append(l[2:] + lapp) return sfl, lfl, back def _extract_command(self, args): """ Try to extract the command name from the argument list. This is non-trivial because we want to allow command-specific options even before the command itself. 
""" opts = self.gopts[:] for cmd in self.ctable.values(): opts.extend(cmd.opts) sfl, lfl, _ = self._compute_flags(opts, check_conflicts=False) lopts,largs = getopt.getopt(args, sfl, lfl) if not largs: return None return self._command(largs[0]) def _fancy_getopt(self, args, opts, state=None): if state is None: state= {} for o in opts: if not state.has_key(o.dest): state[o.dest] = o.default sfl, lfl, back = self._compute_flags(opts) try: lopts,args = getopt.gnu_getopt(args, sfl, lfl) except AttributeError: # Before Python 2.3, there was no gnu_getopt support. # So we can't parse intermixed positional arguments # and options. lopts,args = getopt.getopt(args, sfl, lfl) for o,v in lopts: back[o].apply(state, v) return state, args def _command(self, cmd): if not self.ctable.has_key(cmd): self.error("unknown command: '%s'" % cmd) return self.ctable[cmd] def parse(self, args): if not args: self.print_small_help() sys.exit(0) cmd = None try: cmd = self._extract_command(args) opts = self.gopts[:] if cmd: opts.extend(cmd.opts) args.remove(cmd.name) state, args = self._fancy_getopt(args, opts) except getopt.GetoptError, e: self.error(e, cmd) # Handle builtins if self.version is not None and state["version"]: self.print_version() sys.exit(0) if state["help"]: # special case for --help if cmd: self.print_command_help(cmd) sys.exit(0) cmd = self.ctable["help"] else: if cmd is None: self.error("command argument required") if str(cmd) == "help": cmd(*args) sys.exit(0) return cmd, args, state def error(self, s, cmd=None): print >>sys.stderr, "%s: %s" % (self.progname, s) if cmd is not None: self.print_command_help(cmd) else: self.print_small_help() sys.exit(1) def print_small_help(self): print "Type '%s help' for usage" % self.progname def print_usage_line(self): print "usage: %s <subcommand> [options...] 
[args...]\n" % self.progname def print_command_list(self): print "Available commands (use '%s help COMMAND' for more details):\n" \ % self.progname cmds = self.ctable.keys() cmds.sort() indent = max(map(len, cmds)) for c in cmds: h = self.ctable[c].short_help() print " %-*s " % (indent, c), self._print_wrapped(h, indent+6) def print_command_help(self, cmd): cmd = self.ctable[str(cmd)] print 'usage: %s %s\n' % (self.progname, cmd.usage) self._print_wrapped(cmd.help) def print_opts(opts, self=self): if not opts: return flags = [o.repr_flags() for o in opts] indent = max(map(len, flags)) for f,o in zip(flags, opts): print " %-*s :" % (indent, f), self._print_wrapped(o.help, indent+5) print '\nCommand options:' print_opts(cmd.opts) print '\nGlobal options:' print_opts(self.gopts) def print_version(self): print self.version ############################################################################### # Options and Commands description ############################################################################### global_opts = [ Option("-F", "--force", help="force operation even if the working copy is not clean, or " "there are pending updates"), Option("-n", "--dry-run", help="don't actually change anything, just pretend; " "implies --show-changes"), Option("-s", "--show-changes", help="show subversion commands that make changes"), Option("-v", "--verbose", help="verbose mode: output more information about progress"), OptionArg("-u", "--username", default=None, help="invoke subversion commands with the supplied username"), OptionArg("-p", "--password", default=None, help="invoke subversion commands with the supplied password"), OptionArg("-c", "--config-dir", metavar="DIR", default=None, help="cause subversion commands to consult runtime config directory DIR"), ] common_opts = [ Option("-b", "--bidirectional", value=True, default=False, help="remove reflected and initialized revisions from merge candidates. 
" "Not required but may be specified to speed things up slightly"), OptionArg("-f", "--commit-file", metavar="FILE", default="svnmerge-commit-message.txt", help="set the name of the file where the suggested log message " "is written to"), Option("-M", "--record-only", value=True, default=False, help="do not perform an actual merge of the changes, yet record " "that a merge happened"), OptionArg("-r", "--revision", metavar="REVLIST", default="", help="specify a revision list, consisting of revision numbers " 'and ranges separated by commas, e.g., "534,537-539,540"'), OptionArg("-S", "--source", "--head", default=None, help="specify a merge source for this branch. It can be either " "a working directory path, a full URL, or an unambiguous " "substring of one of the locations for which merge tracking was " "already initialized. Needed only to disambiguate in case of " "multiple merge sources"), ] command_table = { "init": (action_init, "init [OPTION...] [SOURCE]", """Initialize merge tracking from SOURCE on the current working directory. If SOURCE is specified, all the revisions in SOURCE are marked as already merged; if this is not correct, you can use --revision to specify the exact list of already-merged revisions. If SOURCE is omitted, then it is computed from the "svn cp" history of the current working directory (searching back for the branch point); in this case, %s assumes that no revision has been integrated yet since the branch point (unless you teach it with --revision).""" % NAME, [ "-f", "-r", # import common opts OptionArg("-L", "--location-type", dest="location-type", default="path", help="Use this type of location identifier in the new " + "Subversion properties; 'uuid', 'url', or 'path' " + "(default)"), ]), "avail": (action_avail, "avail [OPTION...] [PATH]", """Show unmerged revisions available for PATH as a revision list. If --revision is given, the revisions shown will be limited to those also specified in the option. 
When svnmerge is used to bidirectionally merge changes between a branch and its source, it is necessary to not merge the same changes forth and back: e.g., if you committed a merge of a certain revision of the branch into the source, you do not want that commit to appear as available to merged into the branch (as the code originated in the branch itself!). svnmerge will automatically exclude these so-called "reflected" revisions.""", [ Option("-A", "--all", dest="avail-showwhat", value=["blocked", "avail"], default=["avail"], help="show both available and blocked revisions (aka ignore " "blocked revisions)"), "-b", Option("-B", "--blocked", dest="avail-showwhat", value=["blocked"], help="show the blocked revision list (see '%s block')" % NAME), Option("-d", "--diff", dest="avail-display", value="diffs", default="revisions", help="show corresponding diff instead of revision list"), Option("--summarize", dest="avail-display", value="summarize", help="show summarized diff instead of revision list"), Option("-l", "--log", dest="avail-display", value="logs", help="show corresponding log history instead of revision list"), "-r", "-S", ]), "integrated": (action_integrated, "integrated [OPTION...] [PATH]", """Show merged revisions available for PATH as a revision list. If --revision is given, the revisions shown will be limited to those also specified in the option.""", [ Option("-d", "--diff", dest="integrated-display", value="diffs", default="revisions", help="show corresponding diff instead of revision list"), Option("-l", "--log", dest="integrated-display", value="logs", help="show corresponding log history instead of revision list"), "-r", "-S", ]), "rollback": (action_rollback, "rollback [OPTION...] [PATH]", """Rollback previously merged in revisions from PATH. The --revision option is mandatory, and specifies which revisions will be rolled back. Only the previously integrated merges will be rolled back. 
When manually rolling back changes, --record-only can be used to instruct %s that a manual rollback of a certain revision already happened, so that it can record it and offer that revision for merge henceforth.""" % (NAME), [ "-f", "-r", "-S", "-M", # import common opts ]), "merge": (action_merge, "merge [OPTION...] [PATH]", """Merge in revisions into PATH from its source. If --revision is omitted, all the available revisions will be merged. In any case, already merged-in revisions will NOT be merged again. When svnmerge is used to bidirectionally merge changes between a branch and its source, it is necessary to not merge the same changes forth and back: e.g., if you committed a merge of a certain revision of the branch into the source, you do not want that commit to appear as available to merged into the branch (as the code originated in the branch itself!). svnmerge will automatically exclude these so-called "reflected" revisions. When manually merging changes across branches, --record-only can be used to instruct %s that a manual merge of a certain revision already happened, so that it can record it and not offer that revision for merge anymore. Conversely, when there are revisions which should not be merged, use '%s block'.""" % (NAME, NAME), [ "-b", "-f", "-r", "-S", "-M", # import common opts ]), "block": (action_block, "block [OPTION...] [PATH]", """Block revisions within PATH so that they disappear from the available list. This is useful to hide revisions which will not be integrated. If --revision is omitted, it defaults to all the available revisions. Do not use this option to hide revisions that were manually merged into the branch. Instead, use '%s merge --record-only', which records that a merge happened (as opposed to a merge which should not happen).""" % NAME, [ "-f", "-r", "-S", # import common opts ]), "unblock": (action_unblock, "unblock [OPTION...] [PATH]", """Revert the effect of '%s block'. 
If --revision is omitted, all the blocked revisions are unblocked""" % NAME, [ "-f", "-r", "-S", # import common opts ]), "uninit": (action_uninit, "uninit [OPTION...] [PATH]", """Remove merge tracking information from PATH. It cleans any kind of merge tracking information (including the list of blocked revisions). If there are multiple sources, use --source to indicate which source you want to forget about.""", [ "-f", "-S", # import common opts ]), } def main(args): global opts # Initialize default options opts = default_opts.copy() logs.clear() optsparser = CommandOpts(global_opts, common_opts, command_table, version="%%prog r%s\n modified: %s\n\n" "Copyright (C) 2004,2005 Awarix Inc.\n" "Copyright (C) 2005, Giovanni Bajo" % (__revision__, __date__)) cmd, args, state = optsparser.parse(args) opts.update(state) source = opts.get("source", None) branch_dir = "." if str(cmd) == "init": if len(args) == 1: source = args[0] elif len(args) > 1: optsparser.error("wrong number of parameters", cmd) elif str(cmd) in command_table.keys(): if len(args) == 1: branch_dir = args[0] elif len(args) > 1: optsparser.error("wrong number of parameters", cmd) else: assert False, "command not handled: %s" % cmd # Validate branch_dir if not is_wc(branch_dir): if str(cmd) == "avail": info = None # it should be noted here that svn info does not error exit # if an invalid target is specified to it (as is # intuitive). so the try, except code is not absolutely # necessary. but, I retain it to indicate the intuitive # handling. 
try: info = get_svninfo(branch_dir) except LaunchError: pass # test that we definitely targeted a subversion directory, # mirroring the purpose of the earlier is_wc() call if info is None or not info.has_key("Node Kind") or info["Node Kind"] != "directory": error('"%s" is neither a valid URL, nor a working directory' % branch_dir) else: error('"%s" is not a subversion working directory' % branch_dir) # give out some hints as to potential pathids PathIdentifier.hint(branch_dir) if source: PathIdentifier.hint(source) # Extract the integration info for the branch_dir branch_props = get_merge_props(branch_dir) # Calculate source_url and source_path report("calculate source path for the branch") if not source: if str(cmd) == "init": cf_source, cf_rev, copy_committed_in_rev = get_copyfrom(branch_dir) if not cf_source: error('no copyfrom info available. ' 'Explicit source argument (-S/--source) required.') opts["source-url"] = get_repo_root(branch_dir) + cf_source opts["source-pathid"] = PathIdentifier.from_target(opts["source-url"]) if not opts["revision"]: opts["revision"] = "1-" + cf_rev else: opts["source-pathid"] = get_default_source(branch_dir, branch_props) opts["source-url"] = opts["source-pathid"].get_url() assert is_pathid(opts["source-pathid"]) assert is_url(opts["source-url"]) else: # The source was given as a command line argument and is stored in # SOURCE. Ensure that the specified source does not end in a /, # otherwise it's easy to have the same source path listed more # than once in the integrated version properties, with and without # trailing /'s. source = rstrip(source, "/") if not is_wc(source) and not is_url(source): # Check if it is a substring of a pathid recorded # within the branch properties. 
found = [] for pathid in branch_props.keys(): if pathid.match_substring(source): found.append(pathid) if len(found) == 1: # (assumes pathid is a repository-relative-path) source_pathid = found[0] source = source_pathid.get_url() else: error('"%s" is neither a valid URL, nor an unambiguous ' 'substring of a repository path, nor a working directory' % source) else: source_pathid = PathIdentifier.from_target(source) source_pathid = PathIdentifier.from_target(source) if str(cmd) == "init" and \ source_pathid == PathIdentifier.from_target("."): error("cannot init integration source path '%s'\n" "Its repository-relative path must differ from the " "repository-relative path of the current directory." % source_pathid) opts["source-pathid"] = source_pathid opts["source-url"] = target_to_url(source) # Sanity check source_url assert is_url(opts["source-url"]) # SVN does not support non-normalized URL (and we should not # have created them) assert opts["source-url"].find("/..") < 0 report('source is "%s"' % opts["source-url"]) # Get previously merged revisions (except when command is init) if str(cmd) != "init": opts["merged-revs"] = merge_props_to_revision_set(branch_props, opts["source-pathid"]) # Perform the action cmd(branch_dir, branch_props) if __name__ == "__main__": try: main(sys.argv[1:]) except LaunchError, (ret, cmd, out): err_msg = "command execution failed (exit code: %d)\n" % ret err_msg += cmd + "\n" err_msg += "".join(out) error(err_msg) except KeyboardInterrupt: # Avoid traceback on CTRL+C print "aborted by user" sys.exit(1)