Merge branch 'nd/ignore-then-not-ignore'
[git] / git-p4.py
1 #!/usr/bin/env python
2 #
3 # git-p4.py -- A tool for bidirectional operation between a Perforce depot and git.
4 #
5 # Author: Simon Hausmann <simon@lst.de>
6 # Copyright: 2007 Simon Hausmann <simon@lst.de>
7 #            2007 Trolltech ASA
8 # License: MIT <http://www.opensource.org/licenses/mit-license.php>
9 #
10 import sys
11 if sys.hexversion < 0x02040000:
12     # The limiter is the subprocess module
13     sys.stderr.write("git-p4: requires Python 2.4 or later.\n")
14     sys.exit(1)
15 import os
16 import optparse
17 import marshal
18 import subprocess
19 import tempfile
20 import time
21 import platform
22 import re
23 import shutil
24 import stat
25
# Fall back to a local definition when this Python's subprocess module
# does not provide CalledProcessError (the import below then fails).
try:
    from subprocess import CalledProcessError
except ImportError:
    # from python2.7:subprocess.py
    # Exception classes used by this module.
    class CalledProcessError(Exception):
        """This exception is raised when a process run by check_call() returns
        a non-zero exit status.  The exit status will be stored in the
        returncode attribute."""
        def __init__(self, returncode, cmd):
            # returncode: the non-zero exit status; cmd: the command that ran
            self.returncode = returncode
            self.cmd = cmd
        def __str__(self):
            return "Command '%s' returned non-zero exit status %d" % (self.cmd, self.returncode)
40
# Module-wide verbosity flag.  When true, the pipe/system helpers echo the
# command they run to stderr and die() raises instead of exiting.
verbose = False

# Only labels/tags matching this will be imported/exported
defaultLabelRegexp = r'[a-zA-Z0-9_\-.]+$'

# Grab changes in blocks of this many revisions, unless otherwise requested
defaultBlockSize = 512
48
def p4_build_cmd(cmd):
    """Return a full p4 command line for the p4 sub-command `cmd`.

    Keeping this in one place makes it easy to hook in the environment
    or other configuration.  Each non-empty git-p4.* setting listed below
    is turned into the matching p4 global option.

    `cmd` may be a string (a shell command string is returned) or a list
    of arguments (an argument list is returned).
    """
    # (git config key, p4 global option), in the order they are emitted
    option_table = [
        ("git-p4.user", "-u"),
        ("git-p4.password", "-P"),
        ("git-p4.port", "-p"),
        ("git-p4.host", "-H"),
        ("git-p4.client", "-c"),
    ]

    argv = ["p4"]
    for config_key, flag in option_table:
        value = gitConfig(config_key)
        if len(value) > 0:
            argv += [flag, value]

    if isinstance(cmd, basestring):
        return ' '.join(argv) + ' ' + cmd

    argv += cmd
    return argv
84
def chdir(path, is_client_path=False):
    """Change directory to `path` and export it as PWD for P4.

       No shell is involved, so PWD has to be set explicitly; P4 uses
       PWD (not getcwd()) to locate relative settings such as
       P4CONFIG=.p4config.

       By default PWD is set to the absolute directory reported by
       os.getcwd() after the change.

       If is_client_path is true, the path came straight from p4 and may
       be a symbolic link.  It is then stored in PWD as given, because
       the os.getcwd() result could make p4 think that PWD is outside
       the client path.
       """
    os.chdir(path)
    if is_client_path:
        pwd = path
    else:
        pwd = os.getcwd()
    os.environ['PWD'] = pwd
106
def die(msg):
    """Abort with `msg`.

    In verbose mode an Exception is raised; otherwise the message is
    written to stderr and the process exits with status 1.
    """
    if not verbose:
        sys.stderr.write(msg + "\n")
        sys.exit(1)
    raise Exception(msg)
113
def write_pipe(c, stdin):
    """Run command `c` and feed the string `stdin` to its standard input.

    A string command is run through the shell, a list is executed
    directly.  Calls die() when the command exits non-zero.  Returns
    whatever the pipe's write() returned.
    """
    if verbose:
        sys.stderr.write('Writing pipe: %s\n' % str(c))

    use_shell = isinstance(c, basestring)
    proc = subprocess.Popen(c, stdin=subprocess.PIPE, shell=use_shell)
    written = proc.stdin.write(stdin)
    proc.stdin.close()
    status = proc.wait()
    if status:
        die('Command failed: %s' % str(c))

    return written
127
def p4_write_pipe(c, stdin):
    """Run the p4 sub-command `c` via write_pipe(), feeding it `stdin`."""
    return write_pipe(p4_build_cmd(c), stdin)
131
def read_pipe(c, ignore_error=False):
    """Run command `c` and return everything it wrote to stdout.

    A string command is run through the shell, a list is executed
    directly.  Unless ignore_error is true, die() is called when the
    command exits non-zero.
    """
    if verbose:
        sys.stderr.write('Reading pipe: %s\n' % str(c))

    use_shell = isinstance(c, basestring)
    proc = subprocess.Popen(c, stdout=subprocess.PIPE, shell=use_shell)
    output = proc.stdout.read()
    status = proc.wait()
    if status and not ignore_error:
        die('Command failed: %s' % str(c))

    return output
144
def p4_read_pipe(c, ignore_error=False):
    """Run the p4 sub-command `c` via read_pipe() and return its stdout."""
    return read_pipe(p4_build_cmd(c), ignore_error)
148
def read_pipe_lines(c):
    """Run command `c` and return its stdout as a list of lines.

    A string command is run through the shell, a list is executed
    directly.  Calls die() when the command exits non-zero.
    """
    if verbose:
        sys.stderr.write('Reading pipe: %s\n' % str(c))

    use_shell = isinstance(c, basestring)
    proc = subprocess.Popen(c, stdout=subprocess.PIPE, shell=use_shell)
    out = proc.stdout
    lines = out.readlines()
    close_status = out.close()
    if close_status or proc.wait():
        die('Command failed: %s' % str(c))

    return lines
161
def p4_read_pipe_lines(c):
    """Run the p4 sub-command `c` and return its output lines."""
    return read_pipe_lines(p4_build_cmd(c))
166
def p4_has_command(cmd):
    """Return True if "p4 help <cmd>" succeeds.

       An error exit means the command does not exist in this version
       of p4.  Output on stdout and stderr is captured and discarded."""
    proc = subprocess.Popen(p4_build_cmd(["help", cmd]),
                            stdout=subprocess.PIPE,
                            stderr=subprocess.PIPE)
    proc.communicate()
    return proc.returncode == 0
175
def p4_has_move_command():
    """Return True if "p4 move -k" is usable.

       Checks that the move command exists, that it supports -k, and
       that it has not been administratively disabled.  The arguments
       must be correct, but the filenames do not have to exist; names
       with wildcards are used so the command fails even if they do."""

    if not p4_has_command("move"):
        return False

    probe = p4_build_cmd(["move", "-k", "@from", "@to"])
    proc = subprocess.Popen(probe, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
    err = proc.communicate()[1]

    # The return code is 1 either way, so inspect the error text instead.
    for marker in ("Invalid option", "disabled"):
        if err.find(marker) >= 0:
            return False

    # assume it failed because @... was invalid changelist
    return True
194
def system(cmd):
    """Run `cmd`, raising CalledProcessError if it exits non-zero.

    A string command is run through the shell, a list is executed
    directly.
    """
    if verbose:
        sys.stderr.write("executing %s\n" % str(cmd))
    status = subprocess.call(cmd, shell=isinstance(cmd, basestring))
    if status:
        raise CalledProcessError(status, cmd)
202
def p4_system(cmd):
    """Run the p4 sub-command `cmd`, raising CalledProcessError on failure."""
    full_cmd = p4_build_cmd(cmd)
    status = subprocess.call(full_cmd, shell=isinstance(full_cmd, basestring))
    if status:
        raise CalledProcessError(status, full_cmd)
210
# Cached result of p4_version_string(); None until first requested.
_p4_version_string = None
def p4_version_string():
    """Return the last line of "p4 -V", which hopefully is the
       interesting version bit.  The result is cached.

       $ p4 -V
       Perforce - The Fast Software Configuration Management System.
       Copyright 1995-2011 Perforce Software.  All rights reserved.
       Rev. P4/NTX86/2011.1/393975 (2011/12/16).
    """
    global _p4_version_string
    if _p4_version_string:
        return _p4_version_string

    version_lines = p4_read_pipe_lines(["-V"])
    _p4_version_string = version_lines[-1].rstrip()
    return _p4_version_string
226
def p4_integrate(src, dest):
    """Run "p4 integrate -Dt" from src to dest (wildcards %-encoded)."""
    source = wildcard_encode(src)
    target = wildcard_encode(dest)
    p4_system(["integrate", "-Dt", source, target])
229
def p4_sync(f, *options):
    """Run "p4 sync" on f, passing any extra options before the path."""
    args = ["sync"]
    args += list(options)
    args.append(wildcard_encode(f))
    p4_system(args)
232
def p4_add(f):
    """Run "p4 add" on f; names containing wildcards are added with -f."""
    args = ["add"]
    # forcibly add file names with wildcards
    if wildcard_present(f):
        args.append("-f")
    args.append(f)
    p4_system(args)
239
def p4_delete(f):
    """Run "p4 delete" on f (wildcards %-encoded)."""
    target = wildcard_encode(f)
    p4_system(["delete", target])
242
def p4_edit(f):
    """Run "p4 edit" on f (wildcards %-encoded)."""
    target = wildcard_encode(f)
    p4_system(["edit", target])
245
def p4_revert(f):
    """Run "p4 revert" on f (wildcards %-encoded)."""
    target = wildcard_encode(f)
    p4_system(["revert", target])
248
def p4_reopen(type, f):
    """Run "p4 reopen -t <type>" on f (wildcards %-encoded)."""
    target = wildcard_encode(f)
    p4_system(["reopen", "-t", type, target])
251
def p4_move(src, dest):
    """Run "p4 move -k" from src to dest (wildcards %-encoded)."""
    source = wildcard_encode(src)
    target = wildcard_encode(dest)
    p4_system(["move", "-k", source, target])
254
def p4_last_change():
    """Return, as an int, the change number reported by "p4 changes -m 1"."""
    newest = p4CmdList(["changes", "-m", "1"])[0]
    return int(newest['change'])
258
def p4_describe(change):
    """Return the dict produced by "p4 describe -s <change>".

       The result is validated: exactly one entry must come back, it
       must not carry a p4 exit code or an error code, and it must
       contain the field "time".  Any violation calls die()."""

    results = p4CmdList(["describe", "-s", str(change)])
    if len(results) != 1:
        die("p4 describe -s %d did not return 1 result: %s" % (change, str(results)))

    info = results[0]

    if "p4ExitCode" in info:
        die("p4 describe -s %d exited with %d: %s" % (change, info["p4ExitCode"],
                                                      str(info)))

    if info.get("code") == "error":
        die("p4 describe -s %d returned error code: %s" % (change, str(info)))

    if "time" not in info:
        die("p4 describe -s %d returned no \"time\": %s" % (change, str(info)))

    return info
281
282 #
283 # Canonicalize the p4 type and return a tuple of the
284 # base type, plus any modifiers.  See "p4 help filetypes"
285 # for a list and explanation.
286 #
def split_p4_type(p4type):
    """Canonicalize a p4 file type and return (base, modifiers).

    Historical type names are first mapped to their modern
    "base+mods" spelling.  The modifiers part is "" when the type has
    none.  See "p4 help filetypes" for a list and explanation.
    """
    historical_types = {
        "ctempobj": "binary+Sw",
        "ctext": "text+C",
        "cxtext": "text+Cx",
        "ktext": "text+k",
        "kxtext": "text+kx",
        "ltext": "text+F",
        "tempobj": "binary+FSw",
        "ubinary": "binary+F",
        "uresource": "resource+F",
        "uxbinary": "binary+Fx",
        "xbinary": "binary+x",
        "xltext": "text+Fx",
        "xtempobj": "binary+Swx",
        "xtext": "text+x",
        "xunicode": "unicode+x",
        "xutf16": "utf16+x",
    }
    canonical = historical_types.get(p4type, p4type)
    pieces = canonical.split("+")
    if len(pieces) > 1:
        return (pieces[0], pieces[1])
    return (pieces[0], "")
316
317 #
318 # return the raw p4 type of a file (text, text+ko, etc)
319 #
def p4_type(f):
    """Return the raw p4 head type of file f (text, text+ko, etc)."""
    fstat = p4CmdList(["fstat", "-T", "headType", wildcard_encode(f)])
    first = fstat[0]
    return first['headType']
323
324 #
325 # Given a type base and modifier, return a regexp matching
326 # the keywords that can be expanded in the file
327 #
def p4_keywords_regexp_for_type(base, type_mods):
    """Return a regexp source matching the expandable keywords, or None.

    Only the base types text, unicode and binary are considered.  The
    "ko" modifier selects the Id/Header keywords, "k" the full keyword
    set; without either, None is returned.  The pattern is laid out
    with whitespace and comments, so compile it with re.VERBOSE.
    """
    if base not in ("text", "unicode", "binary"):
        return None

    if "ko" in type_mods:
        kwords = 'Id|Header'
    elif "k" in type_mods:
        kwords = 'Id|Header|Author|Date|DateTime|Change|File|Revision'
    else:
        return None

    return r"""
            \$              # Starts with a dollar, followed by...
            (%s)            # one of the keywords, followed by...
            (:[^$\n]+)?     # possibly an old expansion, followed by...
            \$              # another dollar
            """ % kwords
346
347 #
348 # Given a file, return a regexp matching the possible
349 # RCS keywords that will be expanded, or None for files
350 # with kw expansion turned off.
351 #
def p4_keywords_regexp_for_file(file):
    """Return the keyword regexp for `file`, based on its p4 type.

    Returns None when the file does not exist locally or when its type
    has keyword expansion turned off.
    """
    if os.path.exists(file):
        base, mods = split_p4_type(p4_type(file))
        return p4_keywords_regexp_for_type(base, mods)
    return None
358
def setP4ExecBit(file, mode):
    """Reopen an already open file so its p4 execute bit matches `mode`.

    For an executable git mode the file is reopened with type "+x".
    Otherwise the currently opened type is fetched and its "x" is
    removed, both from an old-style type prefix and from the modifiers.
    """
    if isModeExec(mode):
        newType = "+x"
    else:
        newType = getP4OpenedType(file)
        newType = re.sub('^([cku]?)x(.*)', '\\1\\2', newType)
        newType = re.sub('(.*?\+.*?)x(.*?)', '\\1\\2', newType)
        # drop a "+" left dangling once the only modifier was removed
        if newType[-1] == "+":
            newType = newType[0:-1]

    p4_reopen(newType, file)
373
def getP4OpenedType(file):
    """Return the perforce file type shown by "p4 opened" for `file`.

    The type is taken from the parenthesised part at the end of the
    output; die() is called when it cannot be found.
    """
    opened = p4_read_pipe(["opened", wildcard_encode(file)])
    found = re.match(".*\((.+)\)( \*exclusive\*)?\r?$", opened)
    if not found:
        die("Could not determine file type for %s (result: '%s')" % (file, opened))
    else:
        return found.group(1)
383
384 # Return the set of all p4 labels
def getP4Labels(depotPaths):
    """Return the set of p4 label names for the given depot path(s).

    `depotPaths` may be a single path string or a list of paths; "..."
    is appended to each before it is passed to "p4 labels".
    """
    if isinstance(depotPaths, basestring):
        depotPaths = [depotPaths]

    cmd = ["labels"]
    for path in depotPaths:
        cmd.append("%s..." % path)

    return set([entry['label'] for entry in p4CmdList(cmd)])
395
396 # Return the set of all git tags
def getGitTags():
    """Return the set of tag names printed by "git tag"."""
    return set([line.strip() for line in read_pipe_lines(["git", "tag"])])
403
def diffTreePattern():
    """Generator that endlessly yields the compiled diff-tree regex.

    The pattern is compiled once per generator and the same object is
    yielded on every step.  This could be a class variable if this and
    parseDiffTreeEntry were a part of a class.
    """
    compiled = re.compile(':(\d+) (\d+) (\w+) (\w+) ([A-Z])(\d+)?\t(.*?)((\t(.*))|$)')
    while 1:
        yield compiled
410
def parseDiffTreeEntry(entry):
    """Parses a single diff tree entry into its component elements.

    See git-diff-tree(1) manpage for details about the format of the diff
    output. This method returns a dictionary with the following elements:

    src_mode - The mode of the source file
    dst_mode - The mode of the destination file
    src_sha1 - The sha1 for the source file
    dst_sha1 - The sha1 for the destination file
    status - The one letter status of the diff (i.e. 'A', 'M', 'D', etc)
    status_score - The score for the status (applicable for 'C' and 'R'
                   statuses). This is None if there is no score.
    src - The path for the source file.
    dst - The path for the destination file. This is only present for
          copy or renames. If it is not present, this is None.

    If the pattern is not matched, None is returned."""

    found = diffTreePattern().next().match(entry)
    if not found:
        return None

    # Regex groups 1..7 map onto these keys in order; the destination
    # path sits in the innermost group, number 10.
    leading_fields = ('src_mode', 'dst_mode', 'src_sha1', 'dst_sha1',
                      'status', 'status_score', 'src')
    parsed = {}
    for index, field in enumerate(leading_fields):
        parsed[field] = found.group(index + 1)
    parsed['dst'] = found.group(10)
    return parsed
443
def isModeExec(mode):
    """Return True if the git mode string denotes an executable file,
    i.e. its last three characters are "755"; otherwise False."""
    return mode.endswith("755")
448
def isModeExecChanged(src_mode, dst_mode):
    """Return True if exactly one of the two git modes is executable."""
    was_exec = isModeExec(src_mode)
    now_exec = isModeExec(dst_mode)
    return was_exec != now_exec
451
def p4CmdList(cmd, stdin=None, stdin_mode='w+b', cb=None):
    """Run "p4 -G <cmd>" and return the objects it emits as a list.

    cmd        -- p4 sub-command, either a string (run through the
                  shell) or a list of arguments.
    stdin      -- optional input for p4: a string, or an iterable of
                  strings that are written one per line.
    stdin_mode -- mode used to open the temporary file holding stdin.
    cb         -- optional callback; when given, each entry is passed
                  to cb() instead of being collected.

    Entries are read from p4's stdout with marshal.load() until EOF.
    If p4 exits non-zero, a final {"p4ExitCode": code} entry is
    appended to the returned list.
    """

    if isinstance(cmd,basestring):
        cmd = "-G " + cmd
        expand = True
    else:
        cmd = ["-G"] + cmd
        expand = False

    cmd = p4_build_cmd(cmd)
    if verbose:
        sys.stderr.write("Opening pipe: %s\n" % str(cmd))

    # Use a temporary file to avoid deadlocks without
    # subprocess.communicate(), which would put another copy
    # of stdout into memory.
    stdin_file = None
    if stdin is not None:
        stdin_file = tempfile.TemporaryFile(prefix='p4-stdin', mode=stdin_mode)

    result = []
    try:
        if stdin_file is not None:
            if isinstance(stdin,basestring):
                stdin_file.write(stdin)
            else:
                for i in stdin:
                    stdin_file.write(i + '\n')
            stdin_file.flush()
            stdin_file.seek(0)

        p4 = subprocess.Popen(cmd,
                              shell=expand,
                              stdin=stdin_file,
                              stdout=subprocess.PIPE)

        try:
            while True:
                entry = marshal.load(p4.stdout)
                if cb is not None:
                    cb(entry)
                else:
                    result.append(entry)
        except EOFError:
            pass
        exitCode = p4.wait()
    finally:
        # Release the temporary file explicitly instead of leaving it
        # to garbage collection, also when an error interrupts the run.
        if stdin_file is not None:
            stdin_file.close()

    if exitCode != 0:
        entry = {}
        entry["p4ExitCode"] = exitCode
        result.append(entry)

    return result
501
def p4Cmd(cmd):
    """Run p4CmdList(cmd) and merge all returned entries into one dict.

    Entries are merged in order, so later entries overwrite keys of
    earlier ones.
    """
    merged = {}
    for entry in p4CmdList(cmd):
        merged.update(entry)
    return merged
508
def p4Where(depotPath):
    """Return the client-side path that "p4 where" maps depotPath to.

    A trailing "/" is added to depotPath if missing and "..." is
    appended for the query.  Returns "" when no suitable mapping is
    found or p4 reports an error.  A trailing "..." is removed from
    the returned client path.
    """
    if not depotPath.endswith("/"):
        depotPath += "/"
    wildcardPath = depotPath + "..."

    chosen = None
    for entry in p4CmdList(["where", wildcardPath]):
        if "depotFile" in entry:
            # Search for the base client side depot path, as long as it starts with the branch's P4 path.
            # The base path always ends with "/...".
            depotFile = entry["depotFile"]
            if depotFile.startswith(depotPath) and depotFile.endswith("/..."):
                chosen = entry
                break
        elif "data" in entry:
            text = entry.get("data")
            if text[:text.find(" ")] == depotPath:
                chosen = entry
                break

    if chosen is None or chosen["code"] == "error":
        return ""

    if "path" in chosen:
        clientPath = chosen.get("path")
    elif "data" in chosen:
        text = chosen.get("data")
        # the client path is whatever follows the last space
        clientPath = text[text.rfind(" ") + 1:]
    else:
        clientPath = ""

    if clientPath.endswith("..."):
        clientPath = clientPath[:-3]
    return clientPath
543
def currentGitBranch():
    """Return the second space-separated word of "git name-rev HEAD"."""
    words = read_pipe("git name-rev HEAD").split(" ")
    return words[1].strip()
546
def isValidGitDir(path):
    """Return True if `path` contains HEAD, refs and objects entries."""
    for required in ("/HEAD", "/refs", "/objects"):
        if not os.path.exists(path + required):
            return False
    return True
552
def parseRevision(ref):
    """Return the stripped output of "git rev-parse <ref>"."""
    resolved = read_pipe("git rev-parse %s" % ref)
    return resolved.strip()
555
def branchExists(ref):
    """Return True if "git rev-parse -q --verify <ref>" prints anything.

    Errors from git are ignored, so an unknown ref yields False.
    """
    cmd = ["git", "rev-parse", "-q", "--verify", ref]
    output = read_pipe(cmd, ignore_error=True)
    return len(output) > 0
560
def extractLogMessageFromGitCommit(commit):
    """Return the log message of `commit`.

    Reads "git cat-file commit" and returns every line after the first
    empty line, concatenated.
    """
    ## fixme: title is first line of commit, not 1st paragraph.
    body = []
    in_body = False
    for line in read_pipe_lines("git cat-file commit %s" % commit):
        if in_body:
            body.append(line)
        elif len(line) == 1:
            # a line holding just its terminator separates header and body
            in_body = True
    return "".join(body)
574
def extractSettingsGitLog(log):
    """Parse the "[git-p4: key = value: key = value]" lines of a log.

    Returns a dict of the settings found.  Values wrapped in double
    quotes are unquoted.  If "depot-paths" (or, failing that,
    "depot-path") is set, values['depot-paths'] holds its
    comma-separated entries as a list.
    """
    settings = {}
    for raw_line in log.split("\n"):
        found = re.search(r"^ *\[git-p4: (.*)\]$", raw_line.strip())
        if found is None:
            continue

        for assignment in found.group(1).split(':'):
            pieces = assignment.split('=')
            name = pieces[0].strip()
            # everything after the first "=" belongs to the value
            value = '='.join(pieces[1:]).strip()
            if value.startswith('"') and value.endswith('\"'):
                value = value[1:-1]
            settings[name] = value

    depot = settings.get("depot-paths") or settings.get("depot-path")
    if depot:
        settings['depot-paths'] = depot.split(',')
    return settings
599
def gitBranchExists(branch):
    """Return True if "git rev-parse <branch>" exits with status 0.

    The command's stdout and stderr are captured and discarded.
    """
    proc = subprocess.Popen(["git", "rev-parse", branch],
                            stderr=subprocess.PIPE, stdout=subprocess.PIPE)
    status = proc.wait()
    return status == 0
604
# Cache of git config lookups, keyed by config variable name.
_gitConfig = {}

def gitConfig(key):
    """Return the stripped output of "git config <key>", cached per key.

    Errors from git are ignored, so an unset key yields "".
    """
    try:
        return _gitConfig[key]
    except KeyError:
        pass

    output = read_pipe(["git", "config", key], ignore_error=True)
    _gitConfig[key] = output.strip()
    return _gitConfig[key]
613
def gitConfigBool(key):
    """Return a bool, using git config --bool.  It is True only if the
       variable is set to true, and False if set to false or not present
       in the config.  The result is cached per key."""

    if key in _gitConfig:
        return _gitConfig[key]

    output = read_pipe(["git", "config", "--bool", key], ignore_error=True)
    _gitConfig[key] = (output.strip() == "true")
    return _gitConfig[key]
625
def gitConfigList(key):
    """Return all values of a multi-valued git config key as a list.

    Runs "git config --get-all <key>" (errors ignored) and caches the
    result per key.  An unset key yields an empty list.
    """
    if key not in _gitConfig:
        s = read_pipe(["git", "config", "--get-all", key], ignore_error=True)
        # splitlines() copes with both "\n" and "\r\n" regardless of the
        # platform's os.linesep, and returns [] (not ['']) for no output.
        _gitConfig[key] = s.strip().splitlines()
    return _gitConfig[key]
631
def p4BranchesInGit(branchesAreInRemotes=True):
    """Find all the branches whose names start with "p4/", looking
       in remotes or heads as specified by the argument.  Return
       a dictionary of { branch: revision } for each one found.
       The branch names are the short names, without any
       "p4/" prefix."""

    if branchesAreInRemotes:
        selector = "--remotes"
    else:
        selector = "--branches"
    cmdline = "git rev-parse --symbolic " + selector

    found = {}
    for raw in read_pipe_lines(cmdline):
        ref = raw.strip()

        # only import to p4/, and skip the special symbolic ref to
        # p4/master
        if ref == "p4/HEAD" or not ref.startswith('p4/'):
            continue

        # key is the name with the p4/ prefix stripped off
        found[ref[len("p4/"):]] = parseRevision(ref)

    return found
663
def branch_exists(branch):
    """Make sure that the given ref name really exists.

    True only when "git rev-parse --symbolic --verify" succeeds and
    echoes back exactly the given name."""

    argv = ["git", "rev-parse", "--symbolic", "--verify", branch]
    proc = subprocess.Popen(argv, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
    stdout_data = proc.communicate()[0]
    if proc.returncode:
        return False
    # expect exactly one line of output: the branch name
    return stdout_data.rstrip() == branch
674
def findUpstreamBranchPoint(head = "HEAD"):
    """Walk back from `head` to the nearest commit imported from p4.

    Each first-parent ancestor's log is checked for git-p4 settings
    whose depot paths match the tip of one of the p4 remote branches.
    Returns [branch name, settings] for the first match, or
    ["", settings of the last commit examined] when none is found.
    """
    # map from depot-path to branch name
    branchByDepotPath = {}
    for name, tip in p4BranchesInGit().items():
        tipSettings = extractSettingsGitLog(extractLogMessageFromGitCommit(tip))
        if "depot-paths" in tipSettings:
            joined = ",".join(tipSettings["depot-paths"])
            branchByDepotPath[joined] = "remotes/p4/" + name

    settings = None
    for parent in range(65535):
        commit = "%s~%s" % (head, parent)
        settings = extractSettingsGitLog(extractLogMessageFromGitCommit(commit))
        if "depot-paths" not in settings:
            continue
        joined = ",".join(settings["depot-paths"])
        if joined in branchByDepotPath:
            return [branchByDepotPath[joined], settings]

    return ["", settings]
701
def createOrUpdateBranchesFromOrigin(localRefPrefix = "refs/remotes/p4/", silent=True):
    """Mirror origin/p4/* remote branches under localRefPrefix.

    For every origin/p4/<name> whose tip carries git-p4 settings, the
    ref localRefPrefix + <name> is created if missing, or moved forward
    when both were imported from the same depot paths and the origin
    tip records a higher p4 change number.
    """
    if not silent:
        print ("Creating/updating branch(es) in %s based on origin branch(es)"
               % localRefPrefix)

    originPrefix = "origin/p4/"

    for raw in read_pipe_lines("git rev-parse --symbolic --remotes"):
        originHead = raw.strip()
        if originHead.endswith("HEAD") or not originHead.startswith(originPrefix):
            continue

        remoteHead = localRefPrefix + originHead[len(originPrefix):]

        original = extractSettingsGitLog(extractLogMessageFromGitCommit(originHead))
        if not ('depot-paths' in original and 'change' in original):
            continue

        update = False
        if gitBranchExists(remoteHead):
            settings = extractSettingsGitLog(extractLogMessageFromGitCommit(remoteHead))
            if 'change' in settings:
                if settings['depot-paths'] != original['depot-paths']:
                    print ("Ignoring: %s was imported from %s while "
                           "%s was imported from %s"
                           % (originHead, ','.join(original['depot-paths']),
                              remoteHead, ','.join(settings['depot-paths'])))
                else:
                    originP4Change = int(original['change'])
                    p4Change = int(settings['change'])
                    if originP4Change > p4Change:
                        print ("%s (%s) is newer than %s (%s). "
                               "Updating p4 branch from origin."
                               % (originHead, originP4Change,
                                  remoteHead, p4Change))
                        update = True
        else:
            if verbose:
                print ("creating %s" % remoteHead)
            update = True

        if update:
            system("git update-ref %s %s" % (remoteHead, originHead))
748
def originP4BranchesExist():
    """Return True if origin, origin/p4 or origin/p4/master resolves."""
    for ref in ("origin", "origin/p4", "origin/p4/master"):
        if gitBranchExists(ref):
            return True
    return False
751
752
def p4ParseNumericChangeRange(parts):
    """Convert a split "@start,end" range into a (start, end) int tuple.

    parts[0] is the start with its leading character dropped; parts[1]
    is the end, where '#head' stands for the latest change on the
    server.  int() raises ValueError for non-numeric parts.
    """
    start = int(parts[0][1:])
    upper = parts[1]
    if upper == '#head':
        end = p4_last_change()
    else:
        end = int(upper)
    return (start, end)
761
def chooseBlockSize(blockSize):
    """Return blockSize if it is set (truthy), else defaultBlockSize."""
    return blockSize or defaultBlockSize
767
def p4ChangesForPaths(depotPaths, changeRange, requestedBlockSize):
    """Return the sorted list of change numbers touching depotPaths.

    depotPaths         -- non-empty list of depot path prefixes.
    changeRange        -- "@start,end" revision range, or None/"" for
                          everything from change 1 to the latest.
    requestedBlockSize -- number of changes to query per "p4 changes"
                          call, or a false value for the default.

    Numeric ranges are queried in blocks to avoid hitting server-side
    limits (maxrows, maxscanresults).  Non-numeric ranges are passed to
    p4 as-is in a single query; combining them with an explicit block
    size calls die().
    """
    assert depotPaths

    # Parse the change range into start and end. Try to find integer
    # revision ranges as these can be broken up into blocks. But if
    # that doesn't work, fall back to using the raw revision specifier
    # strings, without using block mode.

    if changeRange is None or changeRange == '':
        changeStart = 1
        changeEnd = p4_last_change()
        block_size = chooseBlockSize(requestedBlockSize)
    else:
        parts = changeRange.split(',')
        assert len(parts) == 2
        try:
            (changeStart, changeEnd) = p4ParseNumericChangeRange(parts)
            block_size = chooseBlockSize(requestedBlockSize)
        except ValueError:
            # Only a failed int() conversion means "non-numeric range";
            # anything else (including SystemExit) must propagate.
            changeStart = parts[0][1:]
            changeEnd = parts[1]
            if requestedBlockSize:
                die("cannot use --changes-block-size with non-numeric revisions")
            block_size = None

    # Accumulate change numbers in a set to avoid duplicates
    changes = set()

    for p in depotPaths:
        # Every path has to be scanned over the whole range, so restart
        # from the beginning instead of continuing where the previous
        # path's block loop stopped.
        start = changeStart

        # Retrieve changes a block at a time, to prevent running
        # into a MaxResults/MaxScanRows error from the server.
        while True:
            if block_size:
                end = min(changeEnd, start + block_size)
                revisionRange = "%d,%d" % (start, end)
            else:
                revisionRange = "%s,%s" % (start, changeEnd)

            cmd = ['changes', "%s...@%s" % (p, revisionRange)]

            for line in p4_read_pipe_lines(cmd):
                changes.add(int(line.split(" ")[1]))

            if not block_size:
                break

            if end >= changeEnd:
                break

            start = end + 1

    return sorted(changes)
827
def p4PathStartsWith(path, prefix):
    """Return True if `path` starts with `prefix`.

    This method tries to remedy a potential mixed-case issue:

    If UserA adds  //depot/DirA/file1
    and UserB adds //depot/dira/file2

    we may or may not have a problem. If you have core.ignorecase=true,
    we treat DirA and dira as the same directory, i.e. the comparison
    is done case-insensitively.
    """
    if not gitConfigBool("core.ignorecase"):
        return path.startswith(prefix)
    return path.lower().startswith(prefix.lower())
839
def getClientSpec():
    """Look at the p4 client spec, create a View() object that contains
       all the mappings, and return it.  Calls die() if "client -o"
       does not return exactly one entry or a view line is missing."""

    specs = p4CmdList("client -o")
    if len(specs) != 1:
        die('Output from "client -o" is %d lines, expecting 1' %
            len(specs))

    # dictionary of all client parameters
    spec = specs[0]

    # the //client/ name
    client_name = spec["Client"]

    # just the keys that start with "View"
    view_keys = [ name for name in spec.keys() if name.startswith("View") ]

    # hold this new View
    view = View(client_name)

    # append the lines, in order, to the view; the keys are expected to
    # be numbered consecutively from View0
    for index in range(len(view_keys)):
        key = "View%d" % index
        if key not in view_keys:
            die("Expected view key %s missing" % key)
        view.append(spec[key])

    return view
869
def getClientRoot():
    """Grab the client directory: the "Root" field of "p4 client -o".

       Calls die() if the command does not return exactly one entry or
       the entry has no "Root"."""

    specs = p4CmdList("client -o")
    count = len(specs)
    if count != 1:
        die('Output from "client -o" is %d lines, expecting 1' % count)

    spec = specs[0]
    if "Root" not in spec:
        die('Client has no "Root"')

    return spec["Root"]
882
883 #
884 # P4 wildcards are not allowed in filenames.  P4 complains
885 # if you simply add them, but you can force it with "-f", in
886 # which case it translates them into %xx encoding internally.
887 #
def wildcard_decode(path):
    """Turn p4's %xx escapes for *, #, @ and % back into the characters.

    Only these four are handled.  %25 is done last so that fixing it
    does not inadvertently create new %-escapes.  On Windows %2A is
    left alone: a filename there cannot contain *, and it is untested
    what p4 would do in such a case.
    """
    substitutions = []
    if platform.system() != "Windows":
        substitutions.append(("%2A", "*"))
    substitutions.append(("%23", "#"))
    substitutions.append(("%40", "@"))
    substitutions.append(("%25", "%"))

    for escaped, char in substitutions:
        path = path.replace(escaped, char)
    return path
899
def wildcard_encode(path):
    """Replace the p4 wildcard characters %, *, # and @ by %xx escapes."""
    # do % first to avoid double-encoding the %s introduced here
    for char, escaped in (("%", "%25"), ("*", "%2A"), ("#", "%23"), ("@", "%40")):
        path = path.replace(char, escaped)
    return path
907
def wildcard_present(path):
    """Return True if path contains any of the characters * # @ %."""
    return re.search("[*#@%]", path) is not None
911
class Command:
    """Holds the default usage string and the needsGit/verbose flags."""

    def __init__(self):
        # not verbose, and git is needed, unless changed after construction
        self.verbose = False
        self.needsGit = True
        self.usage = "usage: %prog [options]"
917
class P4UserMap:
    """Maps p4 user ids to "Full Name <email>" strings and emails to ids.

    The id -> name map (self.users) can be loaded from a cache file in
    the user's home directory; the email -> id map (self.emails) is only
    filled in when the data is fetched with "p4 users".
    """

    def __init__(self):
        # True once the maps were populated by getUserMapFromPerforceServer()
        self.userMapFromPerforceServer = False
        # Cached result of p4UserId()
        self.myP4UserId = None

    def p4UserId(self):
        """Return the "User" field reported by "p4 user -o".

        The value is remembered in self.myP4UserId so p4 is asked only
        once.  Dies if no record carries a "User" key.
        """
        if self.myP4UserId:
            return self.myP4UserId

        for r in p4CmdList("user -o"):
            if 'User' in r:
                self.myP4UserId = r['User']
                return r['User']
        die("Could not find your p4 user id")

    def p4UserIsMe(self, p4User):
        """Return True if the given p4 user is actually me."""
        me = self.p4UserId()
        return bool(p4User) and p4User == me

    def getUserCacheFilename(self):
        """Return the path of the user cache file below $HOME.

        Falls back to %USERPROFILE% when HOME is not set.
        """
        home = os.environ.get("HOME", os.environ.get("USERPROFILE"))
        return home + "/.gitp4-usercache.txt"

    def getUserMapFromPerforceServer(self):
        """Fill self.users / self.emails from "p4 users" and write the cache.

        Does nothing if the maps were already fetched from the server.
        """
        if self.userMapFromPerforceServer:
            return
        self.users = {}
        self.emails = {}

        for output in p4CmdList("users"):
            if "User" not in output:
                continue
            self.users[output["User"]] = output["FullName"] + " <" + output["Email"] + ">"
            self.emails[output["Email"]] = output["User"]

        # One "user<TAB>name" line per entry; tabs inside the fields are
        # turned into spaces so the tab stays an unambiguous separator.
        s = ''.join(["%s\t%s\n" % (key.expandtabs(1), val.expandtabs(1))
                     for (key, val) in self.users.items()])

        # Close the cache explicitly so the data is flushed even on
        # interpreters that do not close files as soon as they become
        # unreferenced.
        cache = open(self.getUserCacheFilename(), "wb")
        try:
            cache.write(s)
        finally:
            cache.close()
        self.userMapFromPerforceServer = True

    def loadUserMapFromCache(self):
        """Fill self.users from the cache file.

        If the cache cannot be opened or read (IOError), the map is
        fetched from the server instead.  Note that self.emails is not
        populated when the cache is used.
        """
        self.users = {}
        self.userMapFromPerforceServer = False
        try:
            cache = open(self.getUserCacheFilename(), "rb")
            try:
                lines = cache.readlines()
            finally:
                cache.close()
        except IOError:
            self.getUserMapFromPerforceServer()
            return

        for line in lines:
            entry = line.strip().split("\t")
            if len(entry) < 2:
                # blank or damaged line: ignore it rather than crash
                continue
            self.users[entry[0]] = entry[1]
978
class P4Debug(Command):
    """Command that prints every element p4CmdList() returns for its args."""

    def __init__(self):
        Command.__init__(self)
        self.needsGit = False
        self.description = "A tool to debug the output of p4 -G."
        self.options = []

    def run(self, args):
        """Print each result element preceded by its index; return True."""
        for index, element in enumerate(p4CmdList(args)):
            print('Element: %d' % index)
            print(element)
        return True
993
class P4RollBack(Command):
    """Rewind imported branches until they are at or below a given change.

    With --local the branches under refs/heads/ are processed, otherwise
    the p4/* branches under refs/remotes/ (except p4/HEAD).
    """

    def __init__(self):
        Command.__init__(self)
        self.description = "A tool to debug the multi-branch import. Don't use :)"
        self.rollbackLocalBranches = False
        self.options = [
            optparse.make_option("--local", dest="rollbackLocalBranches", action="store_true")
        ]

    def run(self, args):
        """Roll back to the change number given as the single argument.

        Returns False when the argument count is wrong, True otherwise.
        """
        if len(args) != 1:
            return False
        maxChange = int(args[0])

        if "p4ExitCode" in p4Cmd("changes -m 1"):
            die("Problems executing p4")

        if self.rollbackLocalBranches:
            refPrefix = "refs/heads/"
            branchNames = read_pipe_lines("git rev-parse --symbolic --branches")
        else:
            refPrefix = "refs/remotes/"
            branchNames = read_pipe_lines("git rev-parse --symbolic --remotes")

        for rawName in branchNames:
            # the names still carry their trailing newline at this point
            isImported = rawName.startswith("p4/") and rawName != "p4/HEAD\n"
            if not (self.rollbackLocalBranches or isImported):
                continue

            ref = refPrefix + rawName.strip()
            settings = extractSettingsGitLog(extractLogMessageFromGitCommit(ref))
            depotPaths = settings['depot-paths']
            change = settings['change']

            # No change at or before maxChange touches these paths:
            # the branch did not exist yet, so drop the ref entirely.
            pathSpecs = ' '.join(['%s...@%s' % (p, maxChange) for p in depotPaths])
            if len(p4Cmd("changes -m 1 " + pathSpecs)) == 0:
                print("Branch %s did not exist at change %s, deleting." % (ref, maxChange))
                system("git update-ref -d %s `git rev-parse %s`" % (ref, ref))
                continue

            # Step the ref back one commit at a time until its recorded
            # change number is no longer above maxChange.
            rewound = False
            while change and int(change) > maxChange:
                rewound = True
                if self.verbose:
                    print("%s is at %s ; rewinding towards %s" % (ref, change, maxChange))
                system("git update-ref %s \"%s^\"" % (ref, ref))
                settings = extractSettingsGitLog(extractLogMessageFromGitCommit(ref))
                depotPaths = settings['depot-paths']
                change = settings['change']

            if rewound:
                print("%s rewound to %s" % (ref, change))

        return True
1052
1053 class P4Submit(Command, P4UserMap):
1054
1055     conflict_behavior_choices = ("ask", "skip", "quit")
1056
1057     def __init__(self):
1058         Command.__init__(self)
1059         P4UserMap.__init__(self)
1060         self.options = [
1061                 optparse.make_option("--origin", dest="origin"),
1062                 optparse.make_option("-M", dest="detectRenames", action="store_true"),
1063                 # preserve the user, requires relevant p4 permissions
1064                 optparse.make_option("--preserve-user", dest="preserveUser", action="store_true"),
1065                 optparse.make_option("--export-labels", dest="exportLabels", action="store_true"),
1066                 optparse.make_option("--dry-run", "-n", dest="dry_run", action="store_true"),
1067                 optparse.make_option("--prepare-p4-only", dest="prepare_p4_only", action="store_true"),
1068                 optparse.make_option("--conflict", dest="conflict_behavior",
1069                                      choices=self.conflict_behavior_choices),
1070                 optparse.make_option("--branch", dest="branch"),
1071         ]
1072         self.description = "Submit changes from git to the perforce depot."
1073         self.usage += " [name of git branch to submit into perforce depot]"
1074         self.origin = ""
1075         self.detectRenames = False
1076         self.preserveUser = gitConfigBool("git-p4.preserveUser")
1077         self.dry_run = False
1078         self.prepare_p4_only = False
1079         self.conflict_behavior = None
1080         self.isWindows = (platform.system() == "Windows")
1081         self.exportLabels = False
1082         self.p4HasMoveCommand = p4_has_move_command()
1083         self.branch = None
1084
1085     def check(self):
1086         if len(p4CmdList("opened ...")) > 0:
1087             die("You have files opened with perforce! Close them before starting the sync.")
1088
1089     def separate_jobs_from_description(self, message):
1090         """Extract and return a possible Jobs field in the commit
1091            message.  It goes into a separate section in the p4 change
1092            specification.
1093
1094            A jobs line starts with "Jobs:" and looks like a new field
1095            in a form.  Values are white-space separated on the same
1096            line or on following lines that start with a tab.
1097
1098            This does not parse and extract the full git commit message
1099            like a p4 form.  It just sees the Jobs: line as a marker
1100            to pass everything from then on directly into the p4 form,
1101            but outside the description section.
1102
1103            Return a tuple (stripped log message, jobs string)."""
1104
1105         m = re.search(r'^Jobs:', message, re.MULTILINE)
1106         if m is None:
1107             return (message, None)
1108
1109         jobtext = message[m.start():]
1110         stripped_message = message[:m.start()].rstrip()
1111         return (stripped_message, jobtext)
1112
1113     def prepareLogMessage(self, template, message, jobs):
1114         """Edits the template returned from "p4 change -o" to insert
1115            the message in the Description field, and the jobs text in
1116            the Jobs field."""
1117         result = ""
1118
1119         inDescriptionSection = False
1120
1121         for line in template.split("\n"):
1122             if line.startswith("#"):
1123                 result += line + "\n"
1124                 continue
1125
1126             if inDescriptionSection:
1127                 if line.startswith("Files:") or line.startswith("Jobs:"):
1128                     inDescriptionSection = False
1129                     # insert Jobs section
1130                     if jobs:
1131                         result += jobs + "\n"
1132                 else:
1133                     continue
1134             else:
1135                 if line.startswith("Description:"):
1136                     inDescriptionSection = True
1137                     line += "\n"
1138                     for messageLine in message.split("\n"):
1139                         line += "\t" + messageLine + "\n"
1140
1141             result += line + "\n"
1142
1143         return result
1144
1145     def patchRCSKeywords(self, file, pattern):
1146         # Attempt to zap the RCS keywords in a p4 controlled file matching the given pattern
1147         (handle, outFileName) = tempfile.mkstemp(dir='.')
1148         try:
1149             outFile = os.fdopen(handle, "w+")
1150             inFile = open(file, "r")
1151             regexp = re.compile(pattern, re.VERBOSE)
1152             for line in inFile.readlines():
1153                 line = regexp.sub(r'$\1$', line)
1154                 outFile.write(line)
1155             inFile.close()
1156             outFile.close()
1157             # Forcibly overwrite the original file
1158             os.unlink(file)
1159             shutil.move(outFileName, file)
1160         except:
1161             # cleanup our temporary file
1162             os.unlink(outFileName)
1163             print "Failed to strip RCS keywords in %s" % file
1164             raise
1165
1166         print "Patched up RCS keywords in %s" % file
1167
1168     def p4UserForCommit(self,id):
1169         # Return the tuple (perforce user,git email) for a given git commit id
1170         self.getUserMapFromPerforceServer()
1171         gitEmail = read_pipe(["git", "log", "--max-count=1",
1172                               "--format=%ae", id])
1173         gitEmail = gitEmail.strip()
1174         if not self.emails.has_key(gitEmail):
1175             return (None,gitEmail)
1176         else:
1177             return (self.emails[gitEmail],gitEmail)
1178
1179     def checkValidP4Users(self,commits):
1180         # check if any git authors cannot be mapped to p4 users
1181         for id in commits:
1182             (user,email) = self.p4UserForCommit(id)
1183             if not user:
1184                 msg = "Cannot find p4 user for email %s in commit %s." % (email, id)
1185                 if gitConfigBool("git-p4.allowMissingP4Users"):
1186                     print "%s" % msg
1187                 else:
1188                     die("Error: %s\nSet git-p4.allowMissingP4Users to true to allow this." % msg)
1189
1190     def lastP4Changelist(self):
1191         # Get back the last changelist number submitted in this client spec. This
1192         # then gets used to patch up the username in the change. If the same
1193         # client spec is being used by multiple processes then this might go
1194         # wrong.
1195         results = p4CmdList("client -o")        # find the current client
1196         client = None
1197         for r in results:
1198             if r.has_key('Client'):
1199                 client = r['Client']
1200                 break
1201         if not client:
1202             die("could not get client spec")
1203         results = p4CmdList(["changes", "-c", client, "-m", "1"])
1204         for r in results:
1205             if r.has_key('change'):
1206                 return r['change']
1207         die("Could not get changelist number for last submit - cannot patch up user details")
1208
1209     def modifyChangelistUser(self, changelist, newUser):
1210         # fixup the user field of a changelist after it has been submitted.
1211         changes = p4CmdList("change -o %s" % changelist)
1212         if len(changes) != 1:
1213             die("Bad output from p4 change modifying %s to user %s" %
1214                 (changelist, newUser))
1215
1216         c = changes[0]
1217         if c['User'] == newUser: return   # nothing to do
1218         c['User'] = newUser
1219         input = marshal.dumps(c)
1220
1221         result = p4CmdList("change -f -i", stdin=input)
1222         for r in result:
1223             if r.has_key('code'):
1224                 if r['code'] == 'error':
1225                     die("Could not modify user field of changelist %s to %s:%s" % (changelist, newUser, r['data']))
1226             if r.has_key('data'):
1227                 print("Updated user field for changelist %s to %s" % (changelist, newUser))
1228                 return
1229         die("Could not modify user field of changelist %s to %s" % (changelist, newUser))
1230
1231     def canChangeChangelists(self):
1232         # check to see if we have p4 admin or super-user permissions, either of
1233         # which are required to modify changelists.
1234         results = p4CmdList(["protects", self.depotPath])
1235         for r in results:
1236             if r.has_key('perm'):
1237                 if r['perm'] == 'admin':
1238                     return 1
1239                 if r['perm'] == 'super':
1240                     return 1
1241         return 0
1242
1243     def prepareSubmitTemplate(self):
1244         """Run "p4 change -o" to grab a change specification template.
1245            This does not use "p4 -G", as it is nice to keep the submission
1246            template in original order, since a human might edit it.
1247
1248            Remove lines in the Files section that show changes to files
1249            outside the depot path we're committing into."""
1250
1251         template = ""
1252         inFilesSection = False
1253         for line in p4_read_pipe_lines(['change', '-o']):
1254             if line.endswith("\r\n"):
1255                 line = line[:-2] + "\n"
1256             if inFilesSection:
1257                 if line.startswith("\t"):
1258                     # path starts and ends with a tab
1259                     path = line[1:]
1260                     lastTab = path.rfind("\t")
1261                     if lastTab != -1:
1262                         path = path[:lastTab]
1263                         if not p4PathStartsWith(path, self.depotPath):
1264                             continue
1265                 else:
1266                     inFilesSection = False
1267             else:
1268                 if line.startswith("Files:"):
1269                     inFilesSection = True
1270
1271             template += line
1272
1273         return template
1274
1275     def edit_template(self, template_file):
1276         """Invoke the editor to let the user change the submission
1277            message.  Return true if okay to continue with the submit."""
1278
1279         # if configured to skip the editing part, just submit
1280         if gitConfigBool("git-p4.skipSubmitEdit"):
1281             return True
1282
1283         # look at the modification time, to check later if the user saved
1284         # the file
1285         mtime = os.stat(template_file).st_mtime
1286
1287         # invoke the editor
1288         if os.environ.has_key("P4EDITOR") and (os.environ.get("P4EDITOR") != ""):
1289             editor = os.environ.get("P4EDITOR")
1290         else:
1291             editor = read_pipe("git var GIT_EDITOR").strip()
1292         system(["sh", "-c", ('%s "$@"' % editor), editor, template_file])
1293
1294         # If the file was not saved, prompt to see if this patch should
1295         # be skipped.  But skip this verification step if configured so.
1296         if gitConfigBool("git-p4.skipSubmitEditCheck"):
1297             return True
1298
1299         # modification time updated means user saved the file
1300         if os.stat(template_file).st_mtime > mtime:
1301             return True
1302
1303         while True:
1304             response = raw_input("Submit template unchanged. Submit anyway? [y]es, [n]o (skip this patch) ")
1305             if response == 'y':
1306                 return True
1307             if response == 'n':
1308                 return False
1309
1310     def get_diff_description(self, editedFiles, filesToAdd):
1311         # diff
1312         if os.environ.has_key("P4DIFF"):
1313             del(os.environ["P4DIFF"])
1314         diff = ""
1315         for editedFile in editedFiles:
1316             diff += p4_read_pipe(['diff', '-du',
1317                                   wildcard_encode(editedFile)])
1318
1319         # new file diff
1320         newdiff = ""
1321         for newFile in filesToAdd:
1322             newdiff += "==== new file ====\n"
1323             newdiff += "--- /dev/null\n"
1324             newdiff += "+++ %s\n" % newFile
1325             f = open(newFile, "r")
1326             for line in f.readlines():
1327                 newdiff += "+" + line
1328             f.close()
1329
1330         return (diff + newdiff).replace('\r\n', '\n')
1331
1332     def applyCommit(self, id):
1333         """Apply one commit, return True if it succeeded."""
1334
1335         print "Applying", read_pipe(["git", "show", "-s",
1336                                      "--format=format:%h %s", id])
1337
1338         (p4User, gitEmail) = self.p4UserForCommit(id)
1339
1340         diff = read_pipe_lines("git diff-tree -r %s \"%s^\" \"%s\"" % (self.diffOpts, id, id))
1341         filesToAdd = set()
1342         filesToDelete = set()
1343         editedFiles = set()
1344         pureRenameCopy = set()
1345         filesToChangeExecBit = {}
1346
1347         for line in diff:
1348             diff = parseDiffTreeEntry(line)
1349             modifier = diff['status']
1350             path = diff['src']
1351             if modifier == "M":
1352                 p4_edit(path)
1353                 if isModeExecChanged(diff['src_mode'], diff['dst_mode']):
1354                     filesToChangeExecBit[path] = diff['dst_mode']
1355                 editedFiles.add(path)
1356             elif modifier == "A":
1357                 filesToAdd.add(path)
1358                 filesToChangeExecBit[path] = diff['dst_mode']
1359                 if path in filesToDelete:
1360                     filesToDelete.remove(path)
1361             elif modifier == "D":
1362                 filesToDelete.add(path)
1363                 if path in filesToAdd:
1364                     filesToAdd.remove(path)
1365             elif modifier == "C":
1366                 src, dest = diff['src'], diff['dst']
1367                 p4_integrate(src, dest)
1368                 pureRenameCopy.add(dest)
1369                 if diff['src_sha1'] != diff['dst_sha1']:
1370                     p4_edit(dest)
1371                     pureRenameCopy.discard(dest)
1372                 if isModeExecChanged(diff['src_mode'], diff['dst_mode']):
1373                     p4_edit(dest)
1374                     pureRenameCopy.discard(dest)
1375                     filesToChangeExecBit[dest] = diff['dst_mode']
1376                 if self.isWindows:
1377                     # turn off read-only attribute
1378                     os.chmod(dest, stat.S_IWRITE)
1379                 os.unlink(dest)
1380                 editedFiles.add(dest)
1381             elif modifier == "R":
1382                 src, dest = diff['src'], diff['dst']
1383                 if self.p4HasMoveCommand:
1384                     p4_edit(src)        # src must be open before move
1385                     p4_move(src, dest)  # opens for (move/delete, move/add)
1386                 else:
1387                     p4_integrate(src, dest)
1388                     if diff['src_sha1'] != diff['dst_sha1']:
1389                         p4_edit(dest)
1390                     else:
1391                         pureRenameCopy.add(dest)
1392                 if isModeExecChanged(diff['src_mode'], diff['dst_mode']):
1393                     if not self.p4HasMoveCommand:
1394                         p4_edit(dest)   # with move: already open, writable
1395                     filesToChangeExecBit[dest] = diff['dst_mode']
1396                 if not self.p4HasMoveCommand:
1397                     if self.isWindows:
1398                         os.chmod(dest, stat.S_IWRITE)
1399                     os.unlink(dest)
1400                     filesToDelete.add(src)
1401                 editedFiles.add(dest)
1402             else:
1403                 die("unknown modifier %s for %s" % (modifier, path))
1404
1405         diffcmd = "git diff-tree --full-index -p \"%s\"" % (id)
1406         patchcmd = diffcmd + " | git apply "
1407         tryPatchCmd = patchcmd + "--check -"
1408         applyPatchCmd = patchcmd + "--check --apply -"
1409         patch_succeeded = True
1410
1411         if os.system(tryPatchCmd) != 0:
1412             fixed_rcs_keywords = False
1413             patch_succeeded = False
1414             print "Unfortunately applying the change failed!"
1415
1416             # Patch failed, maybe it's just RCS keyword woes. Look through
1417             # the patch to see if that's possible.
1418             if gitConfigBool("git-p4.attemptRCSCleanup"):
1419                 file = None
1420                 pattern = None
1421                 kwfiles = {}
1422                 for file in editedFiles | filesToDelete:
1423                     # did this file's delta contain RCS keywords?
1424                     pattern = p4_keywords_regexp_for_file(file)
1425
1426                     if pattern:
1427                         # this file is a possibility...look for RCS keywords.
1428                         regexp = re.compile(pattern, re.VERBOSE)
1429                         for line in read_pipe_lines(["git", "diff", "%s^..%s" % (id, id), file]):
1430                             if regexp.search(line):
1431                                 if verbose:
1432                                     print "got keyword match on %s in %s in %s" % (pattern, line, file)
1433                                 kwfiles[file] = pattern
1434                                 break
1435
1436                 for file in kwfiles:
1437                     if verbose:
1438                         print "zapping %s with %s" % (line,pattern)
1439                     # File is being deleted, so not open in p4.  Must
1440                     # disable the read-only bit on windows.
1441                     if self.isWindows and file not in editedFiles:
1442                         os.chmod(file, stat.S_IWRITE)
1443                     self.patchRCSKeywords(file, kwfiles[file])
1444                     fixed_rcs_keywords = True
1445
1446             if fixed_rcs_keywords:
1447                 print "Retrying the patch with RCS keywords cleaned up"
1448                 if os.system(tryPatchCmd) == 0:
1449                     patch_succeeded = True
1450
1451         if not patch_succeeded:
1452             for f in editedFiles:
1453                 p4_revert(f)
1454             return False
1455
1456         #
1457         # Apply the patch for real, and do add/delete/+x handling.
1458         #
1459         system(applyPatchCmd)
1460
1461         for f in filesToAdd:
1462             p4_add(f)
1463         for f in filesToDelete:
1464             p4_revert(f)
1465             p4_delete(f)
1466
1467         # Set/clear executable bits
1468         for f in filesToChangeExecBit.keys():
1469             mode = filesToChangeExecBit[f]
1470             setP4ExecBit(f, mode)
1471
1472         #
1473         # Build p4 change description, starting with the contents
1474         # of the git commit message.
1475         #
1476         logMessage = extractLogMessageFromGitCommit(id)
1477         logMessage = logMessage.strip()
1478         (logMessage, jobs) = self.separate_jobs_from_description(logMessage)
1479
1480         template = self.prepareSubmitTemplate()
1481         submitTemplate = self.prepareLogMessage(template, logMessage, jobs)
1482
1483         if self.preserveUser:
1484            submitTemplate += "\n######## Actual user %s, modified after commit\n" % p4User
1485
1486         if self.checkAuthorship and not self.p4UserIsMe(p4User):
1487             submitTemplate += "######## git author %s does not match your p4 account.\n" % gitEmail
1488             submitTemplate += "######## Use option --preserve-user to modify authorship.\n"
1489             submitTemplate += "######## Variable git-p4.skipUserNameCheck hides this message.\n"
1490
1491         separatorLine = "######## everything below this line is just the diff #######\n"
1492         if not self.prepare_p4_only:
1493             submitTemplate += separatorLine
1494             submitTemplate += self.get_diff_description(editedFiles, filesToAdd)
1495
1496         (handle, fileName) = tempfile.mkstemp()
1497         tmpFile = os.fdopen(handle, "w+b")
1498         if self.isWindows:
1499             submitTemplate = submitTemplate.replace("\n", "\r\n")
1500         tmpFile.write(submitTemplate)
1501         tmpFile.close()
1502
1503         if self.prepare_p4_only:
1504             #
1505             # Leave the p4 tree prepared, and the submit template around
1506             # and let the user decide what to do next
1507             #
1508             print
1509             print "P4 workspace prepared for submission."
1510             print "To submit or revert, go to client workspace"
1511             print "  " + self.clientPath
1512             print
1513             print "To submit, use \"p4 submit\" to write a new description,"
1514             print "or \"p4 submit -i <%s\" to use the one prepared by" \
1515                   " \"git p4\"." % fileName
1516             print "You can delete the file \"%s\" when finished." % fileName
1517
1518             if self.preserveUser and p4User and not self.p4UserIsMe(p4User):
1519                 print "To preserve change ownership by user %s, you must\n" \
1520                       "do \"p4 change -f <change>\" after submitting and\n" \
1521                       "edit the User field."
1522             if pureRenameCopy:
1523                 print "After submitting, renamed files must be re-synced."
1524                 print "Invoke \"p4 sync -f\" on each of these files:"
1525                 for f in pureRenameCopy:
1526                     print "  " + f
1527
1528             print
1529             print "To revert the changes, use \"p4 revert ...\", and delete"
1530             print "the submit template file \"%s\"" % fileName
1531             if filesToAdd:
1532                 print "Since the commit adds new files, they must be deleted:"
1533                 for f in filesToAdd:
1534                     print "  " + f
1535             print
1536             return True
1537
1538         #
1539         # Let the user edit the change description, then submit it.
1540         #
1541         if self.edit_template(fileName):
1542             # read the edited message and submit
1543             ret = True
1544             tmpFile = open(fileName, "rb")
1545             message = tmpFile.read()
1546             tmpFile.close()
1547             if self.isWindows:
1548                 message = message.replace("\r\n", "\n")
1549             submitTemplate = message[:message.index(separatorLine)]
1550             p4_write_pipe(['submit', '-i'], submitTemplate)
1551
1552             if self.preserveUser:
1553                 if p4User:
1554                     # Get last changelist number. Cannot easily get it from
1555                     # the submit command output as the output is
1556                     # unmarshalled.
1557                     changelist = self.lastP4Changelist()
1558                     self.modifyChangelistUser(changelist, p4User)
1559
1560             # The rename/copy happened by applying a patch that created a
1561             # new file.  This leaves it writable, which confuses p4.
1562             for f in pureRenameCopy:
1563                 p4_sync(f, "-f")
1564
1565         else:
1566             # skip this patch
1567             ret = False
1568             print "Submission cancelled, undoing p4 changes."
1569             for f in editedFiles:
1570                 p4_revert(f)
1571             for f in filesToAdd:
1572                 p4_revert(f)
1573                 os.remove(f)
1574             for f in filesToDelete:
1575                 p4_revert(f)
1576
1577         os.remove(fileName)
1578         return ret
1579
1580     # Export git tags as p4 labels. Create a p4 label and then tag
1581     # with that.
1582     def exportGitTags(self, gitTags):
1583         validLabelRegexp = gitConfig("git-p4.labelExportRegexp")
1584         if len(validLabelRegexp) == 0:
1585             validLabelRegexp = defaultLabelRegexp
1586         m = re.compile(validLabelRegexp)
1587
1588         for name in gitTags:
1589
1590             if not m.match(name):
1591                 if verbose:
1592                     print "tag %s does not match regexp %s" % (name, validLabelRegexp)
1593                 continue
1594
1595             # Get the p4 commit this corresponds to
1596             logMessage = extractLogMessageFromGitCommit(name)
1597             values = extractSettingsGitLog(logMessage)
1598
1599             if not values.has_key('change'):
1600                 # a tag pointing to something not sent to p4; ignore
1601                 if verbose:
1602                     print "git tag %s does not give a p4 commit" % name
1603                 continue
1604             else:
1605                 changelist = values['change']
1606
1607             # Get the tag details.
1608             inHeader = True
1609             isAnnotated = False
1610             body = []
1611             for l in read_pipe_lines(["git", "cat-file", "-p", name]):
1612                 l = l.strip()
1613                 if inHeader:
1614                     if re.match(r'tag\s+', l):
1615                         isAnnotated = True
1616                     elif re.match(r'\s*$', l):
1617                         inHeader = False
1618                         continue
1619                 else:
1620                     body.append(l)
1621
1622             if not isAnnotated:
1623                 body = ["lightweight tag imported by git p4\n"]
1624
1625             # Create the label - use the same view as the client spec we are using
1626             clientSpec = getClientSpec()
1627
1628             labelTemplate  = "Label: %s\n" % name
1629             labelTemplate += "Description:\n"
1630             for b in body:
1631                 labelTemplate += "\t" + b + "\n"
1632             labelTemplate += "View:\n"
1633             for depot_side in clientSpec.mappings:
1634                 labelTemplate += "\t%s\n" % depot_side
1635
1636             if self.dry_run:
1637                 print "Would create p4 label %s for tag" % name
1638             elif self.prepare_p4_only:
1639                 print "Not creating p4 label %s for tag due to option" \
1640                       " --prepare-p4-only" % name
1641             else:
1642                 p4_write_pipe(["label", "-i"], labelTemplate)
1643
1644                 # Use the label
1645                 p4_system(["tag", "-l", name] +
1646                           ["%s@%s" % (depot_side, changelist) for depot_side in clientSpec.mappings])
1647
1648                 if verbose:
1649                     print "created p4 label for tag %s" % name
1650
    def run(self, args):
        """Submit git commits to Perforce.

        args is either empty (the current git branch is used) or holds
        exactly one branch name; any other argument count makes this
        return False.

        The commits in origin..master are applied one at a time from
        inside the p4 client directory.  When every commit applied (and
        this is neither a dry run nor --prepare-p4-only), a P4Sync and a
        P4Rebase are run afterwards.  Git tags are exported as p4 labels
        when label export is enabled.

        Returns True when the number of applied commits equals the number
        of commits; otherwise the process exits with status 1.
        """
        # Work out which git branch is being submitted.
        if len(args) == 0:
            self.master = currentGitBranch()
            if len(self.master) == 0 or not gitBranchExists("refs/heads/%s" % self.master):
                die("Detecting current git branch failed!")
        elif len(args) == 1:
            self.master = args[0]
            if not branchExists(self.master):
                die("Branch %s does not exist" % self.master)
        else:
            return False

        # git-p4.allowSubmit, when set, is a comma-separated list of the
        # only branches that may be submitted.
        allowSubmit = gitConfig("git-p4.allowSubmit")
        if len(allowSubmit) > 0 and not self.master in allowSubmit.split(","):
            die("%s is not in git-p4.allowSubmit" % self.master)

        [upstream, settings] = findUpstreamBranchPoint()
        self.depotPath = settings['depot-paths'][0]
        # an origin already set on self takes precedence over the
        # detected upstream
        if len(self.origin) == 0:
            self.origin = upstream

        if self.preserveUser:
            if not self.canChangeChangelists():
                die("Cannot preserve user names without p4 super-user or admin permissions")

        # if not set from the command line, try the config file
        if self.conflict_behavior is None:
            val = gitConfig("git-p4.conflict")
            if val:
                if val not in self.conflict_behavior_choices:
                    die("Invalid value '%s' for config git-p4.conflict" % val)
            else:
                val = "ask"
            self.conflict_behavior = val

        if self.verbose:
            print "Origin branch is " + self.origin

        if len(self.depotPath) == 0:
            print "Internal error: cannot locate perforce depot path from existing branches"
            sys.exit(128)

        self.useClientSpec = False
        if gitConfigBool("git-p4.useclientspec"):
            self.useClientSpec = True
        if self.useClientSpec:
            self.clientSpecDirs = getClientSpec()

        # Check for the existence of P4 branches
        branchesDetected = (len(p4BranchesInGit().keys()) > 1)

        if self.useClientSpec and not branchesDetected:
            # all files are relative to the client spec
            self.clientPath = getClientRoot()
        else:
            self.clientPath = p4Where(self.depotPath)

        if self.clientPath == "":
            die("Error: Cannot locate perforce checkout of %s in client view" % self.depotPath)

        print "Perforce checkout for depot path %s located at %s" % (self.depotPath, self.clientPath)
        # remembered so we can chdir back once the commits are applied
        self.oldWorkingDirectory = os.getcwd()

        # ensure the clientPath exists
        new_client_dir = False
        if not os.path.exists(self.clientPath):
            new_client_dir = True
            os.makedirs(self.clientPath)

        chdir(self.clientPath, is_client_path=True)
        if self.dry_run:
            print "Would synchronize p4 checkout in %s" % self.clientPath
        else:
            print "Synchronizing p4 checkout..."
            if new_client_dir:
                # old one was destroyed, and maybe nobody told p4
                p4_sync("...", "-f")
            else:
                p4_sync("...")
        self.check()

        # Collect the non-merge commits in origin..master, then reverse
        # the rev-list output so they are applied in the opposite order.
        commits = []
        for line in read_pipe_lines(["git", "rev-list", "--no-merges", "%s..%s" % (self.origin, self.master)]):
            commits.append(line.strip())
        commits.reverse()

        # The authorship check is disabled when preserving users or when
        # git-p4.skipUserNameCheck is set.
        if self.preserveUser or gitConfigBool("git-p4.skipUserNameCheck"):
            self.checkAuthorship = False
        else:
            self.checkAuthorship = True

        if self.preserveUser:
            self.checkValidP4Users(commits)

        #
        # Build up a set of options to be passed to diff when
        # submitting each commit to p4.
        #
        if self.detectRenames:
            # command-line -M arg
            self.diffOpts = "-M"
        else:
            # If not explicitly set check the config variable
            detectRenames = gitConfig("git-p4.detectRenames")

            if detectRenames.lower() == "false" or detectRenames == "":
                self.diffOpts = ""
            elif detectRenames.lower() == "true":
                self.diffOpts = "-M"
            else:
                # any other value is appended to -M verbatim
                self.diffOpts = "-M%s" % detectRenames

        # no command-line arg for -C or --find-copies-harder, just
        # config variables
        detectCopies = gitConfig("git-p4.detectCopies")
        if detectCopies.lower() == "false" or detectCopies == "":
            pass
        elif detectCopies.lower() == "true":
            self.diffOpts += " -C"
        else:
            # any other value is appended to -C verbatim
            self.diffOpts += " -C%s" % detectCopies

        if gitConfigBool("git-p4.detectCopiesHarder"):
            self.diffOpts += " --find-copies-harder"

        #
        # Apply the commits, one at a time.  On failure, ask if should
        # continue to try the rest of the patches, or quit.
        #
        if self.dry_run:
            print "Would apply"
        applied = []
        last = len(commits) - 1
        for i, commit in enumerate(commits):
            if self.dry_run:
                # a dry run only lists the commit and counts it as applied
                print " ", read_pipe(["git", "show", "-s",
                                      "--format=format:%h %s", commit])
                ok = True
            else:
                ok = self.applyCommit(commit)
            if ok:
                applied.append(commit)
            else:
                if self.prepare_p4_only and i < last:
                    print "Processing only the first commit due to option" \
                          " --prepare-p4-only"
                    break
                # no point asking what to do next after the last commit
                if i < last:
                    quit = False
                    while True:
                        # prompt for what to do, or use the option/variable
                        if self.conflict_behavior == "ask":
                            print "What do you want to do?"
                            response = raw_input("[s]kip this commit but apply"
                                                 " the rest, or [q]uit? ")
                            if not response:
                                # empty answer: ask again
                                continue
                        elif self.conflict_behavior == "skip":
                            response = "s"
                        elif self.conflict_behavior == "quit":
                            response = "q"
                        else:
                            die("Unknown conflict_behavior '%s'" %
                                self.conflict_behavior)

                        # only the first character of the answer matters;
                        # anything other than s/q loops back to the prompt
                        if response[0] == "s":
                            print "Skipping this commit, but applying the rest"
                            break
                        if response[0] == "q":
                            print "Quitting"
                            quit = True
                            break
                    if quit:
                        break

        chdir(self.oldWorkingDirectory)

        if self.dry_run:
            pass
        elif self.prepare_p4_only:
            pass
        elif len(commits) == len(applied):
            print "All commits applied!"

            # bring the submitted changes back into git and rebase on them
            sync = P4Sync()
            if self.branch:
                sync.branch = self.branch
            sync.run([])

            rebase = P4Rebase()
            rebase.rebase()

        else:
            if len(applied) == 0:
                print "No commits applied."
            else:
                print "Applied only the commits marked with '*':"
                for c in commits:
                    if c in applied:
                        star = "*"
                    else:
                        star = " "
                    print star, read_pipe(["git", "show", "-s",
                                           "--format=format:%h %s",  c])
                print "You will have to do 'git p4 sync' and rebase."

        # the config variable can switch label export on, never off
        if gitConfigBool("git-p4.exportLabels"):
            self.exportLabels = True

        if self.exportLabels:
            p4Labels = getP4Labels(self.depotPath)
            gitTags = getGitTags()

            # export only the git tags that have no p4 label yet
            missingGitTags = gitTags - p4Labels
            self.exportGitTags(missingGitTags)

        # exit with error unless everything applied perfectly
        if len(commits) != len(applied):
                sys.exit(1)

        return True
1872
class View(object):
    """Represent a p4 view ("p4 help views"), and map files in a
       repo according to the view."""

    def __init__(self, client_name):
        """Create an empty view for the p4 client named client_name."""
        # depot sides of the non-excluded view lines, in the order appended
        self.mappings = []
        # every client-side path is expected to start with this prefix
        self.client_prefix = "//%s/" % client_name
        # cache results of "p4 where" to lookup client file locations
        self.client_spec_path_cache = {}

    def append(self, view_line):
        """Parse a view line, splitting it into depot and client
           sides.  Append to self.mappings, preserving order.  This
           is only needed for tag creation.

           Only the depot side is kept; lines whose depot side is
           prefixed with "-" (exclusions) are not recorded.  Calls
           die() when the line cannot be split."""

        # Split the view line into exactly two words.  P4 enforces
        # structure on these lines that simplifies this quite a bit.
        #
        # Either or both words may be double-quoted.
        # Single quotes do not matter.
        # Double-quote marks cannot occur inside the words.
        # A + or - prefix is also inside the quotes.
        # There are no quotes unless they contain a space.
        # The line is already white-space stripped.
        # The two words are separated by a single space.
        #
        # startswith() rather than view_line[0] so that an empty line
        # falls through to the "no space found" error instead of
        # raising IndexError.
        if view_line.startswith('"'):
            # First word is double quoted.  Find its end.
            close_quote_index = view_line.find('"', 1)
            if close_quote_index <= 0:
                die("No first-word closing quote found: %s" % view_line)
            depot_side = view_line[1:close_quote_index]
        else:
            space_index = view_line.find(" ")
            if space_index <= 0:
                die("No word-splitting space found: %s" % view_line)
            depot_side = view_line[0:space_index]

        # prefix + means overlay on previous mapping
        if depot_side.startswith("+"):
            depot_side = depot_side[1:]

        # prefix - means exclude this path, leave out of mappings
        if depot_side.startswith("-"):
            return

        self.mappings.append(depot_side)

    def convert_client_path(self, clientFile):
        """Return clientFile with the leading //client/ part removed.

           Calls die() when clientFile does not start with the client
           prefix."""
        # chop off //client/ part to make it relative
        if not clientFile.startswith(self.client_prefix):
            die("No prefix '%s' on clientFile '%s'" %
                (self.client_prefix, clientFile))
        return clientFile[len(self.client_prefix):]

    def update_client_spec_path_cache(self, files):
        """ Caching file paths by "p4 where" batch query

            files is a list of dicts with a 'path' entry holding a depot
            path.  Paths not yet cached are looked up with one
            "p4 where" call; paths that are reported as errors, are
            unmapped, or are not reported at all get cached as "". """

        # Cache keys are lower-cased when core.ignorecase is set, so the
        # "already cached" test below must fold case the same way or it
        # would never hit for mixed-case depot paths.
        ignore_case = gitConfigBool("core.ignorecase")

        def cache_key(depot_file):
            if ignore_case:
                return depot_file.lower()
            return depot_file

        # List depot file paths exclude that already cached
        fileArgs = [f['path'] for f in files
                    if cache_key(f['path']) not in self.client_spec_path_cache]

        if len(fileArgs) == 0:
            return  # All files in cache

        where_result = p4CmdList(["-x", "-", "where"], stdin=fileArgs)
        for res in where_result:
            if "code" in res and res["code"] == "error":
                # assume error is "... file(s) not in client view"
                continue
            if "clientFile" not in res:
                die("No clientFile in 'p4 where' output")
            if "unmap" in res:
                # it will list all of them, but only one not unmap-ped
                continue
            self.client_spec_path_cache[cache_key(res['depotFile'])] = \
                self.convert_client_path(res["clientFile"])

        # not found files or unmap files set to ""
        for depotFile in fileArgs:
            key = cache_key(depotFile)
            if key not in self.client_spec_path_cache:
                self.client_spec_path_cache[key] = ""

    def map_in_client(self, depot_path):
        """Return the relative location in the client where this
           depot file should live.  Returns "" if the file should
           not be mapped in the client.

           The path must already have been cached by
           update_client_spec_path_cache(); otherwise die() is called."""

        if gitConfigBool("core.ignorecase"):
            depot_path = depot_path.lower()

        if depot_path in self.client_spec_path_cache:
            return self.client_spec_path_cache[depot_path]

        die( "Error: %s is not found in client spec path" % depot_path )
        return ""
1977
1978 class P4Sync(Command, P4UserMap):
1979     delete_actions = ( "delete", "move/delete", "purge" )
1980
1981     def __init__(self):
1982         Command.__init__(self)
1983         P4UserMap.__init__(self)
1984         self.options = [
1985                 optparse.make_option("--branch", dest="branch"),
1986                 optparse.make_option("--detect-branches", dest="detectBranches", action="store_true"),
1987                 optparse.make_option("--changesfile", dest="changesFile"),
1988                 optparse.make_option("--silent", dest="silent", action="store_true"),
1989                 optparse.make_option("--detect-labels", dest="detectLabels", action="store_true"),
1990                 optparse.make_option("--import-labels", dest="importLabels", action="store_true"),
1991                 optparse.make_option("--import-local", dest="importIntoRemotes", action="store_false",
1992                                      help="Import into refs/heads/ , not refs/remotes"),
1993                 optparse.make_option("--max-changes", dest="maxChanges",
1994                                      help="Maximum number of changes to import"),
1995                 optparse.make_option("--changes-block-size", dest="changes_block_size", type="int",
1996                                      help="Internal block size to use when iteratively calling p4 changes"),
1997                 optparse.make_option("--keep-path", dest="keepRepoPath", action='store_true',
1998                                      help="Keep entire BRANCH/DIR/SUBDIR prefix during import"),
1999                 optparse.make_option("--use-client-spec", dest="useClientSpec", action='store_true',
2000                                      help="Only sync files that are included in the Perforce Client Spec"),
2001                 optparse.make_option("-/", dest="cloneExclude",
2002                                      action="append", type="string",
2003                                      help="exclude depot path"),
2004         ]
2005         self.description = """Imports from Perforce into a git repository.\n
2006     example:
2007     //depot/my/project/ -- to import the current head
2008     //depot/my/project/@all -- to import everything
2009     //depot/my/project/@1,6 -- to import only from revision 1 to 6
2010
2011     (a ... is not needed in the path p4 specification, it's added implicitly)"""
2012
2013         self.usage += " //depot/path[@revRange]"
2014         self.silent = False
2015         self.createdBranches = set()
2016         self.committedChanges = set()
2017         self.branch = ""
2018         self.detectBranches = False
2019         self.detectLabels = False
2020         self.importLabels = False
2021         self.changesFile = ""
2022         self.syncWithOrigin = True
2023         self.importIntoRemotes = True
2024         self.maxChanges = ""
2025         self.changes_block_size = None
2026         self.keepRepoPath = False
2027         self.depotPaths = None
2028         self.p4BranchesInGit = []
2029         self.cloneExclude = []
2030         self.useClientSpec = False
2031         self.useClientSpec_from_options = False
2032         self.clientSpecDirs = None
2033         self.tempBranches = []
2034         self.tempBranchLocation = "git-p4-tmp"
2035
2036         if gitConfig("git-p4.syncFromOrigin") == "false":
2037             self.syncWithOrigin = False
2038
2039     # This is required for the "append" cloneExclude action
2040     def ensure_value(self, attr, value):
2041         if not hasattr(self, attr) or getattr(self, attr) is None:
2042             setattr(self, attr, value)
2043         return getattr(self, attr)
2044
2045     # Force a checkpoint in fast-import and wait for it to finish
2046     def checkpoint(self):
2047         self.gitStream.write("checkpoint\n\n")
2048         self.gitStream.write("progress checkpoint\n\n")
2049         out = self.gitOutput.readline()
2050         if self.verbose:
2051             print "checkpoint finished: " + out
2052
2053     def extractFilesFromCommit(self, commit):
2054         self.cloneExclude = [re.sub(r"\.\.\.$", "", path)
2055                              for path in self.cloneExclude]
2056         files = []
2057         fnum = 0
2058         while commit.has_key("depotFile%s" % fnum):
2059             path =  commit["depotFile%s" % fnum]
2060
2061             if [p for p in self.cloneExclude
2062                 if p4PathStartsWith(path, p)]:
2063                 found = False
2064             else:
2065                 found = [p for p in self.depotPaths
2066                          if p4PathStartsWith(path, p)]
2067             if not found:
2068                 fnum = fnum + 1
2069                 continue
2070
2071             file = {}
2072             file["path"] = path
2073             file["rev"] = commit["rev%s" % fnum]
2074             file["action"] = commit["action%s" % fnum]
2075             file["type"] = commit["type%s" % fnum]
2076             files.append(file)
2077             fnum = fnum + 1
2078         return files
2079
2080     def stripRepoPath(self, path, prefixes):
2081         """When streaming files, this is called to map a p4 depot path
2082            to where it should go in git.  The prefixes are either
2083            self.depotPaths, or self.branchPrefixes in the case of
2084            branch detection."""
2085
2086         if self.useClientSpec:
2087             # branch detection moves files up a level (the branch name)
2088             # from what client spec interpretation gives
2089             path = self.clientSpecDirs.map_in_client(path)
2090             if self.detectBranches:
2091                 for b in self.knownBranches:
2092                     if path.startswith(b + "/"):
2093                         path = path[len(b)+1:]
2094
2095         elif self.keepRepoPath:
2096             # Preserve everything in relative path name except leading
2097             # //depot/; just look at first prefix as they all should
2098             # be in the same depot.
2099             depot = re.sub("^(//[^/]+/).*", r'\1', prefixes[0])
2100             if p4PathStartsWith(path, depot):
2101                 path = path[len(depot):]
2102
2103         else:
2104             for p in prefixes:
2105                 if p4PathStartsWith(path, p):
2106                     path = path[len(p):]
2107                     break
2108
2109         path = wildcard_decode(path)
2110         return path
2111
2112     def splitFilesIntoBranches(self, commit):
2113         """Look at each depotFile in the commit to figure out to what
2114            branch it belongs."""
2115
2116         if self.clientSpecDirs:
2117             files = self.extractFilesFromCommit(commit)
2118             self.clientSpecDirs.update_client_spec_path_cache(files)
2119
2120         branches = {}
2121         fnum = 0
2122         while commit.has_key("depotFile%s" % fnum):
2123             path =  commit["depotFile%s" % fnum]
2124             found = [p for p in self.depotPaths
2125                      if p4PathStartsWith(path, p)]
2126             if not found:
2127                 fnum = fnum + 1
2128                 continue
2129
2130             file = {}
2131             file["path"] = path
2132             file["rev"] = commit["rev%s" % fnum]
2133             file["action"] = commit["action%s" % fnum]
2134             file["type"] = commit["type%s" % fnum]
2135             fnum = fnum + 1
2136
2137             # start with the full relative path where this file would
2138             # go in a p4 client
2139             if self.useClientSpec:
2140                 relPath = self.clientSpecDirs.map_in_client(path)
2141             else:
2142                 relPath = self.stripRepoPath(path, self.depotPaths)
2143
2144             for branch in self.knownBranches.keys():
2145                 # add a trailing slash so that a commit into qt/4.2foo
2146                 # doesn't end up in qt/4.2, e.g.
2147                 if relPath.startswith(branch + "/"):
2148                     if branch not in branches:
2149                         branches[branch] = []
2150                     branches[branch].append(file)
2151                     break
2152
2153         return branches
2154
2155     # output one file from the P4 stream
2156     # - helper for streamP4Files
2157
2158     def streamOneP4File(self, file, contents):
2159         relPath = self.stripRepoPath(file['depotFile'], self.branchPrefixes)
2160         if verbose:
2161             sys.stderr.write("%s\n" % relPath)
2162
2163         (type_base, type_mods) = split_p4_type(file["type"])
2164
2165         git_mode = "100644"
2166         if "x" in type_mods:
2167             git_mode = "100755"
2168         if type_base == "symlink":
2169             git_mode = "120000"
2170             # p4 print on a symlink sometimes contains "target\n";
2171             # if it does, remove the newline
2172             data = ''.join(contents)
2173             if not data:
2174                 # Some version of p4 allowed creating a symlink that pointed
2175                 # to nothing.  This causes p4 errors when checking out such
2176                 # a change, and errors here too.  Work around it by ignoring
2177                 # the bad symlink; hopefully a future change fixes it.
2178                 print "\nIgnoring empty symlink in %s" % file['depotFile']
2179                 return
2180             elif data[-1] == '\n':
2181                 contents = [data[:-1]]
2182             else:
2183                 contents = [data]
2184
2185         if type_base == "utf16":
2186             # p4 delivers different text in the python output to -G
2187             # than it does when using "print -o", or normal p4 client
2188             # operations.  utf16 is converted to ascii or utf8, perhaps.
2189             # But ascii text saved as -t utf16 is completely mangled.
2190             # Invoke print -o to get the real contents.
2191             #
2192             # On windows, the newlines will always be mangled by print, so put
2193             # them back too.  This is not needed to the cygwin windows version,
2194             # just the native "NT" type.
2195             #
2196             text = p4_read_pipe(['print', '-q', '-o', '-', "%s@%s" % (file['depotFile'], file['change']) ])
2197             if p4_version_string().find("/NT") >= 0:
2198                 text = text.replace("\r\n", "\n")
2199             contents = [ text ]
2200
2201         if type_base == "apple":
2202             # Apple filetype files will be streamed as a concatenation of
2203             # its appledouble header and the contents.  This is useless
2204             # on both macs and non-macs.  If using "print -q -o xx", it
2205             # will create "xx" with the data, and "%xx" with the header.
2206             # This is also not very useful.
2207             #
2208             # Ideally, someday, this script can learn how to generate
2209             # appledouble files directly and import those to git, but
2210             # non-mac machines can never find a use for apple filetype.
2211             print "\nIgnoring apple filetype file %s" % file['depotFile']
2212             return
2213
2214         # Note that we do not try to de-mangle keywords on utf16 files,
2215         # even though in theory somebody may want that.
2216         pattern = p4_keywords_regexp_for_type(type_base, type_mods)
2217         if pattern:
2218             regexp = re.compile(pattern, re.VERBOSE)
2219             text = ''.join(contents)
2220             text = regexp.sub(r'$\1$', text)
2221             contents = [ text ]
2222
2223         self.gitStream.write("M %s inline %s\n" % (git_mode, relPath))
2224
2225         # total length...
2226         length = 0
2227         for d in contents:
2228             length = length + len(d)
2229
2230         self.gitStream.write("data %d\n" % length)
2231         for d in contents:
2232             self.gitStream.write(d)
2233         self.gitStream.write("\n")
2234
2235     def streamOneP4Deletion(self, file):
2236         relPath = self.stripRepoPath(file['path'], self.branchPrefixes)
2237         if verbose:
2238             sys.stderr.write("delete %s\n" % relPath)
2239         self.gitStream.write("D %s\n" % relPath)
2240
2241     # handle another chunk of streaming data
2242     def streamP4FilesCb(self, marshalled):
2243
2244         # catch p4 errors and complain
2245         err = None
2246         if "code" in marshalled:
2247             if marshalled["code"] == "error":
2248                 if "data" in marshalled:
2249                     err = marshalled["data"].rstrip()
2250         if err:
2251             f = None
2252             if self.stream_have_file_info:
2253                 if "depotFile" in self.stream_file:
2254                     f = self.stream_file["depotFile"]
2255             # force a failure in fast-import, else an empty
2256             # commit will be made
2257             self.gitStream.write("\n")
2258             self.gitStream.write("die-now\n")
2259             self.gitStream.close()
2260             # ignore errors, but make sure it exits first
2261             self.importProcess.wait()
2262             if f:
2263                 die("Error from p4 print for %s: %s" % (f, err))
2264             else:
2265                 die("Error from p4 print: %s" % err)
2266
2267         if marshalled.has_key('depotFile') and self.stream_have_file_info:
2268             # start of a new file - output the old one first
2269             self.streamOneP4File(self.stream_file, self.stream_contents)
2270             self.stream_file = {}
2271             self.stream_contents = []
2272             self.stream_have_file_info = False
2273
2274         # pick up the new file information... for the
2275         # 'data' field we need to append to our array
2276         for k in marshalled.keys():
2277             if k == 'data':
2278                 self.stream_contents.append(marshalled['data'])
2279             else:
2280                 self.stream_file[k] = marshalled[k]
2281
2282         self.stream_have_file_info = True
2283
    # Stream file contents directly from "p4 print" into "git fast-import"
2285     def streamP4Files(self, files):
2286         filesForCommit = []
2287         filesToRead = []
2288         filesToDelete = []
2289
2290         for f in files:
2291             # if using a client spec, only add the files that have
2292             # a path in the client
2293             if self.clientSpecDirs:
2294                 if self.clientSpecDirs.map_in_client(f['path']) == "":
2295                     continue
2296
2297             filesForCommit.append(f)
2298             if f['action'] in self.delete_actions:
2299                 filesToDelete.append(f)
2300             else:
2301                 filesToRead.append(f)
2302
2303         # deleted files...
2304         for f in filesToDelete:
2305             self.streamOneP4Deletion(f)
2306
2307         if len(filesToRead) > 0:
2308             self.stream_file = {}
2309             self.stream_contents = []
2310             self.stream_have_file_info = False
2311
2312             # curry self argument
2313             def streamP4FilesCbSelf(entry):
2314                 self.streamP4FilesCb(entry)
2315
2316             fileArgs = ['%s#%s' % (f['path'], f['rev']) for f in filesToRead]
2317
2318             p4CmdList(["-x", "-", "print"],
2319                       stdin=fileArgs,
2320                       cb=streamP4FilesCbSelf)
2321
2322             # do the last chunk
2323             if self.stream_file.has_key('depotFile'):
2324                 self.streamOneP4File(self.stream_file, self.stream_contents)
2325
2326     def make_email(self, userid):
2327         if userid in self.users:
2328             return self.users[userid]
2329         else:
2330             return "%s <a@b>" % userid
2331
2332     def streamTag(self, gitStream, labelName, labelDetails, commit, epoch):
2333         """ Stream a p4 tag.
2334         commit is either a git commit, or a fast-import mark, ":<p4commit>"
2335         """
2336
2337         if verbose:
2338             print "writing tag %s for commit %s" % (labelName, commit)
2339         gitStream.write("tag %s\n" % labelName)
2340         gitStream.write("from %s\n" % commit)
2341
2342         if labelDetails.has_key('Owner'):
2343             owner = labelDetails["Owner"]
2344         else:
2345             owner = None
2346
2347         # Try to use the owner of the p4 label, or failing that,
2348         # the current p4 user id.
2349         if owner:
2350             email = self.make_email(owner)
2351         else:
2352             email = self.make_email(self.p4UserId())
2353         tagger = "%s %s %s" % (email, epoch, self.tz)
2354
2355         gitStream.write("tagger %s\n" % tagger)
2356
2357         print "labelDetails=",labelDetails
2358         if labelDetails.has_key('Description'):
2359             description = labelDetails['Description']
2360         else:
2361             description = 'Label from git p4'
2362
2363         gitStream.write("data %d\n" % len(description))
2364         gitStream.write(description)
2365         gitStream.write("\n")
2366
2367     def commit(self, details, files, branch, parent = ""):
2368         epoch = details["time"]
2369         author = details["user"]
2370
2371         if self.verbose:
2372             print "commit into %s" % branch
2373
2374         # start with reading files; if that fails, we should not
2375         # create a commit.
2376         new_files = []
2377         for f in files:
2378             if [p for p in self.branchPrefixes if p4PathStartsWith(f['path'], p)]:
2379                 new_files.append (f)
2380             else:
2381                 sys.stderr.write("Ignoring file outside of prefix: %s\n" % f['path'])
2382
2383         if self.clientSpecDirs:
2384             self.clientSpecDirs.update_client_spec_path_cache(files)
2385
2386         self.gitStream.write("commit %s\n" % branch)
2387         self.gitStream.write("mark :%s\n" % details["change"])
2388         self.committedChanges.add(int(details["change"]))
2389         committer = ""
2390         if author not in self.users:
2391             self.getUserMapFromPerforceServer()
2392         committer = "%s %s %s" % (self.make_email(author), epoch, self.tz)
2393
2394         self.gitStream.write("committer %s\n" % committer)
2395
2396         self.gitStream.write("data <<EOT\n")
2397         self.gitStream.write(details["desc"])
2398         self.gitStream.write("\n[git-p4: depot-paths = \"%s\": change = %s" %
2399                              (','.join(self.branchPrefixes), details["change"]))
2400         if len(details['options']) > 0:
2401             self.gitStream.write(": options = %s" % details['options'])
2402         self.gitStream.write("]\nEOT\n\n")
2403
2404         if len(parent) > 0:
2405             if self.verbose:
2406                 print "parent %s" % parent
2407             self.gitStream.write("from %s\n" % parent)
2408
2409         self.streamP4Files(new_files)
2410         self.gitStream.write("\n")
2411
2412         change = int(details["change"])
2413
2414         if self.labels.has_key(change):
2415             label = self.labels[change]
2416             labelDetails = label[0]
2417             labelRevisions = label[1]
2418             if self.verbose:
2419                 print "Change %s is labelled %s" % (change, labelDetails)
2420
2421             files = p4CmdList(["files"] + ["%s...@%s" % (p, change)
2422                                                 for p in self.branchPrefixes])
2423
2424             if len(files) == len(labelRevisions):
2425
2426                 cleanedFiles = {}
2427                 for info in files:
2428                     if info["action"] in self.delete_actions:
2429                         continue
2430                     cleanedFiles[info["depotFile"]] = info["rev"]
2431
2432                 if cleanedFiles == labelRevisions:
2433                     self.streamTag(self.gitStream, 'tag_%s' % labelDetails['label'], labelDetails, branch, epoch)
2434
2435                 else:
2436                     if not self.silent:
2437                         print ("Tag %s does not match with change %s: files do not match."
2438                                % (labelDetails["label"], change))
2439
2440             else:
2441                 if not self.silent:
2442                     print ("Tag %s does not match with change %s: file count is different."
2443                            % (labelDetails["label"], change))
2444
2445     # Build a dictionary of changelists and labels, for "detect-labels" option.
2446     def getLabels(self):
2447         self.labels = {}
2448
2449         l = p4CmdList(["labels"] + ["%s..." % p for p in self.depotPaths])
2450         if len(l) > 0 and not self.silent:
2451             print "Finding files belonging to labels in %s" % `self.depotPaths`
2452
2453         for output in l:
2454             label = output["label"]
2455             revisions = {}
2456             newestChange = 0
2457             if self.verbose:
2458                 print "Querying files for label %s" % label
2459             for file in p4CmdList(["files"] +
2460                                       ["%s...@%s" % (p, label)
2461                                           for p in self.depotPaths]):
2462                 revisions[file["depotFile"]] = file["rev"]
2463                 change = int(file["change"])
2464                 if change > newestChange:
2465                     newestChange = change
2466
2467             self.labels[newestChange] = [output, revisions]
2468
2469         if self.verbose:
2470             print "Label changes: %s" % self.labels.keys()
2471
2472     # Import p4 labels as git tags. A direct mapping does not
2473     # exist, so assume that if all the files are at the same revision
2474     # then we can use that, or it's something more complicated we should
2475     # just ignore.
2476     def importP4Labels(self, stream, p4Labels):
2477         if verbose:
2478             print "import p4 labels: " + ' '.join(p4Labels)
2479
2480         ignoredP4Labels = gitConfigList("git-p4.ignoredP4Labels")
2481         validLabelRegexp = gitConfig("git-p4.labelImportRegexp")
2482         if len(validLabelRegexp) == 0:
2483             validLabelRegexp = defaultLabelRegexp
2484         m = re.compile(validLabelRegexp)
2485
2486         for name in p4Labels:
2487             commitFound = False
2488
2489             if not m.match(name):
2490                 if verbose:
2491                     print "label %s does not match regexp %s" % (name,validLabelRegexp)
2492                 continue
2493
2494             if name in ignoredP4Labels:
2495                 continue
2496
2497             labelDetails = p4CmdList(['label', "-o", name])[0]
2498
2499             # get the most recent changelist for each file in this label
2500             change = p4Cmd(["changes", "-m", "1"] + ["%s...@%s" % (p, name)
2501                                 for p in self.depotPaths])
2502
2503             if change.has_key('change'):
2504                 # find the corresponding git commit; take the oldest commit
2505                 changelist = int(change['change'])
2506                 if changelist in self.committedChanges:
2507                     gitCommit = ":%d" % changelist       # use a fast-import mark
2508                     commitFound = True
2509                 else:
2510                     gitCommit = read_pipe(["git", "rev-list", "--max-count=1",
2511                         "--reverse", ":/\[git-p4:.*change = %d\]" % changelist], ignore_error=True)
2512                     if len(gitCommit) == 0:
2513                         print "importing label %s: could not find git commit for changelist %d" % (name, changelist)
2514                     else:
2515                         commitFound = True
2516                         gitCommit = gitCommit.strip()
2517
2518                 if commitFound:
2519                     # Convert from p4 time format
2520                     try:
2521                         tmwhen = time.strptime(labelDetails['Update'], "%Y/%m/%d %H:%M:%S")
2522                     except ValueError:
2523                         print "Could not convert label time %s" % labelDetails['Update']
2524                         tmwhen = 1
2525
2526                     when = int(time.mktime(tmwhen))
2527                     self.streamTag(stream, name, labelDetails, gitCommit, when)
2528                     if verbose:
2529                         print "p4 label %s mapped to git commit %s" % (name, gitCommit)
2530             else:
2531                 if verbose:
2532                     print "Label %s has no changelists - possibly deleted?" % name
2533
2534             if not commitFound:
2535                 # We can't import this label; don't try again as it will get very
2536                 # expensive repeatedly fetching all the files for labels that will
2537                 # never be imported. If the label is moved in the future, the
2538                 # ignore will need to be removed manually.
2539                 system(["git", "config", "--add", "git-p4.ignoredP4Labels", name])
2540
2541     def guessProjectName(self):
2542         for p in self.depotPaths:
2543             if p.endswith("/"):
2544                 p = p[:-1]
2545             p = p[p.strip().rfind("/") + 1:]
2546             if not p.endswith("/"):
2547                p += "/"
2548             return p
2549
2550     def getBranchMapping(self):
2551         lostAndFoundBranches = set()
2552
2553         user = gitConfig("git-p4.branchUser")
2554         if len(user) > 0:
2555             command = "branches -u %s" % user
2556         else:
2557             command = "branches"
2558
2559         for info in p4CmdList(command):
2560             details = p4Cmd(["branch", "-o", info["branch"]])
2561             viewIdx = 0
2562             while details.has_key("View%s" % viewIdx):
2563                 paths = details["View%s" % viewIdx].split(" ")
2564                 viewIdx = viewIdx + 1
2565                 # require standard //depot/foo/... //depot/bar/... mapping
2566                 if len(paths) != 2 or not paths[0].endswith("/...") or not paths[1].endswith("/..."):
2567                     continue
2568                 source = paths[0]
2569                 destination = paths[1]
2570                 ## HACK
2571                 if p4PathStartsWith(source, self.depotPaths[0]) and p4PathStartsWith(destination, self.depotPaths[0]):
2572                     source = source[len(self.depotPaths[0]):-4]
2573                     destination = destination[len(self.depotPaths[0]):-4]
2574
2575                     if destination in self.knownBranches:
2576                         if not self.silent:
2577                             print "p4 branch %s defines a mapping from %s to %s" % (info["branch"], source, destination)
2578                             print "but there exists another mapping from %s to %s already!" % (self.knownBranches[destination], destination)
2579                         continue
2580
2581                     self.knownBranches[destination] = source
2582
2583                     lostAndFoundBranches.discard(destination)
2584
2585                     if source not in self.knownBranches:
2586                         lostAndFoundBranches.add(source)
2587
2588         # Perforce does not strictly require branches to be defined, so we also
2589         # check git config for a branch list.
2590         #
2591         # Example of branch definition in git config file:
2592         # [git-p4]
2593         #   branchList=main:branchA
2594         #   branchList=main:branchB
2595         #   branchList=branchA:branchC
2596         configBranches = gitConfigList("git-p4.branchList")
2597         for branch in configBranches:
2598             if branch:
2599                 (source, destination) = branch.split(":")
2600                 self.knownBranches[destination] = source
2601
2602                 lostAndFoundBranches.discard(destination)
2603
2604                 if source not in self.knownBranches:
2605                     lostAndFoundBranches.add(source)
2606
2607
2608         for branch in lostAndFoundBranches:
2609             self.knownBranches[branch] = branch
2610
2611     def getBranchMappingFromGitBranches(self):
2612         branches = p4BranchesInGit(self.importIntoRemotes)
2613         for branch in branches.keys():
2614             if branch == "master":
2615                 branch = "main"
2616             else:
2617                 branch = branch[len(self.projectName):]
2618             self.knownBranches[branch] = branch
2619
2620     def updateOptionDict(self, d):
2621         option_keys = {}
2622         if self.keepRepoPath:
2623             option_keys['keepRepoPath'] = 1
2624
2625         d["options"] = ' '.join(sorted(option_keys.keys()))
2626
2627     def readOptions(self, d):
2628         self.keepRepoPath = (d.has_key('options')
2629                              and ('keepRepoPath' in d['options']))
2630
2631     def gitRefForBranch(self, branch):
2632         if branch == "main":
2633             return self.refPrefix + "master"
2634
2635         if len(branch) <= 0:
2636             return branch
2637
2638         return self.refPrefix + self.projectName + branch
2639
2640     def gitCommitByP4Change(self, ref, change):
2641         if self.verbose:
2642             print "looking in ref " + ref + " for change %s using bisect..." % change
2643
2644         earliestCommit = ""
2645         latestCommit = parseRevision(ref)
2646
2647         while True:
2648             if self.verbose:
2649                 print "trying: earliest %s latest %s" % (earliestCommit, latestCommit)
2650             next = read_pipe("git rev-list --bisect %s %s" % (latestCommit, earliestCommit)).strip()
2651             if len(next) == 0:
2652                 if self.verbose:
2653                     print "argh"
2654                 return ""
2655             log = extractLogMessageFromGitCommit(next)
2656             settings = extractSettingsGitLog(log)
2657             currentChange = int(settings['change'])
2658             if self.verbose:
2659                 print "current change %s" % currentChange
2660
2661             if currentChange == change:
2662                 if self.verbose:
2663                     print "found %s" % next
2664                 return next
2665
2666             if currentChange < change:
2667                 earliestCommit = "^%s" % next
2668             else:
2669                 latestCommit = "%s" % next
2670
2671         return ""
2672
2673     def importNewBranch(self, branch, maxChange):
2674         # make fast-import flush all changes to disk and update the refs using the checkpoint
2675         # command so that we can try to find the branch parent in the git history
2676         self.gitStream.write("checkpoint\n\n");
2677         self.gitStream.flush();
2678         branchPrefix = self.depotPaths[0] + branch + "/"
2679         range = "@1,%s" % maxChange
2680         #print "prefix" + branchPrefix
2681         changes = p4ChangesForPaths([branchPrefix], range, self.changes_block_size)
2682         if len(changes) <= 0:
2683             return False
2684         firstChange = changes[0]
2685         #print "first change in branch: %s" % firstChange
2686         sourceBranch = self.knownBranches[branch]
2687         sourceDepotPath = self.depotPaths[0] + sourceBranch
2688         sourceRef = self.gitRefForBranch(sourceBranch)
2689         #print "source " + sourceBranch
2690
2691         branchParentChange = int(p4Cmd(["changes", "-m", "1", "%s...@1,%s" % (sourceDepotPath, firstChange)])["change"])
2692         #print "branch parent: %s" % branchParentChange
2693         gitParent = self.gitCommitByP4Change(sourceRef, branchParentChange)
2694         if len(gitParent) > 0:
2695             self.initialParents[self.gitRefForBranch(branch)] = gitParent
2696             #print "parent git commit: %s" % gitParent
2697
2698         self.importChanges(changes)
2699         return True
2700
2701     def searchParent(self, parent, branch, target):
2702         parentFound = False
2703         for blob in read_pipe_lines(["git", "rev-list", "--reverse",
2704                                      "--no-merges", parent]):
2705             blob = blob.strip()
2706             if len(read_pipe(["git", "diff-tree", blob, target])) == 0:
2707                 parentFound = True
2708                 if self.verbose:
2709                     print "Found parent of %s in commit %s" % (branch, blob)
2710                 break
2711         if parentFound:
2712             return blob
2713         else:
2714             return None
2715
2716     def importChanges(self, changes):
2717         cnt = 1
2718         for change in changes:
2719             description = p4_describe(change)
2720             self.updateOptionDict(description)
2721
2722             if not self.silent:
2723                 sys.stdout.write("\rImporting revision %s (%s%%)" % (change, cnt * 100 / len(changes)))
2724                 sys.stdout.flush()
2725             cnt = cnt + 1
2726
2727             try:
2728                 if self.detectBranches:
2729                     branches = self.splitFilesIntoBranches(description)
2730                     for branch in branches.keys():
2731                         ## HACK  --hwn
2732                         branchPrefix = self.depotPaths[0] + branch + "/"
2733                         self.branchPrefixes = [ branchPrefix ]
2734
2735                         parent = ""
2736
2737                         filesForCommit = branches[branch]
2738
2739                         if self.verbose:
2740                             print "branch is %s" % branch
2741
2742                         self.updatedBranches.add(branch)
2743
2744                         if branch not in self.createdBranches:
2745                             self.createdBranches.add(branch)
2746                             parent = self.knownBranches[branch]
2747                             if parent == branch:
2748                                 parent = ""
2749                             else:
2750                                 fullBranch = self.projectName + branch
2751                                 if fullBranch not in self.p4BranchesInGit:
2752                                     if not self.silent:
2753                                         print("\n    Importing new branch %s" % fullBranch);
2754                                     if self.importNewBranch(branch, change - 1):
2755                                         parent = ""
2756                                         self.p4BranchesInGit.append(fullBranch)
2757                                     if not self.silent:
2758                                         print("\n    Resuming with change %s" % change);
2759
2760                                 if self.verbose:
2761                                     print "parent determined through known branches: %s" % parent
2762
2763                         branch = self.gitRefForBranch(branch)
2764                         parent = self.gitRefForBranch(parent)
2765
2766                         if self.verbose:
2767                             print "looking for initial parent for %s; current parent is %s" % (branch, parent)
2768
2769                         if len(parent) == 0 and branch in self.initialParents:
2770                             parent = self.initialParents[branch]
2771                             del self.initialParents[branch]
2772
2773                         blob = None
2774                         if len(parent) > 0:
2775                             tempBranch = "%s/%d" % (self.tempBranchLocation, change)
2776                             if self.verbose:
2777                                 print "Creating temporary branch: " + tempBranch
2778                             self.commit(description, filesForCommit, tempBranch)
2779                             self.tempBranches.append(tempBranch)
2780                             self.checkpoint()
2781                             blob = self.searchParent(parent, branch, tempBranch)
2782                         if blob:
2783                             self.commit(description, filesForCommit, branch, blob)
2784                         else:
2785                             if self.verbose:
2786                                 print "Parent of %s not found. Committing into head of %s" % (branch, parent)
2787                             self.commit(description, filesForCommit, branch, parent)
2788                 else:
2789                     files = self.extractFilesFromCommit(description)
2790                     self.commit(description, files, self.branch,
2791                                 self.initialParent)
2792                     # only needed once, to connect to the previous commit
2793                     self.initialParent = ""
2794             except IOError:
2795                 print self.gitError.read()
2796                 sys.exit(1)
2797
2798     def importHeadRevision(self, revision):
2799         print "Doing initial import of %s from revision %s into %s" % (' '.join(self.depotPaths), revision, self.branch)
2800
2801         details = {}
2802         details["user"] = "git perforce import user"
2803         details["desc"] = ("Initial import of %s from the state at revision %s\n"
2804                            % (' '.join(self.depotPaths), revision))
2805         details["change"] = revision
2806         newestRevision = 0
2807
2808         fileCnt = 0
2809         fileArgs = ["%s...%s" % (p,revision) for p in self.depotPaths]
2810
2811         for info in p4CmdList(["files"] + fileArgs):
2812
2813             if 'code' in info and info['code'] == 'error':
2814                 sys.stderr.write("p4 returned an error: %s\n"
2815                                  % info['data'])
2816                 if info['data'].find("must refer to client") >= 0:
2817                     sys.stderr.write("This particular p4 error is misleading.\n")
2818                     sys.stderr.write("Perhaps the depot path was misspelled.\n");
2819                     sys.stderr.write("Depot path:  %s\n" % " ".join(self.depotPaths))
2820                 sys.exit(1)
2821             if 'p4ExitCode' in info:
2822                 sys.stderr.write("p4 exitcode: %s\n" % info['p4ExitCode'])
2823                 sys.exit(1)
2824
2825
2826             change = int(info["change"])
2827             if change > newestRevision:
2828                 newestRevision = change
2829
2830             if info["action"] in self.delete_actions:
2831                 # don't increase the file cnt, otherwise details["depotFile123"] will have gaps!
2832                 #fileCnt = fileCnt + 1
2833                 continue
2834
2835             for prop in ["depotFile", "rev", "action", "type" ]:
2836                 details["%s%s" % (prop, fileCnt)] = info[prop]
2837
2838             fileCnt = fileCnt + 1
2839
2840         details["change"] = newestRevision
2841
2842         # Use time from top-most change so that all git p4 clones of
2843         # the same p4 repo have the same commit SHA1s.
2844         res = p4_describe(newestRevision)
2845         details["time"] = res["time"]
2846
2847         self.updateOptionDict(details)
2848         try:
2849             self.commit(details, self.extractFilesFromCommit(details), self.branch)
2850         except IOError:
2851             print "IO error with git fast-import. Is your git version recent enough?"
2852             print self.gitError.read()
2853
2854
2855     def run(self, args):
2856         self.depotPaths = []
2857         self.changeRange = ""
2858         self.previousDepotPaths = []
2859         self.hasOrigin = False
2860
2861         # map from branch depot path to parent branch
2862         self.knownBranches = {}
2863         self.initialParents = {}
2864
2865         if self.importIntoRemotes:
2866             self.refPrefix = "refs/remotes/p4/"
2867         else:
2868             self.refPrefix = "refs/heads/p4/"
2869
2870         if self.syncWithOrigin:
2871             self.hasOrigin = originP4BranchesExist()
2872             if self.hasOrigin:
2873                 if not self.silent:
2874                     print 'Syncing with origin first, using "git fetch origin"'
2875                 system("git fetch origin")
2876
2877         branch_arg_given = bool(self.branch)
2878         if len(self.branch) == 0:
2879             self.branch = self.refPrefix + "master"
2880             if gitBranchExists("refs/heads/p4") and self.importIntoRemotes:
2881                 system("git update-ref %s refs/heads/p4" % self.branch)
2882                 system("git branch -D p4")
2883
2884         # accept either the command-line option, or the configuration variable
2885         if self.useClientSpec:
2886             # will use this after clone to set the variable
2887             self.useClientSpec_from_options = True
2888         else:
2889             if gitConfigBool("git-p4.useclientspec"):
2890                 self.useClientSpec = True
2891         if self.useClientSpec:
2892             self.clientSpecDirs = getClientSpec()
2893
2894         # TODO: should always look at previous commits,
2895         # merge with previous imports, if possible.
2896         if args == []:
2897             if self.hasOrigin:
2898                 createOrUpdateBranchesFromOrigin(self.refPrefix, self.silent)
2899
2900             # branches holds mapping from branch name to sha1
2901             branches = p4BranchesInGit(self.importIntoRemotes)
2902
2903             # restrict to just this one, disabling detect-branches
2904             if branch_arg_given:
2905                 short = self.branch.split("/")[-1]
2906                 if short in branches:
2907                     self.p4BranchesInGit = [ short ]
2908             else:
2909                 self.p4BranchesInGit = branches.keys()
2910
2911             if len(self.p4BranchesInGit) > 1:
2912                 if not self.silent:
2913                     print "Importing from/into multiple branches"
2914                 self.detectBranches = True
2915                 for branch in branches.keys():
2916                     self.initialParents[self.refPrefix + branch] = \
2917                         branches[branch]
2918
2919             if self.verbose:
2920                 print "branches: %s" % self.p4BranchesInGit
2921
2922             p4Change = 0
2923             for branch in self.p4BranchesInGit:
2924                 logMsg =  extractLogMessageFromGitCommit(self.refPrefix + branch)
2925
2926                 settings = extractSettingsGitLog(logMsg)
2927
2928                 self.readOptions(settings)
2929                 if (settings.has_key('depot-paths')
2930                     and settings.has_key ('change')):
2931                     change = int(settings['change']) + 1
2932                     p4Change = max(p4Change, change)
2933
2934                     depotPaths = sorted(settings['depot-paths'])
2935                     if self.previousDepotPaths == []:
2936                         self.previousDepotPaths = depotPaths
2937                     else:
2938                         paths = []
2939                         for (prev, cur) in zip(self.previousDepotPaths, depotPaths):
2940                             prev_list = prev.split("/")
2941                             cur_list = cur.split("/")
2942                             for i in range(0, min(len(cur_list), len(prev_list))):
2943                                 if cur_list[i] <> prev_list[i]:
2944                                     i = i - 1
2945                                     break
2946
2947                             paths.append ("/".join(cur_list[:i + 1]))
2948
2949                         self.previousDepotPaths = paths
2950
2951             if p4Change > 0:
2952                 self.depotPaths = sorted(self.previousDepotPaths)
2953                 self.changeRange = "@%s,#head" % p4Change
2954                 if not self.silent and not self.detectBranches:
2955                     print "Performing incremental import into %s git branch" % self.branch
2956
2957         # accept multiple ref name abbreviations:
2958         #    refs/foo/bar/branch -> use it exactly
2959         #    p4/branch -> prepend refs/remotes/ or refs/heads/
2960         #    branch -> prepend refs/remotes/p4/ or refs/heads/p4/
2961         if not self.branch.startswith("refs/"):
2962             if self.importIntoRemotes:
2963                 prepend = "refs/remotes/"
2964             else:
2965                 prepend = "refs/heads/"
2966             if not self.branch.startswith("p4/"):
2967                 prepend += "p4/"
2968             self.branch = prepend + self.branch
2969
2970         if len(args) == 0 and self.depotPaths:
2971             if not self.silent:
2972                 print "Depot paths: %s" % ' '.join(self.depotPaths)
2973         else:
2974             if self.depotPaths and self.depotPaths != args:
2975                 print ("previous import used depot path %s and now %s was specified. "
2976                        "This doesn't work!" % (' '.join (self.depotPaths),
2977                                                ' '.join (args)))
2978                 sys.exit(1)
2979
2980             self.depotPaths = sorted(args)
2981
2982         revision = ""
2983         self.users = {}
2984
2985         # Make sure no revision specifiers are used when --changesfile
2986         # is specified.
2987         bad_changesfile = False
2988         if len(self.changesFile) > 0:
2989             for p in self.depotPaths:
2990                 if p.find("@") >= 0 or p.find("#") >= 0:
2991                     bad_changesfile = True
2992                     break
2993         if bad_changesfile:
2994             die("Option --changesfile is incompatible with revision specifiers")
2995
2996         newPaths = []
2997         for p in self.depotPaths:
2998             if p.find("@") != -1:
2999                 atIdx = p.index("@")
3000                 self.changeRange = p[atIdx:]
3001                 if self.changeRange == "@all":
3002                     self.changeRange = ""
3003                 elif ',' not in self.changeRange:
3004                     revision = self.changeRange
3005                     self.changeRange = ""
3006                 p = p[:atIdx]
3007             elif p.find("#") != -1:
3008                 hashIdx = p.index("#")
3009                 revision = p[hashIdx:]
3010                 p = p[:hashIdx]
3011             elif self.previousDepotPaths == []:
3012                 # pay attention to changesfile, if given, else import
3013                 # the entire p4 tree at the head revision
3014                 if len(self.changesFile) == 0:
3015                     revision = "#head"
3016
3017             p = re.sub ("\.\.\.$", "", p)
3018             if not p.endswith("/"):
3019                 p += "/"
3020
3021             newPaths.append(p)
3022
3023         self.depotPaths = newPaths
3024
3025         # --detect-branches may change this for each branch
3026         self.branchPrefixes = self.depotPaths
3027
3028         self.loadUserMapFromCache()
3029         self.labels = {}
3030         if self.detectLabels:
3031             self.getLabels();
3032
3033         if self.detectBranches:
3034             ## FIXME - what's a P4 projectName ?
3035             self.projectName = self.guessProjectName()
3036
3037             if self.hasOrigin:
3038                 self.getBranchMappingFromGitBranches()
3039             else:
3040                 self.getBranchMapping()
3041             if self.verbose:
3042                 print "p4-git branches: %s" % self.p4BranchesInGit
3043                 print "initial parents: %s" % self.initialParents
3044             for b in self.p4BranchesInGit:
3045                 if b != "master":
3046
3047                     ## FIXME
3048                     b = b[len(self.projectName):]
3049                 self.createdBranches.add(b)
3050
3051         self.tz = "%+03d%02d" % (- time.timezone / 3600, ((- time.timezone % 3600) / 60))
3052
3053         self.importProcess = subprocess.Popen(["git", "fast-import"],
3054                                               stdin=subprocess.PIPE,
3055                                               stdout=subprocess.PIPE,
3056                                               stderr=subprocess.PIPE);
3057         self.gitOutput = self.importProcess.stdout
3058         self.gitStream = self.importProcess.stdin
3059         self.gitError = self.importProcess.stderr
3060
3061         if revision:
3062             self.importHeadRevision(revision)
3063         else:
3064             changes = []
3065
3066             if len(self.changesFile) > 0:
3067                 output = open(self.changesFile).readlines()
3068                 changeSet = set()
3069                 for line in output:
3070                     changeSet.add(int(line))
3071
3072                 for change in changeSet:
3073                     changes.append(change)
3074
3075                 changes.sort()
3076             else:
3077                 # catch "git p4 sync" with no new branches, in a repo that
3078                 # does not have any existing p4 branches
3079                 if len(args) == 0:
3080                     if not self.p4BranchesInGit:
3081                         die("No remote p4 branches.  Perhaps you never did \"git p4 clone\" in here.")
3082
3083                     # The default branch is master, unless --branch is used to
3084                     # specify something else.  Make sure it exists, or complain
3085                     # nicely about how to use --branch.
3086                     if not self.detectBranches:
3087                         if not branch_exists(self.branch):
3088                             if branch_arg_given:
3089                                 die("Error: branch %s does not exist." % self.branch)
3090                             else:
3091                                 die("Error: no branch %s; perhaps specify one with --branch." %
3092                                     self.branch)
3093
3094                 if self.verbose:
3095                     print "Getting p4 changes for %s...%s" % (', '.join(self.depotPaths),
3096                                                               self.changeRange)
3097                 changes = p4ChangesForPaths(self.depotPaths, self.changeRange, self.changes_block_size)
3098
3099                 if len(self.maxChanges) > 0:
3100                     changes = changes[:min(int(self.maxChanges), len(changes))]
3101
3102             if len(changes) == 0:
3103                 if not self.silent:
3104                     print "No changes to import!"
3105             else:
3106                 if not self.silent and not self.detectBranches:
3107                     print "Import destination: %s" % self.branch
3108
3109                 self.updatedBranches = set()
3110
3111                 if not self.detectBranches:
3112                     if args:
3113                         # start a new branch
3114                         self.initialParent = ""
3115                     else:
3116                         # build on a previous revision
3117                         self.initialParent = parseRevision(self.branch)
3118
3119                 self.importChanges(changes)
3120
3121                 if not self.silent:
3122                     print ""
3123                     if len(self.updatedBranches) > 0:
3124                         sys.stdout.write("Updated branches: ")
3125                         for b in self.updatedBranches:
3126                             sys.stdout.write("%s " % b)
3127                         sys.stdout.write("\n")
3128
3129         if gitConfigBool("git-p4.importLabels"):
3130             self.importLabels = True
3131
3132         if self.importLabels:
3133             p4Labels = getP4Labels(self.depotPaths)
3134             gitTags = getGitTags()
3135
3136             missingP4Labels = p4Labels - gitTags
3137             self.importP4Labels(self.gitStream, missingP4Labels)
3138
3139         self.gitStream.close()
3140         if self.importProcess.wait() != 0:
3141             die("fast-import failed: %s" % self.gitError.read())
3142         self.gitOutput.close()
3143         self.gitError.close()
3144
3145         # Cleanup temporary branches created during import
3146         if self.tempBranches != []:
3147             for branch in self.tempBranches:
3148                 read_pipe("git update-ref -d %s" % branch)
3149             os.rmdir(os.path.join(os.environ.get("GIT_DIR", ".git"), self.tempBranchLocation))
3150
3151         # Create a symbolic ref p4/HEAD pointing to p4/<branch> to allow
3152         # a convenient shortcut refname "p4".
3153         if self.importIntoRemotes:
3154             head_ref = self.refPrefix + "HEAD"
3155             if not gitBranchExists(head_ref) and gitBranchExists(self.branch):
3156                 system(["git", "symbolic-ref", head_ref, self.branch])
3157
3158         return True
3159
class P4Rebase(Command):
    """Implements "git p4 rebase": sync from Perforce, then rebase onto it."""

    def __init__(self):
        Command.__init__(self)
        self.options = [
                optparse.make_option("--import-labels", dest="importLabels", action="store_true"),
        ]
        self.importLabels = False
        self.description = ("Fetches the latest revision from perforce and "
                            + "rebases the current work (branch) against it")

    def run(self, args):
        """Run a P4Sync without arguments, then rebase the current branch.

        args is accepted for the Command interface but is not used here.
        Returns whatever rebase() returns.
        """
        sync = P4Sync()
        sync.importLabels = self.importLabels
        sync.run([])

        return self.rebase()

    def rebase(self):
        """Rebase the current branch onto its upstream p4 branch point.

        Calls die() when the index cannot be refreshed, when there are
        uncommitted changes, or when no upstream branch point is found.
        Returns True after the rebase and the summary diff have been run.
        """
        if os.system("git update-index --refresh") != 0:
            die("Some files in your working directory are modified and different than what is in your index. You can use git update-index <filename> to bring the index up-to-date or stash away all your changes with git stash.")
        if len(read_pipe("git diff-index HEAD --")) > 0:
            die("You have uncommitted changes. Please commit them before rebasing or stash them away with git stash.")

        # Only the branch name is needed; the settings half is ignored.
        upstream, _settings = findUpstreamBranchPoint()
        if len(upstream) == 0:
            die("Cannot find upstream branchpoint for rebase")

        # the branchpoint may be p4/foo~3, so strip off the parent
        upstream = re.sub("~[0-9]+$", "", upstream)

        print("Rebasing the current branch onto %s" % upstream)
        oldHead = read_pipe("git rev-parse HEAD").strip()
        # Hand git an argument list rather than an interpolated shell string,
        # so characters such as "$" or ";" in a ref name are never interpreted
        # by a shell.
        system(["git", "rebase", upstream])
        system(["git", "diff-tree", "--stat", "--summary", "-M", oldHead, "HEAD", "--"])
        return True
3195
class P4Clone(P4Sync):
    """Implements "git p4 clone": create a repository and import into it."""

    def __init__(self):
        P4Sync.__init__(self)
        self.description = "Creates a new git repository and imports from Perforce into it"
        self.usage = "usage: %prog [options] //depot/path[@revRange]"
        self.options += [
            optparse.make_option("--destination", dest="cloneDestination",
                                 action='store', default=None,
                                 help="where to leave result of the clone"),
            optparse.make_option("--bare", dest="cloneBare",
                                 action="store_true", default=False),
        ]
        self.cloneDestination = None
        self.cloneBare = False
        # The repository does not exist yet when the command starts.
        self.needsGit = False

    def defaultDestination(self, args):
        """Derive a directory name from the first depot path in args.

        A trailing "@..." or "#..." specifier, a trailing "..." and a
        trailing "/" are removed (in that order); the last path component of
        what remains is returned.
        """
        ## TODO: use common prefix of args?
        name = args[0]
        for trailing in ("(@[^@]*)$", "(#[^#]*)$", r"\.\.\.$", r"/$"):
            name = re.sub(trailing, "", name)
        return os.path.basename(name)

    def run(self, args):
        """Create the destination repository and sync the depot paths into it.

        Returns False when no arguments are given, when a depot path does
        not start with "//", or when P4Sync.run() reports failure; returns
        True otherwise.  Raises CalledProcessError if "git init" fails.
        """
        if not args:
            return False

        if self.keepRepoPath and not self.cloneDestination:
            sys.stderr.write("Must specify destination for --keep-path\n")
            sys.exit(1)

        # With several positional arguments and no --destination, the last
        # argument names the destination directory.
        sources = args
        if len(sources) > 1 and not self.cloneDestination:
            self.cloneDestination = sources[-1]
            sources = sources[:-1]

        self.cloneExclude = ["/" + excluded for excluded in self.cloneExclude]
        for source in sources:
            if source.startswith("//"):
                continue
            sys.stderr.write('Depot paths must start with "//": %s\n' % source)
            return False

        if not self.cloneDestination:
            self.cloneDestination = self.defaultDestination(args)

        print("Importing from %s into %s" % (', '.join(sources), self.cloneDestination))

        if not os.path.exists(self.cloneDestination):
            os.makedirs(self.cloneDestination)
        chdir(self.cloneDestination)

        initCommand = ["git", "init"]
        if self.cloneBare:
            initCommand.append("--bare")
        status = subprocess.call(initCommand)
        if status != 0:
            raise CalledProcessError(status, initCommand)

        if not P4Sync.run(self, sources):
            return False

        # create a master branch and check out a work tree
        if not gitBranchExists(self.branch):
            print('Not checking out any branch, use "git checkout -q -b master <branch>"')
        else:
            system(["git", "branch", "master", self.branch])
            if not self.cloneBare:
                system(["git", "checkout", "-f"])

        # auto-set this variable if invoked with --use-client-spec
        if self.useClientSpec_from_options:
            system("git config --bool git-p4.useclientspec true")

        return True
3274
class P4Branches(Command):
    """Implements "git p4 branches": list p4 remote branches and their depot paths."""

    def __init__(self):
        Command.__init__(self)
        self.options = []
        self.description = ("Shows the git branches that hold imports and their "
                            "corresponding perforce depot paths")
        self.verbose = False

    def run(self, args):
        """Print one "<branch> <= <depot paths> (<change>)" line per p4 remote.

        args is not used.  Always returns True.
        """
        if originP4BranchesExist():
            createOrUpdateBranchesFromOrigin()

        for ref in read_pipe_lines("git rev-parse --symbolic  --remotes"):
            ref = ref.strip()

            # Only remotes under p4/ are of interest; p4/HEAD is skipped.
            if ref == "p4/HEAD" or not ref.startswith('p4/'):
                continue

            commitLog = extractLogMessageFromGitCommit("refs/remotes/%s" % ref)
            settings = extractSettingsGitLog(commitLog)
            depotPaths = ",".join(settings["depot-paths"])

            print("%s <= %s (%s)" % (ref, depotPaths, settings["change"]))
        return True
3302
class HelpFormatter(optparse.IndentedHelpFormatter):
    """Indented help formatter that emits the description text unchanged."""

    def __init__(self):
        optparse.IndentedHelpFormatter.__init__(self)

    def format_description(self, description):
        """Return description followed by a newline, or "" if it is empty."""
        if not description:
            return ""
        return description + "\n"
3312
def printUsage(commands):
    """Print the top-level usage text, listing the given command names."""
    program = sys.argv[0]
    print("usage: %s <command> [options]" % program)
    print("")
    print("valid commands: %s" % ", ".join(commands))
    print("")
    print("Try %s <command> --help for command specific help." % program)
    print("")
3320
# Sub-command name given on the command line -> class implementing it.
# "submit" and "commit" both map to P4Submit.
commands = {
    "debug": P4Debug,
    "submit": P4Submit,
    "commit": P4Submit,
    "sync": P4Sync,
    "rebase": P4Rebase,
    "clone": P4Clone,
    "rollback": P4RollBack,
    "branches": P4Branches,
}
3331
3332
def main():
    """Parse the command line and run the requested git-p4 sub-command.

    sys.argv[1] selects an entry of the commands table; the remaining
    arguments are parsed with that command's option list plus --verbose
    (and --git-dir for commands whose needsGit is true).  Parsed option
    values are stored directly on the command instance.

    Exits with status 2 when no command or an unknown command is given, or
    when the command's run() returns a false value (after printing help).
    """
    global verbose

    if len(sys.argv) < 2:
        printUsage(commands.keys())
        sys.exit(2)

    cmdName = sys.argv[1]
    # Only the table lookup is guarded: a KeyError raised while constructing
    # the command must not be reported as an unknown command.
    try:
        klass = commands[cmdName]
    except KeyError:
        print("unknown command %s" % cmdName)
        print("")
        printUsage(commands.keys())
        sys.exit(2)
    cmd = klass()

    options = cmd.options
    cmd.gitdir = os.environ.get("GIT_DIR", None)

    options.append(optparse.make_option("--verbose", "-v", dest="verbose", action="store_true"))
    if cmd.needsGit:
        options.append(optparse.make_option("--git-dir", dest="gitdir"))

    parser = optparse.OptionParser(cmd.usage.replace("%prog", "%prog " + cmdName),
                                   options,
                                   description = cmd.description,
                                   formatter = HelpFormatter())

    # The command object is passed as the values holder, so each option's
    # dest becomes an attribute of cmd.
    (cmd, args) = parser.parse_args(sys.argv[2:], cmd)
    verbose = cmd.verbose
    if cmd.needsGit:
        if cmd.gitdir is None:
            # Neither GIT_DIR nor --git-dir was given: try ./.git first, then
            # ask git and move to the top of the work tree.
            cmd.gitdir = os.path.abspath(".git")
            if not isValidGitDir(cmd.gitdir):
                cmd.gitdir = read_pipe("git rev-parse --git-dir").strip()
                if os.path.exists(cmd.gitdir):
                    cdup = read_pipe("git rev-parse --show-cdup").strip()
                    if len(cdup) > 0:
                        chdir(cdup)

        if not isValidGitDir(cmd.gitdir):
            if isValidGitDir(cmd.gitdir + "/.git"):
                cmd.gitdir += "/.git"
            else:
                die("fatal: cannot locate git repository at %s" % cmd.gitdir)

        os.environ["GIT_DIR"] = cmd.gitdir

    if not cmd.run(args):
        parser.print_help()
        sys.exit(2)
3386
3387
# Run the command-line entry point only when executed as a script.
if __name__ == "__main__":
    main()