1 """Python GIT interface
5 Copyright (C) 2005, Catalin Marinas <catalin.marinas@gmail.com>
7 This program is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License version 2 as
9 published by the Free Software Foundation.
11 This program is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with this program; if not, write to the Free Software
18 Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
21 import sys, os, re, gitmergeonefile
22 from shutil import copyfile
24 from stgit import basedir
25 from stgit.utils import *
26 from stgit.out import *
27 from stgit.run import *
28 from stgit.config import config
31 class GitException(Exception):
34 # When a subprocess has a problem, we want the exception to be a
35 # subclass of GitException.
36 class GitRunException(GitException):
47 """An author, committer, etc."""
48 def __init__(self, name = None, email = None, date = '',
50 self.name = self.email = self.date = None
51 if name or email or date:
57 assert not (name or email or date)
59 m = re.match(r'^(.+)<(.+)>(.*)$', s)
61 return [x.strip() or None for x in m.groups()]
62 self.name, self.email, self.date = parse_desc(desc)
63 def set_name(self, val):
66 def set_email(self, val):
69 def set_date(self, val):
73 if self.name and self.email:
74 return '%s <%s>' % (self.name, self.email)
76 raise GitException, 'not enough identity data'
79 """Handle the commit objects
81 def __init__(self, id_hash):
82 self.__id_hash = id_hash
84 lines = GRun('git-cat-file', 'commit', id_hash).output_lines()
85 for i in range(len(lines)):
88 break # we've seen all the header fields
89 key, val = line.split(' ', 1)
94 elif key == 'committer':
95 self.__committer = val
97 pass # ignore other headers
98 self.__log = '\n'.join(lines[i+1:])
def get_id_hash(self):
    """Return the id hash this commit object was created with."""
    commit_hash = self.__id_hash
    return commit_hash
106 def get_parent(self):
107 parents = self.get_parents()
def get_parents(self):
    """Return the parent ids of this commit as a list of strings.

    Runs 'git-rev-list --parents --max-count=1' on this commit's id and
    returns every whitespace-separated field of the single output line
    except the first one.
    """
    rev_list = GRun('git-rev-list', '--parents', '--max-count=1',
                    self.__id_hash)
    fields = rev_list.output_one_line().split()
    return fields[1:]
117 def get_author(self):
def get_committer(self):
    """Return the value of the 'committer' header read from the commit."""
    committer = self.__committer
    return committer
127 return self.get_id_hash()
129 # dictionary of Commit objects, used to avoid multiple calls to git
136 def get_commit(id_hash):
137 """Commit objects factory. Save/look-up them in the __commits
142 if id_hash in __commits:
143 return __commits[id_hash]
145 commit = Commit(id_hash)
146 __commits[id_hash] = commit
150 """Return the list of file conflicts
152 conflicts_file = os.path.join(basedir.get(), 'conflicts')
153 if os.path.isfile(conflicts_file):
154 f = file(conflicts_file)
155 names = [line.strip() for line in f.readlines()]
162 files = [os.path.join(basedir.get(), 'info', 'exclude')]
163 user_exclude = config.get('core.excludesfile')
165 files.append(user_exclude)
168 def tree_status(files = None, tree_id = 'HEAD', unknown = False,
169 noexclude = True, verbose = False, diff_flags = []):
170 """Get the status of all changed files, or of a selected set of
171 files. Returns a list of pairs - (status, filename).
173 If 'files' is None, it will check all files, and optionally all
174 unknown files. If 'files' is a list, it will only check the files
177 assert files == None or not unknown
180 out.start('Checking for changes in the working directory')
188 cmd = ['git-ls-files', '-z', '--others', '--directory',
189 '--no-empty-directory']
191 cmd += ['--exclude=%s' % s for s in
192 ['*.[ao]', '*.pyc', '.*', '*~', '#*', 'TAGS', 'tags']]
193 cmd += ['--exclude-per-directory=.gitignore']
194 cmd += ['--exclude-from=%s' % fn
195 for fn in exclude_files()
196 if os.path.exists(fn)]
198 lines = GRun(*cmd).raw_output().split('\0')
199 cache_files += [('?', line) for line in lines if line]
202 conflicts = get_conflicts()
205 cache_files += [('C', filename) for filename in conflicts
206 if files == None or filename in files]
209 args = diff_flags + [tree_id]
211 args += ['--'] + files
212 for line in GRun('git-diff-index', *args).output_lines():
213 fs = tuple(line.rstrip().split(' ',4)[-1].split('\t',1))
214 if fs[1] not in conflicts:
215 cache_files.append(fs)
220 assert files == None or set(f for s,f in cache_files) <= set(files)
def local_changes(verbose = True):
    """Tell whether there are local changes in the tree.

    Returns True when tree_status() reports at least one entry; 'verbose'
    is passed through to tree_status() unchanged.
    """
    changed = tree_status(verbose = verbose)
    return len(changed) > 0
230 hr = re.compile(r'^[0-9a-f]{40} refs/heads/(.+)$')
231 for line in GRun('git-show-ref', '--heads').output_lines():
233 heads.append(m.group(1))
240 """Verifies the HEAD and returns the SHA1 id that represents it
245 __head = rev_parse('HEAD')
249 """Returns the name of the file pointed to by the HEAD link
251 return strip_prefix('refs/heads/',
252 GRun('git-symbolic-ref', 'HEAD').output_one_line())
254 def set_head_file(ref):
255 """Resets HEAD to point to a new ref
257 # head cache flushing is needed since we might have a different value
261 GRun('git-symbolic-ref', 'HEAD', 'refs/heads/%s' % ref).run()
262 except GitRunException:
263 raise GitException, 'Could not set head to "%s"' % ref
def set_ref(ref, val):
    """Point 'ref' at the commit object 'val' using git-update-ref.

    Raises GitException if the git-update-ref run fails.
    """
    try:
        updater = GRun('git-update-ref', ref, val)
        updater.run()
    except GitRunException:
        # report subprocess failures as the generic GitException
        raise GitException('Could not update %s to "%s".' % (ref, val))
def set_branch(branch, val):
    """Point the branch head 'refs/heads/<branch>' at 'val' (see set_ref)."""
    branch_ref = 'refs/heads/%s' % branch
    set_ref(branch_ref, val)
276 """Sets the HEAD value
280 if not __head or __head != val:
284 # only allow SHA1 hashes
285 assert(len(__head) == 40)
287 def __clear_head_cache():
288 """Sets the __head to None so that a re-read is forced
295 """Refresh index with stat() information from the working directory.
297 GRun('git-update-index', '-q', '--unmerged', '--refresh').run()
def rev_parse(git_id):
    """Parse 'git_id' and return the verified SHA1 id it names.

    The id is resolved with 'git-rev-parse --verify'. Raises GitException
    ('Unknown revision: ...') if that command fails.
    """
    try:
        verifier = GRun('git-rev-parse', '--verify', git_id)
        return verifier.output_one_line()
    except GitRunException:
        raise GitException('Unknown revision: %s' % git_id)
def branch_exists(branch):
    """Return ref_exists() for the branch head 'refs/heads/<branch>'."""
    branch_ref = 'refs/heads/%s' % branch
    return ref_exists(branch_ref)
317 def create_branch(new_branch, tree_id = None):
318 """Create a new branch in the git repository
320 if branch_exists(new_branch):
321 raise GitException, 'Branch "%s" already exists' % new_branch
323 current_head = get_head()
324 set_head_file(new_branch)
325 __set_head(current_head)
327 # a checkout isn't needed if new branch points to the current head
331 if os.path.isfile(os.path.join(basedir.get(), 'MERGE_HEAD')):
332 os.remove(os.path.join(basedir.get(), 'MERGE_HEAD'))
334 def switch_branch(new_branch):
335 """Switch to a git branch
339 if not branch_exists(new_branch):
340 raise GitException, 'Branch "%s" does not exist' % new_branch
342 tree_id = rev_parse('refs/heads/%s^{commit}' % new_branch)
343 if tree_id != get_head():
346 GRun('git-read-tree', '-u', '-m', get_head(), tree_id).run()
347 except GitRunException:
348 raise GitException, 'git-read-tree failed (local changes maybe?)'
350 set_head_file(new_branch)
352 if os.path.isfile(os.path.join(basedir.get(), 'MERGE_HEAD')):
353 os.remove(os.path.join(basedir.get(), 'MERGE_HEAD'))
356 if not ref_exists(ref):
357 raise GitException, '%s does not exist' % ref
358 sha1 = GRun('git-show-ref', '-s', ref).output_one_line()
360 GRun('git-update-ref', '-d', ref, sha1).run()
361 except GitRunException:
362 raise GitException, 'Failed to delete ref %s' % ref
def delete_branch(name):
    """Delete the branch 'name' by deleting its 'refs/heads/<name>' ref."""
    branch_ref = 'refs/heads/%s' % name
    delete_ref(branch_ref)
def rename_ref(from_ref, to_ref):
    """Rename the ref 'from_ref' to 'to_ref'.

    The new ref is created at the old ref's SHA1 first, then the old ref
    is deleted. Raises GitException if 'from_ref' does not exist, if
    'to_ref' already exists, or if either git-update-ref step fails.
    """
    if not ref_exists(from_ref):
        raise GitException('"%s" does not exist' % from_ref)
    if ref_exists(to_ref):
        raise GitException('"%s" already exists' % to_ref)

    sha1 = GRun('git-show-ref', '-s', from_ref).output_one_line()

    # (git-update-ref arguments, failure message template, ref to report);
    # the steps run in this order and the first failure aborts the rename
    steps = (
        ((to_ref, sha1, '0'*40), 'Failed to create new ref %s', to_ref),
        (('-d', from_ref, sha1), 'Failed to delete ref %s', from_ref),
    )
    for update_args, failure, reported_ref in steps:
        try:
            GRun('git-update-ref', *update_args).run()
        except GitRunException:
            raise GitException(failure % reported_ref)
def rename_branch(from_name, to_name):
    """Rename the git branch 'from_name' to 'to_name'.

    The branch ref is renamed first. If HEAD currently names the old
    branch it is switched to the new one, and when a reflog entry for the
    old branch exists under logs/refs/heads it is handed to rename().
    """
    old_ref = 'refs/heads/%s' % from_name
    new_ref = 'refs/heads/%s' % to_name
    rename_ref(old_ref, new_ref)

    if get_head_file() == from_name:
        set_head_file(to_name)

    heads_log_dir = os.path.join(basedir.get(), 'logs', 'refs', 'heads')
    if not os.path.exists(heads_log_dir):
        return
    if os.path.exists(os.path.join(heads_log_dir, from_name)):
        rename(heads_log_dir, from_name, to_name)
394 """Add the files or recursively add the directory contents
396 # generate the file list
399 if not os.path.exists(i):
400 raise GitException, 'Unknown file or directory: %s' % i
403 # recursive search. We only add files
404 for root, dirs, local_files in os.walk(i):
405 for name in [os.path.join(root, f) for f in local_files]:
406 if os.path.isfile(name):
407 files.append(os.path.normpath(name))
408 elif os.path.isfile(i):
409 files.append(os.path.normpath(i))
411 raise GitException, '%s is not a file or directory' % i
415 GRun('git-update-index', '--add', '--').xargs(files)
416 except GitRunException:
417 raise GitException, 'Unable to add file'
419 def __copy_single(source, target, target2=''):
420 """Copy file or dir named 'source' to name target+target2"""
422 # "source" (file or dir) must match one or more git-controlled file
423 realfiles = GRun('git-ls-files', source).output_lines()
424 if len(realfiles) == 0:
425 raise GitException, '"%s" matches no git-controled files' % source
427 if os.path.isdir(source):
428 # physically copy the files, and record them to add them in one run
430 re_string='^'+source+'/(.*)$'
431 prefix_regexp = re.compile(re_string)
432 for f in [f.strip() for f in realfiles]:
433 m = prefix_regexp.match(f)
435 raise Exception, '"%s" does not match "%s"' % (f, re_string)
436 newname = target+target2+'/'+m.group(1)
437 if not os.path.exists(os.path.dirname(newname)):
438 os.makedirs(os.path.dirname(newname))
440 newfiles.append(newname)
443 else: # files, symlinks, ...
444 newname = target+target2
445 copyfile(source, newname)
def copy(filespecs, target):
    """Copy the entries named in 'filespecs' to 'target'.

    If 'target' is an existing directory, every entry is copied into it
    under its own base name; none of those names may exist there yet.
    Otherwise 'target' must not exist, exactly one entry must be given and
    the directory part of 'target' (if any) must already exist.

    Raises GitException when any of these conditions is violated.
    """
    if not os.path.isdir(target):
        if os.path.exists(target):
            raise GitException('Target "%s" exists but is not a directory' % target)
        if len(filespecs) != 1:
            raise GitException('Cannot copy more than one file to non-directory')

        # here there is a single source and the target does not exist yet;
        # the directory meant to hold it has to be present already
        parent = os.path.dirname(target)
        if parent != '' and not os.path.isdir(parent):
            raise GitException('Target directory "%s" does not exist' % parent)

        __copy_single(filespecs[0].rstrip('/'), target)
        return

    # the target is a directory: each entry on the command line is copied
    # into it under the same name
    target = target.rstrip('/')

    # refuse to start if any destination entry already exists
    for spec in filespecs:
        candidate = target+ '/' + os.path.basename(spec.rstrip('/'))
        if os.path.exists(candidate):
            raise GitException('Target "%s" already exists' % candidate)

    for spec in filespecs:
        stripped = spec.rstrip('/')
        __copy_single(stripped, target, '/' + os.path.basename(stripped))
483 def rm(files, force = False):
484 """Remove a file from the repository
488 if os.path.exists(f):
489 raise GitException, '%s exists. Remove it first' %f
491 GRun('git-update-index', '--remove', '--').xargs(files)
494 GRun('git-update-index', '--force-remove', '--').xargs(files)
502 """Return the user information.
506 name=config.get('user.name')
507 email=config.get('user.email')
508 __user = Person(name, email)
512 """Return the author information.
517 # the environment variables take priority over config
519 date = os.environ['GIT_AUTHOR_DATE']
522 __author = Person(os.environ['GIT_AUTHOR_NAME'],
523 os.environ['GIT_AUTHOR_EMAIL'],
530 """Return the author information.
535 # the environment variables take priority over config
537 date = os.environ['GIT_COMMITTER_DATE']
540 __committer = Person(os.environ['GIT_COMMITTER_NAME'],
541 os.environ['GIT_COMMITTER_EMAIL'],
547 def update_cache(files = None, force = False):
548 """Update the cache information for the given files
550 cache_files = tree_status(files, verbose = False)
552 # everything is up-to-date
553 if len(cache_files) == 0:
556 # check for unresolved conflicts
557 if not force and [x for x in cache_files
558 if x[0] not in ['M', 'N', 'A', 'D']]:
559 raise GitException, 'Updating cache failed: unresolved conflicts'
562 add_files = [x[1] for x in cache_files if x[0] in ['N', 'A']]
563 rm_files = [x[1] for x in cache_files if x[0] in ['D']]
564 m_files = [x[1] for x in cache_files if x[0] in ['M']]
566 GRun('git-update-index', '--add', '--').xargs(add_files)
567 GRun('git-update-index', '--force-remove', '--').xargs(rm_files)
568 GRun('git-update-index', '--').xargs(m_files)
572 def commit(message, files = None, parents = None, allowempty = False,
573 cache_update = True, tree_id = None, set_head = False,
574 author_name = None, author_email = None, author_date = None,
575 committer_name = None, committer_email = None):
576 """Commit the current tree to repository
581 # Get the tree status
582 if cache_update and parents != []:
583 changes = update_cache(files)
584 if not changes and not allowempty:
585 raise GitException, 'No changes to commit'
587 # get the commit message
590 elif message[-1:] != '\n':
593 # write the index to repository
595 tree_id = GRun('git-write-tree').output_one_line()
601 env['GIT_AUTHOR_NAME'] = author_name
603 env['GIT_AUTHOR_EMAIL'] = author_email
605 env['GIT_AUTHOR_DATE'] = author_date
607 env['GIT_COMMITTER_NAME'] = committer_name
609 env['GIT_COMMITTER_EMAIL'] = committer_email
610 commit_id = GRun('git-commit-tree', tree_id,
611 *sum([['-p', p] for p in parents], [])
612 ).env(env).raw_input(message).output_one_line()
614 __set_head(commit_id)
618 def apply_diff(rev1, rev2, check_index = True, files = None):
619 """Apply the diff between rev1 and rev2 onto the current
620 index. This function doesn't need to raise an exception since it
621 is only used for fast-pushing a patch. If this operation fails,
622 the pushing would fall back to the three-way merge.
625 index_opt = ['--index']
632 diff_str = diff(files, rev1, rev2)
635 GRun('git-apply', *index_opt).raw_input(
636 diff_str).discard_stderr().no_output()
637 except GitRunException:
642 def merge(base, head1, head2, recursive = False):
643 """Perform a 3-way merge between base, head1 and head2 into the
650 # this operation tracks renames but it is slower (used in
651 # general when pushing or picking patches)
653 # discard output to mask the verbose prints of the tool
654 GRun('git-merge-recursive', base, '--', head1, head2
656 except GitRunException, ex:
660 # the fast case where we don't track renames (used when the
661 # distance between base and heads is small, i.e. folding or
662 # synchronising patches)
664 GRun('git-read-tree', '-u', '-m', '--aggressive',
665 base, head1, head2).run()
666 except GitRunException:
667 raise GitException, 'git-read-tree failed (local changes maybe?)'
669 # check the index for unmerged entries
671 stages_re = re.compile('^([0-7]+) ([0-9a-f]{40}) ([1-3])\t(.*)$', re.S)
673 for line in GRun('git-ls-files', '--unmerged', '--stage', '-z'
674 ).raw_output().split('\0'):
678 mode, hash, stage, path = stages_re.findall(line)[0]
680 if not path in files:
682 files[path]['1'] = ('', '')
683 files[path]['2'] = ('', '')
684 files[path]['3'] = ('', '')
686 files[path][stage] = (mode, hash)
688 if err_output and not files:
689 # if no unmerged files, there was probably a different type of
690 # error and we have to abort the merge
691 raise GitException, err_output
693 # merge the unmerged files
696 # remove additional files that might be generated for some
697 # newer versions of GIT
698 for suffix in [base, head1, head2]:
701 fname = path + '~' + suffix
702 if os.path.exists(fname):
706 if gitmergeonefile.merge(stages['1'][1], stages['2'][1],
707 stages['3'][1], path, stages['1'][0],
708 stages['2'][0], stages['3'][0]) != 0:
712 raise GitException, 'GIT index merging failed (possible conflicts)'
714 def status(files = None, modified = False, new = False, deleted = False,
715 conflict = False, unknown = False, noexclude = False,
717 """Show the tree status
719 cache_files = tree_status(files,
720 unknown = (files == None),
721 noexclude = noexclude,
722 diff_flags = diff_flags)
723 filtered = (modified or new or deleted or conflict or unknown)
738 cache_files = [x for x in cache_files if x[0] in filestat]
740 for fs in cache_files:
741 assert files == None or fs[1] in files
743 out.stdout('%s %s' % (fs[0], fs[1]))
745 out.stdout('%s' % fs[1])
747 def diff(files = None, rev1 = 'HEAD', rev2 = None, diff_flags = []):
748 """Show the diff between rev1 and rev2
754 return GRun('git-diff-tree', '-p',
755 *(diff_flags + [rev1, rev2, '--'] + files)).raw_output()
759 return GRun('git-diff-index', '-p', '-R',
760 *(diff_flags + [rev2, '--'] + files)).raw_output()
762 return GRun('git-diff-index', '-p',
763 *(diff_flags + [rev1, '--'] + files)).raw_output()
# TODO: take another parameter representing a diff string as we
# usually invoke git.diff() from the calling functions
def diffstat(files = None, rev1 = 'HEAD', rev2 = None):
    """Return the diffstat between rev1 and rev2.

    The text produced by diff(files, rev1, rev2) is fed to
    'git-apply --stat --summary' and that command's raw output is returned.
    """
    stat_cmd = GRun('git-apply', '--stat', '--summary')
    patch_text = diff(files, rev1, rev2)
    return stat_cmd.raw_input(patch_text).raw_output()
774 def files(rev1, rev2, diff_flags = []):
775 """Return the files modified between rev1 and rev2
779 for line in GRun('git-diff-tree', *(diff_flags + ['-r', rev1, rev2])
781 result.append('%s %s' % tuple(line.split(' ', 4)[-1].split('\t', 1)))
783 return '\n'.join(result)
def barefiles(rev1, rev2):
    """Return the files modified between rev1 and rev2, without status info.

    The result is a single string with one file name per line, taken from
    the output of 'git-diff-tree -r rev1 rev2'.
    """
    tree_diff = GRun('git-diff-tree', '-r', rev1, rev2)
    # keep what follows the last tab-separated status column of each line
    names = [entry.split(' ', 4)[-1].split('\t', 1)[-1]
             for entry in tree_diff.output_lines()]
    return '\n'.join(names)
795 def pretty_commit(commit_id = 'HEAD', diff_flags = []):
796 """Return a given commit (log + diff)
798 return GRun('git-diff-tree',
800 + ['--cc', '--always', '--pretty', '-r', commit_id])
803 def checkout(files = None, tree_id = None, force = False):
804 """Check out the given or all files
808 GRun('git-read-tree', '--reset', tree_id).run()
809 except GitRunException:
810 raise GitException, 'Failed git-read-tree --reset %s' % tree_id
812 cmd = ['git-checkout-index', '-q', '-u']
816 GRun(*(cmd + ['--'])).xargs(files)
818 GRun(*(cmd + ['-a'])).run()
820 def switch(tree_id, keep = False):
821 """Switch the tree to the given id
826 GRun('git-read-tree', '-u', '-m', get_head(), tree_id).run()
827 except GitRunException:
828 raise GitException, 'git-read-tree failed (local changes maybe?)'
832 def reset(files = None, tree_id = None, check_out = True):
833 """Revert the tree changes relative to the given tree_id. It removes
840 cache_files = tree_status(files, tree_id)
841 # files which were added but need to be removed
842 rm_files = [x[1] for x in cache_files if x[0] in ['A']]
844 checkout(files, tree_id, True)
845 # checkout doesn't remove files
846 map(os.remove, rm_files)
848 # if the reset refers to the whole tree, switch the HEAD as well
852 def fetch(repository = 'origin', refspec = None):
853 """Fetches changes from the remote repository, using 'git-fetch'
863 command = config.get('branch.%s.stgit.fetchcmd' % get_head_file()) or \
864 config.get('stgit.fetchcmd')
865 GRun(*(command.split() + args)).run()
867 def pull(repository = 'origin', refspec = None):
868 """Fetches changes from the remote repository, using 'git-pull'
878 command = config.get('branch.%s.stgit.pullcmd' % get_head_file()) or \
879 config.get('stgit.pullcmd')
880 GRun(*(command.split() + args)).run()
883 """Repack all objects into a single pack
885 GRun('git-repack', '-a', '-d', '-f').run()
887 def apply_patch(filename = None, diff = None, base = None,
889 """Apply a patch onto the current or given index. There must not
890 be any local changes in the tree, otherwise the command fails
902 orig_head = get_head()
908 GRun('git-apply', '--index').raw_input(diff).no_output()
909 except GitRunException:
913 # write the failed diff to a file
914 f = file('.stgit-failed.patch', 'w+')
917 out.warn('Diff written to the .stgit-failed.patch file')
922 top = commit(message = 'temporary commit used for applying a patch',
925 merge(base, orig_head, top)
def clone(repository, local_dir):
    """Clone the remote 'repository' into 'local_dir' by running git-clone."""
    cloner = GRun('git-clone', repository, local_dir)
    cloner.run()
933 def modifying_revs(files, base_rev, head_rev):
934 """Return the revisions from the list modifying the given files."""
935 return GRun('git-rev-list', '%s..%s' % (base_rev, head_rev), '--', *files
def refspec_localpart(refspec):
    """Return the local part of a refspec, i.e. the text after the colon.

    'refspec' must consist of two colon-free parts separated by exactly
    one colon; either part may be empty.

    Raises GitException if 'refspec' does not have that form.
    """
    m = re.match(r'^[^:]*:([^:]*)$', refspec)
    if m is None:
        # the message must quote the 'refspec' argument itself
        raise GitException('Cannot parse refspec "%s"' % refspec)
    return m.group(1)
def refspec_remotepart(refspec):
    """Return the remote part of a refspec, i.e. the text before the colon.

    'refspec' must consist of two colon-free parts separated by exactly
    one colon; either part may be empty.

    Raises GitException if 'refspec' does not have that form.
    """
    m = re.match(r'^([^:]*):[^:]*$', refspec)
    if m is None:
        # the message must quote the 'refspec' argument itself
        raise GitException('Cannot parse refspec "%s"' % refspec)
    return m.group(1)
def __remotes_from_config():
    """Return config.sections_matching() for the 'remote.<name>.url' keys."""
    url_key_pattern = r'remote\.(.*)\.url'
    return config.sections_matching(url_key_pattern)
956 def __remotes_from_dir(dir):
957 d = os.path.join(basedir.get(), dir)
958 if os.path.exists(d):
964 """Return the list of remotes in the repository
966 return (set(__remotes_from_config())
967 | set(__remotes_from_dir('remotes'))
968 | set(__remotes_from_dir('branches')))
970 def remotes_local_branches(remote):
971 """Returns the list of local branches fetched from given remote
975 if remote in __remotes_from_config():
976 for line in config.getall('remote.%s.fetch' % remote):
977 branches.append(refspec_localpart(line))
978 elif remote in __remotes_from_dir('remotes'):
979 stream = open(os.path.join(basedir.get(), 'remotes', remote), 'r')
981 # Only consider Pull lines
982 m = re.match('^Pull: (.*)\n$', line)
984 branches.append(refspec_localpart(m.group(1)))
986 elif remote in __remotes_from_dir('branches'):
987 # old-style branches only declare one branch
988 branches.append('refs/heads/'+remote);
990 raise GitException, 'Unknown remote "%s"' % remote
994 def identify_remote(branchname):
995 """Return the name for the remote to pull the given branchname
996 from, or None if we believe it is a local branch.
999 for remote in remotes_list():
1000 if branchname in remotes_local_branches(remote):
1003 # if we get here we've found nothing, the branch is a local one
1007 """Return the git id for the tip of the parent branch as left by
1012 stream = open(os.path.join(basedir.get(), 'FETCH_HEAD'), "r")
1014 # Only consider lines not tagged not-for-merge
1015 m = re.match('^([^\t]*)\t\t', line)
1018 raise GitException, "StGit does not support multiple FETCH_HEAD"
1020 fetch_head=m.group(1)
1023 # here we are sure to have a single fetch_head
1027 """Return a list of all refs in the current repository.
1030 return [line.split()[1] for line in GRun('git-show-ref').output_lines()]