1 """Python GIT interface
5 Copyright (C) 2005, Catalin Marinas <catalin.marinas@gmail.com>
7 This program is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License version 2 as
9 published by the Free Software Foundation.
11 This program is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with this program; if not, write to the Free Software
18 Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
21 import sys, os, re, gitmergeonefile
22 from shutil import copyfile
24 from stgit import basedir
25 from stgit.utils import *
26 from stgit.out import *
27 from stgit.run import *
28 from stgit.config import config
32 class GitException(Exception):
35 # When a subprocess has a problem, we want the exception to be a
36 # subclass of GitException.
37 class GitRunException(GitException):
48 """An author, committer, etc."""
49 def __init__(self, name = None, email = None, date = '',
51 self.name = self.email = self.date = None
52 if name or email or date:
58 assert not (name or email or date)
60 m = re.match(r'^(.+)<(.+)>(.*)$', s)
62 return [x.strip() or None for x in m.groups()]
63 self.name, self.email, self.date = parse_desc(desc)
64 def set_name(self, val):
67 def set_email(self, val):
70 def set_date(self, val):
74 if self.name and self.email:
75 return '%s <%s>' % (self.name, self.email)
77 raise GitException, 'not enough identity data'
80 """Handle the commit objects
82 def __init__(self, id_hash):
83 self.__id_hash = id_hash
85 lines = GRun('git-cat-file', 'commit', id_hash).output_lines()
86 for i in range(len(lines)):
89 break # we've seen all the header fields
90 key, val = line.split(' ', 1)
95 elif key == 'committer':
96 self.__committer = val
98 pass # ignore other headers
99 self.__log = '\n'.join(lines[i+1:])
101 def get_id_hash(self):
102 return self.__id_hash
107 def get_parent(self):
108 parents = self.get_parents()
114 def get_parents(self):
115 return GRun('git-rev-list', '--parents', '--max-count=1', self.__id_hash
116 ).output_one_line().split()[1:]
118 def get_author(self):
121 def get_committer(self):
122 return self.__committer
128 return self.get_id_hash()
130 # dictionary of Commit objects, used to avoid multiple calls to git
137 def get_commit(id_hash):
138 """Commit objects factory. Save/look-up them in the __commits
143 if id_hash in __commits:
144 return __commits[id_hash]
146 commit = Commit(id_hash)
147 __commits[id_hash] = commit
151 """Return the list of file conflicts
153 conflicts_file = os.path.join(basedir.get(), 'conflicts')
154 if os.path.isfile(conflicts_file):
155 f = file(conflicts_file)
156 names = [line.strip() for line in f.readlines()]
163 files = [os.path.join(basedir.get(), 'info', 'exclude')]
164 user_exclude = config.get('core.excludesfile')
166 files.append(user_exclude)
169 def tree_status(files = None, tree_id = 'HEAD', unknown = False,
170 noexclude = True, verbose = False, diff_flags = []):
171 """Returns a list of pairs - (status, filename)
174 out.start('Checking for changes in the working directory')
184 cmd = ['git-ls-files', '-z', '--others', '--directory',
185 '--no-empty-directory']
187 cmd += ['--exclude=%s' % s for s in
188 ['*.[ao]', '*.pyc', '.*', '*~', '#*', 'TAGS', 'tags']]
189 cmd += ['--exclude-per-directory=.gitignore']
190 cmd += ['--exclude-from=%s' % fn
191 for fn in exclude_files()
192 if os.path.exists(fn)]
194 lines = GRun(*cmd).raw_output().split('\0')
195 cache_files += [('?', line) for line in lines if line]
198 conflicts = get_conflicts()
201 cache_files += [('C', filename) for filename in conflicts]
204 for line in GRun('git-diff-index', *(diff_flags + [tree_id, '--'] + files)
206 fs = tuple(line.rstrip().split(' ',4)[-1].split('\t',1))
207 if fs[1] not in conflicts:
208 cache_files.append(fs)
def local_changes(verbose = True):
    """Tell whether tree_status() reports any entry for the tree.

    'verbose' is forwarded to tree_status() unchanged; every other
    argument of tree_status() keeps its default value.  Returns True
    when at least one (status, filename) pair is reported, False
    otherwise.
    """
    reported = tree_status(verbose = verbose)
    return len(reported) > 0
222 hr = re.compile(r'^[0-9a-f]{40} refs/heads/(.+)$')
223 for line in GRun('git-show-ref', '--heads').output_lines():
225 heads.append(m.group(1))
232 """Verifies the HEAD and returns the SHA1 id that represents it
237 __head = rev_parse('HEAD')
241 """Returns the name of the file pointed to by the HEAD link
243 return strip_prefix('refs/heads/',
244 GRun('git-symbolic-ref', 'HEAD').output_one_line())
246 def set_head_file(ref):
247 """Resets HEAD to point to a new ref
249 # head cache flushing is needed since we might have a different value
253 GRun('git-symbolic-ref', 'HEAD', 'refs/heads/%s' % ref).run()
254 except GitRunException:
255 raise GitException, 'Could not set head to "%s"' % ref
def set_ref(ref, val):
    """Point ref at a new commit object.

    Runs 'git-update-ref <ref> <val>'.  Raises GitException when the
    command raises GitRunException.
    """
    try:
        GRun('git-update-ref', ref, val).run()
    except GitRunException:
        # call form of raise: equivalent to "raise E, msg" on Python 2,
        # and the only spelling that still parses on Python 3
        raise GitException('Could not update %s to "%s".' % (ref, val))
def set_branch(branch, val):
    """Point the branch head 'refs/heads/<branch>' at val via set_ref()."""
    branch_ref = 'refs/heads/%s' % branch
    set_ref(branch_ref, val)
268 """Sets the HEAD value
272 if not __head or __head != val:
276 # only allow SHA1 hashes
277 assert(len(__head) == 40)
279 def __clear_head_cache():
280 """Sets the __head to None so that a re-read is forced
287 """Refresh index with stat() information from the working directory.
289 GRun('git-update-index', '-q', '--unmerged', '--refresh').run()
def rev_parse(git_id):
    """Parse the string and return a verified SHA1 id

    The value returned is the single output line of
    'git-rev-parse --verify <git_id>'.  Raises GitException
    ('Unknown revision: ...') when that command raises GitRunException.
    """
    try:
        return GRun('git-rev-parse', '--verify', git_id).output_one_line()
    except GitRunException:
        # call form of raise: equivalent to "raise E, msg" on Python 2,
        # and the only spelling that still parses on Python 3
        raise GitException('Unknown revision: %s' % git_id)
def branch_exists(branch):
    """Return the result of ref_exists() for 'refs/heads/<branch>'."""
    head_ref = 'refs/heads/%s' % branch
    return ref_exists(head_ref)
309 def create_branch(new_branch, tree_id = None):
310 """Create a new branch in the git repository
312 if branch_exists(new_branch):
313 raise GitException, 'Branch "%s" already exists' % new_branch
315 current_head = get_head()
316 set_head_file(new_branch)
317 __set_head(current_head)
319 # a checkout isn't needed if new branch points to the current head
323 if os.path.isfile(os.path.join(basedir.get(), 'MERGE_HEAD')):
324 os.remove(os.path.join(basedir.get(), 'MERGE_HEAD'))
326 def switch_branch(new_branch):
327 """Switch to a git branch
331 if not branch_exists(new_branch):
332 raise GitException, 'Branch "%s" does not exist' % new_branch
334 tree_id = rev_parse('refs/heads/%s^{commit}' % new_branch)
335 if tree_id != get_head():
338 GRun('git-read-tree', '-u', '-m', get_head(), tree_id).run()
339 except GitRunException:
340 raise GitException, 'git-read-tree failed (local changes maybe?)'
342 set_head_file(new_branch)
344 if os.path.isfile(os.path.join(basedir.get(), 'MERGE_HEAD')):
345 os.remove(os.path.join(basedir.get(), 'MERGE_HEAD'))
348 if not ref_exists(ref):
349 raise GitException, '%s does not exist' % ref
350 sha1 = GRun('git-show-ref', '-s', ref).output_one_line()
352 GRun('git-update-ref', '-d', ref, sha1).run()
353 except GitRunException:
354 raise GitException, 'Failed to delete ref %s' % ref
def delete_branch(name):
    """Delete the branch head 'refs/heads/<name>' through delete_ref()."""
    branch_ref = 'refs/heads/%s' % name
    delete_ref(branch_ref)
def rename_ref(from_ref, to_ref):
    """Rename a ref: create to_ref at from_ref's id, then delete from_ref.

    Raises GitException if from_ref does not exist, if to_ref already
    exists, or if either 'git-update-ref' invocation raises
    GitRunException.  If the deletion step fails, to_ref has already
    been created and is left in place.
    """
    if not ref_exists(from_ref):
        raise GitException('"%s" does not exist' % from_ref)
    if ref_exists(to_ref):
        raise GitException('"%s" already exists' % to_ref)

    sha1 = GRun('git-show-ref', '-s', from_ref).output_one_line()
    try:
        # an all-zero <oldvalue> asks git-update-ref to succeed only if
        # to_ref does not exist yet
        GRun('git-update-ref', to_ref, sha1, '0'*40).run()
    except GitRunException:
        raise GitException('Failed to create new ref %s' % to_ref)
    try:
        # passing sha1 as <oldvalue> deletes from_ref only if it still
        # holds the value that was just copied
        GRun('git-update-ref', '-d', from_ref, sha1).run()
    except GitRunException:
        raise GitException('Failed to delete ref %s' % from_ref)
def rename_branch(from_name, to_name):
    """Rename a git branch.

    Renames the head ref, re-points HEAD when the renamed branch was the
    current one, and renames the branch's reflog entry when one exists.
    """
    old_ref = 'refs/heads/%s' % from_name
    new_ref = 'refs/heads/%s' % to_name
    rename_ref(old_ref, new_ref)

    # keep HEAD attached to the branch if it is the one being renamed
    if get_head_file() == from_name:
        set_head_file(to_name)

    # carry the reflog over to the new name, when there is one
    reflog_dir = os.path.join(basedir.get(), 'logs', 'refs', 'heads')
    if not os.path.exists(reflog_dir):
        return
    if os.path.exists(os.path.join(reflog_dir, from_name)):
        rename(reflog_dir, from_name, to_name)
386 """Add the files or recursively add the directory contents
388 # generate the file list
391 if not os.path.exists(i):
392 raise GitException, 'Unknown file or directory: %s' % i
395 # recursive search. We only add files
396 for root, dirs, local_files in os.walk(i):
397 for name in [os.path.join(root, f) for f in local_files]:
398 if os.path.isfile(name):
399 files.append(os.path.normpath(name))
400 elif os.path.isfile(i):
401 files.append(os.path.normpath(i))
403 raise GitException, '%s is not a file or directory' % i
407 GRun('git-update-index', '--add', '--').xargs(files)
408 except GitRunException:
409 raise GitException, 'Unable to add file'
411 def __copy_single(source, target, target2=''):
412 """Copy file or dir named 'source' to name target+target2"""
414 # "source" (file or dir) must match one or more git-controlled file
415 realfiles = GRun('git-ls-files', source).output_lines()
416 if len(realfiles) == 0:
417 raise GitException, '"%s" matches no git-controled files' % source
419 if os.path.isdir(source):
420 # physically copy the files, and record them to add them in one run
422 re_string='^'+source+'/(.*)$'
423 prefix_regexp = re.compile(re_string)
424 for f in [f.strip() for f in realfiles]:
425 m = prefix_regexp.match(f)
427 raise Exception, '"%s" does not match "%s"' % (f, re_string)
428 newname = target+target2+'/'+m.group(1)
429 if not os.path.exists(os.path.dirname(newname)):
430 os.makedirs(os.path.dirname(newname))
432 newfiles.append(newname)
435 else: # files, symlinks, ...
436 newname = target+target2
437 copyfile(source, newname)
def copy(filespecs, target):
    """Copy the given files or directories to target.

    If target is an existing directory, every entry of filespecs is
    copied into it under its own basename.  Otherwise filespecs must
    hold exactly one entry, which is copied to the new name target;
    the directory part of target, if any, must already exist.

    The actual copying is delegated to __copy_single().

    Raises GitException when a destination entry already exists, when
    target exists but is not a directory, when several filespecs are
    given for a non-directory target, or when the target directory is
    missing.
    """
    if os.path.isdir(target):
        # target is a directory: copy each entry on the command line,
        # with the same name, into the target
        target = target.rstrip('/')

        # first, check that none of the children of the target
        # matching the command line already exist, so that nothing is
        # copied if any of them would clash
        for filespec in filespecs:
            entry = target+ '/' + os.path.basename(filespec.rstrip('/'))
            if os.path.exists(entry):
                raise GitException('Target "%s" already exists' % entry)

        for filespec in filespecs:
            filespec = filespec.rstrip('/')
            basename = '/' + os.path.basename(filespec)
            __copy_single(filespec, target, basename)

    elif os.path.exists(target):
        raise GitException('Target "%s" exists but is not a directory' % target)
    elif len(filespecs) != 1:
        raise GitException('Cannot copy more than one file to non-directory')

    else:
        # at this point: len(filespecs)==1 and target does not exist

        # check target directory
        targetdir = os.path.dirname(target)
        if targetdir != '' and not os.path.isdir(targetdir):
            raise GitException('Target directory "%s" does not exist' % targetdir)

        __copy_single(filespecs[0].rstrip('/'), target)
475 def rm(files, force = False):
476 """Remove a file from the repository
480 if os.path.exists(f):
481 raise GitException, '%s exists. Remove it first' %f
483 GRun('git-update-index', '--remove', '--').xargs(files)
486 GRun('git-update-index', '--force-remove', '--').xargs(files)
494 """Return the user information.
498 name=config.get('user.name')
499 email=config.get('user.email')
500 __user = Person(name, email)
504 """Return the author information.
509 # the environment variables take priority over config
511 date = os.environ['GIT_AUTHOR_DATE']
514 __author = Person(os.environ['GIT_AUTHOR_NAME'],
515 os.environ['GIT_AUTHOR_EMAIL'],
522 """Return the author information.
527 # the environment variables take priority over config
529 date = os.environ['GIT_COMMITTER_DATE']
532 __committer = Person(os.environ['GIT_COMMITTER_NAME'],
533 os.environ['GIT_COMMITTER_EMAIL'],
539 def update_cache(files = None, force = False):
540 """Update the cache information for the given files
545 cache_files = tree_status(files, verbose = False)
547 # everything is up-to-date
548 if len(cache_files) == 0:
551 # check for unresolved conflicts
552 if not force and [x for x in cache_files
553 if x[0] not in ['M', 'N', 'A', 'D']]:
554 raise GitException, 'Updating cache failed: unresolved conflicts'
557 add_files = [x[1] for x in cache_files if x[0] in ['N', 'A']]
558 rm_files = [x[1] for x in cache_files if x[0] in ['D']]
559 m_files = [x[1] for x in cache_files if x[0] in ['M']]
561 GRun('git-update-index', '--add', '--').xargs(add_files)
562 GRun('git-update-index', '--force-remove', '--').xargs(rm_files)
563 GRun('git-update-index', '--').xargs(m_files)
567 def commit(message, files = None, parents = None, allowempty = False,
568 cache_update = True, tree_id = None, set_head = False,
569 author_name = None, author_email = None, author_date = None,
570 committer_name = None, committer_email = None):
571 """Commit the current tree to repository
578 # Get the tree status
579 if cache_update and parents != []:
580 changes = update_cache(files)
581 if not changes and not allowempty:
582 raise GitException, 'No changes to commit'
584 # get the commit message
587 elif message[-1:] != '\n':
590 # write the index to repository
592 tree_id = GRun('git-write-tree').output_one_line()
598 env['GIT_AUTHOR_NAME'] = author_name
600 env['GIT_AUTHOR_EMAIL'] = author_email
602 env['GIT_AUTHOR_DATE'] = author_date
604 env['GIT_COMMITTER_NAME'] = committer_name
606 env['GIT_COMMITTER_EMAIL'] = committer_email
607 commit_id = GRun('git-commit-tree', tree_id,
608 *sum([['-p', p] for p in parents], [])
609 ).env(env).raw_input(message).output_one_line()
611 __set_head(commit_id)
615 def apply_diff(rev1, rev2, check_index = True, files = None):
616 """Apply the diff between rev1 and rev2 onto the current
617 index. This function doesn't need to raise an exception since it
618 is only used for fast-pushing a patch. If this operation fails,
619 the pushing would fall back to the three-way merge.
622 index_opt = ['--index']
629 diff_str = diff(files, rev1, rev2)
632 GRun('git-apply', *index_opt).raw_input(diff_str).no_output()
633 except GitRunException:
638 def merge(base, head1, head2, recursive = False):
639 """Perform a 3-way merge between base, head1 and head2 into the
646 # this operation tracks renames but it is slower (used in
647 # general when pushing or picking patches)
649 # discard output to mask the verbose prints of the tool
650 GRun('git-merge-recursive', base, '--', head1, head2
652 except GitRunException, ex:
656 # the fast case where we don't track renames (used when the
657 # distance between base and heads is small, i.e. folding or
658 # synchronising patches)
660 GRun('git-read-tree', '-u', '-m', '--aggressive',
661 base, head1, head2).run()
662 except GitRunException:
663 raise GitException, 'git-read-tree failed (local changes maybe?)'
665 # check the index for unmerged entries
667 stages_re = re.compile('^([0-7]+) ([0-9a-f]{40}) ([1-3])\t(.*)$', re.S)
669 for line in GRun('git-ls-files', '--unmerged', '--stage', '-z'
670 ).raw_output().split('\0'):
674 mode, hash, stage, path = stages_re.findall(line)[0]
676 if not path in files:
678 files[path]['1'] = ('', '')
679 files[path]['2'] = ('', '')
680 files[path]['3'] = ('', '')
682 files[path][stage] = (mode, hash)
684 if err_output and not files:
685 # if no unmerged files, there was probably a different type of
686 # error and we have to abort the merge
687 raise GitException, err_output
689 # merge the unmerged files
692 # remove additional files that might be generated for some
693 # newer versions of GIT
694 for suffix in [base, head1, head2]:
697 fname = path + '~' + suffix
698 if os.path.exists(fname):
702 if gitmergeonefile.merge(stages['1'][1], stages['2'][1],
703 stages['3'][1], path, stages['1'][0],
704 stages['2'][0], stages['3'][0]) != 0:
708 raise GitException, 'GIT index merging failed (possible conflicts)'
710 def status(files = None, modified = False, new = False, deleted = False,
711 conflict = False, unknown = False, noexclude = False,
713 """Show the tree status
718 cache_files = tree_status(files, unknown = True, noexclude = noexclude,
719 diff_flags = diff_flags)
720 all = not (modified or new or deleted or conflict or unknown)
735 cache_files = [x for x in cache_files if x[0] in filestat]
737 for fs in cache_files:
738 if files and not fs[1] in files:
741 out.stdout('%s %s' % (fs[0], fs[1]))
743 out.stdout('%s' % fs[1])
745 def diff(files = None, rev1 = 'HEAD', rev2 = None, diff_flags = []):
746 """Show the diff between rev1 and rev2
752 return GRun('git-diff-tree', '-p',
753 *(diff_flags + [rev1, rev2, '--'] + files)).raw_output()
757 return GRun('git-diff-index', '-p', '-R',
758 *(diff_flags + [rev2, '--'] + files)).raw_output()
760 return GRun('git-diff-index', '-p',
761 *(diff_flags + [rev1, '--'] + files)).raw_output()
def diffstat(files = None, rev1 = 'HEAD', rev2 = None):
    """Return the diffstat between rev1 and rev2.

    The text produced by diff(files, rev1, rev2) is fed to
    'git-apply --stat' and that command's raw output is returned.
    """
    stat_cmd = GRun('git-apply', '--stat')
    patch_text = diff(files, rev1, rev2)
    return stat_cmd.raw_input(patch_text).raw_output()
770 def files(rev1, rev2, diff_flags = []):
771 """Return the files modified between rev1 and rev2
775 for line in GRun('git-diff-tree', *(diff_flags + ['-r', rev1, rev2])
777 result.append('%s %s' % tuple(line.split(' ', 4)[-1].split('\t', 1)))
779 return '\n'.join(result)
def barefiles(rev1, rev2):
    """Return the files modified between rev1 and rev2, without status info

    The result is one string with the entries joined by newlines.
    """
    diff_lines = GRun('git-diff-tree', '-r', rev1, rev2).output_lines()
    # for every output line: drop the first four space-separated fields,
    # then keep only what follows the first tab of the remainder
    names = [entry.split(' ', 4)[-1].split('\t', 1)[-1]
             for entry in diff_lines]
    return '\n'.join(names)
791 def pretty_commit(commit_id = 'HEAD', diff_flags = []):
792 """Return a given commit (log + diff)
794 return GRun('git-diff-tree',
796 + ['--cc', '--always', '--pretty', '-r', commit_id])
799 def checkout(files = None, tree_id = None, force = False):
800 """Check out the given or all files
804 GRun('git-read-tree', '--reset', tree_id).run()
805 except GitRunException:
806 raise GitException, 'Failed git-read-tree --reset %s' % tree_id
808 cmd = ['git-checkout-index', '-q', '-u']
812 GRun(*(cmd + ['--'])).xargs(files)
814 GRun(*(cmd + ['-a'])).run()
816 def switch(tree_id, keep = False):
817 """Switch the tree to the given id
822 GRun('git-read-tree', '-u', '-m', get_head(), tree_id).run()
823 except GitRunException:
824 raise GitException, 'git-read-tree failed (local changes maybe?)'
828 def reset(files = None, tree_id = None, check_out = True):
829 """Revert the tree changes relative to the given tree_id. It removes
836 cache_files = tree_status(files, tree_id)
837 # files which were added but need to be removed
838 rm_files = [x[1] for x in cache_files if x[0] in ['A']]
840 checkout(files, tree_id, True)
841 # checkout doesn't remove files
842 map(os.remove, rm_files)
844 # if the reset refers to the whole tree, switch the HEAD as well
848 def fetch(repository = 'origin', refspec = None):
849 """Fetches changes from the remote repository, using 'git-fetch'
859 command = config.get('branch.%s.stgit.fetchcmd' % get_head_file()) or \
860 config.get('stgit.fetchcmd')
861 GRun(*(command.split() + args)).run()
863 def pull(repository = 'origin', refspec = None):
864 """Fetches changes from the remote repository, using 'git-pull'
874 command = config.get('branch.%s.stgit.pullcmd' % get_head_file()) or \
875 config.get('stgit.pullcmd')
876 GRun(*(command.split() + args)).run()
879 """Repack all objects into a single pack
881 GRun('git-repack', '-a', '-d', '-f').run()
883 def apply_patch(filename = None, diff = None, base = None,
885 """Apply a patch onto the current or given index. There must not
886 be any local changes in the tree, otherwise the command fails
898 orig_head = get_head()
904 GRun('git-apply', '--index').raw_input(diff).no_output()
905 except GitRunException:
909 # write the failed diff to a file
910 f = file('.stgit-failed.patch', 'w+')
913 out.warn('Diff written to the .stgit-failed.patch file')
918 top = commit(message = 'temporary commit used for applying a patch',
921 merge(base, orig_head, top)
def clone(repository, local_dir):
    """Clone a remote repository into local_dir by running 'git-clone'."""
    clone_cmd = GRun('git-clone', repository, local_dir)
    clone_cmd.run()
929 def modifying_revs(files, base_rev, head_rev):
930 """Return the revisions from the list modifying the given files."""
931 return GRun('git-rev-list', '%s..%s' % (base_rev, head_rev), '--', *files
def refspec_localpart(refspec):
    """Return the part of a refspec that follows its ':' separator.

    The refspec must contain exactly one ':'; either side may be empty.
    Raises GitException if it does not have that form.
    """
    m = re.match('^[^:]*:([^:]*)$', refspec)
    if m:
        return m.group(1)
    # report the offending refspec itself; the message used to be
    # formatted with a name that is not defined in this function, which
    # turned every parse failure into a NameError
    raise GitException('Cannot parse refspec "%s"' % refspec)
def refspec_remotepart(refspec):
    """Return the part of a refspec that precedes its ':' separator.

    The refspec must contain exactly one ':'; either side may be empty.
    Raises GitException if it does not have that form.
    """
    m = re.match('^([^:]*):[^:]*$', refspec)
    if m:
        return m.group(1)
    # report the offending refspec itself; the message used to be
    # formatted with a name that is not defined in this function, which
    # turned every parse failure into a NameError
    raise GitException('Cannot parse refspec "%s"' % refspec)
def __remotes_from_config():
    """Return config.sections_matching() for the 'remote.<name>.url' keys.

    NOTE(review): presumably this yields the <name> captured by the
    pattern, i.e. the remotes declared in the git configuration --
    confirm against stgit.config.
    """
    url_key_pattern = r'remote\.(.*)\.url'
    return config.sections_matching(url_key_pattern)
952 def __remotes_from_dir(dir):
953 d = os.path.join(basedir.get(), dir)
954 if os.path.exists(d):
960 """Return the list of remotes in the repository
963 return Set(__remotes_from_config()) | \
964 Set(__remotes_from_dir('remotes')) | \
965 Set(__remotes_from_dir('branches'))
967 def remotes_local_branches(remote):
968 """Returns the list of local branches fetched from given remote
972 if remote in __remotes_from_config():
973 for line in config.getall('remote.%s.fetch' % remote):
974 branches.append(refspec_localpart(line))
975 elif remote in __remotes_from_dir('remotes'):
976 stream = open(os.path.join(basedir.get(), 'remotes', remote), 'r')
978 # Only consider Pull lines
979 m = re.match('^Pull: (.*)\n$', line)
981 branches.append(refspec_localpart(m.group(1)))
983 elif remote in __remotes_from_dir('branches'):
984 # old-style branches only declare one branch
985 branches.append('refs/heads/'+remote);
987 raise GitException, 'Unknown remote "%s"' % remote
991 def identify_remote(branchname):
992 """Return the name for the remote to pull the given branchname
993 from, or None if we believe it is a local branch.
996 for remote in remotes_list():
997 if branchname in remotes_local_branches(remote):
1000 # if we get here we've found nothing, the branch is a local one
1004 """Return the git id for the tip of the parent branch as left by
1009 stream = open(os.path.join(basedir.get(), 'FETCH_HEAD'), "r")
1011 # Only consider lines not tagged not-for-merge
1012 m = re.match('^([^\t]*)\t\t', line)
1015 raise GitException, "StGit does not support multiple FETCH_HEAD"
1017 fetch_head=m.group(1)
1020 # here we are sure to have a single fetch_head
1024 """Return a list of all refs in the current repository.
1027 return [line.split()[1] for line in GRun('git-show-ref').output_lines()]