repo.py 34 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012
  1. # repo.py -- For dealing with git repositories.
  2. # Copyright (C) 2007 James Westby <jw+debian@jameswestby.net>
  3. # Copyright (C) 2008-2013 Jelmer Vernooij <jelmer@samba.org>
  4. #
  5. # This program is free software; you can redistribute it and/or
  6. # modify it under the terms of the GNU General Public License
  7. # as published by the Free Software Foundation; version 2
  8. # of the License or (at your option) any later version of
  9. # the License.
  10. #
  11. # This program is distributed in the hope that it will be useful,
  12. # but WITHOUT ANY WARRANTY; without even the implied warranty of
  13. # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  14. # GNU General Public License for more details.
  15. #
  16. # You should have received a copy of the GNU General Public License
  17. # along with this program; if not, write to the Free Software
  18. # Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
  19. # MA 02110-1301, USA.
  20. """Repository access.
  21. This module contains the base class for git repositories
  22. (BaseRepo) and an implementation which uses a repository on
  23. local disk (Repo).
  24. """
  25. from cStringIO import StringIO
  26. import errno
  27. import os
  28. from dulwich.errors import (
  29. NoIndexPresent,
  30. NotBlobError,
  31. NotCommitError,
  32. NotGitRepository,
  33. NotTreeError,
  34. NotTagError,
  35. CommitError,
  36. RefFormatError,
  37. HookError,
  38. )
  39. from dulwich.file import (
  40. GitFile,
  41. )
  42. from dulwich.object_store import (
  43. DiskObjectStore,
  44. MemoryObjectStore,
  45. ObjectStoreGraphWalker,
  46. )
  47. from dulwich.objects import (
  48. check_hexsha,
  49. Blob,
  50. Commit,
  51. ShaFile,
  52. Tag,
  53. Tree,
  54. )
  55. from dulwich.hooks import (
  56. PreCommitShellHook,
  57. PostCommitShellHook,
  58. CommitMsgShellHook,
  59. )
  60. from dulwich.refs import (
  61. check_ref_format,
  62. RefsContainer,
  63. DictRefsContainer,
  64. InfoRefsContainer,
  65. DiskRefsContainer,
  66. read_packed_refs,
  67. read_packed_refs_with_peeled,
  68. write_packed_refs,
  69. SYMREF,
  70. )
  71. import warnings
  72. OBJECTDIR = 'objects'
  73. REFSDIR = 'refs'
  74. REFSDIR_TAGS = 'tags'
  75. REFSDIR_HEADS = 'heads'
  76. INDEX_FILENAME = "index"
  77. BASE_DIRECTORIES = [
  78. ["branches"],
  79. [REFSDIR],
  80. [REFSDIR, REFSDIR_TAGS],
  81. [REFSDIR, REFSDIR_HEADS],
  82. ["hooks"],
  83. ["info"]
  84. ]
  85. def parse_graftpoints(graftpoints):
  86. """Convert a list of graftpoints into a dict
  87. :param graftpoints: Iterator of graftpoint lines
  88. Each line is formatted as:
  89. <commit sha1> <parent sha1> [<parent sha1>]*
  90. Resulting dictionary is:
  91. <commit sha1>: [<parent sha1>*]
  92. https://git.wiki.kernel.org/index.php/GraftPoint
  93. """
  94. grafts = {}
  95. for l in graftpoints:
  96. raw_graft = l.split(None, 1)
  97. commit = raw_graft[0]
  98. if len(raw_graft) == 2:
  99. parents = raw_graft[1].split()
  100. else:
  101. parents = []
  102. for sha in [commit] + parents:
  103. check_hexsha(sha, 'Invalid graftpoint')
  104. grafts[commit] = parents
  105. return grafts
  106. def serialize_graftpoints(graftpoints):
  107. """Convert a dictionary of grafts into string
  108. The graft dictionary is:
  109. <commit sha1>: [<parent sha1>*]
  110. Each line is formatted as:
  111. <commit sha1> <parent sha1> [<parent sha1>]*
  112. https://git.wiki.kernel.org/index.php/GraftPoint
  113. """
  114. graft_lines = []
  115. for commit, parents in graftpoints.iteritems():
  116. if parents:
  117. graft_lines.append('%s %s' % (commit, ' '.join(parents)))
  118. else:
  119. graft_lines.append(commit)
  120. return '\n'.join(graft_lines)
  121. class BaseRepo(object):
  122. """Base class for a git repository.
  123. :ivar object_store: Dictionary-like object for accessing
  124. the objects
  125. :ivar refs: Dictionary-like object with the refs in this
  126. repository
  127. """
  128. def __init__(self, object_store, refs):
  129. """Open a repository.
  130. This shouldn't be called directly, but rather through one of the
  131. base classes, such as MemoryRepo or Repo.
  132. :param object_store: Object store to use
  133. :param refs: Refs container to use
  134. """
  135. self.object_store = object_store
  136. self.refs = refs
  137. self._graftpoints = {}
  138. self.hooks = {}
  139. def _init_files(self, bare):
  140. """Initialize a default set of named files."""
  141. from dulwich.config import ConfigFile
  142. self._put_named_file('description', "Unnamed repository")
  143. f = StringIO()
  144. cf = ConfigFile()
  145. cf.set("core", "repositoryformatversion", "0")
  146. cf.set("core", "filemode", "true")
  147. cf.set("core", "bare", str(bare).lower())
  148. cf.set("core", "logallrefupdates", "true")
  149. cf.write_to_file(f)
  150. self._put_named_file('config', f.getvalue())
  151. self._put_named_file(os.path.join('info', 'exclude'), '')
  152. def get_named_file(self, path):
  153. """Get a file from the control dir with a specific name.
  154. Although the filename should be interpreted as a filename relative to
  155. the control dir in a disk-based Repo, the object returned need not be
  156. pointing to a file in that location.
  157. :param path: The path to the file, relative to the control dir.
  158. :return: An open file object, or None if the file does not exist.
  159. """
  160. raise NotImplementedError(self.get_named_file)
  161. def _put_named_file(self, path, contents):
  162. """Write a file to the control dir with the given name and contents.
  163. :param path: The path to the file, relative to the control dir.
  164. :param contents: A string to write to the file.
  165. """
  166. raise NotImplementedError(self._put_named_file)
  167. def open_index(self):
  168. """Open the index for this repository.
  169. :raise NoIndexPresent: If no index is present
  170. :return: The matching `Index`
  171. """
  172. raise NotImplementedError(self.open_index)
  173. def fetch(self, target, determine_wants=None, progress=None):
  174. """Fetch objects into another repository.
  175. :param target: The target repository
  176. :param determine_wants: Optional function to determine what refs to
  177. fetch.
  178. :param progress: Optional progress function
  179. :return: The local refs
  180. """
  181. if determine_wants is None:
  182. determine_wants = target.object_store.determine_wants_all
  183. target.object_store.add_objects(
  184. self.fetch_objects(determine_wants, target.get_graph_walker(),
  185. progress))
  186. return self.get_refs()
  187. def fetch_objects(self, determine_wants, graph_walker, progress,
  188. get_tagged=None):
  189. """Fetch the missing objects required for a set of revisions.
  190. :param determine_wants: Function that takes a dictionary with heads
  191. and returns the list of heads to fetch.
  192. :param graph_walker: Object that can iterate over the list of revisions
  193. to fetch and has an "ack" method that will be called to acknowledge
  194. that a revision is present.
  195. :param progress: Simple progress function that will be called with
  196. updated progress strings.
  197. :param get_tagged: Function that returns a dict of pointed-to sha -> tag
  198. sha for including tags.
  199. :return: iterator over objects, with __len__ implemented
  200. """
  201. wants = determine_wants(self.get_refs())
  202. if type(wants) is not list:
  203. raise TypeError("determine_wants() did not return a list")
  204. if wants == []:
  205. # TODO(dborowitz): find a way to short-circuit that doesn't change
  206. # this interface.
  207. return []
  208. haves = self.object_store.find_common_revisions(graph_walker)
  209. return self.object_store.iter_shas(
  210. self.object_store.find_missing_objects(haves, wants, progress,
  211. get_tagged))
  212. def get_graph_walker(self, heads=None):
  213. """Retrieve a graph walker.
  214. A graph walker is used by a remote repository (or proxy)
  215. to find out which objects are present in this repository.
  216. :param heads: Repository heads to use (optional)
  217. :return: A graph walker object
  218. """
  219. if heads is None:
  220. heads = self.refs.as_dict('refs/heads').values()
  221. return ObjectStoreGraphWalker(heads, self.get_parents)
  222. def ref(self, name):
  223. """Return the SHA1 a ref is pointing to.
  224. :param name: Name of the ref to look up
  225. :raise KeyError: when the ref (or the one it points to) does not exist
  226. :return: SHA1 it is pointing at
  227. """
  228. warnings.warn(
  229. "Repo.ref(name) is deprecated. Use Repo.refs[name] instead.",
  230. category=DeprecationWarning, stacklevel=2)
  231. return self.refs[name]
  232. def get_refs(self):
  233. """Get dictionary with all refs.
  234. :return: A ``dict`` mapping ref names to SHA1s
  235. """
  236. return self.refs.as_dict()
  237. def head(self):
  238. """Return the SHA1 pointed at by HEAD."""
  239. return self.refs['HEAD']
  240. def _get_object(self, sha, cls):
  241. assert len(sha) in (20, 40)
  242. ret = self.get_object(sha)
  243. if not isinstance(ret, cls):
  244. if cls is Commit:
  245. raise NotCommitError(ret)
  246. elif cls is Blob:
  247. raise NotBlobError(ret)
  248. elif cls is Tree:
  249. raise NotTreeError(ret)
  250. elif cls is Tag:
  251. raise NotTagError(ret)
  252. else:
  253. raise Exception("Type invalid: %r != %r" % (
  254. ret.type_name, cls.type_name))
  255. return ret
  256. def get_object(self, sha):
  257. """Retrieve the object with the specified SHA.
  258. :param sha: SHA to retrieve
  259. :return: A ShaFile object
  260. :raise KeyError: when the object can not be found
  261. """
  262. return self.object_store[sha]
  263. def get_parents(self, sha, commit=None):
  264. """Retrieve the parents of a specific commit.
  265. If the specific commit is a graftpoint, the graft parents
  266. will be returned instead.
  267. :param sha: SHA of the commit for which to retrieve the parents
  268. :param commit: Optional commit matching the sha
  269. :return: List of parents
  270. """
  271. try:
  272. return self._graftpoints[sha]
  273. except KeyError:
  274. if commit is None:
  275. commit = self[sha]
  276. return commit.parents
  277. def get_config(self):
  278. """Retrieve the config object.
  279. :return: `ConfigFile` object for the ``.git/config`` file.
  280. """
  281. raise NotImplementedError(self.get_config)
  282. def get_description(self):
  283. """Retrieve the description for this repository.
  284. :return: String with the description of the repository
  285. as set by the user.
  286. """
  287. raise NotImplementedError(self.get_description)
  288. def set_description(self, description):
  289. """Set the description for this repository.
  290. :param description: Text to set as description for this repository.
  291. """
  292. raise NotImplementedError(self.set_description)
  293. def get_config_stack(self):
  294. """Return a config stack for this repository.
  295. This stack accesses the configuration for both this repository
  296. itself (.git/config) and the global configuration, which usually
  297. lives in ~/.gitconfig.
  298. :return: `Config` instance for this repository
  299. """
  300. from dulwich.config import StackedConfig
  301. backends = [self.get_config()] + StackedConfig.default_backends()
  302. return StackedConfig(backends, writable=backends[0])
  303. def commit(self, sha):
  304. """Retrieve the commit with a particular SHA.
  305. :param sha: SHA of the commit to retrieve
  306. :raise NotCommitError: If the SHA provided doesn't point at a Commit
  307. :raise KeyError: If the SHA provided didn't exist
  308. :return: A `Commit` object
  309. """
  310. warnings.warn("Repo.commit(sha) is deprecated. Use Repo[sha] instead.",
  311. category=DeprecationWarning, stacklevel=2)
  312. return self._get_object(sha, Commit)
  313. def tree(self, sha):
  314. """Retrieve the tree with a particular SHA.
  315. :param sha: SHA of the tree to retrieve
  316. :raise NotTreeError: If the SHA provided doesn't point at a Tree
  317. :raise KeyError: If the SHA provided didn't exist
  318. :return: A `Tree` object
  319. """
  320. warnings.warn("Repo.tree(sha) is deprecated. Use Repo[sha] instead.",
  321. category=DeprecationWarning, stacklevel=2)
  322. return self._get_object(sha, Tree)
  323. def tag(self, sha):
  324. """Retrieve the tag with a particular SHA.
  325. :param sha: SHA of the tag to retrieve
  326. :raise NotTagError: If the SHA provided doesn't point at a Tag
  327. :raise KeyError: If the SHA provided didn't exist
  328. :return: A `Tag` object
  329. """
  330. warnings.warn("Repo.tag(sha) is deprecated. Use Repo[sha] instead.",
  331. category=DeprecationWarning, stacklevel=2)
  332. return self._get_object(sha, Tag)
  333. def get_blob(self, sha):
  334. """Retrieve the blob with a particular SHA.
  335. :param sha: SHA of the blob to retrieve
  336. :raise NotBlobError: If the SHA provided doesn't point at a Blob
  337. :raise KeyError: If the SHA provided didn't exist
  338. :return: A `Blob` object
  339. """
  340. warnings.warn("Repo.get_blob(sha) is deprecated. Use Repo[sha] "
  341. "instead.", category=DeprecationWarning, stacklevel=2)
  342. return self._get_object(sha, Blob)
  343. def get_peeled(self, ref):
  344. """Get the peeled value of a ref.
  345. :param ref: The refname to peel.
  346. :return: The fully-peeled SHA1 of a tag object, after peeling all
  347. intermediate tags; if the original ref does not point to a tag, this
  348. will equal the original SHA1.
  349. """
  350. cached = self.refs.get_peeled(ref)
  351. if cached is not None:
  352. return cached
  353. return self.object_store.peel_sha(self.refs[ref]).id
  354. def get_walker(self, include=None, *args, **kwargs):
  355. """Obtain a walker for this repository.
  356. :param include: Iterable of SHAs of commits to include along with their
  357. ancestors. Defaults to [HEAD]
  358. :param exclude: Iterable of SHAs of commits to exclude along with their
  359. ancestors, overriding includes.
  360. :param order: ORDER_* constant specifying the order of results. Anything
  361. other than ORDER_DATE may result in O(n) memory usage.
  362. :param reverse: If True, reverse the order of output, requiring O(n)
  363. memory.
  364. :param max_entries: The maximum number of entries to yield, or None for
  365. no limit.
  366. :param paths: Iterable of file or subtree paths to show entries for.
  367. :param rename_detector: diff.RenameDetector object for detecting
  368. renames.
  369. :param follow: If True, follow path across renames/copies. Forces a
  370. default rename_detector.
  371. :param since: Timestamp to list commits after.
  372. :param until: Timestamp to list commits before.
  373. :param queue_cls: A class to use for a queue of commits, supporting the
  374. iterator protocol. The constructor takes a single argument, the
  375. Walker.
  376. :return: A `Walker` object
  377. """
  378. from dulwich.walk import Walker
  379. if include is None:
  380. include = [self.head()]
  381. if isinstance(include, str):
  382. include = [include]
  383. kwargs['get_parents'] = lambda commit: self.get_parents(commit.id, commit)
  384. return Walker(self.object_store, include, *args, **kwargs)
  385. def revision_history(self, head):
  386. """Returns a list of the commits reachable from head.
  387. :param head: The SHA of the head to list revision history for.
  388. :return: A list of commit objects reachable from head, starting with
  389. head itself, in descending commit time order.
  390. :raise MissingCommitError: if any missing commits are referenced,
  391. including if the head parameter isn't the SHA of a commit.
  392. """
  393. warnings.warn("Repo.revision_history() is deprecated."
  394. "Use dulwich.walker.Walker(repo) instead.",
  395. category=DeprecationWarning, stacklevel=2)
  396. return [e.commit for e in self.get_walker(include=[head])]
  397. def __getitem__(self, name):
  398. """Retrieve a Git object by SHA1 or ref.
  399. :param name: A Git object SHA1 or a ref name
  400. :return: A `ShaFile` object, such as a Commit or Blob
  401. :raise KeyError: when the specified ref or object does not exist
  402. """
  403. if len(name) in (20, 40):
  404. try:
  405. return self.object_store[name]
  406. except (KeyError, ValueError):
  407. pass
  408. try:
  409. return self.object_store[self.refs[name]]
  410. except RefFormatError:
  411. raise KeyError(name)
  412. def __contains__(self, name):
  413. """Check if a specific Git object or ref is present.
  414. :param name: Git object SHA1 or ref name
  415. """
  416. if len(name) in (20, 40):
  417. return name in self.object_store or name in self.refs
  418. else:
  419. return name in self.refs
  420. def __setitem__(self, name, value):
  421. """Set a ref.
  422. :param name: ref name
  423. :param value: Ref value - either a ShaFile object, or a hex sha
  424. """
  425. if name.startswith("refs/") or name == "HEAD":
  426. if isinstance(value, ShaFile):
  427. self.refs[name] = value.id
  428. elif isinstance(value, str):
  429. self.refs[name] = value
  430. else:
  431. raise TypeError(value)
  432. else:
  433. raise ValueError(name)
  434. def __delitem__(self, name):
  435. """Remove a ref.
  436. :param name: Name of the ref to remove
  437. """
  438. if name.startswith("refs/") or name == "HEAD":
  439. del self.refs[name]
  440. else:
  441. raise ValueError(name)
  442. def _get_user_identity(self):
  443. """Determine the identity to use for new commits.
  444. """
  445. config = self.get_config_stack()
  446. return "%s <%s>" % (
  447. config.get(("user", ), "name"),
  448. config.get(("user", ), "email"))
  449. def _add_graftpoints(self, updated_graftpoints):
  450. """Add or modify graftpoints
  451. :param updated_graftpoints: Dict of commit shas to list of parent shas
  452. """
  453. # Simple validation
  454. for commit, parents in updated_graftpoints.iteritems():
  455. for sha in [commit] + parents:
  456. check_hexsha(sha, 'Invalid graftpoint')
  457. self._graftpoints.update(updated_graftpoints)
  458. def _remove_graftpoints(self, to_remove=[]):
  459. """Remove graftpoints
  460. :param to_remove: List of commit shas
  461. """
  462. for sha in to_remove:
  463. del self._graftpoints[sha]
  464. def do_commit(self, message=None, committer=None,
  465. author=None, commit_timestamp=None,
  466. commit_timezone=None, author_timestamp=None,
  467. author_timezone=None, tree=None, encoding=None,
  468. ref='HEAD', merge_heads=None):
  469. """Create a new commit.
  470. :param message: Commit message
  471. :param committer: Committer fullname
  472. :param author: Author fullname (defaults to committer)
  473. :param commit_timestamp: Commit timestamp (defaults to now)
  474. :param commit_timezone: Commit timestamp timezone (defaults to GMT)
  475. :param author_timestamp: Author timestamp (defaults to commit timestamp)
  476. :param author_timezone: Author timestamp timezone
  477. (defaults to commit timestamp timezone)
  478. :param tree: SHA1 of the tree root to use (if not specified the
  479. current index will be committed).
  480. :param encoding: Encoding
  481. :param ref: Optional ref to commit to (defaults to current branch)
  482. :param merge_heads: Merge heads (defaults to .git/MERGE_HEADS)
  483. :return: New commit SHA1
  484. """
  485. import time
  486. c = Commit()
  487. if tree is None:
  488. index = self.open_index()
  489. c.tree = index.commit(self.object_store)
  490. else:
  491. if len(tree) != 40:
  492. raise ValueError("tree must be a 40-byte hex sha string")
  493. c.tree = tree
  494. try:
  495. self.hooks['pre-commit'].execute()
  496. except HookError, e:
  497. raise CommitError(e)
  498. except KeyError: # no hook defined, silent fallthrough
  499. pass
  500. if merge_heads is None:
  501. # FIXME: Read merge heads from .git/MERGE_HEADS
  502. merge_heads = []
  503. if committer is None:
  504. # FIXME: Support GIT_COMMITTER_NAME/GIT_COMMITTER_EMAIL environment
  505. # variables
  506. committer = self._get_user_identity()
  507. c.committer = committer
  508. if commit_timestamp is None:
  509. # FIXME: Support GIT_COMMITTER_DATE environment variable
  510. commit_timestamp = time.time()
  511. c.commit_time = int(commit_timestamp)
  512. if commit_timezone is None:
  513. # FIXME: Use current user timezone rather than UTC
  514. commit_timezone = 0
  515. c.commit_timezone = commit_timezone
  516. if author is None:
  517. # FIXME: Support GIT_AUTHOR_NAME/GIT_AUTHOR_EMAIL environment
  518. # variables
  519. author = committer
  520. c.author = author
  521. if author_timestamp is None:
  522. # FIXME: Support GIT_AUTHOR_DATE environment variable
  523. author_timestamp = commit_timestamp
  524. c.author_time = int(author_timestamp)
  525. if author_timezone is None:
  526. author_timezone = commit_timezone
  527. c.author_timezone = author_timezone
  528. if encoding is not None:
  529. c.encoding = encoding
  530. if message is None:
  531. # FIXME: Try to read commit message from .git/MERGE_MSG
  532. raise ValueError("No commit message specified")
  533. try:
  534. c.message = self.hooks['commit-msg'].execute(message)
  535. if c.message is None:
  536. c.message = message
  537. except HookError, e:
  538. raise CommitError(e)
  539. except KeyError: # no hook defined, message not modified
  540. c.message = message
  541. try:
  542. old_head = self.refs[ref]
  543. c.parents = [old_head] + merge_heads
  544. self.object_store.add_object(c)
  545. ok = self.refs.set_if_equals(ref, old_head, c.id)
  546. except KeyError:
  547. c.parents = merge_heads
  548. self.object_store.add_object(c)
  549. ok = self.refs.add_if_new(ref, c.id)
  550. if not ok:
  551. # Fail if the atomic compare-and-swap failed, leaving the commit and
  552. # all its objects as garbage.
  553. raise CommitError("%s changed during commit" % (ref,))
  554. try:
  555. self.hooks['post-commit'].execute()
  556. except HookError, e: # silent failure
  557. warnings.warn("post-commit hook failed: %s" % e, UserWarning)
  558. except KeyError: # no hook defined, silent fallthrough
  559. pass
  560. return c.id
  561. class Repo(BaseRepo):
  562. """A git repository backed by local disk.
  563. To open an existing repository, call the contructor with
  564. the path of the repository.
  565. To create a new repository, use the Repo.init class method.
  566. """
  567. def __init__(self, root):
  568. if os.path.isdir(os.path.join(root, ".git", OBJECTDIR)):
  569. self.bare = False
  570. self._controldir = os.path.join(root, ".git")
  571. elif (os.path.isdir(os.path.join(root, OBJECTDIR)) and
  572. os.path.isdir(os.path.join(root, REFSDIR))):
  573. self.bare = True
  574. self._controldir = root
  575. elif (os.path.isfile(os.path.join(root, ".git"))):
  576. import re
  577. f = open(os.path.join(root, ".git"), 'r')
  578. try:
  579. _, path = re.match('(gitdir: )(.+$)', f.read()).groups()
  580. finally:
  581. f.close()
  582. self.bare = False
  583. self._controldir = os.path.join(root, path)
  584. else:
  585. raise NotGitRepository(
  586. "No git repository was found at %(path)s" % dict(path=root)
  587. )
  588. self.path = root
  589. object_store = DiskObjectStore(os.path.join(self.controldir(),
  590. OBJECTDIR))
  591. refs = DiskRefsContainer(self.controldir())
  592. BaseRepo.__init__(self, object_store, refs)
  593. graft_file = self.get_named_file(os.path.join("info", "grafts"))
  594. if graft_file:
  595. self._graftpoints = parse_graftpoints(graft_file)
  596. self.hooks['pre-commit'] = PreCommitShellHook(self.controldir())
  597. self.hooks['commit-msg'] = CommitMsgShellHook(self.controldir())
  598. self.hooks['post-commit'] = PostCommitShellHook(self.controldir())
  599. def controldir(self):
  600. """Return the path of the control directory."""
  601. return self._controldir
  602. def _put_named_file(self, path, contents):
  603. """Write a file to the control dir with the given name and contents.
  604. :param path: The path to the file, relative to the control dir.
  605. :param contents: A string to write to the file.
  606. """
  607. path = path.lstrip(os.path.sep)
  608. f = GitFile(os.path.join(self.controldir(), path), 'wb')
  609. try:
  610. f.write(contents)
  611. finally:
  612. f.close()
  613. def get_named_file(self, path):
  614. """Get a file from the control dir with a specific name.
  615. Although the filename should be interpreted as a filename relative to
  616. the control dir in a disk-based Repo, the object returned need not be
  617. pointing to a file in that location.
  618. :param path: The path to the file, relative to the control dir.
  619. :return: An open file object, or None if the file does not exist.
  620. """
  621. # TODO(dborowitz): sanitize filenames, since this is used directly by
  622. # the dumb web serving code.
  623. path = path.lstrip(os.path.sep)
  624. try:
  625. return open(os.path.join(self.controldir(), path), 'rb')
  626. except (IOError, OSError), e:
  627. if e.errno == errno.ENOENT:
  628. return None
  629. raise
  630. def index_path(self):
  631. """Return path to the index file."""
  632. return os.path.join(self.controldir(), INDEX_FILENAME)
  633. def open_index(self):
  634. """Open the index for this repository.
  635. :raise NoIndexPresent: If no index is present
  636. :return: The matching `Index`
  637. """
  638. from dulwich.index import Index
  639. if not self.has_index():
  640. raise NoIndexPresent()
  641. return Index(self.index_path())
  642. def has_index(self):
  643. """Check if an index is present."""
  644. # Bare repos must never have index files; non-bare repos may have a
  645. # missing index file, which is treated as empty.
  646. return not self.bare
  647. def stage(self, paths):
  648. """Stage a set of paths.
  649. :param paths: List of paths, relative to the repository path
  650. """
  651. if isinstance(paths, basestring):
  652. paths = [paths]
  653. from dulwich.index import index_entry_from_stat
  654. index = self.open_index()
  655. for path in paths:
  656. full_path = os.path.join(self.path, path)
  657. try:
  658. st = os.stat(full_path)
  659. except OSError:
  660. # File no longer exists
  661. try:
  662. del index[path]
  663. except KeyError:
  664. pass # already removed
  665. else:
  666. blob = Blob()
  667. f = open(full_path, 'rb')
  668. try:
  669. blob.data = f.read()
  670. finally:
  671. f.close()
  672. self.object_store.add_object(blob)
  673. index[path] = index_entry_from_stat(st, blob.id, 0)
  674. index.write()
  675. def clone(self, target_path, mkdir=True, bare=False,
  676. origin="origin"):
  677. """Clone this repository.
  678. :param target_path: Target path
  679. :param mkdir: Create the target directory
  680. :param bare: Whether to create a bare repository
  681. :param origin: Base name for refs in target repository
  682. cloned from this repository
  683. :return: Created repository as `Repo`
  684. """
  685. if not bare:
  686. target = self.init(target_path, mkdir=mkdir)
  687. else:
  688. target = self.init_bare(target_path)
  689. self.fetch(target)
  690. target.refs.import_refs(
  691. 'refs/remotes/' + origin, self.refs.as_dict('refs/heads'))
  692. target.refs.import_refs(
  693. 'refs/tags', self.refs.as_dict('refs/tags'))
  694. try:
  695. target.refs.add_if_new(
  696. 'refs/heads/master',
  697. self.refs['refs/heads/master'])
  698. except KeyError:
  699. pass
  700. # Update target head
  701. head, head_sha = self.refs._follow('HEAD')
  702. if head is not None and head_sha is not None:
  703. target.refs.set_symbolic_ref('HEAD', head)
  704. target['HEAD'] = head_sha
  705. if not bare:
  706. # Checkout HEAD to target dir
  707. target._build_tree()
  708. return target
  709. def _build_tree(self):
  710. from dulwich.index import build_index_from_tree
  711. config = self.get_config()
  712. honor_filemode = config.get_boolean('core', 'filemode', os.name != "nt")
  713. return build_index_from_tree(self.path, self.index_path(),
  714. self.object_store, self['HEAD'].tree,
  715. honor_filemode=honor_filemode)
  716. def get_config(self):
  717. """Retrieve the config object.
  718. :return: `ConfigFile` object for the ``.git/config`` file.
  719. """
  720. from dulwich.config import ConfigFile
  721. path = os.path.join(self._controldir, 'config')
  722. try:
  723. return ConfigFile.from_path(path)
  724. except (IOError, OSError), e:
  725. if e.errno != errno.ENOENT:
  726. raise
  727. ret = ConfigFile()
  728. ret.path = path
  729. return ret
  730. def get_description(self):
  731. """Retrieve the description of this repository.
  732. :return: A string describing the repository or None.
  733. """
  734. path = os.path.join(self._controldir, 'description')
  735. try:
  736. f = GitFile(path, 'rb')
  737. try:
  738. return f.read()
  739. finally:
  740. f.close()
  741. except (IOError, OSError), e:
  742. if e.errno != errno.ENOENT:
  743. raise
  744. return None
  745. def __repr__(self):
  746. return "<Repo at %r>" % self.path
  747. def set_description(self, description):
  748. """Set the description for this repository.
  749. :param description: Text to set as description for this repository.
  750. """
  751. path = os.path.join(self._controldir, 'description')
  752. f = open(path, 'w')
  753. try:
  754. f.write(description)
  755. finally:
  756. f.close()
  757. @classmethod
  758. def _init_maybe_bare(cls, path, bare):
  759. for d in BASE_DIRECTORIES:
  760. os.mkdir(os.path.join(path, *d))
  761. DiskObjectStore.init(os.path.join(path, OBJECTDIR))
  762. ret = cls(path)
  763. ret.refs.set_symbolic_ref("HEAD", "refs/heads/master")
  764. ret._init_files(bare)
  765. return ret
  766. @classmethod
  767. def init(cls, path, mkdir=False):
  768. """Create a new repository.
  769. :param path: Path in which to create the repository
  770. :param mkdir: Whether to create the directory
  771. :return: `Repo` instance
  772. """
  773. if mkdir:
  774. os.mkdir(path)
  775. controldir = os.path.join(path, ".git")
  776. os.mkdir(controldir)
  777. cls._init_maybe_bare(controldir, False)
  778. return cls(path)
  779. @classmethod
  780. def init_bare(cls, path):
  781. """Create a new bare repository.
  782. ``path`` should already exist and be an emty directory.
  783. :param path: Path to create bare repository in
  784. :return: a `Repo` instance
  785. """
  786. return cls._init_maybe_bare(path, True)
  787. create = init_bare
  788. class MemoryRepo(BaseRepo):
  789. """Repo that stores refs, objects, and named files in memory.
  790. MemoryRepos are always bare: they have no working tree and no index, since
  791. those have a stronger dependency on the filesystem.
  792. """
  793. def __init__(self):
  794. BaseRepo.__init__(self, MemoryObjectStore(), DictRefsContainer({}))
  795. self._named_files = {}
  796. self.bare = True
  797. def _put_named_file(self, path, contents):
  798. """Write a file to the control dir with the given name and contents.
  799. :param path: The path to the file, relative to the control dir.
  800. :param contents: A string to write to the file.
  801. """
  802. self._named_files[path] = contents
  803. def get_named_file(self, path):
  804. """Get a file from the control dir with a specific name.
  805. Although the filename should be interpreted as a filename relative to
  806. the control dir in a disk-baked Repo, the object returned need not be
  807. pointing to a file in that location.
  808. :param path: The path to the file, relative to the control dir.
  809. :return: An open file object, or None if the file does not exist.
  810. """
  811. contents = self._named_files.get(path, None)
  812. if contents is None:
  813. return None
  814. return StringIO(contents)
  815. def open_index(self):
  816. """Fail to open index for this repo, since it is bare.
  817. :raise NoIndexPresent: Raised when no index is present
  818. """
  819. raise NoIndexPresent()
  820. def get_config(self):
  821. """Retrieve the config object.
  822. :return: `ConfigFile` object.
  823. """
  824. from dulwich.config import ConfigFile
  825. return ConfigFile()
  826. def get_description(self):
  827. """Retrieve the repository description.
  828. This defaults to None, for no description.
  829. """
  830. return None
  831. @classmethod
  832. def init_bare(cls, objects, refs):
  833. """Create a new bare repository in memory.
  834. :param objects: Objects for the new repository,
  835. as iterable
  836. :param refs: Refs as dictionary, mapping names
  837. to object SHA1s
  838. """
  839. ret = cls()
  840. for obj in objects:
  841. ret.object_store.add_object(obj)
  842. for refname, sha in refs.iteritems():
  843. ret.refs[refname] = sha
  844. ret._init_files(bare=True)
  845. return ret