swift.py 32 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023
  1. # swift.py -- Repo implementation atop OpenStack SWIFT
  2. # Copyright (C) 2013 eNovance SAS <licensing@enovance.com>
  3. #
  4. # Author: Fabien Boucher <fabien.boucher@enovance.com>
  5. #
  6. # Dulwich is dual-licensed under the Apache License, Version 2.0 and the GNU
  7. # General Public License as published by the Free Software Foundation; version 2.0
  8. # or (at your option) any later version. You can redistribute it and/or
  9. # modify it under the terms of either of these two licenses.
  10. #
  11. # Unless required by applicable law or agreed to in writing, software
  12. # distributed under the License is distributed on an "AS IS" BASIS,
  13. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  14. # See the License for the specific language governing permissions and
  15. # limitations under the License.
  16. #
  17. # You should have received a copy of the licenses; if not, see
  18. # <http://www.gnu.org/licenses/> for a copy of the GNU General Public License
  19. # and <http://www.apache.org/licenses/LICENSE-2.0> for a copy of the Apache
  20. # License, Version 2.0.
  21. #
  22. """Repo implementation atop OpenStack SWIFT."""
  23. # TODO: Refactor to share more code with dulwich/repo.py.
  24. # TODO(fbo): Second attempt to _send() must be notified via real log
  25. # TODO(fbo): More logs for operations
  26. import json
  27. import os
  28. import posixpath
  29. import stat
  30. import sys
  31. import tempfile
  32. import urllib.parse as urlparse
  33. import zlib
  34. from configparser import ConfigParser
  35. from io import BytesIO
  36. from geventhttpclient import HTTPClient
  37. from ..greenthreads import GreenThreadsMissingObjectFinder
  38. from ..lru_cache import LRUSizeCache
  39. from ..object_store import INFODIR, PACKDIR, PackBasedObjectStore
  40. from ..objects import S_ISGITLINK, Blob, Commit, Tag, Tree
  41. from ..pack import (
  42. Pack,
  43. PackData,
  44. PackIndexer,
  45. PackStreamCopier,
  46. _compute_object_size,
  47. compute_file_sha,
  48. iter_sha1,
  49. load_pack_index_file,
  50. read_pack_header,
  51. unpack_object,
  52. write_pack_header,
  53. write_pack_index_v2,
  54. write_pack_object,
  55. )
  56. from ..protocol import TCP_GIT_PORT
  57. from ..refs import InfoRefsContainer, read_info_refs, write_info_refs
  58. from ..repo import OBJECTDIR, BaseRepo
  59. from ..server import Backend, TCPGitServer
  60. """
  61. # Configuration file sample
  62. [swift]
  63. # Authentication URL (Keystone or Swift)
  64. auth_url = http://127.0.0.1:5000/v2.0
  65. # Authentication version to use
  66. auth_ver = 2
  67. # The tenant and username separated by a semicolon
  68. username = admin;admin
  69. # The user password
  70. password = pass
  71. # The Object storage region to use (auth v2) (Default RegionOne)
  72. region_name = RegionOne
  73. # The Object storage endpoint URL to use (auth v2) (Default internalURL)
  74. endpoint_type = internalURL
  75. # Concurrency to use for parallel tasks (Default 10)
  76. concurrency = 10
  77. # Size of the HTTP pool (Default 10)
  78. http_pool_length = 10
  79. # Timeout delay for HTTP connections (Default 20)
  80. http_timeout = 20
  81. # Chunk size to read from pack (Bytes) (Default 12228)
  82. chunk_length = 12228
  83. # Cache size (MBytes) (Default 20)
  84. cache_length = 20
  85. """
  86. class PackInfoMissingObjectFinder(GreenThreadsMissingObjectFinder):
  87. def next(self):
  88. while True:
  89. if not self.objects_to_send:
  90. return None
  91. (sha, name, leaf) = self.objects_to_send.pop()
  92. if sha not in self.sha_done:
  93. break
  94. if not leaf:
  95. info = self.object_store.pack_info_get(sha)
  96. if info[0] == Commit.type_num:
  97. self.add_todo([(info[2], "", False)])
  98. elif info[0] == Tree.type_num:
  99. self.add_todo([tuple(i) for i in info[1]])
  100. elif info[0] == Tag.type_num:
  101. self.add_todo([(info[1], None, False)])
  102. if sha in self._tagged:
  103. self.add_todo([(self._tagged[sha], None, True)])
  104. self.sha_done.add(sha)
  105. self.progress("counting objects: %d\r" % len(self.sha_done))
  106. return (sha, name)
  107. def load_conf(path=None, file=None):
  108. """Load configuration in global var CONF.
  109. Args:
  110. path: The path to the configuration file
  111. file: If provided read instead the file like object
  112. """
  113. conf = ConfigParser()
  114. if file:
  115. try:
  116. conf.read_file(file, path)
  117. except AttributeError:
  118. # read_file only exists in Python3
  119. conf.readfp(file)
  120. return conf
  121. confpath = None
  122. if not path:
  123. try:
  124. confpath = os.environ["DULWICH_SWIFT_CFG"]
  125. except KeyError as exc:
  126. raise Exception("You need to specify a configuration file") from exc
  127. else:
  128. confpath = path
  129. if not os.path.isfile(confpath):
  130. raise Exception("Unable to read configuration file %s" % confpath)
  131. conf.read(confpath)
  132. return conf
  133. def swift_load_pack_index(scon, filename):
  134. """Read a pack index file from Swift.
  135. Args:
  136. scon: a `SwiftConnector` instance
  137. filename: Path to the index file objectise
  138. Returns: a `PackIndexer` instance
  139. """
  140. with scon.get_object(filename) as f:
  141. return load_pack_index_file(filename, f)
  142. def pack_info_create(pack_data, pack_index):
  143. pack = Pack.from_objects(pack_data, pack_index)
  144. info = {}
  145. for obj in pack.iterobjects():
  146. # Commit
  147. if obj.type_num == Commit.type_num:
  148. info[obj.id] = (obj.type_num, obj.parents, obj.tree)
  149. # Tree
  150. elif obj.type_num == Tree.type_num:
  151. shas = [
  152. (s, n, not stat.S_ISDIR(m))
  153. for n, m, s in obj.items()
  154. if not S_ISGITLINK(m)
  155. ]
  156. info[obj.id] = (obj.type_num, shas)
  157. # Blob
  158. elif obj.type_num == Blob.type_num:
  159. info[obj.id] = None
  160. # Tag
  161. elif obj.type_num == Tag.type_num:
  162. info[obj.id] = (obj.type_num, obj.object[1])
  163. return zlib.compress(json.dumps(info))
  164. def load_pack_info(filename, scon=None, file=None):
  165. if not file:
  166. f = scon.get_object(filename)
  167. else:
  168. f = file
  169. if not f:
  170. return None
  171. try:
  172. return json.loads(zlib.decompress(f.read()))
  173. finally:
  174. f.close()
  175. class SwiftException(Exception):
  176. pass
  177. class SwiftConnector:
  178. """A Connector to swift that manage authentication and errors catching."""
  179. def __init__(self, root, conf) -> None:
  180. """Initialize a SwiftConnector.
  181. Args:
  182. root: The swift container that will act as Git bare repository
  183. conf: A ConfigParser Object
  184. """
  185. self.conf = conf
  186. self.auth_ver = self.conf.get("swift", "auth_ver")
  187. if self.auth_ver not in ["1", "2"]:
  188. raise NotImplementedError("Wrong authentication version use either 1 or 2")
  189. self.auth_url = self.conf.get("swift", "auth_url")
  190. self.user = self.conf.get("swift", "username")
  191. self.password = self.conf.get("swift", "password")
  192. self.concurrency = self.conf.getint("swift", "concurrency") or 10
  193. self.http_timeout = self.conf.getint("swift", "http_timeout") or 20
  194. self.http_pool_length = self.conf.getint("swift", "http_pool_length") or 10
  195. self.region_name = self.conf.get("swift", "region_name") or "RegionOne"
  196. self.endpoint_type = self.conf.get("swift", "endpoint_type") or "internalURL"
  197. self.cache_length = self.conf.getint("swift", "cache_length") or 20
  198. self.chunk_length = self.conf.getint("swift", "chunk_length") or 12228
  199. self.root = root
  200. block_size = 1024 * 12 # 12KB
  201. if self.auth_ver == "1":
  202. self.storage_url, self.token = self.swift_auth_v1()
  203. else:
  204. self.storage_url, self.token = self.swift_auth_v2()
  205. token_header = {"X-Auth-Token": str(self.token)}
  206. self.httpclient = HTTPClient.from_url(
  207. str(self.storage_url),
  208. concurrency=self.http_pool_length,
  209. block_size=block_size,
  210. connection_timeout=self.http_timeout,
  211. network_timeout=self.http_timeout,
  212. headers=token_header,
  213. )
  214. self.base_path = str(
  215. posixpath.join(urlparse.urlparse(self.storage_url).path, self.root)
  216. )
  217. def swift_auth_v1(self):
  218. self.user = self.user.replace(";", ":")
  219. auth_httpclient = HTTPClient.from_url(
  220. self.auth_url,
  221. connection_timeout=self.http_timeout,
  222. network_timeout=self.http_timeout,
  223. )
  224. headers = {"X-Auth-User": self.user, "X-Auth-Key": self.password}
  225. path = urlparse.urlparse(self.auth_url).path
  226. ret = auth_httpclient.request("GET", path, headers=headers)
  227. # Should do something with redirections (301 in my case)
  228. if ret.status_code < 200 or ret.status_code >= 300:
  229. raise SwiftException(
  230. "AUTH v1.0 request failed on "
  231. + f"{str(auth_httpclient.get_base_url()) + path} with error code {ret.status_code} ({ret.items()!s})"
  232. )
  233. storage_url = ret["X-Storage-Url"]
  234. token = ret["X-Auth-Token"]
  235. return storage_url, token
  236. def swift_auth_v2(self):
  237. self.tenant, self.user = self.user.split(";")
  238. auth_dict = {}
  239. auth_dict["auth"] = {
  240. "passwordCredentials": {
  241. "username": self.user,
  242. "password": self.password,
  243. },
  244. "tenantName": self.tenant,
  245. }
  246. auth_json = json.dumps(auth_dict)
  247. headers = {"Content-Type": "application/json"}
  248. auth_httpclient = HTTPClient.from_url(
  249. self.auth_url,
  250. connection_timeout=self.http_timeout,
  251. network_timeout=self.http_timeout,
  252. )
  253. path = urlparse.urlparse(self.auth_url).path
  254. if not path.endswith("tokens"):
  255. path = posixpath.join(path, "tokens")
  256. ret = auth_httpclient.request("POST", path, body=auth_json, headers=headers)
  257. if ret.status_code < 200 or ret.status_code >= 300:
  258. raise SwiftException(
  259. "AUTH v2.0 request failed on "
  260. + f"{str(auth_httpclient.get_base_url()) + path} with error code {ret.status_code} ({ret.items()!s})"
  261. )
  262. auth_ret_json = json.loads(ret.read())
  263. token = auth_ret_json["access"]["token"]["id"]
  264. catalogs = auth_ret_json["access"]["serviceCatalog"]
  265. object_store = next(
  266. o_store for o_store in catalogs if o_store["type"] == "object-store"
  267. )
  268. endpoints = object_store["endpoints"]
  269. endpoint = next(
  270. endp for endp in endpoints if endp["region"] == self.region_name
  271. )
  272. return endpoint[self.endpoint_type], token
  273. def test_root_exists(self):
  274. """Check that Swift container exist.
  275. Returns: True if exist or None it not
  276. """
  277. ret = self.httpclient.request("HEAD", self.base_path)
  278. if ret.status_code == 404:
  279. return None
  280. if ret.status_code < 200 or ret.status_code > 300:
  281. raise SwiftException(
  282. "HEAD request failed with error code %s" % ret.status_code
  283. )
  284. return True
  285. def create_root(self):
  286. """Create the Swift container.
  287. Raises:
  288. SwiftException: if unable to create
  289. """
  290. if not self.test_root_exists():
  291. ret = self.httpclient.request("PUT", self.base_path)
  292. if ret.status_code < 200 or ret.status_code > 300:
  293. raise SwiftException(
  294. "PUT request failed with error code %s" % ret.status_code
  295. )
  296. def get_container_objects(self):
  297. """Retrieve objects list in a container.
  298. Returns: A list of dict that describe objects
  299. or None if container does not exist
  300. """
  301. qs = "?format=json"
  302. path = self.base_path + qs
  303. ret = self.httpclient.request("GET", path)
  304. if ret.status_code == 404:
  305. return None
  306. if ret.status_code < 200 or ret.status_code > 300:
  307. raise SwiftException(
  308. "GET request failed with error code %s" % ret.status_code
  309. )
  310. content = ret.read()
  311. return json.loads(content)
  312. def get_object_stat(self, name):
  313. """Retrieve object stat.
  314. Args:
  315. name: The object name
  316. Returns:
  317. A dict that describe the object or None if object does not exist
  318. """
  319. path = self.base_path + "/" + name
  320. ret = self.httpclient.request("HEAD", path)
  321. if ret.status_code == 404:
  322. return None
  323. if ret.status_code < 200 or ret.status_code > 300:
  324. raise SwiftException(
  325. "HEAD request failed with error code %s" % ret.status_code
  326. )
  327. resp_headers = {}
  328. for header, value in ret.items():
  329. resp_headers[header.lower()] = value
  330. return resp_headers
  331. def put_object(self, name, content):
  332. """Put an object.
  333. Args:
  334. name: The object name
  335. content: A file object
  336. Raises:
  337. SwiftException: if unable to create
  338. """
  339. content.seek(0)
  340. data = content.read()
  341. path = self.base_path + "/" + name
  342. headers = {"Content-Length": str(len(data))}
  343. def _send():
  344. ret = self.httpclient.request("PUT", path, body=data, headers=headers)
  345. return ret
  346. try:
  347. # Sometime got Broken Pipe - Dirty workaround
  348. ret = _send()
  349. except Exception:
  350. # Second attempt work
  351. ret = _send()
  352. if ret.status_code < 200 or ret.status_code > 300:
  353. raise SwiftException(
  354. "PUT request failed with error code %s" % ret.status_code
  355. )
  356. def get_object(self, name, range=None):
  357. """Retrieve an object.
  358. Args:
  359. name: The object name
  360. range: A string range like "0-10" to
  361. retrieve specified bytes in object content
  362. Returns:
  363. A file like instance or bytestring if range is specified
  364. """
  365. headers = {}
  366. if range:
  367. headers["Range"] = "bytes=%s" % range
  368. path = self.base_path + "/" + name
  369. ret = self.httpclient.request("GET", path, headers=headers)
  370. if ret.status_code == 404:
  371. return None
  372. if ret.status_code < 200 or ret.status_code > 300:
  373. raise SwiftException(
  374. "GET request failed with error code %s" % ret.status_code
  375. )
  376. content = ret.read()
  377. if range:
  378. return content
  379. return BytesIO(content)
  380. def del_object(self, name):
  381. """Delete an object.
  382. Args:
  383. name: The object name
  384. Raises:
  385. SwiftException: if unable to delete
  386. """
  387. path = self.base_path + "/" + name
  388. ret = self.httpclient.request("DELETE", path)
  389. if ret.status_code < 200 or ret.status_code > 300:
  390. raise SwiftException(
  391. "DELETE request failed with error code %s" % ret.status_code
  392. )
  393. def del_root(self):
  394. """Delete the root container by removing container content.
  395. Raises:
  396. SwiftException: if unable to delete
  397. """
  398. for obj in self.get_container_objects():
  399. self.del_object(obj["name"])
  400. ret = self.httpclient.request("DELETE", self.base_path)
  401. if ret.status_code < 200 or ret.status_code > 300:
  402. raise SwiftException(
  403. "DELETE request failed with error code %s" % ret.status_code
  404. )
  405. class SwiftPackReader:
  406. """A SwiftPackReader that mimic read and sync method.
  407. The reader allows to read a specified amount of bytes from
  408. a given offset of a Swift object. A read offset is kept internally.
  409. The reader will read from Swift a specified amount of data to complete
  410. its internal buffer. chunk_length specify the amount of data
  411. to read from Swift.
  412. """
  413. def __init__(self, scon, filename, pack_length) -> None:
  414. """Initialize a SwiftPackReader.
  415. Args:
  416. scon: a `SwiftConnector` instance
  417. filename: the pack filename
  418. pack_length: The size of the pack object
  419. """
  420. self.scon = scon
  421. self.filename = filename
  422. self.pack_length = pack_length
  423. self.offset = 0
  424. self.base_offset = 0
  425. self.buff = b""
  426. self.buff_length = self.scon.chunk_length
  427. def _read(self, more=False):
  428. if more:
  429. self.buff_length = self.buff_length * 2
  430. offset = self.base_offset
  431. r = min(self.base_offset + self.buff_length, self.pack_length)
  432. ret = self.scon.get_object(self.filename, range=f"{offset}-{r}")
  433. self.buff = ret
  434. def read(self, length):
  435. """Read a specified amount of Bytes form the pack object.
  436. Args:
  437. length: amount of bytes to read
  438. Returns:
  439. a bytestring
  440. """
  441. end = self.offset + length
  442. if self.base_offset + end > self.pack_length:
  443. data = self.buff[self.offset :]
  444. self.offset = end
  445. return data
  446. if end > len(self.buff):
  447. # Need to read more from swift
  448. self._read(more=True)
  449. return self.read(length)
  450. data = self.buff[self.offset : end]
  451. self.offset = end
  452. return data
  453. def seek(self, offset):
  454. """Seek to a specified offset.
  455. Args:
  456. offset: the offset to seek to
  457. """
  458. self.base_offset = offset
  459. self._read()
  460. self.offset = 0
  461. def read_checksum(self):
  462. """Read the checksum from the pack.
  463. Returns: the checksum bytestring
  464. """
  465. return self.scon.get_object(self.filename, range="-20")
  466. class SwiftPackData(PackData):
  467. """The data contained in a packfile.
  468. We use the SwiftPackReader to read bytes from packs stored in Swift
  469. using the Range header feature of Swift.
  470. """
  471. def __init__(self, scon, filename) -> None:
  472. """Initialize a SwiftPackReader.
  473. Args:
  474. scon: a `SwiftConnector` instance
  475. filename: the pack filename
  476. """
  477. self.scon = scon
  478. self._filename = filename
  479. self._header_size = 12
  480. headers = self.scon.get_object_stat(self._filename)
  481. self.pack_length = int(headers["content-length"])
  482. pack_reader = SwiftPackReader(self.scon, self._filename, self.pack_length)
  483. (version, self._num_objects) = read_pack_header(pack_reader.read)
  484. self._offset_cache = LRUSizeCache(
  485. 1024 * 1024 * self.scon.cache_length,
  486. compute_size=_compute_object_size,
  487. )
  488. self.pack = None
  489. def get_object_at(self, offset):
  490. if offset in self._offset_cache:
  491. return self._offset_cache[offset]
  492. assert offset >= self._header_size
  493. pack_reader = SwiftPackReader(self.scon, self._filename, self.pack_length)
  494. pack_reader.seek(offset)
  495. unpacked, _ = unpack_object(pack_reader.read)
  496. return (unpacked.pack_type_num, unpacked._obj())
  497. def get_stored_checksum(self):
  498. pack_reader = SwiftPackReader(self.scon, self._filename, self.pack_length)
  499. return pack_reader.read_checksum()
  500. def close(self):
  501. pass
  502. class SwiftPack(Pack):
  503. """A Git pack object.
  504. Same implementation as pack.Pack except that _idx_load and
  505. _data_load are bounded to Swift version of load_pack_index and
  506. PackData.
  507. """
  508. def __init__(self, *args, **kwargs) -> None:
  509. self.scon = kwargs["scon"]
  510. del kwargs["scon"]
  511. super().__init__(*args, **kwargs)
  512. self._pack_info_path = self._basename + ".info"
  513. self._pack_info = None
  514. self._pack_info_load = lambda: load_pack_info(self._pack_info_path, self.scon)
  515. self._idx_load = lambda: swift_load_pack_index(self.scon, self._idx_path)
  516. self._data_load = lambda: SwiftPackData(self.scon, self._data_path)
  517. @property
  518. def pack_info(self):
  519. """The pack data object being used."""
  520. if self._pack_info is None:
  521. self._pack_info = self._pack_info_load()
  522. return self._pack_info
  523. class SwiftObjectStore(PackBasedObjectStore):
  524. """A Swift Object Store.
  525. Allow to manage a bare Git repository from Openstack Swift.
  526. This object store only supports pack files and not loose objects.
  527. """
  528. def __init__(self, scon) -> None:
  529. """Open a Swift object store.
  530. Args:
  531. scon: A `SwiftConnector` instance
  532. """
  533. super().__init__()
  534. self.scon = scon
  535. self.root = self.scon.root
  536. self.pack_dir = posixpath.join(OBJECTDIR, PACKDIR)
  537. self._alternates = None
  538. def _update_pack_cache(self):
  539. objects = self.scon.get_container_objects()
  540. pack_files = [
  541. o["name"].replace(".pack", "")
  542. for o in objects
  543. if o["name"].endswith(".pack")
  544. ]
  545. ret = []
  546. for basename in pack_files:
  547. pack = SwiftPack(basename, scon=self.scon)
  548. self._pack_cache[basename] = pack
  549. ret.append(pack)
  550. return ret
  551. def _iter_loose_objects(self):
  552. """Loose objects are not supported by this repository."""
  553. return []
  554. def pack_info_get(self, sha):
  555. for pack in self.packs:
  556. if sha in pack:
  557. return pack.pack_info[sha]
  558. def _collect_ancestors(self, heads, common=set()):
  559. def _find_parents(commit):
  560. for pack in self.packs:
  561. if commit in pack:
  562. try:
  563. parents = pack.pack_info[commit][1]
  564. except KeyError:
  565. # Seems to have no parents
  566. return []
  567. return parents
  568. bases = set()
  569. commits = set()
  570. queue = []
  571. queue.extend(heads)
  572. while queue:
  573. e = queue.pop(0)
  574. if e in common:
  575. bases.add(e)
  576. elif e not in commits:
  577. commits.add(e)
  578. parents = _find_parents(e)
  579. queue.extend(parents)
  580. return (commits, bases)
  581. def add_pack(self):
  582. """Add a new pack to this object store.
  583. Returns: Fileobject to write to and a commit function to
  584. call when the pack is finished.
  585. """
  586. f = BytesIO()
  587. def commit():
  588. f.seek(0)
  589. pack = PackData(file=f, filename="")
  590. entries = pack.sorted_entries()
  591. if entries:
  592. basename = posixpath.join(
  593. self.pack_dir,
  594. "pack-%s" % iter_sha1(entry[0] for entry in entries),
  595. )
  596. index = BytesIO()
  597. write_pack_index_v2(index, entries, pack.get_stored_checksum())
  598. self.scon.put_object(basename + ".pack", f)
  599. f.close()
  600. self.scon.put_object(basename + ".idx", index)
  601. index.close()
  602. final_pack = SwiftPack(basename, scon=self.scon)
  603. final_pack.check_length_and_checksum()
  604. self._add_cached_pack(basename, final_pack)
  605. return final_pack
  606. else:
  607. return None
  608. def abort():
  609. pass
  610. return f, commit, abort
  611. def add_object(self, obj):
  612. self.add_objects(
  613. [
  614. (obj, None),
  615. ]
  616. )
  617. def _pack_cache_stale(self):
  618. return False
  619. def _get_loose_object(self, sha):
  620. return None
  621. def add_thin_pack(self, read_all, read_some):
  622. """Read a thin pack.
  623. Read it from a stream and complete it in a temporary file.
  624. Then the pack and the corresponding index file are uploaded to Swift.
  625. """
  626. fd, path = tempfile.mkstemp(prefix="tmp_pack_")
  627. f = os.fdopen(fd, "w+b")
  628. try:
  629. indexer = PackIndexer(f, resolve_ext_ref=self.get_raw)
  630. copier = PackStreamCopier(read_all, read_some, f, delta_iter=indexer)
  631. copier.verify()
  632. return self._complete_thin_pack(f, path, copier, indexer)
  633. finally:
  634. f.close()
  635. os.unlink(path)
  636. def _complete_thin_pack(self, f, path, copier, indexer):
  637. entries = list(indexer)
  638. # Update the header with the new number of objects.
  639. f.seek(0)
  640. write_pack_header(f, len(entries) + len(indexer.ext_refs()))
  641. # Must flush before reading (http://bugs.python.org/issue3207)
  642. f.flush()
  643. # Rescan the rest of the pack, computing the SHA with the new header.
  644. new_sha = compute_file_sha(f, end_ofs=-20)
  645. # Must reposition before writing (http://bugs.python.org/issue3207)
  646. f.seek(0, os.SEEK_CUR)
  647. # Complete the pack.
  648. for ext_sha in indexer.ext_refs():
  649. assert len(ext_sha) == 20
  650. type_num, data = self.get_raw(ext_sha)
  651. offset = f.tell()
  652. crc32 = write_pack_object(f, type_num, data, sha=new_sha)
  653. entries.append((ext_sha, offset, crc32))
  654. pack_sha = new_sha.digest()
  655. f.write(pack_sha)
  656. f.flush()
  657. # Move the pack in.
  658. entries.sort()
  659. pack_base_name = posixpath.join(
  660. self.pack_dir,
  661. "pack-" + os.fsdecode(iter_sha1(e[0] for e in entries)),
  662. )
  663. self.scon.put_object(pack_base_name + ".pack", f)
  664. # Write the index.
  665. filename = pack_base_name + ".idx"
  666. index_file = BytesIO()
  667. write_pack_index_v2(index_file, entries, pack_sha)
  668. self.scon.put_object(filename, index_file)
  669. # Write pack info.
  670. f.seek(0)
  671. pack_data = PackData(filename="", file=f)
  672. index_file.seek(0)
  673. pack_index = load_pack_index_file("", index_file)
  674. serialized_pack_info = pack_info_create(pack_data, pack_index)
  675. f.close()
  676. index_file.close()
  677. pack_info_file = BytesIO(serialized_pack_info)
  678. filename = pack_base_name + ".info"
  679. self.scon.put_object(filename, pack_info_file)
  680. pack_info_file.close()
  681. # Add the pack to the store and return it.
  682. final_pack = SwiftPack(pack_base_name, scon=self.scon)
  683. final_pack.check_length_and_checksum()
  684. self._add_cached_pack(pack_base_name, final_pack)
  685. return final_pack
  686. class SwiftInfoRefsContainer(InfoRefsContainer):
  687. """Manage references in info/refs object."""
  688. def __init__(self, scon, store) -> None:
  689. self.scon = scon
  690. self.filename = "info/refs"
  691. self.store = store
  692. f = self.scon.get_object(self.filename)
  693. if not f:
  694. f = BytesIO(b"")
  695. super().__init__(f)
  696. def _load_check_ref(self, name, old_ref):
  697. self._check_refname(name)
  698. f = self.scon.get_object(self.filename)
  699. if not f:
  700. return {}
  701. refs = read_info_refs(f)
  702. if old_ref is not None:
  703. if refs[name] != old_ref:
  704. return False
  705. return refs
  706. def _write_refs(self, refs):
  707. f = BytesIO()
  708. f.writelines(write_info_refs(refs, self.store))
  709. self.scon.put_object(self.filename, f)
  710. def set_if_equals(self, name, old_ref, new_ref):
  711. """Set a refname to new_ref only if it currently equals old_ref."""
  712. if name == "HEAD":
  713. return True
  714. refs = self._load_check_ref(name, old_ref)
  715. if not isinstance(refs, dict):
  716. return False
  717. refs[name] = new_ref
  718. self._write_refs(refs)
  719. self._refs[name] = new_ref
  720. return True
  721. def remove_if_equals(self, name, old_ref):
  722. """Remove a refname only if it currently equals old_ref."""
  723. if name == "HEAD":
  724. return True
  725. refs = self._load_check_ref(name, old_ref)
  726. if not isinstance(refs, dict):
  727. return False
  728. del refs[name]
  729. self._write_refs(refs)
  730. del self._refs[name]
  731. return True
  732. def allkeys(self):
  733. try:
  734. self._refs["HEAD"] = self._refs["refs/heads/master"]
  735. except KeyError:
  736. pass
  737. return self._refs.keys()
  738. class SwiftRepo(BaseRepo):
  739. def __init__(self, root, conf) -> None:
  740. """Init a Git bare Repository on top of a Swift container.
  741. References are managed in info/refs objects by
  742. `SwiftInfoRefsContainer`. The root attribute is the Swift
  743. container that contain the Git bare repository.
  744. Args:
  745. root: The container which contains the bare repo
  746. conf: A ConfigParser object
  747. """
  748. self.root = root.lstrip("/")
  749. self.conf = conf
  750. self.scon = SwiftConnector(self.root, self.conf)
  751. objects = self.scon.get_container_objects()
  752. if not objects:
  753. raise Exception("There is not any GIT repo here : %s" % self.root)
  754. objects = [o["name"].split("/")[0] for o in objects]
  755. if OBJECTDIR not in objects:
  756. raise Exception("This repository (%s) is not bare." % self.root)
  757. self.bare = True
  758. self._controldir = self.root
  759. object_store = SwiftObjectStore(self.scon)
  760. refs = SwiftInfoRefsContainer(self.scon, object_store)
  761. BaseRepo.__init__(self, object_store, refs)
  762. def _determine_file_mode(self):
  763. """Probe the file-system to determine whether permissions can be trusted.
  764. Returns: True if permissions can be trusted, False otherwise.
  765. """
  766. return False
  767. def _put_named_file(self, filename, contents):
  768. """Put an object in a Swift container.
  769. Args:
  770. filename: the path to the object to put on Swift
  771. contents: the content as bytestring
  772. """
  773. with BytesIO() as f:
  774. f.write(contents)
  775. self.scon.put_object(filename, f)
  776. @classmethod
  777. def init_bare(cls, scon, conf):
  778. """Create a new bare repository.
  779. Args:
  780. scon: a `SwiftConnector` instance
  781. conf: a ConfigParser object
  782. Returns:
  783. a `SwiftRepo` instance
  784. """
  785. scon.create_root()
  786. for obj in [
  787. posixpath.join(OBJECTDIR, PACKDIR),
  788. posixpath.join(INFODIR, "refs"),
  789. ]:
  790. scon.put_object(obj, BytesIO(b""))
  791. ret = cls(scon.root, conf)
  792. ret._init_files(True)
  793. return ret
  794. class SwiftSystemBackend(Backend):
  795. def __init__(self, logger, conf) -> None:
  796. self.conf = conf
  797. self.logger = logger
  798. def open_repository(self, path):
  799. self.logger.info("opening repository at %s", path)
  800. return SwiftRepo(path, self.conf)
  801. def cmd_daemon(args):
  802. """Entry point for starting a TCP git server."""
  803. import optparse
  804. parser = optparse.OptionParser()
  805. parser.add_option(
  806. "-l",
  807. "--listen_address",
  808. dest="listen_address",
  809. default="127.0.0.1",
  810. help="Binding IP address.",
  811. )
  812. parser.add_option(
  813. "-p",
  814. "--port",
  815. dest="port",
  816. type=int,
  817. default=TCP_GIT_PORT,
  818. help="Binding TCP port.",
  819. )
  820. parser.add_option(
  821. "-c",
  822. "--swift_config",
  823. dest="swift_config",
  824. default="",
  825. help="Path to the configuration file for Swift backend.",
  826. )
  827. options, args = parser.parse_args(args)
  828. try:
  829. import gevent
  830. import geventhttpclient # noqa: F401
  831. except ImportError:
  832. print(
  833. "gevent and geventhttpclient libraries are mandatory "
  834. " for use the Swift backend."
  835. )
  836. sys.exit(1)
  837. import gevent.monkey
  838. gevent.monkey.patch_socket()
  839. from dulwich import log_utils
  840. logger = log_utils.getLogger(__name__)
  841. conf = load_conf(options.swift_config)
  842. backend = SwiftSystemBackend(logger, conf)
  843. log_utils.default_logging_config()
  844. server = TCPGitServer(backend, options.listen_address, port=options.port)
  845. server.serve_forever()
  846. def cmd_init(args):
  847. import optparse
  848. parser = optparse.OptionParser()
  849. parser.add_option(
  850. "-c",
  851. "--swift_config",
  852. dest="swift_config",
  853. default="",
  854. help="Path to the configuration file for Swift backend.",
  855. )
  856. options, args = parser.parse_args(args)
  857. conf = load_conf(options.swift_config)
  858. if args == []:
  859. parser.error("missing repository name")
  860. repo = args[0]
  861. scon = SwiftConnector(repo, conf)
  862. SwiftRepo.init_bare(scon, conf)
  863. def main(argv=sys.argv):
  864. commands = {
  865. "init": cmd_init,
  866. "daemon": cmd_daemon,
  867. }
  868. if len(sys.argv) < 2:
  869. print(
  870. "Usage: {} <{}> [OPTIONS...]".format(sys.argv[0], "|".join(commands.keys()))
  871. )
  872. sys.exit(1)
  873. cmd = sys.argv[1]
  874. if cmd not in commands:
  875. print("No such subcommand: %s" % cmd)
  876. sys.exit(1)
  877. commands[cmd](sys.argv[2:])
  878. if __name__ == "__main__":
  879. main()