12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178 |
- # server.py -- Implementation of the server side git protocols
- # Copyright (C) 2008 John Carr <john.carr@unrouted.co.uk>
- # Coprygith (C) 2011-2012 Jelmer Vernooij <jelmer@jelmer.uk>
- #
- # Dulwich is dual-licensed under the Apache License, Version 2.0 and the GNU
- # General Public License as public by the Free Software Foundation; version 2.0
- # or (at your option) any later version. You can redistribute it and/or
- # modify it under the terms of either of these two licenses.
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- #
- # You should have received a copy of the licenses; if not, see
- # <http://www.gnu.org/licenses/> for a copy of the GNU General Public License
- # and <http://www.apache.org/licenses/LICENSE-2.0> for a copy of the Apache
- # License, Version 2.0.
- #
- """Git smart network protocol server implementation.
- For more detailed implementation on the network protocol, see the
- Documentation/technical directory in the cgit distribution, and in particular:
- * Documentation/technical/protocol-capabilities.txt
- * Documentation/technical/pack-protocol.txt
- Currently supported capabilities:
- * include-tag
- * thin-pack
- * multi_ack_detailed
- * multi_ack
- * side-band-64k
- * ofs-delta
- * no-progress
- * report-status
- * delete-refs
- * shallow
- * symref
- """
- import collections
- import os
- import socket
- import sys
- import time
- import zlib
- try:
- import SocketServer
- except ImportError:
- import socketserver as SocketServer
- from dulwich.archive import tar_stream
- from dulwich.errors import (
- ApplyDeltaError,
- ChecksumMismatch,
- GitProtocolError,
- NotGitRepository,
- UnexpectedCommandError,
- ObjectFormatException,
- )
- from dulwich import log_utils
- from dulwich.objects import (
- Commit,
- valid_hexsha,
- )
- from dulwich.pack import (
- write_pack_objects,
- )
- from dulwich.protocol import ( # noqa: F401
- BufferedPktLineWriter,
- capability_agent,
- CAPABILITIES_REF,
- CAPABILITY_DELETE_REFS,
- CAPABILITY_INCLUDE_TAG,
- CAPABILITY_MULTI_ACK_DETAILED,
- CAPABILITY_MULTI_ACK,
- CAPABILITY_NO_DONE,
- CAPABILITY_NO_PROGRESS,
- CAPABILITY_OFS_DELTA,
- CAPABILITY_QUIET,
- CAPABILITY_REPORT_STATUS,
- CAPABILITY_SHALLOW,
- CAPABILITY_SIDE_BAND_64K,
- CAPABILITY_THIN_PACK,
- COMMAND_DEEPEN,
- COMMAND_DONE,
- COMMAND_HAVE,
- COMMAND_SHALLOW,
- COMMAND_UNSHALLOW,
- COMMAND_WANT,
- MULTI_ACK,
- MULTI_ACK_DETAILED,
- Protocol,
- ProtocolFile,
- ReceivableProtocol,
- SIDE_BAND_CHANNEL_DATA,
- SIDE_BAND_CHANNEL_PROGRESS,
- SIDE_BAND_CHANNEL_FATAL,
- SINGLE_ACK,
- TCP_GIT_PORT,
- ZERO_SHA,
- ack_type,
- extract_capabilities,
- extract_want_line_capabilities,
- symref_capabilities,
- )
- from dulwich.refs import (
- ANNOTATED_TAG_SUFFIX,
- write_info_refs,
- )
- from dulwich.repo import (
- Repo,
- )
- logger = log_utils.getLogger(__name__)
- class Backend(object):
- """A backend for the Git smart server implementation."""
- def open_repository(self, path):
- """Open the repository at a path.
- :param path: Path to the repository
- :raise NotGitRepository: no git repository was found at path
- :return: Instance of BackendRepo
- """
- raise NotImplementedError(self.open_repository)
- class BackendRepo(object):
- """Repository abstraction used by the Git server.
- The methods required here are a subset of those provided by
- dulwich.repo.Repo.
- """
- object_store = None
- refs = None
- def get_refs(self):
- """
- Get all the refs in the repository
- :return: dict of name -> sha
- """
- raise NotImplementedError
- def get_peeled(self, name):
- """Return the cached peeled value of a ref, if available.
- :param name: Name of the ref to peel
- :return: The peeled value of the ref. If the ref is known not point to
- a tag, this will be the SHA the ref refers to. If no cached
- information about a tag is available, this method may return None,
- but it should attempt to peel the tag if possible.
- """
- return None
- def fetch_objects(self, determine_wants, graph_walker, progress,
- get_tagged=None):
- """
- Yield the objects required for a list of commits.
- :param progress: is a callback to send progress messages to the client
- :param get_tagged: Function that returns a dict of pointed-to sha ->
- tag sha for including tags.
- """
- raise NotImplementedError
- class DictBackend(Backend):
- """Trivial backend that looks up Git repositories in a dictionary."""
- def __init__(self, repos):
- self.repos = repos
- def open_repository(self, path):
- logger.debug('Opening repository at %s', path)
- try:
- return self.repos[path]
- except KeyError:
- raise NotGitRepository(
- "No git repository was found at %(path)s" % dict(path=path)
- )
- class FileSystemBackend(Backend):
- """Simple backend looking up Git repositories in the local file system."""
- def __init__(self, root=os.sep):
- super(FileSystemBackend, self).__init__()
- self.root = (os.path.abspath(root) + os.sep).replace(
- os.sep * 2, os.sep)
- def open_repository(self, path):
- logger.debug('opening repository at %s', path)
- abspath = os.path.abspath(os.path.join(self.root, path)) + os.sep
- normcase_abspath = os.path.normcase(abspath)
- normcase_root = os.path.normcase(self.root)
- if not normcase_abspath.startswith(normcase_root):
- raise NotGitRepository(
- "Path %r not inside root %r" %
- (path, self.root))
- return Repo(abspath)
- class Handler(object):
- """Smart protocol command handler base class."""
- def __init__(self, backend, proto, http_req=None):
- self.backend = backend
- self.proto = proto
- self.http_req = http_req
- def handle(self):
- raise NotImplementedError(self.handle)
- class PackHandler(Handler):
- """Protocol handler for packs."""
- def __init__(self, backend, proto, http_req=None):
- super(PackHandler, self).__init__(backend, proto, http_req)
- self._client_capabilities = None
- # Flags needed for the no-done capability
- self._done_received = False
- @classmethod
- def capability_line(cls, capabilities):
- logger.info('Sending capabilities: %s', capabilities)
- return b"".join([b" " + c for c in capabilities])
- @classmethod
- def capabilities(cls):
- raise NotImplementedError(cls.capabilities)
- @classmethod
- def innocuous_capabilities(cls):
- return [CAPABILITY_INCLUDE_TAG, CAPABILITY_THIN_PACK,
- CAPABILITY_NO_PROGRESS, CAPABILITY_OFS_DELTA,
- capability_agent()]
- @classmethod
- def required_capabilities(cls):
- """Return a list of capabilities that we require the client to have."""
- return []
- def set_client_capabilities(self, caps):
- allowable_caps = set(self.innocuous_capabilities())
- allowable_caps.update(self.capabilities())
- for cap in caps:
- if cap not in allowable_caps:
- raise GitProtocolError('Client asked for capability %s that '
- 'was not advertised.' % cap)
- for cap in self.required_capabilities():
- if cap not in caps:
- raise GitProtocolError('Client does not support required '
- 'capability %s.' % cap)
- self._client_capabilities = set(caps)
- logger.info('Client capabilities: %s', caps)
- def has_capability(self, cap):
- if self._client_capabilities is None:
- raise GitProtocolError('Server attempted to access capability %s '
- 'before asking client' % cap)
- return cap in self._client_capabilities
- def notify_done(self):
- self._done_received = True
- class UploadPackHandler(PackHandler):
- """Protocol handler for uploading a pack to the client."""
- def __init__(self, backend, args, proto, http_req=None,
- advertise_refs=False):
- super(UploadPackHandler, self).__init__(
- backend, proto, http_req=http_req)
- self.repo = backend.open_repository(args[0])
- self._graph_walker = None
- self.advertise_refs = advertise_refs
- # A state variable for denoting that the have list is still
- # being processed, and the client is not accepting any other
- # data (such as side-band, see the progress method here).
- self._processing_have_lines = False
- @classmethod
- def capabilities(cls):
- return [CAPABILITY_MULTI_ACK_DETAILED, CAPABILITY_MULTI_ACK,
- CAPABILITY_SIDE_BAND_64K, CAPABILITY_THIN_PACK,
- CAPABILITY_OFS_DELTA, CAPABILITY_NO_PROGRESS,
- CAPABILITY_INCLUDE_TAG, CAPABILITY_SHALLOW, CAPABILITY_NO_DONE]
- @classmethod
- def required_capabilities(cls):
- return (CAPABILITY_SIDE_BAND_64K, CAPABILITY_THIN_PACK,
- CAPABILITY_OFS_DELTA)
- def progress(self, message):
- if (self.has_capability(CAPABILITY_NO_PROGRESS) or
- self._processing_have_lines):
- return
- self.proto.write_sideband(SIDE_BAND_CHANNEL_PROGRESS, message)
- def get_tagged(self, refs=None, repo=None):
- """Get a dict of peeled values of tags to their original tag shas.
- :param refs: dict of refname -> sha of possible tags; defaults to all
- of the backend's refs.
- :param repo: optional Repo instance for getting peeled refs; defaults
- to the backend's repo, if available
- :return: dict of peeled_sha -> tag_sha, where tag_sha is the sha of a
- tag whose peeled value is peeled_sha.
- """
- if not self.has_capability(CAPABILITY_INCLUDE_TAG):
- return {}
- if refs is None:
- refs = self.repo.get_refs()
- if repo is None:
- repo = getattr(self.repo, "repo", None)
- if repo is None:
- # Bail if we don't have a Repo available; this is ok since
- # clients must be able to handle if the server doesn't include
- # all relevant tags.
- # TODO: fix behavior when missing
- return {}
- tagged = {}
- for name, sha in refs.items():
- peeled_sha = repo.get_peeled(name)
- if peeled_sha != sha:
- tagged[peeled_sha] = sha
- return tagged
- def handle(self):
- def write(x):
- return self.proto.write_sideband(SIDE_BAND_CHANNEL_DATA, x)
- graph_walker = _ProtocolGraphWalker(
- self, self.repo.object_store, self.repo.get_peeled,
- self.repo.refs.get_symrefs)
- objects_iter = self.repo.fetch_objects(
- graph_walker.determine_wants, graph_walker, self.progress,
- get_tagged=self.get_tagged)
- # Note the fact that client is only processing responses related
- # to the have lines it sent, and any other data (including side-
- # band) will be be considered a fatal error.
- self._processing_have_lines = True
- # Did the process short-circuit (e.g. in a stateless RPC call)? Note
- # that the client still expects a 0-object pack in most cases.
- # Also, if it also happens that the object_iter is instantiated
- # with a graph walker with an implementation that talks over the
- # wire (which is this instance of this class) this will actually
- # iterate through everything and write things out to the wire.
- if len(objects_iter) == 0:
- return
- # The provided haves are processed, and it is safe to send side-
- # band data now.
- self._processing_have_lines = False
- if not graph_walker.handle_done(
- not self.has_capability(CAPABILITY_NO_DONE),
- self._done_received):
- return
- self.progress(
- ("counting objects: %d, done.\n" % len(objects_iter)).encode(
- 'ascii'))
- write_pack_objects(ProtocolFile(None, write), objects_iter)
- # we are done
- self.proto.write_pkt_line(None)
- def _split_proto_line(line, allowed):
- """Split a line read from the wire.
- :param line: The line read from the wire.
- :param allowed: An iterable of command names that should be allowed.
- Command names not listed below as possible return values will be
- ignored. If None, any commands from the possible return values are
- allowed.
- :return: a tuple having one of the following forms:
- ('want', obj_id)
- ('have', obj_id)
- ('done', None)
- (None, None) (for a flush-pkt)
- :raise UnexpectedCommandError: if the line cannot be parsed into one of the
- allowed return values.
- """
- if not line:
- fields = [None]
- else:
- fields = line.rstrip(b'\n').split(b' ', 1)
- command = fields[0]
- if allowed is not None and command not in allowed:
- raise UnexpectedCommandError(command)
- if len(fields) == 1 and command in (COMMAND_DONE, None):
- return (command, None)
- elif len(fields) == 2:
- if command in (COMMAND_WANT, COMMAND_HAVE, COMMAND_SHALLOW,
- COMMAND_UNSHALLOW):
- if not valid_hexsha(fields[1]):
- raise GitProtocolError("Invalid sha")
- return tuple(fields)
- elif command == COMMAND_DEEPEN:
- return command, int(fields[1])
- raise GitProtocolError('Received invalid line from client: %r' % line)
- def _find_shallow(store, heads, depth):
- """Find shallow commits according to a given depth.
- :param store: An ObjectStore for looking up objects.
- :param heads: Iterable of head SHAs to start walking from.
- :param depth: The depth of ancestors to include. A depth of one includes
- only the heads themselves.
- :return: A tuple of (shallow, not_shallow), sets of SHAs that should be
- considered shallow and unshallow according to the arguments. Note that
- these sets may overlap if a commit is reachable along multiple paths.
- """
- parents = {}
- def get_parents(sha):
- result = parents.get(sha, None)
- if not result:
- result = store[sha].parents
- parents[sha] = result
- return result
- todo = [] # stack of (sha, depth)
- for head_sha in heads:
- obj = store.peel_sha(head_sha)
- if isinstance(obj, Commit):
- todo.append((obj.id, 1))
- not_shallow = set()
- shallow = set()
- while todo:
- sha, cur_depth = todo.pop()
- if cur_depth < depth:
- not_shallow.add(sha)
- new_depth = cur_depth + 1
- todo.extend((p, new_depth) for p in get_parents(sha))
- else:
- shallow.add(sha)
- return shallow, not_shallow
- def _want_satisfied(store, haves, want, earliest):
- o = store[want]
- pending = collections.deque([o])
- known = set([want])
- while pending:
- commit = pending.popleft()
- if commit.id in haves:
- return True
- if commit.type_name != b"commit":
- # non-commit wants are assumed to be satisfied
- continue
- for parent in commit.parents:
- if parent in known:
- continue
- known.add(parent)
- parent_obj = store[parent]
- # TODO: handle parents with later commit times than children
- if parent_obj.commit_time >= earliest:
- pending.append(parent_obj)
- return False
- def _all_wants_satisfied(store, haves, wants):
- """Check whether all the current wants are satisfied by a set of haves.
- :param store: Object store to retrieve objects from
- :param haves: A set of commits we know the client has.
- :param wants: A set of commits the client wants
- :note: Wants are specified with set_wants rather than passed in since
- in the current interface they are determined outside this class.
- """
- haves = set(haves)
- if haves:
- earliest = min([store[h].commit_time for h in haves])
- else:
- earliest = 0
- for want in wants:
- if not _want_satisfied(store, haves, want, earliest):
- return False
- return True
- class _ProtocolGraphWalker(object):
- """A graph walker that knows the git protocol.
- As a graph walker, this class implements ack(), next(), and reset(). It
- also contains some base methods for interacting with the wire and walking
- the commit tree.
- The work of determining which acks to send is passed on to the
- implementation instance stored in _impl. The reason for this is that we do
- not know at object creation time what ack level the protocol requires. A
- call to set_ack_type() is required to set up the implementation, before
- any calls to next() or ack() are made.
- """
- def __init__(self, handler, object_store, get_peeled, get_symrefs):
- self.handler = handler
- self.store = object_store
- self.get_peeled = get_peeled
- self.get_symrefs = get_symrefs
- self.proto = handler.proto
- self.http_req = handler.http_req
- self.advertise_refs = handler.advertise_refs
- self._wants = []
- self.shallow = set()
- self.client_shallow = set()
- self.unshallow = set()
- self._cached = False
- self._cache = []
- self._cache_index = 0
- self._impl = None
- def determine_wants(self, heads):
- """Determine the wants for a set of heads.
- The given heads are advertised to the client, who then specifies which
- refs he wants using 'want' lines. This portion of the protocol is the
- same regardless of ack type, and in fact is used to set the ack type of
- the ProtocolGraphWalker.
- If the client has the 'shallow' capability, this method also reads and
- responds to the 'shallow' and 'deepen' lines from the client. These are
- not part of the wants per se, but they set up necessary state for
- walking the graph. Additionally, later code depends on this method
- consuming everything up to the first 'have' line.
- :param heads: a dict of refname->SHA1 to advertise
- :return: a list of SHA1s requested by the client
- """
- symrefs = self.get_symrefs()
- values = set(heads.values())
- if self.advertise_refs or not self.http_req:
- for i, (ref, sha) in enumerate(sorted(heads.items())):
- line = sha + b' ' + ref
- if not i:
- line += (b'\x00' +
- self.handler.capability_line(
- self.handler.capabilities() +
- symref_capabilities(symrefs.items())))
- self.proto.write_pkt_line(line + b'\n')
- peeled_sha = self.get_peeled(ref)
- if peeled_sha != sha:
- self.proto.write_pkt_line(
- peeled_sha + b' ' + ref + ANNOTATED_TAG_SUFFIX + b'\n')
- # i'm done..
- self.proto.write_pkt_line(None)
- if self.advertise_refs:
- return []
- # Now client will sending want want want commands
- want = self.proto.read_pkt_line()
- if not want:
- return []
- line, caps = extract_want_line_capabilities(want)
- self.handler.set_client_capabilities(caps)
- self.set_ack_type(ack_type(caps))
- allowed = (COMMAND_WANT, COMMAND_SHALLOW, COMMAND_DEEPEN, None)
- command, sha = _split_proto_line(line, allowed)
- want_revs = []
- while command == COMMAND_WANT:
- if sha not in values:
- raise GitProtocolError(
- 'Client wants invalid object %s' % sha)
- want_revs.append(sha)
- command, sha = self.read_proto_line(allowed)
- self.set_wants(want_revs)
- if command in (COMMAND_SHALLOW, COMMAND_DEEPEN):
- self.unread_proto_line(command, sha)
- self._handle_shallow_request(want_revs)
- if self.http_req and self.proto.eof():
- # The client may close the socket at this point, expecting a
- # flush-pkt from the server. We might be ready to send a packfile
- # at this point, so we need to explicitly short-circuit in this
- # case.
- return []
- return want_revs
- def unread_proto_line(self, command, value):
- if isinstance(value, int):
- value = str(value).encode('ascii')
- self.proto.unread_pkt_line(command + b' ' + value)
- def ack(self, have_ref):
- if len(have_ref) != 40:
- raise ValueError("invalid sha %r" % have_ref)
- return self._impl.ack(have_ref)
- def reset(self):
- self._cached = True
- self._cache_index = 0
- def next(self):
- if not self._cached:
- if not self._impl and self.http_req:
- return None
- return next(self._impl)
- self._cache_index += 1
- if self._cache_index > len(self._cache):
- return None
- return self._cache[self._cache_index]
- __next__ = next
- def read_proto_line(self, allowed):
- """Read a line from the wire.
- :param allowed: An iterable of command names that should be allowed.
- :return: A tuple of (command, value); see _split_proto_line.
- :raise UnexpectedCommandError: If an error occurred reading the line.
- """
- return _split_proto_line(self.proto.read_pkt_line(), allowed)
- def _handle_shallow_request(self, wants):
- while True:
- command, val = self.read_proto_line(
- (COMMAND_DEEPEN, COMMAND_SHALLOW))
- if command == COMMAND_DEEPEN:
- depth = val
- break
- self.client_shallow.add(val)
- self.read_proto_line((None,)) # consume client's flush-pkt
- shallow, not_shallow = _find_shallow(self.store, wants, depth)
- # Update self.shallow instead of reassigning it since we passed a
- # reference to it before this method was called.
- self.shallow.update(shallow - not_shallow)
- new_shallow = self.shallow - self.client_shallow
- unshallow = self.unshallow = not_shallow & self.client_shallow
- for sha in sorted(new_shallow):
- self.proto.write_pkt_line(COMMAND_SHALLOW + b' ' + sha)
- for sha in sorted(unshallow):
- self.proto.write_pkt_line(COMMAND_UNSHALLOW + b' ' + sha)
- self.proto.write_pkt_line(None)
- def notify_done(self):
- # relay the message down to the handler.
- self.handler.notify_done()
- def send_ack(self, sha, ack_type=b''):
- if ack_type:
- ack_type = b' ' + ack_type
- self.proto.write_pkt_line(b'ACK ' + sha + ack_type + b'\n')
- def send_nak(self):
- self.proto.write_pkt_line(b'NAK\n')
- def handle_done(self, done_required, done_received):
- # Delegate this to the implementation.
- return self._impl.handle_done(done_required, done_received)
- def set_wants(self, wants):
- self._wants = wants
- def all_wants_satisfied(self, haves):
- """Check whether all the current wants are satisfied by a set of haves.
- :param haves: A set of commits we know the client has.
- :note: Wants are specified with set_wants rather than passed in since
- in the current interface they are determined outside this class.
- """
- return _all_wants_satisfied(self.store, haves, self._wants)
- def set_ack_type(self, ack_type):
- impl_classes = {
- MULTI_ACK: MultiAckGraphWalkerImpl,
- MULTI_ACK_DETAILED: MultiAckDetailedGraphWalkerImpl,
- SINGLE_ACK: SingleAckGraphWalkerImpl,
- }
- self._impl = impl_classes[ack_type](self)
- _GRAPH_WALKER_COMMANDS = (COMMAND_HAVE, COMMAND_DONE, None)
- class SingleAckGraphWalkerImpl(object):
- """Graph walker implementation that speaks the single-ack protocol."""
- def __init__(self, walker):
- self.walker = walker
- self._common = []
- def ack(self, have_ref):
- if not self._common:
- self.walker.send_ack(have_ref)
- self._common.append(have_ref)
- def next(self):
- command, sha = self.walker.read_proto_line(_GRAPH_WALKER_COMMANDS)
- if command in (None, COMMAND_DONE):
- # defer the handling of done
- self.walker.notify_done()
- return None
- elif command == COMMAND_HAVE:
- return sha
- __next__ = next
- def handle_done(self, done_required, done_received):
- if not self._common:
- self.walker.send_nak()
- if done_required and not done_received:
- # we are not done, especially when done is required; skip
- # the pack for this request and especially do not handle
- # the done.
- return False
- if not done_received and not self._common:
- # Okay we are not actually done then since the walker picked
- # up no haves. This is usually triggered when client attempts
- # to pull from a source that has no common base_commit.
- # See: test_server.MultiAckDetailedGraphWalkerImplTestCase.\
- # test_multi_ack_stateless_nodone
- return False
- return True
- class MultiAckGraphWalkerImpl(object):
- """Graph walker implementation that speaks the multi-ack protocol."""
- def __init__(self, walker):
- self.walker = walker
- self._found_base = False
- self._common = []
- def ack(self, have_ref):
- self._common.append(have_ref)
- if not self._found_base:
- self.walker.send_ack(have_ref, b'continue')
- if self.walker.all_wants_satisfied(self._common):
- self._found_base = True
- # else we blind ack within next
- def next(self):
- while True:
- command, sha = self.walker.read_proto_line(_GRAPH_WALKER_COMMANDS)
- if command is None:
- self.walker.send_nak()
- # in multi-ack mode, a flush-pkt indicates the client wants to
- # flush but more have lines are still coming
- continue
- elif command == COMMAND_DONE:
- self.walker.notify_done()
- return None
- elif command == COMMAND_HAVE:
- if self._found_base:
- # blind ack
- self.walker.send_ack(sha, b'continue')
- return sha
- __next__ = next
- def handle_done(self, done_required, done_received):
- if done_required and not done_received:
- # we are not done, especially when done is required; skip
- # the pack for this request and especially do not handle
- # the done.
- return False
- if not done_received and not self._common:
- # Okay we are not actually done then since the walker picked
- # up no haves. This is usually triggered when client attempts
- # to pull from a source that has no common base_commit.
- # See: test_server.MultiAckDetailedGraphWalkerImplTestCase.\
- # test_multi_ack_stateless_nodone
- return False
- # don't nak unless no common commits were found, even if not
- # everything is satisfied
- if self._common:
- self.walker.send_ack(self._common[-1])
- else:
- self.walker.send_nak()
- return True
- class MultiAckDetailedGraphWalkerImpl(object):
- """Graph walker implementation speaking the multi-ack-detailed protocol."""
- def __init__(self, walker):
- self.walker = walker
- self._common = []
- def ack(self, have_ref):
- # Should only be called iff have_ref is common
- self._common.append(have_ref)
- self.walker.send_ack(have_ref, b'common')
- def next(self):
- while True:
- command, sha = self.walker.read_proto_line(_GRAPH_WALKER_COMMANDS)
- if command is None:
- if self.walker.all_wants_satisfied(self._common):
- self.walker.send_ack(self._common[-1], b'ready')
- self.walker.send_nak()
- if self.walker.http_req:
- # The HTTP version of this request a flush-pkt always
- # signifies an end of request, so we also return
- # nothing here as if we are done (but not really, as
- # it depends on whether no-done capability was
- # specified and that's handled in handle_done which
- # may or may not call post_nodone_check depending on
- # that).
- return None
- elif command == COMMAND_DONE:
- # Let the walker know that we got a done.
- self.walker.notify_done()
- break
- elif command == COMMAND_HAVE:
- # return the sha and let the caller ACK it with the
- # above ack method.
- return sha
- # don't nak unless no common commits were found, even if not
- # everything is satisfied
- __next__ = next
- def handle_done(self, done_required, done_received):
- if done_required and not done_received:
- # we are not done, especially when done is required; skip
- # the pack for this request and especially do not handle
- # the done.
- return False
- if not done_received and not self._common:
- # Okay we are not actually done then since the walker picked
- # up no haves. This is usually triggered when client attempts
- # to pull from a source that has no common base_commit.
- # See: test_server.MultiAckDetailedGraphWalkerImplTestCase.\
- # test_multi_ack_stateless_nodone
- return False
- # don't nak unless no common commits were found, even if not
- # everything is satisfied
- if self._common:
- self.walker.send_ack(self._common[-1])
- else:
- self.walker.send_nak()
- return True
- class ReceivePackHandler(PackHandler):
- """Protocol handler for downloading a pack from the client."""
- def __init__(self, backend, args, proto, http_req=None,
- advertise_refs=False):
- super(ReceivePackHandler, self).__init__(
- backend, proto, http_req=http_req)
- self.repo = backend.open_repository(args[0])
- self.advertise_refs = advertise_refs
- @classmethod
- def capabilities(cls):
- return [CAPABILITY_REPORT_STATUS, CAPABILITY_DELETE_REFS,
- CAPABILITY_QUIET, CAPABILITY_OFS_DELTA,
- CAPABILITY_SIDE_BAND_64K, CAPABILITY_NO_DONE]
- def _apply_pack(self, refs):
- all_exceptions = (IOError, OSError, ChecksumMismatch, ApplyDeltaError,
- AssertionError, socket.error, zlib.error,
- ObjectFormatException)
- status = []
- will_send_pack = False
- for command in refs:
- if command[1] != ZERO_SHA:
- will_send_pack = True
- if will_send_pack:
- # TODO: more informative error messages than just the exception
- # string
- try:
- recv = getattr(self.proto, "recv", None)
- self.repo.object_store.add_thin_pack(self.proto.read, recv)
- status.append((b'unpack', b'ok'))
- except all_exceptions as e:
- status.append((b'unpack', str(e).replace('\n', '')))
- # The pack may still have been moved in, but it may contain
- # broken objects. We trust a later GC to clean it up.
- else:
- # The git protocol want to find a status entry related to unpack
- # process even if no pack data has been sent.
- status.append((b'unpack', b'ok'))
- for oldsha, sha, ref in refs:
- ref_status = b'ok'
- try:
- if sha == ZERO_SHA:
- if CAPABILITY_DELETE_REFS not in self.capabilities():
- raise GitProtocolError(
- 'Attempted to delete refs without delete-refs '
- 'capability.')
- try:
- self.repo.refs.remove_if_equals(ref, oldsha)
- except all_exceptions:
- ref_status = b'failed to delete'
- else:
- try:
- self.repo.refs.set_if_equals(ref, oldsha, sha)
- except all_exceptions:
- ref_status = b'failed to write'
- except KeyError:
- ref_status = b'bad ref'
- status.append((ref, ref_status))
- return status
- def _report_status(self, status):
- if self.has_capability(CAPABILITY_SIDE_BAND_64K):
- writer = BufferedPktLineWriter(
- lambda d: self.proto.write_sideband(SIDE_BAND_CHANNEL_DATA, d))
- write = writer.write
- def flush():
- writer.flush()
- self.proto.write_pkt_line(None)
- else:
- write = self.proto.write_pkt_line
- def flush():
- pass
- for name, msg in status:
- if name == b'unpack':
- write(b'unpack ' + msg + b'\n')
- elif msg == b'ok':
- write(b'ok ' + name + b'\n')
- else:
- write(b'ng ' + name + b' ' + msg + b'\n')
- write(None)
- flush()
- def handle(self):
- if self.advertise_refs or not self.http_req:
- refs = sorted(self.repo.get_refs().items())
- symrefs = sorted(self.repo.refs.get_symrefs().items())
- if not refs:
- refs = [(CAPABILITIES_REF, ZERO_SHA)]
- self.proto.write_pkt_line(
- refs[0][1] + b' ' + refs[0][0] + b'\0' +
- self.capability_line(
- self.capabilities() + symref_capabilities(symrefs)) + b'\n')
- for i in range(1, len(refs)):
- ref = refs[i]
- self.proto.write_pkt_line(ref[1] + b' ' + ref[0] + b'\n')
- self.proto.write_pkt_line(None)
- if self.advertise_refs:
- return
- client_refs = []
- ref = self.proto.read_pkt_line()
- # if ref is none then client doesnt want to send us anything..
- if ref is None:
- return
- ref, caps = extract_capabilities(ref)
- self.set_client_capabilities(caps)
- # client will now send us a list of (oldsha, newsha, ref)
- while ref:
- client_refs.append(ref.split())
- ref = self.proto.read_pkt_line()
- # backend can now deal with this refs and read a pack using self.read
- status = self._apply_pack(client_refs)
- # when we have read all the pack from the client, send a status report
- # if the client asked for it
- if self.has_capability(CAPABILITY_REPORT_STATUS):
- self._report_status(status)
- class UploadArchiveHandler(Handler):
- def __init__(self, backend, args, proto, http_req=None):
- super(UploadArchiveHandler, self).__init__(backend, proto, http_req)
- self.repo = backend.open_repository(args[0])
- def handle(self):
- def write(x):
- return self.proto.write_sideband(SIDE_BAND_CHANNEL_DATA, x)
- arguments = []
- for pkt in self.proto.read_pkt_seq():
- (key, value) = pkt.split(b' ', 1)
- if key != b'argument':
- raise GitProtocolError('unknown command %s' % key)
- arguments.append(value.rstrip(b'\n'))
- prefix = b''
- format = 'tar'
- i = 0
- store = self.repo.object_store
- while i < len(arguments):
- argument = arguments[i]
- if argument == b'--prefix':
- i += 1
- prefix = arguments[i]
- elif argument == b'--format':
- i += 1
- format = arguments[i].decode('ascii')
- else:
- commit_sha = self.repo.refs[argument]
- tree = store[store[commit_sha].tree]
- i += 1
- self.proto.write_pkt_line(b'ACK\n')
- self.proto.write_pkt_line(None)
- for chunk in tar_stream(
- store, tree, mtime=time.time(), prefix=prefix, format=format):
- write(chunk)
- self.proto.write_pkt_line(None)
- # Default handler classes for git services.
- DEFAULT_HANDLERS = {
- b'git-upload-pack': UploadPackHandler,
- b'git-receive-pack': ReceivePackHandler,
- b'git-upload-archive': UploadArchiveHandler,
- }
- class TCPGitRequestHandler(SocketServer.StreamRequestHandler):
- def __init__(self, handlers, *args, **kwargs):
- self.handlers = handlers
- SocketServer.StreamRequestHandler.__init__(self, *args, **kwargs)
- def handle(self):
- proto = ReceivableProtocol(self.connection.recv, self.wfile.write)
- command, args = proto.read_cmd()
- logger.info('Handling %s request, args=%s', command, args)
- cls = self.handlers.get(command, None)
- if not callable(cls):
- raise GitProtocolError('Invalid service %s' % command)
- h = cls(self.server.backend, args, proto)
- h.handle()
- class TCPGitServer(SocketServer.TCPServer):
- allow_reuse_address = True
- serve = SocketServer.TCPServer.serve_forever
- def _make_handler(self, *args, **kwargs):
- return TCPGitRequestHandler(self.handlers, *args, **kwargs)
- def __init__(self, backend, listen_addr, port=TCP_GIT_PORT, handlers=None):
- self.handlers = dict(DEFAULT_HANDLERS)
- if handlers is not None:
- self.handlers.update(handlers)
- self.backend = backend
- logger.info('Listening for TCP connections on %s:%d',
- listen_addr, port)
- SocketServer.TCPServer.__init__(self, (listen_addr, port),
- self._make_handler)
- def verify_request(self, request, client_address):
- logger.info('Handling request from %s', client_address)
- return True
- def handle_error(self, request, client_address):
- logger.exception('Exception happened during processing of request '
- 'from %s', client_address)
- def main(argv=sys.argv):
- """Entry point for starting a TCP git server."""
- import optparse
- parser = optparse.OptionParser()
- parser.add_option("-l", "--listen_address", dest="listen_address",
- default="localhost",
- help="Binding IP address.")
- parser.add_option("-p", "--port", dest="port", type=int,
- default=TCP_GIT_PORT,
- help="Binding TCP port.")
- options, args = parser.parse_args(argv)
- log_utils.default_logging_config()
- if len(args) > 1:
- gitdir = args[1]
- else:
- gitdir = '.'
- # TODO(jelmer): Support git-daemon-export-ok and --export-all.
- backend = FileSystemBackend(gitdir)
- server = TCPGitServer(backend, options.listen_address, options.port)
- server.serve_forever()
- def serve_command(handler_cls, argv=sys.argv, backend=None, inf=sys.stdin,
- outf=sys.stdout):
- """Serve a single command.
- This is mostly useful for the implementation of commands used by e.g.
- git+ssh.
- :param handler_cls: `Handler` class to use for the request
- :param argv: execv-style command-line arguments. Defaults to sys.argv.
- :param backend: `Backend` to use
- :param inf: File-like object to read from, defaults to standard input.
- :param outf: File-like object to write to, defaults to standard output.
- :return: Exit code for use with sys.exit. 0 on success, 1 on failure.
- """
- if backend is None:
- backend = FileSystemBackend()
- def send_fn(data):
- outf.write(data)
- outf.flush()
- proto = Protocol(inf.read, send_fn)
- handler = handler_cls(backend, argv[1:], proto)
- # FIXME: Catch exceptions and write a single-line summary to outf.
- handler.handle()
- return 0
- def generate_info_refs(repo):
- """Generate an info refs file."""
- refs = repo.get_refs()
- return write_info_refs(refs, repo.object_store)
- def generate_objects_info_packs(repo):
- """Generate an index for for packs."""
- for pack in repo.object_store.packs:
- yield (
- b'P ' + pack.data.filename.encode(sys.getfilesystemencoding()) +
- b'\n')
- def update_server_info(repo):
- """Generate server info for dumb file access.
- This generates info/refs and objects/info/packs,
- similar to "git update-server-info".
- """
- repo._put_named_file(
- os.path.join('info', 'refs'),
- b"".join(generate_info_refs(repo)))
- repo._put_named_file(
- os.path.join('objects', 'info', 'packs'),
- b"".join(generate_objects_info_packs(repo)))
- if __name__ == '__main__':
- main()
|