123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312 |
- # protocol.py -- Shared parts of the git protocols
- # Copryight (C) 2008 John Carr <john.carr@unrouted.co.uk>
- # Copyright (C) 2008 Jelmer Vernooij <jelmer@samba.org>
- #
- # This program is free software; you can redistribute it and/or
- # modify it under the terms of the GNU General Public License
- # as published by the Free Software Foundation; version 2
- # or (at your option) any later version of the License.
- #
- # This program is distributed in the hope that it will be useful,
- # but WITHOUT ANY WARRANTY; without even the implied warranty of
- # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- # GNU General Public License for more details.
- #
- # You should have received a copy of the GNU General Public License
- # along with this program; if not, write to the Free Software
- # Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
- # MA 02110-1301, USA.
- """Generic functions for talking the git smart server protocol."""
- from cStringIO import StringIO
- import os
- import socket
- from dulwich.errors import (
- HangupException,
- GitProtocolError,
- )
- from dulwich.misc import (
- SEEK_END,
- )
- TCP_GIT_PORT = 9418
- ZERO_SHA = "0" * 40
- SINGLE_ACK = 0
- MULTI_ACK = 1
- MULTI_ACK_DETAILED = 2
- class ProtocolFile(object):
- """
- Some network ops are like file ops. The file ops expect to operate on
- file objects, so provide them with a dummy file.
- """
- def __init__(self, read, write):
- self.read = read
- self.write = write
- def tell(self):
- pass
- def close(self):
- pass
- class Protocol(object):
- def __init__(self, read, write, report_activity=None):
- self.read = read
- self.write = write
- self.report_activity = report_activity
- def read_pkt_line(self):
- """
- Reads a 'pkt line' from the remote git process
- :return: The next string from the stream
- """
- try:
- sizestr = self.read(4)
- if not sizestr:
- raise HangupException()
- size = int(sizestr, 16)
- if size == 0:
- if self.report_activity:
- self.report_activity(4, 'read')
- return None
- if self.report_activity:
- self.report_activity(size, 'read')
- return self.read(size-4)
- except socket.error, e:
- raise GitProtocolError(e)
- def read_pkt_seq(self):
- pkt = self.read_pkt_line()
- while pkt:
- yield pkt
- pkt = self.read_pkt_line()
- def write_pkt_line(self, line):
- """
- Sends a 'pkt line' to the remote git process
- :param line: A string containing the data to send
- """
- try:
- if line is None:
- self.write("0000")
- if self.report_activity:
- self.report_activity(4, 'write')
- else:
- self.write("%04x%s" % (len(line)+4, line))
- if self.report_activity:
- self.report_activity(4+len(line), 'write')
- except socket.error, e:
- raise GitProtocolError(e)
- def write_file(self):
- class ProtocolFile(object):
- def __init__(self, proto):
- self._proto = proto
- self._offset = 0
- def write(self, data):
- self._proto.write(data)
- self._offset += len(data)
- def tell(self):
- return self._offset
- def close(self):
- pass
- return ProtocolFile(self)
- def write_sideband(self, channel, blob):
- """
- Write data to the sideband (a git multiplexing method)
- :param channel: int specifying which channel to write to
- :param blob: a blob of data (as a string) to send on this channel
- """
- # a pktline can be a max of 65520. a sideband line can therefore be
- # 65520-5 = 65515
- # WTF: Why have the len in ASCII, but the channel in binary.
- while blob:
- self.write_pkt_line("%s%s" % (chr(channel), blob[:65515]))
- blob = blob[65515:]
- def send_cmd(self, cmd, *args):
- """
- Send a command and some arguments to a git server
- Only used for git://
- :param cmd: The remote service to access
- :param args: List of arguments to send to remove service
- """
- self.write_pkt_line("%s %s" % (cmd, "".join(["%s\0" % a for a in args])))
- def read_cmd(self):
- """
- Read a command and some arguments from the git client
- Only used for git://
- :return: A tuple of (command, [list of arguments])
- """
- line = self.read_pkt_line()
- splice_at = line.find(" ")
- cmd, args = line[:splice_at], line[splice_at+1:]
- assert args[-1] == "\x00"
- return cmd, args[:-1].split(chr(0))
- _RBUFSIZE = 8192 # Default read buffer size.
- class ReceivableProtocol(Protocol):
- """Variant of Protocol that allows reading up to a size without blocking.
- This class has a recv() method that behaves like socket.recv() in addition
- to a read() method.
- If you want to read n bytes from the wire and block until exactly n bytes
- (or EOF) are read, use read(n). If you want to read at most n bytes from the
- wire but don't care if you get less, use recv(n). Note that recv(n) will
- still block until at least one byte is read.
- """
- def __init__(self, recv, write, report_activity=None, rbufsize=_RBUFSIZE):
- super(ReceivableProtocol, self).__init__(self.read, write,
- report_activity)
- self._recv = recv
- self._rbuf = StringIO()
- self._rbufsize = rbufsize
- def read(self, size):
- # From _fileobj.read in socket.py in the Python 2.6.5 standard library,
- # with the following modifications:
- # - omit the size <= 0 branch
- # - seek back to start rather than 0 in case some buffer has been
- # consumed.
- # - use SEEK_END instead of the magic number.
- # Copyright (c) 2001-2010 Python Software Foundation; All Rights Reserved
- # Licensed under the Python Software Foundation License.
- # TODO: see if buffer is more efficient than cStringIO.
- assert size > 0
- # Our use of StringIO rather than lists of string objects returned by
- # recv() minimizes memory usage and fragmentation that occurs when
- # rbufsize is large compared to the typical return value of recv().
- buf = self._rbuf
- start = buf.tell()
- buf.seek(0, SEEK_END)
- # buffer may have been partially consumed by recv()
- buf_len = buf.tell() - start
- if buf_len >= size:
- # Already have size bytes in our buffer? Extract and return.
- buf.seek(start)
- rv = buf.read(size)
- self._rbuf = StringIO()
- self._rbuf.write(buf.read())
- self._rbuf.seek(0)
- return rv
- self._rbuf = StringIO() # reset _rbuf. we consume it via buf.
- while True:
- left = size - buf_len
- # recv() will malloc the amount of memory given as its
- # parameter even though it often returns much less data
- # than that. The returned data string is short lived
- # as we copy it into a StringIO and free it. This avoids
- # fragmentation issues on many platforms.
- data = self._recv(left)
- if not data:
- break
- n = len(data)
- if n == size and not buf_len:
- # Shortcut. Avoid buffer data copies when:
- # - We have no data in our buffer.
- # AND
- # - Our call to recv returned exactly the
- # number of bytes we were asked to read.
- return data
- if n == left:
- buf.write(data)
- del data # explicit free
- break
- assert n <= left, "_recv(%d) returned %d bytes" % (left, n)
- buf.write(data)
- buf_len += n
- del data # explicit free
- #assert buf_len == buf.tell()
- buf.seek(start)
- return buf.read()
- def recv(self, size):
- assert size > 0
- buf = self._rbuf
- start = buf.tell()
- buf.seek(0, SEEK_END)
- buf_len = buf.tell()
- buf.seek(start)
- left = buf_len - start
- if not left:
- # only read from the wire if our read buffer is exhausted
- data = self._recv(self._rbufsize)
- if len(data) == size:
- # shortcut: skip the buffer if we read exactly size bytes
- return data
- buf = StringIO()
- buf.write(data)
- buf.seek(0)
- del data # explicit free
- self._rbuf = buf
- return buf.read(size)
- def extract_capabilities(text):
- """Extract a capabilities list from a string, if present.
- :param text: String to extract from
- :return: Tuple with text with capabilities removed and list of capabilities
- """
- if not "\0" in text:
- return text, []
- text, capabilities = text.rstrip().split("\0")
- return (text, capabilities.strip().split(" "))
- def extract_want_line_capabilities(text):
- """Extract a capabilities list from a want line, if present.
- Note that want lines have capabilities separated from the rest of the line
- by a space instead of a null byte. Thus want lines have the form:
- want obj-id cap1 cap2 ...
- :param text: Want line to extract from
- :return: Tuple with text with capabilities removed and list of capabilities
- """
- split_text = text.rstrip().split(" ")
- if len(split_text) < 3:
- return text, []
- return (" ".join(split_text[:2]), split_text[2:])
- def ack_type(capabilities):
- """Extract the ack type from a capabilities list."""
- if 'multi_ack_detailed' in capabilities:
- return MULTI_ACK_DETAILED
- elif 'multi_ack' in capabilities:
- return MULTI_ACK
- return SINGLE_ACK
|