sapling/eden/scm/edenscm/mercurial/sshpeer.py

391 lines
12 KiB
Python
Raw Normal View History

# Portions Copyright (c) Facebook, Inc. and its affiliates.
#
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2.
# sshpeer.py - ssh repository proxy class for mercurial
#
2006-08-12 23:30:02 +04:00
# Copyright 2005, 2006 Matt Mackall <mpm@selenic.com>
#
# This software may be used and distributed according to the terms of the
2010-01-20 07:20:08 +03:00
# GNU General Public License version 2 or any later version.
2015-08-09 05:55:01 +03:00
from __future__ import absolute_import
import re
import threading
from typing import Any
2015-08-09 05:55:01 +03:00
from . import error, progress, pycompat, util, wireproto
2015-08-09 05:55:01 +03:00
from .i18n import _
from .pycompat import decodeutf8, encodeutf8
# Record of the bytes sent and received to SSH peers. This records the
# cumulative total bytes sent to all peers for the life of the process.
_totalbytessent = 0
_totalbytesreceived = 0
2011-11-26 03:10:31 +04:00
def _serverquote(s):
if not s:
return s
"""quote a string for the remote shell ... which we assume is sh"""
if re.match("[a-zA-Z0-9@%_+=:,./-]*$", s):
return s
2011-11-26 03:10:31 +04:00
return "'%s'" % s.replace("'", "'\\''")
def _writessherror(ui, s):
# type: (Any, bytes) -> None
if s and not ui.quiet:
for l in s.splitlines():
if l.startswith(b"ssh:"):
prefix = ""
else:
prefix = _("remote: ")
ui.write_err(prefix, decodeutf8(l, errors="replace"), "\n")
class countingpipe(object):
"""Wraps a pipe that count the number of bytes read/written to it
"""
def __init__(self, ui, pipe):
self._ui = ui
self._pipe = pipe
self._totalbytes = 0
def write(self, data):
assert isinstance(data, bytes)
self._totalbytes += len(data)
self._ui.metrics.gauge("ssh_write_bytes", len(data))
return self._pipe.write(data)
def read(self, size):
# type: (int) -> bytes
r = self._pipe.read(size)
bufs = [r]
# In Python 3 _pipe is a FileIO and is not guaranteed to return size
# bytes. So let's loop until we get the bytes, or we get 0 bytes,
# indicating the end of the pipe.
if len(r) < size:
totalread = len(r)
while totalread < size and len(r) != 0:
r = self._pipe.read(size - totalread)
totalread += len(r)
bufs.append(r)
r = b"".join(bufs)
self._totalbytes += len(r)
self._ui.metrics.gauge("ssh_read_bytes", len(r))
return r
def readline(self):
r = self._pipe.readline()
self._totalbytes += len(r)
self._ui.metrics.gauge("ssh_read_bytes", len(r))
return r
def close(self):
return self._pipe.close()
def flush(self):
return self._pipe.flush()
class threadedstderr(object):
def __init__(self, ui, stderr):
self._ui = ui
self._stderr = stderr
self._stop = False
self._thread = None
def start(self):
# type: () -> None
thread = threading.Thread(target=self.run)
thread.daemon = True
thread.start()
self._thread = thread
def run(self):
# type: () -> None
while not self._stop:
buf = self._stderr.readline()
if len(buf) == 0:
break
_writessherror(self._ui, buf)
def close(self):
# type: () -> None
self._stop = True
def join(self, timeout):
if self._thread:
self._thread.join(timeout)
class sshpeer(wireproto.wirepeer):
def __init__(self, ui, path, create=False):
self._url = path
self._ui = ui
self._pipeo = self._pipei = self._pipee = None
u = util.url(path, parsequery=False, parsefragment=False)
if u.scheme != "ssh" or not u.host or u.path is None:
2010-07-15 02:07:13 +04:00
self._abort(error.RepoError(_("couldn't parse location %s") % path))
util.checksafessh(path)
if u.passwd is not None:
self._abort(error.RepoError(_("password in URL not supported")))
self._user = u.user
self._host = u.host
self._port = u.port
self._path = u.path or "."
codemod: register core configitems using a script This is done by a script [2] using RedBaron [1], a tool designed for doing code refactoring. All "default" values are decided by the script and are strongly consistent with the existing code. There are 2 changes done manually to fix tests: [warn] mercurial/exchange.py: experimental.bundle2-output-capture: default needs manual removal [warn] mercurial/localrepo.py: experimental.hook-track-tags: default needs manual removal Since RedBaron is not confident about how to indent things [2]. [1]: https://github.com/PyCQA/redbaron [2]: https://github.com/PyCQA/redbaron/issues/100 [3]: #!/usr/bin/env python # codemod_configitems.py - codemod tool to fill configitems # # Copyright 2017 Facebook, Inc. # # This software may be used and distributed according to the terms of the # GNU General Public License version 2 or any later version. from __future__ import absolute_import, print_function import os import sys import redbaron def readpath(path): with open(path) as f: return f.read() def writepath(path, content): with open(path, 'w') as f: f.write(content) _configmethods = {'config', 'configbool', 'configint', 'configbytes', 'configlist', 'configdate'} def extractstring(rnode): """get the string from a RedBaron string or call_argument node""" while rnode.type != 'string': rnode = rnode.value return rnode.value[1:-1] # unquote, "'str'" -> "str" def uiconfigitems(red): """match *.ui.config* pattern, yield (node, method, args, section, name)""" for node in red.find_all('atomtrailers'): entry = None try: obj = node[-3].value method = node[-2].value args = node[-1] section = args[0].value name = args[1].value if (obj in ('ui', 'self') and method in _configmethods and section.type == 'string' and name.type == 'string'): entry = (node, method, args, extractstring(section), extractstring(name)) except Exception: pass else: if entry: yield entry def coreconfigitems(red): """match coreconfigitem(...) pattern, yield (node, args, section, name)""" for node in red.find_all('atomtrailers'): entry = None try: args = node[1] section = args[0].value name = args[1].value if (node[0].value == 'coreconfigitem' and section.type == 'string' and name.type == 'string'): entry = (node, args, extractstring(section), extractstring(name)) except Exception: pass else: if entry: yield entry def registercoreconfig(cfgred, section, name, defaultrepr): """insert coreconfigitem to cfgred AST section and name are plain string, defaultrepr is a string """ # find a place to insert the "coreconfigitem" item entries = list(coreconfigitems(cfgred)) for node, args, nodesection, nodename in reversed(entries): if (nodesection, nodename) < (section, name): # insert after this entry node.insert_after( 'coreconfigitem(%r, %r,\n' ' default=%s,\n' ')' % (section, name, defaultrepr)) return def main(argv): if not argv: print('Usage: codemod_configitems.py FILES\n' 'For example, FILES could be "{hgext,mercurial}/*/**.py"') dirname = os.path.dirname reporoot = dirname(dirname(dirname(os.path.abspath(__file__)))) # register configitems to this destination cfgpath = os.path.join(reporoot, 'mercurial', 'configitems.py') cfgred = redbaron.RedBaron(readpath(cfgpath)) # state about what to do registered = set((s, n) for n, a, s, n in coreconfigitems(cfgred)) toregister = {} # {(section, name): defaultrepr} coreconfigs = set() # {(section, name)}, whether it's used in core # first loop: scan all files before taking any action for i, path in enumerate(argv): print('(%d/%d) scanning %s' % (i + 1, len(argv), path)) iscore = ('mercurial' in path) and ('hgext' not in path) red = redbaron.RedBaron(readpath(path)) # find all repo.ui.config* and ui.config* calls, and collect their # section, name and default value information. for node, method, args, section, name in uiconfigitems(red): if section == 'web': # [web] section has some weirdness, ignore them for now continue defaultrepr = None key = (section, name) if len(args) == 2: if key in registered: continue if method == 'configlist': defaultrepr = 'list' elif method == 'configbool': defaultrepr = 'False' else: defaultrepr = 'None' elif len(args) >= 3 and (args[2].target is None or args[2].target.value == 'default'): # try to understand the "default" value dnode = args[2].value if dnode.type == 'name': if dnode.value in {'None', 'True', 'False'}: defaultrepr = dnode.value elif dnode.type == 'string': defaultrepr = repr(dnode.value[1:-1]) elif dnode.type in ('int', 'float'): defaultrepr = dnode.value # inconsistent default if key in toregister and toregister[key] != defaultrepr: defaultrepr = None # interesting to rewrite if key not in registered: if defaultrepr is None: print('[note] %s: %s.%s: unsupported default' % (path, section, name)) registered.add(key) # skip checking it again else: toregister[key] = defaultrepr if iscore: coreconfigs.add(key) # second loop: rewrite files given "toregister" result for path in argv: # reconstruct redbaron - trade CPU for memory red = redbaron.RedBaron(readpath(path)) changed = False for node, method, args, section, name in uiconfigitems(red): key = (section, name) defaultrepr = toregister.get(key) if defaultrepr is None or key not in coreconfigs: continue if len(args) >= 3 and (args[2].target is None or args[2].target.value == 'default'): try: del args[2] changed = True except Exception: # redbaron fails to do the rewrite due to indentation # see https://github.com/PyCQA/redbaron/issues/100 print('[warn] %s: %s.%s: default needs manual removal' % (path, section, name)) if key not in registered: print('registering %s.%s' % (section, name)) registercoreconfig(cfgred, section, name, defaultrepr) registered.add(key) if changed: print('updating %s' % path) writepath(path, red.dumps()) if toregister: print('updating configitems.py') writepath(cfgpath, cfgred.dumps()) if __name__ == "__main__": sys.exit(main(sys.argv[1:]))
2017-07-15 00:22:40 +03:00
sshcmd = self.ui.config("ui", "ssh")
remotecmd = self.ui.config("ui", "remotecmd")
sshaddenv = dict(self.ui.configitems("sshenv"))
sshenv = util.shellenviron(sshaddenv)
args = util.sshargs(sshcmd, self._host, self._user, self._port)
if create:
cmd = "%s %s %s" % (
sshcmd,
args,
util.shellquote(
"%s init %s" % (_serverquote(remotecmd), _serverquote(self._path))
),
)
ui.debug("running %s\n" % cmd)
res = ui.system(cmd, blockedtag="sshpeer", environ=sshenv)
if res != 0:
2010-07-15 02:07:13 +04:00
self._abort(error.RepoError(_("could not create remote repo")))
with self.ui.timeblockedsection("sshsetup"), progress.suspend():
self._validaterepo(sshcmd, args, remotecmd, sshenv)
# Begin of _basepeer interface.
@util.propertycache
def ui(self):
return self._ui
def url(self):
return self._url
def local(self):
return None
def peer(self):
return self
def canpush(self):
return True
def close(self):
pass
# End of _basepeer interface.
# Begin of _basewirecommands interface.
def capabilities(self):
return self._caps
# End of _basewirecommands interface.
def _validaterepo(self, sshcmd, args, remotecmd, sshenv=None):
# cleanup up previous run
self._cleanup()
cmd = "%s %s %s" % (
sshcmd,
args,
util.shellquote(
"%s -R %s serve --stdio"
% (_serverquote(remotecmd), _serverquote(self._path))
),
)
self.ui.debug("running %s\n" % cmd)
2011-11-26 03:10:31 +04:00
cmd = util.quotecommand(cmd)
# while self._subprocess isn't used, having it allows the subprocess to
# to clean up correctly later
sub = util.popen4(cmd, bufsize=0, env=sshenv)
pipeo, pipei, pipee, self._subprocess = sub
self._pipee = threadedstderr(self.ui, pipee)
self._pipee.start()
self._pipei = countingpipe(self.ui, pipei)
self._pipeo = countingpipe(self.ui, pipeo)
self.ui.metrics.gauge("ssh_connections")
def badresponse(errortext):
msg = _("no suitable response from remote hg")
if errortext:
msg += ": '%s'" % errortext
hint = self.ui.config("ui", "ssherrorhint")
self._abort(error.RepoError(msg, hint=hint))
try:
# skip any noise generated by remote shell
self._callstream("hello")
r = self._callstream("between", pairs=("%s-%s" % ("0" * 40, "0" * 40)))
except IOError as ex:
badresponse(str(ex))
lines = ["", "dummy"]
max_noise = 500
while lines[-1] and max_noise:
try:
l = decodeutf8(r.readline())
if lines[-1] == "1\n" and l == "\n":
break
if l:
self.ui.debug("remote: ", l)
lines.append(l)
max_noise -= 1
except IOError as ex:
badresponse(str(ex))
else:
badresponse("".join(lines[2:]))
self._caps = set()
2009-04-27 01:50:44 +04:00
for l in reversed(lines):
if l.startswith("capabilities:"):
self._caps.update(l[:-1].split(":")[1].split())
break
def _abort(self, exception):
self._cleanup()
raise exception
def _cleanup(self):
global _totalbytessent, _totalbytesreceived
if self._pipeo is None:
return
self._pipeo.close()
self._pipei.close()
_totalbytessent += self._pipeo._totalbytes
_totalbytesreceived += self._pipei._totalbytes
self.ui.log(
"sshbytes",
"",
sshbytessent=_totalbytessent,
sshbytesreceived=_totalbytesreceived,
)
self._pipee.close()
if util.istest():
# Let's give the thread a bit of time to complete, in the case
# where the pipe is somehow still open, the read call will block on it
# forever. In this case, there isn't anything to read anyway, so
# waiting more would just cause Mercurial to hang.
self._pipee.join(1)
__del__ = _cleanup
def _submitbatch(self, req):
rsp = self._callstream("batch", cmds=wireproto.encodebatchcmds(req))
available = self._getamount()
# TODO this response parsing is probably suboptimal for large
# batches with large responses.
toread = min(available, 1024)
work = rsp.read(toread)
available -= toread
chunk = work
while chunk:
while b";" in work:
one, work = work.split(b";", 1)
yield wireproto.unescapearg(one)
toread = min(available, 1024)
chunk = rsp.read(toread)
available -= toread
work += chunk
yield wireproto.unescapearg(work)
def _callstream(self, cmd, **args):
args = pycompat.byteskwargs(args)
self.ui.debug("sending %s command\n" % cmd)
self._pipeo.write(encodeutf8("%s\n" % cmd))
_func, names = wireproto.commands[cmd]
keys = names.split()
wireargs = {}
for k in keys:
if k == "*":
wireargs["*"] = args
break
else:
wireargs[k] = args[k]
del args[k]
for k, v in sorted(pycompat.iteritems(wireargs)):
self._pipeo.write(encodeutf8("%s %d\n" % (k, len(v))))
if isinstance(v, dict):
for dk, dv in pycompat.iteritems(v):
self._pipeo.write(encodeutf8("%s %d\n" % (dk, len(dv))))
self._pipeo.write(encodeutf8(dv))
else:
self._pipeo.write(encodeutf8(v))
self._pipeo.flush()
return self._pipei
def _callcompressable(self, cmd, **args):
return self._callstream(cmd, **args)
def _call(self, cmd, **args):
self._callstream(cmd, **args)
return self._recv()
def _callpush(self, cmd, fp, **args):
r = self._call(cmd, **args)
if r:
return b"", r
for d in iter(lambda: fp.read(4096), b""):
self._send(d)
self._send(b"", flush=True)
r = self._recv()
if r:
return b"", r
return self._recv(), b""
def _calltwowaystream(self, cmd, fp, **args):
r = self._call(cmd, **args)
if r:
# XXX needs to be made better
raise error.Abort(_("unexpected remote reply: %s") % r)
for d in iter(lambda: fp.read(4096), ""):
self._send(d)
self._send("", flush=True)
return self._pipei
def _getamount(self):
l = self._pipei.readline()
if l == "\n":
msg = _("check previous remote output")
self._abort(error.OutOfBandError(hint=msg))
try:
return int(l)
2011-04-23 01:51:25 +04:00
except ValueError:
2010-07-15 02:07:13 +04:00
self._abort(error.ResponseError(_("unexpected response:"), l))
def _recv(self):
return self._pipei.read(self._getamount())
def _send(self, data, flush=False):
self._pipeo.write("%d\n" % len(data))
if data:
self._pipeo.write(data)
if flush:
self._pipeo.flush()
instance = sshpeer