sapling/eden/cli/systemd.py

#!/usr/bin/env python3
#
# Copyright (c) 2016-present, Facebook, Inc.
# All rights reserved.
#
# This source code is licensed under the BSD-style license found in the
# LICENSE file in the root directory of this source tree. An additional grant
# of patent rights can be found in the PATENTS file in the same directory.

import re
import typing


class SystemdEnvironmentFile:
    """Reader/writer for files in systemd's EnvironmentFile= format.

    Use loads() to parse raw file content into a list of (name, value)
    entries, and dumps() to serialize a mapping of variables into bytes.
    Names and values are handled as bytes throughout.
    """

    # Byte classes shared by entry validation and by the parser.
    _comment_characters = b"#;"
    _escape_characters = b"\\"
    _name_characters = (
        b"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789_"
    )
    _newline_characters = b"\n\r"
    _quote_characters = b"'\""
    _whitespace_characters = b" \t"

    def __init__(self, entries: typing.Sequence[typing.Tuple[bytes, bytes]]) -> None:
        """Store a private copy of the given (name, value) entries."""
        super().__init__()
        self.__entries = list(entries)

    @classmethod
    def loads(cls, content: bytes) -> "SystemdEnvironmentFile":
        """Parse the raw bytes of an environment file.

        Everything from the first NUL byte onwards is ignored; the rest is
        handed to _EnvironmentFileParser.
        """
        content = _truncated_at_null_byte(content)
        entries = _EnvironmentFileParser(content).parse_entries()
        return cls(entries=entries)

    @classmethod
    def dumps(cls, variables: typing.Mapping[bytes, bytes]) -> bytes:
        """Serialize variables as one `name="value"` line per entry.

        Entries are written in the mapping's iteration order. Every entry is
        validated before it is written.

        Raises:
            VariableNameError: if a name is empty or contains a forbidden byte.
            VariableValueError: if a value contains a forbidden control byte.
        """
        output = bytearray()
        for name, value in variables.items():
            cls._validate_entry(name, value)
            output.extend(name)
            output.extend(b"=")
            output.extend(cls.__escape_value(value))
            output.extend(b"\n")
        # The buffer is only a builder; hand callers the immutable bytes
        # object the signature promises rather than the mutable bytearray.
        return bytes(output)

    @staticmethod
    def __escape_value(value: bytes) -> bytes:
        """Wrap value in double quotes, backslash-escaping `\\` and `"`.

        All other bytes (including newlines and tabs) are emitted verbatim
        inside the quotes.
        """
        return (
            b'"'
            + re.sub(b'[\\\\"]', lambda match: b"\\" + match.group(0), value)
            + b'"'
        )

    @classmethod
    def _is_valid_entry(cls, name: bytes, value: bytes) -> bool:
        """Return True if _validate_entry accepts (name, value), else False."""
        try:
            cls._validate_entry(name, value)
            return True
        except (VariableNameError, VariableValueError):
            return False

    @classmethod
    def _validate_entry(cls, name: bytes, value: bytes) -> None:
        """Check that (name, value) may be written to an environment file.

        Names must be non-empty, must not start with a digit, and every byte
        below 0x80 must be one of _name_characters (bytes >= 0x80 are let
        through unchecked). Values may not contain control bytes below 0x20
        other than newline and tab.

        Raises:
            VariableNameError: if the name is rejected.
            VariableValueError: if the value is rejected.
        """
        if not name:
            raise VariableNameError("Variables must have a non-empty name")
        if name[0:1].isdigit():
            raise VariableNameError("Variable names must not begin with a digit")
        # The checks below run from most to least specific so that the error
        # message names the most precise reason for the rejection.
        for c in name:
            if c in cls._whitespace_characters:
                raise VariableNameError("Variable names must not contain whitespace")
            if c in cls._newline_characters:
                raise VariableNameError(
                    "Variable names must not contain any newline characters"
                )
            if c < 0x20:
                raise VariableNameError(
                    "Variable names must not contain any control characters"
                )
            if c < 0x80 and c not in cls._name_characters:
                offending_character = bytes([c]).decode("utf-8")
                raise VariableNameError(
                    f"Variable names must not contain '{offending_character}'"
                )
        for c in value:
            # Carriage return gets its own message; other control bytes
            # (except newline and tab) share the generic one.
            if c in b"\r":
                raise VariableValueError(
                    "Variable values must not contain carriage returns"
                )
            if c < 0x20 and c not in b"\n\t":
                raise VariableValueError(
                    "Variable values must not contain any control characters"
                )

    @property
    def entries(self) -> typing.List[typing.Tuple[bytes, bytes]]:
        """The stored (name, value) entries, in the order they were given."""
        return self.__entries


class VariableNameError(ValueError):
    """Raised when an environment variable name fails validation."""


class VariableValueError(ValueError):
    """Raised when an environment variable value fails validation."""


class _Scanner:
    def __init__(self, input: bytes) -> None:
        super().__init__()
        self.__input = input
        self.__index = 0

    @property
    def at_eof(self) -> bool:
        return self.__index == len(self.__input)

    def scan_one_byte(self) -> int:
        if self.at_eof:
            raise ValueError("Cannot scan past end of file")
        c = self.__input[self.__index]
        self.__index += 1
        return c

    def peek_one_byte(self) -> int:
        if self.at_eof:
            raise ValueError("Cannot peek past end of file")
        return self.__input[self.__index]

    def skip_one_byte(self) -> None:
        if self.at_eof:
            raise ValueError("Cannot skip past end of file")
        self.__index += 1

    def scan_while_any(self, scan_bytes: typing.Sequence[int]) -> bytes:
        return self.__scan_while(lambda c: c in scan_bytes)

    def scan_until_any(self, stop_bytes: typing.Sequence[int]) -> bytes:
        return self.__scan_while(lambda c: c not in stop_bytes)

    def skip_while_any(self, skip_bytes: typing.Sequence[int]) -> None:
        self.__skip_while(lambda c: c in skip_bytes)

    def skip_until_any(self, stop_bytes: typing.Sequence[int]) -> None:
        self.__skip_while(lambda c: c not in stop_bytes)

    def __scan_while(self, scan_predicate: typing.Callable[[int], bool]) -> bytes:
        begin_index = self.__index
        while not self.at_eof:
            if not scan_predicate(self.__input[self.__index]):
                break
            self.__index += 1
        end_index = self.__index
        return self.__input[begin_index:end_index]

    def __skip_while(self, skip_predicate: typing.Callable[[int], bool]) -> None:
        while not self.at_eof:
            if not skip_predicate(self.__input[self.__index]):
                break
            self.__index += 1


class _EnvironmentFileParser(_Scanner):
    """Parser for environment file content, built on the _Scanner cursor.

    parse_entries() is the entry point. Every other method consumes one
    syntactic element starting at the scanner's current position.
    """

    # Byte classes, taken from SystemdEnvironmentFile so that parsing and
    # validation agree on them.
    comment_characters = SystemdEnvironmentFile._comment_characters
    escape_characters = SystemdEnvironmentFile._escape_characters
    newline_characters = SystemdEnvironmentFile._newline_characters
    quote_characters = SystemdEnvironmentFile._quote_characters
    whitespace_characters = SystemdEnvironmentFile._whitespace_characters

    def parse_entries(self) -> typing.List[typing.Tuple[bytes, bytes]]:
        """Parse until end of input and return every (name, value) found.

        Positions where parse_entry() returns None (comments, blank lines,
        malformed or invalid entries) contribute nothing to the result.
        """
        entries = []
        while not self.at_eof:
            entry = self.parse_entry()
            if entry is not None:
                entries.append(entry)
        return entries

    def parse_entry(self) -> typing.Optional[typing.Tuple[bytes, bytes]]:
        """Consume one line-level element and return its entry, if any.

        Returns None when only whitespace remained, when a comment or a
        single newline byte was consumed, when the line had no "=", or when
        the parsed entry fails SystemdEnvironmentFile._is_valid_entry().
        """
        self.skip_whitespace()
        if self.at_eof:
            return None
        c = self.peek_one_byte()
        if c in self.comment_characters:
            self.parse_comment()
            return None
        elif c in self.newline_characters:
            # Blank line: consume just this one newline byte.
            self.skip_one_byte()
            return None

        name = self.parse_entry_name_and_equal_sign()
        if name is None:
            return None
        self.skip_whitespace()
        value = self.parse_entry_value()
        # Invalid entries are dropped silently rather than raised.
        if not SystemdEnvironmentFile._is_valid_entry(name, value):
            return None
        return (name, value)

    def parse_entry_name_and_equal_sign(self) -> typing.Optional[bytes]:
        """Consume a variable name and the "=" that follows it.

        Returns the name with trailing whitespace stripped, or None if end of
        input or a newline is reached before any "=" (the newline, if any, is
        consumed).
        """
        # The first byte is taken unconditionally, so it becomes part of the
        # name even if it is "=".
        name = bytearray([self.scan_one_byte()])
        name.extend(self.scan_until_any(b"=" + self.newline_characters))
        if self.at_eof:
            return None
        c = self.scan_one_byte()
        if c in self.newline_characters:
            return None
        # scan_until_any stopped on "=" or a newline; newline was ruled out.
        assert c == b"="[0]
        return bytes(name.rstrip(self.whitespace_characters))

    def parse_entry_value(self) -> bytes:
        """Consume a value: any leading quoted segments, then unquoted text.

        Both parts are appended to the same buffer, so they are concatenated
        in the returned value.
        """
        value = bytearray()
        self.parse_quoted_entry_value(out_value=value)
        self.parse_unquoted_entry_value(out_value=value)
        return bytes(value)

    def parse_quoted_entry_value(self, out_value: bytearray) -> None:
        """Consume zero or more consecutive quoted segments into out_value.

        Returns as soon as the next byte is not a quote character, or when
        end of input is hit (even in the middle of a quoted segment, in which
        case whatever was read so far is kept).
        """
        while not self.at_eof:
            c = self.peek_one_byte()
            if c not in self.quote_characters:
                return
            # Only the same kind of quote that opened the segment closes it.
            terminating_quote_characters = bytes([c])

            self.skip_one_byte()

            while not self.at_eof:
                scanned = self.scan_until_any(
                    self.escape_characters + terminating_quote_characters
                )
                out_value.extend(scanned)
                if self.at_eof:
                    return

                c = self.scan_one_byte()
                if c in self.escape_characters:
                    if self.at_eof:
                        return
                    # The escaped byte is kept literally, except that an
                    # escaped newline byte is dropped along with the escape.
                    c = self.scan_one_byte()
                    if c not in self.newline_characters:
                        out_value.append(c)
                elif c in terminating_quote_characters:
                    break
                else:
                    raise AssertionError()

            # Whitespace after a closing quote is discarded; the outer loop
            # then checks for another quoted segment.
            self.skip_whitespace()

    def parse_unquoted_entry_value(self, out_value: bytearray) -> None:
        """Consume unquoted value text up to end of line into out_value.

        Interior whitespace is kept; whitespace that is followed by a newline
        or end of input is dropped.
        """
        while not self.at_eof:
            scanned = self.scan_until_any(
                self.escape_characters
                + self.newline_characters
                + self.whitespace_characters
            )
            out_value.extend(scanned)
            if self.at_eof:
                return

            c = self.scan_one_byte()
            if c in self.escape_characters:
                if self.at_eof:
                    return
                # Same escape rule as in quoted segments: keep the escaped
                # byte unless it is a newline byte.
                c = self.scan_one_byte()
                if c not in self.newline_characters:
                    out_value.append(c)
            elif c in self.newline_characters:
                # Unescaped newline ends the value (and has been consumed).
                return
            elif c in self.whitespace_characters:
                scanned = self.scan_while_any(self.whitespace_characters)
                is_trailing_whitespace = (
                    self.at_eof or self.peek_one_byte() in self.newline_characters
                )
                if is_trailing_whitespace:
                    # The newline is only peeked at here, so it is left
                    # unconsumed for the caller.
                    return
                # Interior whitespace: keep the first byte and the rest of
                # the run.
                out_value.append(c)
                out_value.extend(scanned)
            else:
                raise AssertionError()

    def parse_comment(self) -> None:
        """Consume a comment, through the newline that ends it (if any).

        The byte following an escape character is skipped unconditionally,
        so an escaped newline does not terminate the comment.
        """
        c = self.scan_one_byte()
        assert c in self.comment_characters
        while not self.at_eof:
            self.skip_until_any(self.escape_characters + self.newline_characters)
            if self.at_eof:
                break
            c = self.scan_one_byte()
            if c in self.escape_characters:
                if self.at_eof:
                    break
                self.skip_one_byte()
            elif c in self.newline_characters:
                break
            else:
                raise AssertionError()

    def skip_whitespace(self) -> None:
        """Consume any run of whitespace_characters (not newlines)."""
        self.skip_while_any(self.whitespace_characters)


def _truncated_at_null_byte(data: bytes) -> bytes:
    end_of_file_index = data.find(b"\x00")
    if end_of_file_index == -1:
        return data
    return data[:end_of_file_index]
Add systemd EnvironmentFile reader/writer

Summary: EdenFS' systemd service will be configurable using config files. The Eden CLI will communicate information, such as extra daemon arguments, to systemd using a file specified using EnvironmentFile= [1]. Write code to serialize and deserialize these files.

The code introduced by this diff isn't used yet, but it will be used in future diffs.

[1] https://www.freedesktop.org/software/systemd/man/systemd.exec.html#EnvironmentFile=

Reviewed By: chadaustin

Differential Revision: D12066543

fbshipit-source-id: 28ba38d823b92f7a3a7ad97c416120a7f95be122

2018-11-16 22:11:08 +03:00
			`#!/usr/bin/env python3`
			`#`
			`# Copyright (c) 2016-present, Facebook, Inc.`
			`# All rights reserved.`
			`#`
			`# This source code is licensed under the BSD-style license found in the`
			`# LICENSE file in the root directory of this source tree. An additional grant`
			`# of patent rights can be found in the PATENTS file in the same directory.`

			`import re`
			`import typing`


			`class SystemdEnvironmentFile:`
			`_comment_characters = b"#;"`
			`_escape_characters = b"\\"`
			`_name_characters = (`
			`b"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789_"`
			`)`
			`_newline_characters = b"\n\r"`
			`_quote_characters = b"'\""`
			`_whitespace_characters = b" \t"`

			`def __init__(self, entries: typing.Sequence[typing.Tuple[bytes, bytes]]) -> None:`
			`super().__init__()`
			`self.__entries = list(entries)`

			`@classmethod`
			`def loads(cls, content: bytes) -> "SystemdEnvironmentFile":`
			`content = _truncated_at_null_byte(content)`
			`entries = _EnvironmentFileParser(content).parse_entries()`
			`return cls(entries=entries)`

			`@classmethod`
			`def dumps(cls, variables: typing.Mapping[bytes, bytes]) -> bytes:`
			`output = bytearray()`
			`for name, value in variables.items():`
			`cls._validate_entry(name, value)`
			`output.extend(name)`
			`output.extend(b"=")`
			`output.extend(cls.__escape_value(value))`
			`output.extend(b"\n")`
			`return output`

			`@staticmethod`
			`def __escape_value(value: bytes) -> bytes:`
			`return (`
			`b'"'`
			`+ re.sub(b'[\\\\"]', lambda match: b"\\" + match.group(0), value)`
			`+ b'"'`
			`)`

			`@classmethod`
			`def _is_valid_entry(cls, name: bytes, value: bytes) -> bool:`
			`try:`
			`cls._validate_entry(name, value)`
			`return True`
			`except (VariableNameError, VariableValueError):`
			`return False`

			`@classmethod`
			`def _validate_entry(cls, name: bytes, value: bytes) -> None:`
			`if not name:`
			`raise VariableNameError("Variables must have a non-empty name")`
			`if name[0:1].isdigit():`
			`raise VariableNameError("Variable names must not begin with a digit")`
			`for c in name:`
			`if c in cls._whitespace_characters:`
			`raise VariableNameError("Variable names must not contain whitespace")`
			`if c in cls._newline_characters:`
			`raise VariableNameError(`
			`"Variable names must not contain any newline characters"`
			`)`
			`if c < 0x20:`
			`raise VariableNameError(`
			`f"Variable names must not contain any control characters"`
			`)`
			`if c < 0x80 and c not in cls._name_characters:`
			`offending_character = bytes([c]).decode("utf-8")`
			`raise VariableNameError(`
			`f"Variable names must not contain '{offending_character}'"`
			`)`
			`for c in value:`
			`if c in b"\r":`
			`raise VariableValueError(`
			`"Variable values must not contain carriage returns"`
			`)`
			`if c < 0x20 and c not in b"\n\t":`
			`raise VariableValueError(`
			`"Variable values must not contain any control characters"`
			`)`

			`@property`
			`def entries(self) -> typing.List[typing.Tuple[bytes, bytes]]:`
			`return self.__entries`


			`class VariableNameError(ValueError):`
			`pass`


			`class VariableValueError(ValueError):`
			`pass`


			`class _Scanner:`
			`def __init__(self, input: bytes) -> None:`
			`super().__init__()`
			`self.__input = input`
			`self.__index = 0`

			`@property`
			`def at_eof(self) -> bool:`
			`return self.__index == len(self.__input)`

			`def scan_one_byte(self) -> int:`
			`if self.at_eof:`
			`raise ValueError("Cannot scan past end of file")`
			`c = self.__input[self.__index]`
			`self.__index += 1`
			`return c`

			`def peek_one_byte(self) -> int:`
			`if self.at_eof:`
			`raise ValueError("Cannot peek past end of file")`
			`return self.__input[self.__index]`

			`def skip_one_byte(self) -> None:`
			`if self.at_eof:`
			`raise ValueError("Cannot skip past end of file")`
			`self.__index += 1`

			`def scan_while_any(self, scan_bytes: typing.Sequence[int]) -> bytes:`
			`return self.__scan_while(lambda c: c in scan_bytes)`

			`def scan_until_any(self, stop_bytes: typing.Sequence[int]) -> bytes:`
			`return self.__scan_while(lambda c: c not in stop_bytes)`

			`def skip_while_any(self, skip_bytes: typing.Sequence[int]) -> None:`
			`self.__skip_while(lambda c: c in skip_bytes)`

			`def skip_until_any(self, stop_bytes: typing.Sequence[int]) -> None:`
			`self.__skip_while(lambda c: c not in stop_bytes)`

			`def __scan_while(self, scan_predicate: typing.Callable[[int], bool]) -> bytes:`
			`begin_index = self.__index`
			`while not self.at_eof:`
			`if not scan_predicate(self.__input[self.__index]):`
			`break`
			`self.__index += 1`
			`end_index = self.__index`
			`return self.__input[begin_index:end_index]`

			`def __skip_while(self, skip_predicate: typing.Callable[[int], bool]) -> None:`
			`while not self.at_eof:`
			`if not skip_predicate(self.__input[self.__index]):`
			`break`
			`self.__index += 1`


			`class _EnvironmentFileParser(_Scanner):`
			`comment_characters = SystemdEnvironmentFile._comment_characters`
			`escape_characters = SystemdEnvironmentFile._escape_characters`
			`newline_characters = SystemdEnvironmentFile._newline_characters`
			`quote_characters = SystemdEnvironmentFile._quote_characters`
			`whitespace_characters = SystemdEnvironmentFile._whitespace_characters`

			`def parse_entries(self) -> typing.List[typing.Tuple[bytes, bytes]]:`
			`entries = []`
			`while not self.at_eof:`
			`entry = self.parse_entry()`
			`if entry is not None:`
			`entries.append(entry)`
			`return entries`

			`def parse_entry(self) -> typing.Optional[typing.Tuple[bytes, bytes]]:`
			`self.skip_whitespace()`
			`if self.at_eof:`
			`return None`
			`c = self.peek_one_byte()`
			`if c in self.comment_characters:`
			`self.parse_comment()`
			`return None`
			`elif c in self.newline_characters:`
			`self.skip_one_byte()`
			`return None`

			`name = self.parse_entry_name_and_equal_sign()`
			`if name is None:`
			`return None`
			`self.skip_whitespace()`
			`value = self.parse_entry_value()`
			`if not SystemdEnvironmentFile._is_valid_entry(name, value):`
			`return None`
			`return (name, value)`

			`def parse_entry_name_and_equal_sign(self) -> typing.Optional[bytes]:`
			`name = bytearray([self.scan_one_byte()])`
			`name.extend(self.scan_until_any(b"=" + self.newline_characters))`
			`if self.at_eof:`
			`return None`
			`c = self.scan_one_byte()`
			`if c in self.newline_characters:`
			`return None`
			`assert c == b"="[0]`
			`return bytes(name.rstrip(self.whitespace_characters))`

			`def parse_entry_value(self) -> bytes:`
			`value = bytearray()`
			`self.parse_quoted_entry_value(out_value=value)`
			`self.parse_unquoted_entry_value(out_value=value)`
			`return bytes(value)`

			`def parse_quoted_entry_value(self, out_value: bytearray) -> None:`
			`while not self.at_eof:`
			`c = self.peek_one_byte()`
			`if c not in self.quote_characters:`
			`return`
			`terminating_quote_characters = bytes([c])`

			`self.skip_one_byte()`

			`while not self.at_eof:`
			`scanned = self.scan_until_any(`
			`self.escape_characters + terminating_quote_characters`
			`)`
			`out_value.extend(scanned)`
			`if self.at_eof:`
			`return`

			`c = self.scan_one_byte()`
			`if c in self.escape_characters:`
			`if self.at_eof:`
			`return`
			`c = self.scan_one_byte()`
			`if c not in self.newline_characters:`
			`out_value.append(c)`
			`elif c in terminating_quote_characters:`
			`break`
			`else:`
			`raise AssertionError()`

			`self.skip_whitespace()`

			`def parse_unquoted_entry_value(self, out_value: bytearray) -> None:`
			`while not self.at_eof:`
			`scanned = self.scan_until_any(`
			`self.escape_characters`
			`+ self.newline_characters`
			`+ self.whitespace_characters`
			`)`
			`out_value.extend(scanned)`
			`if self.at_eof:`
			`return`

			`c = self.scan_one_byte()`
			`if c in self.escape_characters:`
			`if self.at_eof:`
			`return`
			`c = self.scan_one_byte()`
			`if c not in self.newline_characters:`
			`out_value.append(c)`
			`elif c in self.newline_characters:`
			`return`
			`elif c in self.whitespace_characters:`
			`scanned = self.scan_while_any(self.whitespace_characters)`
			`is_trailing_whitespace = (`
			`self.at_eof or self.peek_one_byte() in self.newline_characters`
			`)`
			`if is_trailing_whitespace:`
			`return`
			`out_value.append(c)`
			`out_value.extend(scanned)`
			`else:`
			`raise AssertionError()`

			`def parse_comment(self) -> None:`
			`c = self.scan_one_byte()`
			`assert c in self.comment_characters`
			`while not self.at_eof:`
			`self.skip_until_any(self.escape_characters + self.newline_characters)`
			`if self.at_eof:`
			`break`
			`c = self.scan_one_byte()`
			`if c in self.escape_characters:`
			`if self.at_eof:`
			`break`
			`self.skip_one_byte()`
			`elif c in self.newline_characters:`
			`break`
			`else:`
			`raise AssertionError()`

			`def skip_whitespace(self) -> None:`
			`self.skip_while_any(self.whitespace_characters)`


			`def _truncated_at_null_byte(data: bytes) -> bytes:`
			`end_of_file_index = data.find(b"\x00")`
			`if end_of_file_index == -1:`
			`return data`
			`return data[:end_of_file_index]`