2022-01-04 10:04:20 +01:00
|
|
|
from enum import Enum, auto
|
|
|
|
from typing import (
|
|
|
|
Any,
|
|
|
|
Iterator,
|
|
|
|
NamedTuple,
|
|
|
|
Optional,
|
|
|
|
List,
|
|
|
|
NoReturn,
|
|
|
|
Type,
|
|
|
|
Union,
|
|
|
|
)
|
2022-01-13 17:45:16 +01:00
|
|
|
from httpie.cli.constants import OPEN_BRACKET, CLOSE_BRACKET, BACKSLASH, HIGHLIGHTER
|
2022-01-04 10:04:20 +01:00
|
|
|
|
|
|
|
|
|
|
|
class HTTPieSyntaxError(ValueError):
    """Error raised for a nested JSON key that cannot be parsed or applied.

    The constructor stores its arguments unchanged as attributes:
    ``source`` is the text the error refers to, ``token`` (optional) supplies
    the ``start``/``end`` offsets to underline, ``message`` is the
    description, and ``message_kind`` is the word placed before ``Error`` in
    the rendered header.
    """

    def __init__(
        self,
        source: str,
        token: Optional['Token'],
        message: str,
        message_kind: str = 'Syntax',
    ) -> None:
        self.message_kind = message_kind
        self.message = message
        self.token = token
        self.source = source

    def __str__(self):
        """Render the header line, plus the underlined source if a token is set."""
        header = f'HTTPie {self.message_kind} Error: {self.message}'
        token = self.token
        if token is None:
            return header

        # Pad with spaces up to the token start, then underline its span.
        marker = ' ' * (token.start) + HIGHLIGHTER * (token.end - token.start)
        return '\n'.join([header, self.source, marker])
|
|
|
|
|
|
|
|
|
|
|
|
class TokenKind(Enum):
    """Kinds of token produced when tokenizing a nested JSON key."""

    TEXT = auto()
    NUMBER = auto()
    LEFT_BRACKET = auto()
    RIGHT_BRACKET = auto()

    def to_name(self) -> str:
        """Return a human-readable name for this kind.

        A kind registered as a value in ``OPERATORS`` is shown as the repr
        of its operator key; any other kind is shown as ``'a '`` followed by
        the lower-cased member name.
        """
        for symbol, operator_kind in OPERATORS.items():
            if operator_kind is self:
                return repr(symbol)
        return f'a {self.name.lower()}'
|
|
|
|
|
|
|
|
|
2022-01-13 17:45:16 +01:00
|
|
|
# Operator strings recognised by the tokenizer, mapped to the kind of token
# each one produces.
OPERATORS = {
    OPEN_BRACKET: TokenKind.LEFT_BRACKET,
    CLOSE_BRACKET: TokenKind.RIGHT_BRACKET,
}
# Characters a preceding backslash escapes: every operator plus the backslash
# itself.
SPECIAL_CHARS = {*OPERATORS, BACKSLASH}
|
2022-01-04 10:04:20 +01:00
|
|
|
|
|
|
|
|
|
|
|
class Token(NamedTuple):
    """A single token of a nested JSON key together with its source span."""

    # Category of the token.
    kind: TokenKind
    # Token content: a string, or an int when the tokenizer parsed a number.
    value: Union[str, int]
    # Offset in the source where the token begins.
    start: int
    # Offset just past the token; ``end - start`` is the highlighted width.
    end: int
|
|
|
|
|
|
|
|
|
|
|
|
def assert_cant_happen() -> NoReturn:
    """Always raise ``ValueError``; marks branches that should be unreachable."""
    unexpected = ValueError('Unexpected value')
    raise unexpected
|
|
|
|
|
|
|
|
|
|
|
|
def check_escaped_int(value: str) -> str:
    """Return ``value`` without its first character if it is an escaped int.

    ``value`` qualifies when it starts with ``BACKSLASH`` and the remainder
    is accepted by ``int()``. The remainder is returned as a string, not
    converted.

    Raises:
        ValueError: if ``value`` does not start with ``BACKSLASH`` or the
            remainder is not accepted by ``int()``.
    """
    if not value.startswith(BACKSLASH):
        raise ValueError('Not an escaped int')

    unescaped = value[1:]
    try:
        # Only used as a validity check; the numeric result is discarded.
        int(unescaped)
    except ValueError as exc:
        raise ValueError('Not an escaped int') from exc
    return unescaped
|
2022-01-04 10:04:20 +01:00
|
|
|
|
|
|
|
|
|
|
|
def tokenize(source: str) -> Iterator[Token]:
    """Split a nested JSON key into ``Token`` objects.

    Every character found in ``OPERATORS`` becomes its own token. The text
    between operators is buffered and emitted as one token:

    * if no escape was consumed and ``int()`` accepts the text, a ``NUMBER``
      token holding the integer;
    * if no escape was consumed and the text is an escaped int (see
      ``check_escaped_int``), a ``TEXT`` token without the leading backslash;
    * otherwise a ``TEXT`` token with the buffered text.

    A backslash followed by a character in ``SPECIAL_CHARS`` is dropped and
    the following character is taken literally. A backslash followed by any
    other character is kept along with that character. A backslash that is
    the last character of ``source`` is kept as literal text. Previously that
    case read past the end of the string and raised ``IndexError``.

    Args:
        source: the key to tokenize.

    Yields:
        Tokens in source order; nothing for an empty ``source``.
    """
    cursor = 0
    # Number of escaping backslashes dropped from the current buffer; needed
    # to compute the token's real start offset in ``source``.
    backslashes = 0
    buffer = []

    def send_buffer() -> Iterator[Token]:
        """Emit the buffered characters as one token and reset the buffer."""
        nonlocal backslashes
        if not buffer:
            return None

        value = ''.join(buffer)
        kind = TokenKind.TEXT
        if not backslashes:
            # Try each conversion in turn. If none succeeds, ``value`` is left
            # untouched and ``kind`` ends on the last candidate's kind, TEXT.
            for variation, kind in [
                (int, TokenKind.NUMBER),
                (check_escaped_int, TokenKind.TEXT),
            ]:
                try:
                    value = variation(value)
                except ValueError:
                    continue
                else:
                    break

        yield Token(
            kind, value, start=cursor - (len(buffer) + backslashes), end=cursor
        )
        buffer.clear()
        backslashes = 0

    def can_advance(offset: int = 0) -> bool:
        """Tell whether ``source`` has a character ``offset`` past the cursor."""
        return cursor + offset < len(source)

    while can_advance():
        char = source[cursor]
        if char in OPERATORS:
            yield from send_buffer()
            yield Token(OPERATORS[char], char, cursor, cursor + 1)
        elif char == BACKSLASH and can_advance(1):
            # Look-ahead is safe here: can_advance(1) guarantees a next char.
            following = source[cursor + 1]
            if following in SPECIAL_CHARS:
                backslashes += 1
            else:
                buffer.append(char)

            buffer.append(following)
            # Skip the character that was consumed by the look-ahead.
            cursor += 1
        else:
            # Ordinary character, or a trailing backslash with nothing after.
            buffer.append(char)

        cursor += 1

    yield from send_buffer()
|
|
|
|
|
|
|
|
|
2022-01-12 18:37:15 +01:00
|
|
|
class PathAction(Enum):
    """Operations that a segment of a nested JSON key can denote."""

    KEY = auto()
    INDEX = auto()
    APPEND = auto()

    # Pseudo action, used by the interpreter
    SET = auto()

    def to_string(self) -> str:
        """Return the member name in lower case."""
        member_name = self.name
        return member_name.lower()
|
|
|
|
|
|
|
|
|
2022-01-04 10:04:20 +01:00
|
|
|
class Path:
    """One segment of a parsed nested JSON key.

    ``kind`` is the action the segment performs, ``accessor`` the key or
    index it uses (when any), ``tokens`` the tokens it was built from, and
    ``is_root`` marks the leading segment that is written without brackets.
    """

    def __init__(
        self,
        kind: PathAction,
        accessor: Optional[Union[str, int]] = None,
        tokens: Optional[List[Token]] = None,
        is_root: bool = False,
    ):
        self.kind = kind
        self.accessor = accessor
        # A falsy ``tokens`` (None or empty) is replaced by a fresh list; a
        # non-empty list is stored as-is, not copied.
        self.tokens = tokens if tokens else []
        self.is_root = is_root

    def reconstruct(self) -> str:
        """Return the textual form of this segment.

        APPEND gives an empty bracket pair, INDEX and non-root KEY give the
        accessor wrapped in brackets, and a root KEY gives the bare accessor.
        Any other kind goes through ``assert_cant_happen``, which raises
        ``ValueError``.
        """
        action = self.kind
        if action is PathAction.APPEND:
            return OPEN_BRACKET + CLOSE_BRACKET
        if action is PathAction.INDEX:
            return OPEN_BRACKET + str(self.accessor) + CLOSE_BRACKET
        if action is PathAction.KEY:
            if self.is_root:
                return str(self.accessor)
            return OPEN_BRACKET + self.accessor + CLOSE_BRACKET
        assert_cant_happen()
|
|
|
|
|
|
|
|
|
|
|
|
def parse(source: str) -> Iterator[Path]:
    """
    Parse a nested JSON key into its path segments.

    The root segment is always yielded first (with an empty accessor when
    the key has no leading literal), followed by one segment per bracket
    pair. Raises HTTPieSyntaxError when the tokens do not match the grammar:

    start: literal? path*

    literal: TEXT | NUMBER

    path:
        key_path
        | index_path
        | append_path
    key_path: LEFT_BRACKET TEXT RIGHT_BRACKET
    index_path: LEFT_BRACKET NUMBER RIGHT_BRACKET
    append_path: LEFT_BRACKET RIGHT_BRACKET
    """

    tokens = list(tokenize(source))
    position = 0

    def can_advance():
        return position < len(tokens)

    def expect(*kinds):
        """Consume and return the next token if its kind is one of ``kinds``."""
        nonlocal position

        assert len(kinds) > 0
        if can_advance():
            token = tokens[position]
            position += 1
            if token.kind in kinds:
                return token
            # Otherwise fall through: the mismatching token gets highlighted.
        elif tokens:
            # Ran out of input: point one column past the last token.
            last = tokens[-1]
            token = last._replace(start=last.end + 0, end=last.end + 1)
        else:
            token = None

        names = [kind.to_name() for kind in kinds]
        *leading, final = names
        suffix = f"{', '.join(leading)} or {final}" if leading else final

        raise HTTPieSyntaxError(source, token, f'Expecting {suffix}')

    literal_kinds = (TokenKind.TEXT, TokenKind.NUMBER)
    root = Path(PathAction.KEY, '', is_root=True)
    if can_advance() and tokens[position].kind in literal_kinds:
        literal = expect(*literal_kinds)
        root.accessor = str(literal.value)
        root.tokens.append(literal)

    yield root

    while can_advance():
        opening = expect(TokenKind.LEFT_BRACKET)
        inner = expect(
            TokenKind.TEXT, TokenKind.NUMBER, TokenKind.RIGHT_BRACKET
        )
        segment_tokens = [opening, inner]

        if inner.kind is TokenKind.RIGHT_BRACKET:
            yield Path(PathAction.APPEND, tokens=segment_tokens)
            continue

        if inner.kind is TokenKind.TEXT:
            action = PathAction.KEY
        elif inner.kind is TokenKind.NUMBER:
            action = PathAction.INDEX
        else:
            assert_cant_happen()

        segment = Path(action, inner.value, tokens=segment_tokens)
        # The Path keeps this same list, so the closing bracket appended here
        # is also visible through ``segment.tokens``.
        segment_tokens.append(expect(TokenKind.RIGHT_BRACKET))
        yield segment
|
|
|
|
|
|
|
|
|
|
|
|
# JSON type names for the Python types they are reported as in type error
# messages. Types missing from this table are reported under their Python
# class name by the lookup in ``interpret``.
JSON_TYPE_MAPPING = {
    dict: 'object',
    list: 'array',
    # Both Python numeric types map to the single JSON number type.
    int: 'number',
    float: 'number',
    str: 'string',
}
|
|
|
|
|
|
|
|
|
|
|
|
def interpret(context: Any, key: str, value: Any) -> Any:
    """Store ``value`` in ``context`` at the location described by ``key``.

    ``key`` is parsed into path segments and a final pseudo SET segment that
    carries ``value``. The segments are walked in pairs (current, next).
    Missing intermediate containers are created according to the kind of the
    next segment, and lists are padded with ``None`` up to a requested index.

    Args:
        context: the container to update in place.
        key: the nested JSON key.
        value: the value to store.

    Returns:
        The same ``context`` object.

    Raises:
        HTTPieSyntaxError: with kind ``'Type'`` when a segment is applied to
            a container of the wrong type, with kind ``'Value'`` for a
            negative index, or as raised by ``parse`` for a malformed key.
    """
    paths = list(parse(key))
    paths.append(Path(PathAction.SET, value))

    def type_check(
        node: Any, index: int, path: Path, expected_type: Type[Any]
    ) -> None:
        """Raise a 'Type' error unless ``node`` is an ``expected_type``."""
        if isinstance(node, expected_type):
            return

        # Highlight the whole segment, from its first token to its last.
        pseudo_token = None
        if path.tokens:
            pseudo_token = Token(
                None, None, path.tokens[0].start, path.tokens[-1].end
            )

        node_type = type(node)
        cursor_type = JSON_TYPE_MAPPING.get(node_type, node_type.__name__)
        required_type = JSON_TYPE_MAPPING[expected_type]
        # Text of the key up to, but excluding, the failing segment.
        accessed = ''.join(
            earlier.reconstruct() for earlier in paths[:index]
        )

        message = (
            f"Can't perform {path.kind.to_string()!r} based access on "
            f'{accessed!r}'
            f' which has a type of {cursor_type!r} but this operation'
            f' requires a type of {required_type!r}.'
        )
        raise HTTPieSyntaxError(
            key, pseudo_token, message, message_kind='Type'
        )

    def object_for(kind: PathAction) -> Any:
        """Return a new empty container suited to a segment of ``kind``."""
        if kind is PathAction.KEY:
            return {}
        if kind in {PathAction.INDEX, PathAction.APPEND}:
            return []
        assert_cant_happen()

    node = context
    for position, (step, following) in enumerate(zip(paths, paths[1:])):
        # The SET pseudo segment is always last, so once it is the next
        # segment the current one performs the actual assignment.
        assigns = following.kind is PathAction.SET

        if step.kind is PathAction.KEY:
            type_check(node, position, step, dict)
            if assigns:
                node[step.accessor] = following.accessor
                break

            node = node.setdefault(step.accessor, object_for(following.kind))
        elif step.kind is PathAction.INDEX:
            type_check(node, position, step, list)
            if step.accessor < 0:
                raise HTTPieSyntaxError(
                    key,
                    step.tokens[1],
                    'Negative indexes are not supported.',
                    message_kind='Value',
                )

            # Pad with None so the index exists; a non-positive count leaves
            # the list unchanged.
            node.extend([None] * (step.accessor - len(node) + 1))
            if assigns:
                node[step.accessor] = following.accessor
                break

            if node[step.accessor] is None:
                node[step.accessor] = object_for(following.kind)

            node = node[step.accessor]
        elif step.kind is PathAction.APPEND:
            type_check(node, position, step, list)
            if assigns:
                node.append(following.accessor)
                break

            node.append(object_for(following.kind))
            node = node[-1]
        else:
            assert_cant_happen()

    return context
|
|
|
|
|
|
|
|
|
|
|
|
def interpret_nested_json(pairs):
    """Build a dict by applying every ``(key, value)`` pair with ``interpret``.

    Pairs are applied in iteration order to one shared, initially empty
    dict, which is returned.
    """
    result = {}
    for nested_key, nested_value in pairs:
        interpret(result, nested_key, nested_value)
    return result
|