2011-07-19 23:50:39 +04:00
|
|
|
#
|
|
|
|
# QAPI helper library
|
|
|
|
#
|
|
|
|
# Copyright IBM, Corp. 2011
|
2018-02-26 22:19:40 +03:00
|
|
|
# Copyright (c) 2013-2018 Red Hat Inc.
|
2011-07-19 23:50:39 +04:00
|
|
|
#
|
|
|
|
# Authors:
|
|
|
|
# Anthony Liguori <aliguori@us.ibm.com>
|
qapi.py: Restructure lexer and parser
The parser has a rather unorthodox structure:
Until EOF:
Read a section:
Generator function get_expr() yields one section after the
other, as a string. An unindented, non-empty line that
isn't a comment starts a new section.
Lexing:
Split section into a list of tokens (strings), with help
of generator function tokenize().
Parsing:
Parse the first expression from the list of tokens, with
parse(), throw away any remaining tokens.
In parse_schema(): record value of an enum, union or
struct key (if any) in the appropriate global table,
append expression to the list of expressions.
Return list of expressions.
Known issues:
(1) Indentation is significant, unlike in real JSON.
(2) Neither lexer nor parser have any idea of source positions. Error
reporting is hard, let's go shopping.
(3) The one error we bother to detect, we "report" via raise.
(4) The lexer silently ignores invalid characters.
(5) If everything in a section gets ignored, the parser crashes.
(6) The lexer treats a string containing a structural character exactly
like the structural character.
(7) Tokens trailing the first expression in a section are silently
ignored.
(8) The parser accepts any token in place of a colon.
(9) The parser treats comma as optional.
(10) parse() crashes on unexpected EOF.
(11) parse_schema() crashes when a section's expression isn't a JSON
object.
Replace this piece of original art by a thoroughly unoriginal design.
Takes care of (1), (2), (5), (6) and (7), and lays the groundwork for
addressing the others. Generated source files remain unchanged.
Signed-off-by: Markus Armbruster <armbru@redhat.com>
Reviewed-by: Eric Blake <eblake@redhat.com>
Message-id: 1374939721-7876-4-git-send-email-armbru@redhat.com
Signed-off-by: Anthony Liguori <aliguori@us.ibm.com>
2013-07-27 19:41:55 +04:00
|
|
|
# Markus Armbruster <armbru@redhat.com>
|
2011-07-19 23:50:39 +04:00
|
|
|
#
|
2014-03-01 11:40:34 +04:00
|
|
|
# This work is licensed under the terms of the GNU GPL, version 2.
|
|
|
|
# See the COPYING file in the top-level directory.
|
2011-07-19 23:50:39 +04:00
|
|
|
|
2017-03-15 15:57:35 +03:00
|
|
|
import re
|
2021-08-04 11:30:59 +03:00
|
|
|
from typing import (
|
2021-08-04 11:31:01 +03:00
|
|
|
Any,
|
|
|
|
Dict,
|
2021-08-04 11:30:59 +03:00
|
|
|
Match,
|
|
|
|
Optional,
|
2021-08-31 15:38:03 +03:00
|
|
|
Sequence,
|
2021-08-04 11:30:59 +03:00
|
|
|
Union,
|
|
|
|
)
|
2011-07-19 23:50:39 +04:00
|
|
|
|
2015-09-30 01:21:02 +03:00
|
|
|
|
2020-10-09 19:15:38 +03:00
|
|
|
#: Magic string that gets removed along with all space to its right.
|
2020-10-09 19:15:34 +03:00
|
|
|
EATSPACE = '\033EATSPACE.'
|
|
|
|
POINTER_SUFFIX = ' *' + EATSPACE
|
|
|
|
|
|
|
|
|
2020-10-09 19:15:37 +03:00
|
|
|
def camel_to_upper(value: str) -> str:
|
2020-10-09 19:15:38 +03:00
|
|
|
"""
|
|
|
|
Converts CamelCase to CAMEL_CASE.
|
|
|
|
|
|
|
|
Examples::
|
|
|
|
|
|
|
|
ENUMName -> ENUM_NAME
|
|
|
|
EnumName1 -> ENUM_NAME1
|
|
|
|
ENUM_NAME -> ENUM_NAME
|
|
|
|
ENUM_NAME1 -> ENUM_NAME1
|
|
|
|
ENUM_Name2 -> ENUM_NAME2
|
|
|
|
ENUM24_Name -> ENUM24_NAME
|
|
|
|
"""
|
2015-05-14 15:50:53 +03:00
|
|
|
c_fun_str = c_name(value, False)
|
|
|
|
if value.isupper():
|
|
|
|
return c_fun_str
|
|
|
|
|
|
|
|
new_name = ''
|
2018-06-21 11:35:51 +03:00
|
|
|
length = len(c_fun_str)
|
|
|
|
for i in range(length):
|
2020-10-09 19:15:35 +03:00
|
|
|
char = c_fun_str[i]
|
|
|
|
# When char is upper case and no '_' appears before, do more checks
|
|
|
|
if char.isupper() and (i > 0) and c_fun_str[i - 1] != '_':
|
2018-06-21 11:35:51 +03:00
|
|
|
if i < length - 1 and c_fun_str[i + 1].islower():
|
2015-09-30 01:21:02 +03:00
|
|
|
new_name += '_'
|
|
|
|
elif c_fun_str[i - 1].isdigit():
|
2015-05-14 15:50:53 +03:00
|
|
|
new_name += '_'
|
2020-10-09 19:15:35 +03:00
|
|
|
new_name += char
|
2015-05-14 15:50:53 +03:00
|
|
|
return new_name.lstrip('_').upper()
|
|
|
|
|
2015-09-30 01:21:02 +03:00
|
|
|
|
2020-10-09 19:15:37 +03:00
|
|
|
def c_enum_const(type_name: str,
|
|
|
|
const_name: str,
|
|
|
|
prefix: Optional[str] = None) -> str:
|
2020-10-09 19:15:38 +03:00
|
|
|
"""
|
|
|
|
Generate a C enumeration constant name.
|
|
|
|
|
|
|
|
:param type_name: The name of the enumeration.
|
|
|
|
:param const_name: The name of this constant.
|
|
|
|
:param prefix: Optional, prefix that overrides the type_name.
|
|
|
|
"""
|
2015-08-26 16:21:20 +03:00
|
|
|
if prefix is not None:
|
|
|
|
type_name = prefix
|
qapi: Change munging of CamelCase enum values
When munging enum values, the fact that we were passing the entire
prefix + value through camel_to_upper() meant that enum values
spelled with CamelCase could be turned into CAMEL_CASE. However,
this provides a potential collision (both OneTwo and One-Two would
munge into ONE_TWO) for enum types, when the same two names are
valid side-by-side as QAPI member names. By changing the generation
of enum constants to always be prefix + '_' + c_name(value,
False).upper(), and ensuring that there are no case collisions (in
the next patches), we no longer have to worry about names that
would be distinct as QAPI members but collide as variant tag names,
without having to think about what munging the heuristics in
camel_to_upper() will actually perform on an enum value.
Making the change will affect enums that did not follow coding
conventions, using 'CamelCase' rather than desired 'lower-case'.
Thankfully, there are only two culprits: InputButton and ErrorClass.
We already tweaked ErrorClass to make it an alias of QapiErrorClass,
where only the alias needs changing rather than the whole tree. So
the bulk of this change is modifying INPUT_BUTTON_WHEEL_UP to the
new INPUT_BUTTON_WHEELUP (and likewise for WHEELDOWN). That part
of this commit may later need reverting if we rename the enum
constants from 'WheelUp' to 'wheel-up' as part of moving
x-input-send-event to a stable interface; but at least we have
documentation bread crumbs in place to remind us (commit 513e7cd),
and it matches the fact that SDL constants are also spelled
SDL_BUTTON_WHEELUP.
Suggested by: Markus Armbruster <armbru@redhat.com>
Signed-off-by: Eric Blake <eblake@redhat.com>
Message-Id: <1447836791-369-27-git-send-email-eblake@redhat.com>
[Commit message tweaked]
Signed-off-by: Markus Armbruster <armbru@redhat.com>
2015-11-18 11:53:01 +03:00
|
|
|
return camel_to_upper(type_name) + '_' + c_name(const_name, False).upper()
|
2015-05-14 15:50:53 +03:00
|
|
|
|
2018-06-21 11:35:51 +03:00
|
|
|
|
2020-10-09 19:15:37 +03:00
|
|
|
def c_name(name: str, protect: bool = True) -> str:
|
2020-10-09 19:15:38 +03:00
|
|
|
"""
|
|
|
|
Map ``name`` to a valid C identifier.
|
|
|
|
|
|
|
|
Used for converting 'name' from a 'name':'type' qapi definition
|
|
|
|
into a generated struct member, as well as converting type names
|
|
|
|
into substrings of a generated C function name.
|
|
|
|
|
|
|
|
'__a.b_c' -> '__a_b_c', 'x-foo' -> 'x_foo'
|
|
|
|
protect=True: 'int' -> 'q_int'; protect=False: 'int' -> 'int'
|
|
|
|
|
|
|
|
:param name: The name to map.
|
|
|
|
:param protect: If true, avoid returning certain ticklish identifiers
|
|
|
|
(like C keywords) by prepending ``q_``.
|
|
|
|
"""
|
2012-07-30 19:46:55 +04:00
|
|
|
# ANSI X3J11/88-090, 3.1.1
|
|
|
|
c89_words = set(['auto', 'break', 'case', 'char', 'const', 'continue',
|
2015-09-30 01:21:02 +03:00
|
|
|
'default', 'do', 'double', 'else', 'enum', 'extern',
|
|
|
|
'float', 'for', 'goto', 'if', 'int', 'long', 'register',
|
|
|
|
'return', 'short', 'signed', 'sizeof', 'static',
|
|
|
|
'struct', 'switch', 'typedef', 'union', 'unsigned',
|
|
|
|
'void', 'volatile', 'while'])
|
2012-07-30 19:46:55 +04:00
|
|
|
# ISO/IEC 9899:1999, 6.4.1
|
|
|
|
c99_words = set(['inline', 'restrict', '_Bool', '_Complex', '_Imaginary'])
|
|
|
|
# ISO/IEC 9899:2011, 6.4.1
|
2015-09-30 01:21:02 +03:00
|
|
|
c11_words = set(['_Alignas', '_Alignof', '_Atomic', '_Generic',
|
|
|
|
'_Noreturn', '_Static_assert', '_Thread_local'])
|
2012-07-30 19:46:55 +04:00
|
|
|
# GCC http://gcc.gnu.org/onlinedocs/gcc-4.7.1/gcc/C-Extensions.html
|
|
|
|
# excluding _.*
|
|
|
|
gcc_words = set(['asm', 'typeof'])
|
2013-08-07 19:39:43 +04:00
|
|
|
# C++ ISO/IEC 14882:2003 2.11
|
|
|
|
cpp_words = set(['bool', 'catch', 'class', 'const_cast', 'delete',
|
|
|
|
'dynamic_cast', 'explicit', 'false', 'friend', 'mutable',
|
|
|
|
'namespace', 'new', 'operator', 'private', 'protected',
|
|
|
|
'public', 'reinterpret_cast', 'static_cast', 'template',
|
|
|
|
'this', 'throw', 'true', 'try', 'typeid', 'typename',
|
|
|
|
'using', 'virtual', 'wchar_t',
|
|
|
|
# alternative representations
|
|
|
|
'and', 'and_eq', 'bitand', 'bitor', 'compl', 'not',
|
|
|
|
'not_eq', 'or', 'or_eq', 'xor', 'xor_eq'])
|
2012-09-19 18:31:07 +04:00
|
|
|
# namespace pollution:
|
2018-04-27 22:28:49 +03:00
|
|
|
polluted_words = set(['unix', 'errno', 'mips', 'sparc', 'i386'])
|
2021-03-23 12:40:05 +03:00
|
|
|
name = re.sub(r'[^A-Za-z0-9_]', '_', name)
|
|
|
|
if protect and (name in (c89_words | c99_words | c11_words | gcc_words
|
|
|
|
| cpp_words | polluted_words)
|
|
|
|
or name[0].isdigit()):
|
2017-03-15 15:57:08 +03:00
|
|
|
return 'q_' + name
|
2015-11-18 11:52:52 +03:00
|
|
|
return name
|
2011-07-19 23:50:39 +04:00
|
|
|
|
2018-06-21 11:35:51 +03:00
|
|
|
|
2020-10-09 19:15:33 +03:00
|
|
|
class Indentation:
|
|
|
|
"""
|
|
|
|
Indentation level management.
|
2011-07-19 23:50:39 +04:00
|
|
|
|
2020-10-09 19:15:33 +03:00
|
|
|
:param initial: Initial number of spaces, default 0.
|
|
|
|
"""
|
|
|
|
def __init__(self, initial: int = 0) -> None:
|
|
|
|
self._level = initial
|
2018-06-21 11:35:51 +03:00
|
|
|
|
2020-10-09 19:15:33 +03:00
|
|
|
def __int__(self) -> int:
|
|
|
|
return self._level
|
2011-07-19 23:50:39 +04:00
|
|
|
|
2020-10-09 19:15:33 +03:00
|
|
|
def __repr__(self) -> str:
|
|
|
|
return "{}({:d})".format(type(self).__name__, self._level)
|
2015-09-30 01:21:02 +03:00
|
|
|
|
2020-10-09 19:15:33 +03:00
|
|
|
def __str__(self) -> str:
|
|
|
|
"""Return the current indentation as a string of spaces."""
|
|
|
|
return ' ' * self._level
|
2011-07-19 23:50:39 +04:00
|
|
|
|
2020-10-09 19:15:33 +03:00
|
|
|
def __bool__(self) -> bool:
|
|
|
|
"""True when there is a non-zero indentation."""
|
|
|
|
return bool(self._level)
|
2015-09-30 01:21:02 +03:00
|
|
|
|
2020-10-09 19:15:33 +03:00
|
|
|
def increase(self, amount: int = 4) -> None:
|
|
|
|
"""Increase the indentation level by ``amount``, default 4."""
|
|
|
|
self._level += amount
|
|
|
|
|
|
|
|
def decrease(self, amount: int = 4) -> None:
|
|
|
|
"""Decrease the indentation level by ``amount``, default 4."""
|
|
|
|
if self._level < amount:
|
|
|
|
raise ArithmeticError(
|
|
|
|
f"Can't remove {amount:d} spaces from {self!r}")
|
|
|
|
self._level -= amount
|
|
|
|
|
|
|
|
|
2020-10-09 19:15:38 +03:00
|
|
|
#: Global, current indent level for code generation.
|
2020-10-09 19:15:33 +03:00
|
|
|
indent = Indentation()
|
2011-07-19 23:50:39 +04:00
|
|
|
|
2015-09-30 01:21:02 +03:00
|
|
|
|
2020-10-09 19:15:37 +03:00
|
|
|
def cgen(code: str, **kwds: object) -> str:
|
2020-10-09 19:15:38 +03:00
|
|
|
"""
|
|
|
|
Generate ``code`` with ``kwds`` interpolated.
|
|
|
|
|
|
|
|
Obey `indent`, and strip `EATSPACE`.
|
|
|
|
"""
|
2015-06-24 20:27:32 +03:00
|
|
|
raw = code % kwds
|
2020-10-09 19:15:33 +03:00
|
|
|
if indent:
|
|
|
|
raw = re.sub(r'^(?!(#|$))', str(indent), raw, flags=re.MULTILINE)
|
2020-10-09 19:15:34 +03:00
|
|
|
return re.sub(re.escape(EATSPACE) + r' *', '', raw)
|
2011-07-19 23:50:39 +04:00
|
|
|
|
2015-09-30 01:21:02 +03:00
|
|
|
|
2020-10-09 19:15:37 +03:00
|
|
|
def mcgen(code: str, **kwds: object) -> str:
|
2015-06-24 20:27:32 +03:00
|
|
|
if code[0] == '\n':
|
|
|
|
code = code[1:]
|
|
|
|
return cgen(code, **kwds)
|
2011-07-19 23:50:39 +04:00
|
|
|
|
|
|
|
|
2020-10-09 19:15:37 +03:00
|
|
|
def c_fname(filename: str) -> str:
|
2019-03-01 18:40:48 +03:00
|
|
|
return re.sub(r'[^A-Za-z0-9_]', '_', filename)
|
2013-05-11 02:46:00 +04:00
|
|
|
|
2015-09-30 01:21:02 +03:00
|
|
|
|
2020-10-09 19:15:37 +03:00
|
|
|
def guardstart(name: str) -> str:
|
2013-05-11 02:46:00 +04:00
|
|
|
return mcgen('''
|
|
|
|
#ifndef %(name)s
|
|
|
|
#define %(name)s
|
|
|
|
|
|
|
|
''',
|
2019-03-01 18:40:48 +03:00
|
|
|
name=c_fname(name).upper())
|
2013-05-11 02:46:00 +04:00
|
|
|
|
2015-09-30 01:21:02 +03:00
|
|
|
|
2020-10-09 19:15:37 +03:00
|
|
|
def guardend(name: str) -> str:
|
2013-05-11 02:46:00 +04:00
|
|
|
return mcgen('''
|
|
|
|
|
|
|
|
#endif /* %(name)s */
|
|
|
|
''',
|
2019-03-01 18:40:48 +03:00
|
|
|
name=c_fname(name).upper())
|
2015-04-02 14:12:21 +03:00
|
|
|
|
2015-09-30 01:21:02 +03:00
|
|
|
|
2021-08-31 15:38:03 +03:00
|
|
|
def gen_ifcond(ifcond: Optional[Union[str, Dict[str, Any]]],
|
|
|
|
cond_fmt: str, not_fmt: str,
|
|
|
|
all_operator: str, any_operator: str) -> str:
|
|
|
|
|
2021-08-31 15:38:04 +03:00
|
|
|
def do_gen(ifcond: Union[str, Dict[str, Any]], need_parens: bool):
|
2021-08-31 15:38:03 +03:00
|
|
|
if isinstance(ifcond, str):
|
|
|
|
return cond_fmt % ifcond
|
|
|
|
assert isinstance(ifcond, dict) and len(ifcond) == 1
|
|
|
|
if 'not' in ifcond:
|
2021-08-31 15:38:04 +03:00
|
|
|
return not_fmt % do_gen(ifcond['not'], True)
|
2021-08-31 15:38:03 +03:00
|
|
|
if 'all' in ifcond:
|
|
|
|
gen = gen_infix(all_operator, ifcond['all'])
|
|
|
|
else:
|
|
|
|
gen = gen_infix(any_operator, ifcond['any'])
|
2021-08-31 15:38:04 +03:00
|
|
|
if need_parens:
|
|
|
|
gen = '(' + gen + ')'
|
2021-08-31 15:38:03 +03:00
|
|
|
return gen
|
|
|
|
|
|
|
|
def gen_infix(operator: str, operands: Sequence[Any]) -> str:
|
2021-08-31 15:38:04 +03:00
|
|
|
return operator.join([do_gen(o, True) for o in operands])
|
2021-08-31 15:38:03 +03:00
|
|
|
|
2021-08-04 11:30:59 +03:00
|
|
|
if not ifcond:
|
|
|
|
return ''
|
2021-08-31 15:38:04 +03:00
|
|
|
return do_gen(ifcond, False)
|
2021-08-04 11:30:59 +03:00
|
|
|
|
2021-08-31 15:38:03 +03:00
|
|
|
|
|
|
|
def cgen_ifcond(ifcond: Optional[Union[str, Dict[str, Any]]]) -> str:
|
|
|
|
return gen_ifcond(ifcond, 'defined(%s)', '!%s', ' && ', ' || ')
|
2021-08-04 11:30:59 +03:00
|
|
|
|
2021-08-04 11:31:01 +03:00
|
|
|
|
2021-08-31 15:37:59 +03:00
|
|
|
def docgen_ifcond(ifcond: Optional[Union[str, Dict[str, Any]]]) -> str:
|
2021-08-04 11:31:00 +03:00
|
|
|
# TODO Doc generated for conditions needs polish
|
2021-08-31 15:38:05 +03:00
|
|
|
return gen_ifcond(ifcond, '%s', 'not %s', ' and ', ' or ')
|
2021-08-04 11:31:00 +03:00
|
|
|
|
|
|
|
|
2021-08-04 11:30:59 +03:00
|
|
|
def gen_if(cond: str) -> str:
|
|
|
|
if not cond:
|
|
|
|
return ''
|
|
|
|
return mcgen('''
|
2018-07-03 18:56:40 +03:00
|
|
|
#if %(cond)s
|
2021-08-04 11:30:59 +03:00
|
|
|
''', cond=cond)
|
2018-07-03 18:56:40 +03:00
|
|
|
|
|
|
|
|
2021-08-04 11:30:59 +03:00
|
|
|
def gen_endif(cond: str) -> str:
|
|
|
|
if not cond:
|
|
|
|
return ''
|
|
|
|
return mcgen('''
|
2018-07-03 18:56:40 +03:00
|
|
|
#endif /* %(cond)s */
|
2021-08-04 11:30:59 +03:00
|
|
|
''', cond=cond)
|
2021-05-19 21:39:45 +03:00
|
|
|
|
|
|
|
|
|
|
|
def must_match(pattern: str, string: str) -> Match[str]:
|
|
|
|
match = re.match(pattern, string)
|
|
|
|
assert match is not None
|
|
|
|
return match
|