aboutsummaryrefslogtreecommitdiff
path: root/py/makeqstrdata.py
diff options
context:
space:
mode:
Diffstat (limited to 'py/makeqstrdata.py')
-rw-r--r--py/makeqstrdata.py121
1 files changed, 68 insertions, 53 deletions
diff --git a/py/makeqstrdata.py b/py/makeqstrdata.py
index 7799be0a9..403c40688 100644
--- a/py/makeqstrdata.py
+++ b/py/makeqstrdata.py
@@ -13,49 +13,50 @@ import sys
# - iterating through bytes is different
# - codepoint2name lives in a different module
import platform
-if platform.python_version_tuple()[0] == '2':
+
+if platform.python_version_tuple()[0] == "2":
bytes_cons = lambda val, enc=None: bytearray(val)
from htmlentitydefs import codepoint2name
-elif platform.python_version_tuple()[0] == '3':
+elif platform.python_version_tuple()[0] == "3":
bytes_cons = bytes
from html.entities import codepoint2name
# end compatibility code
-codepoint2name[ord('-')] = 'hyphen';
+codepoint2name[ord("-")] = "hyphen"
# add some custom names to map characters that aren't in HTML
-codepoint2name[ord(' ')] = 'space'
-codepoint2name[ord('\'')] = 'squot'
-codepoint2name[ord(',')] = 'comma'
-codepoint2name[ord('.')] = 'dot'
-codepoint2name[ord(':')] = 'colon'
-codepoint2name[ord(';')] = 'semicolon'
-codepoint2name[ord('/')] = 'slash'
-codepoint2name[ord('%')] = 'percent'
-codepoint2name[ord('#')] = 'hash'
-codepoint2name[ord('(')] = 'paren_open'
-codepoint2name[ord(')')] = 'paren_close'
-codepoint2name[ord('[')] = 'bracket_open'
-codepoint2name[ord(']')] = 'bracket_close'
-codepoint2name[ord('{')] = 'brace_open'
-codepoint2name[ord('}')] = 'brace_close'
-codepoint2name[ord('*')] = 'star'
-codepoint2name[ord('!')] = 'bang'
-codepoint2name[ord('\\')] = 'backslash'
-codepoint2name[ord('+')] = 'plus'
-codepoint2name[ord('$')] = 'dollar'
-codepoint2name[ord('=')] = 'equals'
-codepoint2name[ord('?')] = 'question'
-codepoint2name[ord('@')] = 'at_sign'
-codepoint2name[ord('^')] = 'caret'
-codepoint2name[ord('|')] = 'pipe'
-codepoint2name[ord('~')] = 'tilde'
+codepoint2name[ord(" ")] = "space"
+codepoint2name[ord("'")] = "squot"
+codepoint2name[ord(",")] = "comma"
+codepoint2name[ord(".")] = "dot"
+codepoint2name[ord(":")] = "colon"
+codepoint2name[ord(";")] = "semicolon"
+codepoint2name[ord("/")] = "slash"
+codepoint2name[ord("%")] = "percent"
+codepoint2name[ord("#")] = "hash"
+codepoint2name[ord("(")] = "paren_open"
+codepoint2name[ord(")")] = "paren_close"
+codepoint2name[ord("[")] = "bracket_open"
+codepoint2name[ord("]")] = "bracket_close"
+codepoint2name[ord("{")] = "brace_open"
+codepoint2name[ord("}")] = "brace_close"
+codepoint2name[ord("*")] = "star"
+codepoint2name[ord("!")] = "bang"
+codepoint2name[ord("\\")] = "backslash"
+codepoint2name[ord("+")] = "plus"
+codepoint2name[ord("$")] = "dollar"
+codepoint2name[ord("=")] = "equals"
+codepoint2name[ord("?")] = "question"
+codepoint2name[ord("@")] = "at_sign"
+codepoint2name[ord("^")] = "caret"
+codepoint2name[ord("|")] = "pipe"
+codepoint2name[ord("~")] = "tilde"
# static qstrs, should be sorted
static_qstr_list = [
"",
- "__dir__", # Put __dir__ after empty qstr for builtin dir() to work
+ "__dir__", # Put __dir__ after empty qstr for builtin dir() to work
"\n",
" ",
"*",
@@ -229,15 +230,18 @@ def compute_hash(qstr, bytes_hash):
# Make sure that valid hash is never zero, zero means "hash not computed"
return (hash & ((1 << (8 * bytes_hash)) - 1)) or 1
+
def qstr_escape(qst):
def esc_char(m):
c = ord(m.group(0))
try:
name = codepoint2name[c]
except KeyError:
- name = '0x%02x' % c
- return "_" + name + '_'
- return re.sub(r'[^A-Za-z0-9_]', esc_char, qst)
+ name = "0x%02x" % c
+ return "_" + name + "_"
+
+ return re.sub(r"[^A-Za-z0-9_]", esc_char, qst)
+
def parse_input_headers(infiles):
qcfgs = {}
@@ -257,22 +261,22 @@ def parse_input_headers(infiles):
# read the qstrs in from the input files
for infile in infiles:
- with open(infile, 'rt') as f:
+ with open(infile, "rt") as f:
for line in f:
line = line.strip()
# is this a config line?
- match = re.match(r'^QCFG\((.+), (.+)\)', line)
+ match = re.match(r"^QCFG\((.+), (.+)\)", line)
if match:
value = match.group(2)
- if value[0] == '(' and value[-1] == ')':
+ if value[0] == "(" and value[-1] == ")":
# strip parenthesis from config value
value = value[1:-1]
qcfgs[match.group(1)] = value
continue
# is this a QSTR line?
- match = re.match(r'^Q\((.*)\)$', line)
+ match = re.match(r"^Q\((.*)\)$", line)
if not match:
continue
@@ -280,10 +284,10 @@ def parse_input_headers(infiles):
qstr = match.group(1)
# special cases to specify control characters
- if qstr == '\\n':
- qstr = '\n'
- elif qstr == '\\r\\n':
- qstr = '\r\n'
+ if qstr == "\\n":
+ qstr = "\n"
+ elif qstr == "\\r\\n":
+ qstr = "\r\n"
# work out the corresponding qstr name
ident = qstr_escape(qstr)
@@ -312,43 +316,54 @@ def parse_input_headers(infiles):
return qcfgs, qstrs
+
def make_bytes(cfg_bytes_len, cfg_bytes_hash, qstr):
- qbytes = bytes_cons(qstr, 'utf8')
+ qbytes = bytes_cons(qstr, "utf8")
qlen = len(qbytes)
qhash = compute_hash(qbytes, cfg_bytes_hash)
- if all(32 <= ord(c) <= 126 and c != '\\' and c != '"' for c in qstr):
+ if all(32 <= ord(c) <= 126 and c != "\\" and c != '"' for c in qstr):
# qstr is all printable ASCII so render it as-is (for easier debugging)
qdata = qstr
else:
# qstr contains non-printable codes so render entire thing as hex pairs
- qdata = ''.join(('\\x%02x' % b) for b in qbytes)
+ qdata = "".join(("\\x%02x" % b) for b in qbytes)
if qlen >= (1 << (8 * cfg_bytes_len)):
- print('qstr is too long:', qstr)
+ print("qstr is too long:", qstr)
assert False
- qlen_str = ('\\x%02x' * cfg_bytes_len) % tuple(((qlen >> (8 * i)) & 0xff) for i in range(cfg_bytes_len))
- qhash_str = ('\\x%02x' * cfg_bytes_hash) % tuple(((qhash >> (8 * i)) & 0xff) for i in range(cfg_bytes_hash))
+ qlen_str = ("\\x%02x" * cfg_bytes_len) % tuple(
+ ((qlen >> (8 * i)) & 0xFF) for i in range(cfg_bytes_len)
+ )
+ qhash_str = ("\\x%02x" * cfg_bytes_hash) % tuple(
+ ((qhash >> (8 * i)) & 0xFF) for i in range(cfg_bytes_hash)
+ )
return '(const byte*)"%s%s" "%s"' % (qhash_str, qlen_str, qdata)
+
def print_qstr_data(qcfgs, qstrs):
# get config variables
- cfg_bytes_len = int(qcfgs['BYTES_IN_LEN'])
- cfg_bytes_hash = int(qcfgs['BYTES_IN_HASH'])
+ cfg_bytes_len = int(qcfgs["BYTES_IN_LEN"])
+ cfg_bytes_hash = int(qcfgs["BYTES_IN_HASH"])
# print out the starter of the generated C header file
- print('// This file was automatically generated by makeqstrdata.py')
- print('')
+ print("// This file was automatically generated by makeqstrdata.py")
+ print("")
# add NULL qstr with no hash or data
- print('QDEF(MP_QSTRnull, (const byte*)"%s%s" "")' % ('\\x00' * cfg_bytes_hash, '\\x00' * cfg_bytes_len))
+ print(
+ 'QDEF(MP_QSTRnull, (const byte*)"%s%s" "")'
+ % ("\\x00" * cfg_bytes_hash, "\\x00" * cfg_bytes_len)
+ )
# go through each qstr and print it out
for order, ident, qstr in sorted(qstrs.values(), key=lambda x: x[0]):
qbytes = make_bytes(cfg_bytes_len, cfg_bytes_hash, qstr)
- print('QDEF(MP_QSTR_%s, %s)' % (ident, qbytes))
+ print("QDEF(MP_QSTR_%s, %s)" % (ident, qbytes))
+
def do_work(infiles):
qcfgs, qstrs = parse_input_headers(infiles)
print_qstr_data(qcfgs, qstrs)
+
if __name__ == "__main__":
do_work(sys.argv[1:])