process_gperf.py 4.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160
  1. #!/usr/bin/env python3
  2. #
  3. # Copyright (c) 2017 Intel Corporation
  4. #
  5. # SPDX-License-Identifier: Apache-2.0
  6. """
  7. gperf C file post-processor
  8. We use gperf to build up a perfect hashtable of pointer values. The way gperf
  9. does this is to create a table 'wordlist' indexed by a string representation
  10. of a pointer address, and then doing memcmp() on a string passed in for
  11. comparison
  12. We are exclusively working with 4-byte pointer values. This script adjusts
  13. the generated code so that we work with pointers directly and not strings.
  14. This saves a considerable amount of space.
  15. """
  16. import sys
  17. import argparse
  18. import os
  19. import re
  20. from distutils.version import LooseVersion
  21. # --- debug stuff ---
  22. def debug(text):
  23. if not args.verbose:
  24. return
  25. sys.stdout.write(os.path.basename(sys.argv[0]) + ": " + text + "\n")
  26. def error(text):
  27. sys.exit(os.path.basename(sys.argv[0]) + " ERROR: " + text)
  28. def warn(text):
  29. sys.stdout.write(
  30. os.path.basename(
  31. sys.argv[0]) +
  32. " WARNING: " +
  33. text +
  34. "\n")
  35. def reformat_str(match_obj):
  36. addr_str = match_obj.group(0)
  37. # Nip quotes
  38. addr_str = addr_str[1:-1]
  39. addr_vals = [0, 0, 0, 0, 0, 0, 0 , 0]
  40. ctr = 7
  41. i = 0
  42. while True:
  43. if i >= len(addr_str):
  44. break
  45. if addr_str[i] == "\\":
  46. if addr_str[i + 1].isdigit():
  47. # Octal escape sequence
  48. val_str = addr_str[i + 1:i + 4]
  49. addr_vals[ctr] = int(val_str, 8)
  50. i += 4
  51. else:
  52. # Char value that had to be escaped by C string rules
  53. addr_vals[ctr] = ord(addr_str[i + 1])
  54. i += 2
  55. else:
  56. addr_vals[ctr] = ord(addr_str[i])
  57. i += 1
  58. ctr -= 1
  59. return "(char *)0x%02x%02x%02x%02x%02x%02x%02x%02x" % tuple(addr_vals)
  60. def process_line(line, fp):
  61. if line.startswith("#"):
  62. fp.write(line)
  63. return
  64. # Set the lookup function to static inline so it gets rolled into
  65. # z_object_find(), nothing else will use it
  66. if re.search(args.pattern + " [*]$", line):
  67. fp.write("static inline " + line)
  68. return
  69. m = re.search("gperf version (.*) [*][/]$", line)
  70. if m:
  71. v = LooseVersion(m.groups()[0])
  72. v_lo = LooseVersion("3.0")
  73. v_hi = LooseVersion("3.1")
  74. if (v < v_lo or v > v_hi):
  75. warn("gperf %s is not tested, versions %s through %s supported" %
  76. (v, v_lo, v_hi))
  77. # Replace length lookups with constant len since we're always
  78. # looking at pointers
  79. line = re.sub(r'lengthtable\[key\]', r'sizeof(void *)', line)
  80. # Empty wordlist entries to have NULLs instead of ""
  81. line = re.sub(r'[{]["]["][}]', r'{}', line)
  82. # Suppress a compiler warning since this table is no longer necessary
  83. line = re.sub(r'static unsigned char lengthtable',
  84. r'static unsigned char __unused lengthtable', line)
  85. # drop all use of register keyword, let compiler figure that out,
  86. # we have to do this since we change stuff to take the address of some
  87. # parameters
  88. line = re.sub(r'register', r'', line)
  89. # Hashing the address of the string
  90. line = re.sub(r"hash [(]str, len[)]",
  91. r"hash((const char *)&str, len)", line)
  92. # Just compare pointers directly instead of using memcmp
  93. if re.search("if [(][*]str", line):
  94. fp.write(" if (str == s)\n")
  95. return
  96. # Take the strings with the binary information for the pointer values,
  97. # and just turn them into pointers
  98. line = re.sub(r'["].*["]', reformat_str, line)
  99. fp.write(line)
  100. def parse_args():
  101. global args
  102. parser = argparse.ArgumentParser(
  103. description=__doc__,
  104. formatter_class=argparse.RawDescriptionHelpFormatter)
  105. parser.add_argument("-i", "--input", required=True,
  106. help="Input C file from gperf")
  107. parser.add_argument("-o", "--output", required=True,
  108. help="Output C file with processing done")
  109. parser.add_argument("-p", "--pattern", required=True,
  110. help="Search pattern for objects")
  111. parser.add_argument("-v", "--verbose", action="store_true",
  112. help="Print extra debugging information")
  113. args = parser.parse_args()
  114. if "VERBOSE" in os.environ:
  115. args.verbose = 1
  116. def main():
  117. parse_args()
  118. with open(args.input, "r") as in_fp, open(args.output, "w") as out_fp:
  119. for line in in_fp.readlines():
  120. process_line(line, out_fp)
  121. if __name__ == "__main__":
  122. main()