aboutsummaryrefslogtreecommitdiff
path: root/scripts/operator_api/generate_api.py
diff options
context:
space:
mode:
Diffstat (limited to 'scripts/operator_api/generate_api.py')
-rw-r--r--scripts/operator_api/generate_api.py349
1 files changed, 349 insertions, 0 deletions
diff --git a/scripts/operator_api/generate_api.py b/scripts/operator_api/generate_api.py
new file mode 100644
index 0000000..1f89f74
--- /dev/null
+++ b/scripts/operator_api/generate_api.py
@@ -0,0 +1,349 @@
+"""Generate extended reference model API with eager operator execution entrypoints"""
+# Copyright (c) 2021-2022, ARM Limited.
+# SPDX-License-Identifier: Apache-2.0
+import copy
+import os
+import subprocess
+from xml.dom import minidom
+
+from jinja2 import Environment
+from jinja2 import FileSystemLoader
+
+
def getTosaArgTypes(tosaXml):
    """
    Return the set of TOSA argument type names found in tosa.xml.

    The result starts from a fixed set of generic type names and is extended
    with the ``name`` attribute of every ``<type>`` element below ``tosaXml``.
    The ``TABLE_SIZE`` entry is dropped if it is present.

    Args:
        tosaXml: Parsed XML node exposing ``getElementsByTagName()``.

    Returns:
        A set of type-name strings (not a list; callers only test membership
        or iterate over it).
    """
    argTypes = {"in_t", "out_t", "mul_t", "weight_t", "in_out_t"}
    argTypes.update(
        typeXml.getAttribute("name")
        for typeXml in tosaXml.getElementsByTagName("type")
    )
    # discard() instead of remove(): a document that declares no TABLE_SIZE
    # type must not abort the generator with a KeyError.
    argTypes.discard("TABLE_SIZE")
    return argTypes
+
+
def getTosaDataTypes(tosaXml):
    """
    Return a sorted list of the TOSA data type identifiers used in tosa.xml.

    Every ``<typesupport>`` element is inspected for attributes named after
    the known argument types; each non-empty attribute value is reported
    once, prefixed with ``tosa_datatype_``.
    """
    typeNames = getTosaArgTypes(tosaXml)
    found = set()
    for supportXml in tosaXml.getElementsByTagName("typesupport"):
        # getAttribute() yields "" for an attribute that is not set.
        values = (supportXml.getAttribute(typeName) for typeName in typeNames)
        found.update(f"tosa_datatype_{value}" for value in values if value)
    return sorted(found)
+
+
def getSerializeOpType(tosaOpName):
    """
    Return the Serialization library operator that matches a TOSA operator.

    Args:
        tosaOpName: Lower-case TOSA operator name, e.g. ``"conv2d"``.

    Returns:
        The Serialization attribute type name, or the *string* ``"None"``
        (not the ``None`` object) when the operator has no entry.
    """
    # Named so that it does not shadow the builtin ``map``.
    serializeOpTypes = {
        "avg_pool2d": "Pool",
        "conv2d": "Conv",
        "conv3d": "Conv",
        "depthwise_conv2d": "Conv",
        "fully_connected": "FullyConnected",
        "matmul": "MatMul",
        "max_pool2d": "Pool",
        "transpose_conv2d": "Conv",
        "clamp": "Clamp",
        "arithmetic_right_shift": "ArithmeticRightShift",
        "mul": "Mul",
        "table": "Table",
        "negate": "Negate",
        "pad": "Pad",
        "reshape": "Reshape",
        "slice": "Slice",
        "tile": "Tile",
        "transpose": "Transpose",
        "resize": "Resize",
        "rescale": "Rescale",
        "cond_if": "CondIf",
        "while_loop": "WhileLoop",
    }
    return serializeOpTypes.get(tosaOpName, "None")
+
+
def _serializeArgInit(arg, tosaArgsDict):
    """
    Build the initializer text for one Serialization argument.

    May rewrite ``arg["dType"]`` from ``"DType"`` to ``"tosa::DType"`` when a
    scalar argument has no matching TOSA argument.
    """
    serTosaTypeMap = {"ResizeMode": "tosa_mode"}
    name = arg["name"]
    # Translate TOSA data types to Serialization data types for initialization
    if arg["dType"] in serTosaTypeMap:
        return f" = translate_client_{serTosaTypeMap[arg['dType']]}(client_{name})"

    isVector = arg["SV"] == "V"
    # Initialize Serialization arguments to their matching function parameter
    if name in tosaArgsDict:
        if not isVector:
            return f" = client_{name}"
        shape = tosaArgsDict[name]["shape"]
        if shape == "[]":
            return f"(&client_{name}[0], &client_{name}[0] + client_{name}_len)"
        return f"(&client_{name}[0], &client_{name}{shape})"

    # Initialize Serialization arguments with no matching function parameter
    if isVector:
        return ""
    if arg["dType"] == "DType":
        arg["dType"] = "tosa::DType"
        return " = tosa::DType::DType_FP32"
    return " = 0"


def getSerializeArgsForOp(tosaOpName, allSerializeArgs, tosaArgs):
    """
    Return the Serialization library arguments for the given TOSA operator.

    Each returned argument is a deep copy of its entry in ``allSerializeArgs``
    extended with an ``"init"`` key holding generated initializer code: the
    matching TOSA argument is used when one exists, otherwise a default value
    (e.g. 0) is used. An empty dict is returned when the operator has no
    Serialization attribute.
    """
    serOpType = getSerializeOpType(tosaOpName)
    if serOpType not in allSerializeArgs:
        return {}

    # Work on a copy so the shared attribute table is never modified.
    serOpArgs = copy.deepcopy(allSerializeArgs[serOpType])
    tosaArgsDict = {tosaArg["name"]: tosaArg for tosaArg in tosaArgs}
    for serArg in serOpArgs:
        serArg["init"] = _serializeArgInit(serArg, tosaArgsDict)
    return serOpArgs
+
+
def updateTosaArgs(tosaArgs, serializeArgs, tosaXml):
    """
    Reconcile the TOSA argument list with the Serialization arguments, in place.

    - A TOSA argument whose type is a generic TOSA type name takes the data
      type of the Serialization argument with the same name.
    - If no such Serialization argument exists, the TOSA argument (and its
      ``<name>_len`` companion, when present) is removed.
    - Serialization arguments with no matching TOSA argument are inserted just
      before the last entry of ``tosaArgs``; vector arguments are preceded by
      an ``int32_t`` length argument. Arguments of type ``tosa::DType`` are
      not added.

    ``tosaArgs`` is mutated, as is the ``"init"`` entry of any Serialization
    argument that gets added. Nothing is returned.
    """
    genericTypes = getTosaArgTypes(tosaXml)
    serByName = {serArg["name"]: serArg for serArg in serializeArgs}
    originalNames = [tosaArg["name"] for tosaArg in tosaArgs]

    # Pass 1: retype arguments, remembering the positions of those to drop.
    doomed = []
    for tosaArg in tosaArgs:
        if tosaArg["type"] not in genericTypes:
            continue
        name = tosaArg["name"]
        if name in serByName:
            tosaArg["type"] = serByName[name]["dType"]
            continue
        # Data type can't be determined: drop the argument ...
        doomed.append(originalNames.index(name))
        # ... together with its length argument if one exists.
        lenName = f"{name}_len"
        if lenName in originalNames:
            doomed.append(originalNames.index(lenName))

    # Delete from the back so earlier positions stay valid.
    doomed.sort(reverse=True)
    for position in doomed:
        del tosaArgs[position]

    # Pass 2: add Serialization arguments that have no matching TOSA argument.
    presentNames = [tosaArg["name"] for tosaArg in tosaArgs]
    for serArg in serializeArgs:
        serName = serArg["name"]
        if serName in presentNames or serArg["dType"] == "tosa::DType":
            continue
        isVector = serArg["SV"] == "V"
        if isVector:
            # For vector data types, insert a matching length argument first
            tosaArgs.insert(
                len(tosaArgs) - 1,
                {
                    "name": f"{serName}_len",
                    "type": "int32_t",
                    "shape": "",
                    "category": "",
                },
            )
            serArg["init"] = (
                f"(&client_{serName}[0], &client_{serName}[0] + client_{serName}_len)"
            )
        else:
            serArg["init"] = f" = client_{serName}"
        # Insert the new argument itself
        tosaArgs.insert(
            len(tosaArgs) - 1,
            {
                "name": serName,
                "type": serArg["dType"],
                "shape": "[]" if isVector else "",
                "category": "",
            },
        )
+
+
def getOperators(tosaXml):
    """
    Return a list describing every TOSA operator defined by tosa.xml.

    Each entry is a dict with the operator ``name``, its Serialization
    attribute type, the reconciled argument list, the Serialization
    arguments, and the names of its input and output arguments. Operators
    in the ignore list are left out.
    """
    ignoreOps = ["while_loop", "cond_if", "const", "custom", "fft2d", "rfft2d"]
    opsXml = tosaXml.getElementsByTagName("operator")
    allSerializeArgs = getSerializeArgs()

    operators = []
    for opXml in opsXml:
        opName = opXml.getElementsByTagName("name")[0].firstChild.data.lower()
        if opName in ignoreOps:
            continue
        serializeAttType = getSerializeOpType(opName)
        tosaArgs = getTosaArgs(opXml)
        serializeArgs = getSerializeArgsForOp(opName, allSerializeArgs, tosaArgs)
        # Mutates tosaArgs (and the "init" of some serializeArgs) in place.
        updateTosaArgs(tosaArgs, serializeArgs, tosaXml)
        operators.append(
            {
                "name": opName,
                "serializeAttType": serializeAttType,
                "arguments": tosaArgs,
                "serializeArgs": serializeArgs,
                "inputs": [a["name"] for a in tosaArgs if a["category"] == "input"],
                "outputs": [a["name"] for a in tosaArgs if a["category"] == "output"],
            }
        )
    return operators
+
+
def getTosaArgs(opXml, tosaXml=None):
    """
    Return the arguments required for the TOSA operator specified.

    Args:
        opXml: ``<operator>`` element whose ``<argument>`` children are read.
        tosaXml: Document used to look up the TOSA argument type names.
            Defaults to the document that owns ``opXml``, so the function no
            longer depends on a module-level ``tosaXml`` global that only
            exists when this file is run as a script.

    Returns:
        A list of dicts with the keys ``name``, ``type``, ``shape`` and
        ``category``. An array argument whose size is not a numeric literal
        gets shape ``"[]"`` and is preceded by an ``int32_t`` argument named
        ``<name>_len``.
    """
    if tosaXml is None:
        tosaXml = opXml.ownerDocument
    tosaTensorTypes = getTosaArgTypes(tosaXml)
    tosaTypeMap = {"bool_t": "bool", "uint6_t": "uint8_t", "mode_t": "tosa_mode_t"}

    arguments = []
    for xmlArg in opXml.getElementsByTagName("argument"):
        argName = xmlArg.getAttribute("name").lower()
        argType = xmlArg.getAttribute("type")
        argShape = xmlArg.getAttribute("shape")
        argCategory = xmlArg.getAttribute("category")

        # Update argument type: strip a trailing pointer marker first
        if argType.endswith("*"):
            argType = argType[:-1]
        # Inputs/outputs of a generic TOSA type are passed as tensors
        if argCategory in ("input", "output") and argType in tosaTensorTypes:
            argType = "tosa_tensor_t"
            argShape = ""
        argType = tosaTypeMap.get(argType, argType)

        if argShape.startswith("["):
            # Add a length argument for arrays with unknown compile-time size
            if not argShape[1:-1].isnumeric():
                argShape = "[]"
                arguments.append(
                    {
                        "name": f"{argName}_len",
                        "type": "int32_t",
                        "shape": "",
                        "category": "",
                    }
                )
        else:
            # Anything that is not a bracketed array shape is dropped
            argShape = ""

        # Append argument
        arguments.append(
            {
                "name": argName,
                "type": argType,
                "shape": argShape,
                "category": argCategory,
            }
        )
    return arguments
+
+
def clangFormat(filename):
    """
    Reformat ``filename`` in place with ``clang-format -i``.

    Standard output of the tool is discarded. ``check_call`` raises
    ``subprocess.CalledProcessError`` when clang-format exits with a
    non-zero status.
    """
    subprocess.check_call(
        ["clang-format", "-i", filename], stdout=subprocess.DEVNULL
    )
+
+
def getSerializeArgs(attributeDefPath=None):
    """
    Parse attribute.def and return the Serialization library attribute table.

    The file is expected to contain entries of the form
    ``DEF_ATTRIBUTE(Name, count, dType, SV, argName, ...)``, possibly spread
    over several lines. Everything before the first line that starts with
    ``DEF_ATTRIBUTE(`` is treated as preamble and skipped.

    Args:
        attributeDefPath: Path of the attribute.def file. Defaults to the
            copy shipped in ``thirdparty/serialization_lib`` relative to the
            current working directory.

    Returns:
        A dict mapping each Serialization operator name to a list of
        ``{"name", "dType", "SV"}`` dicts, one per attribute argument.
    """
    if attributeDefPath is None:
        attributeDefPath = "../../thirdparty/serialization_lib/include/attribute.def"
    marker = "DEF_ATTRIBUTE("

    serializeArgs = {}
    with open(attributeDefPath) as file:
        preamble = True
        # Text of the attribute currently being read, or None between entries.
        pending = None
        for rawLine in file:
            if preamble:
                if not rawLine.startswith(marker):
                    continue
                preamble = False
            line = rawLine.strip()
            if pending is None:
                if not line.startswith(marker):
                    continue
                pending = line[len(marker):]
            else:
                # Blank continuation lines simply add nothing.
                pending += " " + line
            if ")" not in pending:
                continue
            # The entry is complete: fields are Name, count, then
            # (dType, SV, argName) triples. Handling the closing parenthesis
            # here also covers entries that end on their header line.
            fields = [field.strip() for field in pending.partition(")")[0].split(",")]
            pending = None
            argFields = fields[2:]
            serializeArgs[fields[0]] = [
                {
                    "name": argFields[i + 2],
                    "dType": argFields[i],
                    "SV": argFields[i + 1],
                }
                for i in range(0, len(argFields) - 2, 3)
            ]
    return serializeArgs
+
+
def renderTemplate(environment, dataTypes, operators, template, outfile):
    """
    Render ``template`` with the given data types and operators into
    ``outfile`` (UTF-8), report the file on stdout, then run clang-format
    on it.

    ``environment`` is accepted for signature compatibility; this function
    does not read it.
    """
    rendered = template.render(dataTypes=dataTypes, operators=operators)
    with open(outfile, mode="w", encoding="utf-8") as stream:
        stream.write(rendered)
        print(f"Created {outfile}")

    # Format only after the file has been closed and fully written.
    clangFormat(outfile)
+
+
def generate(environment, dataTypes, operators):
    """
    Generate the reference model operator API sources.

    Renders ``operators_h.j2`` to ``reference_model/include/operators.h`` and
    then ``operators_cc.j2`` to ``reference_model/src/operators.cc``, both
    relative to ``../..`` of the current working directory.
    """
    targets = (
        ("operators_h.j2", ("include", "operators.h")),
        ("operators_cc.j2", ("src", "operators.cc")),
    )
    for templateName, subPath in targets:
        template = environment.get_template(templateName)
        outfile = os.path.join("..", "..", "reference_model", *subPath)
        renderTemplate(environment, dataTypes, operators, template, outfile)
+
+
def getSerializeOpTypeMap():
    """
    Utility function for generating the map used in getSerializeOpType().

    Serialization attribute names are converted from CamelCase to snake_case
    and matched as substrings against every operator name in tosa.xml. The
    matched name is converted back to CamelCase and stored for the operator.
    """
    import re

    allSerializeArgs = getSerializeArgs()
    snakeNames = [
        re.sub(r"(?<!^)(?=[A-Z])", "_", name).lower() for name in allSerializeArgs
    ]
    # Longest candidates first.
    snakeNames.sort(key=len, reverse=True)

    specXml = minidom.parse("../../thirdparty/specification/tosa.xml")
    opNames = [
        opXml.getElementsByTagName("name")[0].firstChild.data.lower()
        for opXml in specXml.getElementsByTagName("operator")
    ]

    opTypeMap = {}
    for opName in opNames:
        for snakeName in snakeNames:
            if snakeName not in opName:
                continue
            # No early exit: when several candidates match, the last one
            # visited (the shortest) is the one that remains in the map.
            opTypeMap[opName] = "".join(part.title() for part in snakeName.split("_"))
    return opTypeMap
+
+
if __name__ == "__main__":
    # Keep the module-level name ``tosaXml``: code elsewhere in this file may
    # look it up as a global rather than receive it as an argument.
    tosaXml = minidom.parse("../../thirdparty/specification/tosa.xml")
    templateLoader = FileSystemLoader("templates/")
    environment = Environment(loader=templateLoader)
    # Data types are collected before operators, then both files are rendered.
    generate(environment, getTosaDataTypes(tosaXml), getOperators(tosaXml))