Additional variants of Softmax microkernels

PiperOrigin-RevId: 284483874
diff --git a/tools/ b/tools/
new file mode 100755
index 0000000..46982ed
--- /dev/null
+++ b/tools/
@@ -0,0 +1,148 @@
+#!/usr/bin/env python
+# Copyright 2019 Google LLC
+# This source code is licensed under the BSD-style license found in the
+# LICENSE file in the root directory of this source tree.
+import argparse
+import codecs
+import math
+import os
+import re
+import sys
+import yaml
+sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
+import xngen
+import xnncommon
+# Command-line interface: the YAML specification path and the path of the
+# generated C++ source are both mandatory.
+parser = argparse.ArgumentParser(
+    description="RAddExpMinusMax microkernel test generator",
+)
+parser.add_argument(
+    "-s",
+    "--spec",
+    required=True,
+    metavar="FILE",
+    help="Specification (YAML) file",
+)
+parser.add_argument(
+    "-o",
+    "--output",
+    required=True,
+    metavar="FILE",
+    help="Output (C++ source) file",
+)
+def split_ukernel_name(name):
+  """Extracts the tile size and target from a RAddExpMinusMax micro-kernel name.
+  Args:
+    name: C name of the micro-kernel function, of the form
+          xnn_<f16|f32>_raddexpminusmax_ukernel__<target>_x<tile>[_acc<n>].
+  Returns:
+    An (elements_tile, arch, isa) tuple: the integer parsed from the
+    "_x<tile>" part of the name, followed by the two values that
+    xnncommon.parse_target_name returns for <target>.
+  Raises:
+    ValueError: if name does not match the expected pattern.
+  """
+  match = re.match(r"^xnn_(f16|f32)_raddexpminusmax_ukernel__(.+)_x(\d+)(_acc(\d+))?$", name)
+  if match is None:
+    raise ValueError("Unexpected microkernel name: " + name)
+  # Capture groups: 1 = datatype, 2 = target, 3 = tile size, 5 = "_acc" count.
+  elements_tile = int(match.group(3))
+  # NOTE(review): the call arguments were truncated in this copy of the patch;
+  # passing the target capture group is a reconstruction -- confirm.
+  arch, isa = xnncommon.parse_target_name(match.group(2))
+  return elements_tile, arch, isa
+# Template for the generated gtest cases. generate_test_cases passes it to
+# xngen.preprocess together with TEST_NAME, TEST_FUNCTION, DATATYPE,
+# ELEMENTS_TILE and ISA_CHECK.
+# NOTE(review): the assignment, the closing braces of the first and last TEST
+# bodies, and the "$if ELEMENTS_TILE > 1:" guard were missing from this copy of
+# the patch. The guard is reconstructed from the indentation of the
+# elements_div/elements_lt tests -- confirm against the upstream file.
+RADDEXPMINUSMAX_TEST_TEMPLATE = """\
+TEST(${TEST_NAME}, elements_eq_${ELEMENTS_TILE}) {
+  $if ISA_CHECK:
+    ${ISA_CHECK};
+  RAddExpMinusMaxMicrokernelTester()
+    .elements(${ELEMENTS_TILE})
+    .Test(${TEST_FUNCTION});
+}
+$if ELEMENTS_TILE > 1:
+  TEST(${TEST_NAME}, elements_div_${ELEMENTS_TILE}) {
+    $if ISA_CHECK:
+      ${ISA_CHECK};
+    for (size_t elements = ${ELEMENTS_TILE*2}; elements < ${ELEMENTS_TILE*10}; elements += ${ELEMENTS_TILE}) {
+      RAddExpMinusMaxMicrokernelTester()
+        .elements(elements)
+        .Test(${TEST_FUNCTION});
+    }
+  }
+  TEST(${TEST_NAME}, elements_lt_${ELEMENTS_TILE}) {
+    $if ISA_CHECK:
+      ${ISA_CHECK};
+    for (size_t elements = 1; elements < ${ELEMENTS_TILE}; elements++) {
+      RAddExpMinusMaxMicrokernelTester()
+        .elements(elements)
+        .Test(${TEST_FUNCTION});
+    }
+  }
+TEST(${TEST_NAME}, elements_gt_${ELEMENTS_TILE}) {
+  $if ISA_CHECK:
+    ${ISA_CHECK};
+  for (size_t elements = ${ELEMENTS_TILE+1}; elements < ${10 if ELEMENTS_TILE == 1 else ELEMENTS_TILE*2}; elements++) {
+    RAddExpMinusMaxMicrokernelTester()
+      .elements(elements)
+      .Test(${TEST_FUNCTION});
+  }
+}
+"""
+def generate_test_cases(ukernel, elements_tile, isa):
+  """Renders the unit tests for one RAddExpMinusMax micro-kernel.
+  Args:
+    ukernel: C name of the micro-kernel function.
+    elements_tile: Number of batch elements processed per one iteration of the
+                   inner loop of the micro-kernel.
+    isa: instruction set required to run the micro-kernel. Generated unit test
+         will skip execution if the host processor doesn't support this ISA.
+  Returns:
+    Code for the test case.
+  """
+  # Everything after the first underscore becomes the basis of the test name.
+  _, name_tail = ukernel.split("_", 1)
+  # The second underscore-delimited field is handed to the template as DATATYPE.
+  _, datatype, _ = ukernel.split("_", 2)
+  suite_name = name_tail.upper().replace("UKERNEL_", "")
+  isa_check = xnncommon.generate_isa_check_macro(isa)
+  template_vars = {
+      "TEST_FUNCTION": ukernel,
+      "TEST_NAME": suite_name,
+      "DATATYPE": datatype,
+      "ELEMENTS_TILE": elements_tile,
+      "ISA_CHECK": isa_check,
+  }
+  return xngen.preprocess(RADDEXPMINUSMAX_TEST_TEMPLATE, template_vars)
+def main(args):
+  """Generates the C++ unit test source described by a YAML specification.
+  Reads the list of micro-kernel entries from the --spec file, renders the test
+  cases for each entry, and writes the concatenated result to the --output
+  file.
+  Args:
+    args: command-line arguments without the program name; must supply
+          -s/--spec and -o/--output.
+  Raises:
+    ValueError: if the top-level YAML value is not a list, or if a micro-kernel
+                name is rejected by split_ukernel_name.
+  """
+  options = parser.parse_args(args)
+  # NOTE(review): the callee of both "with" statements was missing from this
+  # copy of the patch; codecs.open on the parsed --spec/--output paths is a
+  # reconstruction based on the module's codecs import -- confirm.
+  with codecs.open(options.spec, "r", encoding="utf-8") as spec_file:
+    spec_yaml = yaml.safe_load(spec_file)
+    if not isinstance(spec_yaml, list):
+      raise ValueError("expected a list of micro-kernels in the spec")
+    # File header of the generated source; records which spec and which
+    # generator script produced it.
+    tests = """\
+// Copyright 2019 Google LLC
+// This source code is licensed under the BSD-style license found in the
+// LICENSE file in the root directory of this source tree.
+// Auto-generated file. Do not edit!
+//   Specification: {specification}
+//   Generator: {generator}
+#include <gtest/gtest.h>
+#include <xnnpack/common.h>
+#include <xnnpack/isa-checks.h>
+#include <xnnpack/raddexpminusmax.h>
+#include "raddexpminusmax-microkernel-tester.h"
+""".format(specification=options.spec, generator=sys.argv[0])
+    for ukernel_spec in spec_yaml:
+      name = ukernel_spec["name"]
+      elements_tile, arch, isa = split_ukernel_name(name)
+      # specification can override architecture
+      arch = ukernel_spec.get("arch", arch)
+      test_case = generate_test_cases(name, elements_tile, isa)
+      tests += "\n\n" + xnncommon.postprocess_test_case(test_case, arch, isa)
+    with codecs.open(options.output, "w", encoding="utf-8") as output_file:
+      output_file.write(tests)
+# Script entry point: forward the command-line arguments, minus the program
+# name, to main().
+if __name__ == "__main__":
+  main(sys.argv[1:])