Add TOSA VGF-encapsulated compilation target for ahead-of-time (AoT) compilation.

robell · robell · commit 6730dd682022 · 2025-04-29T09:32:07.000Z
- Add a VgfQuantizer (same as TOSAQuantizer)
- Add a VgfBackend and VgfPartitioner
- Requires the yet-to-be-released converter-backend tool

Signed-off-by: Rob Elliott <robert.elliott@arm.com>
Change-Id: I764c32c33c503eb44200e9a7d98caa8fae8a4882
diff --git a/backends/arm/TARGETS b/backends/arm/TARGETS
@@ -7,6 +7,8 @@ python_library(
         "ethosu_partitioner.py",
         "tosa_backend.py",
         "tosa_partitioner.py",
+        "vgf_backend.py",
+        "vgf_partitioner.py",
     ],
     deps = [
         ":arm_backend",
diff --git a/backends/arm/arm_backend.py b/backends/arm/arm_backend.py
@@ -27,6 +27,23 @@ def __init__(self):
         self.tosa_spec = None
         self.input_order = None
 
+    def vgf_compile_spec(
+        self,
+        compiler_flags: Optional[str] = "",
+    ) -> "ArmCompileSpecBuilder":
+        """
+        Generate compile spec for VGF compatible targets
+
+        Args:
+            compiler_flags: Extra compiler flags for converter_backend
+        """
+        self.output_format = "vgf"
+        self.compiler_flags = [
+            compiler_flags,
+        ]
+        self.tosa_spec = TosaSpecification.create_from_string("TOSA-0.80+MI")
+        return self
+
     def ethosu_compile_spec(
         self,
         target: str,
@@ -126,13 +143,16 @@ def build(self) -> List[CompileSpec]:
         # Always supply a TOSA version
         self.compile_spec = [CompileSpec("tosa_spec", str(self.tosa_spec).encode())]
 
-        if self.output_format == "vela":
-            self.compile_spec += [
-                CompileSpec("output_format", "vela".encode()),
-                CompileSpec("compile_flags", " ".join(self.compiler_flags).encode()),
-            ]
-        elif self.output_format == "tosa":
-            self.compile_spec.append(CompileSpec("output_format", "tosa".encode()))
+        # Add compile flags, these are backend specific, refer to the backend
+        # documentation.
+        self.compile_spec += [
+            CompileSpec("compile_flags", " ".join(self.compiler_flags).encode()),
+        ]
+
+        # encode output format
+        self.compile_spec.append(
+            CompileSpec("output_format", self.output_format.encode())
+        )
 
         if self.path_for_intermediates is not None:
             self.compile_spec.append(
@@ -168,6 +188,13 @@ def is_ethosu(compile_spec: List[CompileSpec]) -> bool:
     return False
 
 
+def is_vgf(compile_spec: List[CompileSpec]) -> bool:
+    for spec in compile_spec:
+        if spec.key == "output_format":
+            return spec.value.decode() == "vgf"
+    return False
+
+
 def get_tosa_spec(compile_spec: List[CompileSpec]) -> TosaSpecification:
     for spec in compile_spec:
         if spec.key == "tosa_spec":
diff --git a/backends/arm/ethosu_backend.py b/backends/arm/ethosu_backend.py
@@ -35,7 +35,7 @@ class EthosUBackend(BackendDetails):
 
     @staticmethod
     def _compile_tosa_flatbuffer(
-        tosa_flatbuffer: bytes, compile_spec: list[CompileSpec]
+        tosa_flatbuffer: bytes, compile_spec: List[CompileSpec]
     ) -> bytes:
         """
         Static helper method to do the compilation of the TOSA flatbuffer
diff --git a/backends/arm/quantizer/arm_quantizer.py b/backends/arm/quantizer/arm_quantizer.py
@@ -27,6 +27,7 @@
 from executorch.backends.arm.arm_backend import (
     get_tosa_spec,
     is_ethosu,
+    is_vgf,
 )  # usort: skip
 from executorch.exir.backend.compile_spec_schema import CompileSpec
 from torch.ao.quantization.fake_quantize import (
@@ -52,6 +53,7 @@
 __all__ = [
     "TOSAQuantizer",
     "EthosUQuantizer",
+    "VgfQuantizer",
     "get_symmetric_quantization_config",
 ]
 
@@ -358,3 +360,12 @@ def __init__(self, compile_spec: list[CompileSpec]) -> None:
 
         tosa_spec = get_tosa_spec(compile_spec)
         super().__init__(tosa_spec)
+
+
+class VgfQuantizer(TOSAQuantizer):
+    def __init__(self, compile_spec: list[CompileSpec]) -> None:
+        if not is_vgf(compile_spec):
+            raise RuntimeError("compile spec is not targeting VGF")
+
+        tosa_spec = get_tosa_spec(compile_spec)
+        super().__init__(tosa_spec)
diff --git a/backends/arm/tosa_backend.py b/backends/arm/tosa_backend.py
@@ -35,15 +35,15 @@
 logger = logging.getLogger(__name__)
 
 
-def _get_first_delegation_tag(graph_module) -> str | None:
-    """Get the first delegation tag from the graph_module or return None."""
+def arm_get_first_delegation_tag(graph_module) -> str:
+    """Get the first delegation tag from the graph_module or return empty string."""
     for node in graph_module.graph.nodes:
         tag = node.meta.get("delegation_tag")
         if tag:
             return tag
 
     logger.debug("No delegation tag found in partition.")
-    return None
+    return ""
 
 
 @final
@@ -136,7 +136,7 @@ def preprocess(  # noqa: C901
                 )
 
         if artifact_path:
-            tag = _get_first_delegation_tag(graph_module)
+            tag = arm_get_first_delegation_tag(graph_module)
             dbg_tosa_dump(
                 tosa_graph,
                 artifact_path,
diff --git a/backends/arm/vgf_backend.py b/backends/arm/vgf_backend.py
@@ -0,0 +1,126 @@
+# Copyright 2025 Arm Limited and/or its affiliates.
+#
+# This source code is licensed under the BSD-style license found in the
+# LICENSE file in the root directory of this source tree.
+
+# pyre-unsafe
+
+#
+# Main implementation of the AoT flow to partition and preprocess for VGF
+# target backends. This flow converts via TOSA to an encoding of TOSA known as
+# VGF. This form is used where the final JIT compile is performed on target
+# (in the runtime delegate's executorch::runtime::BackendInterface::init).
+#
+
+import logging
+import os
+import subprocess
+import tempfile
+from typing import final, List
+
+from executorch.backends.arm.tosa_backend import (
+    arm_get_first_delegation_tag,
+    TOSABackend,
+)
+from executorch.exir.backend.backend_details import BackendDetails, PreprocessResult
+from executorch.exir.backend.compile_spec_schema import CompileSpec
+from torch.export.exported_program import ExportedProgram
+
+# debug functionality
+logger = logging.getLogger(__name__)
+
+
+@final
+class VgfBackend(BackendDetails):
+    """
+    BackendDetails subclass for delegation to VGF compatible devices. This enables
+    encapsulated TOSA on target device and JIT compilation on suitable platforms.
+    """
+
+    @staticmethod
+    def _compile_tosa_flatbuffer(
+        tosa_flatbuffer: bytes,
+        compile_spec: List[CompileSpec],
+        tag_name: str = "",
+    ) -> bytes:
+        """
+        Static helper method to do the compilation of the TOSA flatbuffer
+        representation to a target specific binary stream.
+        """
+        compile_flags = []
+        artifact_path = None
+        for spec in compile_spec:
+            if spec.key == "compile_flags":
+                compile_flags.append(spec.value.decode())
+            if spec.key == "debug_artifact_path":
+                artifact_path = spec.value.decode()
+
+        # Pass on the TOSA flatbuffer to the vgf compiler.
+        binary = vgf_compile(tosa_flatbuffer, compile_flags, artifact_path, tag_name)
+        return binary
+
+    @staticmethod
+    def preprocess(
+        edge_program: ExportedProgram,
+        compile_spec: List[CompileSpec],
+    ) -> PreprocessResult:
+        logger.info(f"{VgfBackend.__name__} preprocess")
+
+        # deduce TOSA compile_spec from VGF compile spec. We get a new
+        # compile spec list, containing only elements relevant for the
+        # TOSABackend.
+        tosa_compile_spec = TOSABackend.filter_tosa_compile_specs(compile_spec)
+
+        # Backends don't allow inheritance, as stated in comments in exir/backend/backend_api.py
+        # ('All backend implementation are final...'), so use composition instead.
+        # preprocess returns the serialized TOSA flatbuffer in .processed_bytes,
+        # which can be passed on to next compilation step.
+        tosa_preprocess = TOSABackend.preprocess(edge_program, tosa_compile_spec)
+
+        tag_name = arm_get_first_delegation_tag(edge_program.graph_module)
+
+        binary = VgfBackend._compile_tosa_flatbuffer(
+            tosa_preprocess.processed_bytes, compile_spec, tag_name
+        )
+
+        return PreprocessResult(processed_bytes=binary)
+
+
+def vgf_compile(
+    tosa_flatbuffer: bytes,
+    compile_flags: List[str],
+    artifact_path: str | None = None,
+    tag_name: str = "",
+):
+    with tempfile.TemporaryDirectory() as tmpdir:
+
+        # We currently write out a flatbuffer as input to the converter
+        tosaname = f"output_{tag_name}.tosa"
+        tosa_path = os.path.join(tmpdir, tosaname)
+        with open(tosa_path, "wb") as f:
+            f.write(tosa_flatbuffer)
+
+        additional_flags = " ".join(compile_flags)
+        vgf_path = tosa_path + ".vgf"
+        conversion_command = (
+            f"converter-backend {additional_flags} -i {tosa_path} -o {vgf_path}"
+        )
+        try:
+            subprocess.run(
+                [conversion_command], shell=True, check=True, capture_output=True
+            )
+        except subprocess.CalledProcessError as process_error:
+            raise RuntimeError(
+                f"Vgf compiler ('{conversion_command}') failed with error:\n \
+                {process_error.stderr.decode()}\n \
+                Stdout:\n{process_error.stdout.decode()}"
+            )
+
+        if artifact_path is not None:
+            logger.info(f"Emitting debug output to: {vgf_path=}")
+            os.makedirs(artifact_path, exist_ok=True)
+            cp = f"cp {vgf_path} {artifact_path}"
+            subprocess.run(cp, shell=True, check=True, capture_output=False)
+
+        vgf_bytes = open(vgf_path, "rb").read()
+        return vgf_bytes
diff --git a/backends/arm/vgf_partitioner.py b/backends/arm/vgf_partitioner.py
@@ -0,0 +1,32 @@
+# Copyright 2025 Arm Limited and/or its affiliates.
+#
+# This source code is licensed under the BSD-style license found in the
+# LICENSE file in the root directory of this source tree.
+
+# pyre-unsafe
+
+from typing import final, List, Optional, Sequence
+
+from executorch.backends.arm.arm_backend import (
+    is_vgf,
+)  # usort: skip
+from executorch.backends.arm.tosa_partitioner import TOSAPartitioner
+from executorch.backends.arm.vgf_backend import VgfBackend
+from executorch.exir.backend.compile_spec_schema import CompileSpec
+from executorch.exir.backend.partitioner import DelegationSpec
+from torch.fx.passes.operator_support import OperatorSupportBase
+
+
+@final
+class VgfPartitioner(TOSAPartitioner):
+    def __init__(
+        self,
+        compile_spec: List[CompileSpec],
+        additional_checks: Optional[Sequence[OperatorSupportBase]] = None,
+    ) -> None:
+        if not is_vgf(compile_spec):
+            raise RuntimeError("compile spec is not targeting Vgf")
+
+        # Override the delegation spec for Vgf
+        self.delegation_spec = DelegationSpec(VgfBackend.__name__, compile_spec)
+        self.additional_checks = additional_checks
diff --git a/examples/arm/aot_arm_compiler.py b/examples/arm/aot_arm_compiler.py
@@ -22,12 +22,14 @@
     get_tosa_spec,
     is_ethosu,
     is_tosa,
+    is_vgf,
 )
 from executorch.backends.arm.ethosu_partitioner import EthosUPartitioner
 from executorch.backends.arm.quantizer import (
     EthosUQuantizer,
     get_symmetric_quantization_config,
     TOSAQuantizer,
+    VgfQuantizer,
 )
 from executorch.backends.arm.tosa_partitioner import TOSAPartitioner
 from executorch.backends.arm.tosa_specification import TosaSpecification
@@ -36,6 +38,8 @@
     GenericModelEvaluator,
     MobileNetV2Evaluator,
 )
+
+from executorch.backends.arm.vgf_partitioner import VgfPartitioner
 from executorch.devtools.backend_debug import get_delegation_info
 from executorch.devtools.bundled_program.config import MethodTestCase, MethodTestSuite
 
@@ -145,6 +149,8 @@ def quantize(
         quantizer = EthosUQuantizer(compile_specs)
     elif is_tosa(compile_specs):
         quantizer = TOSAQuantizer(get_tosa_spec(compile_specs))
+    elif is_vgf(compile_specs):
+        quantizer = VgfQuantizer(compile_specs)
     else:
         raise RuntimeError("Unsupported compilespecs for quantization!")
 
@@ -267,6 +273,7 @@ def forward(self, x: torch.Tensor, y: torch.Tensor):
     "ethos-u85-512",
     "ethos-u85-1024",
     "ethos-u85-2048",
+    "vgf",
     "TOSA",
 ]
 
@@ -324,6 +331,8 @@ def get_compile_spec(
             memory_mode=memory_mode,
             extra_flags="--verbose-operators --verbose-cycle-estimate",
         )
+    elif "vgf" in target:
+        spec_builder = ArmCompileSpecBuilder().vgf_compile_spec()
 
     if intermediates is not None:
         spec_builder.dump_intermediate_artifacts_to(intermediates)
@@ -635,6 +644,8 @@ def to_edge_TOSA_delegate(
         partitioner = EthosUPartitioner(compile_spec)
     elif is_tosa(compile_spec):
         partitioner = TOSAPartitioner(compile_spec)
+    elif is_vgf(compile_spec):
+        partitioner = VgfPartitioner(compile_spec)
     else:
         raise RuntimeError(f"Unhandled compile spec: {compile_spec}")