Skip to content

Commit

Permalink
add onnx-subgraph tool baseline code
Browse files Browse the repository at this point in the history
  • Loading branch information
chenyx113 committed Jan 18, 2025
1 parent 0eeb22c commit a5ec1e7
Show file tree
Hide file tree
Showing 24 changed files with 13,418 additions and 0 deletions.
Binary file added compiler/onnx-subgraph/.Readme.md.swp
Binary file not shown.
80 changes: 80 additions & 0 deletions compiler/onnx-subgraph/CMakeLists.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,80 @@
# cmake version dependency
# NOTE(review): FindPython3 (used below) was introduced in CMake 3.12,
# so 3.10 was too low a minimum for this file.
cmake_minimum_required(VERSION 3.12)

project(onnx-subgraph-parser LANGUAGES CXX)

# Default to a Debug build only when the user has not chosen one;
# never clobber an explicit -DCMAKE_BUILD_TYPE.
if(NOT CMAKE_BUILD_TYPE)
  set(CMAKE_BUILD_TYPE "Debug")
endif()
set(CMAKE_CXX_FLAGS_DEBUG "$ENV{CXXFLAGS} -O0 -Wall -g2 -ggdb")
set(CMAKE_CXX_FLAGS_RELEASE "$ENV{CXXFLAGS} -O3 -Wall")
set(CMAKE_CXX_STANDARD 17)
set(CMAKE_CXX_STANDARD_REQUIRED ON)

# Generate C++ sources for the ONNX protobuf schema into the binary dir.
find_package(Protobuf REQUIRED)
protobuf_generate_cpp(PROTO_SRCS PROTO_HDRS onnx.proto)

# Embedded Python is linked into the tool; require >= 3.8 to match the
# unit-test requirement that the old FindPythonInterp check enforced.
find_package(Python3 3.8 COMPONENTS Interpreter Development REQUIRED)

# NOTE(review): GLOB does not notice newly added files until the next
# re-configure; an explicit source list would be safer.
file(GLOB SOURCES "lib/*.cpp" "lib/Device/*.cpp")

add_library(onnx-subgraph-parser STATIC ${SOURCES} ${PROTO_SRCS})
# Target-scoped include paths instead of directory-wide include_directories().
target_include_directories(onnx-subgraph-parser PUBLIC
  ${CMAKE_CURRENT_BINARY_DIR}                  # generated onnx.pb.h
  ${CMAKE_CURRENT_SOURCE_DIR}/include
  ${CMAKE_CURRENT_SOURCE_DIR}/include/Device
  ${CMAKE_CURRENT_SOURCE_DIR}/include/json
)
# Imported targets carry their include dirs and transitive dependencies.
target_link_libraries(onnx-subgraph-parser PUBLIC
  protobuf::libprotobuf
  Python3::Python
)

add_executable(onnx-subgraph main.cpp)
target_link_libraries(onnx-subgraph PRIVATE onnx-subgraph-parser)

# Python helper scripts and fixtures copied beside the binary and installed.
set(ONNX_SUBGRAPH_FILES
  extract_onnx_lib.py
  extract_onnx.py
  single_vs_multiple_onnx.py
  quant.py
  model_inference.py
  model_inference_multiple_output.py
  onnx_subgraph_ut.py
  test.onnx
  config.json
)

foreach(script IN LISTS ONNX_SUBGRAPH_FILES)
  set(script_src "${CMAKE_CURRENT_SOURCE_DIR}/${script}")
  set(script_bin "${CMAKE_CURRENT_BINARY_DIR}/${script}")

  # Copy rule re-runs only when the source file changes.
  add_custom_command(OUTPUT "${script_bin}"
    COMMAND ${CMAKE_COMMAND} -E copy "${script_src}" "${script_bin}"
    DEPENDS "${script_src}"
    COMMENT "Generate ${script_bin}"
    VERBATIM
  )
  add_custom_target("${script}_target" ALL DEPENDS "${script_bin}")

  install(FILES "${script_bin}"
    PERMISSIONS OWNER_WRITE OWNER_READ OWNER_EXECUTE
                GROUP_READ GROUP_EXECUTE
                WORLD_READ WORLD_EXECUTE
    DESTINATION bin)
endforeach()

# Python3 was already located (REQUIRED) above; reuse it here instead of
# the deprecated FindPythonInterp module. CMake expands the imported
# Python3::Interpreter target to the interpreter path.
add_test(
  NAME onnx-subgraph_unittest
  COMMAND Python3::Interpreter -m unittest
  WORKING_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR}
)
48 changes: 48 additions & 0 deletions compiler/onnx-subgraph/Readme.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,48 @@
## onnx_autosubgraphs
In this project we support automatic subgraph partitioning of ONNX AI models. A model can be split by model size, operators, etc. This helps greatly with on-device AI acceleration, and has been verified on Rose-P NPU and Qualcomm DSP.

### OS environment
1. ubuntu >=20.04
2. GCC >= 9.4.0
3. cmake >= 3.10
4. python >= 3.8
5. apt-get install libprotobuf-dev protobuf-compiler

### Python packages
onnx 1.16.0
onnxruntime 1.18.1
onnxsim 0.4.36
torch 2.3.1

### Pre-steps
1. prepare the target onnx AI model, we use test.onnx for example
2. use onnxsim to remove the complex structures before executing onnx-subgraph

### building the onnx-subgraph
1. cd onnx-subgraph
2. mkdir build && cd build
3. cmake .. && make
4. onnx-subgraph will be generated at ./build

### Parse the onnx model
1. edit the config.json as your needs
-> NPU_supported_ops mean operators that can be supported by NPU
-> CPU_supported_ops mean operators that can be supported by CPU
-> In case of operators supported by both CPU and NPU, we can describe the performance data at "performance_data"
-> "max_subgraph_size": can set the max size of subgraph, it works only if NPU_supported_ops is NULL

2. ./onnx-subgraph --onnx=test.onnx
after parse done, subgraphs_ios.txt will be generated
### Split the onnx model to subgraphs
1. edit the config path and model file path at extract_onnx.py

2. python extract_onnx.py, after extraction done, the subgraphs will be saved at './subgraphs'

### Verify the subgraphs inference with original model file
1. edit the model path, subgraph path and config path in single_vs_multiple_onnx.py

2. edit the input shape and name of onnx model in single_vs_multiple_onnx.py

3. compare the MSE of original inference result and subgraphs inference result
python single_vs_multiple_onnx.py
13 changes: 13 additions & 0 deletions compiler/onnx-subgraph/config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,13 @@
{
"NPU_supported_ops": ["Conv", "Reshape", "Transpose", "Add", "ReduceMean", "Sub", "Div", "Mul", "Sigmoid","MatMul"],
"CPU_supported_ops": ["Sub", "Pow", "ReduceMean", "Add", "Sqrt", "Div","Transpose", "Gather", "MatMul", "Mul", "Softmax", "Erf", "Gemm", "Conv", "Reshape",
"Sin", "Where", "ConstantOfShape", "Cast", "Sigmoid", "Cos", "Expand", "Slice", "Unsqueeze"],
"performance_data": [
{"name":"Conv","CPU_time": 0.1, "NPU_time": 0.05},
{"name":"Mul", "CPU_time": 0.15, "NPU_time": 0.07}
],
"hardware_limits": {
"max_subgraph_size": 60024.0,
"max_subgraphs": 5
}
}
33 changes: 33 additions & 0 deletions compiler/onnx-subgraph/extract_onnx.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@

# Copyright (c) 2024 Samsung Electronics Co., Ltd. All Rights Reserved

#

# Licensed under the Apache License, Version 2.0 (the "License");

# you may not use this file except in compliance with the License.

# You may obtain a copy of the License at

#

# http://www.apache.org/licenses/LICENSE-2.0

#

# Unless required by applicable law or agreed to in writing, software

# distributed under the License is distributed on an "AS IS" BASIS,

# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

# See the License for the specific language governing permissions and

# limitations under the License.
import extract_onnx_lib
# NOTE(review): torch, onnx and re are imported but not referenced in this
# script; presumably kept for interactive use — confirm before removing.
import torch
import onnx
import re
# Entry point: split the ONNX model into subgraphs using the subgraph I/O
# boundaries listed in subgraphs_ios.txt (produced by the onnx-subgraph
# C++ parser).
print("python executed")
# NOTE(review): model path is hard-coded; edit to match your model location.
extract_onnx_lib.split_onnx_ios('subgraphs_ios.txt','net/vit_large_simplify.onnx')

216 changes: 216 additions & 0 deletions compiler/onnx-subgraph/extract_onnx_lib.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,216 @@

# Copyright (c) 2024 Samsung Electronics Co., Ltd. All Rights Reserved

#

# Licensed under the Apache License, Version 2.0 (the "License");

# you may not use this file except in compliance with the License.

# You may obtain a copy of the License at

#

# http://www.apache.org/licenses/LICENSE-2.0

#

# Unless required by applicable law or agreed to in writing, software

# distributed under the License is distributed on an "AS IS" BASIS,

# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

# See the License for the specific language governing permissions and

# limitations under the License.
import torch
import onnx
import re
import os
def splitinstruction(instr):
    """Parse an extract-model command line into tensor-name lists.

    The line has the shape:
        ... --input-name "a;b" --output-name "c" --input-shape "..."

    Returns:
        (input_names, output_names) — each a list of tensor names obtained
        by splitting the quoted payloads on ';'.
    """
    # Cut the line at the three option markers; the quoted payloads land
    # between the delimiters.
    pieces = re.split('--input-name \"|\" --output-name \"|\" --input-shape \"', instr)
    # Drop the text before --input-name and the tail after --input-shape.
    pieces = pieces[1:-1]
    input_names = pieces[0].split(';')
    output_names = pieces[1].split(';')
    return input_names, output_names
def splitsubgraph_ios(iofile):
    """Parse one subgraph description line into (inputs, outputs, device).

    The line has the shape:
        <DEV>subgraph<N>: ...--input-name a;b;--output-name c;

    Returns:
        (input_names, output_names, device) where device is the text
        before the literal 'subgraph' (e.g. 'CPU' or 'NPU').
    """
    parts = re.split('--input-name |;--output-name ', iofile)
    # Everything before 'subgraph' in the header names the device type.
    device = parts[0].split('subgraph')[0]
    input_names = parts[1].split(';')
    # The outputs end with a trailing ';' which leaves an empty/newline
    # tail entry after split — drop it.
    output_names = parts[2].split(';')[:-1]
    return input_names, output_names, device

def split_onnx(instrfile, type):
    """Extract one ONNX subgraph per instruction line in `instrfile`.

    Each line is parsed by splitinstruction(); lines with non-empty input
    and output name lists are cut out of the source model with
    onnx.utils.extract_model.

    NOTE(review): the source model path is hard-coded below — confirm it
    matches your local layout before use.
    """
    print("module found")
    source_model = 'net/diffusion_model_fp32_with_shape.onnx'
    command_file = open(instrfile, "r")
    subgraph_index = 0
    for command in command_file.readlines():
        input_names, output_names = splitinstruction(command)
        destination = ('diffusion_model_fp32_subgraphs_' + type + '/' + type
                       + 'subgraph' + str(subgraph_index) + '.onnx')
        subgraph_index += 1
        # Skip blank instruction lines (both name lists parse to ['']).
        if input_names != [''] and output_names != ['']:
            onnx.utils.extract_model(source_model, destination, input_names, output_names)
    command_file.close()

def split_onnx_ios(instrfile, input_path ='net/generation_model_simplify.onnx', out_folder = 'subgraphs/'):
    """Split `input_path` into per-device subgraphs listed in `instrfile`.

    Each instruction line (parsed by splitsubgraph_ios) yields one
    subgraph saved under `<out_folder><DEV>/<DEV>subgraph<N>.onnx`, with
    independent counters for CPU and non-CPU subgraphs.

    NOTE(review): the source model is re-saved in place after promoting
    graph outputs to value_info — this mutates the input file on every
    run; confirm that is intended.
    """
    if not os.path.exists(input_path):
        print(input_path + " not exist")
        return

    model = onnx.load(input_path)
    onnx.checker.check_model(input_path)
    # Expose graph outputs as value_info so extract_model can cut at them.
    for graph_output in model.graph.output:
        model.graph.value_info.append(graph_output)
    onnx.save(model, input_path)

    instruction_file = open(instrfile, "r")
    instruction_lines = instruction_file.readlines()
    cpu_total = 0
    npu_total = 0
    current = 0
    if not os.path.exists(out_folder):
        os.makedirs(out_folder)
    for instruction in instruction_lines:
        input_names, output_names, device = splitsubgraph_ios(instruction)
        # CPU and non-CPU subgraphs are numbered independently.
        if device == 'CPU':
            current = cpu_total
            cpu_total += 1
        else:
            current = npu_total
            npu_total += 1
        device_folder = out_folder + device + '/'
        if not os.path.exists(device_folder):
            os.makedirs(device_folder)
        destination = device_folder + device + 'subgraph' + str(current) + '.onnx'
        # Skip blank instruction lines (both name lists parse to ['']).
        if input_names != [''] and output_names != ['']:
            onnx.utils.extract_model(input_path, destination, input_names, output_names)
            print("succeed", current)
            current = current + 1
    instruction_file.close()

def rename_node_io(file_path):
    """Load an ONNX model and strip '/' and '.' from every symbol name.

    Sanitizes the names of graph inputs, outputs, value_info entries,
    initializers, nodes, and each node's input/output references so they
    stay consistent with one another.

    Returns:
        The modified onnx model object (not saved to disk).
    """
    def sanitize(name):
        # Remove path-like separators that some toolchains reject.
        return re.sub(r'[/.]', '', name)

    model = onnx.load(file_path)
    graph = model.graph
    for value in graph.input:
        value.name = sanitize(value.name)
    for value in graph.output:
        value.name = sanitize(value.name)
    for value in graph.value_info:
        value.name = sanitize(value.name)
    for value in graph.initializer:
        value.name = sanitize(value.name)
    for node in graph.node:
        node.name = sanitize(node.name)
        # Repeated proto fields are updated element-by-element in place.
        for idx in range(len(node.input)):
            node.input[idx] = sanitize(node.input[idx])
        for idx in range(len(node.output)):
            node.output[idx] = sanitize(node.output[idx])
    return model

def rename_subgraph_node_ios(in_file_path, out_file_path):
    """Sanitize symbol names in every model found in `in_file_path`.

    Runs rename_node_io on each file in the input directory and saves
    the cleaned model under the same filename in `out_file_path`.
    """
    for filename in os.listdir(in_file_path):
        cleaned_model = rename_node_io(in_file_path + '/' + filename)
        destination = out_file_path + '/' + filename
        onnx.save(cleaned_model, destination)
        print(f'Modified model saved to {destination}')


def print_model(file_path):
    """Print the number of nodes in the model's graph."""
    graph = onnx.load(file_path).graph
    node_total = 0
    for _ in graph.node:
        node_total += 1
    print(node_total)

# Topologically order subgraphs by data dependency and rewrite the list.
#
# Reads subgraph I/O descriptions from ifile_path (one per line, parsed by
# splitsubgraph_ios), assigns each subgraph an execution "order" layer such
# that a subgraph comes after every subgraph producing one of its inputs,
# and writes the re-numbered lines to ofile_path.
#
# NOTE(review): this is an iterative layered topological sort; it assumes
# the dependency graph is acyclic — a cycle would loop forever. Confirm
# the upstream parser guarantees acyclic subgraph partitions.
def sort(ifile_path,ofile_path):
finished_flag = 0
sort_count = 0
# --- Phase 1: read every subgraph's inputs, outputs and device type. ---
f1=open(ifile_path,"r")
lines=f1.readlines()
graphs_inputs = {}
graphs_outputs = {}
order_Subgraphs = {}
issort_Subgraphs = {}
TYPE = {}
index = 0
for line in lines:
input_names, output_names,type = splitsubgraph_ios(line)
graphs_inputs[index] = input_names
graphs_outputs[index] = output_names
TYPE[index] = type
index = index + 1
graph_num = index
f1.close()
# --- Phase 2: repeatedly peel off the "ready" layer until all sorted. ---
while finished_flag == 0:
finished_flag = 1
if(sort_count) == 0:
# First pass: layer 0 = subgraphs whose inputs are produced by no
# other subgraph (i.e. fed directly by the model's inputs).
for i in range(graph_num):
find_flag = 0
for g_input in graphs_inputs[i]:
for j in range(graph_num):
if g_input in graphs_outputs[j]:
find_flag = 1
break
if find_flag == 1:
break
if find_flag == 0:
order_Subgraphs[i] = 0
issort_Subgraphs[i] = 1
else:
# Depends on another subgraph — provisionally next layer,
# and force another sweep.
order_Subgraphs[i] = 1
issort_Subgraphs[i] = 0
finished_flag = 0
else:
# Later passes: a subgraph is ready when every producer of its
# inputs has already been placed in an earlier layer.
for i in range(graph_num):
find_flag = 0
if issort_Subgraphs[i] == 1:
continue
for g_input in graphs_inputs[i]:
for j in range(graph_num):
if g_input in graphs_outputs[j]:
if issort_Subgraphs[j] == 0:
find_flag = 1
break
if find_flag == 1:
break
if find_flag == 0:
order_Subgraphs[i] = sort_count
issort_Subgraphs[i] = 1
else:
order_Subgraphs[i] = sort_count + 1
issort_Subgraphs[i] = 0
finished_flag = 0
# After the last index, commit everything placed in this layer
# so the next sweep sees it as sorted.
if i == graph_num - 1:
for j in range(graph_num):
if order_Subgraphs[j]==sort_count:
issort_Subgraphs[j] = 1
print(order_Subgraphs)
print(issort_Subgraphs)
sort_count = sort_count + 1
# --- Phase 3: rewrite the lines with per-device numbering and order. ---
f2 = open(ofile_path,"w")
count_cpu = 0
count_npu = 0
for i in range(graph_num):
content = ""
if TYPE[i] == 'CPU':
content = "CPUsubgraph" + str(count_cpu) + ": order" + str(order_Subgraphs[i]) + "--input-name "
count_cpu = count_cpu + 1
if TYPE[i] == 'NPU':
content = "NPUsubgraph" + str(count_npu) + ": order" + str(order_Subgraphs[i]) + "--input-name "
count_npu = count_npu + 1
for graph_input in graphs_inputs[i]:
content = content + graph_input + ";"
content = content + "--output-name "
for graph_output in graphs_outputs[i]:
content = content + graph_output + ";"
content = content + "\n"
print(content)
f2.write(content)
f2.close()
Loading

0 comments on commit a5ec1e7

Please sign in to comment.