Summary



info
docker_version kneron/toolchain:v0.25.1
comments
kdp720/input bitwidth int8
kdp720/output bitwidth int8
kdp720/cpu bitwidth int8
kdp720/datapath bitwidth int8
kdp720/weight bitwidth int8
kdp720/ip_eval/fps 671.399
kdp720/ip_eval/ITC(ms) 1.48943 ms
kdp720/ip_eval/C(GOPs) 3.01423e+08
kdp720/ip_eval/RV(mb) 0.702464
kdp720/ip_eval/WV(mb) 0.51776
kdp720/ip_eval/cpu_node N/A
kdp720/bie input.kdp720.scaled.bie
kdp720/onnx input.kdp720.decomposed.onnx
kdp720/nef models_720.nef
gen fx model report model_fx_report.html
gen fx model json model_fx_report.json


kdp720



node node origin type bw in bw out bw weight node backend CFUNC_runtime(ms) CMD_node_idx MAC_cycle MAC_runtime(ms) PFUNC_runtime(ms) RDMA_amount(Byte) RDMA_runtime(ms) SYNC_runtime(ms) WDMA_amount(Byte) WDMA_runtime(ms) Weight_amount(Byte) runtime(ms) in_fmt out_fmt
0 input.1 None NPU None [8] N/A None NaN NaN NaN NaN NaN NaN NaN NaN NaN NaN NaN NaN NaN NaN
1 Conv_0 Conv_0 NPU [8] [16] [8] npu_fusion_node_Conv_0_Clip_3 0 0 61952 0.088503 0 200704 0 0 0 0 1024 0.114877 4W4C8B 1W16C8B
2 Clip_3 Clip_3 NPU [16] [8] [8]
3 Conv_4 Conv_4 NPU [8] [16] [8] npu_fusion_node_Conv_4_Clip_7 0 1 7776 0.011109 0 0 0 0 0 0 1024 0.011109 1W16C8B 1W16C8B
4 Clip_7 Clip_7 NPU [16] [8] [8]
5 Conv_8 Conv_8 NPU [8] [8] [8] Conv_8 0 2 8988 0.01284 0 0 0 0 0 0 1024 0.01284 1W16C8B 1W16C8B
6 Conv_9 Conv_9 NPU [8] [16] [8] npu_fusion_node_Conv_9_Clip_12 0 3 24660 0.035229 0 0 0 0 0 0 6144 0.035229 1W16C8B 1W16C8B
7 Clip_12 Clip_12 NPU [16] [8] [8]
8 Conv_13 Conv_13 NPU [8] [16] [8] npu_fusion_node_Conv_13_Clip_16 0 4 23328 0.033326 0 0 0 0 301056 0 6144 0.072788 1W16C8B 1W16C8B
9 Clip_16 Clip_16 NPU [16] [8] [8]
10 Conv_17 Conv_17 NPU [8] [8] [8] Conv_17 0 7 9219 0.01317 0 301056 0 0 0 0 4608 0.05258 1W16C8B 1W16C8B
11 Conv_17_split_KNOPT_dummy_bn_1 Add_27 NPU [8] [15] [8] Conv_17_split_KNOPT_dummy_bn_1 0 8 952 0.00136 0 0 0 0 200704 0 1024 0.027694 1W16C8B 1W16C8B_INTLV
12 Conv_18 Conv_18 NPU [8] [16] [8] npu_fusion_node_Conv_18_Clip_21 0 9 18018 0.02574 0 0 0 0 0 0 9216 0.02574 1W16C8B 1W16C8B
13 Clip_21 Clip_21 NPU [16] [8] [8]
14 Conv_22 Conv_22 NPU [8] [16] [8] npu_fusion_node_Conv_22_Clip_25 0 10 9288 0.013269 0 0 0 0 0 0 4608 0.013269 1W16C8B 1W16C8B
15 Clip_25 Clip_25 NPU [16] [8] [8]
16 Conv_26_KNOPT_Add_27_KNOPT_dummy_bn_0 Conv_26 NPU [8] [15] [8] Conv_26_KNOPT_Add_27_KNOPT_dummy_bn_0 0 11 13755 0.01965 0 200704 0 0 0 0 6912 0.046024 1W16C8B 1W16C8B_INTLV
17 Add_27 Add_27 NPU [15, 15] [8] [8] Add_27 0 12 1792 0.00256 0 0 0 0 0 0 512 0.00256 1W16C8B_INTLV 1W16C8B
18 Add_27_KNOPT_dummy_bn_1 Conv_28 NPU [8] [8] [8] Add_27_KNOPT_dummy_bn_1 0 13 952 0.00136 0 0 0 0 0 0 1024 0.00136 1W16C8B 1W16C8B
19 Conv_28 Conv_28 NPU [8] [16] [8] npu_fusion_node_Conv_28_Clip_31 0 14 18018 0.02574 0 0 0 0 0 0 9216 0.02574 1W16C8B 1W16C8B
20 Clip_31 Clip_31 NPU [16] [8] [8]
21 Conv_32 Conv_32 NPU [8] [16] [8] npu_fusion_node_Conv_32_Clip_35 0 15 9288 0.013269 0 0 0 0 0 0 4608 0.013269 1W16C8B 1W16C8B
22 Clip_35 Clip_35 NPU [16] [8] [8]
23 Conv_36 Conv_36 NPU [8] [8] [8] Conv_36 0 16 6240 0.008914 0 0 0 0 0 0 9216 0.008914 1W16C8B 1W16C8B
24 Conv_36_split_KNOPT_dummy_bn_1 Add_46 NPU [8] [15] [8] Conv_36_split_KNOPT_dummy_bn_1 0 17 312 0.000446 0 0 0 0 0 0 1024 0.000446 1W16C8B 1W16C8B_INTLV
25 Conv_37 Conv_37 NPU [8] [16] [8] npu_fusion_node_Conv_37_Clip_40 0 18 9696 0.013851 0 0 0 0 0 0 12288 0.013851 1W16C8B 1W16C8B
26 Clip_40 Clip_40 NPU [16] [8] [8]
27 Conv_41 Conv_41 NPU [8] [16] [8] npu_fusion_node_Conv_41_Clip_44 0 19 3456 0.004937 0 0 0 0 0 0 6144 0.004937 1W16C8B 1W16C8B
28 Clip_44 Clip_44 NPU [16] [8] [8]
29 Conv_45_KNOPT_Add_46_KNOPT_dummy_bn_0 Conv_45 NPU [8] [15] [8] Conv_45_KNOPT_Add_46_KNOPT_dummy_bn_0 0 20 8800 0.012571 0 0 0 0 0 0 12288 0.012571 1W16C8B 1W16C8B_INTLV
30 Add_46 Add_46 NPU [15, 15] [8] [8] Add_46 0 21 528 0.000754 0 0 0 0 0 0 512 0.000754 1W16C8B_INTLV 1W16C8B
31 Add_46_split_KNOPT_dummy_bn_1 Add_56 NPU [8] [15] [8] Add_46_split_KNOPT_dummy_bn_1 0 22 312 0.000446 0 0 0 0 0 0 1024 0.000446 1W16C8B 1W16C8B_INTLV
32 Add_46_split_KNOPT_dummy_bn_0 Conv_47 NPU [8] [8] [8] Add_46_split_KNOPT_dummy_bn_0 0 23 312 0.000446 0 0 0 0 0 0 1024 0.000446 1W16C8B 1W16C8B
33 Conv_47 Conv_47 NPU [8] [16] [8] npu_fusion_node_Conv_47_Clip_50 0 24 9696 0.013851 0 0 0 0 0 0 12288 0.013851 1W16C8B 1W16C8B
34 Clip_50 Clip_50 NPU [16] [8] [8]
35 Conv_51 Conv_51 NPU [8] [16] [8] npu_fusion_node_Conv_51_Clip_54 0 25 3456 0.004937 0 0 0 0 0 0 6144 0.004937 1W16C8B 1W16C8B
36 Clip_54 Clip_54 NPU [16] [8] [8]
37 Conv_55_KNOPT_Add_56_KNOPT_dummy_bn_0 Conv_55 NPU [8] [15] [8] Conv_55_KNOPT_Add_56_KNOPT_dummy_bn_0 0 26 8800 0.012571 0 0 0 0 0 0 12288 0.012571 1W16C8B 1W16C8B_INTLV
38 Add_56 Add_56 NPU [15, 15] [8] [8] Add_56 0 27 528 0.000754 0 0 0 0 0 0 512 0.000754 1W16C8B_INTLV 1W16C8B
39 Add_56_KNOPT_dummy_bn_1 Conv_57 NPU [8] [8] [8] Add_56_KNOPT_dummy_bn_1 0 28 312 0.000446 0 0 0 0 0 0 1024 0.000446 1W16C8B 1W16C8B
40 Conv_57 Conv_57 NPU [8] [16] [8] npu_fusion_node_Conv_57_Clip_60 0 29 9696 0.013851 0 0 0 0 0 0 12288 0.013851 1W16C8B 1W16C8B
41 Clip_60 Clip_60 NPU [16] [8] [8]
42 Conv_61 Conv_61 NPU [8] [16] [8] npu_fusion_node_Conv_61_Clip_64 0 30 3456 0.004937 0 0 0 0 0 0 6144 0.004937 1W16C8B 1W16C8B
43 Clip_64 Clip_64 NPU [16] [8] [8]
44 Conv_65 Conv_65 NPU [8] [8] [8] Conv_65 0 31 4352 0.006217 0 0 0 0 0 0 24576 0.006217 1W16C8B 1W16C8B
45 Conv_65_split_KNOPT_dummy_bn_1 Add_75 NPU [8] [15] [8] Conv_65_split_KNOPT_dummy_bn_1 0 32 192 0.000274 0 0 0 0 0 0 2048 0.000274 1W16C8B 1W16C8B_INTLV
46 Conv_66 Conv_66 NPU [8] [16] [8] npu_fusion_node_Conv_66_Clip_69 0 33 10272 0.014674 0 0 0 0 0 0 49152 0.014674 1W16C8B 1W16C8B
47 Clip_69 Clip_69 NPU [16] [8] [8]
48 Conv_70 Conv_70 NPU [8] [16] [8] npu_fusion_node_Conv_70_Clip_73 0 34 2064 0.002949 0 0 0 0 0 0 12288 0.002949 1W16C8B 1W16C8B
49 Clip_73 Clip_73 NPU [16] [8] [8]
50 Conv_74_KNOPT_Add_75_KNOPT_dummy_bn_0 Conv_74 NPU [8] [15] [8] Conv_74_KNOPT_Add_75_KNOPT_dummy_bn_0 0 35 8928 0.012754 0 0 0 0 0 0 49152 0.012754 1W16C8B 1W16C8B_INTLV
51 Add_75 Add_75 NPU [15, 15] [8] [8] Add_75 0 36 288 0.000411 0 0 0 0 0 0 1024 0.000411 1W16C8B_INTLV 1W16C8B
52 Add_75_split_KNOPT_dummy_bn_1 Add_85 NPU [8] [15] [8] Add_75_split_KNOPT_dummy_bn_1 0 37 192 0.000274 0 0 0 0 0 0 2048 0.000274 1W16C8B 1W16C8B_INTLV
53 Add_75_split_KNOPT_dummy_bn_0 Conv_76 NPU [8] [8] [8] Add_75_split_KNOPT_dummy_bn_0 0 38 192 0.000274 0 0 0 0 0 0 2048 0.000274 1W16C8B 1W16C8B
54 Conv_76 Conv_76 NPU [8] [16] [8] npu_fusion_node_Conv_76_Clip_79 0 39 10272 0.014674 0 0 0 0 0 0 49152 0.014674 1W16C8B 1W16C8B
55 Clip_79 Clip_79 NPU [16] [8] [8]
56 Conv_80 Conv_80 NPU [8] [16] [8] npu_fusion_node_Conv_80_Clip_83 0 40 2064 0.002949 0 0 0 0 0 0 12288 0.002949 1W16C8B 1W16C8B
57 Clip_83 Clip_83 NPU [16] [8] [8]
58 Conv_84_KNOPT_Add_85_KNOPT_dummy_bn_0 Conv_84 NPU [8] [15] [8] Conv_84_KNOPT_Add_85_KNOPT_dummy_bn_0 0 41 8928 0.012754 0 0 0 0 0 0 49152 0.012754 1W16C8B 1W16C8B_INTLV
59 Add_85 Add_85 NPU [15, 15] [8] [8] Add_85 0 42 288 0.000411 0 0 0 0 0 0 1024 0.000411 1W16C8B_INTLV 1W16C8B
60 Add_85_split_KNOPT_dummy_bn_1 Add_95 NPU [8] [15] [8] Add_85_split_KNOPT_dummy_bn_1 0 43 192 0.000274 0 0 0 0 0 0 2048 0.000274 1W16C8B 1W16C8B_INTLV
61 Add_85_split_KNOPT_dummy_bn_0 Conv_86 NPU [8] [8] [8] Add_85_split_KNOPT_dummy_bn_0 0 44 192 0.000274 0 0 0 0 0 0 2048 0.000274 1W16C8B 1W16C8B
62 Conv_86 Conv_86 NPU [8] [16] [8] npu_fusion_node_Conv_86_Clip_89 0 45 10272 0.014674 0 0 0 0 0 0 49152 0.014674 1W16C8B 1W16C8B
63 Clip_89 Clip_89 NPU [16] [8] [8]
64 Conv_90 Conv_90 NPU [8] [16] [8] npu_fusion_node_Conv_90_Clip_93 0 46 2064 0.002949 0 0 0 0 0 0 12288 0.002949 1W16C8B 1W16C8B
65 Clip_93 Clip_93 NPU [16] [8] [8]
66 Conv_94_KNOPT_Add_95_KNOPT_dummy_bn_0 Conv_94 NPU [8] [15] [8] Conv_94_KNOPT_Add_95_KNOPT_dummy_bn_0 0 47 8928 0.012754 0 0 0 0 0 0 49152 0.012754 1W16C8B 1W16C8B_INTLV
67 Add_95 Add_95 NPU [15, 15] [8] [8] Add_95 0 48 288 0.000411 0 0 0 0 0 0 1024 0.000411 1W16C8B_INTLV 1W16C8B
68 Add_95_KNOPT_dummy_bn_1 Conv_96 NPU [8] [8] [8] Add_95_KNOPT_dummy_bn_1 0 49 192 0.000274 0 0 0 0 0 0 2048 0.000274 1W16C8B 1W16C8B
69 Conv_96 Conv_96 NPU [8] [16] [8] npu_fusion_node_Conv_96_Clip_99 0 50 10272 0.014674 0 0 0 0 0 0 49152 0.014674 1W16C8B 1W16C8B
70 Clip_99 Clip_99 NPU [16] [8] [8]
71 Conv_100 Conv_100 NPU [8] [16] [8] npu_fusion_node_Conv_100_Clip_103 0 51 2064 0.002949 0 0 0 0 0 0 12288 0.002949 1W16C8B 1W16C8B
72 Clip_103 Clip_103 NPU [16] [8] [8]
73 Conv_104 Conv_104 NPU [8] [8] [8] Conv_104 0 52 13392 0.019131 0 0 0 0 0 0 73728 0.019131 1W16C8B 1W16C8B
74 Conv_104_split_KNOPT_dummy_bn_1 Add_114 NPU [8] [15] [8] Conv_104_split_KNOPT_dummy_bn_1 0 53 288 0.000411 0 0 0 0 0 0 3072 0.000411 1W16C8B 1W16C8B_INTLV
75 Conv_105 Conv_105 NPU [8] [16] [8] npu_fusion_node_Conv_105_Clip_108 0 54 21744 0.031063 0 0 0 0 0 0 110592 0.031063 1W16C8B 1W16C8B
76 Clip_108 Clip_108 NPU [16] [8] [8]
77 Conv_109 Conv_109 NPU [8] [16] [8] npu_fusion_node_Conv_109_Clip_112 0 55 3096 0.004423 0 0 0 0 0 0 18432 0.004423 1W16C8B 1W16C8B
78 Clip_112 Clip_112 NPU [16] [8] [8]
79 Conv_113_KNOPT_Add_114_KNOPT_dummy_bn_0 Conv_113 NPU [8] [15] [8] Conv_113_KNOPT_Add_114_KNOPT_dummy_bn_0 0 56 20184 0.028834 0 0 0 0 0 0 110592 0.028834 1W16C8B 1W16C8B_INTLV
80 Add_114 Add_114 NPU [15, 15] [8] [8] Add_114 0 57 432 0.000617 0 0 0 0 0 0 1536 0.000617 1W16C8B_INTLV 1W16C8B
81 Add_114_split_KNOPT_dummy_bn_1 Add_124 NPU [8] [15] [8] Add_114_split_KNOPT_dummy_bn_1 0 58 288 0.000411 0 0 0 0 0 0 3072 0.000411 1W16C8B 1W16C8B_INTLV
82 Add_114_split_KNOPT_dummy_bn_0 Conv_115 NPU [8] [8] [8] Add_114_split_KNOPT_dummy_bn_0 0 59 288 0.000411 0 0 0 0 0 0 3072 0.000411 1W16C8B 1W16C8B
83 Conv_115 Conv_115 NPU [8] [16] [8] npu_fusion_node_Conv_115_Clip_118 0 60 21744 0.031063 0 0 0 0 0 0 110592 0.031063 1W16C8B 1W16C8B
84 Clip_118 Clip_118 NPU [16] [8] [8]
85 Conv_119 Conv_119 NPU [8] [16] [8] npu_fusion_node_Conv_119_Clip_122 0 61 3096 0.004423 0 0 0 0 0 0 18432 0.004423 1W16C8B 1W16C8B
86 Clip_122 Clip_122 NPU [16] [8] [8]
87 Conv_123_KNOPT_Add_124_KNOPT_dummy_bn_0 Conv_123 NPU [8] [15] [8] Conv_123_KNOPT_Add_124_KNOPT_dummy_bn_0 0 62 20184 0.028834 0 0 0 0 0 0 110592 0.028834 1W16C8B 1W16C8B_INTLV
88 Add_124 Add_124 NPU [15, 15] [8] [8] Add_124 0 63 432 0.000617 0 0 0 0 0 0 1536 0.000617 1W16C8B_INTLV 1W16C8B
89 Add_124_KNOPT_dummy_bn_1 Conv_125 NPU [8] [8] [8] Add_124_KNOPT_dummy_bn_1 0 64 288 0.000411 0 0 0 0 0 0 3072 0.000411 1W16C8B 1W16C8B
90 Conv_125 Conv_125 NPU [8] [16] [8] npu_fusion_node_Conv_125_Clip_128 0 65 21744 0.031063 0 0 0 0 0 0 110592 0.031063 1W16C8B 1W16C8B
91 Clip_128 Clip_128 NPU [16] [8] [8]
92 Conv_129 Conv_129 NPU [8] [16] [8] npu_fusion_node_Conv_129_Clip_132 0 66 3096 0.004423 0 0 0 0 0 0 18432 0.004423 1W16C8B 1W16C8B
93 Clip_132 Clip_132 NPU [16] [8] [8]
94 Conv_133 Conv_133 NPU [8] [8] [8] Conv_133 0 67 17740 0.025343 0 0 0 0 0 0 184320 0.025343 1W16C8B 1W16C8B
95 Conv_133_split_KNOPT_dummy_bn_1 Add_143 NPU [8] [15] [8] Conv_133_split_KNOPT_dummy_bn_1 0 68 170 0.000243 0 0 0 0 0 0 5120 0.000243 1W16C8B 1W16C8B_INTLV
96 Conv_134 Conv_134 NPU [8] [16] [8] npu_fusion_node_Conv_134_Clip_137 0 69 29400 0.042 0 0 0 0 0 0 307200 0.042 1W16C8B 1W16C8B
97 Clip_137 Clip_137 NPU [16] [8] [8]
98 Conv_138 Conv_138 NPU [8] [16] [8] npu_fusion_node_Conv_138_Clip_141 0 70 1920 0.002743 0 0 0 0 0 0 30720 0.002743 1W16C8B 1W16C8B
99 Clip_141 Clip_141 NPU [16] [8] [8]
100 Conv_142_KNOPT_Add_143_KNOPT_dummy_bn_0 Conv_142 NPU [8] [15] [8] Conv_142_KNOPT_Add_143_KNOPT_dummy_bn_0 0 71 29740 0.042486 0 0 0 0 0 0 307200 0.042486 1W16C8B 1W16C8B_INTLV
101 Add_143 Add_143 NPU [15, 15] [8] [8] Add_143 0 72 220 0.000314 0 0 0 0 0 0 2560 0.000314 1W16C8B_INTLV 1W16C8B
102 Add_143_split_KNOPT_dummy_bn_1 Add_153 NPU [8] [15] [8] Add_143_split_KNOPT_dummy_bn_1 0 73 170 0.000243 0 0 0 0 0 0 5120 0.000243 1W16C8B 1W16C8B_INTLV
103 Add_143_split_KNOPT_dummy_bn_0 Conv_144 NPU [8] [8] [8] Add_143_split_KNOPT_dummy_bn_0 0 74 170 0.000243 0 0 0 0 0 0 5120 0.000243 1W16C8B 1W16C8B
104 Conv_144 Conv_144 NPU [8] [16] [8] npu_fusion_node_Conv_144_Clip_147 0 75 29400 0.042 0 0 0 0 0 0 307200 0.042 1W16C8B 1W16C8B
105 Clip_147 Clip_147 NPU [16] [8] [8]
106 Conv_148 Conv_148 NPU [8] [16] [8] npu_fusion_node_Conv_148_Clip_151 0 76 1920 0.002743 0 0 0 0 0 0 30720 0.002743 1W16C8B 1W16C8B
107 Clip_151 Clip_151 NPU [16] [8] [8]
108 Conv_152_KNOPT_Add_153_KNOPT_dummy_bn_0 Conv_152 NPU [8] [15] [8] Conv_152_KNOPT_Add_153_KNOPT_dummy_bn_0 0 77 29740 0.042486 0 0 0 0 0 0 307200 0.042486 1W16C8B 1W16C8B_INTLV
109 Add_153 Add_153 NPU [15, 15] [8] [8] Add_153 0 78 220 0.000314 0 0 0 0 0 0 2560 0.000314 1W16C8B_INTLV 1W16C8B
110 Add_153_KNOPT_dummy_bn_1 Conv_154 NPU [8] [8] [8] Add_153_KNOPT_dummy_bn_1 0 79 170 0.000243 0 0 0 0 0 0 5120 0.000243 1W16C8B 1W16C8B
111 Conv_154 Conv_154 NPU [8] [16] [8] npu_fusion_node_Conv_154_Clip_157 0 80 29400 0.042 0 0 0 0 0 0 307200 0.042 1W16C8B 1W16C8B
112 Clip_157 Clip_157 NPU [16] [8] [8]
113 Conv_158 Conv_158 NPU [8] [16] [8] npu_fusion_node_Conv_158_Clip_161 0 81 1920 0.002743 0 0 0 0 0 0 30720 0.002743 1W16C8B 1W16C8B
114 Clip_161 Clip_161 NPU [16] [8] [8]
115 Conv_162 Conv_162 NPU [8] [8] [8] Conv_162 0 82 59480 0.084971 0 0 0 0 0 0 614400 0.084971 1W16C8B 1W16C8B
116 Conv_163 Conv_163 NPU [8] [16] [8] npu_fusion_node_Conv_163_Clip_166 0 83 79200 0.113143 0 0 0 0 0 0 819200 0.113143 1W16C8B 1W16C8B
117 Clip_166 Clip_166 NPU [16] [15] [8]
118 GlobalAveragePool_167 GlobalAveragePool_167 NPU [15] [8] [16] GlobalAveragePool_167 0 84 3440 0.004914 0 0 0 0 0 0 20480 0.004914 1W16C8B 1W16C8B
119 Reshape_173 Reshape_173 NPU [8] [8] [8] None NaN NaN NaN NaN NaN NaN NaN NaN NaN NaN NaN NaN NaN NaN
120 Gemm_174 Gemm_174 NPU [8] [8] [8] Gemm_174 0 85 11125 0.015893 0 0 0 0 0 0 1440000 0.167813 1W16C8B 1W16C8B