pi-mmbert-v3.5 / trt_engine_layer_summary_h200_fp16.txt
Gerald001's picture
Upload TRT model for Nvidia H200 (#3)
6c5a42c
---- Resolved TRT Profile ----
MIN_BATCH=1
OPT_BATCH=3
MAX_BATCH=12
MIN_SEQ_LEN=1
OPT_SEQ_LEN=512
MAX_SEQ_LEN=512
WORKSPACE_SIZE=24696061952
BUILDER_OPTIMIZATION_LEVEL=3
PRECISION=fp16
==== TensorRT Engine ====
Total Layers: 212
==== Precision Statistics ====
Half: 696
Int64: 10
Float: 5
==== Layer Type Statistics ====
kgen: 116
gemm: 89
reshape: 2
cast: 2
shape_call: 1
fusion: 1
Reformat: 1
==== Layer List ====
# Type Precision Name
----------------------------------------------------------------------------------------------------
0 shape_call - __mye105005_0_myl0_0
1 kgen Half __myl_SlicCastReplSubCastIotaCastReshCastReshReshSubAbsEqlLtOrReshNotSeleSele_myl0_1
2 kgen Half __myl_MoveMul_myl0_2
3 kgen Half __myl_CastGathCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_3
4 gemm Half /model/layers_0/attn/Wqkv/MatMul_myl0_4
5 reshape Int64 __mye379021_myl0_5
6 cast Int64 cast_hvar^379017i64_myl0_6
7 reshape Int64 __mye379047_myl0_7
8 cast Int64 cast_hvar^379043i64_myl0_8
9 kgen Half __myl_ConcSinCosReshReshTranSlicSlicReshMulSlicNegSlicConcMulAddTranSlicReshMulSlicNegSlicConcMulEtc_myl0_9
10 kgen Half _gemm_mha_v2_myl0_10
11 gemm Half /model/layers_0/attn/Wo/MatMul_myl0_11
12 kgen Half __myl_ReshReshTranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_12
13 gemm Half /model/layers_0/mlp/Wi/MatMul_myl0_13
14 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_14
15 gemm Half /model/layers_0/mlp/Wo/MatMul_myl0_15
16 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_16
17 gemm Half /model/layers_1/attn/Wqkv/MatMul_myl0_17
18 kgen Half __myl_ConcSinCosReshReshReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshEtc_myl0_18
19 kgen Half _gemm_mha_v2_myl0_19
20 gemm Half /model/layers_1/attn/Wo/MatMul_myl0_20
21 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_21
22 gemm Half /model/layers_1/mlp/Wi/MatMul_myl0_22
23 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_23
24 gemm Half /model/layers_1/mlp/Wo/MatMul_myl0_24
25 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_25
26 gemm Half /model/layers_2/attn/Wqkv/MatMul_myl0_26
27 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_27
28 kgen Half _gemm_mha_v2_myl0_28
29 gemm Half /model/layers_2/attn/Wo/MatMul_myl0_29
30 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_30
31 gemm Half /model/layers_2/mlp/Wi/MatMul_myl0_31
32 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_32
33 gemm Half /model/layers_2/mlp/Wo/MatMul_myl0_33
34 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_34
35 gemm Half /model/layers_3/attn/Wqkv/MatMul_myl0_35
36 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_36
37 kgen Half _gemm_mha_v2_myl0_37
38 gemm Half /model/layers_3/attn/Wo/MatMul_myl0_38
39 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_39
40 gemm Half /model/layers_3/mlp/Wi/MatMul_myl0_40
41 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_41
42 gemm Half /model/layers_3/mlp/Wo/MatMul_myl0_42
43 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_43
44 gemm Half /model/layers_4/attn/Wqkv/MatMul_myl0_44
45 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_45
46 kgen Half _gemm_mha_v2_myl0_46
47 gemm Half /model/layers_4/attn/Wo/MatMul_myl0_47
48 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_48
49 gemm Half /model/layers_4/mlp/Wi/MatMul_myl0_49
50 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_50
51 gemm Half /model/layers_4/mlp/Wo/MatMul_myl0_51
52 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_52
53 gemm Half /model/layers_5/attn/Wqkv/MatMul_myl0_53
54 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_54
55 kgen Half _gemm_mha_v2_myl0_55
56 gemm Half /model/layers_5/attn/Wo/MatMul_myl0_56
57 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_57
58 gemm Half /model/layers_5/mlp/Wi/MatMul_myl0_58
59 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_59
60 gemm Half /model/layers_5/mlp/Wo/MatMul_myl0_60
61 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_61
62 gemm Half /model/layers_6/attn/Wqkv/MatMul_myl0_62
63 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_63
64 kgen Half _gemm_mha_v2_myl0_64
65 gemm Half /model/layers_6/attn/Wo/MatMul_myl0_65
66 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_66
67 gemm Half /model/layers_6/mlp/Wi/MatMul_myl0_67
68 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_68
69 gemm Half /model/layers_6/mlp/Wo/MatMul_myl0_69
70 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_70
71 gemm Half /model/layers_7/attn/Wqkv/MatMul_myl0_71
72 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_72
73 kgen Half _gemm_mha_v2_myl0_73
74 gemm Half /model/layers_7/attn/Wo/MatMul_myl0_74
75 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_75
76 gemm Half /model/layers_7/mlp/Wi/MatMul_myl0_76
77 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_77
78 gemm Half /model/layers_7/mlp/Wo/MatMul_myl0_78
79 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_79
80 gemm Half /model/layers_8/attn/Wqkv/MatMul_myl0_80
81 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_81
82 kgen Half _gemm_mha_v2_myl0_82
83 gemm Half /model/layers_8/attn/Wo/MatMul_myl0_83
84 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_84
85 gemm Half /model/layers_8/mlp/Wi/MatMul_myl0_85
86 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_86
87 gemm Half /model/layers_8/mlp/Wo/MatMul_myl0_87
88 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_88
89 gemm Half /model/layers_9/attn/Wqkv/MatMul_myl0_89
90 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_90
91 kgen Half _gemm_mha_v2_myl0_91
92 gemm Half /model/layers_9/attn/Wo/MatMul_myl0_92
93 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_93
94 gemm Half /model/layers_9/mlp/Wi/MatMul_myl0_94
95 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_95
96 gemm Half /model/layers_9/mlp/Wo/MatMul_myl0_96
97 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_97
98 gemm Half /model/layers_10/attn/Wqkv/MatMul_myl0_98
99 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_99
100 kgen Half _gemm_mha_v2_myl0_100
101 gemm Half /model/layers_10/attn/Wo/MatMul_myl0_101
102 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_102
103 gemm Half /model/layers_10/mlp/Wi/MatMul_myl0_103
104 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_104
105 gemm Half /model/layers_10/mlp/Wo/MatMul_myl0_105
106 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_106
107 gemm Half /model/layers_11/attn/Wqkv/MatMul_myl0_107
108 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_108
109 kgen Half _gemm_mha_v2_myl0_109
110 gemm Half /model/layers_11/attn/Wo/MatMul_myl0_110
111 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_111
112 gemm Half /model/layers_11/mlp/Wi/MatMul_myl0_112
113 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_113
114 gemm Half /model/layers_11/mlp/Wo/MatMul_myl0_114
115 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_115
116 gemm Half /model/layers_12/attn/Wqkv/MatMul_myl0_116
117 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_117
118 kgen Half _gemm_mha_v2_myl0_118
119 gemm Half /model/layers_12/attn/Wo/MatMul_myl0_119
120 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_120
121 gemm Half /model/layers_12/mlp/Wi/MatMul_myl0_121
122 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_122
123 gemm Half /model/layers_12/mlp/Wo/MatMul_myl0_123
124 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_124
125 gemm Half /model/layers_13/attn/Wqkv/MatMul_myl0_125
126 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_126
127 kgen Half _gemm_mha_v2_myl0_127
128 gemm Half /model/layers_13/attn/Wo/MatMul_myl0_128
129 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_129
130 gemm Half /model/layers_13/mlp/Wi/MatMul_myl0_130
131 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_131
132 gemm Half /model/layers_13/mlp/Wo/MatMul_myl0_132
133 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_133
134 gemm Half /model/layers_14/attn/Wqkv/MatMul_myl0_134
135 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_135
136 kgen Half _gemm_mha_v2_myl0_136
137 gemm Half /model/layers_14/attn/Wo/MatMul_myl0_137
138 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_138
139 gemm Half /model/layers_14/mlp/Wi/MatMul_myl0_139
140 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_140
141 gemm Half /model/layers_14/mlp/Wo/MatMul_myl0_141
142 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_142
143 gemm Half /model/layers_15/attn/Wqkv/MatMul_myl0_143
144 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_144
145 kgen Half _gemm_mha_v2_myl0_145
146 gemm Half /model/layers_15/attn/Wo/MatMul_myl0_146
147 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_147
148 gemm Half /model/layers_15/mlp/Wi/MatMul_myl0_148
149 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_149
150 gemm Half /model/layers_15/mlp/Wo/MatMul_myl0_150
151 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_151
152 gemm Half /model/layers_16/attn/Wqkv/MatMul_myl0_152
153 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_153
154 kgen Half _gemm_mha_v2_myl0_154
155 gemm Half /model/layers_16/attn/Wo/MatMul_myl0_155
156 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_156
157 gemm Half /model/layers_16/mlp/Wi/MatMul_myl0_157
158 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_158
159 gemm Half /model/layers_16/mlp/Wo/MatMul_myl0_159
160 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_160
161 gemm Half /model/layers_17/attn/Wqkv/MatMul_myl0_161
162 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_162
163 kgen Half _gemm_mha_v2_myl0_163
164 gemm Half /model/layers_17/attn/Wo/MatMul_myl0_164
165 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_165
166 gemm Half /model/layers_17/mlp/Wi/MatMul_myl0_166
167 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_167
168 gemm Half /model/layers_17/mlp/Wo/MatMul_myl0_168
169 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_169
170 gemm Half /model/layers_18/attn/Wqkv/MatMul_myl0_170
171 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_171
172 kgen Half _gemm_mha_v2_myl0_172
173 gemm Half /model/layers_18/attn/Wo/MatMul_myl0_173
174 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_174
175 gemm Half /model/layers_18/mlp/Wi/MatMul_myl0_175
176 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_176
177 gemm Half /model/layers_18/mlp/Wo/MatMul_myl0_177
178 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_178
179 gemm Half /model/layers_19/attn/Wqkv/MatMul_myl0_179
180 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_180
181 kgen Half _gemm_mha_v2_myl0_181
182 gemm Half /model/layers_19/attn/Wo/MatMul_myl0_182
183 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_183
184 gemm Half /model/layers_19/mlp/Wi/MatMul_myl0_184
185 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_185
186 gemm Half /model/layers_19/mlp/Wo/MatMul_myl0_186
187 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_187
188 gemm Half /model/layers_20/attn/Wqkv/MatMul_myl0_188
189 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_189
190 kgen Half _gemm_mha_v2_myl0_190
191 gemm Half /model/layers_20/attn/Wo/MatMul_myl0_191
192 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_192
193 gemm Half /model/layers_20/mlp/Wi/MatMul_myl0_193
194 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_194
195 gemm Half /model/layers_20/mlp/Wo/MatMul_myl0_195
196 kgen Half __myl_TranReshAddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_196
197 gemm Half /model/layers_21/attn/Wqkv/MatMul_myl0_197
198 kgen Half __myl_ReshTranReshMoveReshTranSlicSlicReshSlicNegSlicConcMulMulAddTranSlicReshSlicNegSlicConcMulEtc_myl0_198
199 kgen Half _gemm_mha_v2_myl0_199
200 gemm Half /model/layers_21/attn/Wo/MatMul_myl0_200
201 kgen Half __myl_AddCastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_201
202 gemm Half /model/layers_21/mlp/Wi/MatMul_myl0_202
203 kgen Half __myl_TranReshSlicSlicDivCastErfCastAddMulMulMul_myl0_203
204 gemm Half /model/layers_21/mlp/Wo/MatMul_myl0_204
205 kgen Float __myl_TranReshAddCastMeanSubMulMean_myl0_205
206 kgen Half __myl_CastAddSqrtDivMulCastMulAddMoveReshTranReshMoveReshMulSum_myl0_206
207 kgen Half __myl_SumCastReshDivMul_myl0_207
208 fusion Half __myl_Fc_myl0_208
209 kgen Half __myl_CastMeanSubMulMeanAddSqrtDivMulCastMulAdd_myl0_209
210 gemm Half /classifier/Gemm_myl0_210
211 Reformat Float Reformatting CopyNode for Output Tensor 0 to {ForeignNode[/model/Unsqueeze_1 + /model/Unsqueeze_2...(Unnamed Layer* 6506) [ElementWise]]}