1 file changed: +14 -3 lines changed.
Columns: original file line number | diff line number | diff line change
@@ -178,9 +178,11 @@ def forward(self, images):
178178
179179
180180def export_token_embedding (llava , prompt ):
181- # quantized_token_embed = get_quant_embedding_transform("8,32")(
182- # llava.model_.language_model.model
183- # )
181+ import copy
182+ model_copy = copy .deepcopy (llava .model_ .language_model .model )
183+ quantized_token_embed_copy = get_quant_embedding_transform ("8,32" )(
184+ model_copy ,
185+ )
184186 def quant_embedding (model ):
185187 return EmbeddingQuantHandler (
186188 model ,
@@ -200,6 +202,15 @@ def quant_embedding(model):
200202 dynamic_shapes = dynamic_shapes ,
201203 strict = True ,
202204 )
205+ token_embedding_ep_copy = torch .export .export (
206+ quantized_token_embed_copy .embed_tokens ,
207+ (prompt ,),
208+ dynamic_shapes = dynamic_shapes ,
209+ strict = True ,
210+ )
211+
212+ print ("token_embedding_ep_copy" , token_embedding_ep_copy )
213+ print ("token_embedding_ep" , token_embedding_ep )
203214 return token_embedding_ep
204215
205216
You can’t perform that action at this time.
0 commit comments