Skip to content

Commit 42f6c79

Browse files
committed
up
1 parent 37df147 commit 42f6c79

File tree

1 file changed

+14
-3
lines changed

1 file changed

+14
-3
lines changed

examples/models/llava/export_llava.py

Lines changed: 14 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -178,9 +178,11 @@ def forward(self, images):
178178

179179

180180
def export_token_embedding(llava, prompt):
181-
# quantized_token_embed = get_quant_embedding_transform("8,32")(
182-
# llava.model_.language_model.model
183-
# )
181+
import copy
182+
model_copy = copy.deepcopy(llava.model_.language_model.model)
183+
quantized_token_embed_copy = get_quant_embedding_transform("8,32")(
184+
model_copy,
185+
)
184186
def quant_embedding(model):
185187
return EmbeddingQuantHandler(
186188
model,
@@ -200,6 +202,15 @@ def quant_embedding(model):
200202
dynamic_shapes=dynamic_shapes,
201203
strict=True,
202204
)
205+
token_embedding_ep_copy = torch.export.export(
206+
quantized_token_embed_copy.embed_tokens,
207+
(prompt,),
208+
dynamic_shapes=dynamic_shapes,
209+
strict=True,
210+
)
211+
212+
print("token_embedding_ep_copy", token_embedding_ep_copy)
213+
print("token_embedding_ep", token_embedding_ep)
203214
return token_embedding_ep
204215

205216

0 commit comments

Comments
 (0)