We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 841e319 · commit 07ec38f · Copy full SHA for 07ec38f
lightllm/models/llama/model.py
@@ -23,7 +23,6 @@
23
logger = init_logger(__name__)
24
25
26
-@ModelRegistry("llama")
27
class LlamaFlashInferStateExtraInfo:
28
def __init__(self, model):
29
tp_world_size = get_dp_world_size()
@@ -45,6 +44,7 @@ def __init__(self, model):
45
44
self.kv_data_type = model.data_type
46
47
+@ModelRegistry("llama")
48
class LlamaTpPartModel(TpPartBaseModel):
49
# weight class
50
pre_and_post_weight_class = LlamaPreAndPostLayerWeight
0 commit comments