Skip to content

Commit b2bd4a8

Browse files
committed
update config_example
1 parent 0c0049d commit b2bd4a8

File tree

2 files changed

+53
-4
lines changed

2 files changed

+53
-4
lines changed

gpt_server/model_worker/utils.py

Lines changed: 39 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -39,9 +39,45 @@ async def load_base64_or_url(base64_or_url):
3939
return bytes_io
4040

4141

42+
def get_embedding_mode(model_path: str):
    """Pick the serving mode for the model found at ``model_path``.

    The model configuration is loaded with ``AutoConfig.from_pretrained`` to
    read the ``model_type`` of its ``text_config`` and ``vision_config``
    sub-configs (each is ``None`` when absent). The engine type returned by
    ``get_engine_type_from_config`` is then turned into a string and matched
    against known engine names.

    Args:
        model_path: Model name or path, passed both to ``AutoConfig`` and to
            ``EngineArgs``.

    Returns:
        ``"embedding"``, ``"rerank"`` or ``"classify"`` for the matching
        engine names. For ``ImageEmbedEngine`` the sub-config ``model_type``
        is returned (vision preferred over text), or ``"image"`` when neither
        is set. ``"embedding"`` is also the fallback when nothing matches.
    """
    # Imported lazily inside the function, as in the original.
    from infinity_emb import EngineArgs
    from transformers import AutoConfig
    from infinity_emb.inference.select_model import get_engine_type_from_config

    hf_config = AutoConfig.from_pretrained(model_path, trust_remote_code=True)

    def _sub_model_type(section):
        # A missing sub-config is replaced by an empty dict, which has no
        # ``model_type`` attribute, so the lookup yields None.
        return getattr(getattr(hf_config, section, {}), "model_type", None)

    text_kind = _sub_model_type("text_config")
    vision_kind = _sub_model_type("vision_config")
    print(vision_kind, text_kind)

    engine_name = str(
        get_engine_type_from_config(
            EngineArgs(
                model_name_or_path=model_path,
                engine="torch",
                embedding_dtype="float32",
                dtype="float32",
                bettertransformer=True,
            )
        )
    )

    # Checked in this order; the first marker found in the engine name wins.
    mode_by_marker = (
        ("EmbedderEngine", "embedding"),
        ("RerankEngine", "rerank"),
        ("ImageEmbedEngine", vision_kind or text_kind or "image"),
        ("PredictEngine", "classify"),
    )
    for marker, resolved_mode in mode_by_marker:
        if marker in engine_name:
            return resolved_mode
    return "embedding"
77+
78+
4279
if __name__ == "__main__":
4380

4481
# Example usage
45-
data_url = "data:image/png;base64,iVBORw0KGgoAAAANSUhEUg..."
46-
pure_base64 = extract_base64(data_url)
47-
print(pure_base64) # 输出: iVBORw0KGgoAAAANSUhEUg...
82+
r = get_embedding_mode("BAAI/BGE-VL-MLLM-S1")
83+
print(r)

gpt_server/script/config_example.yaml

Lines changed: 14 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -106,13 +106,26 @@ models:
106106
- gpus:
107107
- 2
108108

109+
- bge-vl:
110+
# vl-embedding model
111+
alias: null
112+
enable: true
113+
model_config:
114+
model_name_or_path: /home/dev/model/BAAI/BGE-VL-base/
115+
model_type: embedding # only "embedding" is supported here
116+
work_mode: hf
117+
device: gpu
118+
workers:
119+
- gpus:
120+
- 2
121+
109122
- text-moderation:
110123
# text moderation model
111124
alias: omni-moderation-latest
112125
enable: true
113126
model_config:
114127
model_name_or_path: /home/dev/model/KoalaAI/Text-Moderation
115-
model_type: embedding_infinity # embedding_infinity/embedding
128+
model_type: embedding_infinity # embedding_infinity
116129
work_mode: hf
117130
device: gpu
118131
workers:

0 commit comments

Comments
 (0)