Skip to content

Commit 82ba867

Browse files
committed
made it run
1 parent e053e0d commit 82ba867

File tree

8 files changed: +48 -41 lines changed

8 files changed: +48 -41 lines changed

.gitignore

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -142,7 +142,7 @@ dmypy.json
142142
**/multicache_serving.py
143143
**/modelcache_serving.py
144144

145-
**/model/
145+
**/model/text2vec-base-chinese
146146

147147
/data/milvus/db
148148
/data/mysql/db

docker-compose.yaml

Lines changed: 21 additions & 21 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
1-
version: 'Beta'
1+
name: "modelcache"
22
services:
33
mysql:
4-
image: mysql:8.0.23
4+
image: mysql:9.3.0
55
container_name: mysql
66
environment:
77
MYSQL_ROOT_PASSWORD: 'root'
@@ -19,7 +19,7 @@ services:
1919
- modelcache
2020

2121
milvus:
22-
image: milvusdb/milvus:v2.5.0-beta
22+
image: milvusdb/milvus:v2.5.10
2323
container_name: milvus
2424
security_opt:
2525
- seccomp:unconfined
@@ -47,24 +47,24 @@ services:
4747
restart: on-failure
4848
command: milvus run standalone
4949

50-
modelcache:
51-
build:
52-
context: .
53-
dockerfile: Dockerfile
54-
container_name: modelcache
55-
image: modelcache:0.1.0
56-
ports:
57-
- 5000:5000
58-
volumes:
59-
- ./model:/home/user/model
60-
- ./modelcache:/home/user/modelcache
61-
- ./modelcache_mm:/home/user/modelcache_mm
62-
- ./fastapi4modelcache.py:/home/user/fastapi4modelcache.py
63-
networks:
64-
- modelcache
65-
restart: on-failure
66-
command: sh -c "uvicorn fastapi4modelcache:app --reload --reload-dir /home/user --port=5000 --host=0.0.0.0"
50+
# modelcache:
51+
# build:
52+
# context: .
53+
# dockerfile: Dockerfile
54+
# container_name: modelcache
55+
# image: modelcache:0.1.0
56+
# ports:
57+
# - 5000:5000
58+
# volumes:
59+
# - ./model:/home/user/model
60+
# - ./modelcache:/home/user/modelcache
61+
# - ./modelcache_mm:/home/user/modelcache_mm
62+
# - ./fastapi4modelcache.py:/home/user/fastapi4modelcache.py
63+
# networks:
64+
# - modelcache
65+
# restart: on-failure
66+
# command: sh -c "uvicorn fastapi4modelcache:app --reload --reload-dir /home/user --port=5000 --host=0.0.0.0"
6767

6868
networks:
6969
modelcache:
70-
external: true
70+
driver: bridge

flask4modelcache.py

Lines changed: 8 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -38,16 +38,16 @@ def response_hitquery(cache_resp):
3838
milvus_config = configparser.ConfigParser()
3939
milvus_config.read('modelcache/config/milvus_config.ini')
4040

41-
es_config = configparser.ConfigParser()
42-
es_config.read('modelcache/config/elasticsearch_config.ini')
41+
# es_config = configparser.ConfigParser()
42+
# es_config.read('modelcache/config/elasticsearch_config.ini')
4343

4444
# redis_config = configparser.ConfigParser()
4545
# redis_config.read('modelcache/config/redis_config.ini')
4646

4747
# chromadb_config = configparser.ConfigParser()
4848
# chromadb_config.read('modelcache/config/chromadb_config.ini')
4949

50-
data_manager = get_data_manager(CacheBase("elasticsearch", config=es_config),
50+
data_manager = get_data_manager(CacheBase("mysql", config=mysql_config),
5151
VectorBase("milvus", dimension=data2vec.dimension, milvus_config=milvus_config))
5252

5353

@@ -77,18 +77,19 @@ def first_flask(): # 视图函数
7777

7878
@app.route('/modelcache', methods=['GET', 'POST'])
7979
def user_backend():
80+
param_dict = []
8081
try:
8182
if request.method == 'POST':
82-
request_data = request.json
83+
param_dict = request.json
8384
elif request.method == 'GET':
84-
request_data = request.args
85-
param_dict = json.loads(request_data)
85+
param_dict = request.args
8686
except Exception as e:
8787
result = {"errorCode": 101, "errorDesc": str(e), "cacheHit": False, "delta_time": 0, "hit_query": '',
8888
"answer": ''}
8989
cache.data_manager.save_query_resp(result, model='', query='', delta_time=0)
9090
return json.dumps(result)
9191

92+
9293
# param parsing
9394
try:
9495
request_type = param_dict.get("type")
@@ -197,4 +198,4 @@ def user_backend():
197198

198199

199200
if __name__ == '__main__':
200-
app.run(host='0.0.0.0', port=5000, debug=True)
201+
app.run(host='0.0.0.0', port=5000)

model/clone_model_repository.bat

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,2 @@
1+
git lfs install
2+
git clone https://huggingface.co/shibing624/text2vec-base-chinese

modelcache/adapter/adapter_query.py

Lines changed: 6 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -7,7 +7,7 @@
77
from modelcache.processor.pre import multi_analysis
88
from FlagEmbedding import FlagReranker
99

10-
USE_RERANKER = True # 如果为 True 则启用 reranker,否则使用原有逻辑
10+
USE_RERANKER = False # 如果为 True 则启用 reranker,否则使用原有逻辑
1111

1212
def adapt_query(cache_data_convert, *args, **kwargs):
1313
chat_cache = kwargs.pop("cache_obj", cache)
@@ -74,7 +74,7 @@ def adapt_query(cache_data_convert, *args, **kwargs):
7474
extra_param=context.get("evaluation_func", None),
7575
)
7676
if rank_pre < rank_threshold:
77-
return
77+
return None
7878

7979
if USE_RERANKER:
8080
reranker = FlagReranker('BAAI/bge-reranker-v2-m3', use_fp16=False)
@@ -86,7 +86,7 @@ def adapt_query(cache_data_convert, *args, **kwargs):
8686
if ret is None:
8787
continue
8888

89-
rank = reranker.compute_score([pre_embedding_data, ret[0]], normalize=True)
89+
rank = reranker.compute_score([pre_embedding_data, ret[0]], normalize=True)[0]
9090

9191
if "deps" in context and hasattr(ret.question, "deps"):
9292
eval_query_data = {
@@ -192,4 +192,6 @@ def adapt_query(cache_data_convert, *args, **kwargs):
192192
logging.info('update_hit_count except, please check!')
193193

194194
chat_cache.report.hint_cache()
195-
return cache_data_convert(return_message, return_query)
195+
return cache_data_convert(return_message, return_query)
196+
return None
197+
return None

modelcache/config/milvus_config.ini

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,5 @@
11
[milvus]
2-
host = milvus
2+
host = localhost
33
port = 19530
44
user = ''
55
password = ''

modelcache/config/mysql_config.ini

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,5 @@
11
[mysql]
2-
host = mysql
2+
host = localhost
33
port = 3306
44
username = modelcache
55
password = modelcache

requirements.txt

Lines changed: 8 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -4,16 +4,18 @@ Flask==3.0.0
44
numpy==1.24.4
55
onnxruntime==1.16.1
66
openai==0.28.1
7-
pymilvus==2.3.1
8-
PyMySQL==1.1.0
9-
Requests==2.31.0
10-
torch==2.1.1
11-
transformers==4.38.2
7+
pymilvus==2.5.9
8+
PyMySQL==1.1.1
9+
Requests==2.32.3
10+
torch==2.7.0
11+
transformers==4.44.2
1212
faiss-cpu==1.7.4
1313
redis==5.0.1
14-
modelscope==1.14.0
14+
modelscope==1.26.0
1515
fastapi==0.115.5
1616
uvicorn==0.32.0
1717
chromadb==0.5.23
1818
elasticsearch==7.10.0
1919
snowflake-id==1.0.2
20+
flagembedding==1.3.4
21+
cryptography==45.0.2

0 commit comments

Comments
 (0)