codefuse-ai
diff --git a/‎.gitignore
Lines changed: 7 additions & 1 deletion b/‎.gitignore
Lines changed: 7 additions & 1 deletion
diff --git a/‎flask4modelcache.py
Lines changed: 0 additions & 1 deletion b/‎flask4modelcache.py
Lines changed: 0 additions & 1 deletion
diff --git a/‎model/clip_zh/__init__.py
Lines changed: 12 additions & 0 deletions b/‎model/clip_zh/__init__.py
Lines changed: 12 additions & 0 deletions
diff --git a/‎modelcache/adapter/adapter_query.py
Lines changed: 5 additions & 2 deletions b/‎modelcache/adapter/adapter_query.py
Lines changed: 5 additions & 2 deletions
diff --git a/‎modelcache/core.py
Lines changed: 4 additions & 1 deletion b/‎modelcache/core.py
Lines changed: 4 additions & 1 deletion
diff --git a/‎modelcache/embedding/string.py renamed to ‎modelcache/embedding/string_text.py b/‎modelcache/embedding/string.py renamed to ‎modelcache/embedding/string_text.py
diff --git a/‎modelcache/embedding/timm.py renamed to ‎modelcache/embedding/timm_embedding.py b/‎modelcache/embedding/timm.py renamed to ‎modelcache/embedding/timm_embedding.py
diff --git a/‎modelcache/manager/data_manager.py
Lines changed: 1 addition & 0 deletions b/‎modelcache/manager/data_manager.py
Lines changed: 1 addition & 0 deletions
diff --git a/‎modelcache/manager/scalar_data/base.py
Lines changed: 0 additions & 4 deletions b/‎modelcache/manager/scalar_data/base.py
Lines changed: 0 additions & 4 deletions
diff --git a/‎modelcache/manager/vector_data/milvus.py
Lines changed: 2 additions & 0 deletions b/‎modelcache/manager/vector_data/milvus.py
Lines changed: 2 additions & 0 deletions
@@ -135,5 +135,11 @@ dmypy.json
 /embedding_npy
 /flask_server
 *.bin
+**/maya_embedding_service
+
+*.ini
+
+**/multicache_serving.py
 **/modelcache_serving.py
-*.ini
+
+**/model/
@@ -177,7 +177,6 @@ def user_backend():
         return json.dumps(result)
 
     if request_type == 'register':
-        # iat_type = param_dict.get("iat_type")
         response = adapter.ChatCompletion.create_register(
             model=model
         )
 
@@ -0,0 +1,12 @@
+# -*- coding: utf-8 -*-
+"""
+   Alipay.com Inc.
+   Copyright (c) 2004-2023 All Rights Reserved.
+   ------------------------------------------------------
+   File Name : __init__.py
+   Author : fuhui.phe
+   Create Time : 2024/5/7 14:05
+   Description : package marker for model/clip_zh; this file contains only this header and no code
+   Change Activity: 
+        version0 : 2024/5/7 14:05 by fuhui.phe  init
+"""
@@ -30,17 +30,20 @@ def adapt_query(cache_data_convert, *args, **kwargs):
             report_func=chat_cache.report.embedding,
         )(pre_embedding_data)
 
+        # print('embedding_data: {}'.format(embedding_data))
+
     if cache_enable:
         cache_data_list = time_cal(
             chat_cache.data_manager.search,
-            func_name="milvus_search",
+            func_name="vector_search",
             report_func=chat_cache.report.search,
         )(
             embedding_data,
             extra_param=context.get("search_func", None),
             top_k=kwargs.pop("top_k", -1),
             model=model
         )
+        print('cache_data_list: {}'.format(cache_data_list))
         cache_answers = []
         cache_questions = []
         cache_ids = []
@@ -78,8 +81,8 @@ def adapt_query(cache_data_convert, *args, **kwargs):
             return
 
         for cache_data in cache_data_list:
+            print('cache_data: {}'.format(cache_data))
             primary_id = cache_data[1]
-            start_time = time.time()
             ret = chat_cache.data_manager.get_scalar_data(
                 cache_data, extra_param=context.get("get_scalar_data", None)
             )
 
@@ -4,7 +4,7 @@
 from modelcache.processor.post import first
 from modelcache.similarity_evaluation import ExactMatchEvaluation
 from modelcache.similarity_evaluation import SimilarityEvaluation
-from modelcache.embedding.string import to_embeddings as string_embedding
+from modelcache.embedding.string_text import to_embeddings as string_embedding
 from modelcache.report import Report
 from modelcache.config import Config
 from modelcache.utils.cache_func import cache_all
@@ -19,7 +19,10 @@ def __init__(self):
         self.cache_enable_func = None
         self.query_pre_embedding_func = None
         self.insert_pre_embedding_func = None
+        self.mm_query_pre_embedding_func = None
+        self.mm_insert_pre_embedding_func = None
         self.embedding_func = None
+        self.embedding_concurrent_func = None
         self.data_manager: Optional[DataManager] = None
         self.similarity_evaluation: Optional[SimilarityEvaluation] = None
         self.post_process_messages_func = None
 
@@ -212,6 +212,7 @@ def import_data(
             cache_datas.append([ans, question, embedding_data, model])
 
         ids = self.s.batch_insert(cache_datas)
+        print('ids: {}'.format(ids))
         logging.info('ids: {}'.format(ids))
         self.v.mul_add(
             [
 
@@ -94,10 +94,6 @@ class CacheStorage(metaclass=ABCMeta):
     def create(self):
         pass
 
-    @abstractmethod
-    def batch_insert(self, all_data: List[CacheData]):
-        pass
-
     @abstractmethod
     def insert_query_resp(self, query_resp, **kwargs):
         pass
 
@@ -136,6 +136,7 @@ def _get_collection(self, collection_name):
 
     def mul_add(self, datas: List[VectorData], model=None):
         collection_name_model = self.collection_name + '_' + model
+        print('collection_name_model: {}'.format(collection_name_model))
         self._create_collection(collection_name_model)
 
         data_array, id_array = map(list, zip(*((data.data, data.id) for data in datas)))
@@ -147,6 +148,7 @@ def search(self, data: np.ndarray, top_k: int = -1, model=None):
         if top_k == -1:
             top_k = self.top_k
         collection_name_model = self.collection_name + '_' + model
+        print('collection_name_model: {}'.format(collection_name_model))
         self._create_collection(collection_name_model)
         search_result = self.col.search(
             data=data.reshape(1, -1).tolist(),
Original file line number	Diff line number	Diff line change
`@@ -177,7 +177,6 @@ def user_backend():`
`177`	`177`	`return json.dumps(result)`
`178`	`178`
`179`	`179`	`if request_type == 'register':`
`180`		`- # iat_type = param_dict.get("iat_type")`
`181`	`180`	`response = adapter.ChatCompletion.create_register(`
`182`	`181`	`model=model`
`183`	`182`	`)`
Original file line number	Diff line number	Diff line change
`@@ -212,6 +212,7 @@ def import_data(`
`212`	`212`	`cache_datas.append([ans, question, embedding_data, model])`
`213`	`213`
`214`	`214`	`ids = self.s.batch_insert(cache_datas)`
	`215`	`+ print('ids: {}'.format(ids))`
`215`	`216`	`logging.info('ids: {}'.format(ids))`
`216`	`217`	`self.v.mul_add(`
`217`	`218`	`[`