@@ -2,8 +2,8 @@ |
2 | 2 | from os import listdir |
3 | 3 | from os.path import exists, join |
4 | 4 |
5 | | -import torch |
6 | 5 | import pandas as pd |
| 6 | +import torch |
7 | 7 | import typer |
8 | 8 | import yaml |
9 | 9 | from pydantic import ValidationError |
@@ -13,10 +13,11 @@ |
13 | 13 | from llmtune.finetune.lora import LoRAFinetune |
14 | 14 | from llmtune.inference.lora import LoRAInference |
15 | 15 | from llmtune.pydantic_models.config_model import Config |
| 16 | +from llmtune.qa.generics import LLMTestSuite, QaTestRegistry |
16 | 17 | from llmtune.ui.rich_ui import RichUI |
17 | 18 | from llmtune.utils.ablation_utils import generate_permutations |
18 | 19 | from llmtune.utils.save_utils import DirectoryHelper |
19 | | -from llmtune.qa.generics import QaTestRegistry, LLMTestSuite |
| 20 | + |
20 | 21 |
21 | 22 | hf_utils.logging.set_verbosity_error() |
22 | 23 | torch._logging.set_logs(all=logging.CRITICAL) |
@@ -82,13 +83,8 @@ def run_one_experiment(config: Config, config_path: str) -> None: |
82 | 83 | tests = QaTestRegistry.create_tests_from_list(llm_tests) |
83 | 84 | # TODO: Load results.csv |
84 | 85 | results_df = pd.read_csv(results_file_path) |
85 | | - prompts = results_df["prompt"].tolist() |
86 | | - ground_truths = results_df["ground_truth"].tolist() |
87 | | - model_preds = results_df["model_prediction"].tolist() |
88 | | - # TODO: Run Unit Tests |
89 | | - test_suite = LLMTestSuite(tests, prompts, ground_truths, model_preds) |
90 | | - # TODO: Save Unit Test Results |
91 | | - test_suite.save_test_results("unit_test_results.csv") |
| 86 | + test_suite = LLMTestSuite.from_csv(results_file_path, tests) |
| 87 | + test_suite.save_test_results(join(qa_path, "unit_test_results.csv")) |
92 | 88 |
93 | 89 |
94 | 90 | @app.command() |
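
Review note: `LLMTestSuite.from_csv` now owns both the CSV parsing and the suite construction, which makes the retained `results_df = pd.read_csv(results_file_path)` line (and its TODO) just above it redundant; it could be dropped in a follow-up. For reference, here is a minimal sketch of what the new classmethod presumably does, reconstructed from the deleted call site. The real implementation lives in `llmtune/qa/generics.py`; the column names and constructor signature are taken from the removed lines, everything else is an assumption:

```python
import pandas as pd


class LLMTestSuite:
    def __init__(self, tests, prompts, ground_truths, model_preds):
        self.tests = tests
        self.prompts = prompts
        self.ground_truths = ground_truths
        self.model_preds = model_preds

    @classmethod
    def from_csv(cls, file_path: str, tests: list) -> "LLMTestSuite":
        # Assumed behavior: read the inference results CSV and pull the
        # same three columns the deleted inline code extracted, then
        # construct the suite positionally as before.
        results_df = pd.read_csv(file_path)
        return cls(
            tests,
            results_df["prompt"].tolist(),
            results_df["ground_truth"].tolist(),
            results_df["model_prediction"].tolist(),
        )
```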