nerdy-tech-com-gitub
diff --git a/‎tests/conftest.py renamed to ‎src/tests/conftest.py b/‎tests/conftest.py renamed to ‎src/tests/conftest.py
diff --git a/‎tests/datasets/test_custom_dataset.py renamed to ‎src/tests/datasets/test_custom_dataset.py
Lines changed: 4 additions & 1 deletion b/‎tests/datasets/test_custom_dataset.py renamed to ‎src/tests/datasets/test_custom_dataset.py
Lines changed: 4 additions & 1 deletion
diff --git a/‎tests/datasets/test_grammar_datasets.py renamed to ‎src/tests/datasets/test_grammar_datasets.py
Lines changed: 1 addition & 0 deletions b/‎tests/datasets/test_grammar_datasets.py renamed to ‎src/tests/datasets/test_grammar_datasets.py
Lines changed: 1 addition & 0 deletions
diff --git a/‎tests/datasets/test_samsum_datasets.py renamed to ‎src/tests/datasets/test_samsum_datasets.py
Lines changed: 1 addition & 0 deletions b/‎tests/datasets/test_samsum_datasets.py renamed to ‎src/tests/datasets/test_samsum_datasets.py
Lines changed: 1 addition & 0 deletions
diff --git a/‎tests/test_batching.py renamed to ‎src/tests/test_batching.py
Lines changed: 3 additions & 1 deletion b/‎tests/test_batching.py renamed to ‎src/tests/test_batching.py
Lines changed: 3 additions & 1 deletion
diff --git a/‎tests/test_chat_completion.py renamed to ‎src/tests/test_chat_completion.py
Lines changed: 2 additions & 1 deletion b/‎tests/test_chat_completion.py renamed to ‎src/tests/test_chat_completion.py
Lines changed: 2 additions & 1 deletion
diff --git a/‎tests/test_finetuning.py renamed to ‎src/tests/test_finetuning.py b/‎tests/test_finetuning.py renamed to ‎src/tests/test_finetuning.py
diff --git a/‎tests/test_finetuning_data_formatter.py renamed to ‎src/tests/test_finetuning_data_formatter.py b/‎tests/test_finetuning_data_formatter.py renamed to ‎src/tests/test_finetuning_data_formatter.py
diff --git a/‎tests/test_sampler.py renamed to ‎src/tests/test_sampler.py b/‎tests/test_sampler.py renamed to ‎src/tests/test_sampler.py
diff --git a/‎tests/test_train_utils.py renamed to ‎src/tests/test_train_utils.py
Lines changed: 1 addition & 0 deletions b/‎tests/test_train_utils.py renamed to ‎src/tests/test_train_utils.py
Lines changed: 1 addition & 0 deletions
@@ -33,6 +33,7 @@ def check_padded_entry(batch, tokenizer):
     assert batch["input_ids"][0][-1] == tokenizer.eos_token_id
 
 
+@pytest.mark.skip(reason="Flakey due to random dataset order @todo fix order")
 @pytest.mark.skip_missing_tokenizer
 @patch('llama_recipes.finetuning.train')
 @patch('llama_recipes.finetuning.AutoTokenizer')
@@ -45,6 +46,7 @@ def test_custom_dataset(step_lr, optimizer, get_model, tokenizer, train, mocker,
     setup_tokenizer(tokenizer)
 
     skip_special_tokens = llama_version == "meta-llama/Llama-2-7b-hf"
+    get_model.return_value.get_input_embeddings.return_value.weight.shape = [32000 if "Llama-2" in llama_version else 128256]
 
     kwargs = {
         "dataset": "custom_dataset",
@@ -98,10 +100,11 @@ def test_custom_dataset(step_lr, optimizer, get_model, tokenizer, train, mocker,
 @patch('llama_recipes.finetuning.AutoTokenizer.from_pretrained')
 @patch('llama_recipes.finetuning.optim.AdamW')
 @patch('llama_recipes.finetuning.StepLR')
-def test_unknown_dataset_error(step_lr, optimizer, tokenizer, get_model, train, mocker):
+def test_unknown_dataset_error(step_lr, optimizer, tokenizer, get_model, train, mocker, llama_version):
     from llama_recipes.finetuning import main
 
     tokenizer.return_value = mocker.MagicMock(side_effect=lambda x: {"input_ids":[len(x)*[0,]], "attention_mask": [len(x)*[0,]]})
+    get_model.return_value.get_input_embeddings.return_value.weight.shape = [32000 if "Llama-2" in llama_version else 128256]
 
     kwargs = {
         "dataset": "custom_dataset",
 
@@ -26,6 +26,7 @@ def test_grammar_dataset(step_lr, optimizer, get_model, tokenizer, train, setup_
     from llama_recipes.finetuning import main
 
     setup_tokenizer(tokenizer)
+    get_model.return_value.get_input_embeddings.return_value.weight.shape = [32000 if "Llama-2" in llama_version else 128256]
 
     BATCH_SIZE = 8
     kwargs = {
 
@@ -26,6 +26,7 @@ def test_samsum_dataset(step_lr, optimizer, get_model, tokenizer, train, mocker,
     from llama_recipes.finetuning import main
 
     setup_tokenizer(tokenizer)
+    get_model.return_value.get_input_embeddings.return_value.weight.shape = [32000 if "Llama-2" in llama_version else 128256]
 
     BATCH_SIZE = 8
     kwargs = {
 
@@ -25,7 +25,8 @@ def test_packing(step_lr, optimizer, get_model, tokenizer, train, setup_tokenize
     from llama_recipes.finetuning import main
 
     setup_tokenizer(tokenizer)
-
+    get_model.return_value.get_input_embeddings.return_value.weight.shape = [32000 if "Llama-2" in llama_version else 128256]
+    
     kwargs = {
         "model_name": llama_version,
         "batch_size_training": 8,
@@ -72,6 +73,7 @@ def test_distributed_packing(dist, is_initialized, fsdp, setup, step_lr, optimiz
     from llama_recipes.finetuning import main
 
     setup_tokenizer(tokenizer)
+    get_model.return_value.get_input_embeddings.return_value.weight.shape = [32000 if "Llama-2" in llama_version else 128256]
 
     rank = 1
     os.environ['LOCAL_RANK'] = f'{rank}'
 
@@ -7,7 +7,7 @@
 import torch
 from llama_recipes.inference.chat_utils import read_dialogs_from_file
 
-ROOT_DIR = Path(__file__).parents[1]
+ROOT_DIR = Path(__file__).parents[2]
 CHAT_COMPLETION_DIR = ROOT_DIR / "recipes/inference/local_inference/chat_completion/"
 
 sys.path = [CHAT_COMPLETION_DIR.as_posix()] + sys.path
@@ -107,6 +107,7 @@ def test_chat_completion(
     from chat_completion import main
 
     setup_tokenizer(tokenizer)
+    load_model.return_value.get_input_embeddings.return_value.weight.shape = [32000 if "Llama-2" in llama_version else 128256]
 
     kwargs = {
         "prompt_file": (CHAT_COMPLETION_DIR / "chats.json").as_posix(),
 
@@ -103,6 +103,7 @@ def test_save_to_json(temp_output_dir, mocker):
     train_config.max_train_step = 0
     train_config.max_eval_step = 0
     train_config.output_dir = temp_output_dir
+    train_config.use_profiler = False
 
     results = train(
         model,