Skip to content

Latest commit

 

History

History
55 lines (48 loc) · 4.13 KB

File metadata and controls

55 lines (48 loc) · 4.13 KB

# Baseline performance: llama3_baseline vs. the recursive-splitter + Chroma (top-3) run

python evaluation/evaluate.py --combined_dir output/llama3_baseline.csv --output_dir results/llama3_baseline.json
python evaluation/evaluate.py --combined_dir output/llama3_recursive_chroma_top3.csv --output_dir results/llama3_recursive_chroma_top3.json

# Hyperparameter tuning: chunk size (unlabelled default, 500, 750, 1500, 2000) on the 100-sample subset

python evaluation/evaluate.py --combined_dir output/llama3_recursive_chroma_top3_sample100.csv --output_dir results/llama3_recursive_chroma_top3_sample100.json
python evaluation/evaluate.py --combined_dir output/llama3_recursive_chunk2000_chroma_top3_sample100.csv --output_dir results/llama3_recursive_chunk2000_chroma_top3_sample100.json
python evaluation/evaluate.py --combined_dir output/llama3_recursive_chunk500_chroma_top3_sample100.csv --output_dir results/llama3_recursive_chunk500_chroma_top3_sample100.json
python evaluation/evaluate.py --combined_dir output/llama3_recursive_chunk750_chroma_top3_sample100.csv --output_dir results/llama3_recursive_chunk750_chroma_top3_sample100.json
python evaluation/evaluate.py --combined_dir output/llama3_recursive_chunk1500_chroma_top3_sample100.csv --output_dir results/llama3_recursive_chunk1500_chroma_top3_sample100.json

# Hyperparameter tuning: text splitter (character, token, semantic) on the 100-sample subset

python evaluation/evaluate.py --combined_dir output/llama3_character_chroma_top3_sample100.csv --output_dir results/llama3_character_chroma_top3_sample100.json
python evaluation/evaluate.py --combined_dir output/llama3_tokensplit_chroma_top3_sample100.csv --output_dir results/llama3_tokensplit_chroma_top3_sample100.json
python evaluation/evaluate.py --combined_dir output/llama3_semantic_chroma_top3_sample100.csv --output_dir results/llama3_semantic_chroma_top3_sample100.json

# Tuning reranking with the FAISS retriever (no rerank, rerank, T5 rerank, MiniLM rerank)

python evaluation/evaluate.py --combined_dir output/llama3_faiss_test.csv --output_dir results/llama3_faiss_test.json
python evaluation/evaluate.py --combined_dir output/llama3_faiss_test_rerank.csv --output_dir results/llama3_faiss_test_rerank.json
python evaluation/evaluate.py --combined_dir output/llama3_faiss_test_rerank_t5.csv --output_dir results/llama3_faiss_test_rerank_t5.json
python evaluation/evaluate.py --combined_dir output/llama3_faiss_test_rerank_MiniLM.csv --output_dir results/llama3_faiss_test_rerank_MiniLM.json

# Hyperparameter tuning: retriever backend (Chroma vs. FAISS)

python evaluation/evaluate.py --combined_dir output/lhj_100_chroma_all-MiniLM-L6-v2.csv --output_dir results/lhj_100_chroma_all-MiniLM-L6-v2.json
python evaluation/evaluate.py --combined_dir output/lhj_100_faiss_all-MiniLM-L6-v2.csv --output_dir results/lhj_100_faiss_all-MiniLM-L6-v2.json

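# Hyperparameter tuning: retrieval algorithm (FAISS with MMR vs. the plain FAISS run, repeated here from the previous section as the comparison point)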

python evaluation/evaluate.py --combined_dir output/lhj_100_faiss_mmr_all-MiniLM-L6-v2.csv --output_dir results/lhj_100_faiss_mmr_all-MiniLM-L6-v2.json
python evaluation/evaluate.py --combined_dir output/lhj_100_faiss_all-MiniLM-L6-v2.csv --output_dir results/lhj_100_faiss_all-MiniLM-L6-v2.json

# Hyperparameter tuning: retrieval algorithm (similarity vs. MMR) and retriever backend (FAISS vs. Chroma) on the sublink files (1000sublinkfiles runs)

python evaluation/evaluate.py --combined_dir output/lhj_100_1000sublinkfiles_faiss_similarity_all-MiniLM-L6-v2.csv --output_dir results/lhj_100_1000sublinkfiles_faiss_similarity_all-MiniLM-L6-v2.json
python evaluation/evaluate.py --combined_dir output/lhj_100_1000sublinkfiles_faiss_mmr_all-MiniLM-L6-v2.csv --output_dir results/lhj_100_1000sublinkfiles_faiss_mmr_all-MiniLM-L6-v2.json
python evaluation/evaluate.py --combined_dir output/lhj_100_1000sublinkfiles_chroma_similarity_all-MiniLM-L6-v2.csv --output_dir results/lhj_100_1000sublinkfiles_chroma_similarity_all-MiniLM-L6-v2.json
python evaluation/evaluate.py --combined_dir output/lhj_100_1000sublinkfiles_chroma_mmr_all-MiniLM-L6-v2.csv --output_dir results/lhj_100_1000sublinkfiles_chroma_mmr_all-MiniLM-L6-v2.json

# Tuning hypo_doc retrieval (presumably hypothetical-document retrieval; includes the promptENG3 prompt variant)

python evaluation/evaluate.py --combined_dir output/llama3_faiss_test_hypo.csv --output_dir results/llama3_faiss_test_hypo.json
python evaluation/evaluate.py --combined_dir output/llama3_faiss_test_hypo_promptENG3.csv --output_dir results/llama3_faiss_test_hypo_promptENG3.json