File tree
1,253 files changed
+678745
-0
lines changed- database
- eval
- chat_benchmarks
- HumanEval
- data
- human_eval
- utils
- IFEval
- data
- MBPP
- data
- human_eval
- utils
- MTBench
- .github
- workflows
- assets
- docker
- docs
- commands
- fastchat
- data
- llm_judge
- data
- mt_bench
- misc
- model_answer
- model_judgment
- reference_answer
- vicuna_bench
- reference_answer
- model
- modules
- protocol
- serve
- example_images
- gateway
- monitor
- classify
- dataset_release_scripts
- arena_33k
- lmsys_chat_1m
- vote_time_stats
- vision
- train
- playground
- benchmark
- test_embedding
- scripts
- tests
- MixEval
- client
- mix_eval
- api
- data
- mixeval-2024-06-01
- mixeval-hard
- mixeval
- mixeval-2024-08-11
- mixeval-hard
- mixeval
- models
- prompts
- utils
- RepoBench
- archive_data
- assets
- data
- data
- evaluation
- WildBench
- .github
- ISSUE_TEMPLATE
- workflows
- docs
- css
- addons
- modules
- fonts
- images
- ico_example
- icons
- placehold/slides
- js
- addons
- min
- modules
- static/images
- evaluation
- leaderboard
- data_dir
- scripts
- src
- openai_batch_eval
- alpaca_eval
- .github/workflows
- client_configs
- docs
- data_AlpacaEval_2
- data_AlpacaEval
- figures
- scripts
- src/alpaca_eval
- annotators
- decoders
- evaluators_configs
- LlaMa-3-405B-SambaNova
- LlaMa-3-70B-SambaNova
- LlaMa-3-8B-SambaNova
- alpaca_eval_clf_cot_gpt4_turbo
- alpaca_eval_clf_gpt4_turbo
- alpaca_eval_cot_gpt4_turbo_fn
- alpaca_eval_gpt4_0314
- alpaca_eval_gpt4_0613
- alpaca_eval_gpt4_fn
- alpaca_eval_gpt4_turbo_fn
- alpaca_eval_gpt4
- alpaca_eval_llama3_70b_fn
- alpaca_eval_vllm_llama3_70b_fn
- alpaca_farm_greedy_gpt4
- alpaca_farm
- aviary_gpt4
- bedrock_claude_2
- bedrock_claude
- chatgpt_fn
- chatgpt
- claude_2
- claude_3_opus_ranking
- claude_ranking
- claude
- cohere
- gpt-3.5-turbo-1106_ranking
- gpt35_turbo_instruct
- gpt4_turbo_clf
- gpt4_turbo_cot_clf
- gpt4_turbo_cot_logprob
- gpt4_turbo_logprob
- gpt4_turbo
- gpt4
- guanaco_33b
- improved_aviary_gpt4
- improved_lmsys_gpt4
- lmsys_gpt4
- mistral-large-2402_ranking
- oasst_pythia_12b
- test
- text_davinci_003
- weighted_alpaca_eval_cot_gpt4_turbo
- weighted_alpaca_eval_gpt-4o-mini-2024-07-18
- weighted_alpaca_eval_gpt4_turbo_new
- weighted_alpaca_eval_gpt4_turbo
- leaderboards
- data_AlpacaEval_2
- data_AlpacaEval
- evaluators
- metrics
- weights
- claude_3_opus_ranking/length_controlled_v1
- mistral-large-2402_ranking/length_controlled_v1
- weighted_alpaca_eval_gpt4_turbo/length_controlled_v1
- models_configs
- Conifer-7B-DPO
- Contextual-KTO-Mistral-PairRM-Verified
- Contextual-KTO-Mistral-PairRM
- Ein-70B-v0.1
- FsfairX-Zephyr-Chat-v0.1
- Infinity-Instruct-3M-0613-Llama3-70B
- Infinity-Instruct-3M-0613-Mistral-7B
- Infinity-Instruct-3M-0625-Llama3-70B
- Infinity-Instruct-3M-0625-Llama3-8B
- Infinity-Instruct-3M-0625-Mistral-7B
- Infinity-Instruct-3M-0625-Qwen2-7B
- Infinity-Instruct-3M-0625-Yi-1.5-9B
- Infinity-Instruct-7M-Gen-Llama3_1-70B
- Infinity-Instruct-7M-Gen-Llama3_1-8B
- Infinity-Instruct-7M-Gen-mistral-7B
- LMCocktail-10.7B-v1
- Llama-3-Instruct-8B-SimPO-ExPO
- Llama-3-Instruct-8B-SimPO
- Llama-3-Instruct-8B-WPO-HB-v2
- Llama3-PBM-Nova-70B
- Meta-Llama-3-70B-Instruct
- Meta-Llama-3-8B-Instruct
- Meta-Llama-3.1-405B-Instruct-Turbo
- Meta-Llama-3.1-70B-Instruct-Turbo
- Meta-Llama-3.1-8B-Instruct-Turbo
- Mistral-7B+RAHF-DUAL+LoRA
- Mistral-7B-Instruct-v0.2
- Mistral-7B-Instruct-v0.3
- Mistral-7B-ReMax-v0.1
- Mixtral-8x22B-Instruct-v0.1
- Mixtral-8x7B-Instruct-v0.1_concise
- Mixtral-8x7B-Instruct-v0.1_verbose
- Mixtral-8x7B-Instruct-v0.1
- Nanbeige-Plus-Chat-v0.1
- Nanbeige2-16B-Chat
- Nanbeige2-8B-Chat
- OpenHermes-2.5-Mistral-7B
- Qwen-14B-Chat
- Qwen1.5-1.8B-Chat
- Qwen1.5-110B-Chat
- Qwen1.5-14B-Chat
- Qwen1.5-72B-Chat
- Qwen1.5-7B-Chat
- Qwen2-72B-Instruct
- REBEL-Llama-3-8B-Instruct-Armo
- REBEL-Llama-3-8B-Instruct
- SPPO-Gemma-2-9B-It-PairRM
- SPPO-Llama-3-Instruct-8B-PairRM
- SPPO-Mistral7B-PairRM-ExPO
- SPPO-Mistral7B-PairRM
- Samba-CoE-v0.1
- Samba-CoE-v0.2-best-of-16
- Samba-CoE-v0.2
- Shopee-SlimMoA-v1
- Snorkel-Mistral-PairRM-DPO-best-of-16
- Snorkel-Mistral-PairRM-DPO
- Starling-LM-7B-alpha-ExPO
- Starling-LM-7B-alpha
- Starling-LM-7B-beta-ExPO
- Storm-7B-best-of-64
- Storm-7B
- TempNet-LLaMA2-Chat-13B-v0.1
- TempNet-LLaMA2-Chat-70B-v0.1
- TempNet-LLaMA2-Chat-7B-v0.1
- Together-MoA-Lite
- Together-MoA
- Yi-34B-Chat-Verified
- Yi-34B-Chat
- airoboros-33b
- airoboros-65b
- aligner-2b_claude-3-opus-20240229
- aligner-2b_gpt-4-turbo-2024-04-09
- aligner-2b_qwen1.5-72b-chat
- alpaca-7b-neft
- alpaca-7b_concise
- alpaca-7b_verbose
- alpaca-7b
- alpaca-farm-ppo-human
- alpaca-farm-ppo-sim-gpt4-20k
- baichuan-13b-chat
- baize-v2-13b
- baize-v2-7b
- bedrock_claude_2
- bedrock_claude
- blendaxai-gm-l3-v35
- blendaxai-gm-l6-vo31
- causallm-14b
- chatglm2-6b
- claude-2.1_concise
- claude-2.1_verbose
- claude-2.1
- claude-2
- claude-3-5-sonnet-20240620
- claude-3-opus-20240229
- claude-3-sonnet-20240229
- claude-instant-1.2
- claude2-alpaca-13b
- claude
- cohere
- cut-13b
- dbrx-instruct
- deepseek-llm-67b-chat
- deita-7b-v1.0
- dolphin-2.2.1-mistral-7b
- evo-7b
- evo-v2-7b
- falcon-40b-instruct
- falcon-7b-instruct
- gemini-pro
- gemma-2-9b-it-DPO
- gemma-2-9b-it-SimPO
- gemma-2-9b-it-WPO-HB
- gemma-2b-it
- gemma-7b-it
- ghost-7b-alpha
- ghost-8b-beta-disl-0x5
- gpt-3.5-turbo-0301
- gpt-3.5-turbo-0613
- gpt-3.5-turbo-1106_concise
- gpt-3.5-turbo-1106_verbose
- gpt-3.5-turbo-1106
- gpt-3.5-turbo-16k-0613
- gpt-4-0125-preview
- gpt-4-turbo-2024-04-09
- gpt-4o-2024-05-13
- gpt-4o-2024-08-06
- gpt-4o-mini-2024-07-18
- gpt35_turbo_instruct
- gpt4_0314
- gpt4_0613_concise
- gpt4_0613_verbose
- gpt4_0613
- gpt4_1106_preview_concise
- gpt4_1106_preview_verbose
- gpt4_1106_preview
- gpt4_gamed
- gpt4
- guanaco-13b
- guanaco-33b-api
- guanaco-33b
- guanaco-65b
- guanaco-7b
- higgs-llama-3-70b-v2
- humpback-llama-65b
- humpback-llama2-70b
- internlm2-chat-20b-ExPO
- internlm2-chat-20b-ppo
- internlm2-chat-7b-ExPO
- jina-chat
- llama-2-13b-chat-hf
- llama-2-70b-chat-hf
- llama-2-7b-chat-hf
- llama-2-chat-7b-evol70k-neft
- merlinite-7B-AOT
- minichat-1.5-3b
- minichat-3b
- minotaur-13b
- mistral-large-2402
- mistral-medium
- mistral-orpo-beta
- nous-hermes-13b
- oasst-rlhf-llama-33b
- oasst-sft-llama-33b
- oasst-sft-pythia-12b
- openbuddy-falcon-40b-v9
- openbuddy-falcon-7b-v6
- openbuddy-llama-30b-v7.1
- openbuddy-llama-65b-v8
- openbuddy-llama2-13b-v11.1
- openbuddy-llama2-70b-v10.1
- openchat-13b
- openchat-v2-13b
- openchat-v2-w-13b
- openchat-v3.1-13b
- openchat8192-13b
- opencoderplus-15b
- openpipe-moa-gpt-4-turbo-v1
- pairrm-Yi-34B-Chat
- pairrm-tulu-2-13b
- pairrm-tulu-2-70b
- pairrm-zephyr-7b-beta
- phi-2-dpo
- phi-2-sft
- phi-2
- platolm-7b
- pythia-12b-mix-sft
- recycled-wizardlm-7b-v1.0
- recycled-wizardlm-7b-v2.0
- text_davinci_001
- text_davinci_003
- tulu-2-dpo-13b-ExPO
- tulu-2-dpo-13b
- tulu-2-dpo-70b-ExPO
- tulu-2-dpo-70b
- tulu-2-dpo-7b-ExPO
- tulu-2-dpo-7b
- ultralm-13b-best-of-16
- ultralm-13b-v2.0-best-of-16
- ultralm-13b-v2.0
- ultralm-13b
- vicuna-13b-v1.3
- vicuna-13b-v1.5-togetherai
- vicuna-13b-v1.5
- vicuna-13b
- vicuna-33b-v1.3
- vicuna-7b-v1.3
- vicuna-7b-v1.5
- vicuna-7b
- wizardlm-13b-v1.1
- wizardlm-13b-v1.2
- wizardlm-13b
- wizardlm-70b
- xwinlm-13b-v0.1
- xwinlm-70b-v0.1
- xwinlm-70b-v0.3
- xwinlm-7b-v0.1
- yi-large-preview
- zephyr-7b-alpha-ExPO
- zephyr-7b-alpha
- zephyr-7b-beta-ExPO
- zephyr-7b-beta
- tests
- integration_tests
- zeroeval
- .github/workflows
- data_prep
- docs
- zebra
- scripts
- local
- src
- evaluation
- legacy
- templates
- state_of_limit
- html
- examples
Some content is hidden
Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.
1,253 files changed
+678745
-0
lines changedOriginal file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
| 1 | + | |
| 2 | + | |
| 3 | + | |
| 4 | + | |
| 5 | + | |
| 6 | + | |
| 7 | + | |
| 8 | + | |
| 9 | + | |
| 10 | + | |
| 11 | + | |
| 12 | + | |
| 13 | + | |
| 14 | + | |
| 15 | + | |
| 16 | + | |
| 17 | + | |
| 18 | + | |
| 19 | + | |
| 20 | + | |
| 21 | + | |
| 22 | + | |
| 23 | + | |
| 24 | + | |
| 25 | + | |
| 26 | + | |
| 27 | + | |
| 28 | + | |
| 29 | + | |
| 30 | + | |
| 31 | + | |
| 32 | + | |
| 33 | + | |
| 34 | + | |
| 35 | + | |
| 36 | + | |
| 37 | + | |
| 38 | + | |
| 39 | + | |
| 40 | + | |
| 41 | + | |
| 42 | + | |
| 43 | + | |
| 44 | + | |
| 45 | + | |
| 46 | + | |
| 47 | + | |
| 48 | + | |
| 49 | + | |
| 50 | + | |
| 51 | + | |
| 52 | + | |
| 53 | + | |
| 54 | + | |
| 55 | + | |
| 56 | + | |
| 57 | + | |
| 58 | + | |
| 59 | + | |
| 60 | + | |
| 61 | + | |
| 62 | + | |
| 63 | + | |
| 64 | + | |
| 65 | + | |
| 66 | + | |
| 67 | + | |
| 68 | + | |
| 69 | + | |
| 70 | + | |
| 71 | + | |
| 72 | + | |
| 73 | + | |
| 74 | + | |
| 75 | + | |
| 76 | + | |
| 77 | + | |
| 78 | + | |
| 79 | + | |
| 80 | + | |
| 81 | + | |
| 82 | + | |
| 83 | + | |
| 84 | + | |
| 85 | + | |
| 86 | + | |
| 87 | + | |
| 88 | + | |
| 89 | + | |
| 90 | + | |
| 91 | + | |
| 92 | + | |
| 93 | + | |
| 94 | + | |
| 95 | + | |
| 96 | + | |
| 97 | + | |
| 98 | + | |
| 99 | + | |
| 100 | + | |
| 101 | + | |
| 102 | + | |
| 103 | + | |
| 104 | + | |
| 105 | + | |
| 106 | + | |
| 107 | + | |
| 108 | + | |
| 109 | + | |
| 110 | + | |
| 111 | + | |
| 112 | + | |
| 113 | + | |
| 114 | + | |
| 115 | + | |
| 116 | + | |
| 117 | + | |
| 118 | + | |
| 119 | + | |
| 120 | + | |
| 121 | + | |
| 122 | + | |
| 123 | + | |
| 124 | + | |
| 125 | + | |
| 126 | + | |
| 127 | + | |
| 128 | + | |
| 129 | + | |
| 130 | + | |
| 131 | + | |
| 132 | + | |
| 133 | + | |
| 134 | + | |
| 135 | + | |
| 136 | + | |
| 137 | + | |
| 138 | + | |
| 139 | + | |
| 140 | + | |
| 141 | + | |
| 142 | + | |
| 143 | + | |
| 144 | + | |
| 145 | + | |
| 146 | + | |
| 147 | + | |
| 148 | + | |
| 149 | + | |
| 150 | + | |
| 151 | + | |
| 152 | + | |
| 153 | + | |
| 154 | + | |
| 155 | + | |
| 156 | + | |
| 157 | + | |
| 158 | + | |
| 159 | + | |
| 160 | + | |
| 161 | + | |
| 162 | + | |
| 163 | + | |
| 164 | + | |
| 165 | + | |
| 166 | + | |
| 167 | + | |
| 168 | + | |
| 169 | + | |
| 170 | + | |
| 171 | + | |
| 172 | + | |
| 173 | + | |
| 174 | + | |
| 175 | + | |
| 176 | + | |
| 177 | + | |
| 178 | + | |
| 179 | + | |
| 180 | + | |
| 181 | + | |
| 182 | + | |
| 183 | + | |
| 184 | + | |
| 185 | + | |
| 186 | + | |
| 187 | + | |
| 188 | + | |
| 189 | + | |
| 190 | + | |
| 191 | + | |
| 192 | + | |
| 193 | + | |
| 194 | + | |
| 195 | + | |
| 196 | + | |
| 197 | + | |
| 198 | + | |
| 199 | + | |
| 200 | + | |
| 201 | + | |
| 202 | + | |
| 203 | + | |
| 204 | + | |
| 205 | + | |
| 206 | + | |
| 207 | + | |
| 208 | + | |
| 209 | + | |
| 210 | + | |
| 211 | + | |
| 212 | + | |
| 213 | + | |
| 214 | + | |
| 215 | + | |
| 216 | + | |
| 217 | + | |
| 218 | + | |
| 219 | + | |
| 220 | + | |
| 221 | + | |
| 222 | + | |
| 223 | + | |
| 224 | + | |
| 225 | + | |
| 226 | + | |
| 227 | + |
0 commit comments