2 files changed: +5 -7 lines changed
Original file line number Diff line number Diff line change
3636 - name : Setup model server
3737 run : |
3838 curl -fsSL https://ollama.com/install.sh | sh
39- export OLLAMA_NUM_PARALLEL=2
40- export OLLAMA_FLASH_ATTENTION=1
41- export OLLAMA_KV_CACHE_TYPE=q4_0
4239 ollama serve &
4340 sleep 5
4441 curl http://localhost:11434/api/generate -d '{"model": "llama3.2:3b", "keep_alive": -1}'
Original file line number Diff line number Diff line change
1616
1717const std::vector<std::string> question_bank =
1818{
19- " what is the capital of the united states ?" ,
20- " who was the 20th president of the united states ?" ,
21- " what state is minneapolis in ?"
19+ " be very brief; what is the capital of the united states ?" ,
20+ " be very brief; who was the 20th president of the united states ?" ,
21+ " be very brief; what state is minneapolis in ?"
2222};
2323
2424class PipeliningTest : public ::testing::Test
@@ -255,7 +255,8 @@ TEST_F(PipeliningTest, TestStreamingAndPipelining)
255255 vx_size size = question_bank.size ();
256256 std::vector<vx_array> in_arrs (size);
257257 std::vector<vx_array> out_arrs (size);
258- for (vx_size i = 0 ; i < size; ++i) {
258+ for (vx_size i = 0 ; i < size; ++i)
259+ {
259260 in_arrs[i] = vxCreateArray (context, VX_TYPE_CHAR, VX_MAX_FILE_NAME);
260261 out_arrs[i] = vxCreateArray (context, VX_TYPE_CHAR, VX_MAX_FILE_NAME);
261262 ASSERT_EQ (vxGetStatus (in_arrs[i]), VX_SUCCESS);
You can’t perform that action at this time.
0 commit comments