diff --git a/runner/run.cpp b/runner/run.cpp index 52d596749..b90ca4e81 100644 --- a/runner/run.cpp +++ b/runner/run.cpp @@ -835,7 +835,7 @@ int main(int argc, char* argv[]) { float topp = 0.9f; // top-p in nucleus sampling. 1.0 = off. 0.9 works well, // but slower - int steps = 256; // number of steps to run for + int steps = 128; // number of steps to run for const char* prompt = NULL; // prompt string unsigned long long rng_seed = 0; // seed rng with time by default const char* mode = "generate"; // generate|chat