Skip to content

Commit 822dc7f

Browse files
committed
Update
1 parent 90b321c commit 822dc7f

File tree

11 files changed: 29 additions and 608 deletions.

result.txt

Whitespace-only changes.

run.sh

Lines changed: 0 additions & 253 deletions
This file was deleted.

scripts/prepare_ruler.sh

Lines changed: 0 additions & 53 deletions
This file was deleted.

scripts/run_selfspec.sh

Lines changed: 0 additions & 58 deletions
This file was deleted.

tests/SnapKV/longspec_benchmark.py

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -63,9 +63,9 @@
6363
if rank != args.rank_group[0]:
6464
print = lambda *args, **kwargs: None
6565

66-
if rank == 0:
67-
with open("result.txt", "a") as file:
68-
file.write(f"Prefix:{args.prefix_len}; Bsz:{args.B}; Gamma:{args.gamma}\n")
66+
# if rank == 0:
67+
# with open("result.txt", "a") as file:
68+
# file.write(f"Prefix:{args.prefix_len}; Bsz:{args.B}; Gamma:{args.gamma}\n")
6969

7070
setup_seed(args.seed)
7171
print(f"Using device={DEVICE}")
@@ -316,7 +316,7 @@
316316
if use_tp:
317317
dist.barrier()
318318

319-
if rank == 0:
320-
with open("result.txt", "a") as file:
321-
file.write("total time :{:.5f}s, time per iter :{:.5f}s, decoding step: {}, large model step: {}, avg latency: {} \n".format(total_time, total_time / target_steps, num_gen_tokens, target_steps, total_time / num_gen_tokens * BATCH_SIZE))
322-
file.write("target time :{:.5f}s, draft time :{:.5f}s, verify loop : {}, avg generate len per sentence: {} \n".format(target_time/target_steps, draft_time / target_steps, verify_loop/target_steps, num_gen_tokens/target_steps/BATCH_SIZE))
319+
# if rank == 0:
320+
# with open("result.txt", "a") as file:
321+
# file.write("total time :{:.5f}s, time per iter :{:.5f}s, decoding step: {}, large model step: {}, avg latency: {} \n".format(total_time, total_time / target_steps, num_gen_tokens, target_steps, total_time / num_gen_tokens * BATCH_SIZE))
322+
# file.write("target time :{:.5f}s, draft time :{:.5f}s, verify loop : {}, avg generate len per sentence: {} \n".format(target_time/target_steps, draft_time / target_steps, verify_loop/target_steps, num_gen_tokens/target_steps/BATCH_SIZE))

tests/SnapKV/selfspec_benchmark.py

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -51,9 +51,9 @@
5151
if rank != args.rank_group[0]:
5252
print = lambda *args, **kwargs: None
5353

54-
if rank == 0:
55-
with open("result.txt", "a") as file:
56-
file.write(f"SnapKV-Selfspec: Prefix:{args.prefix_len}; Bsz:{args.B}; Gamma:{args.gamma}; Draft budget:{args.draft_budget}\n")
54+
# if rank == 0:
55+
# with open("result.txt", "a") as file:
56+
# file.write(f"SnapKV-Selfspec: Prefix:{args.prefix_len}; Bsz:{args.B}; Gamma:{args.gamma}; Draft budget:{args.draft_budget}\n")
5757

5858
setup_seed(args.seed)
5959
print(f"Using device={DEVICE}")
@@ -232,7 +232,7 @@
232232
if use_tp:
233233
dist.barrier()
234234

235-
if rank == 0:
236-
with open("result.txt", "a") as file:
237-
file.write("total time :{:.5f}s, time per iter :{:.5f}s, decoding step: {}, large model step: {}, avg latency: {} \n".format(total_time, total_time / target_steps, num_gen_tokens, target_steps, total_time / num_gen_tokens * BATCH_SIZE))
238-
file.write("target time :{:.5f}s, draft time :{:.5f}s, verify loop : {}, avg generate len per sentence: {} \n".format(target_time/target_steps, draft_time / target_steps, verify_loop/target_steps, num_gen_tokens/target_steps/BATCH_SIZE))
235+
# if rank == 0:
236+
# with open("result.txt", "a") as file:
237+
# file.write("total time :{:.5f}s, time per iter :{:.5f}s, decoding step: {}, large model step: {}, avg latency: {} \n".format(total_time, total_time / target_steps, num_gen_tokens, target_steps, total_time / num_gen_tokens * BATCH_SIZE))
238+
# file.write("target time :{:.5f}s, draft time :{:.5f}s, verify loop : {}, avg generate len per sentence: {} \n".format(target_time/target_steps, draft_time / target_steps, verify_loop/target_steps, num_gen_tokens/target_steps/BATCH_SIZE))

tests/StreamingLLM/longspec_benchmark.py

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -60,9 +60,9 @@
6060
if rank != args.rank_group[0]:
6161
print = lambda *args, **kwargs: None
6262

63-
if rank == 0:
64-
with open("result.txt", "a") as file:
65-
file.write(f"Prefix:{args.prefix_len}; Bsz:{args.B}; Gamma:{args.gamma}; Draft budget:{args.draft_budget}\n")
63+
# if rank == 0:
64+
# with open("result.txt", "a") as file:
65+
# file.write(f"Prefix:{args.prefix_len}; Bsz:{args.B}; Gamma:{args.gamma}; Draft budget:{args.draft_budget}\n")
6666

6767
setup_seed(args.seed)
6868
print(f"Using device={DEVICE}")
@@ -313,7 +313,7 @@
313313
if use_tp:
314314
dist.barrier()
315315

316-
if rank == 0:
317-
with open("result.txt", "a") as file:
318-
file.write("total time :{:.5f}s, time per iter :{:.5f}s, decoding step: {}, large model step: {}, avg latency: {} \n".format(total_time, total_time / target_steps, num_gen_tokens, target_steps, total_time / num_gen_tokens * BATCH_SIZE))
319-
file.write("target time :{:.5f}s, draft time :{:.5f}s, verify loop : {}, avg generate len per sentence: {} \n".format(target_time/target_steps, draft_time / target_steps, verify_loop/target_steps, num_gen_tokens/target_steps/BATCH_SIZE))
316+
# if rank == 0:
317+
# with open("result.txt", "a") as file:
318+
# file.write("total time :{:.5f}s, time per iter :{:.5f}s, decoding step: {}, large model step: {}, avg latency: {} \n".format(total_time, total_time / target_steps, num_gen_tokens, target_steps, total_time / num_gen_tokens * BATCH_SIZE))
319+
# file.write("target time :{:.5f}s, draft time :{:.5f}s, verify loop : {}, avg generate len per sentence: {} \n".format(target_time/target_steps, draft_time / target_steps, verify_loop/target_steps, num_gen_tokens/target_steps/BATCH_SIZE))

tests/StreamingLLM/selfspec_benchmark.py

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -48,9 +48,9 @@
4848
if rank != args.rank_group[0]:
4949
print = lambda *args, **kwargs: None
5050

51-
if rank == 0:
52-
with open("result.txt", "a") as file:
53-
file.write(f"Selfspec: Prefix:{args.prefix_len}; Bsz:{args.B}; Gamma:{args.gamma}; Draft budget:{args.draft_budget}\n")
51+
# if rank == 0:
52+
# with open("result.txt", "a") as file:
53+
# file.write(f"Selfspec: Prefix:{args.prefix_len}; Bsz:{args.B}; Gamma:{args.gamma}; Draft budget:{args.draft_budget}\n")
5454

5555

5656
setup_seed(args.seed)
@@ -259,7 +259,7 @@
259259
if use_tp:
260260
dist.barrier()
261261

262-
if rank == 0:
263-
with open("result.txt", "a") as file:
264-
file.write("total time :{:.5f}s, time per iter :{:.5f}s, decoding step: {}, large model step: {}, avg latency: {} \n".format(total_time, total_time / target_steps, num_gen_tokens, target_steps, total_time / num_gen_tokens * BATCH_SIZE))
265-
file.write("target time :{:.5f}s, draft time :{:.5f}s, verify loop : {}, avg generate len per sentence: {} \n".format(target_time/target_steps, draft_time / target_steps, verify_loop/target_steps, num_gen_tokens/target_steps/BATCH_SIZE))
262+
# if rank == 0:
263+
# with open("result.txt", "a") as file:
264+
# file.write("total time :{:.5f}s, time per iter :{:.5f}s, decoding step: {}, large model step: {}, avg latency: {} \n".format(total_time, total_time / target_steps, num_gen_tokens, target_steps, total_time / num_gen_tokens * BATCH_SIZE))
265+
# file.write("target time :{:.5f}s, draft time :{:.5f}s, verify loop : {}, avg generate len per sentence: {} \n".format(target_time/target_steps, draft_time / target_steps, verify_loop/target_steps, num_gen_tokens/target_steps/BATCH_SIZE))

tests/baseline_benchmark.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -95,7 +95,7 @@
9595
for i in range(BATCH_SIZE):
9696
print(tokenizer.decode(output[i, args.prefix_len:]))
9797
print(f"Tokens per second :{total_time/model_steps}")
98-
if step < 10:
98+
if step < 5:
9999
total_time = 0.0
100100
model_steps = 0
101101
if use_tp:

tests/test.py

Lines changed: 0 additions & 107 deletions
This file was deleted.

0 commit comments

Comments
 (0)