Skip to content

Commit a5f86ac

Browse files
Update generative-proof-of-concept-CPU-preprocessing-in-memory.py
Bypass package_non_instruct_text: assign non_instruct_samples directly from bible[:SAMPLES_TO_CREATE] instead of calling it.
1 parent 4830f23 commit a5f86ac

File tree

1 file changed

+5
-5
lines changed

1 file changed

+5
-5
lines changed

generative-proof-of-concept-CPU-preprocessing-in-memory.py

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -333,12 +333,12 @@ def package_non_instruct_text(text: str, desired_samples: int, max_length_tokens
333333
return samples
334334

335335
# Separate into samples
336-
non_instruct_samples = package_non_instruct_text(text=bible, desired_samples=SAMPLES_TO_CREATE, max_length_tokens=int(np.ceil(MAX_SEQ_LENGTH * .8))) ##
336+
# non_instruct_samples = package_non_instruct_text(text=bible, desired_samples=SAMPLES_TO_CREATE, max_length_tokens=int(np.ceil(MAX_SEQ_LENGTH * .8))) ##
337337

338-
del(bible)
339-
collect()
340-
341-
print(f"Samples from KJV bible consisting of {len(non_instruct_samples)} look like this (sub-sample of 3): {non_instruct_samples[:3]}")
338+
# del(bible)
339+
# collect()
340+
non_instruct_samples = bible[:SAMPLES_TO_CREATE]
341+
print(f"Samples from KJV bible consisting of {len(non_instruct_samples)} look like this (sub-sample of 3): {non_instruct_samples[:3]}")
342342

343343

344344
# Replace with imported text

0 commit comments

Comments
 (0)