Skip to content

Commit 04e841e

Browse files
Merge pull request #295 from david-thrower/293-from-289-retrofit-generate-loop-for-logits
293 from 289 retrofit generate loop for logits
2 parents 98895f2 + 79f407d commit 04e841e

File tree

2 files changed

+3
-4
lines changed

2 files changed

+3
-4
lines changed

cerebrosllmutils/llm_utils.py

Lines changed: 2 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -485,9 +485,8 @@ def generate(self,
485485

486486
# Convert to tensor and get model prediction
487487
input_tensor = tf.constant([input_tokens], dtype=tf.int32)
488-
probs_nested = self.model(input_tensor)
489-
probs = probs_nested[0] # Already softmax probabilities (NOT logits as comment says)
490-
logits = tf.math.log(probs + 10 ** -20) # Convert to logits for penalty application
488+
logits_nested = self.model(input_tensor)
489+
logits = logits_nested[0] # Model outputs logits
491490

492491
if do_sample:
493492
# Apply repetition/frequency/presence penalties to logits

train_a_generative_llm.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -715,7 +715,7 @@ def test_text(test_prompt: str, max_new_tokens: int, result_cutoff: float, trial
715715
test_text(
716716
test_prompt=sample,
717717
max_new_tokens=MAX_NEW_TOKENS,
718-
result_cutoff=15,
718+
result_cutoff=999,
719719
trial_id=trial_number,
720720
test_sample_number=counter,
721721
result_0=phase_i_a_result)

0 commit comments

Comments
 (0)