@@ -85,7 +85,7 @@
 
 """### A custom GPT2 encoder layer for text embedding"""
 
-""" un - string out
+
 class GPT2Layer(tf.keras.layers.Layer):
 
     def __init__(self, max_seq_length, **kwargs):
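
The block this hunk un-strings defines the GPT2Layer referenced above. As a minimal sketch of what such a layer can look like, assuming keras_nlp supplies the pretrained GPT2 (the preset name, preprocessor wiring, and mean-pooling here are illustrative assumptions, not the script's exact body):

import tensorflow as tf
import keras_nlp  # assumption: GPT2 comes from keras_nlp's pretrained presets

class GPT2Layer(tf.keras.layers.Layer):
    """Wraps a pretrained GPT2 backbone as a text-embedding layer."""

    def __init__(self, max_seq_length, **kwargs):
        super().__init__(**kwargs)
        self.max_seq_length = max_seq_length
        # Tokenizer/preprocessor and backbone loaded from a pretrained preset
        self.preprocessor = keras_nlp.models.GPT2Preprocessor.from_preset(
            "gpt2_base_en", sequence_length=max_seq_length)
        self.backbone = keras_nlp.models.GPT2Backbone.from_preset("gpt2_base_en")

    def call(self, inputs):
        # Raw strings -> token ids / padding mask -> per-token hidden states
        tokens = self.preprocessor(inputs)
        hidden = self.backbone(tokens)
        # Mean-pool over the sequence axis: one fixed-length vector per example
        return tf.reduce_mean(hidden, axis=1)

    def get_config(self):
        # Makes the layer serializable; pairs with the from_config
        # classmethod that the hunk headers below reference
        config = super().get_config()
        config.update({"max_seq_length": self.max_seq_length})
        return config
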
@@ -183,7 +183,6 @@ def from_config(cls, config): |
 hy_df = pd.DataFrame(history.history)
 print(hy_df)
 
-""" # end un - string out
 
 ### Cerebros model:
 
@@ -274,8 +273,8 @@ def from_config(cls, config): |
 learning_rate = 0.0000511065
 epochs = 15 # [1, 100]
 batch_size = 20
-minimum_levels = 4
-maximum_levels = 4 # [3,7]
+minimum_levels = 2
+maximum_levels = 3 # [3,7]
 
 minimum_units_per_level = 4
 maximum_units_per_level = 8
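
This change narrows candidate networks from a fixed depth of 4 levels to a sampled depth of 2 or 3. To illustrate what bounds like these mean (purely a sketch, not Cerebros internals), each candidate draws a depth and a per-level unit count from these ranges:

import random

# Illustrative only -- not Cerebros source code.
minimum_levels, maximum_levels = 2, 3
minimum_units_per_level, maximum_units_per_level = 4, 8

def sample_architecture():
    # Depth within [minimum_levels, maximum_levels], then a unit
    # count per level within [minimum_units_per_level, maximum_units_per_level]
    levels = random.randint(minimum_levels, maximum_levels)
    return [
        random.randint(minimum_units_per_level, maximum_units_per_level)
        for _ in range(levels)
    ]

print(sample_architecture())  # e.g. [5, 7] or [4, 8, 6]
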
@@ -353,8 +352,7 @@ def from_config(cls, config): |
 cerebros_time_per_model = cerebros_time_all_models_min / models_tried
 
 print(f"Cerebros trained {models_tried} models FROM A COLD START in ONLY {cerebros_time_all_models_min} min. Cerebros took only {cerebros_time_per_model} minutes on average per model.")
-# Un-comment out the next line
-# print(f"GPT2 took {gpt_time_on_one_model_min} just to FINE TUNE one PRE - TRAINED model. Although this is a small scale test, this shows the advantage of scaling in ON timing VS ON**2 timing.")
+print(f"GPT2 took {gpt_time_on_one_model_min} min just to FINE TUNE one PRE-TRAINED model. Although this is a small-scale test, it shows the advantage of O(N) scaling VS O(N**2) scaling.")
 
 
 print(f'Cerebros best accuracy achieved is {result}')
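
For context on the timings printed here, wall-clock minutes like cerebros_time_all_models_min and gpt_time_on_one_model_min can be captured with a small harness. A hypothetical sketch, not the script's own measurement code:

import time

def timed_minutes(fn, *args, **kwargs):
    """Run fn and return (its result, elapsed wall-clock minutes)."""
    start = time.time()
    result = fn(*args, **kwargs)
    return result, (time.time() - start) / 60.0

# Usage sketch, assuming a `cerebros` search object from the full script:
# result, cerebros_time_all_models_min = timed_minutes(cerebros.run_random_search)
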