Skip to content

Commit 396316c

Browse files
Update generative-proof-of-concept-CPU-preprocessing-in-memory.py
Set sane values for CI/CD-scale linting / smoke-testing runs that are realistic on 4 CPUs and 16 GB RAM.
1 parent b1eae19 commit 396316c

File tree

1 file changed

+3
-3
lines changed

1 file changed

+3
-3
lines changed

generative-proof-of-concept-CPU-preprocessing-in-memory.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,7 @@
1818
DATA_SET_NAME = "WEB-Bible-Genesis-40-context-681-SPL"
1919

2020

21-
N_TRIALS = 50
21+
N_TRIALS = 10 # 50
2222

2323

2424
mlflow.set_tracking_uri(uri=f"http://127.0.0.1:{MLFLOW_PORT}")
@@ -63,7 +63,7 @@ def objective(trial: optuna.Trial) -> float:
6363
# Number of text samples (of approximately max_seq_len) to create
6464
# Raises RAM in a linear fashion
6565

66-
SAMPLES_TO_CREATE = 681
66+
SAMPLES_TO_CREATE = 10 # 681
6767

6868
# How many tokens to provide before expecting the next token to be predicted.
6969
# Half this = double RAM (inversely proportional to RAM requirement)
@@ -149,7 +149,7 @@ def objective(trial: optuna.Trial) -> float:
149149
# embedding output dim must be an even number
150150
# Maximize EMBEDDING_N based on available RAM and CPU / GPU
151151

152-
EMBEDDING_N = trial.suggest_int('embedding_n',6, 9) # 12
152+
EMBEDDING_N = 6 # trial.suggest_int('embedding_n',6, 9) # 12
153153
EMBEDDING_DIM = int(EMBEDDING_N * 2)
154154

155155
PROJECTION_N = 1 # Punitive increase of RAM, leaving this as 1 until we are running on HPC

0 commit comments

Comments
 (0)