chasebk
diff --git a/abfo_mlnn_script.py b/abfo_mlnn_script.py
Lines changed: 37 additions & 35 deletions
diff --git a/cro_mlnn_script.py b/cro_mlnn_script.py
Lines changed: 36 additions & 32 deletions
diff --git a/ga_mlnn_script.py b/ga_mlnn_script.py
Lines changed: 35 additions & 33 deletions
diff --git a/lstm1hl_script.py b/lstm1hl_script.py
Lines changed: 36 additions & 32 deletions
@@ -1,58 +1,60 @@
+#!/usr/bin/env python
+# ------------------------------------------------------------------------------------------------------%
+# Created by "Thieu Nguyen" at 00:51, 29/03/2020                                                        %
+#                                                                                                       %
+#       Email:      [email protected]                                                           %
+#       Homepage:   https://www.researchgate.net/profile/Thieu_Nguyen6                                  %
+#       Github:     https://github.com/thieunguyen5991                                                  %
+# -------------------------------------------------------------------------------------------------------%
+
+from os.path import splitext, basename, realpath
 from sklearn.model_selection import ParameterGrid
 from model.main.hybrid_mlnn import ABfoLSMlnn
-from utils.IOUtil import read_dataset_file
 from utils.SettingPaper import abfols_mlnn_paras_final as param_grid
-from utils.SettingPaper import ggtrace_cpu, ggtrace_ram, ggtrace_multi_cpu, ggtrace_multi_ram, traffic_eu, traffic_uk, worldcup
+from utils.SettingPaper import *
+from utils.IOUtil import load_dataset
 
-rv_data = [ggtrace_cpu, ggtrace_ram, ggtrace_multi_cpu, ggtrace_multi_ram, traffic_eu, traffic_uk, worldcup]
-data_file = ["google_5m", "google_5m", "google_5m", "google_5m", "it_eu_5m", "it_uk_5m", "worldcup98_5m"]
-test_type = "normal"                ### normal: for normal test, stability: for n_times test
-run_times = None
+if SP_RUN_TIMES == 1:  # single run: log under the configured SP_LOG_FILENAME
+    all_model_file_name = SP_LOG_FILENAME
+else:  # more than one run (e.g. a stability test): use this script's base file name, without extension, as the log name
+    all_model_file_name = str(splitext(basename(realpath(__file__)))[0])
 
-if test_type == "normal":           ### For normal test
-    run_times = 1
-    pathsave = "paper/results/final/"
-    all_model_file_name = "ffnn_log_models"
-elif test_type == "stability":      ### For stability test (n times run with the same parameters)
-    run_times = 15
-    pathsave = "paper/results/stability/"
-    all_model_file_name = "stability_abfols"
-else:
-    pass
 
 def train_model(item):
     root_base_paras = {
         "dataset": dataset,
-        "data_idx": (0.7, 0.15, 0.15),
+        "feature_size": feature_size,  # module-level value assigned in the dataset loop: len(SP_DATA_COLS[loop])
+        "data_idx": SP_DATA_SPLIT_INDEX_2,  # NOTE(review): replaces the literal (0.7, 0.15, 0.15) - confirm the setting holds the same split
         "sliding": item["sliding"],
-        "multi_output": requirement_variables[2],
-        "output_idx": requirement_variables[3],
-        "method_statistic": 0,  # 0: sliding window, 1: mean, 2: min-mean-max, 3: min-median-max
+        "multi_output": multi_output,
+        "output_idx": output_index,
+        "method_statistic": SP_PREPROCESSING_METHOD,
         "log_filename": all_model_file_name,
-        "path_save_result": pathsave + requirement_variables[4],
-        "test_type": test_type,
-        "draw": True,
-        "print_train": 1  # 0: nothing, 1 : full detail, 2: short version
+        "n_runs": SP_RUN_TIMES,  # 1 or others
+        "path_save_result": SP_PATH_SAVE_BASE + SP_DATA_FILENAME[loop] + "/",  # "loop" is the module-level dataset index of the driver loop
+        "draw": SP_DRAW,
+        "print_train": SP_PRINT_TRAIN,  # 0: nothing, 1 : full detail, 2: short version
     }
+    paras_name = "hs_{}-ep_{}-act_{}-Ci_{}-Ped_{}-Ns_{}-N_minmax_{}".format(item["hidden_size"], item["epoch"], item["activations"],
+                                                                            item["Ci"], item["Ped"], item["Ns"], item["N_minmax"])  # grid key is "activations" (plural), as read below
     root_hybrid_paras = {
-        "hidden_size": item["hidden_size"], "activations": item["activations"], "epoch": item["epoch"],
-        "train_valid_rate": item["train_valid_rate"], "domain_range": item["domain_range"]
+        "hidden_size": item["hidden_size"], "activations": item["activations"], "epoch": item["epoch"], "domain_range": item["domain_range"],
+        "paras_name": paras_name
     }
     abfols_paras = {
-        "epoch": item["epoch"], "pop_size": item["pop_size"], "Ci": item["Ci"], "Ped": item["Ped"], "Ns": item["Ns"],
-        "N_minmax": item["N_minmax"]
+        "epoch": item["epoch"], "pop_size": item["pop_size"], "Ci": item["Ci"], "Ped": item["Ped"], "Ns": item["Ns"], "N_minmax": item["N_minmax"]
     }
     md = ABfoLSMlnn(root_base_paras=root_base_paras, root_hybrid_paras=root_hybrid_paras, abfols_paras=abfols_paras)
     md._running__()
 
 
-for _ in range(run_times):
-    for loop in range(len(rv_data)):
-        requirement_variables = rv_data[loop]
-        filename = requirement_variables[0] + data_file[loop] + ".csv"
-        dataset = read_dataset_file(filename, requirement_variables[1])
+for _ in range(SP_RUN_TIMES):  # repeat the whole experiment SP_RUN_TIMES times
+    for loop in range(len(SP_DATA_FILENAME)):  # "loop" is also read as a global inside train_model
+        filename = SP_LOAD_DATA_FROM + SP_DATA_FILENAME[loop]
+        dataset = load_dataset(filename, cols=SP_DATA_COLS[loop])
+        feature_size = len(SP_DATA_COLS[loop])  # number of columns requested from the dataset file
+        multi_output = SP_DATA_MULTI_OUTPUT[loop]  # the three names set here are read as globals by train_model
+        output_index = SP_OUTPUT_INDEX[loop]
         # Create combination of params.
         for item in list(ParameterGrid(param_grid)):
             train_model(item)
-
-
 
@@ -1,43 +1,45 @@
+#!/usr/bin/env python
+# ------------------------------------------------------------------------------------------------------%
+# Created by "Thieu Nguyen" at 00:51, 29/03/2020                                                        %
+#                                                                                                       %
+#       Email:      [email protected]                                                           %
+#       Homepage:   https://www.researchgate.net/profile/Thieu_Nguyen6                                  %
+#       Github:     https://github.com/thieunguyen5991                                                  %
+# -------------------------------------------------------------------------------------------------------%
+
+from os.path import splitext, basename, realpath
 from sklearn.model_selection import ParameterGrid
 from model.main.hybrid_mlnn import CroMlnn
-from utils.IOUtil import read_dataset_file
 from utils.SettingPaper import cro_mlnn_paras_final as param_grid
-from utils.SettingPaper import ggtrace_cpu, ggtrace_ram, ggtrace_multi_cpu, ggtrace_multi_ram, traffic_eu, traffic_uk, worldcup
-
-rv_data = [ggtrace_cpu, ggtrace_ram, ggtrace_multi_cpu, ggtrace_multi_ram, traffic_eu, traffic_uk, worldcup]
-data_file = ["google_5m", "google_5m", "google_5m", "google_5m", "it_eu_5m", "it_uk_5m", "worldcup98_5m"]
-test_type = "normal"  ### normal: for normal test, stability: for n_times test
-run_times = None
+from utils.SettingPaper import *
+from utils.IOUtil import load_dataset
 
-if test_type == "normal":  ### For normal test
-    run_times = 1
-    pathsave = "paper/results/final/"
-    all_model_file_name = "ffnn_log_models"
-elif test_type == "stability":  ### For stability test (n times run with the same parameters)
-    run_times = 15
-    pathsave = "paper/results/stability/mlnn/"
-    all_model_file_name = "stability_cro_mlnn"
-else:
-    pass
+if SP_RUN_TIMES == 1:  # single run: log under the configured SP_LOG_FILENAME
+    all_model_file_name = SP_LOG_FILENAME
+else:  # more than one run (e.g. a stability test): use this script's base file name, without extension, as the log name
+    all_model_file_name = str(splitext(basename(realpath(__file__)))[0])
 
 
 def train_model(item):
     root_base_paras = {
         "dataset": dataset,
-        "data_idx": (0.7, 0.15, 0.15),
+        "feature_size": feature_size,
+        "data_idx": SP_DATA_SPLIT_INDEX_2,
         "sliding": item["sliding"],
-        "multi_output": requirement_variables[2],
-        "output_idx": requirement_variables[3],
-        "method_statistic": 0,  # 0: sliding window, 1: mean, 2: min-mean-max, 3: min-median-max
+        "multi_output": multi_output,
+        "output_idx": output_index,
+        "method_statistic": SP_PREPROCESSING_METHOD,
         "log_filename": all_model_file_name,
-        "path_save_result": pathsave + requirement_variables[4],
-        "test_type": test_type,
-        "draw": True,
-        "print_train": 1  # 0: nothing, 1 : full detail, 2: short version
+        "n_runs": SP_RUN_TIMES,  # 1 or others
+        "path_save_result": SP_PATH_SAVE_BASE + SP_DATA_FILENAME[loop] + "/",
+        "draw": SP_DRAW,
+        "print_train": SP_PRINT_TRAIN,  # 0: nothing, 1 : full detail, 2: short version
     }
+    paras_name = "hs_{}-ep_{}-act_{}-po_{}-Fb_{}-Fa_{}-Fd_{}-Pd_{}-G_{}-GCR_{}-k_{}".format(item["hidden_size"], item["epoch"], item["activations"],
+                                                item["po"], item["Fb"], item["Fa"], item["Fd"], item["Pd"], item["G"], item["GCR"], item["k"])
     root_hybrid_paras = {
-        "hidden_size": item["hidden_size"], "activations": item["activations"], "epoch": item["epoch"],
-        "train_valid_rate": item["train_valid_rate"], "domain_range": item["domain_range"]
+        "hidden_size": item["hidden_size"], "activations": item["activations"], "epoch": item["epoch"], "domain_range": item["domain_range"],
+        "paras_name": paras_name
     }
     cro_paras = {
         "epoch": item["epoch"], "pop_size": item["pop_size"], "po": item["po"], "Fb": item["Fb"], "Fa": item["Fa"],
@@ -47,11 +49,13 @@ def train_model(item):
     md._running__()
 
 
-for _ in range(run_times):
-    for loop in range(len(rv_data)):
-        requirement_variables = rv_data[loop]
-        filename = requirement_variables[0] + data_file[loop] + ".csv"
-        dataset = read_dataset_file(filename, requirement_variables[1])
+for _ in range(SP_RUN_TIMES):  # repeat the whole experiment SP_RUN_TIMES times
+    for loop in range(len(SP_DATA_FILENAME)):  # "loop" is also read as a global inside train_model
+        filename = SP_LOAD_DATA_FROM + SP_DATA_FILENAME[loop]
+        dataset = load_dataset(filename, cols=SP_DATA_COLS[loop])
+        feature_size = len(SP_DATA_COLS[loop])  # number of columns requested from the dataset file
+        multi_output = SP_DATA_MULTI_OUTPUT[loop]  # the three names set here are read as globals by train_model
+        output_index = SP_OUTPUT_INDEX[loop]
         # Create combination of params.
         for item in list(ParameterGrid(param_grid)):
             train_model(item)
@@ -1,43 +1,44 @@
+#!/usr/bin/env python
+# ------------------------------------------------------------------------------------------------------%
+# Created by "Thieu Nguyen" at 00:51, 29/03/2020                                                        %
+#                                                                                                       %
+#       Email:      [email protected]                                                           %
+#       Homepage:   https://www.researchgate.net/profile/Thieu_Nguyen6                                  %
+#       Github:     https://github.com/thieunguyen5991                                                  %
+# -------------------------------------------------------------------------------------------------------%
+
+from os.path import splitext, basename, realpath
 from sklearn.model_selection import ParameterGrid
 from model.main.hybrid_mlnn import GaMlnn
-from utils.IOUtil import read_dataset_file
 from utils.SettingPaper import ga_mlnn_paras_final as param_grid
-from utils.SettingPaper import ggtrace_cpu, ggtrace_ram, ggtrace_multi_cpu, ggtrace_multi_ram, traffic_eu, traffic_uk, worldcup
-
-rv_data = [ggtrace_cpu, ggtrace_ram, ggtrace_multi_cpu, ggtrace_multi_ram, traffic_eu, traffic_uk, worldcup]
-data_file = ["google_5m", "google_5m", "google_5m", "google_5m", "it_eu_5m", "it_uk_5m", "worldcup98_5m"]
-test_type = "normal"  ### normal: for normal test, stability: for n_times test
-run_times = None
+from utils.SettingPaper import *
+from utils.IOUtil import load_dataset
 
-if test_type == "normal":  ### For normal test
-    run_times = 1
-    pathsave = "paper/results/final/"
-    all_model_file_name = "ffnn_log_models"
-elif test_type == "stability":  ### For stability test (n times run with the same parameters)
-    run_times = 15
-    pathsave = "paper/results/stability/mlnn/"
-    all_model_file_name = "stability_ga_mlnn"
-else:
-    pass
+if SP_RUN_TIMES == 1:  # single run: log under the configured SP_LOG_FILENAME
+    all_model_file_name = SP_LOG_FILENAME
+else:  # more than one run (e.g. a stability test): use this script's base file name, without extension, as the log name
+    all_model_file_name = str(splitext(basename(realpath(__file__)))[0])
 
 
 def train_model(item):
     root_base_paras = {
         "dataset": dataset,
-        "data_idx": (0.7, 0.15, 0.15),
+        "feature_size": feature_size,
+        "data_idx": SP_DATA_SPLIT_INDEX_2,
         "sliding": item["sliding"],
-        "multi_output": requirement_variables[2],
-        "output_idx": requirement_variables[3],
-        "method_statistic": 0,  # 0: sliding window, 1: mean, 2: min-mean-max, 3: min-median-max
+        "multi_output": multi_output,
+        "output_idx": output_index,
+        "method_statistic": SP_PREPROCESSING_METHOD,
         "log_filename": all_model_file_name,
-        "path_save_result": pathsave + requirement_variables[4],
-        "test_type": test_type,
-        "draw": True,
-        "print_train": 1  # 0: nothing, 1 : full detail, 2: short version
+        "n_runs": SP_RUN_TIMES,  # 1 or others
+        "path_save_result": SP_PATH_SAVE_BASE + SP_DATA_FILENAME[loop] + "/",
+        "draw": SP_DRAW,
+        "print_train": SP_PRINT_TRAIN,  # 0: nothing, 1 : full detail, 2: short version
     }
+    paras_name = "hs_{}-ep_{}-act_{}-pc_{}-pm_{}".format(item["hidden_size"], item["epoch"], item["activations"], item["pc"], item["pm"])
     root_hybrid_paras = {
-        "hidden_size": item["hidden_size"], "activations": item["activations"], "epoch": item["epoch"],
-        "train_valid_rate": item["train_valid_rate"], "domain_range": item["domain_range"]
+        "hidden_size": item["hidden_size"], "activations": item["activations"], "epoch": item["epoch"], "domain_range": item["domain_range"],
+        "paras_name": paras_name
     }
     ga_paras = {
         "epoch": item["epoch"], "pop_size": item["pop_size"], "pc": item["pc"], "pm": item["pm"]
@@ -46,12 +47,13 @@ def train_model(item):
     md._running__()
 
 
-for _ in range(run_times):
-    for loop in range(len(rv_data)):
-        requirement_variables = rv_data[loop]
-        filename = requirement_variables[0] + data_file[loop] + ".csv"
-        dataset = read_dataset_file(filename, requirement_variables[1])
+for _ in range(SP_RUN_TIMES):  # repeat the whole experiment SP_RUN_TIMES times
+    for loop in range(len(SP_DATA_FILENAME)):  # "loop" is also read as a global inside train_model
+        filename = SP_LOAD_DATA_FROM + SP_DATA_FILENAME[loop]
+        dataset = load_dataset(filename, cols=SP_DATA_COLS[loop])
+        feature_size = len(SP_DATA_COLS[loop])  # number of columns requested from the dataset file
+        multi_output = SP_DATA_MULTI_OUTPUT[loop]  # the three names set here are read as globals by train_model
+        output_index = SP_OUTPUT_INDEX[loop]
         # Create combination of params.
         for item in list(ParameterGrid(param_grid)):
             train_model(item)
-
 
@@ -1,53 +1,57 @@
+#!/usr/bin/env python
+# ------------------------------------------------------------------------------------------------------%
+# Created by "Thieu Nguyen" at 00:51, 29/03/2020                                                        %
+#                                                                                                       %
+#       Email:      [email protected]                                                           %
+#       Homepage:   https://www.researchgate.net/profile/Thieu_Nguyen6                                  %
+#       Github:     https://github.com/thieunguyen5991                                                  %
+# -------------------------------------------------------------------------------------------------------%
+
+from os.path import splitext, basename, realpath
 from sklearn.model_selection import ParameterGrid
 from model.main.traditional_rnn import Lstm1HL
-from utils.IOUtil import read_dataset_file
 from utils.SettingPaper import lstm1hl_paras_final as param_grid
-from utils.SettingPaper import ggtrace_cpu, ggtrace_ram, ggtrace_multi_cpu, ggtrace_multi_ram, traffic_eu, traffic_uk, worldcup
+from utils.SettingPaper import *
+from utils.IOUtil import load_dataset
 
-rv_data = [ggtrace_cpu, ggtrace_ram, ggtrace_multi_cpu, ggtrace_multi_ram, traffic_eu, traffic_uk, worldcup]
-data_file = ["google_5m", "google_5m", "google_5m", "google_5m", "it_eu_5m", "it_uk_5m", "worldcup98_5m"]
-test_type = "normal"  ### normal: for normal test, stability: for n_times test
-run_times = None
+if SP_RUN_TIMES == 1:  # single run: log under the configured SP_LOG_FILENAME
+    all_model_file_name = SP_LOG_FILENAME
+else:  # more than one run (e.g. a stability test): use this script's base file name, without extension, as the log name
+    all_model_file_name = str(splitext(basename(realpath(__file__)))[0])
 
-if test_type == "normal":  ### For normal test
-    run_times = 1
-    pathsave = "paper/results/final/"
-    all_model_file_name = "nn_log_models"
-elif test_type == "stability":  ### For stability test (n times run with the same parameters)
-    run_times = 15
-    pathsave = "paper/results/stability/network/"
-    all_model_file_name = "stability_lstm1hl"
-else:
-    pass
 
 def train_model(item):
     root_base_paras = {
         "dataset": dataset,
-        "data_idx": (0.8, 0, 0.2),
+        "feature_size": feature_size,  # module-level value assigned in the dataset loop: len(SP_DATA_COLS[loop])
+        "data_idx": SP_DATA_SPLIT_INDEX,  # NOTE(review): replaces the literal (0.8, 0, 0.2) - confirm the setting holds the same split
         "sliding": item["sliding"],
-        "multi_output": requirement_variables[2],
-        "output_idx": requirement_variables[3],
-        "method_statistic": 0,  # 0: sliding window, 1: mean, 2: min-mean-max, 3: min-median-max
+        "multi_output": multi_output,
+        "output_idx": output_index,
+        "method_statistic": SP_PREPROCESSING_METHOD,
         "log_filename": all_model_file_name,
-        "path_save_result": pathsave + requirement_variables[4],
-        "test_type": test_type,
-        "draw": True,
-        "print_train": 0  # 0: nothing, 1 : full detail, 2: short version
+        "n_runs": SP_RUN_TIMES,  # 1 or others
+        "path_save_result": SP_PATH_SAVE_BASE + SP_DATA_FILENAME[loop] + "/",  # "loop" is the module-level dataset index of the driver loop
+        "draw": SP_DRAW,
+        "print_train": SP_PRINT_TRAIN,  # 0: nothing, 1 : full detail, 2: short version
     }
+    paras_name = "hs_{}-ep_{}-bs_{}-lr_{}-ac_{}-op_{}-lo_{}".format(item["hidden_sizes"], item["epoch"], item["batch_size"], item["learning_rate"],
+                                                                    item["activations"], item["optimizer"], item["loss"])  # tag built from this grid item's values
     root_rnn_paras = {
-        "hidden_sizes": item["hidden_sizes"], "epoch": item["epoch"], "batch_size": item["batch_size"],
-        "learning_rate": item["learning_rate"], "activations": item["activations"],
-        "optimizer": item["optimizer"], "loss": item["loss"], "dropouts": item["dropouts"]
+        "hidden_sizes": item["hidden_sizes"], "epoch": item["epoch"], "batch_size": item["batch_size"], "learning_rate": item["learning_rate"],
+        "activations": item["activations"], "optimizer": item["optimizer"], "loss": item["loss"], "dropouts": item["dropouts"], "paras_name": paras_name
     }
     md = Lstm1HL(root_base_paras=root_base_paras, root_rnn_paras=root_rnn_paras)
     md._running__()
 
 
-for _ in range(run_times):
-    for loop in range(len(rv_data)):
-        requirement_variables = rv_data[loop]
-        filename = requirement_variables[0] + data_file[loop] + ".csv"
-        dataset = read_dataset_file(filename, requirement_variables[1])
+for _ in range(SP_RUN_TIMES):  # repeat the whole experiment SP_RUN_TIMES times
+    for loop in range(len(SP_DATA_FILENAME)):  # "loop" is also read as a global inside train_model
+        filename = SP_LOAD_DATA_FROM + SP_DATA_FILENAME[loop]
+        dataset = load_dataset(filename, cols=SP_DATA_COLS[loop])
+        feature_size = len(SP_DATA_COLS[loop])  # number of columns requested from the dataset file
+        multi_output = SP_DATA_MULTI_OUTPUT[loop]  # the three names set here are read as globals by train_model
+        output_index = SP_OUTPUT_INDEX[loop]
         # Create combination of params.
         for item in list(ParameterGrid(param_grid)):
             train_model(item)