josarago · josarago · Feb 20, 2023 · Feb 20, 2023 · Feb 20, 2023 · Feb 20, 2023
diff --git a/.gitignore b/.gitignore
@@ -156,10 +156,12 @@ cython_debug/
 
 # tensorflow
 **/logs/*
+**/tuner/*
 
 #vscode
 *.code-workspace
 
 # plot_model
 *.png
 draft.py
+
diff --git a/config.py b/config.py
@@ -1,5 +1,6 @@
 import os
 import logging
+from dataclasses import dataclass
 
 # logging
 LOGGING_FORMAT = "%(asctime)s %(levelname)-8s [%(filename)s:%(lineno)d] %(message)s"
@@ -25,3 +26,20 @@ def get_logger(name):
 # SizeManager config
 SIZING_DIR_NAME = "sizing_systems"
 SIZING_SYSTEM_DIR_PATH = os.path.join(DATA_DIR_PATH, SIZING_DIR_NAME)
+
+
+@dataclass
+class ModelConfig:
+    test_size: float = 0.3
+    embedding_dim: int = 4
+    learning_rate: float = 0.005
+    batch_size: int = 256
+    checkpoint_path: str = os.path.join(os.getcwd(), "model_checkpoints")
+    validation_split: float = 0.2
+    epochs: int = 2_000
+    fit_verbose: int = 0
+    asym_loss_gamma: float = 0.5
+    classification_loss: str = "categorical_crossentropy"
+    embedding_func: str = "subtract"
+    early_stopping__patience: int = 50
+    early_stopping__restore_best_weights: bool = True
diff --git a/pipelines.py b/pipelines.py
@@ -106,11 +106,4 @@
     ]
 )
 
-USED_COLUMNS = (
-    EMBEDDING_COLUMNS
-    + USER_CATEGORICAL_COLUMNS
-    + SKU_NUMERICAL_COLUMNS
-    + [TARGET_COLUMN]
-)
-
 target_pipe = LabelBinarizer()