datadrivenmodel/ddm_trainer.py

71 строка
2.0 KiB
Python

import os
import logging
logging.basicConfig()
logging.root.setLevel(logging.INFO)
logger = logging.getLogger("datamodeler")
from model_loader import available_models
from omegaconf import DictConfig, OmegaConf, ListConfig
import hydra
dir_path = os.path.dirname(os.path.realpath(__file__))
@hydra.main(config_path="conf", config_name="config")
def main(cfg: DictConfig) -> None:
logger.info("Configuration: ")
logger.info(f"\n{OmegaConf.to_yaml(cfg)}")
input_cols = cfg["data"]["inputs"]
output_cols = cfg["data"]["outputs"]
augmented_cols = cfg["data"]["augmented_cols"]
iteration_order = cfg["data"]["iteration_order"]
episode_col = cfg["data"]["episode_col"]
iteration_col = cfg["data"]["iteration_col"]
dataset_path = cfg["data"]["path"]
max_rows = cfg["data"]["max_rows"]
save_path = cfg["model"]["saver"]["filename"]
model_name = cfg["model"]["name"]
scale_data = cfg["model"]["build_params"]["scale_data"]
Model = available_models[model_name]
if cfg["data"]["full_or_relative"] == "relative":
dataset_path = os.path.join(dir_path, dataset_path)
save_path = os.path.join(dir_path, save_path + ".pkl")
if type(input_cols) == ListConfig:
input_cols = list(input_cols)
if type(output_cols) == ListConfig:
output_cols = list(output_cols)
if type(augmented_cols) == ListConfig:
augmented_cols = list(augmented_cols)
model = Model()
X, y = model.load_csv(
input_cols=input_cols,
output_cols=output_cols,
augm_cols=augmented_cols,
dataset_path=dataset_path,
iteration_order=iteration_order,
episode_col=episode_col,
iteration_col=iteration_col,
max_rows=max_rows,
)
logger.info("Building model...")
model.build_model(scale_data=scale_data)
logger.info("Fitting model...")
model.fit(X, y)
logger.info(f"Saving model to {save_path}")
model.save_model(filename=save_path)
if __name__ == "__main__":
main()