# ml_experiment.dig

# Workflow-level exports: parameters declared here are shared with the tasks
# defined below.
_export:
  # Pull in config/params.yaml. The `ml.*` variables referenced throughout this
  # workflow are presumably defined there — confirm against that file.
  !include : config/params.yaml
  # Default database and query engine for the td-family operators in this file.
  td:
    database: ${ml.output_database}
    engine: presto

# Bootstrap step: make sure the output database and the two AutoML bookkeeping
# tables exist before any later task writes to them.
+create_db_tbl_if_not_exists:
  td_ddl>:
  create_databases:
    - "${ml.output_database}"
  create_tables:
    - "automl_experiments"
    - "automl_eval_results"

# Training step: runs the `gluon_train` notebook through the ml_train> operator
# against the configured training table.
+gluon_train:
  ml_train>:
    # Memory size requested for the container that executes the notebook.
    docker:
      task_mem: 128g # 64g/128g/256g/384g/512g
    notebook: gluon_train
    # Training data is read from <input_database>.<train_data_table>.
    input_table: ${ml.input_database}.${ml.train_data_table}
    target_column: ${ml.target_column}
    eval_metric: ${ml.eval_metric}
    # The session id suffix gives each workflow session its own model name;
    # +track_experiment records the same name.
    model_name: gluon_model_${session_id}
    share_model: true
    # NOTE(review): unit of the time limit is not visible here — confirm in
    # config/params.yaml or the operator documentation.
    time_limit: ${ml.fit_time_limit}
    # Destination tables in the output database, named after the training table.
    export_leaderboard: ${ml.output_database}.leaderboard_${ml.train_data_table}
    export_feature_importance: ${ml.output_database}.feature_importance_${ml.train_data_table}
     
# Bookkeeping step: runs queries/track_experiment.sql and inserts its result
# into the automl_experiments table of the output database.
+track_experiment:
  td>: queries/track_experiment.sql
  insert_into: ${ml.output_database}.automl_experiments
  # The remaining keys are presumably template variables consumed by the SQL
  # file — verify against queries/track_experiment.sql.
  # NOTE(review): the `automl.*` values look like outputs of the preceding
  # ml_train> task — confirm where they are set.
  last_executed_notebook: ${automl.last_executed_notebook}
  user_id: ${automl.last_executed_user_id}
  user_email: ${automl.last_executed_user_email}
  # Must stay in sync with the model_name used by +gluon_train.
  model_name: gluon_model_${session_id}
  shared_model: ${automl.shared_model}
  task_attempt_id: ${attempt_id}
  session_time: ${session_local_time}
  # Same engine as the td.engine default exported at the top of the workflow.
  engine: presto
  # Training inputs recorded alongside the experiment row.
  trained_table: ${ml.input_database}.${ml.train_data_table}
  target_column: ${ml.target_column}
  eval_metric: ${ml.eval_metric}