From c4408038d961288d813b075c3355009b8226dfdb Mon Sep 17 00:00:00 2001 From: amesar Date: Thu, 16 Mar 2023 05:18:44 +0000 Subject: [PATCH] Issue #10 - added Dump_Run notebook --- databricks_notebooks/display/Dump_Run.py | 75 ++++++++++++++++++++++++ databricks_notebooks/display/_README.py | 5 +- 2 files changed, 78 insertions(+), 2 deletions(-) create mode 100644 databricks_notebooks/display/Dump_Run.py diff --git a/databricks_notebooks/display/Dump_Run.py b/databricks_notebooks/display/Dump_Run.py new file mode 100644 index 0000000..caaa9f2 --- /dev/null +++ b/databricks_notebooks/display/Dump_Run.py @@ -0,0 +1,75 @@ +# Databricks notebook source +# MAGIC %md ## Dump a run +# MAGIC +# MAGIC **Overview** +# MAGIC * Shows run info, params, metrics and tags +# MAGIC * Recursively shows all artifacts up to the specified level +# MAGIC +# MAGIC +# MAGIC **Widgets** +# MAGIC * `Run ID` +# MAGIC * `Show tags as dictionary` - show MLflow tags as a dictionary instead of a list of key/value pairs +# MAGIC * `Artifact max level` - number of artifact levels to show +# MAGIC * `Format` - JSON or YAML +# MAGIC * `Output file` - if set, write output to file + +# COMMAND ---------- + +# MAGIC %run ./Common + +# COMMAND ---------- + +# MAGIC %md ### Widgets + +# COMMAND ---------- + +#dbutils.widgets.removeAll() + + +# COMMAND ---------- + +dbutils.widgets.text("1. Run ID", "") +dbutils.widgets.dropdown("2. Show tags as dictionary","no",["yes","no"]) +dbutils.widgets.text("3. Artifact max level", "1") +dbutils.widgets.dropdown("4. Format","json",["json","yaml"]) +dbutils.widgets.text("5. Output file", "") + +run_id = dbutils.widgets.get("1. Run ID") +show_tags_as_dict = dbutils.widgets.get("2. Show tags as dictionary") == "yes" +artifact_max_level = int(dbutils.widgets.get("3. Artifact max level")) +format = dbutils.widgets.get("4. Format") +output_file = dbutils.widgets.get("5. Output file") + +print("run_id:", run_id) +print("show_tags_as_dict:", show_tags_as_dict) +print("artifact_max_level:", artifact_max_level) +print("format:", format) +print("output_file:", output_file) + +# COMMAND ---------- + +assert_widget(run_id, "1. Run ID") + +# COMMAND ---------- + +# MAGIC %md ### Display run details + +# COMMAND ---------- + +from mlflow_tools.display import dump_run + +dct = dump_run.dump_run_id( + run_id = run_id, + show_tags_as_dict = show_tags_as_dict, + artifact_max_level = artifact_max_level, + format = format, + explode_json_string = False +) + +# COMMAND ---------- + +# MAGIC %md ### Write output to file + +# COMMAND ---------- + +write_file(dct, output_file, format) diff --git a/databricks_notebooks/display/_README.py b/databricks_notebooks/display/_README.py index 312202a..da39a80 100644 --- a/databricks_notebooks/display/_README.py +++ b/databricks_notebooks/display/_README.py @@ -16,8 +16,9 @@ # MAGIC * [MLflow_Version_Analytics]($MLflow_Version_Analytics) - list versions by model, etc. # MAGIC # MAGIC **Dump Tools** -# MAGIC * [Dump_Experiment]($Dump_Experiment) # MAGIC * [Dump_Registered_Model]($Dump_Registered_Model) +# MAGIC * [Dump_Experiment]($Dump_Experiment) +# MAGIC * [Dump_Run]($Dump_Run) # MAGIC # MAGIC **Other** # MAGIC * [Common]($Common) @@ -25,4 +26,4 @@ # MAGIC **Documentation** # MAGIC * [MLflow Spark Datasource Example](https://docs.databricks.com/_static/notebooks/mlflow/mlflow-datasource.html) - Databricks documentation. # MAGIC -# MAGIC Last updated: 2023-03-15 +# MAGIC Last updated: 2023-03-16