|
933 | 933 | ")"
|
934 | 934 | ]
|
935 | 935 | },
|
| 936 | + { |
| 937 | + "cell_type": "markdown", |
| 938 | + "metadata": {}, |
| 939 | + "source": [ |
| 940 | + "**Log the performance metrics to the report.**\n", |
| 941 | + "\n", |
|     | 942 | +        "We can add performance metrics to the model card using the `log_quantitative_analysis` method. The flattened evaluation results use keys in the format `slice_name/metric_name`, for instance `overall/accuracy`, which we split into a slice name and a metric name before logging each value.\n", |
|     | 943 | +        "\n", |
|     | 944 | +        "We first need to process the evaluation results with `flatten_results_dict` to get the metrics into this format." |
| 945 | + ] |
| 946 | + }, |
936 | 947 | {
|
937 | 948 | "cell_type": "code",
|
938 | 949 | "execution_count": null,
|
|
947 | 958 | ")"
|
948 | 959 | ]
|
949 | 960 | },
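For reference, here is a minimal sketch of the key format described above. The values are assumed toy numbers, not real evaluation output; the real dictionary comes from `flatten_results_dict`. It shows how each `slice_name/metric_name` key is split before logging:

```python
# Hypothetical flattened results; real values come from flatten_results_dict.
results_flat = {"overall/BinaryAccuracy": 0.92, "overall/BinaryF1Score": 0.88}

for key, value in results_flat.items():
    slice_name, metric_name = key.split("/")
    print(slice_name, metric_name, value)
# overall BinaryAccuracy 0.92
# overall BinaryF1Score 0.88
```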
|
| 961 | + { |
| 962 | + "cell_type": "code", |
| 963 | + "execution_count": null, |
| 964 | + "metadata": {}, |
| 965 | + "outputs": [], |
| 966 | + "source": [ |
| 967 | + "test_datasets = [\n", |
| 968 | + " test_dataset.shard(NUM_EVALS, i, contiguous=True) for i in range(NUM_EVALS)\n", |
| 969 | + "]\n", |
| 970 | + "eval_timestamps = [test_dataset[\"dischtime\"][-1] for test_dataset in test_datasets]\n", |
| 971 | + "\n", |
| 972 | + "for i, test_dataset in enumerate(test_datasets):\n", |
| 973 | + " report = ModelCardReport()\n", |
| 974 | + " report.log_owner(\n", |
| 975 | + " name=\"CyclOps Team\",\n", |
| 976 | + " contact=\"vectorinstitute.github.io/cyclops/\",\n", |
| 977 | + " email=\"cyclops@vectorinstitute.ai\",\n", |
| 978 | + " )\n", |
| 979 | + " results, dataset_with_preds = mortality_task.evaluate(\n", |
| 980 | + " test_dataset,\n", |
| 981 | + " metric_collection,\n", |
| 982 | + " model_names=model_name,\n", |
| 983 | + " transforms=preprocessor,\n", |
| 984 | + " prediction_column_prefix=\"preds\",\n", |
| 985 | + " slice_spec=slice_spec,\n", |
| 986 | + " batch_size=64,\n", |
| 987 | + " fairness_config=fairness_config,\n", |
| 988 | + " override_fairness_metrics=False,\n", |
| 989 | + " )\n", |
| 990 | + " results_flat = flatten_results_dict(\n", |
| 991 | + " results=results,\n", |
| 992 | + " remove_metrics=[\"BinaryROC\", \"BinaryPrecisionRecallCurve\"],\n", |
| 993 | + " model_name=model_name_results,\n", |
| 994 | + " )\n", |
|     | 995 | +        "    descriptions = {\n", |
|     | 996 | +        "        \"BinaryPrecision\": \"The proportion of predicted positive instances that are correctly predicted.\",\n", |
|     | 997 | +        "        \"BinaryRecall\": \"The proportion of actual positive instances that are correctly predicted. Also known as sensitivity or true positive rate.\",\n", |
|     | 998 | +        "        \"BinaryAccuracy\": \"The proportion of all instances that are correctly predicted.\",\n", |
|     | 999 | +        "        \"BinaryAUROC\": \"The area under the receiver operating characteristic curve (AUROC) is a measure of the performance of a binary classification model.\",\n", |
|     | 1000 | +        "        \"BinaryAveragePrecision\": \"The area under the precision-recall curve (AUPRC) is a measure of the performance of a binary classification model.\",\n", |
|     | 1001 | +        "        \"BinaryF1Score\": \"The harmonic mean of precision and recall.\",\n", |
|     | 1002 | +        "    }\n", |
|     | 1003 | +        "    for name, metric in results_flat.items():\n", |
|     | 1004 | +        "        split, name = name.split(\"/\")  # noqa: PLW2901\n", |
| 1005 | + " report.log_quantitative_analysis(\n", |
| 1006 | + " \"performance\",\n", |
| 1007 | + " name=name,\n", |
| 1008 | + " value=metric.tolist(),\n", |
| 1009 | + " description=descriptions[name],\n", |
| 1010 | + " metric_slice=split,\n", |
| 1011 | + " pass_fail_thresholds=0.7,\n", |
| 1012 | + " pass_fail_threshold_fns=lambda x, threshold: bool(x >= threshold),\n", |
| 1013 | + " )\n", |
|     | 1014 | +        "    print(eval_timestamps[i])\n", |
| 1015 | + " report_path = report.export(\n", |
| 1016 | + " output_filename=\"discharge_prediction_report_periodic.html\",\n", |
| 1017 | + " synthetic_timestamp=str(eval_timestamps[i]),\n", |
| 1018 | + " )\n", |
|     | 1019 | +        "    shutil.copy(report_path, \".\")" |
| 1020 | + ] |
| 1021 | + }, |
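As a side note, here is a minimal sketch of how `Dataset.shard` produces the contiguous evaluation slices used above. Toy data is assumed; the notebook shards the MIMIC-IV test split into `NUM_EVALS` pieces:

```python
from datasets import Dataset

# Toy dataset standing in for the real test split.
ds = Dataset.from_dict({"x": list(range(10))})

# Split into 2 contiguous shards, mirroring
# test_dataset.shard(NUM_EVALS, i, contiguous=True) above.
shards = [ds.shard(num_shards=2, index=i, contiguous=True) for i in range(2)]
print([shard["x"] for shard in shards])  # [[0, 1, 2, 3, 4], [5, 6, 7, 8, 9]]
```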
950 | 1022 | {
|
951 | 1023 | "cell_type": "markdown",
|
952 | 1024 | "metadata": {},
|
|
1165 | 1237 | "source": [
|
1166 | 1238 | "report.log_from_dict(\n",
|
1167 | 1239 | " data={\n",
|
1168 |
| - " \"name\": \"Mortality Prediction Model\",\n", |
| 1240 | + " \"name\": \"Discharge Prediction Model\",\n", |
1169 | 1241 |         "        \"description\": \"The model was trained on the MIMIC-IV dataset \\\n",
|
1170 |
| - " to predict risk of in-hospital mortality.\",\n", |
|     | 1242 | +        "        to predict the probability of a patient being discharged.\",\n", |
1171 | 1243 | " },\n",
|
1172 | 1244 | " section_name=\"model_details\",\n",
|
1173 | 1245 | ")\n",
|
|
1176 | 1248 | " date=str(date.today()),\n",
|
1177 | 1249 | " description=\"Initial Release\",\n",
|
1178 | 1250 | ")\n",
|
1179 |
| - "report.log_owner(\n", |
1180 |
| - " name=\"CyclOps Team\",\n", |
1181 |
| - " contact=\"vectorinstitute.github.io/cyclops/\",\n", |
1182 |
| - " email=\"cyclops@vectorinstitute.ai\",\n", |
1183 |
| - ")\n", |
1184 | 1251 | "report.log_license(identifier=\"Apache-2.0\")\n",
|
1185 | 1252 | "report.log_reference(\n",
|
1186 | 1253 | " link=\"https://xgboost.readthedocs.io/en/stable/python/python_api.html\", # noqa: E501\n",
|
|
1241 | 1308 |         "Once the model card is populated, you can generate the report using the `export` method. The report is generated as an HTML file, and a JSON file containing the model card data is saved alongside it. By default, the files are saved in a folder named `cyclops_reports` in the current working directory. You can change the path by passing an `output_dir` argument when instantiating the `ModelCardReport` class."
|
1242 | 1309 | ]
|
1243 | 1310 | },
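A minimal sketch of changing the save location, assuming the `ModelCardReport` constructor accepts `output_dir` as the text above describes and that the class is imported as in the rest of this notebook:

```python
from cyclops.report import ModelCardReport

# Save reports under ./my_reports instead of the default ./cyclops_reports.
report = ModelCardReport(output_dir="./my_reports")
# ... populate the report as shown above ...
report_path = report.export(output_filename="discharge_prediction_report.html")
print(report_path)  # path to the HTML; a JSON model card is saved alongside it
```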
|
1244 |
| - { |
1245 |
| - "cell_type": "markdown", |
1246 |
| - "metadata": {}, |
1247 |
| - "source": [ |
1248 |
| - "**Log the performance metrics to the report.**\n", |
1249 |
| - "\n", |
1250 |
| - "We can add a performance metric to the model card using the `log_performance_metric` method, which expects a dictionary where the keys are in the following format: `slice_name/metric_name`. For instance, `overall/accuracy`. \n", |
1251 |
| - "\n", |
1252 |
| - "We first need to process the evaluation results to get the metrics in the right format." |
1253 |
| - ] |
1254 |
| - }, |
1255 |
| - { |
1256 |
| - "cell_type": "code", |
1257 |
| - "execution_count": null, |
1258 |
| - "metadata": { |
1259 |
| - "tags": [] |
1260 |
| - }, |
1261 |
| - "outputs": [], |
1262 |
| - "source": [ |
1263 |
| - "test_datasets = [\n", |
1264 |
| - " test_dataset.shard(NUM_EVALS, i, contiguous=True) for i in range(NUM_EVALS)\n", |
1265 |
| - "]" |
1266 |
| - ] |
1267 |
| - }, |
1268 | 1311 | {
|
1269 | 1312 | "cell_type": "code",
|
1270 | 1313 | "execution_count": null,
|
1271 | 1314 | "metadata": {},
|
1272 | 1315 | "outputs": [],
|
1273 | 1316 | "source": [
|
1274 |
| - "eval_timestamps = [test_dataset[\"dischtime\"][-1] for test_dataset in test_datasets]\n", |
1275 |
| - "\n", |
1276 |
| - "for i, test_dataset in enumerate(test_datasets):\n", |
1277 |
| - " if i > 0:\n", |
1278 |
| - " report = ModelCardReport()\n", |
1279 |
| - " report.log_owner(\n", |
1280 |
| - " name=\"CyclOps Team\",\n", |
1281 |
| - " contact=\"vectorinstitute.github.io/cyclops/\",\n", |
1282 |
| - " email=\"cyclops@vectorinstitute.ai\",\n", |
1283 |
| - " )\n", |
1284 |
| - " results, dataset_with_preds = mortality_task.evaluate(\n", |
1285 |
| - " test_dataset,\n", |
1286 |
| - " metric_collection,\n", |
1287 |
| - " model_names=model_name,\n", |
1288 |
| - " transforms=preprocessor,\n", |
1289 |
| - " prediction_column_prefix=\"preds\",\n", |
1290 |
| - " slice_spec=slice_spec,\n", |
1291 |
| - " batch_size=64,\n", |
1292 |
| - " )\n", |
1293 |
| - " results_flat = flatten_results_dict(\n", |
1294 |
| - " results=results,\n", |
1295 |
| - " remove_metrics=[\"BinaryROC\", \"BinaryPrecisionRecallCurve\"],\n", |
1296 |
| - " model_name=model_name_results,\n", |
1297 |
| - " )\n", |
1298 |
| - " for name, metric in results_flat.items():\n", |
1299 |
| - " split, name = name.split(\"/\") # noqa: PLW2901\n", |
1300 |
| - " descriptions = {\n", |
1301 |
| - " \"BinaryPrecision\": \"The proportion of predicted positive instances that are correctly predicted.\",\n", |
1302 |
| - " \"BinaryRecall\": \"The proportion of actual positive instances that are correctly predicted. Also known as recall or true positive rate.\",\n", |
1303 |
| - " \"BinaryAccuracy\": \"The proportion of all instances that are correctly predicted.\",\n", |
1304 |
| - " \"BinaryAUROC\": \"The area under the receiver operating characteristic curve (AUROC) is a measure of the performance of a binary classification model.\",\n", |
1305 |
| - " \"BinaryAveragePrecision\": \"The area under the precision-recall curve (AUPRC) is a measure of the performance of a binary classification model.\",\n", |
1306 |
| - " \"BinaryF1Score\": \"The harmonic mean of precision and recall.\",\n", |
1307 |
| - " }\n", |
1308 |
| - " report.log_quantitative_analysis(\n", |
1309 |
| - " \"performance\",\n", |
1310 |
| - " name=name,\n", |
1311 |
| - " value=metric.tolist(),\n", |
1312 |
| - " description=descriptions[name],\n", |
1313 |
| - " metric_slice=split,\n", |
1314 |
| - " pass_fail_thresholds=0.7,\n", |
1315 |
| - " pass_fail_threshold_fns=lambda x, threshold: bool(x >= threshold),\n", |
1316 |
| - " )\n", |
1317 |
| - " print(str(eval_timestamps[i]))\n", |
1318 |
| - " report_path = report.export(\n", |
1319 |
| - " output_filename=\"discharge_prediction_report_periodic.html\",\n", |
1320 |
| - " synthetic_timestamp=str(eval_timestamps[i]),\n", |
1321 |
| - " )\n", |
1322 |
| - " shutil.copy(f\"{report_path}\", \".\")\n", |
| 1317 | + "report_path = report.export(\n", |
| 1318 | + " output_filename=\"discharge_prediction_report_periodic.html\",\n", |
| 1319 | + " synthetic_timestamp=str(eval_timestamps[-1]),\n", |
| 1320 | + ")\n", |
|     | 1321 | +        "shutil.copy(report_path, \".\")\n", |
1323 | 1322 | "shutil.rmtree(\"./cyclops_reports\")"
|
1324 | 1323 | ]
|
1325 | 1324 | },
|
|