janosh
diff --git a/‎.pre-commit-config.yaml
+4-4 b/‎.pre-commit-config.yaml
+4-4
diff --git a/‎matbench_discovery/energy.py
+1-2 b/‎matbench_discovery/energy.py
+1-2
diff --git a/‎scripts/compile_metrics.py
+37-29 b/‎scripts/compile_metrics.py
+37-29
diff --git a/‎scripts/cumulative_clf_metrics.py
+1-1 b/‎scripts/cumulative_clf_metrics.py
+1-1
diff --git a/‎scripts/hist_classified_stable_vs_hull_dist_batches.py
+1-3 b/‎scripts/hist_classified_stable_vs_hull_dist_batches.py
+1-3
diff --git a/‎scripts/hist_classified_stable_vs_hull_dist_models.py
+3-3 b/‎scripts/hist_classified_stable_vs_hull_dist_models.py
+3-3
diff --git a/‎scripts/rolling_mae_vs_hull_dist_all_models.py
+1-1 b/‎scripts/rolling_mae_vs_hull_dist_all_models.py
+1-1
diff --git a/‎scripts/scatter_e_above_hull_models.py
+3-3 b/‎scripts/scatter_e_above_hull_models.py
+3-3
diff --git a/‎site/package.json
+11-11 b/‎site/package.json
+11-11
diff --git a/‎site/src/lib/ModelCard.svelte
+2-2 b/‎site/src/lib/ModelCard.svelte
+2-2
diff --git a/‎site/src/lib/index.ts
+10-2 b/‎site/src/lib/index.ts
+10-2
@@ -7,7 +7,7 @@ default_install_hook_types: [pre-commit, commit-msg]
 
 repos:
   - repo: https://github.com/PyCQA/isort
-    rev: 5.11.4
+    rev: 5.12.0
     hooks:
       - id: isort
 
@@ -59,7 +59,7 @@ repos:
         exclude: ^(.+references.yaml)$
 
   - repo: https://github.com/PyCQA/autoflake
-    rev: v2.0.0
+    rev: v2.0.1
     hooks:
       - id: autoflake
 
@@ -75,7 +75,7 @@ repos:
         exclude: ^(site/src/figs/.+\.svelte|data/wbm/20.+\..+|site/src/routes/.+\.(yml|yaml|json))$
 
   - repo: https://github.com/pre-commit/mirrors-eslint
-    rev: v8.31.0
+    rev: v8.33.0
     hooks:
       - id: eslint
         types: [file]
@@ -90,7 +90,7 @@ repos:
           - "@typescript-eslint/parser"
 
   - repo: https://github.com/PyCQA/pydocstyle
-    rev: 6.1.1
+    rev: 6.3.0
     hooks:
       - id: pydocstyle
         exclude: tests
@@ -176,7 +176,7 @@ def stable_metrics(
 
     Returns:
         dict[str, float]: dictionary of classification metrics with keys DAF, Precision,
-            Recall, Prevalence, Accuracy, F1, TPR, FPR, TNR, FNR, MAE, RMSE, R2.
+            Recall, Accuracy, F1, TPR, FPR, TNR, FNR, MAE, RMSE, R2.
     """
     true_pos, false_neg, false_pos, true_neg = classify_stable(
         true, pred, stability_threshold
@@ -198,7 +198,6 @@ def stable_metrics(
         DAF=precision / prevalence,
         Precision=precision,
         Recall=recall,
-        Prevalence=prevalence,
         Accuracy=(n_true_pos + n_true_neg) / len(true),
         F1=2 * (precision * recall) / (precision + recall),
         TPR=n_true_pos / (n_true_pos + n_false_neg),
 
@@ -3,16 +3,17 @@
 
 from typing import Any
 
+import numpy as np
 import pandas as pd
 import requests
 import wandb
 import wandb.apis.public
 from pymatviz.utils import save_fig
-from sklearn.metrics import f1_score, r2_score
 from tqdm import tqdm
 
 from matbench_discovery import FIGS, MODELS, WANDB_PATH, today
 from matbench_discovery.data import PRED_FILENAMES, load_df_wbm_preds
+from matbench_discovery.energy import stable_metrics
 from matbench_discovery.plots import px
 
 __author__ = "Janosh Riebesell"
@@ -97,10 +98,10 @@
 
     n_gpu, n_cpu = metadata.get("gpu_count", 0), metadata.get("cpu_count", 0)
     model_stats[model] = {
-        "run_time_h": run_time_total / 3600,
+        (time_col := "Run Time (h)"): run_time_total / 3600,
         "GPU": n_gpu,
         "CPU": n_cpu,
-        "slurm_jobs": n_runs,
+        "Slurm Jobs": n_runs,
     }
 
 
@@ -110,6 +111,7 @@
 )
 
 df_metrics = pd.DataFrame(model_stats).T
+df_metrics.index.name = "Model"
 # on 2022-11-28:
 # run_times = {'Voronoi Random Forest': 739608,
 #  'Wrenformer': 208399,
@@ -121,46 +123,50 @@
 # %%
 df_wbm = load_df_wbm_preds(list(models))
 e_form_col = "e_form_per_atom_mp2020_corrected"
-each_col = "e_above_hull_mp2020_corrected_ppd_mp"
+each_true_col = "e_above_hull_mp2020_corrected_ppd_mp"
 
 
 # %%
 for model in models:
-    dct = {}
-    e_above_hull_pred = df_wbm[model] - df_wbm[e_form_col]
-    isna = e_above_hull_pred.isna() | df_wbm[each_col].isna()
+    each_pred = df_wbm[each_true_col] + df_wbm[model] - df_wbm[e_form_col]
 
-    dct["F1"] = f1_score(df_wbm[each_col] < 0, e_above_hull_pred < 0)
-    dct["Precision"] = f1_score(
-        df_wbm[each_col] < 0, e_above_hull_pred < 0, pos_label=True
-    )
-    dct["Recall"] = f1_score(
-        df_wbm[each_col] < 0, e_above_hull_pred < 0, pos_label=False
-    )
-
-    dct["MAE"] = (e_above_hull_pred - df_wbm[each_col]).abs().mean()
+    metrics = stable_metrics(df_wbm[each_true_col], each_pred)
 
-    dct["RMSE"] = ((e_above_hull_pred - df_wbm[each_col]) ** 2).mean() ** 0.5
-    dct["R2"] = r2_score(df_wbm[each_col][~isna], e_above_hull_pred[~isna])
+    df_metrics.loc[model, list(metrics)] = metrics.values()
 
-    df_metrics.loc[model, list(dct)] = dct.values()
 
-
-df_styled = df_metrics.style.format(precision=3).background_gradient(
-    cmap="viridis",
-    # gmap=np.log10(df_table) # for log scaled color map
+# %%
+df_styled = (
+    df_metrics.reset_index()
+    .drop(columns=["GPU", "CPU", "Slurm Jobs"])
+    .style.format(precision=2)
+    .background_gradient(
+        cmap="viridis_r",  # lower is better so reverse color map
+        subset=["MAE", "RMSE", "FNR", "FPR"],
+    )
+    .background_gradient(
+        cmap="viridis_r",
+        subset=[time_col],
+        gmap=np.log10(df_metrics[time_col].to_numpy()),  # for log scaled color map
+    )
+    .background_gradient(
+        cmap="viridis",  # higher is better
+        subset=["DAF", "R2", "Precision", "Recall", "F1", "Accuracy", "TPR", "TNR"],
+    )
+    .hide(axis="index")
 )
+df_styled
 
 
 # %% export model metrics as styled HTML table
 styles = {
     "": "font-family: sans-serif; border-collapse: collapse;",
-    "td, th": "border: 1px solid #ddd; text-align: left; padding: 8px;",
+    "td, th": "border: 1px solid #ddd; text-align: left; padding: 8px; white-space: nowrap;",
 }
 df_styled.set_table_styles([dict(selector=sel, props=styles[sel]) for sel in styles])
 
-html_path = f"{FIGS}/{today}-metrics-table.html"
-# df_styled.to_html(html_path)
+html_path = f"{FIGS}/{today}-metrics-table.svelte"
+df_styled.to_html(html_path)
 
 
 # %% write model metrics to json for use by the website
@@ -169,14 +175,14 @@
     f"{x / len(df_wbm):.2%}" for x in df_metrics.missing_preds
 ]
 
-df_metrics.attrs["total_run_time"] = df_metrics.run_time.sum()
+df_metrics.attrs["Total Run Time"] = df_metrics[time_col].sum()
 
 df_metrics.round(2).to_json(f"{MODELS}/{today}-model-stats.json", orient="index")
 
 
 # %% plot model run times as pie chart
 fig = px.pie(
-    df_metrics, values="run_time", names=df_metrics.index, hole=0.5
+    df_metrics, values=time_col, names=df_metrics.index, hole=0.5
 ).update_traces(
     textinfo="percent+label",
     textfont_size=14,
@@ -189,12 +195,14 @@
 )
 fig.add_annotation(
     # add title in the middle saying "Total CPU+GPU time used"
-    text=f"Total CPU+GPU<br>time used:<br>{df_metrics.run_time.sum():.1f} h",
+    text=f"Total CPU+GPU<br>time used:<br>{df_metrics[time_col].sum():.1f} h",
     font=dict(size=18),
     x=0.5,
     y=0.5,
     showarrow=False,
 )
 fig.update_layout(margin=dict(l=0, r=0, t=0, b=0))
 
+
+# %%
 save_fig(fig, f"{FIGS}/{today}-model-run-times-pie.svelte")
@@ -15,7 +15,7 @@
     "CGCNN, Voronoi Random Forest, Wrenformer, MEGNet, M3GNet, BOWSR MEGNet"
 ).split(", ")
 
-df_wbm = load_df_wbm_preds(models=models).round(3)
+df_wbm = load_df_wbm_preds(models).round(3)
 
 # df_wbm.columns = [f"{col}_e_form" if col in models else col for col in df_wbm]
 e_form_col = "e_form_per_atom_mp2020_corrected"
 
@@ -35,9 +35,7 @@
 which_energy: WhichEnergy = "true"
 backend: Backend = "matplotlib"
 fig, axs = plt.subplots(2, 3, figsize=(18, 9))
-df_wbm[each_pred_col] = df_wbm[each_true_col] + (
-    df_wbm[model_name] - df_wbm[e_form_col]
-)
+df_wbm[each_pred_col] = df_wbm[each_true_col] + df_wbm[model_name] - df_wbm[e_form_col]
 
 
 for batch_idx, ax in zip(range(1, 6), axs.flat):
 
@@ -20,7 +20,7 @@
 models = sorted(
     "CGCNN, Voronoi Random Forest, Wrenformer, MEGNet, M3GNet, BOWSR MEGNet".split(", ")
 )
-df_wbm = load_df_wbm_preds(models=models).round(3)
+df_wbm = load_df_wbm_preds(models).round(3)
 
 e_form_col = "e_form_per_atom_mp2020_corrected"
 each_true_col = "e_above_hull_mp2020_corrected_ppd_mp"
@@ -39,8 +39,8 @@
     value_name=e_form_preds,
 )
 
-df_melt[each_pred_col] = df_melt[each_true_col] + (
-    df_melt[e_form_preds] - df_melt[e_form_col]
+df_melt[each_pred_col] = (
+    df_melt[each_true_col] + df_melt[e_form_preds] - df_melt[e_form_col]
 )
 
 
 
@@ -16,7 +16,7 @@
 e_form_col = "e_form_per_atom_mp2020_corrected"
 e_above_hull_col = "e_above_hull_mp2020_corrected_ppd_mp"
 
-df_wbm = load_df_wbm_preds(models=models).round(3)
+df_wbm = load_df_wbm_preds(models).round(3)
 
 
 # %%
 
@@ -16,7 +16,7 @@
 models = sorted(
     "CGCNN, Voronoi Random Forest, Wrenformer, MEGNet, M3GNet, BOWSR MEGNet".split(", ")
 )
-df_wbm = load_df_wbm_preds(models=models).round(3)
+df_wbm = load_df_wbm_preds(models).round(3)
 
 e_form_col = "e_form_per_atom_mp2020_corrected"
 each_true_col = "e_above_hull_mp2020_corrected_ppd_mp"
@@ -36,8 +36,8 @@
     value_name=e_form_pred_col,
 )
 
-df_melt[each_pred_col] = df_melt[each_true_col] + (
-    df_melt[e_form_pred_col] - df_melt[e_form_col]
+df_melt[each_pred_col] = (
+    df_melt[each_true_col] + df_melt[e_form_pred_col] - df_melt[e_form_col]
 )
 
 
 
@@ -17,14 +17,14 @@
     "make-api-docs": "cd .. && python scripts/make_api_docs.py"
   },
   "devDependencies": {
-    "@iconify/svelte": "^3.0.1",
+    "@iconify/svelte": "^3.1.0",
     "@rollup/plugin-yaml": "^4.0.1",
-    "@sveltejs/adapter-static": "^1.0.3",
-    "@sveltejs/kit": "^1.1.1",
+    "@sveltejs/adapter-static": "^1.0.5",
+    "@sveltejs/kit": "^1.3.7",
     "@sveltejs/vite-plugin-svelte": "^2.0.2",
-    "@typescript-eslint/eslint-plugin": "^5.48.1",
-    "@typescript-eslint/parser": "^5.48.1",
-    "eslint": "^8.32.0",
+    "@typescript-eslint/eslint-plugin": "^5.50.0",
+    "@typescript-eslint/parser": "^5.50.0",
+    "eslint": "^8.33.0",
     "eslint-plugin-svelte3": "^4.0.0",
     "hastscript": "^7.2.0",
     "katex": "^0.16.4",
@@ -36,14 +36,14 @@
     "rehype-slug": "^5.1.0",
     "remark-math": "3.0.0",
     "svelte": "^3.55.1",
-    "svelte-check": "^3.0.2",
-    "svelte-preprocess": "^5.0.0",
+    "svelte-check": "^3.0.3",
+    "svelte-preprocess": "^5.0.1",
     "svelte-toc": "^0.5.2",
-    "svelte-zoo": "^0.2.1",
+    "svelte-zoo": "^0.2.4",
     "svelte2tsx": "^0.6.0",
     "sveriodic-table": "^0.1.4",
-    "tslib": "^2.4.1",
-    "typescript": "^4.9.4",
+    "tslib": "^2.5.0",
+    "typescript": "^4.9.5",
     "vite": "^4.0.4"
   },
   "prettier": {
 
@@ -65,7 +65,7 @@
         <li>
           {#if ![`aviary`].includes(name)}
             {@const href = `https://pypi.org/project/${name}/${version}`}
-            {name}: <a {href}>{version}</a>
+            {name}: <a {href} {...target}>{version}</a>
           {:else}
             {name}: {version}
           {/if}
@@ -77,7 +77,7 @@
 <section class="metrics">
   <h3 class="toc-exclude">Metrics</h3>
   <ul>
-    {#each stats as [key, label, unit]}
+    {#each stats as { key, label, unit }}
       <li class:active={sort_by == key}>
         {@html label ?? key} = {data[key]}
         {unit ?? ``}
 
@@ -29,15 +29,23 @@ export type ModelStats = {
   missing_preds: number
   missing_percent: number
   Accuracy: number
-  run_time_h: string
+  'Run Time (h)': string
+  FPR: number
+  FNR: number
+  DAF: number
   GPUs: number
   CPUs: number
   slurm_jobs: number
   date_added: string
 }
 
 // { key, label?, unit?, tooltip? }
-export type ModelStatLabel = [keyof ModelStats, (string | null)?, string?]
+export type ModelStatLabel = {
+  key: keyof ModelStats
+  label?: string
+  unit?: string
+  tooltip?: string
+}
 
 export type Author = {
   name: string
Original file line number	Diff line number	Diff line change
`@@ -20,7 +20,7 @@`
`20`	`20`	`models = sorted(`
`21`	`21`	`"CGCNN, Voronoi Random Forest, Wrenformer, MEGNet, M3GNet, BOWSR MEGNet".split(", ")`
`22`	`22`	`)`
`23`		`-df_wbm = load_df_wbm_preds(models=models).round(3)`
	`23`	`+df_wbm = load_df_wbm_preds(models).round(3)`
`24`	`24`
`25`	`25`	`e_form_col = "e_form_per_atom_mp2020_corrected"`
`26`	`26`	`each_true_col = "e_above_hull_mp2020_corrected_ppd_mp"`
`@@ -39,8 +39,8 @@`
`39`	`39`	`value_name=e_form_preds,`
`40`	`40`	`)`
`41`	`41`
`42`		`-df_melt[each_pred_col] = df_melt[each_true_col] + (`
`43`		`- df_melt[e_form_preds] - df_melt[e_form_col]`
	`42`	`+df_melt[each_pred_col] = (`
	`43`	`+ df_melt[each_true_col] + df_melt[e_form_preds] - df_melt[e_form_col]`
`44`	`44`	`)`
`45`	`45`
`46`	`46`
Original file line number	Diff line number	Diff line change
`@@ -16,7 +16,7 @@`
`16`	`16`	`models = sorted(`
`17`	`17`	`"CGCNN, Voronoi Random Forest, Wrenformer, MEGNet, M3GNet, BOWSR MEGNet".split(", ")`
`18`	`18`	`)`
`19`		`-df_wbm = load_df_wbm_preds(models=models).round(3)`
	`19`	`+df_wbm = load_df_wbm_preds(models).round(3)`
`20`	`20`
`21`	`21`	`e_form_col = "e_form_per_atom_mp2020_corrected"`
`22`	`22`	`each_true_col = "e_above_hull_mp2020_corrected_ppd_mp"`
`@@ -36,8 +36,8 @@`
`36`	`36`	`value_name=e_form_pred_col,`
`37`	`37`	`)`
`38`	`38`
`39`		`-df_melt[each_pred_col] = df_melt[each_true_col] + (`
`40`		`- df_melt[e_form_pred_col] - df_melt[e_form_col]`
	`39`	`+df_melt[each_pred_col] = (`
	`40`	`+ df_melt[each_true_col] + df_melt[e_form_pred_col] - df_melt[e_form_col]`
`41`	`41`	`)`
`42`	`42`
`43`	`43`