add kwarg show_dft_acc=False to rolling_mae_vs_hull_dist()

janosh · janosh · commit 9aebb08207ff · 2023-06-19T20:29:23.000-07:00
fix about-the-test-set page showing WBM element counts in MP heatmap's hover data
diff --git a/data/wbm/analysis.py b/data/wbm/analysis.py
@@ -113,7 +113,6 @@
 fig.update_layout(showlegend=False, paper_bgcolor="rgba(0,0,0,0)")
 fig.update_xaxes(title_text="WBM energy above MP convex hull (eV/atom)")
 
-
 for x_pos, label in zip(
     [mean, mean + std, mean - std],
     [f"{mean = :.2f}", f"{mean + std = :.2f}", f"{mean - std = :.2f}"],
diff --git a/data/wbm/readme.md b/data/wbm/readme.md
@@ -94,7 +94,9 @@ The WBM test set has an energy above the MP convex hull distribution with mean *
 
 The dummy MAE of always predicting the test set mean is **0.17 eV/atom**.
 
-The number of stable materials is **97k** out of 257k, resulting in a dummy stability hit rate of **37%**.
+The number of stable materials (according to the MP convex hull, which is spanned by the training data the models have access to) is **97k** out of **257k**, resulting in a dummy stability hit rate of **37%**.
+
+> Incidentally, [according to the authors](https://www.nature.com/articles/s41524-020-00481-6#Sec2), a more accurate stability rate, based on the combined MP+WBM convex hull of the first 3 rounds of elemental substitution, is 18,479 out of 189,981 crystals ($\approx$ 9.7%).
 
 <slot name="wbm-each-hist">
   <img src="./figs/2023-01-26-wbm-each-hist.svg" alt="WBM energy above MP convex hull distribution">
diff --git a/matbench_discovery/plots.py b/matbench_discovery/plots.py
@@ -296,6 +296,7 @@ def rolling_mae_vs_hull_dist(
     y_label: str = "rolling MAE (eV/atom)",
     just_plot_lines: bool = False,
     with_sem: bool = True,
+    show_dft_acc: bool = False,
     **kwargs: Any,
 ) -> plt.Axes | go.Figure:
     """Rolling mean absolute error as the energy to the convex hull is varied. A scale
@@ -325,6 +326,9 @@ def rolling_mae_vs_hull_dist(
             to False.
         with_sem (bool, optional): If True, plot the standard error of the mean as
             shaded area around the rolling MAE. Defaults to True.
+        show_dft_acc (bool, optional): If True, change color of the cone of peril's tip
+            and annotate it with 'Corrected GGA Accuracy' at rolling MAE of 25 meV/atom.
+            Defaults to False.
 
     Returns:
         tuple[plt.Axes | go.Figure, pd.DataFrame, pd.DataFrame]: matplotlib Axes or
@@ -363,8 +367,8 @@ def rolling_mae_vs_hull_dist(
         # previous call
         return ax, df_rolling_err, df_err_std
 
-    # DFT accuracy at 25 meV/atom for e_above_hull calculations of chemically similar
-    # systems which is lower than formation energy error due to systematic error
+    # DFT accuracy at 25 meV/atom for relative difference of e_above_hull for chemically
+    # similar systems which is lower than formation energy error due to systematic error
     # cancellation among similar chemistries, supporting ref:
     href = "https://doi.org/10.1103/PhysRevB.85.155208"
     dft_acc = 0.025
@@ -397,32 +401,33 @@ def rolling_mae_vs_hull_dist(
         ax.add_artist(scale_bar)
 
         ax.fill_between(
-            (-1, -dft_acc, dft_acc, 1),
-            (1, 1, 1, 1),
-            (1, dft_acc, dft_acc, 1),
+            (-1, -dft_acc, dft_acc, 1) if show_dft_acc else (-1, 0, 1),
+            (1, 1, 1, 1) if show_dft_acc else (1, 1, 1),
+            (1, dft_acc, dft_acc, 1) if show_dft_acc else (1, 0, 1),
             color="tab:red",
             alpha=0.2,
         )
 
-        ax.fill_between(
-            (-dft_acc, 0, dft_acc),
-            (dft_acc, dft_acc, dft_acc),
-            (dft_acc, 0, dft_acc),
-            color="tab:orange",
-            alpha=0.2,
-        )
-        # shrink=0.1 means cut off 10% length from both sides of arrow line
-        arrowprops = dict(
-            facecolor="black", width=0.5, headwidth=5, headlength=5, shrink=0.1
-        )
-        ax.annotate(
-            xy=(-dft_acc, dft_acc),
-            xytext=(-2 * dft_acc, dft_acc),
-            text="Corrected\nGGA DFT\nAccuracy",
-            arrowprops=arrowprops,
-            verticalalignment="center",
-            horizontalalignment="right",
-        )
+        if show_dft_acc:
+            ax.fill_between(
+                (-dft_acc, 0, dft_acc),
+                (dft_acc, dft_acc, dft_acc),
+                (dft_acc, 0, dft_acc),
+                color="tab:orange",
+                alpha=0.2,
+            )
+            # shrink=0.1 means cut off 10% length from both sides of arrow line
+            arrowprops = dict(
+                facecolor="black", width=0.5, headwidth=5, headlength=5, shrink=0.1
+            )
+            ax.annotate(
+                xy=(-dft_acc, dft_acc),
+                xytext=(-2 * dft_acc, dft_acc),
+                text="Corrected GGA\nAccuracy",
+                arrowprops=arrowprops,
+                verticalalignment="center",
+                horizontalalignment="right",
+            )
 
         ax.text(
             0, 0.13, r"MAE > $|E_\mathrm{above\ hull}|$", horizontalalignment="center"
@@ -457,43 +462,49 @@ def rolling_mae_vs_hull_dist(
             yanchor="bottom",
             title_font=dict(size=13),
         )
-        ax.update_layout(
-            dict(
-                xaxis_title="E<sub>above MP hull</sub> (eV/atom)",
-                yaxis_title="rolling MAE (eV/atom)",
-            ),
-            legend=legend,
-        )
+        ax.layout.legend.update(legend)
+        ax.layout.xaxis.title.text = "E<sub>above MP hull</sub> (eV/atom)"
+        ax.layout.yaxis.title.text = "rolling MAE (eV/atom)"
         ax.update_xaxes(range=x_lim)
         ax.update_yaxes(range=y_lim)
-        scatter_kwds = dict(fill="toself", opacity=0.4)
-        ax.add_scatter(
-            x=(-1, -dft_acc, dft_acc, 1),
-            y=(1, dft_acc, dft_acc, 1),
-            name="MAE > |E<sub>above hull</sub>|",
-            # fillcolor="yellow",
-            **scatter_kwds,
-        )
+        scatter_kwds = dict(fill="toself", opacity=0.2)
+        peril_cone_anno = "MAE > |E<sub>above hull</sub>|"
         ax.add_scatter(
-            x=(-dft_acc, dft_acc, 0, -dft_acc),
-            y=(dft_acc, dft_acc, 0, dft_acc),
-            name="MAE < |DFT error|",
-            # fillcolor="red",
+            x=(-1, -dft_acc, dft_acc, 1) if show_dft_acc else (-1, 0, 1),
+            y=(1, dft_acc, dft_acc, 1) if show_dft_acc else (1, 0, 1),
+            name=peril_cone_anno,
+            fillcolor="red",
+            showlegend=False,
             **scatter_kwds,
         )
         ax.add_annotation(
-            x=-dft_acc,
-            y=dft_acc,
-            text=f"<a {href=}>Corrected GGA Accuracy<br>for rel. Energy</a> "
-            "[<a href='#hautier_accuracy_2012' target='_self'>ref</a>]",
-            showarrow=True,
-            xshift=-10,
-            arrowhead=2,
-            ax=-4 * dft_acc,
-            ay=2 * dft_acc,
-            axref="x",
-            ayref="y",
+            x=0,
+            y=0.8,
+            text=peril_cone_anno,
+            showarrow=False,
+            yref="paper",
         )
+        if show_dft_acc:
+            ax.add_scatter(
+                x=(-dft_acc, dft_acc, 0, -dft_acc),
+                y=(dft_acc, dft_acc, 0, dft_acc),
+                name="MAE < |Corrected GGA error|",
+                fillcolor="red",
+                **scatter_kwds,
+            )
+            ax.add_annotation(
+                x=-dft_acc,
+                y=dft_acc,
+                text=f"<a {href=}>Corrected GGA Accuracy<br>for rel. Energy</a> "
+                "[<a href='#hautier_accuracy_2012' target='_self'>ref</a>]",
+                showarrow=True,
+                xshift=-10,
+                arrowhead=2,
+                ax=-4 * dft_acc,
+                ay=2 * dft_acc,
+                axref="x",
+                ayref="y",
+            )
 
         ax.data = ax.data[::-1]  # bring px.line() to front
         # plot rectangle to indicate MAE window size
diff --git a/matbench_discovery/structure.py b/matbench_discovery/structure.py
@@ -25,3 +25,26 @@ def perturb_structure(struct: Structure, gamma: float = 1.5) -> Structure:
         site.to_unit_cell(in_place=True)
 
     return perturbed
+
+
+if __name__ == "__main__":
+    import matplotlib.pyplot as plt
+
+    gamma = 1.5
+    samples = np.array([np.random.weibull(gamma) for _ in range(10000)])
+    mean = samples.mean()
+
+    # reproduces the dist in https://www.nature.com/articles/s41524-022-00891-8#Fig5
+    ax = plt.hist(samples, bins=100)
+    # add vertical line at the mean
+    plt.axvline(mean, color="gray", linestyle="dashed", linewidth=1)
+    # annotate the mean line
+    plt.annotate(
+        f"{mean = :.2f}",
+        xy=(mean, 1),
+        # use ax coords for y
+        xycoords=("data", "axes fraction"),
+        # add text offset
+        xytext=(10, -20),
+        textcoords="offset points",
+    )
diff --git a/site/src/routes/about-the-test-set/+page.svelte b/site/src/routes/about-the-test-set/+page.svelte
@@ -69,11 +69,11 @@
       <TableInset slot="inset" grid_row="3">
         {#if active_mp_elem?.name}
           <strong>
-            {active_mp_elem?.name}: {pretty_num(wbm_elem_counts[active_mp_elem?.symbol])}
+            {active_mp_elem?.name}: {pretty_num(mp_elem_counts[active_mp_elem?.symbol])}
             <!-- compute percent of total -->
-            {#if wbm_elem_counts[active_mp_elem?.symbol] > 0}
+            {#if mp_elem_counts[active_mp_elem?.symbol] > 0}
               {@const total = wbm_heat_vals.reduce((a, b) => a + b, 0)}
-              ({pretty_num((wbm_elem_counts[active_mp_elem?.symbol] / total) * 100)}%)
+              ({pretty_num((mp_elem_counts[active_mp_elem?.symbol] / total) * 100)}%)
             {/if}
           </strong>
         {/if}