janosh
diff --git a/‎.github/workflows/test.yml
+10-10 b/‎.github/workflows/test.yml
+10-10
diff --git a/‎.gitignore
+2-1 b/‎.gitignore
+2-1
diff --git a/‎.pre-commit-config.yaml
+2 b/‎.pre-commit-config.yaml
+2
diff --git a/‎assets/scripts/brillouin/brillouin_zone_3d.py
+8-1 b/‎assets/scripts/brillouin/brillouin_zone_3d.py
+8-1
diff --git a/‎assets/scripts/classify/precision_recall_curve.py
+1-1 b/‎assets/scripts/classify/precision_recall_curve.py
+1-1
diff --git a/‎assets/scripts/cluster/composition/cluster_compositions_matbench.py
+9-1 b/‎assets/scripts/cluster/composition/cluster_compositions_matbench.py
+9-1
diff --git a/‎assets/scripts/sankey/sankey_from_2_df_cols.py
+14-18 b/‎assets/scripts/sankey/sankey_from_2_df_cols.py
+14-18
diff --git a/‎assets/scripts/structure_viz/structure_2d.py
+2-2 b/‎assets/scripts/structure_viz/structure_2d.py
+2-2
diff --git a/‎assets/scripts/sunburst/chem_sys_sunburst.py
+3-3 b/‎assets/scripts/sunburst/chem_sys_sunburst.py
+3-3
diff --git a/‎assets/scripts/track_pymatviz_citations.py
+1 b/‎assets/scripts/track_pymatviz_citations.py
+1
diff --git a/‎assets/scripts/treemap/chem_sys_treemap.py
+1-1 b/‎assets/scripts/treemap/chem_sys_treemap.py
+1-1
diff --git a/‎examples/dataset_exploration/boltztrap_mp/explore_boltztrap_mp.py ‎examples/boltztrap_mp/explore_boltztrap_mp.py b/‎examples/dataset_exploration/boltztrap_mp/explore_boltztrap_mp.py ‎examples/boltztrap_mp/explore_boltztrap_mp.py
diff --git a/‎examples/dataset_exploration/camd_2022/explore_camd_2022.py ‎examples/camd_2022/explore_camd_2022.py b/‎examples/dataset_exploration/camd_2022/explore_camd_2022.py ‎examples/camd_2022/explore_camd_2022.py
diff --git a/‎examples/compare_elastic_constants.py
+5-1 b/‎examples/compare_elastic_constants.py
+5-1
@@ -30,10 +30,10 @@ jobs:
       test-cmd: pytest --durations 20 --cov-branch --cov-report=xml --cov pymatviz --splits 4 --group ${{ matrix.split }} --splitting-algorithm least_duration
       upload-coverage: strict
 
-  find-scripts:
+  find-example-scripts:
     runs-on: ubuntu-latest
     outputs:
-      script_list: ${{ steps.set-matrix.outputs.script_list }}
+      example_scripts: ${{ steps.set-matrix.outputs.example_scripts }}
     steps:
       - name: Check out repository
         uses: actions/checkout@v4
@@ -42,26 +42,26 @@ jobs:
         id: set-matrix
         run: |
           SCRIPTS=$(find assets/scripts -name "*.py" | jq -R -s -c 'split("\n")[:-1]')
-          echo "script_list=$SCRIPTS" >> $GITHUB_OUTPUT
+          echo "example_scripts=$SCRIPTS" >> $GITHUB_OUTPUT
 
-  test-scripts:
-    needs: find-scripts
+  test-example-scripts:
+    needs: find-example-scripts
     runs-on: ubuntu-latest
     strategy:
       fail-fast: false
       matrix:
-        script: ${{fromJson(needs.find-scripts.outputs.script_list)}}
+        example_script: ${{fromJson(needs.find-example-scripts.outputs.example_scripts)}}
     steps:
       - name: Check out repository
         uses: actions/checkout@v4
 
       - name: Set up Python
         uses: actions/setup-python@v5
         with:
-          python-version: "3.10"
+          python-version: 3.11
 
-      - name: Install package and dependencies
-        run: pip install -e .[make-assets,cluster]
+      - name: Set up uv
+        uses: astral-sh/setup-uv@v2
 
       - name: Run script
-        run: python ${{ matrix.script }}
+        run: uv run --with-editable .[make-assets] ${{ matrix.example_script }}
@@ -7,8 +7,9 @@ build/
 examples/*.html
 examples/**/*.json.gz
 examples/**/*.json.xz
+examples/**/*.csv.*
 examples/**/*.pt
-examples/dataset_exploration/**/*.pdf
+examples/**/*.pdf
 gnome
 assets/scripts/pmv-used-by-list-*.yaml*
 *.archive
 
@@ -38,6 +38,8 @@ repos:
         exclude: ^assets/.+\.(svg|html)$
       - id: mixed-line-ending
       - id: trailing-whitespace
+      - id: check-added-large-files
+        args: [--maxkb=1024]
 
   - repo: https://github.com/codespell-project/codespell
     rev: v2.4.1
 
@@ -1,3 +1,10 @@
+# /// script
+# dependencies = [
+#     "seekpath>=2.1",
+# ]
+# ///
+
+
 # %%
 from glob import glob
 
@@ -12,7 +19,7 @@
     tuple(
         path.split("/")[-1].replace(".json.gz", "").rsplit("-", maxsplit=2)
     ): Structure.from_file(path)
-    for path in glob(f"{TEST_FILES}/structures/*-*-*-*.json.gz")
+    for path in glob(f"{TEST_FILES}/structures/mp-*-*-*.json.gz")
 }
 
 
 
@@ -5,7 +5,7 @@
 import pymatviz as pmv
 
 
-pmv.set_plotly_template("pymatviz_dark")
+pmv.set_plotly_template("pymatviz_white")
 
 # Random classification data
 np_rng = np.random.default_rng(seed=0)
 
@@ -3,6 +3,13 @@
 Resulting plots are colored by target property of each dataset.
 """
 
+# /// script
+# dependencies = [
+#     "matminer>=0.9.1",
+#     "umap-learn>=0.5",
+# ]
+# ///
+
 from __future__ import annotations
 
 import gzip
@@ -163,8 +170,9 @@ def process_dataset(
     (*mb_steels, "magpie", "pca", 2, dict(x=0.01, xanchor="left")),
     # 2. Steels with t-SNE (2D) - shows non-linear clustering
     (*mb_steels, "magpie", "tsne", 2, dict(x=0.01, xanchor="left")),
+    # TODO: umap-learn seemingly not installed by `uv run` in CI, re-enable when fixed
     # 3. JDFT2D with UMAP (2D) - shows modern non-linear projection
-    (*mb_jdft2d, "magpie", "umap", 2, dict(x=0.01, xanchor="left")),
+    # (*mb_jdft2d, "magpie", "umap", 2, dict(x=0.01, xanchor="left")),
     # 4. JDFT2D with one-hot encoding and PCA (3D) - shows raw element relationships
     (*mb_jdft2d, "one-hot", "pca", 3, dict()),
     # 5. Steels with Matscholar embedding and t-SNE (3D) - shows advanced embedding
 
@@ -1,7 +1,6 @@
 # %%
 import pandas as pd
-from mp_api.client import MPRester
-from mp_api.client.core import MPRestError
+from matminer.datasets import load_dataset
 
 import pymatviz as pmv
 from pymatviz.enums import Key
@@ -11,31 +10,28 @@
 
 
 # %% Sankey diagram of crystal systems and space groups
-try:
-    with MPRester(use_document_model=False) as mpr:
-        fields = [Key.mat_id, "symmetry.crystal_system", "symmetry.symbol"]
-    docs = mpr.materials.summary.search(
-        num_elements=(1, 3), fields=fields, num_chunks=30, chunk_size=1000
-    )
-except MPRestError:
-    raise SystemExit(0) from None
+data_name = "matbench_phonons"
+df_phonons = load_dataset(data_name)
 
+df_sym = pd.DataFrame(
+    struct.get_symmetry_dataset(backend="moyopy", return_raw_dataset=True).as_dict()
+    for struct in df_phonons[Key.structure]
+).rename(columns={"number": Key.spg_num})
+df_sym[Key.crystal_system] = df_sym[Key.spg_num].map(pmv.utils.spg_to_crystal_sys)
 
-# %%
-df_mp = pd.json_normalize(docs).set_index(Key.mat_id)
-df_mp.columns = [Key.crystal_system, Key.spg_symbol]
 
-frequent_symbols = df_mp[Key.spg_symbol].value_counts().nlargest(20).index
+# %%
+frequent_symbols = df_sym[Key.spg_num].value_counts().nlargest(20).index
 
-df_spg = df_mp.query(f"{Key.spg_symbol} in @frequent_symbols")
+df_spg = df_sym.query(f"{Key.spg_num} in @frequent_symbols")
 
 
 # %%
 fig = pmv.sankey_from_2_df_cols(
-    df_spg, [Key.crystal_system, Key.spg_symbol], labels_with_counts="percent"
+    df_spg, [Key.crystal_system, Key.spg_num], labels_with_counts="percent"
 )
-title = "Common Space Groups in Materials Project"
+title = f"Common Space Groups in {data_name}"
 fig.layout.title = dict(text=title, x=0.5, y=0.95)
 fig.layout.margin.t = 50
 fig.show()
-pmv.io.save_and_compress_svg(fig, "sankey-crystal-sys-to-spg-symbol")
+pmv.io.save_and_compress_svg(fig, f"sankey-{data_name}")
@@ -4,7 +4,6 @@
 
 import matplotlib.pyplot as plt
 from matminer.datasets import load_dataset
-from mp_api.client import MPRester
 from pymatgen.core import Structure
 
 import pymatviz as pmv
@@ -29,7 +28,7 @@
 fig.show()
 
 
-# %% Plot some disordered structures in 2D
+# %% 2D plots of disordered structures
 struct_mp_ids = ("mp-19017", "mp-12712")
 structure_dir = f"{TEST_FILES}/structures"
 
@@ -41,6 +40,7 @@
             raise FileNotFoundError(
                 f"structure for {mp_id} not found, run this script locally to fetch it."
             )
+        from mp_api.client import MPRester
 
         struct: Structure = MPRester().get_structure_by_material_id(
             mp_id, conventional_unit_cell=True
 
@@ -62,9 +62,9 @@
 
 # %% Load the Ward metallic glasses https://pubs.acs.org/doi/10.1021/acs.chemmater.6b04153
 data_path = "ward_metallic_glasses/ward-metallic-glasses.csv.xz"
-df_mg = pd.read_csv(
-    f"{ROOT}/examples/dataset_exploration/{data_path}", na_values=()
-).query("comment.isna()")
+df_mg = pd.read_csv(f"{ROOT}/examples/{data_path}", na_values=()).query(
+    "comment.isna()"
+)
 
 fig = pmv.chem_sys_sunburst(
     df_mg[Key.composition],
 
@@ -11,6 +11,7 @@
 # dependencies = [
 #     "google-search-results>=2.4.2",
 #     "pyyaml>=6.0.2",
+#     "python-dotenv>=1.1",
 # ]
 # ///
 
 
@@ -35,7 +35,7 @@
 
 
 # %% Load the Ward metallic glass dataset https://pubs.acs.org/doi/10.1021/acs.chemmater.6b04153
-csv_path = f"{ROOT}/examples/dataset_exploration/ward_metallic_glasses/ward-metallic-glasses.csv.xz"  # noqa: E501
+csv_path = f"{ROOT}/examples/ward_metallic_glasses/ward-metallic-glasses.csv.xz"
 df_mg = pd.read_csv(csv_path, na_values=()).query("comment.isna()")
 
 fig = pmv.chem_sys_treemap(
 
@@ -19,12 +19,16 @@
 from emmet.core.elasticity import ElasticityDoc
 from mace.calculators import mace_mp
 from matcalc.elasticity import ElasticityCalc
-from mp_api.client import MPRester
 from tqdm import tqdm
 
 import pymatviz as pmv
 
 
+try:
+    from mp_api.client import MPRester
+except ImportError:
+    raise SystemExit(0) from None
+
 pmv.set_plotly_template("pymatviz_white")
 checkpoint = "https://github.com/ACEsuit/mace-mp/releases/download/mace_matpes_0/MACE-matpes-pbe-omat-ft.model"