Skip to content

Commit ba932c2

Browse files
committed
Fix the wandb project name in slurm_array_m3gnet_relax_wbm.py: m3gnet -> matbench-discovery.
Update data_path from f"{ROOT}/data/2022-06-26-wbm-cses-and-initial-structures.json.gz" to f"{ROOT}/data/wbm/2022-10-19-wbm-cses+init-structs.json.bz2".
1 parent 3b2be74 commit ba932c2

File tree

3 files changed: 17 additions (+17) and 24 deletions (-24).

models/bowsr/slurm_array_bowsr_wbm.py

+4 -4 (4 additions, 4 deletions)
Original file line number | Diff line number | Diff line change
@@ -21,9 +21,7 @@
2121
__date__ = "2022-08-15"
2222

2323
"""
24-
To slurm submit this file, run:
25-
26-
python path/to/file.py slurm-submit
24+
To slurm submit this file: python path/to/file.py slurm-submit
2725
2826
Requires MEGNet and MAML installation: pip install megnet maml
2927
"""
@@ -112,7 +110,9 @@
112110
print(f"Loading from {data_path = }")
113111
df_wbm = pd.read_json(data_path).set_index("material_id")
114112

115-
df_this_job = np.array_split(df_wbm, slurm_array_task_count)[slurm_array_task_id - 1]
113+
df_this_job: pd.DataFrame = np.array_split(df_wbm, slurm_array_task_count)[
114+
slurm_array_task_id - 1
115+
]
116116

117117

118118
# %%

models/m3gnet/join_m3gnet_relax_results.py

+7 -14 (7 additions, 14 deletions)
Original file line number | Diff line number | Diff line change
@@ -21,8 +21,8 @@
2121

2222
# %%
2323
module_dir = os.path.dirname(__file__)
24-
task_type = "RS2RE"
25-
date = "2022-08-19"
24+
task_type = "IS2RE"
25+
date = "2022-10-31"
2626
glob_pattern = f"{date}-m3gnet-wbm-relax-{task_type}/*.json.gz"
2727
file_paths = sorted(glob(f"{module_dir}/{glob_pattern}"))
2828
print(f"Found {len(file_paths):,} files for {glob_pattern = }")
@@ -38,8 +38,7 @@
3838
continue
3939
try:
4040
# keep whole dataframe in memory
41-
df = pd.read_json(file_path)
42-
df.index = df.index.str.replace("_", "-")
41+
df = pd.read_json(file_path).set_index("material_id")
4342
df.index.name = "material_id"
4443
col_map = dict(
4544
final_structure="m3gnet_structure", trajectory="m3gnet_trajectory"
@@ -52,24 +51,18 @@
5251
df["volume"] = df.m3gnet_structure.map(lambda x: x.volume)
5352
df["n_sites"] = df.m3gnet_structure.map(len)
5453
dfs[file_path] = df.drop(columns=["m3gnet_trajectory"])
55-
except (ValueError, FileNotFoundError):
56-
# pandas v1.5+ correctly raises FileNotFoundError, below raises ValueError
54+
except FileNotFoundError:
5755
continue
5856

5957

6058
# %%
6159
df_m3gnet = pd.concat(dfs.values())
62-
if any(df_m3gnet.index.str.contains("_")):
63-
df_m3gnet.index = df_m3gnet.index.str.replace("_", "-")
6460

6561

6662
# %%
67-
pd_entries_m3gnet = [
68-
PDEntry(row.m3gnet_structure.composition, row.m3gnet_energy)
69-
for row in df_m3gnet.itertuples()
70-
]
71-
df_m3gnet["e_form_m3gnet_from_ppd"] = [
72-
get_e_form_per_atom(entry) for entry in pd_entries_m3gnet
63+
df_m3gnet["e_form_per_atom_m3gnet"] = [
64+
get_e_form_per_atom(PDEntry(row.m3gnet_structure.composition, row.m3gnet_energy))
65+
for row in tqdm(df_m3gnet.itertuples(), total=len(df_m3gnet), disable=None)
7366
]
7467
df_m3gnet.isna().sum()
7568

models/m3gnet/slurm_array_m3gnet_relax_wbm.py

+6 -6 (6 additions, 6 deletions)
Original file line number | Diff line number | Diff line change
@@ -17,9 +17,7 @@
1717
from matbench_discovery.slurm import slurm_submit_python
1818

1919
"""
20-
To slurm submit this file, run:
21-
22-
python path/to/file.py slurm-submit
20+
To slurm submit this file: python path/to/file.py slurm-submit
2321
2422
Requires M3GNet installation: pip install m3gnet
2523
"""
@@ -69,11 +67,13 @@
6967

7068

7169
# %%
72-
data_path = f"{ROOT}/data/2022-06-26-wbm-cses-and-initial-structures.json.gz"
70+
data_path = f"{ROOT}/data/wbm/2022-10-19-wbm-cses+init-structs.json.bz2"
7371
print(f"Loading from {data_path=}")
7472
df_wbm = pd.read_json(data_path).set_index("material_id")
7573

76-
df_this_job = np.array_split(df_wbm, slurm_array_task_count)[slurm_array_task_id - 1]
74+
df_this_job: pd.DataFrame = np.array_split(df_wbm, slurm_array_task_count)[
75+
slurm_array_task_id - 1
76+
]
7777

7878
run_params = dict(
7979
data_path=data_path,
@@ -89,7 +89,7 @@
8989
wandb.login()
9090

9191
wandb.init(
92-
project="m3gnet",
92+
project="matbench-discovery",
9393
name=f"{job_name}-{slurm_job_id}-{slurm_array_task_id}",
9494
config=run_params,
9595
)

0 commit comments

Comments
 (0)