Skip to content

Commit 1523f4a

Browse files
author
sfluegel
committed
Clean up semantic loss eval run lists; remove PubChem k-means __main__ block
1 parent 3851ee8 commit 1523f4a

File tree

2 files changed

+16
-21
lines changed

2 files changed

+16
-21
lines changed

chebai/preprocessing/datasets/pubchem.py

Lines changed: 0 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -559,16 +559,6 @@ def download(self):
559559
f.write("\n".join(smiles_list))
560560

561561

562-
if __name__ == "__main__":
563-
kmeans_data = PubChemKMeans(
564-
n_clusters=100,
565-
random_size=10000,
566-
exclude_data_from=ChEBIOver100(chebi_version=231),
567-
include_min_n_clusters=10,
568-
)
569-
kmeans_data.download()
570-
571-
572562
class SWJPreChem(PubChem):
573563
UNLABELED = True
574564

chebai/result/analyse_sem.py

Lines changed: 16 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -521,6 +521,7 @@ def run_all(
521521
print(traceback.format_exc())
522522

523523

524+
# Run predictions / metric calculations for the semantic loss paper runs (NeSy 2024 submission)
524525
def run_semloss_eval(mode="eval"):
525526
non_wandb_runs = []
526527
if mode == "preds":
@@ -531,25 +532,29 @@ def run_semloss_eval(mode="eval"):
531532
run_all(ids, skip_analyse=True, nonwandb_runs=non_wandb_runs)
532533

533534
if mode == "eval":
534-
new_14 = [
535-
"e4ba0ff8",
535+
prod = [
536+
"tk15yznc",
537+
"uke62a8m",
538+
"w0h3zr5s",
539+
]
540+
xu19 = [
536541
"5ko8knb4",
537-
"hk8555ff",
542+
"061fd85t",
538543
"r50ioujs",
539-
"w0h3zr5s",
544+
]
545+
prod_mixed = [
546+
"hk8555ff",
540547
"e0lxw8py",
548+
"lig23cmg",
549+
]
550+
luka = [
541551
"0c0s48nh",
542552
"lfg384bp",
543-
"75o8bc3h",
544-
"lig23cmg",
545553
"qeghvubh",
546-
"uke62a8m",
547-
"061fd85t",
548-
"tk15yznc",
549554
]
550555
baseline = ["i4wtz1k4", "zd020wkv", "rc1q3t49"]
551-
k2 = ["ng3usn0p", "rp0wwzjv", "8fma1q7r"]
552-
ids = baseline
556+
prodk2 = ["ng3usn0p", "rp0wwzjv", "8fma1q7r"]
557+
ids = baseline + prod + prodk2 + xu19 + luka + prod_mixed
553558
run_all(
554559
ids,
555560
skip_preds=True,

0 commit comments

Comments
 (0)