shreyab21 committed on
Commit
38af4fb
·
verified ·
1 Parent(s): 469ab5a

Upload 6 files

Browse files
data/graph_utils.py ADDED
File without changes
data/processed/embeddings.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1b762b7245a4b3741327b7df504a5fc01aa71cb123dab7589e4d397fce493a6
3
+ size 10234
data/processed/generate_dummy_embeddings.py ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import torch
2
+ import pickle
3
+
4
+ # Example SMILES strings
5
+ smiles_list = ["CC(=O)OC1=CC=CC=C1C(=O)O", "C1CCCCC1", "CCN(CC)CC"]
6
+
7
+ # Create 256-D random embeddings
8
+ embeddings_dict = {smi: torch.randn(256) for smi in smiles_list}
9
+
10
+ # Save to embeddings.pkl
11
+ with open("data/processed/embeddings.pkl", "wb") as f:
12
+ pickle.dump(embeddings_dict, f)
13
+
14
+ print("Saved dummy embeddings to data/processed/embeddings.pkl")
data/protein_target.fasta ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ >Target_Protein_Demo
2
+ MKTAYIAKQRQISFVKSHFSRQDILDLIC
data/raw/test_smiles.csv ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ smiles
2
+ CCO
3
+ CC(=O)O
4
+ CC(=O)OC1=CC=CC=C1C(=O)O
data/raw/zone_iv_synthetic.csv ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ smiles,shelf_life_days
2
+ CCO,365
3
+ CC(=O)O,400
4
+ CC(=O)OC1=CC=CC=C1C(=O)O,300
5
+ CCC,450
6
+ C1CCCCC1,500
7
+ C1=CC=CC=C1,480