moslem commited on
Commit
45e8fda
·
verified ·
1 Parent(s): aa7fb75

Upload Model

Browse files
Files changed (6) hide show
  1. .gitattributes +35 -35
  2. README.md +13 -13
  3. best_model.h5 +3 -0
  4. gradio_app.py +77 -0
  5. requirements.txt +4 -0
  6. utils.py +42 -0
.gitattributes CHANGED
@@ -1,35 +1,35 @@
1
- *.7z filter=lfs diff=lfs merge=lfs -text
2
- *.arrow filter=lfs diff=lfs merge=lfs -text
3
- *.bin filter=lfs diff=lfs merge=lfs -text
4
- *.bz2 filter=lfs diff=lfs merge=lfs -text
5
- *.ckpt filter=lfs diff=lfs merge=lfs -text
6
- *.ftz filter=lfs diff=lfs merge=lfs -text
7
- *.gz filter=lfs diff=lfs merge=lfs -text
8
- *.h5 filter=lfs diff=lfs merge=lfs -text
9
- *.joblib filter=lfs diff=lfs merge=lfs -text
10
- *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
- *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
- *.model filter=lfs diff=lfs merge=lfs -text
13
- *.msgpack filter=lfs diff=lfs merge=lfs -text
14
- *.npy filter=lfs diff=lfs merge=lfs -text
15
- *.npz filter=lfs diff=lfs merge=lfs -text
16
- *.onnx filter=lfs diff=lfs merge=lfs -text
17
- *.ot filter=lfs diff=lfs merge=lfs -text
18
- *.parquet filter=lfs diff=lfs merge=lfs -text
19
- *.pb filter=lfs diff=lfs merge=lfs -text
20
- *.pickle filter=lfs diff=lfs merge=lfs -text
21
- *.pkl filter=lfs diff=lfs merge=lfs -text
22
- *.pt filter=lfs diff=lfs merge=lfs -text
23
- *.pth filter=lfs diff=lfs merge=lfs -text
24
- *.rar filter=lfs diff=lfs merge=lfs -text
25
- *.safetensors filter=lfs diff=lfs merge=lfs -text
26
- saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
- *.tar.* filter=lfs diff=lfs merge=lfs -text
28
- *.tar filter=lfs diff=lfs merge=lfs -text
29
- *.tflite filter=lfs diff=lfs merge=lfs -text
30
- *.tgz filter=lfs diff=lfs merge=lfs -text
31
- *.wasm filter=lfs diff=lfs merge=lfs -text
32
- *.xz filter=lfs diff=lfs merge=lfs -text
33
- *.zip filter=lfs diff=lfs merge=lfs -text
34
- *.zst filter=lfs diff=lfs merge=lfs -text
35
- *tfevents* filter=lfs diff=lfs merge=lfs -text
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -1,13 +1,13 @@
1
- ---
2
- title: Predict Tfbs
3
- emoji: 🐨
4
- colorFrom: green
5
- colorTo: purple
6
- sdk: gradio
7
- sdk_version: 5.49.1
8
- app_file: app.py
9
- pinned: false
10
- short_description: Predict Transcription Factor Binding Site – TFBS
11
- ---
12
-
13
- Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
 
1
+ ---
2
+ title: Predict Tfbs
3
+ emoji: 🐨
4
+ colorFrom: green
5
+ colorTo: purple
6
+ sdk: gradio
7
+ sdk_version: 5.49.1
8
+ app_file: app.py
9
+ pinned: false
10
+ short_description: Predict Transcription Factor Binding Site – TFBS
11
+ ---
12
+
13
+ Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
best_model.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ceb5e3ce3c81064cf2bf7e736f302bf11cbddeb0b7aaebb41d29c4a2f401892
3
+ size 192032
gradio_app.py ADDED
@@ -0,0 +1,77 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # gradio_app.py
2
+ # Gradio rewrite of the original Streamlit app for TFBS prediction
3
+
4
+ import os
5
+ import gradio as gr
6
+ import numpy as np
7
+ from utils import dnaseq_features
8
+ from keras.models import load_model
9
+
10
+ # Load model once at startup (make sure best_model.h5 is present in the repo)
11
+ model = load_model('best_model.h5')
12
+
13
+
14
+ def predict(dna_seq: str):
15
+ """Take a DNA sequence string, compute features, run the model and return a Markdown summary."""
16
+ dna_seq = (dna_seq or "").strip()
17
+ if not dna_seq:
18
+ return "**Please provide an input DNA sequence.**"
19
+
20
+ # compute features using user's util function
21
+ try:
22
+ dna_ohe_feat, ds_index, ds_val = dnaseq_features(seq=dna_seq)
23
+ except Exception as e:
24
+ return f"Error while computing features: {e}"
25
+
26
+ # predict
27
+ try:
28
+ predicted = model.predict(dna_ohe_feat)
29
+ except Exception as e:
30
+ return f"Error during model prediction: {e}"
31
+
32
+ # build output as Markdown list with probabilities/scores
33
+ lines = []
34
+ for i, j in zip(ds_val, predicted):
35
+ try:
36
+ # if prediction is a vector like [p0, p1]
37
+ if hasattr(j, "__len__") and len(j) >= 2:
38
+ prob = float(j[1])
39
+ label = "**TFBS found ✅**" if np.argmax(j) == 1 else "**TFBS not found ❌**"
40
+ lines.append(f"- `{i}` — {label} (probability: {prob:.4f})")
41
+ else:
42
+ # single scalar output
43
+ score = float(j)
44
+ label = "**TFBS found ✅**" if score > 0.5 else "**TFBS not found ❌**"
45
+ lines.append(f"- `{i}` — {label} (score: {score:.4f})")
46
+ except Exception:
47
+ # fallback
48
+ lines.append(f"- `{i}` — prediction: {j}")
49
+
50
+ if not lines:
51
+ return "No predictions were produced. Check the input or the model."
52
+
53
+ return "\n".join(lines)
54
+
55
+
56
+ # Gradio UI
57
+ title = "Simple Model Serving Web App for TFBS prediction"
58
+ description = "Get TFBS predictions from the latest model. Paste a DNA sequence and click **Make Prediction**."
59
+
60
+ with gr.Blocks(theme=None) as demo:
61
+ gr.Markdown(f"# {title}")
62
+ gr.Markdown(description)
63
+
64
+ with gr.Row():
65
+ seq_input = gr.Textbox(lines=6, placeholder="ATAGAGAC...", label="Input DNA sequence")
66
+
67
+ with gr.Row():
68
+ predict_btn = gr.Button("Make Prediction")
69
+
70
+ output = gr.Markdown()
71
+
72
+ predict_btn.click(fn=predict, inputs=seq_input, outputs=output)
73
+
74
+
75
+ if __name__ == "__main__":
76
+ port = int(os.environ.get("PORT", 7860))
77
+ demo.launch(server_name="0.0.0.0", server_port=port)
requirements.txt ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ gradio>=3.0
2
+ tensorflow>=2.10
3
+ keras
4
+ numpy
utils.py ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Function for when you want to prepare DNA sequence feature for ML applications
2
+ import numpy as np
3
+
4
+ # Function for when you want to prepare DNA sequence feature for ML applications
5
+ def dnaseq_features(seq):
6
+ start=0
7
+ n_segs=101
8
+ seq_name = 'seq'
9
+ remaind = len(seq)%n_segs
10
+ if(remaind != 0):
11
+ last_id = len(seq) - remaind
12
+ upd_seq = seq[start:last_id]
13
+ dic_seq = {}
14
+ for i in range(0,3):
15
+ a = int(i*n_segs) ; b = int(i*n_segs)+n_segs
16
+ identifier = f"{seq_name}_{a}:{b}"
17
+ dic_seq[identifier] = upd_seq[a:b]
18
+ lst_seq = dic_seq.values()
19
+ index = list(dic_seq.keys())
20
+ values = list(dic_seq.values())
21
+
22
+ # One hot encode
23
+ ii=-1
24
+ for data in lst_seq:
25
+ ii+=1
26
+ abc = 'ACGT'
27
+ char_to_int = dict((c, i) for i, c in enumerate(abc))
28
+ int_enc = [char_to_int[char] for char in data]
29
+ ohe = []
30
+ for value in int_enc:
31
+ base = [0 for _ in range(len(abc))]
32
+ base[value] = 1
33
+ ohe.append(base)
34
+ np_mat = np.array(ohe)
35
+ np_mat = np.expand_dims(np_mat,axis=0)
36
+
37
+ if(ii != 0):
38
+ matrix = np.concatenate([np_mat,matrix],axis=0)
39
+ else:
40
+ matrix = np_mat
41
+
42
+ return matrix,index,values