Upload 4 files
Browse files- README.md +10 -3
- app.py.txt +32 -0
- ldh_predictor.h5 +3 -0
- requirements.txt +3 -0
README.md
CHANGED
@@ -1,3 +1,10 @@
|
|
1 |
-
|
2 |
-
|
3 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# Lactate Dehydrogenase EC Number Predictor
|
2 |
+
|
3 |
+
This app predicts whether a protein sequence is a lactate dehydrogenase (LDH), reporting a probability for "LDH" and for "Not LDH".
|
4 |
+
|
5 |
+
## How to Use
|
6 |
+
1. Paste a protein sequence.
|
7 |
+
2. Click Submit.
|
8 |
+
3. See the predicted probabilities for "LDH" and "Not LDH".
|
9 |
+
|
10 |
+
Made using TensorFlow, Gradio, and Hugging Face Spaces.
|
app.py.txt
ADDED
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import gradio as gr
|
2 |
+
import numpy as np
|
3 |
+
from tensorflow.keras.models import load_model
|
4 |
+
|
5 |
+
# Keras model used for inference, loaded once at start-up from
# "ldh_predictor.h5" (path is relative to the working directory).
model = load_model("ldh_predictor.h5")

# Integer code for each of the 20 standard amino-acid letters (A=1 ... Y=20).
# Code 0 is deliberately not assigned here: predict_ldh uses it both for
# unrecognised characters and for padding.
aa_to_int = dict(zip('ACDEFGHIKLMNPQRSTVWY', range(1, 21)))

# Fixed number of positions fed to the model; inputs are truncated or
# zero-padded to exactly this length.
max_length = 500
|
11 |
+
|
12 |
+
def predict_ldh(sequence):
    """Classify a protein sequence as LDH or not LDH.

    The input is cleaned before encoding so that pasted text behaves the
    same as a bare upper-case sequence: FASTA header lines (those starting
    with ``>``) are dropped, all whitespace and line breaks are removed, and
    letters are upper-cased. Without this, line breaks and lowercase
    residues would be encoded as 0 -- the same code used for padding -- and
    would shift or blank out the real residues.

    Args:
        sequence: Amino-acid sequence as one-letter codes, optionally in
            FASTA format. ``None`` is treated like an empty string.

    Returns:
        A dict with keys ``"LDH"`` and ``"Not LDH"`` mapping to floats that
        sum to 1, in the form expected by ``gr.Label``.
    """
    raw_lines = (sequence or "").splitlines()
    # Keep only residue lines; str.split() with no argument removes every
    # kind of whitespace inside a line.
    residues = "".join(
        "".join(line.split())
        for line in raw_lines
        if not line.lstrip().startswith(">")
    ).upper()

    # Characters outside the 20-letter alphabet map to 0; anything past
    # max_length is discarded.
    encoded = [aa_to_int.get(aa, 0) for aa in residues[:max_length]]
    # Right-pad with zeros up to the fixed model input length (no-op when
    # the sequence already fills it).
    encoded += [0] * (max_length - len(encoded))

    # NOTE(review): assumes the model emits a single probability per sample
    # at position [0][0] -- confirm against the trained model's output layer.
    prob = model.predict(np.array([encoded]))[0][0]
    return {"LDH": float(prob), "Not LDH": float(1 - prob)}
|
18 |
+
|
19 |
+
# Example sequences shown beneath the input box; each inner list holds the
# value for the single text input.
example_sequences = [
    ["MATLKDQLIYNLLKEEQTPQNKITVVGVGAVGMACAISILMKDLADELALVDVIEDKLKGEMMDLQHGSLFLRTPKIVSGKDYNVTANSKLVIITAGARQQEGESRLNLVQRNVNIFKFIIPNVVKYSPNCKLLIVSNPVDILTYVAWKISGFPKNRVIGSGCNLDSARFRYLMGERLGVHPLSCHGWVLGEHGDSSVPVWSGMNVAGVSLKTLHPDLGTDKDKEQWKEVHKQVVESAYEVIKLKGYTSWAIGLSVADLAESIMKNLRRVHPVSTMIKGLYGIKDDVFLSVPCILGQNGISDLVKVTLTSEEEARLKKSADTLWGIQKELQF"],
    ["MSEPIRVLVTGAAGQIAYSLLYSIGNGSVFGKDQPIILVLLDITPMMGVLDGVLMELQDCALPLLKDVIATDKEDVAFKDLDVAILVGSMPRREGMERKDLLKANVKIFKSQGAALDKYAKKSVKVIVVGNPANTNCLTASKSAPSIPKENFSCLTRLDHNRAKAQIALKLGVTANDVKNVIIWGNHSSTQYPDVNHAKVKLQGKEVGVYEALKDDSWLKGEFVTTVQQRGAAVIKARKLSSAMSAAKAICDHVRDIWFGTPEGEFVSMGVISDGNSYGVPDDLLYSFPVVIKNKTWKFVEGLPINDFSREKMDLTAKELTEEKESAFEFLSSA"],
]

# Input and output widgets, created in the same order as before.
sequence_box = gr.Textbox(
    lines=5,
    placeholder="Paste protein sequence...",
    label="Protein Sequence",
)
prediction_label = gr.Label(label="Prediction")

# Wire predict_ldh to the widgets: one text input in, one label out.
interface = gr.Interface(
    fn=predict_ldh,
    inputs=sequence_box,
    outputs=prediction_label,
    title="🧬 DeepEnzyme: LDH Classifier",
    examples=example_sequences,
    description="Predict whether a protein is Lactate Dehydrogenase (LDH) using deep learning.",
)

# Start the web app.
interface.launch()
|
ldh_predictor.h5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dec828e1ca53f77fe8298c8e2265a3a442a315cdfcdf6ae3b1436fbd9d19c739
|
3 |
+
size 12566936
|
requirements.txt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
tensorflow
|
2 |
+
gradio
|
3 |
+
numpy
|