Spaces:

samsl
/

conplex-dti

Sleeping

App Files Community

samsl committed on Jul 14

Commit

dfffe94

•

1 Parent(s): c394816

Switch to huggingface hosted model

Browse files

Files changed (3) hide show

app.py +2 -11
models/conplex_v1_bindingdb.pt +0 -3
publish_model.py +99 -0

app.py CHANGED Viewed

@@ -11,9 +11,8 @@ from tempfile import TemporaryDirectory
 from torch.utils.data import DataLoader
 from pathvalidate import sanitize_filename
 from conplex_dti.featurizer import MorganFeaturizer, ProtBertFeaturizer
-from conplex_dti.model.architectures import SimpleCoembeddingNoSigmoid
 theme = "Default"
 title = "ConPLex: Predicting Drug-Target Interactions"
@@ -55,10 +54,6 @@ The pairs file should be a tab-separated values file where each row is a candida
 def predict(run_name, model_name, csv_file, progress = gr.Progress()):
-    MODEL_MAP = {
-        "ConPLex_V1_BindingDB": "./models/conplex_v1_bindingdb.pt",
-    }
     try:
         with TemporaryDirectory() as tmpdir:
             run_id = uuid4()
@@ -84,11 +79,7 @@ def predict(run_name, model_name, csv_file, progress = gr.Progress()):
             drug_featurizer.preload(query_df["moleculeSmiles"].unique())
             target_featurizer.preload(query_df["proteinSequence"].unique())
-            model = SimpleCoembeddingNoSigmoid(
-                drug_featurizer.shape, target_featurizer.shape, 1024
-            )
-            model.load_state_dict(torch.load(MODEL_MAP[model_name], map_location=device))
             model = model.eval()
             model = model.to(device)

 from torch.utils.data import DataLoader
 from pathvalidate import sanitize_filename
 from conplex_dti.featurizer import MorganFeaturizer, ProtBertFeaturizer
+from publish_model import ConPLex_DTI
 theme = "Default"
 title = "ConPLex: Predicting Drug-Target Interactions"
 def predict(run_name, model_name, csv_file, progress = gr.Progress()):
     try:
         with TemporaryDirectory() as tmpdir:
             run_id = uuid4()
             drug_featurizer.preload(query_df["moleculeSmiles"].unique())
             target_featurizer.preload(query_df["proteinSequence"].unique())
+            model = ConPLex_DTI.from_pretrained(f"samsl/{model_name}")
             model = model.eval()
             model = model.to(device)

models/conplex_v1_bindingdb.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:2b77a4c9179714eec84a40d6999b49b6c8efad0ec2bccd085cae9e5e08b94330
-size 12592799

publish_model.py ADDED Viewed

	@@ -0,0 +1,99 @@

+import torch
+import torch.nn as nn
+from huggingface_hub import PyTorchModelHubMixin
+#################################
+# Latent Space Distance Metrics #
+#################################
+class Cosine(nn.Module):  # metric module: cosine similarity via nn.CosineSimilarity with default arguments
+    def forward(self, x1, x2):  # NOTE(review): a fresh nn.CosineSimilarity module is constructed on every call
+        return nn.CosineSimilarity()(x1, x2)  # defaults reduce over dim=1, so presumably expects (N, D) inputs — TODO confirm
+class SquaredCosine(nn.Module):  # metric module: cosine similarity (default arguments), squared element-wise
+    def forward(self, x1, x2):  # NOTE(review): a fresh nn.CosineSimilarity module is constructed on every call
+        return nn.CosineSimilarity()(x1, x2) ** 2  # squaring discards the sign of the similarity
+class Euclidean(nn.Module):  # metric module: L2 distance computed with torch.cdist
+    def forward(self, x1, x2):
+        return torch.cdist(x1, x2, p=2.0)  # NOTE(review): cdist is all-pairs (every row of x1 vs every row of x2), unlike the row-wise cosine metrics — confirm intended
+class SquaredEuclidean(nn.Module):  # metric module: torch.cdist L2 distance, squared element-wise
+    def forward(self, x1, x2):
+        return torch.cdist(x1, x2, p=2.0) ** 2  # NOTE(review): all-pairs output like torch.cdist itself, not one value per row — confirm intended
+DISTANCE_METRICS = {  # name -> metric class; ConPLex_DTI indexes this with its latent_distance argument
+    "Cosine": Cosine,
+    "SquaredCosine": SquaredCosine,
+    "Euclidean": Euclidean,
+    "SquaredEuclidean": SquaredEuclidean,
+}
+ACTIVATIONS = {"ReLU": nn.ReLU, "GELU": nn.GELU, "ELU": nn.ELU, "Sigmoid": nn.Sigmoid}  # name -> activation class; ConPLex_DTI indexes this with latent_activation
+class ConPLex_DTI(nn.Module, PyTorchModelHubMixin):  # projects drug and target features into one latent space and scores each pair
+    def __init__(
+        self,
+        drug_shape=2048,  # input width of the drug projector's Linear layer
+        target_shape=1024,  # input width of the target projector's Linear layer
+        latent_dimension=1024,  # output width shared by both projectors
+        latent_activation="ReLU",  # key into ACTIVATIONS
+        latent_distance="Cosine",  # key into DISTANCE_METRICS; only read when classify is true
+        classify=True,  # True -> forward() calls classify(); False -> forward() calls regress()
+    ):
+        super().__init__()
+        self.drug_shape = drug_shape
+        self.target_shape = target_shape
+        self.latent_dimension = latent_dimension
+        self.do_classify = classify
+        self.latent_activation = ACTIVATIONS[latent_activation]  # stores the class, not an instance; unknown names raise KeyError
+        self.drug_projector = nn.Sequential(  # Linear(drug_shape -> latent_dimension) followed by the activation
+            nn.Linear(self.drug_shape, latent_dimension), self.latent_activation()
+        )
+        nn.init.xavier_normal_(self.drug_projector[0].weight)  # re-initialises the Linear weight only; the bias is left as created
+        self.target_projector = nn.Sequential(  # Linear(target_shape -> latent_dimension) followed by the activation
+            nn.Linear(self.target_shape, latent_dimension), self.latent_activation()
+        )
+        nn.init.xavier_normal_(self.target_projector[0].weight)  # re-initialises the Linear weight only; the bias is left as created
+        if self.do_classify:  # distance_metric and activator are only defined in classify mode
+            self.distance_metric = latent_distance
+            self.activator = DISTANCE_METRICS[self.distance_metric]()  # instantiates the selected metric module
+    def forward(self, drug, target):  # dispatches on the mode chosen at construction time
+        if self.do_classify:
+            return self.classify(drug, target)
+        else:
+            return self.regress(drug, target)
+    def regress(self, drug, target):  # scores each pair as the dot product of the two projections
+        drug_projection = self.drug_projector(drug)
+        target_projection = self.target_projector(target)
+        inner_prod = torch.bmm(  # batched (1 x L) @ (L x 1) with L = latent_dimension: one dot product per row
+            drug_projection.view(-1, 1, self.latent_dimension),
+            target_projection.view(-1, self.latent_dimension, 1),
+        ).squeeze()  # removes every size-1 dim, so a batch of one collapses to a 0-d tensor
+        return inner_prod.squeeze()  # NOTE(review): second squeeze is redundant after the one above
+    def classify(self, drug, target):  # scores each pair with the metric module selected at construction
+        drug_projection = self.drug_projector(drug)
+        target_projection = self.target_projector(target)
+        distance = self.activator(drug_projection, target_projection)  # named "distance", but the cosine metrics return a similarity
+        return distance.squeeze()  # removes every size-1 dim from the metric output
+if __name__ == "__main__":  # publishing script: load a local checkpoint, save it, push it, then reload it by repo id
+    model_path = "./models/conplex_v1_bindingdb.pt"  # NOTE(review): this same commit deletes models/conplex_v1_bindingdb.pt, so a local copy is required to run this
+    model = ConPLex_DTI()  # built with the default constructor arguments
+    model.load_state_dict(torch.load(model_path, map_location=torch.device("cpu")))  # map_location loads the weights onto CPU
+    model.save_pretrained("ConPLex_V1_BindingDB")  # local save under that path — see huggingface_hub docs for the files written
+    model.push_to_hub("ConPLex_V1_BindingDB")  # presumably needs Hub credentials for the target account — TODO confirm
+    model = ConPLex_DTI.from_pretrained("samsl/ConPLex_V1_BindingDB")  # presumably a round-trip check that the pushed model loads