Spaces:

svasthaintelligence
/

MeSHClassify

Runtime error

App Files Files Community

akapoor committed on Dec 25, 2022

Commit

0623078

•

1 Parent(s): d36a844

Upload 3 files

Browse files

Files changed (3) hide show

app.py +106 -0
data.pt +3 -0
requirements.txt +7 -0

app.py ADDED Viewed

	@@ -0,0 +1,106 @@

+import pandas as pd
+import numpy as np
+import torch.nn.functional as F
+import torch
+import os
+import torch.nn as nn
+from torch.utils.data import Dataset, DataLoader
+from transformers import BertTokenizerFast as BertTokenizer, AutoModelForSequenceClassification, AutoTokenizer,AutoModel,BertModel, AdamW, get_linear_schedule_with_warmup
+import pytorch_lightning as pl
+from pytorch_lightning.callbacks import ModelCheckpoint, EarlyStopping
+from pytorch_lightning.loggers import TensorBoardLogger
+import streamlit as st
+import torchmetrics
+pwd = os.path.dirname(__file__)
+MODEL_PATH = os.path.join(pwd,"data.pt")
+print(MODEL_PATH)
+BERT_MODEL_NAME = 'albert-base-v1'
+tokenizer = AutoTokenizer.from_pretrained(BERT_MODEL_NAME)
+class MeshNetwork(pl.LightningModule):
+  def __init__(self):
+    super().__init__()
+    self.bert = AutoModelForSequenceClassification.from_pretrained(BERT_MODEL_NAME, num_labels=13,return_dict=True)
+    self.criterion = F.cross_entropy
+  def forward(self, input_ids, attention_mask):
+    output = self.bert(input_ids=input_ids, attention_mask=attention_mask)
+    return output.logits
+  def training_step(self, batch, batch_idx):
+    input_ids = batch["input_ids"]
+    attention_mask = batch["attention_mask"]
+    y = batch['labels']
+    y_hat = self.forward(input_ids, attention_mask)
+    loss = self.criterion(y_hat, y)
+    # Calculate acc
+    predictions = F.softmax(y_hat, dim=1).argmax(dim=1)
+    acc = torchmetrics.functional.accuracy(predictions, y)
+    self.log("train_acc", acc, on_step=False,prog_bar=True, on_epoch=True, logger=True)
+    self.log("train_loss", loss, prog_bar=True, on_epoch=True, logger=True)
+    return {"loss": loss, "predictions": y_hat, "labels": y}
+  def validation_step(self, batch, batch_idx):
+    input_ids = batch["input_ids"]
+    attention_mask = batch["attention_mask"]
+    y = batch["labels"]
+    y_hat = self.forward(input_ids, attention_mask)
+    loss = self.criterion(y_hat, y)
+    predictions = F.softmax(y_hat, dim=1).argmax(dim=1)
+    acc = torchmetrics.functional.accuracy(predictions, y)
+    self.log("val_acc", acc, prog_bar=True, on_step = False,on_epoch=True, logger=True)
+    self.log("val_loss", loss, prog_bar=True, on_epoch = True, logger=True)
+  def test_step(self, batch, batch_idx):
+    input_ids = batch["input_ids"]
+    attention_mask = batch["attention_mask"]
+    y = batch["labels"]
+    y_hat = self.forward(input_ids, attention_mask)
+    loss = self.criterion(y_hat, y)
+    predictions = F.softmax(y_hat, dim=1).argmax(dim=1)
+    acc = torchmetrics.functional.accuracy(predictions, y)
+    self.log("test_acc", acc, prog_bar=True, on_step=False,on_epoch=True, logger=True)
+    self.log("test_loss", loss, prog_bar=True, on_epoch = True, logger=True)
+  def configure_optimizers(self):
+    optimizer = torch.optim.Adam(params = self.parameters())
+    return optimizer
+st.title("MeSH Classify")
+model = MeshNetwork()
+with st.spinner("Loading model..."):
+    model.load_state_dict(torch.load(MODEL_PATH))
+    model.eval()
+    print(model)
+st.success("Model loaded.")
+user_input = st.text_input("Enter text to be classified.")
+st.write("Check MeSH categories: [link](https://www.ncbi.nlm.nih.gov/mesh/1000048)")
+st.markdown("***")
+if st.button("Classify Text"):
+    if user_input:
+      encoding = tokenizer.encode_plus(
+      user_input,
+      add_special_tokens=True,
+      return_token_type_ids=False,
+      padding="max_length",
+      truncation=True,
+      return_attention_mask=True,
+      return_tensors='pt',
+      )
+      input_ids=encoding["input_ids"].flatten()
+      attention_mask=encoding["attention_mask"].flatten()
+      y_hat = model(input_ids=input_ids.reshape(-1, 512),attention_mask = attention_mask.reshape(-1, 512))
+      prob = F.softmax(y_hat, dim=1)
+      probs = prob.detach().numpy()
+      st.table(probs)
+      predictions = prob.argmax(dim=1)
+      st.write(predictions.detach().numpy())

data.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bb19f344593f34c9cb45609eccd24895e37df8eddcdc477e59b92d44b41b43fe
+size 46789201

requirements.txt ADDED Viewed

	@@ -0,0 +1,7 @@

+numpy==1.22.4
+pandas==1.4.1
+pytorch_lightning==1.6.3
+streamlit==1.10.0
+torch==1.11.0
+torchmetrics==0.8.2
+transformers==4.20.1