Spaces:
Paused
Paused
Upload 5 files
Browse files- app.py +48 -0
- model/sst-2-english/config.json +31 -0
- model/sst-2-english/pytorch_model.bin +3 -0
- model/sst-2-english/tokenizer_config.json +1 -0
- model/sst-2-english/vocab.txt +0 -0
app.py
ADDED
@@ -0,0 +1,48 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import string
|
2 |
+
import gradio as gr
|
3 |
+
import requests
|
4 |
+
import torch
|
5 |
+
from transformers import (
|
6 |
+
AutoConfig,
|
7 |
+
AutoModelForSequenceClassification,
|
8 |
+
AutoTokenizer,
|
9 |
+
)
|
10 |
+
|
11 |
+
# Map model output indices to human-readable sentiment labels.
custom_labels = {0: "neg", 1: "pos"}

# Use a forward-slash path: the original raw Windows path r'model\sst-2-english'
# contains a literal backslash on Linux (where HF Spaces run) and fails to
# resolve; forward slashes are accepted on Windows as well.
model_dir = "model/sst-2-english"

# Load the locally stored fine-tuned checkpoint (DistilBERT SST-2 per the
# bundled config.json) for binary text classification.
config = AutoConfig.from_pretrained(
    model_dir, num_labels=2, finetuning_task="text-classification"
)
tokenizer = AutoTokenizer.from_pretrained(model_dir)
model = AutoModelForSequenceClassification.from_pretrained(model_dir, config=config)

# Override the checkpoint's NEGATIVE/POSITIVE labels with the custom ones so
# downstream lookups via id2label return "neg"/"pos".
model.config.id2label = custom_labels
model.config.label2id = {v: k for k, v in custom_labels.items()}
20 |
+
def inference(input_text):
    """Classify the sentiment of *input_text*.

    Args:
        input_text: Raw input string typed into the Gradio textbox.

    Returns:
        The predicted label string ("neg" or "pos") from
        ``model.config.id2label``.
    """
    # Calling the tokenizer directly is the modern API; the legacy
    # batch_encode_plus call also passed the deprecated pad_to_max_length=True
    # flag, which duplicated padding="max_length" and triggers warnings.
    inputs = tokenizer(
        [input_text],
        max_length=512,
        truncation=True,
        padding="max_length",
        return_tensors="pt",
    )

    # No gradients needed for pure inference.
    with torch.no_grad():
        logits = model(**inputs).logits

    # Single example in the batch, so a global argmax picks its top class.
    predicted_class_id = logits.argmax().item()
    return model.config.id2label[predicted_class_id]
|
36 |
+
|
37 |
+
# Gradio UI: one text box in, the predicted sentiment label out.
demo = gr.Interface(
    fn=inference,
    inputs=gr.Textbox(label="Input Text", scale=2, container=False),
    outputs=gr.Textbox(label="Output Label"),
    # Each examples row must match the interface's inputs (exactly one text
    # field). The original rows also packed a gold label (1 / 0) as a second
    # value, which Gradio treats as an extra input and rejects.
    examples=[
        ["My last two weather pics from the storm on August 2nd. People packed up real fast after the temp dropped and winds picked up."],
        ["Lying Clinton sinking! Donald Trump singing: Let's Make America Great Again!"],
    ],
    title="Tutorial: BERT-based Text Classification",  # fixed typo "Classificatioin"
)

# debug=True surfaces tracebacks in the Space logs while developing.
demo.launch(debug=True)
|
model/sst-2-english/config.json
ADDED
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"activation": "gelu",
|
3 |
+
"architectures": [
|
4 |
+
"DistilBertForSequenceClassification"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.1,
|
7 |
+
"dim": 768,
|
8 |
+
"dropout": 0.1,
|
9 |
+
"finetuning_task": "sst-2",
|
10 |
+
"hidden_dim": 3072,
|
11 |
+
"id2label": {
|
12 |
+
"0": "NEGATIVE",
|
13 |
+
"1": "POSITIVE"
|
14 |
+
},
|
15 |
+
"initializer_range": 0.02,
|
16 |
+
"label2id": {
|
17 |
+
"NEGATIVE": 0,
|
18 |
+
"POSITIVE": 1
|
19 |
+
},
|
20 |
+
"max_position_embeddings": 512,
|
21 |
+
"model_type": "distilbert",
|
22 |
+
"n_heads": 12,
|
23 |
+
"n_layers": 6,
|
24 |
+
"output_past": true,
|
25 |
+
"pad_token_id": 0,
|
26 |
+
"qa_dropout": 0.1,
|
27 |
+
"seq_classif_dropout": 0.2,
|
28 |
+
"sinusoidal_pos_embds": false,
|
29 |
+
"tie_weights_": true,
|
30 |
+
"vocab_size": 30522
|
31 |
+
}
|
model/sst-2-english/pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60554cbd7781b09d87f1ececbea8c064b94e49a7f03fd88e8775bfe6cc3d9f88
|
3 |
+
size 267844284
|
model/sst-2-english/tokenizer_config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"model_max_length": 512, "do_lower_case": true}
|
model/sst-2-english/vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|