xjlulu committed
Commit 530d98b
1 Parent(s): 4ecf8d9

"second commit"

__pycache__/dataset.cpython-39.pyc ADDED
Binary file (2.76 kB)

__pycache__/model.cpython-39.pyc ADDED
Binary file (2.21 kB)

__pycache__/utils.cpython-39.pyc ADDED
Binary file (2.72 kB)
app.py CHANGED
@@ -1,7 +1,127 @@
  import gradio as gr
+ from typing import Dict, List
 
- def greet(name):
-     return "Hello " + name + "!!"
+ import torch
+ import torch.nn as nn
+ import torch.optim as optim
+ from torch.utils.data import DataLoader
 
- iface = gr.Interface(fn=greet, inputs="text", outputs="text")
- iface.launch()
+ import json
+ import pickle
+ from pathlib import Path
+
+ from dataset import SeqClsDataset
+ from utils import Vocab
+ from model import SeqClassifier
+
+ import ipdb
+
+ max_len = 128
+ hidden_size = 256
+ num_layers = 2
+ dropout = 0.1
+ bidirectional = True
+ lr = 1e-3
+ batch_size = 64
+ num_epoch = 5
+
+
+ TRAIN = "train"
+ DEV = "eval"
+ TEST = "test"
+ SPLITS = [TRAIN, DEV, TEST]
+
+ device = "cpu"
+ data_dir = Path("./data/intent/")
+ ckpt_dir = Path("./ckpt/intent/")
+ cache_dir = Path("./cache/intent/")
+ # Before executing, place intent2idx.json, embeddings.pt, vocab.pkl, and utils.py in /content
+ with open(cache_dir / "vocab.pkl", "rb") as f:
+     vocab: Vocab = pickle.load(f)
+ intent_idx_path = cache_dir / "intent2idx.json"
+ intent2idx: Dict[str, int] = json.loads(intent_idx_path.read_text())
+ data_paths = {split: data_dir / f"{split}.json" for split in SPLITS}
+ data = {split: json.loads(path.read_text()) for split, path in data_paths.items()}
+ datasets: Dict[str, SeqClsDataset] = {
+     split: SeqClsDataset(split_data, vocab, intent2idx, max_len)
+     for split, split_data in data.items()
+ }
+ # ipdb.set_trace()
+ test_loader = DataLoader(datasets['test'], batch_size=batch_size, shuffle=False)
+ embeddings = torch.load(cache_dir / "embeddings.pt")
+ embeddings.to(device)
+
+ # Load the best model after training
+ # Initialize a new model with the same architecture
+ best_model = SeqClassifier(
+     embeddings=embeddings,
+     hidden_size=hidden_size,
+     num_layers=num_layers,
+     dropout=dropout,
+     bidirectional=bidirectional,
+     num_class=len(intent2idx)
+ ).to(device)
+
+ # Define the path to the checkpoint file
+ ckpt_path = ckpt_dir / "model_checkpoint.pth"
+
+ # Load the model's state_dict and optimizer's state_dict from the checkpoint
+ checkpoint = torch.load(ckpt_path, map_location=torch.device('cpu'))
+
+ # Load the model's weights (load_state_dict returns a key report, not the model, so it is not chained with .to())
+ best_model.load_state_dict(checkpoint['model_state_dict'])
+
+ # Reinitialize the optimizer with the model's parameters and load its state
+ '''weight_decay = 1e-5
+ optimizer = optim.Adam(best_model.parameters(), lr=lr, weight_decay=weight_decay)
+ optimizer.load_state_dict(checkpoint['optimizer_state_dict'])'''
+
+ # Retrieve the epoch number from the checkpoint
+ epoch = checkpoint['epoch']
+
+ # Set the best model to evaluation mode
+ best_model.eval()
+
+
+ dic_intent2idx: Dict[str, int] = json.loads(intent_idx_path.read_text())
+ dic_idx2label = {idx: intent for intent, idx in dic_intent2idx.items()}
+
+ def Tidx2label(idx: int):
+     return dic_idx2label[idx]
+
+ with open(cache_dir / "vocab.pkl", "rb") as f:
+     vocab: Vocab = pickle.load(f)
+
+ # Turn a sentence into embedding (vocabulary) indices
+ def collate_fn(texts: str) -> torch.Tensor:
+     # Split the input text into whitespace-separated tokens
+     texts = texts.split()
+
+     # Use vocab to convert the tokens into an integer index sequence, padded to max_len
+     encoded_texts = vocab.encode_batch([[text for text in texts]], to_len=max_len)
+
+     # Convert the integer index sequence into a PyTorch tensor
+     encoded_text = torch.tensor(encoded_texts)
+     return encoded_text
+
+
+ def classify(text):
+     encoded_text = collate_fn(text).to(device)
+     output = best_model(encoded_text[0])
+     Predicted_class = torch.argmax(output).item()
+     prediction = Tidx2label(Predicted_class)
+     return prediction
+
+ demo = gr.Interface(
+     fn=classify,
+     inputs=gr.Textbox(placeholder="請輸入一段文字..."),
+     outputs="label",
+     interpretation="default",
+     examples=[
+         ["Take me to church"],
+         ["tell me what to call you"],
+         ["could you be a person"]
+     ]
+ )
+
+ demo.launch()
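For readers following the change, the snippet below is a minimal sketch (not part of the commit) of how one sentence flows through the same preprocessing and prediction path that the new collate_fn and classify set up. It assumes the names defined in app.py above (vocab, max_len, best_model, Tidx2label) are in scope and a PyTorch version that accepts the unbatched LSTM input app.py already relies on:

    # Illustrative only: one sentence through the app.py prediction path.
    import torch
    tokens = "how do i freeze my account".split()       # whitespace tokenization, as in collate_fn
    ids = vocab.encode_batch([tokens], to_len=max_len)   # pad/truncate to max_len (128) with [PAD] ids
    x = torch.tensor(ids)                                # shape (1, 128)
    logits = best_model(x[0])                            # eval-mode forward takes a single unbatched sequence
    print(Tidx2label(torch.argmax(logits).item()))       # an intent label string, e.g. "freeze_account" if predicted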
cache/intent/embeddings.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:f48c2a4bb711ddd28a95f849b676ab6c76a4aeff3ba01976ccea97a4808ce790
+ size 7789931
cache/intent/intent2idx.json ADDED
@@ -0,0 +1,152 @@
+ {
+   "last_maintenance": 0,
+   "car_rental": 1,
+   "transactions": 2,
+   "user_name": 3,
+   "credit_limit": 4,
+   "date": 5,
+   "greeting": 6,
+   "international_fees": 7,
+   "gas": 8,
+   "calculator": 9,
+   "redeem_rewards": 10,
+   "change_ai_name": 11,
+   "alarm": 12,
+   "pin_change": 13,
+   "update_playlist": 14,
+   "what_can_i_ask_you": 15,
+   "translate": 16,
+   "change_accent": 17,
+   "text": 18,
+   "thank_you": 19,
+   "where_are_you_from": 20,
+   "goodbye": 21,
+   "recipe": 22,
+   "interest_rate": 23,
+   "ingredients_list": 24,
+   "tire_pressure": 25,
+   "definition": 26,
+   "who_do_you_work_for": 27,
+   "todo_list": 28,
+   "improve_credit_score": 29,
+   "meaning_of_life": 30,
+   "change_speed": 31,
+   "exchange_rate": 32,
+   "next_holiday": 33,
+   "make_call": 34,
+   "insurance_change": 35,
+   "spending_history": 36,
+   "meal_suggestion": 37,
+   "fun_fact": 38,
+   "restaurant_suggestion": 39,
+   "tire_change": 40,
+   "calendar_update": 41,
+   "confirm_reservation": 42,
+   "next_song": 43,
+   "are_you_a_bot": 44,
+   "yes": 45,
+   "find_phone": 46,
+   "cancel_reservation": 47,
+   "what_is_your_name": 48,
+   "bill_balance": 49,
+   "direct_deposit": 50,
+   "flight_status": 51,
+   "order_status": 52,
+   "maybe": 53,
+   "transfer": 54,
+   "freeze_account": 55,
+   "cancel": 56,
+   "shopping_list": 57,
+   "measurement_conversion": 58,
+   "jump_start": 59,
+   "international_visa": 60,
+   "travel_alert": 61,
+   "oil_change_when": 62,
+   "accept_reservations": 63,
+   "report_lost_card": 64,
+   "pto_request_status": 65,
+   "repeat": 66,
+   "directions": 67,
+   "payday": 68,
+   "smart_home": 69,
+   "damaged_card": 70,
+   "lost_luggage": 71,
+   "carry_on": 72,
+   "insurance": 73,
+   "what_song": 74,
+   "current_location": 75,
+   "ingredient_substitution": 76,
+   "order": 77,
+   "todo_list_update": 78,
+   "reset_settings": 79,
+   "replacement_card_duration": 80,
+   "order_checks": 81,
+   "roll_dice": 82,
+   "new_card": 83,
+   "vaccines": 84,
+   "pto_used": 85,
+   "time": 86,
+   "how_old_are_you": 87,
+   "account_blocked": 88,
+   "card_declined": 89,
+   "who_made_you": 90,
+   "shopping_list_update": 91,
+   "rewards_balance": 92,
+   "restaurant_reviews": 93,
+   "change_user_name": 94,
+   "spelling": 95,
+   "nutrition_info": 96,
+   "restaurant_reservation": 97,
+   "timer": 98,
+   "cook_time": 99,
+   "whisper_mode": 100,
+   "travel_notification": 101,
+   "routing": 102,
+   "book_hotel": 103,
+   "apr": 104,
+   "w2": 105,
+   "gas_type": 106,
+   "schedule_meeting": 107,
+   "meeting_schedule": 108,
+   "reminder": 109,
+   "income": 110,
+   "plug_type": 111,
+   "what_are_your_hobbies": 112,
+   "schedule_maintenance": 113,
+   "report_fraud": 114,
+   "food_last": 115,
+   "traffic": 116,
+   "no": 117,
+   "reminder_update": 118,
+   "book_flight": 119,
+   "mpg": 120,
+   "pto_balance": 121,
+   "tell_joke": 122,
+   "calories": 123,
+   "balance": 124,
+   "rollover_401k": 125,
+   "weather": 126,
+   "change_language": 127,
+   "distance": 128,
+   "play_music": 129,
+   "min_payment": 130,
+   "sync_device": 131,
+   "pay_bill": 132,
+   "taxes": 133,
+   "share_location": 134,
+   "bill_due": 135,
+   "pto_request": 136,
+   "calendar": 137,
+   "uber": 138,
+   "do_you_have_pets": 139,
+   "change_volume": 140,
+   "timezone": 141,
+   "application_status": 142,
+   "flip_coin": 143,
+   "credit_score": 144,
+   "oil_change_how": 145,
+   "expiration_date": 146,
+   "credit_limit_change": 147,
+   "how_busy": 148,
+   "travel_suggestion": 149
+ }
cache/intent/vocab.pkl ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:9d4fa520420cf60655dd67114826cef0f8be23bc7ca07cdb3c072f2a400e242b
+ size 78973
cache/slot/embeddings.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:faba49b73dfdd2a98dbbfe7b53eed50b8edd9df716169e8f837558c5e24c42bf
+ size 4941099
cache/slot/tag2idx.json ADDED
@@ -0,0 +1,11 @@
+ {
+   "O": 0,
+   "B-date": 1,
+   "I-time": 2,
+   "B-time": 3,
+   "B-last_name": 4,
+   "I-people": 5,
+   "B-people": 6,
+   "I-date": 7,
+   "B-first_name": 8
+ }
cache/slot/vocab.pkl ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:c711af8ba9cba928df00a20913b2bcdd0738ab3b9210b4b9f10d0ff9dcf27f16
+ size 49861
ckpt/intent/model_checkpoint.pth ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:65fdb8e191b37fc6866acd1699f8978736bfb975b176d5ee0464f43301d928e8
+ size 56947301
data/intent/eval.json ADDED
The diff for this file is too large to render. See raw diff
 
data/intent/test.json ADDED
The diff for this file is too large to render. See raw diff
 
data/intent/train.json ADDED
The diff for this file is too large to render. See raw diff
 
data/slot/eval.json ADDED
The diff for this file is too large to render. See raw diff
 
data/slot/test.json ADDED
The diff for this file is too large to render. See raw diff
 
data/slot/train.json ADDED
The diff for this file is too large to render. See raw diff
 
dataset.py ADDED
@@ -0,0 +1,74 @@
+ from typing import List, Dict
+
+ import torch
+
+ from torch.utils.data import Dataset
+
+ from utils import Vocab
+
+
+ class SeqClsDataset(Dataset):
+     def __init__(
+         self,
+         data: List[Dict],
+         vocab: Vocab,
+         label_mapping: Dict[str, int],
+         max_len: int,
+     ):
+         self.data = data
+         self.vocab = vocab
+         self.label_mapping = label_mapping
+         self._idx2label = {idx: intent for intent, idx in self.label_mapping.items()}
+         self.max_len = max_len
+
+     def __len__(self) -> int:
+         return len(self.data)
+
+     def __getitem__(self, index) -> Dict:
+         instance = self.data[index]
+         return instance
+
+     @property
+     def num_classes(self) -> int:
+         return len(self.label_mapping)
+
+     def collate_fn(self, samples: List[Dict]) -> Dict:
+         # samples is the raw batch data
+         # collate_fn encodes the batch into vocabulary indices
+         # samples[0] = {'text': '~', 'intent': '~', 'id': 'train-0'}
+
+         # Extract the text and label data from every sample
+         texts = [sample["text"] for sample in samples]
+         labels = [sample["intent"] for sample in samples]
+
+         # Use vocab to turn the texts into integer index sequences, padded to max_len
+         encoded_texts = self.vocab.encode_batch([text.split() for text in texts], to_len=self.max_len)
+
+         # Turn the label strings into integer indices
+         encoded_labels = [self.label_mapping[label] for label in labels]
+
+         # Convert the integer index sequences into PyTorch tensors
+         encoded_text = torch.tensor(encoded_texts)
+         encoded_label = torch.tensor(encoded_labels)
+
+         # Build the batch dictionary
+         batch_data = {
+             "encoded_text": encoded_text,
+             "encoded_label": encoded_label
+         }
+
+         return batch_data
+
+     def label2idx(self, label: str):
+         return self.label_mapping[label]
+
+     def idx2label(self, idx: int):
+         return self._idx2label[idx]
+
+
+ class SeqTaggingClsDataset(SeqClsDataset):
+     ignore_idx = -100
+
+     def collate_fn(self, samples):
+         # TODO: implement collate_fn
+         raise NotImplementedError
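As a usage note, the sketch below (illustrative, not part of the commit) shows how SeqClsDataset is typically paired with a DataLoader via its collate_fn. The two inline samples are made up; vocab and intent2idx stand for the objects loaded from cache/intent/ in app.py, and both intent labels appear in intent2idx.json above:

    # Illustrative only: wiring SeqClsDataset to a DataLoader with its collate_fn.
    from torch.utils.data import DataLoader
    samples = [
        {"text": "what is my credit limit", "intent": "credit_limit", "id": "train-0"},
        {"text": "play some jazz", "intent": "play_music", "id": "train-1"},
    ]
    ds = SeqClsDataset(samples, vocab, intent2idx, max_len=128)
    loader = DataLoader(ds, batch_size=2, shuffle=True, collate_fn=ds.collate_fn)
    batch = next(iter(loader))
    print(batch["encoded_text"].shape, batch["encoded_label"].shape)   # torch.Size([2, 128]) torch.Size([2])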
environment.yml ADDED
@@ -0,0 +1,10 @@
+ name: adl-hw1
+ channels:
+   - defaults
+ dependencies:
+   - python=3.9
+   - cudatoolkit=10.2
+   - cudnn=7.6
+   - pip
+   - pip:
+     - pip-tools
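To reproduce this environment, the usual conda workflow should apply: conda env create -f environment.yml followed by conda activate adl-hw1. Note that the file pins CUDA 10.2 and cuDNN 7.6, while app.py above runs with device = "cpu".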
model.py ADDED
@@ -0,0 +1,76 @@
+ from typing import Dict
+
+ import torch
+ import torch.nn as nn
+
+ # Set device
+ device = "cuda" if torch.cuda.is_available() else "cpu"
+
+ class SeqClassifier(nn.Module):
+     def __init__(
+         self,
+         embeddings: torch.tensor,
+         hidden_size: int,
+         num_layers: int,
+         dropout: float,
+         bidirectional: bool,
+         num_class: int,
+     ) -> None:
+         super(SeqClassifier, self).__init__()
+         self.embed = nn.Embedding.from_pretrained(embeddings, freeze=False)
+         self.hidden_size = hidden_size
+         self.num_layers = num_layers
+         self.dropout = dropout
+         self.bidirectional = bidirectional
+         self.num_class = num_class
+
+         # model architecture
+         self.rnn = nn.LSTM(
+             input_size=embeddings.size(1),
+             hidden_size=hidden_size,
+             num_layers=num_layers,
+             dropout=dropout,
+             bidirectional=bidirectional,
+             batch_first=True
+         )
+         self.dropout_layer = nn.Dropout(p=self.dropout)
+         self.fc = nn.Linear(self.encoder_output_size, num_class)
+
+     @property
+     def encoder_output_size(self) -> int:
+         # calculate the output dimension of rnn
+         if self.bidirectional:
+             return self.hidden_size * 2
+         else:
+             return self.hidden_size
+
+     def forward(self, batch) -> torch.Tensor:
+         # Map the input token indices to word embeddings
+         embedded = self.embed(batch)
+
+         # Run through the LSTM layers
+         rnn_output, _ = self.rnn(embedded)
+         rnn_output = self.dropout_layer(rnn_output)
+
+         if not self.training:
+             last_hidden_state_forward = rnn_output[-1, :self.hidden_size]   # forward-direction hidden state (unbatched input)
+             last_hidden_state_backward = rnn_output[0, self.hidden_size:]   # backward-direction hidden state
+             combined_hidden_state = torch.cat((last_hidden_state_forward, last_hidden_state_backward), dim=0)
+
+             # Pass through the fully connected layer
+             logits = self.fc(combined_hidden_state)
+             return logits  # return the prediction
+
+         last_hidden_state_forward = rnn_output[:, -1, :self.hidden_size]   # forward-direction hidden state (batched input)
+         last_hidden_state_backward = rnn_output[:, 0, self.hidden_size:]   # backward-direction hidden state
+         combined_hidden_state = torch.cat((last_hidden_state_forward, last_hidden_state_backward), dim=1)
+
+         # Pass through the fully connected layer
+         logits = self.fc(combined_hidden_state)
+         return logits  # return the prediction
+
+
+ class SeqTagger(SeqClassifier):
+     def forward(self, batch) -> Dict[str, torch.Tensor]:
+         # TODO: implement model forward
+         raise NotImplementedError
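A quick shape check (illustrative only, using random stand-in embeddings rather than the pretrained embeddings.pt) clarifies the two forward paths above: batched input during training, a single unbatched sequence during inference. The dimensions 5000 x 300 are arbitrary for the sketch, and num_class=150 matches intent2idx.json:

    # Illustrative only: SeqClassifier output shapes with random embeddings.
    import torch
    fake_embeddings = torch.randn(5000, 300)                 # stand-in for embeddings.pt (vocab_size x emb_dim)
    model = SeqClassifier(fake_embeddings, hidden_size=256, num_layers=2,
                          dropout=0.1, bidirectional=True, num_class=150)
    x = torch.randint(0, 5000, (8, 128))                     # a batch of 8 padded index sequences
    model.train()
    print(model(x).shape)                                    # torch.Size([8, 150])
    model.eval()
    print(model(x[0]).shape)                                 # torch.Size([150]) for one unbatched sequence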
utils.py ADDED
@@ -0,0 +1,42 @@
+ from typing import Iterable, List
+
+ class Vocab:
+     PAD = "[PAD]"
+     UNK = "[UNK]"
+
+     def __init__(self, vocab: Iterable[str]) -> None:
+         self.token2idx = {
+             Vocab.PAD: 0,
+             Vocab.UNK: 1,
+             **{token: i for i, token in enumerate(vocab, 2)},
+         }
+
+     @property
+     def pad_id(self) -> int:
+         return self.token2idx[Vocab.PAD]
+
+     @property
+     def unk_id(self) -> int:
+         return self.token2idx[Vocab.UNK]
+
+     @property
+     def tokens(self) -> List[str]:
+         return list(self.token2idx.keys())
+
+     def token_to_id(self, token: str) -> int:
+         return self.token2idx.get(token, self.unk_id)
+
+     def encode(self, tokens: List[str]) -> List[int]:
+         return [self.token_to_id(token) for token in tokens]
+
+     def encode_batch(
+         self, batch_tokens: List[List[str]], to_len: int = None
+     ) -> List[List[int]]:
+         batch_ids = [self.encode(tokens) for tokens in batch_tokens]
+         to_len = max(len(ids) for ids in batch_ids) if to_len is None else to_len
+         padded_ids = pad_to_len(batch_ids, to_len, self.pad_id)
+         return padded_ids
+
+ def pad_to_len(seqs: List[List[int]], to_len: int, padding: int) -> List[List[int]]:
+     paddeds = [seq[:to_len] + [padding] * max(0, to_len - len(seq)) for seq in seqs]
+     return paddeds
+ return paddeds