ntgiaky
/

ner-smart-home

Token Classification

named-entity-recognition

Model card Files Files and versions

ntgiaky committed on Jun 10

Commit

1c8072b

·

verified ·

1 Parent(s): 9888d64

Update README.md

Files changed (1) hide show

README.md +19 -39

README.md CHANGED Viewed

@@ -178,30 +178,25 @@ print(result)
 For a complete NLU pipeline:
 ```python
-from transformers import pipeline
-# Load both models
-intent_classifier = pipeline("text-classification", model="ntgiaky/phobert-intent-classifier-smart-home")
-ner = pipeline("token-classification", model="ntgiaky/phobert-ner-smart-home", aggregation_strategy="simple")
-def process_command(text):
-    # Get intent
-    intent_result = intent_classifier(text)
-    intent = intent_result[0]['label']
-    # Get entities
-    entities = ner(text)
-    # Combine results
-    return {
-        'text': text,
-        'intent': intent,
-        'entities': entities
-    }
-# Example
-command = "điều chỉnh nhiệt độ điều hòa 25 độ"
-result = process_command(command)
 print(result)
 ```
@@ -209,23 +204,8 @@ print(result)
 ```python
 # Input: "bật đèn phòng khách"
-# Entities: [
-#   {'type': 'device', 'text': 'đèn'},
-#   {'type': 'living_space', 'text': 'phòng khách'}
-# ]
-# Input: "tắt quạt phòng ngủ lúc 10 giờ tối"
-# Entities: [
-#   {'type': 'device', 'text': 'quạt'},
-#   {'type': 'living_space', 'text': 'phòng ngủ'},
-#   {'type': 'time_at', 'text': '10 giờ tối'}
-# ]
-# Input: "điều chỉnh nhiệt độ điều hòa 25 độ"
-# Entities: [
-#   {'type': 'device', 'text': 'điều hòa'},
-#   {'type': 'target_number', 'text': '25 độ'}
-# ]
 ```
 ## Citation

 For a complete NLU pipeline:
 ```python
+from transformers import AutoTokenizer, AutoModelForTokenClassification, pipeline
+# Load with PhoBERT tokenizer explicitly
+tokenizer = AutoTokenizer.from_pretrained("vinai/phobert-base")
+model = AutoModelForTokenClassification.from_pretrained(
+    "ntgiaky/phobert-ner-smart-home",
+    ignore_mismatched_sizes=True  # Only needed if loading fails with a size-mismatch error; mismatched weights are then newly initialized
+)
+# Create pipeline with explicit tokenizer
+ner = pipeline(
+    "token-classification",
+    model=model,
+    tokenizer=tokenizer,
+    aggregation_strategy="simple"
+)
+# Test
+result = ner("bật đèn phòng khách")
 print(result)
 ```
 ```python
 # Input: "bật đèn phòng khách"
+# [{'entity_group': 'living_space', 'score': np.float32(0.97212785), 'word': 'đèn', 'start': None, 'end': None},
+# {'entity_group': 'duration', 'score': np.float32(0.9332844), 'word': 'phòng khách', 'start': None, 'end': None}]
 ```
 ## Citation