multi_task_bert_model / inference.py
kowalsky's picture
Upload inference.py
b3f6ef0 verified
raw
history blame
3.99 kB
import torch
import os
import sys
project_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
sys.path.append(project_dir)
from model import MultiTaskBertModel
from data_loader import load_dataset
from utils import bert_config, tokenizer, intent_ids_to_labels, intent_labels_to_ids
def load_model(model_path):
"""
Load the pre-trained model weights from the specified path.
Args:
model_path (str): Path to the pre-trained model weights.
Returns:
model (MultiTaskBertModel): Loaded model with pre-trained weights.
"""
# Initialize model with configuration and dataset information
config = bert_config()
dataset = load_dataset("training_dataset")
model = MultiTaskBertModel(config, dataset)
# Load the model weights from the specified path
model.load_state_dict(torch.load(model_path))
model.eval()
return model
def preprocess_input(input_data):
"""
Preprocess the input text data for inference.
Args:
input_data (str): Input text data to be preprocessed.
Returns:
input_ids (torch.Tensor): Tensor of input IDs after tokenization.
attention_mask (torch.Tensor): Tensor of attention mask indicating input tokens.
offset_mapping (torch.Tensor): Tensor of offset mappings for input tokens.
"""
# Tokenize the input text and get offset mappings
tok = tokenizer()
preprocessed_input = tok(input_data,
return_offsets_mapping=True,
padding='max_length',
truncation=True,
max_length=128)
# Convert preprocessed inputs to PyTorch tensors
input_ids = torch.tensor([preprocessed_input['input_ids']])
attention_mask = torch.tensor([preprocessed_input['attention_mask']])
offset_mapping = torch.tensor(preprocessed_input['offset_mapping'])
return input_ids, attention_mask, offset_mapping
def perform_inference(model, input_ids, attention_mask):
with torch.no_grad():
ner_logits, intent_logits = model.forward(input_ids, attention_mask)
return ner_logits, intent_logits
def align_ner_predictions_with_input(predictions, offset_mapping, input_text):
aligned_predictions = []
current_word_idx = 0
# Iterate through each prediction and its offset mapping
for prediction, (start, end) in zip(predictions, offset_mapping):
if start == end:
continue
# Find the corresponding word in the input text
word = input_text[start:end]
# Check if the current word is a special token or part of padding
if not word.strip():
continue
# Assign the prediction to the word
aligned_predictions.append((word, prediction))
return aligned_predictions
def convert_intent_to_label(intent_logit):
labels = intent_labels_to_ids()
intent_labels = intent_ids_to_labels(labels)
return intent_labels[int(intent_logit)]
def main():
"""
Main function to perform inference using the pre-trained model.
"""
# Load the pre-trained model
model_path = "pytorch_model.bin"
model = load_model(model_path)
input_data = input("Enter the text to analyze: ")
# Preprocess the input text
input_ids, attention_mask, offset_mapping = preprocess_input(input_data)
# Perform inference using the pre-trained model
ner_logits, intent_logits = perform_inference(model, input_ids, attention_mask)
# Post-process the model outputs and print the results
ner_logits = torch.argmax(ner_logits.view(-1, 9), dim=1)
intent_logits = torch.argmax(intent_logits)
ner_logits = align_ner_predictions_with_input(ner_logits, offset_mapping, input_data)
intent_label = convert_intent_to_label(intent_logits)
print(f"Ner logits: {ner_logits}")
print(f"Intent logits: {intent_label}")
if __name__ == "__main__":
main()