# multi_task_bert_model/inference.py
# Inference entry point for the multi-task BERT model (NER + intent classification).
import torch
import os
import sys
project_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
sys.path.append(project_dir)
from model import MultiTaskBertModel
from data_loader import load_dataset
from utils import bert_config, tokenizer, intent_ids_to_labels, intent_labels_to_ids
def load_model(model_path):
    """
    Load the pre-trained multi-task BERT model weights from disk.

    Args:
        model_path (str): Path to the saved state-dict file.

    Returns:
        MultiTaskBertModel: Model in eval mode with the loaded weights.
    """
    # Build the model skeleton from the shared config and the training
    # dataset (presumably the dataset supplies label-space sizes — TODO confirm).
    config = bert_config()
    dataset = load_dataset("training_dataset")
    model = MultiTaskBertModel(config, dataset)
    # map_location="cpu" lets a checkpoint saved on GPU load on a CPU-only
    # host; this script keeps every tensor on CPU anyway (no .to(device)).
    model.load_state_dict(torch.load(model_path, map_location=torch.device("cpu")))
    # Disable dropout / batch-norm updates for deterministic inference.
    model.eval()
    return model
def preprocess_input(input_data):
    """
    Tokenize raw text and package it as tensors for the model.

    Args:
        input_data (str): Raw text to preprocess.

    Returns:
        tuple: (input_ids, attention_mask, offset_mapping) torch.Tensors.
            input_ids and attention_mask carry a leading batch dimension
            of one; offset_mapping is per-token (no batch dimension).
    """
    tok = tokenizer()
    encoded = tok(
        input_data,
        return_offsets_mapping=True,
        padding='max_length',
        truncation=True,
        max_length=128,
    )
    # Wrap ids/mask as a batch of size one; offsets stay unbatched because
    # the alignment step iterates them token by token.
    input_ids = torch.tensor([encoded['input_ids']])
    attention_mask = torch.tensor([encoded['attention_mask']])
    offset_mapping = torch.tensor(encoded['offset_mapping'])
    return input_ids, attention_mask, offset_mapping
def perform_inference(model, input_ids, attention_mask):
    """
    Run a single forward pass without tracking gradients.

    Args:
        model: Model exposing forward(input_ids, attention_mask).
        input_ids (torch.Tensor): Token-id batch.
        attention_mask (torch.Tensor): Attention-mask batch.

    Returns:
        tuple: (ner_logits, intent_logits) as produced by the model.
    """
    # no_grad: inference only — skip autograd bookkeeping.
    with torch.no_grad():
        outputs = model.forward(input_ids, attention_mask)
    ner_logits, intent_logits = outputs
    return ner_logits, intent_logits
def align_ner_predictions_with_input(predictions, offset_mapping, input_text):
    """
    Map per-token NER predictions back onto words of the original text.

    Special tokens and padding — whose character span is empty or covers
    only whitespace — are dropped.

    Args:
        predictions: Iterable of per-token predictions, aligned index-wise
            with offset_mapping.
        offset_mapping: Iterable of (start, end) character offsets into
            input_text, one pair per token.
        input_text (str): The original, untokenized text.

    Returns:
        list[tuple]: (word, prediction) pairs for real-content tokens only.
    """
    # NOTE(review): removed unused local `current_word_idx` (dead code).
    aligned_predictions = []
    for prediction, (start, end) in zip(predictions, offset_mapping):
        # A zero-width span marks a special token or padding — skip it.
        if start == end:
            continue
        word = input_text[start:end]
        # Skip tokens whose span is pure whitespace.
        if not word.strip():
            continue
        aligned_predictions.append((word, prediction))
    return aligned_predictions
def convert_intent_to_label(intent_logit):
    """
    Translate a predicted intent index into its human-readable label.

    Args:
        intent_logit: Index of the predicted intent (int-convertible,
            e.g. a scalar tensor from argmax).

    Returns:
        The intent label corresponding to the index.
    """
    # Build the id -> label lookup from the project's label mapping.
    id_lookup = intent_ids_to_labels(intent_labels_to_ids())
    return id_lookup[int(intent_logit)]
def main():
    """
    Interactive entry point: load the pre-trained model, read one line of
    text from the user, and print the NER and intent predictions.
    """
    model = load_model("pytorch_model.bin")
    input_data = input("Enter the text to analyze: ")
    # Tokenize and run the forward pass.
    input_ids, attention_mask, offset_mapping = preprocess_input(input_data)
    ner_logits, intent_logits = perform_inference(model, input_ids, attention_mask)
    # Reduce logits to class indices; 9 looks like the NER tag-set
    # size — TODO confirm against the model's label space.
    ner_predictions = torch.argmax(ner_logits.view(-1, 9), dim=1)
    intent_prediction = torch.argmax(intent_logits)
    aligned = align_ner_predictions_with_input(ner_predictions, offset_mapping, input_data)
    intent_label = convert_intent_to_label(intent_prediction)
    print(f"Ner logits: {aligned}")
    print(f"Intent logits: {intent_label}")
if __name__ == "__main__":
    main()