Spaces:

emmatliu
/

LLMReferenceLetterBias

Runtime error

App Files Files Community

LLMReferenceLetterBias / hallucination_detection.py

emmatliu

Upload 6 files

a269338 verified over 1 year ago

raw

history blame contribute delete

2.49 kB

	import re
	import pandas as pd
	from tqdm import tqdm
	import torch
	import torch.nn as nn
	from transformers import AutoTokenizer, AutoModelForSequenceClassification

	def detect_hallucinations(df,max_length=256):
	hg_model_hub_name = "ynie/albert-xxlarge-v2-snli_mnli_fever_anli_R1_R2_R3-nli"
	tokenizer = AutoTokenizer.from_pretrained(hg_model_hub_name)
	model = AutoModelForSequenceClassification.from_pretrained(hg_model_hub_name)
	device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
	model = model.to(device)
	device_ids = [i for i in range(4)]
	model = nn.DataParallel(model, device_ids)

	cols = list(df.columns)[1:]
	for i in range(len(cols)):
	# 'per_pos' -> 'per_pos_1'
	if 'per_' in cols[i] or 'con_' in cols[i]:
	cols[i] = cols[i] + '_1'
	df = df[[cols]]
	df['hallucination'] = ''
	df['contradiction'] = ''

	INPUT = "text" #TODO: fix this!

	for i in tqdm(range(len(df)), ascii=True):
	premise = df['info'][i]
	hypotheses = re.split(r"\.\|\?\|\!",df[INPUT][i].replace('<return>', ''))
	l = len(hypotheses)
	for j in range(len(hypotheses)):
	hypothesis = hypotheses[j]
	tokenized_input_seq_pair = tokenizer.encode_plus(premise, hypothesis.format(df['first_name'][i]),
	max_length=max_length,
	return_token_type_ids=True, truncation=True)

	input_ids = torch.Tensor(tokenized_input_seq_pair['input_ids']).long().unsqueeze(0).to(device)
	token_type_ids = torch.Tensor(tokenized_input_seq_pair['token_type_ids']).long().unsqueeze(0).to(device)
	attention_mask = torch.Tensor(tokenized_input_seq_pair['attention_mask']).long().unsqueeze(0).to(device)

	outputs = model(input_ids,
	attention_mask=attention_mask,
	token_type_ids=token_type_ids,
	labels=None)

	predicted_probability = torch.softmax(outputs[0], dim=1)[0].tolist()

	m = max(predicted_probability)
	if (m == predicted_probability[1]) or (m == predicted_probability[2]):
	df['hallucination'][i] = df['hallucination'][i] + hypothesis + '. '
	if (m == predicted_probability[2]):
	df['contradiction'][i] = df['contradiction'][i] + hypothesis + '. '

	return df