# Hasan Iqbal
# Added LLM Evaluation on Datasets
# eca534f unverified
# raw
# history blame
# 1.35 kB
from openfactcheck.core.state import FactCheckerState
from openfactcheck.core.solver import StandardTaskSolver, Solver
from .factool_utils.chat_api import OpenAIChat
from .factool_utils.prompt import CLAIM_EXTRACTION_PROMPT
@Solver.register("factool_claimprocessor", "response", "claims")
class FactoolClaimProcessor(StandardTaskSolver):
    """Solver that extracts claims from a response with the FacTool prompt.

    The value stored in the state under ``self.input_name`` is sent to the
    chat model together with ``CLAIM_EXTRACTION_PROMPT``; the ``"claim"``
    field of every extracted item is collected into a list that is written
    back to the state under ``self.output_name``.

    NOTE(review): ``input_name`` / ``output_name`` are presumably derived by
    the base class from the ``"response"`` / ``"claims"`` arguments of the
    ``Solver.register`` decorator -- confirm against ``StandardTaskSolver``.
    """

    def __init__(self, args):
        """Set up the chat client and the claim-extraction prompt.

        Args:
            args: Solver arguments, forwarded unchanged to the base class.
        """
        super().__init__(args)
        # The model name is configurable via the global config and falls
        # back to "gpt-3.5-turbo" when the key is absent.
        self.gpt_model = self.global_config.get("factool_gpt_model", "gpt-3.5-turbo")
        self.gpt = OpenAIChat(self.gpt_model)
        self.claim_prompt = CLAIM_EXTRACTION_PROMPT

    def __call__(self, state: FactCheckerState, *args, **kwargs):
        """Extract claims from the response held in ``state``.

        Args:
            state: Pipeline state; read at ``self.input_name`` and written
                at ``self.output_name``.
            *args: Unused.
            **kwargs: Unused.

        Returns:
            A ``(True, state)`` tuple, where ``state`` now holds the list of
            extracted claim texts (possibly empty).
        """
        response = state.get(self.input_name)
        results = self._claim_extraction(responses=[response])

        # Guard against a missing or malformed extraction result instead of
        # crashing on indexing/iteration. Presumably the chat wrapper can
        # hand back a non-list (e.g. None) when the model output cannot be
        # parsed -- TODO confirm against OpenAIChat.run.
        claims = results[0] if results else None
        if not isinstance(claims, list):
            import logging

            logging.getLogger(__name__).warning(
                "Claim extraction returned no usable result; storing an empty claim list."
            )
            claims = []

        # Keep only well-formed entries so that a single malformed item does
        # not raise KeyError/TypeError and discard the remaining claims.
        extracted_claims = [
            claim["claim"]
            for claim in claims
            if isinstance(claim, dict) and "claim" in claim
        ]

        state.set(self.output_name, extracted_claims)
        return True, state

    def _claim_extraction(self, responses):
        """Run the claim-extraction prompt over each response.

        Args:
            responses: Iterable of response values; each one is substituted
                into the ``{input}`` placeholder of the user prompt.

        Returns:
            Whatever ``self.gpt.run`` returns for the batch of conversations.
            ``__call__`` reads element ``0`` of it, i.e. it is expected to be
            indexable per input response.
        """
        messages_list = [
            [
                {"role": "system", "content": self.claim_prompt["system"]},
                {
                    "role": "user",
                    "content": self.claim_prompt["user"].format(input=response),
                },
            ]
            for response in responses
        ]
        # The builtin ``list`` is passed as the second argument -- presumably
        # the type each parsed reply is expected to have; verify against
        # OpenAIChat.run.
        return self.gpt.run(messages_list, list)