Merge pull request #27 from potsawee/openaiprompt
Add SelfCheckGPT-prompt with OpenAI API
potsawee authored Mar 10, 2024
2 parents f678a98 + b84d1eb commit a4f4c43
Showing 2 changed files with 104 additions and 1 deletion.
7 changes: 6 additions & 1 deletion README.md
@@ -106,15 +106,20 @@ print(sent_scores_nli)

### SelfCheckGPT Usage: LLM Prompt

Prompting an LLM (current support = open-source models, e.g., Llama2, Mistral) to assess information consistency in a zero-shot setup. We query the LLM to assess whether the i-th sentence is supported by the sample (used as the context). As with the other methods, a higher score indicates a higher chance that the sentence is a hallucination. An example using Mistral is below:
Prompting an LLM (Llama2, Mistral, or OpenAI's GPT) to assess information consistency in a zero-shot setup. We query the LLM to assess whether the i-th sentence is supported by the sample (used as the context). As with the other methods, a higher score indicates a higher chance that the sentence is a hallucination. An example using Mistral is below:


```python
# Option 1: open-source model
from selfcheckgpt.modeling_selfcheck import SelfCheckLLMPrompt
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
llm_model = "mistralai/Mistral-7B-Instruct-v0.2"
selfcheck_prompt = SelfCheckLLMPrompt(llm_model, device)

# Option 2: API access (currently only client_type="openai" is supported)
# from selfcheckgpt.modeling_selfcheck_apiprompt import SelfCheckAPIPrompt
# selfcheck_prompt = SelfCheckAPIPrompt(client_type="openai", model="gpt-3.5-turbo")
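# (the OpenAI client reads credentials from the environment,
#  so export OPENAI_API_KEY before constructing SelfCheckAPIPrompt)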

sent_scores_prompt = selfcheck_prompt.predict(
    sentences = sentences,                          # list of sentences
    sampled_passages = [sample1, sample2, sample3], # list of sampled passages
)
```
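For reference, `sample1`, `sample2`, and `sample3` above are stochastic re-generations of the same response. A minimal sketch of producing them with the OpenAI client (assuming `OPENAI_API_KEY` is set; the `question` prompt and `sample_passage` helper are hypothetical, not part of the library):

```python
from openai import OpenAI

client = OpenAI()  # reads OPENAI_API_KEY from the environment

def sample_passage(question: str) -> str:
    # one stochastic re-generation of the answer (temperature > 0)
    response = client.chat.completions.create(
        model="gpt-3.5-turbo",
        messages=[{"role": "user", "content": question}],
        temperature=1.0,
    )
    return response.choices[0].message.content

question = "Tell me about ..."  # hypothetical query
sample1, sample2, sample3 = (sample_passage(question) for _ in range(3))
```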
98 changes: 98 additions & 0 deletions selfcheckgpt/modeling_selfcheck_apiprompt.py
@@ -0,0 +1,98 @@
from openai import OpenAI
from tqdm import tqdm
from typing import Dict, List, Set, Tuple, Union
import numpy as np

class SelfCheckAPIPrompt:
    """
    SelfCheckGPT (LLM Prompt): Checking the LLM's text against its own sampled texts via API-based prompting (e.g., OpenAI's GPT)
    """
    def __init__(
        self,
        client_type: str = "openai",
        model: str = "gpt-3.5-turbo",
    ):
        assert client_type in ["openai"]
        if client_type == "openai":
            # the OpenAI client picks up default credentials from the environment:
            # os.environ.get("OPENAI_ORGANIZATION")
            # os.environ.get("OPENAI_API_KEY")
            self.client = OpenAI()
            print("Initialized OpenAI client... model = {}".format(model))

        self.client_type = client_type
        self.model = model
        self.prompt_template = "Context: {context}\n\nSentence: {sentence}\n\nIs the sentence supported by the context above? Answer Yes or No.\n\nAnswer: "
        self.text_mapping = {'yes': 0.0, 'no': 1.0, 'n/a': 0.5}
        self.not_defined_text = set()

    def set_prompt_template(self, prompt_template: str):
        self.prompt_template = prompt_template

    def completion(self, prompt: str):
        if self.client_type == "openai":
            chat_completion = self.client.chat.completions.create(
                model=self.model,
                messages=[
                    # {"role": "system", "content": "You are a helpful assistant."},
                    {"role": "user", "content": prompt}
                ],
                temperature=0.0,  # 0.0 = deterministic decoding
                max_tokens=5,     # only a short Yes/No answer is needed
            )
            return chat_completion.choices[0].message.content
        else:
            raise ValueError("client_type not implemented")

    def predict(
        self,
        sentences: List[str],
        sampled_passages: List[str],
        verbose: bool = False,
    ):
        """
        This function takes sentences (to be evaluated) with sampled passages (evidence), and returns sentence-level scores
        :param sentences: list[str] -- sentences to be evaluated, e.g. GPT text response split by spacy
        :param sampled_passages: list[str] -- stochastically generated responses (without sentence splitting)
        :param verbose: bool -- if True, a tqdm progress bar will be shown
        :return sent_scores: sentence-level scores
        """
        num_sentences = len(sentences)
        num_samples = len(sampled_passages)
        scores = np.zeros((num_sentences, num_samples))
        disable = not verbose
        for sent_i in tqdm(range(num_sentences), disable=disable):
            sentence = sentences[sent_i]
            for sample_i, sample in enumerate(sampled_passages):
                # this seems to improve performance when using the simple prompt template
                sample = sample.replace("\n", " ")
                prompt = self.prompt_template.format(context=sample, sentence=sentence)
                generate_text = self.completion(prompt)
                score_ = self.text_postprocessing(generate_text)
                scores[sent_i, sample_i] = score_
        # average over the samples: each sentence-level score lies in [0, 1]
        scores_per_sentence = scores.mean(axis=-1)
        return scores_per_sentence

    def text_postprocessing(
        self,
        text,
    ):
        """
        Maps the generated text to a score:
        Yes -> 0.0
        No -> 1.0
        everything else -> 0.5
        """
        text = text.lower().strip()
        if text[:3] == 'yes':
            text = 'yes'
        elif text[:2] == 'no':
            text = 'no'
        else:
            if text not in self.not_defined_text:
                print(f"warning: {text} not defined")
                self.not_defined_text.add(text)
            text = 'n/a'
        return self.text_mapping[text]
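
For illustration, a minimal sketch of how the new class might be exercised end to end; the sentences and sampled passages below are toy placeholders, and the snippet assumes `OPENAI_API_KEY` is set in the environment:

```python
from selfcheckgpt.modeling_selfcheck_apiprompt import SelfCheckAPIPrompt

selfcheck = SelfCheckAPIPrompt(client_type="openai", model="gpt-3.5-turbo")

# toy inputs: sentences to verify, plus stochastic re-generations of the response
sentences = [
    "Alma Thomas was an American painter.",  # likely supported by the samples
    "She was born in 1991.",                 # likely contradicted by the samples
]
samples = [
    "Alma Thomas (1891-1978) was an African-American abstract painter.",
    "Alma Thomas was an American artist known for her colorful abstractions.",
]

scores = selfcheck.predict(sentences=sentences, sampled_passages=samples, verbose=True)
print(scores)  # one score per sentence in [0, 1]; higher = more likely hallucinated
```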
