Adding chat capability for local transformers models #67

Merged
merged 1 commit on Apr 29, 2024
2 changes: 1 addition & 1 deletion alfred/client/client.py
@@ -427,7 +427,7 @@ def chat(self, log_save_path: Optional[str] = None, **kwargs: Any):
        :param log_save_path: The file to save the chat logs.
        :type log_save_path: Optional[str]
        """
-        if self.model_type in ["openai", "anthropic", "google"]:
+        if self.model_type in ["openai", "anthropic", "google", "huggingface"]:
            self.model.chat(log_save_path=log_save_path, **kwargs)
        else:
            logger.error(
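This one-line change routes `Client.chat` to the local HuggingFace model's new chat loop. A minimal usage sketch, assuming a typical alfred `Client` constructor (the model name and keyword arguments here are illustrative assumptions, not taken from this diff):

```python
# Hypothetical usage sketch; the Client constructor arguments are assumptions.
from alfred.client import Client

# A local transformers model; model_type "huggingface" now supports .chat().
client = Client(model_type="huggingface", model="meta-llama/Llama-2-7b-chat-hf")

# Dispatches to the HuggingFace model's chat() and saves the transcript as JSON.
client.chat(log_save_path="chat_log.json")
```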
1 change: 1 addition & 0 deletions alfred/client/ssh/utils.py
@@ -1,6 +1,7 @@
"""
Modified with ideas originated from https://github.com/paramiko/paramiko/blob/main/demos/forward.py
"""

import select
import socket
import threading
3 changes: 2 additions & 1 deletion alfred/data/wrench.py
@@ -1,8 +1,9 @@
"""

-Wrench Dataset Class is a dataset wrapper for Wrench, a weak supervision benchmark testbed. 
+Wrench Dataset Class is a dataset wrapper for Wrench, a weak supervision benchmark testbed.

"""

import json
import logging
import os
15 changes: 10 additions & 5 deletions alfred/fm/anthropic.py
@@ -15,7 +15,7 @@
"claude-2",
"claude-2.0",
"claude-3-opus-20240229",
"claude-3-sonnet-20240229"
"claude-3-sonnet-20240229",
)

try:
@@ -103,7 +103,9 @@ def _anthropic_query(
        return response.content[0].text

    def __init__(
-        self, model_string: str = "claude-3-opus-20240229", api_key: Optional[str] = None
+        self,
+        model_string: str = "claude-3-opus-20240229",
+        api_key: Optional[str] = None,
    ):
        """
        Initialize the Anthropic API wrapper.
@@ -272,10 +274,13 @@ def _feedback(feedback: str, no_newline=False, override=False):
                if isinstance(resp, MessageStopEvent):
                    break
                if isinstance(resp, ContentBlockStartEvent):
-                    resp=resp.content_block
+                    resp = resp.content_block
                if isinstance(resp, ContentBlockDeltaEvent):
-                    resp=resp.delta
-                if resp.type == "content_block_stop" or resp.type == "message_delta":
+                    resp = resp.delta
+                if (
+                    resp.type == "content_block_stop"
+                    or resp.type == "message_delta"
+                ):
                    break
                if resp.type != "text" and resp.type != "text_delta":
                    logger.warning(f"Unsupported response type {resp.type}")
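For context, the event classes being unwrapped here come from Anthropic's streaming Messages API: `content_block_start` events wrap a content block, while `content_block_delta` events wrap a text delta. A minimal sketch of the same unwrapping pattern, assuming the `anthropic` package and an `ANTHROPIC_API_KEY` in the environment:

```python
# Minimal streaming sketch with the Anthropic Messages API; assumes the
# `anthropic` package is installed and ANTHROPIC_API_KEY is set.
import anthropic

client = anthropic.Anthropic()
stream = client.messages.create(
    model="claude-3-opus-20240229",
    max_tokens=256,
    messages=[{"role": "user", "content": "Hello!"}],
    stream=True,
)

for event in stream:
    # Text lives one level down: on the content block or on the delta.
    if event.type == "content_block_start":
        print(event.content_block.text, end="", flush=True)
    elif event.type == "content_block_delta":
        print(event.delta.text, end="", flush=True)
    elif event.type == "message_stop":
        break
```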
101 changes: 101 additions & 0 deletions alfred/fm/huggingface.py
@@ -15,6 +15,9 @@

from .model import LocalAccessFoundationModel
from .response import CompletionResponse
from .utils import colorize_str, type_print

import json

logger = logging.getLogger(__name__)

@@ -457,3 +460,101 @@ def _encode_batch(self, batch_instance, **kwargs) -> List[torch.Tensor]:
        _hidden_state = self._get_hidden_states(inputs, reduction=reduction)

        return list(_hidden_state)

    def chat(self, **kwargs: Any):
        """
        Launch an interactive chat session
        """

        def _feedback(feedback: str, no_newline=False, override=False):
            if override:
                print("\r", end="")
            print(
                colorize_str("Chat AI: ", "GREEN"),
                end="",
            )
            type_print(feedback)
            print(
                "",
                end="\n" if not no_newline else "",
            )

        model = kwargs.get("model", self.model_string)
        c_title = colorize_str("Alfred's HuggingFace Chat", "BLUE")
        c_model = colorize_str(model, "WARNING")
        c_exit = colorize_str("exit", "FAIL")
        c_ctrlc = colorize_str("Ctrl+C", "FAIL")

        temperature = kwargs.get("temperature", 0.7)
        max_tokens = kwargs.get("max_tokens", 1024)
        log_save_path = kwargs.get("log_save_path", None)
        manual_chat_sequence = kwargs.get("manual_chat_sequence", None)

        print(f"Welcome to the {c_title} session!\nYou are using the {c_model} model.")
        print(f"Type '{c_exit}' or hit {c_ctrlc} to exit the chat session.")

        message_log = [
            # {
            #     "role": "system",
            #     "content": "You are a friendly chatbot.",
            # },
        ]

        print()
        print("======== Chat Begin ========")
        print()

        try:
            while True:
                if manual_chat_sequence is not None:
                    query = manual_chat_sequence.pop(0)
                    _feedback(query, no_newline=True)
                    print()
                    if len(manual_chat_sequence) == 0:
                        break
                else:
                    query = input(colorize_str("You: "))
                    if query == "exit":
                        _feedback("Goodbye!")
                        break

                message_log.append({"role": "user", "content": query})
                print(
                    colorize_str("Chat AI: ", "GREEN"),
                    end="",
                )
                try:
                    tokenized_chat = self.tokenizer.apply_chat_template(
                        message_log,
                        tokenize=True,
                        add_generation_prompt=True,
                        return_tensors="pt",
                    )
                    tokenized_chat = tokenized_chat.to(self.model.device)
                except Exception as e:
                    _feedback(f"Error: {e}")
                    break
                outputs = self.model.generate(
                    tokenized_chat,
                    max_new_tokens=max_tokens,
                    temperature=temperature,
                    do_sample=False if temperature == 0 else True,
                )
                outputs = outputs[0][len(tokenized_chat[0]) :]
                txt = self.tokenizer.decode(outputs, skip_special_tokens=True)
                type_print(txt)
                print()
                response = txt.strip().replace("\n", "")
                message_log.append({"role": "assistant", "content": response})
        except KeyboardInterrupt:
            _feedback("Goodbye!")

        print()
        print("======== Chat End ========")
        print()
        print(colorize_str("Thank you for using Alfred!"))

        if log_save_path:
            with open(log_save_path, "w") as f:
                json.dump(message_log, f)
            print(f"Your chat log is saved to {log_save_path}")
1 change: 1 addition & 0 deletions alfred/fm/query/ranked_query.py
@@ -3,6 +3,7 @@
Ranked Query Class encompasses query tem

"""

from typing import List, Union, Tuple, Callable

import numpy as np
1 change: 1 addition & 0 deletions alfred/fm/remote/protos/query_pb2.py

(Generated protobuf file; diff not rendered.)

1 change: 1 addition & 0 deletions alfred/fm/remote/protos/query_pb2_grpc.py
@@ -1,5 +1,6 @@
# Generated by the gRPC Python protocol compiler plugin. DO NOT EDIT!
"""Client and server classes corresponding to protobuf-defined services."""

import grpc

from . import query_pb2 as query__pb2
2 changes: 1 addition & 1 deletion alfred/fm/response/completion_response.py
@@ -17,7 +17,7 @@ class CompletionResponse(Response):

    def __init__(
        self,
-        prediction: str,
+        prediction: str = None,
        score: Optional[float] = None,
        embedding: Optional[Union[torch.Tensor, np.ndarray]] = None,
    ):
4 changes: 2 additions & 2 deletions alfred/fm/response/ranked_response.py
@@ -14,8 +14,8 @@ class RankedResponse(Response):

    def __init__(
        self,
-        prediction: str,
-        scores: Dict,
+        prediction: str = None,
+        scores: Dict = None,
        logits: Optional[Union[torch.Tensor, np.ndarray]] = None,
        embeddings: Optional[Union[torch.Tensor, np.ndarray]] = None,
    ):
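Making `prediction` and `scores` default to `None` lets these response objects be constructed before any text is available, for example mid-stream or when only embeddings are present. A small sketch of what the relaxed signatures permit, based only on the constructor fields visible in this diff (the import path is an assumption):

```python
# Sketch based only on the constructor signatures visible in this diff;
# the import path is an assumption.
from alfred.fm.response import CompletionResponse, RankedResponse

# Previously `prediction` was required; now a response can be created
# empty and filled in later.
empty = CompletionResponse()

scored = RankedResponse(
    prediction="positive",
    scores={"positive": 0.9, "negative": 0.1},
)
```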
5 changes: 3 additions & 2 deletions alfred/template/string_template.py
@@ -120,7 +120,9 @@ def from_promptsource(self, promptsource_template):
        self._metadata = promptsource_template["metadata"]
        self._answer_choices = promptsource_template["answer_choices"]

-    def apply(self, example: Union[Dict, List[Dict]], **kawrgs) -> Union[Query, List[Query]]:
+    def apply(
+        self, example: Union[Dict, List[Dict]], **kawrgs
+    ) -> Union[Query, List[Query]]:
        """
        Apply template to an example or a list of examples and returns a query object or a list of queries
@@ -138,7 +140,6 @@ def apply(self, example: Union[Dict, List[Dict]], **kawrgs) -> Union[Query, List[Query]]:
        else:
            raise ValueError(f"Unsupported example type: {type(example)}")

-
        if "key_translator" in kawrgs:
            key_translator = kawrgs["key_translator"]
        else:
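As the reformatted signature makes visible, `apply` accepts either a single example dict or a list of them and returns a `Query` or a list of queries. A hedged usage sketch (the import path, template string, and field name are illustrative assumptions, not from this diff):

```python
# Illustrative sketch; the StringTemplate import path, template text,
# and field names are assumptions, not shown in this diff.
from alfred.template import StringTemplate

template = StringTemplate("Review: [text]\nSentiment:")

# A single dict yields a single Query; a list of dicts yields a list.
query = template.apply({"text": "Great movie!"})
queries = template.apply([{"text": "Great movie!"}, {"text": "Terrible plot."}])
```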
12 changes: 6 additions & 6 deletions alfred/voter/voter.py
@@ -154,12 +154,12 @@ def clear_calibration(self):
        self._calibration = None

    def __call__(
-            self,
-            responses: Union[Iterable[str], str, Iterable[Response], Response],
-            matching_function: Optional[Callable] = None,
-            label_map: Optional[Dict] = None,
-            **kwargs: Any,
-    ) -> np.ndarray:
+        self,
+        responses: Union[Iterable[str], str, Iterable[Response], Response],
+        matching_function: Optional[Callable] = None,
+        label_map: Optional[Dict] = None,
+        **kwargs: Any,
+    ) -> np.ndarray:
        """
        Vote for the responses based on the matching function and the label maps
        """
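The voter's `__call__` maps free-form model responses onto label votes, optionally via a matching function and a label map, returning a numpy array. A heavily hedged sketch of how it might be invoked (the `Voter` import path, its constructor arguments, and the label map are all assumptions, not shown in this diff):

```python
# Hypothetical usage; the Voter import path, constructor arguments, and
# label map below are assumptions based only on this file's location.
from alfred.voter import Voter

voter = Voter(label_map={"positive": 1, "negative": 2})

# Accepts a single response or an iterable of responses/strings and
# returns a numpy array of votes.
votes = voter(["positive", "negative", "positive"])
```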