update vllm initialization and fix inspect history

tjtanaa · noobHappylife · commit ca4efef8aa3b · 2024-04-16T11:15:23.000+08:00
diff --git a/dsp/modules/hf_client.py b/dsp/modules/hf_client.py
@@ -3,6 +3,7 @@
 import re
 import shutil
 import subprocess
+from typing import Literal
 
 # from dsp.modules.adapter import TurboAdapter, DavinciAdapter, LlamaAdapter
 import backoff
@@ -114,7 +115,7 @@ def send_hftgi_request_v00(arg, **kwargs):
 
 
 class HFClientVLLM(HFModel):
-    def __init__(self, model, port, url="http://localhost", **kwargs):
+    def __init__(self, model, port, model_type: Literal['chat', 'text'] = 'text', url="http://localhost", **kwargs):
         super().__init__(model=model, is_client=True)
 
         if isinstance(url, list):
@@ -126,27 +127,24 @@ def __init__(self, model, port, url="http://localhost", **kwargs):
         else:
             raise ValueError(f"The url provided to `HFClientVLLM` is neither a string nor a list of strings. It is of type {type(url)}.")
         
+        self.model_type = model_type
         self.headers = {"Content-Type": "application/json"}
         self.kwargs |= kwargs
         # kwargs needs to have model, port and url for the lm.copy() to work properly
         self.kwargs.update({
-            'model': model,
             'port': port,
-            'url': url
+            'url': url,
         })
 
 
     def _generate(self, prompt, **kwargs):
         kwargs = {**self.kwargs, **kwargs}
         
-        # get model_type
-        model_type = kwargs.get("model_type",None)
-
         # Round robin the urls.
         url = self.urls.pop(0)
         self.urls.append(url)
         
-        if model_type == "chat":
+        if self.model_type == "chat":
             system_prompt = kwargs.get("system_prompt",None)
             messages = [{"role": "user", "content": prompt}]
             if system_prompt:
diff --git a/dsp/modules/lm.py b/dsp/modules/lm.py
@@ -63,11 +63,11 @@ def inspect_history(self, n: int = 1, skip: int = 0):
             if len(printed) >= n:
                 break
 
-        for idx, (prompt, choices) in enumerate(printed):
+        printing_value = ""
+        for idx, (prompt, choices) in enumerate(reversed(printed)):
             # skip the first `skip` prompts
-            if (n - idx - 1) > skip:
+            if (n - idx - 1) < skip:
                 continue
-            printing_value = ""
             printing_value += "\n\n\n"
             printing_value += prompt