MenxLi
diff --git a/‎irbm/__init__.py‎
Lines changed: 15 additions & 0 deletions b/‎irbm/__init__.py‎
Lines changed: 15 additions & 0 deletions
diff --git a/‎irbm/cmd/__init__.py‎ b/‎irbm/cmd/__init__.py‎
diff --git a/‎irbm/cmd/summarize.py‎
Lines changed: 38 additions & 0 deletions b/‎irbm/cmd/summarize.py‎
Lines changed: 38 additions & 0 deletions
diff --git a/‎irbm/globalConfig.py‎
Lines changed: 10 additions & 0 deletions b/‎irbm/globalConfig.py‎
Lines changed: 10 additions & 0 deletions
diff --git a/‎irbm/lmInterface.py‎
Lines changed: 241 additions & 0 deletions b/‎irbm/lmInterface.py‎
Lines changed: 241 additions & 0 deletions
@@ -0,0 +1,15 @@
+"""
+Intelligent resbibman,
+AI tools & GPU acceleration
+"""
+
+
+from resbibman.initLogger import setupLogger
+
+def initLogger(level = "info"):
+    """
+    Set up the "iRBM" logger through resbibman's ``setupLogger``.
+
+    Returns whatever ``setupLogger`` returns.
+
+    NOTE(review): ``level`` is accepted but never forwarded to ``setupLogger``,
+    so it currently has no effect -- confirm whether it should be passed on.
+    """
+    return setupLogger(
+        "iRBM",
+        term_id="iserver",
+    )
+
+# The logger is configured as a side effect of importing this package.
+initLogger()
@@ -0,0 +1,38 @@
+import asyncio
+import argparse
+from resbibman.core.pdfTools import PDFAnalyser
+from ..lmTools import summarize, structuredSummerize, featurize
+from ..lmInterface import streamOutput
+
+def main():
+    """
+    Command line entry point: summarize the text extracted from a PDF file.
+
+    The extracted text is optionally truncated to ``--max-length``
+    whitespace-separated words (``-1`` keeps everything). With ``--structured``
+    the structured summary is generated with the requested model and then
+    featurized; otherwise the plain summary stream is consumed.
+
+    NOTE(review): in the non-structured branch ``--model`` is not forwarded and
+    ``streamOutput`` is called with its default callback, which does not print
+    anything -- confirm this is intended.
+    """
+    cli = argparse.ArgumentParser()
+    cli.add_argument('pdf_path', type=str, help='path to pdf file')
+    cli.add_argument('--structured', action='store_true', help='structured summarization')
+    cli.add_argument('--model', type=str, default="gpt-3.5-turbo", help='model name')
+    cli.add_argument("--max-length", type=int, default=-1, help="max length of the input text, the rest will be truncated")
+    args = cli.parse_args()
+
+    with PDFAnalyser(args.pdf_path) as doc:
+        pdf_text = doc.getText()
+
+    # Split once; -1 means "no limit", i.e. the limit equals the word count.
+    words = pdf_text.split()
+    word_limit = len(words) if args.max_length == -1 else args.max_length
+    if len(words) > word_limit:
+        txt = " ".join(words[:word_limit])
+    else:
+        txt = pdf_text
+
+    if not args.structured:
+        streamOutput(summarize(txt))
+        return
+
+    res = asyncio.run(structuredSummerize(txt, print_func=print, model=args.model))
+    vec = asyncio.run(featurize(res))
+    print("Get vectorized result: ", vec.shape)
+
+        
+
+# Run the command line interface only when this module is executed as a script.
+if __name__ == "__main__":
+    main()
@@ -0,0 +1,10 @@
+"""
+Usage: 
+from irbm import globalConfig as config
+...
+"""
+import openai
+from typing import Optional
+
+# Base URL of the OpenAI API, captured from the openai module when this module is imported.
+openai_api_base: str = openai.api_base
+# Base URL of a locally served, OpenAI-compatible endpoint (used for the vicuna models).
+fastchat_api_base: str = "http://localhost:8000/v1"
@@ -0,0 +1,241 @@
+
+"""Language Model Interface"""
+from __future__ import annotations
+
+from abc import ABC, abstractmethod
+from collections.abc import Iterator
+from typing import Any, TypedDict, Literal, Type
+import dataclasses, json
+import enum
+
+# check python version
+import sys, os
+if sys.version_info < (3, 9):
+    from typing import Iterator
+else:
+    from collections.abc import Iterator
+
+import openai
+from . import globalConfig as config
+import basaran.model
+
+
+# Speaker of a single conversation turn.
+ConvRole = Literal["user", "assistant"]
+# Text content of a single conversation turn.
+ConvContent = str
+# Plain-dict form of a Conversation, as produced by Conversation.toDict
+# and consumed by Conversation.setFromDict.
+ConversationDictT = TypedDict("ConversationDictT", {
+    "system": str,
+    "conversations": list[tuple[ConvRole, ConvContent]]
+})
+@dataclasses.dataclass
+class Conversation:
+    """
+    A system prompt together with the ordered (role, content) turns of a chat.
+    """
+    system: str
+    conversations: list[tuple[ConvRole, ConvContent]]
+
+    def add(self, role: ConvRole, content: str):
+        """Append one turn to the end of the conversation."""
+        turn = (role, content)
+        self.conversations.append(turn)
+
+    def clear(self):
+        """Drop all turns (the list is replaced, not emptied in place)."""
+        self.conversations = []
+
+    def __str__(self) -> str:
+        """Render the system prompt followed by every turn, one block per turn."""
+        header = "[system]\n> {}\n".format(self.system)
+        body = "\n".join(
+            "[{}]\n> {}".format(turn[0], turn[1]) for turn in self.conversations
+        )
+        return header + body
+
+    def toDict(self) -> ConversationDictT:
+        """Return the dict form; the turn list is shared, not copied."""
+        payload: ConversationDictT = {
+            "system": self.system,
+            "conversations": self.conversations,
+        }
+        return payload
+
+    def setFromDict(self, dict: ConversationDictT):
+        """Overwrite this conversation from its dict form and return ``self``."""
+        self.system, self.conversations = dict["system"], dict["conversations"]
+        return self
+
+    @property
+    def openai_conversations(self):
+        """Messages as a list of ``{"role", "content"}`` dicts, system prompt first."""
+        messages = [{"role": "system", "content": self.system}]
+        messages.extend(
+            {"role": turn[0], "content": turn[1]} for turn in self.conversations
+        )
+        return messages
+
+def streamOutput(output_stream: Iterator[StreamData], print_callback: Any = lambda x, end=" ", flush=True: ...):
+    """
+    Consume a model output stream, echoing completed words as they arrive.
+
+    Each item of ``output_stream`` is expected to carry in ``"text"`` the whole
+    text generated so far (not just the newest piece). After every item, all
+    words except the last (possibly still incomplete) one that have not been
+    echoed yet are sent to ``print_callback``; the remaining words are echoed
+    once the stream is exhausted.
+
+    print_callback: a function that takes a string and print it to stdout, \
+        should have the same interface as print (i.e. print_callback("hello", end=" ", flush=True)).
+        The default callback discards its input.
+
+    Returns the final text, stripped of surrounding whitespace
+    (an empty string for an empty stream).
+    Raises TypeError if ``print_callback`` does not accept ``end`` and ``flush``.
+    """
+    try:
+        # Probe the callback once so an incompatible signature fails before streaming starts.
+        print_callback("", end="", flush=True)
+    except TypeError as e:
+        raise TypeError("print_callback should have the same interface as print, i.e. contains end and flush") from e
+
+    n_printed = 0               # number of words already echoed
+    words: list[str] = []       # words of the most recent cumulative text
+    for outputs in output_stream:
+        words = outputs["text"].strip().split(" ")
+        # the last word may still be growing, hold it back
+        n_complete = len(words) - 1
+        if n_complete > n_printed:
+            print_callback(" ".join(words[n_printed:n_complete]), end=" ", flush=True)
+            n_printed = n_complete
+    print_callback(" ".join(words[n_printed:]), flush=True)
+    return " ".join(words)
+
+
+class ErrorCodes(enum.Enum):
+    """Error codes for the model output stream"""
+    # the only code defined so far; attached to every successfully produced item
+    OK = 0
+
+class StreamData(TypedDict):
+    """a class to represent the data returned by the model output stream"""
+    # generated text carried by this item (newest piece or text so far, depending on the producer)
+    text: str
+    # status of this item
+    error_code: ErrorCodes
+
+class ChatStreamIter(ABC):
+    """
+    Abstract class for language model interface
+
+    Subclasses implement ``call``; calling an instance forwards the prompt to
+    ``call`` together with the class-level ``temperature`` and
+    ``max_response_length`` settings.
+    """
+    # sampling temperature passed to ``call`` by ``__call__``
+    temperature: float = 0.8
+    # response length limit passed to ``call`` (as ``max_len``) by ``__call__``
+    max_response_length: int = 1024
+    # conversation history; expected to be assigned by the subclass
+    conversations: Conversation
+
+    # whether to return the pieces of the output stream or return the concatenated whole output stream
+    return_pieces: bool = False     
+
+    @abstractmethod
+    def call(self, message: str, temperature: float, max_len: int = 1024) -> Iterator[StreamData]:
+        """Send ``message`` to the model and return an iterator over its streamed output."""
+        ...
+    def __call__(self, prompt: str) -> Iterator[StreamData]:
+        """Shortcut for ``call`` using the settings stored on the instance/class."""
+        return self.call(prompt, self.temperature, self.max_response_length)
+
+class OpenAIChatStreamIter(ChatStreamIter):
+    """
+    Connect to OpenAI API interface
+
+    Models whose name contains "vicuna" are routed to ``config.fastchat_api_base``;
+    every other model uses ``config.openai_api_base``.
+    """
+    def __init__(self, model: str = "gpt-3.5-turbo") -> None:
+        """Store the model name and start an empty conversation."""
+        super().__init__()
+        self.model = model
+        self.conversations = Conversation(system="A conversation between a human and an AI assistant.", conversations=[])
+        # must use the same spelling as ``openai_base``, otherwise the check never runs
+        if "vicuna" in model:
+            assert config.fastchat_api_base, "fastchat_api_base is not set"
+    
+    def generateMessages(self, prompt: str):
+        """Record ``prompt`` as a user turn and return the full message list, system prompt first."""
+        self.conversations.add(role = "user", content = prompt)
+        return self.conversations.openai_conversations
+    
+    @property
+    def openai_base(self):
+        """API base URL matching the selected model."""
+        if "vicuna" in self.model:
+            return config.fastchat_api_base
+        else:
+            return config.openai_api_base
+
+    def call(self, prompt: str, temperature: float, max_len: int = 1024) -> Iterator[StreamData]:
+        """
+        Stream the reply to ``prompt``.
+
+        Yields the text generated so far, or only the newest piece when
+        ``return_pieces`` is set. The reply is appended to the conversation
+        history only after the stream has been fully consumed.
+
+        NOTE(review): ``max_len`` is accepted for interface compatibility but is
+        not forwarded to the API request.
+        """
+        # NOTE: this changes a module-level setting of the openai package
+        openai.api_base = self.openai_base      # set the api base according to the model
+
+        res = openai.ChatCompletion.create(
+            model=self.model, messages=self.generateMessages(prompt), temperature=temperature, stream=True
+        )
+        text = ""
+        for chunk in res:
+            # chunks without a "content" field contribute an empty piece
+            piece: str = chunk["choices"][0]["delta"].get("content", "") # type: ignore
+            text += piece
+            data: StreamData = {
+                "text": piece if self.return_pieces else text,
+                "error_code": ErrorCodes.OK
+            }
+            yield data
+        self.conversations.add(role = "assistant", content = text)
+
+class HFChatStreamIter(ChatStreamIter):
+    """
+    Offline models from huggingface
+
+    The conversation history is rendered into a single prompt string using the
+    chat template that matches the model name (see ``getConv``).
+    """
+    def __init__(
+            self, 
+            model: Literal["lmsys/vicuna-7b-v1.5-16k", "meta-llama/Llama-2-7b-chat", "stabilityai/StableBeluga-7B"], 
+            load_in_8bit: bool = True
+            ):
+        """Load ``model`` through basaran and start an empty conversation."""
+        super().__init__()
+        self.model_name = model
+        self.model = basaran.model.load_model(model, load_in_8bit=load_in_8bit)
+        self.conversations = Conversation(system="A conversation between a human and an AI assistant.", conversations=[])
+    
+    def getConv(self):
+        """
+        Render the conversation into the prompt format of the loaded model.
+
+        The first turn must come from the user. Raises NotImplementedError when
+        the model name matches none of the known templates.
+        """
+        system = self.conversations.system.strip()
+        turns = self.conversations.conversations
+
+        if "Llama-2" in self.model_name:
+            # The system block is closed with <</SYS>>, and the prompt ends right
+            # after the last [/INST] so that the model produces the answer.
+            ret = f"[INST]<<SYS>>\n{system}\n<</SYS>>\n"
+            for i, (role, content) in enumerate(turns):
+                if i == 0:
+                    # the first user turn shares the [INST] block with the system prompt
+                    assert role == "user"
+                    ret += f"{content}[/INST]"
+                elif role == "user":
+                    ret += f"[INST]{content}[/INST]"
+                else:
+                    ret += f"{content}</s><s>"
+            return ret
+        
+        elif "vicuna" in self.model_name:
+            # the system prompt is separated from the first turn by a single space
+            ret = f"{system} "
+            for i, (role, content) in enumerate(turns):
+                if i == 0:
+                    assert role == "user"
+                if role == "user":
+                    ret += f"USER: {content} "
+                else:
+                    ret += f"ASSISTANT: {content}</s>"
+            # open the turn of whoever speaks next
+            if turns[-1][0] == "user":
+                ret += "ASSISTANT: "
+            else:
+                ret += "USER: "
+            return ret
+        
+        elif "StableBeluga" in self.model_name:
+            # Prompt layout:
+            #
+            # ### System:
+            # This is a system prompt, please behave and help the user.
+            #
+            # ### User:
+            # Your prompt here
+            #
+            # ### Assistant:
+            # The output of Stable Beluga 7B
+            ret = f"### System:\n{system}\n\n"
+            for i, (role, content) in enumerate(turns):
+                if i == 0:
+                    assert role == "user"
+                if role == "user":
+                    ret += f"### User:\n{content}\n\n"
+                else:
+                    ret += f"### Assistant:\n{content}\n\n"
+            # open the turn of whoever speaks next
+            if turns[-1][0] == "user":
+                ret += "### Assistant:\n"
+            else:
+                ret += "### User:\n"
+            return ret
+        
+        else:
+            raise NotImplementedError("Unknown model: {}".format(self.model_name))
+    
+    def call(self, prompt: str, temperature: float, max_len: int = 1024) -> Iterator[StreamData]:
+        """
+        Stream the reply to ``prompt``.
+
+        Yields the text generated so far, or only the newest piece when
+        ``return_pieces`` is set. The reply is appended to the conversation
+        history only after the stream has been fully consumed.
+        """
+        self.conversations.add(role = "user", content = prompt)
+        text = ""
+        for choice in self.model(prompt=self.getConv(), max_tokens=max_len, temperature=temperature, return_full_text=False):
+            piece = choice["text"]
+            text += piece
+            data: StreamData = {
+                # honour return_pieces, consistent with OpenAIChatStreamIter
+                "text": piece if self.return_pieces else text,
+                "error_code": ErrorCodes.OK
+            }
+            yield data
+        self.conversations.add(role = "assistant", content = text)
+
+
+# Model names accepted by getStreamIter: the first row is served through
+# OpenAIChatStreamIter, the second row through HFChatStreamIter.
+ChatStreamIterType = Literal[
+    "gpt-3.5-turbo", "gpt-3.5-turbo-16k", "vicuna-13b", "gpt-4", "gpt-4-32k", "vicuna-33b-v1.3-gptq-4bit", 
+    "lmsys/vicuna-7b-v1.5-16k", "meta-llama/Llama-2-7b-chat", "stabilityai/StableBeluga-7B"
+    ]
+def getStreamIter(itype: ChatStreamIterType = "gpt-3.5-turbo") -> ChatStreamIter:
+    """
+    Create the chat interface for the model named ``itype``.
+
+    Names served through the OpenAI-style API yield an OpenAIChatStreamIter;
+    any other name is handed to HFChatStreamIter.
+
+    Raises ValueError if the HFChatStreamIter cannot be created; the original
+    error is attached as the cause.
+    """
+    openai_style_models = (
+        "gpt-3.5-turbo", "gpt-3.5-turbo-16k", "vicuna-13b", "gpt-4", "gpt-4-32k", "vicuna-33b-v1.3-gptq-4bit",
+    )
+    if itype in openai_style_models:
+        return OpenAIChatStreamIter(model=itype)
+
+    try:
+        return HFChatStreamIter(model=itype)    # type: ignore
+    except Exception as e:
+        # Exception (not a bare except) lets KeyboardInterrupt / SystemExit through;
+        # chaining keeps the real reason of the failure visible.
+        raise ValueError("Unknown interface type: {}".format(itype)) from e