feat: add llama hugging face apis #7

Merged: 13 commits, Jul 20, 2023
27 changes: 27 additions & 0 deletions .github/workflows/tests.yml
@@ -0,0 +1,27 @@
name: Tests

on:
  push:
    branches: [main]
  pull_request:
    branches: [main]

jobs:
  build:
    runs-on: ubuntu-latest

    steps:
      - uses: actions/checkout@v3
      - name: Set up Python 3.11
        uses: actions/setup-python@v4
        with:
          python-version: "3.11"
          cache: "pip"
      - name: Install dependencies
        run: |
          python -m pip install --upgrade pip
Contributor commented: Thanks for that!

          pip install pytest
          if [ -f requirements.txt ]; then pip install -r requirements.txt; fi
      - name: Test with pytest
        run: |
          python -m pytest tests/
9 changes: 5 additions & 4 deletions .gitignore
@@ -1,6 +1,7 @@
Genoss/*
.DS_Store
.gitignore
**.pyc
genoss/model/ggml-gpt4all-j-v1.3-groovy.bin
llm/ggml-gpt4all-j-v1.3-groovy.bin

local_models/*

.env

11 changes: 6 additions & 5 deletions .vscode/settings.json
@@ -1,6 +1,7 @@
{
"[python]": {
"editor.defaultFormatter": "ms-python.black-formatter"
},
"python.formatting.provider": "none"
}
"[python]": {
"editor.defaultFormatter": "ms-python.black-formatter"
},
"python.formatting.provider": "black",
"python.linting.enabled": true
}
2 changes: 1 addition & 1 deletion README.md
@@ -72,7 +72,7 @@ cd ../../gpt4all-bindings/python
pip3 install -e .
```

7. Download it to your local machine from [here](https://gpt4all.io/models/ggml-gpt4all-j-v1.3-groovy.bin) and put it in the `genoss/model` directory as `genoss/model/ggml-gpt4all-j-v1.3-groovy.bin`
7. Download it to your local machine from [here](https://gpt4all.io/models/ggml-gpt4all-j-v1.3-groovy.bin) and put it in the `local_models` directory as `local_models/ggml-gpt4all-j-v1.3-groovy.bin`
MaximeThoonsen (Contributor) commented on Jul 20, 2023: I agree.

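As a convenience, the download step can be scripted. The following is a minimal sketch (assuming a plain Python 3 environment and that the model URL above is still reachable); a curl or wget one-liner would work equally well:

```python
# Sketch: fetch the GPT4All model into local_models/ (path and URL taken from the README step above).
import urllib.request
from pathlib import Path

MODEL_URL = "https://gpt4all.io/models/ggml-gpt4all-j-v1.3-groovy.bin"
TARGET = Path("local_models") / "ggml-gpt4all-j-v1.3-groovy.bin"

TARGET.parent.mkdir(parents=True, exist_ok=True)  # create local_models/ if it does not exist
if not TARGET.exists():
    print(f"Downloading {MODEL_URL} -> {TARGET}")
    urllib.request.urlretrieve(MODEL_URL, TARGET)  # multi-gigabyte file; this can take a while
```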
16 changes: 11 additions & 5 deletions genoss/api/completions_routes.py
@@ -1,10 +1,13 @@
from typing import Dict, List, Optional

from fastapi import APIRouter, Body, HTTPException
from fastapi.params import Depends
from pydantic import BaseModel

from genoss.chat.messages import Message
from genoss.auth.auth_handler import AuthHandler
from genoss.entities.chat.message import Message
from genoss.services.model_factory import ModelFactory
from logger import get_logger
from typing import List, Dict, Optional
from pydantic import BaseModel

logger = get_logger(__name__)

@@ -18,8 +21,10 @@ class RequestBody(BaseModel):


@completions_router.post("/chat/completions", tags=["Chat Completions"])
async def post_chat_completions(body: RequestBody = Body(...)) -> Dict:
    model = ModelFactory.get_model_from_name(body.model)
async def post_chat_completions(
    body: RequestBody = Body(...), api_key=Depends(AuthHandler.check_auth_header)
) -> Dict:
    model = ModelFactory.get_model_from_name(body.model, api_key)

    if model is None:
        raise HTTPException(status_code=404, detail="Model not found")
@@ -28,4 +33,5 @@ async def post_chat_completions(body: RequestBody = Body(...)) -> Dict:
f"Received chat completions request for {model.name} with messages {body.messages[-1].content}"
)

# TODO: Add temperature to request body
return model.generate_answer(body.messages[-1].content)
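To illustrate the new contract end to end, here is a minimal client-side sketch. The base URL, port, model name, and API key are placeholder assumptions, and it presumes the `requests` package is installed; only the payload shape and the Bearer header follow from the route above:

```python
# Sketch: call POST /chat/completions with the Bearer header consumed by AuthHandler.check_auth_header.
# BASE_URL, the model name, and the key are illustrative placeholders.
import requests

BASE_URL = "http://localhost:8000"  # assumed local dev server

payload = {
    "model": "gpt4all-j",  # placeholder; must resolve via ModelFactory.get_model_from_name
    "messages": [{"role": "user", "content": "Hello, who are you?"}],
}
headers = {"Authorization": "Bearer sk-your-key"}

response = requests.post(f"{BASE_URL}/chat/completions", json=payload, headers=headers)
response.raise_for_status()
print(response.json())  # ChatCompletion.to_dict(): id, object, created, model, usage, choices
```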
4 changes: 3 additions & 1 deletion genoss/api/embeddings_routes.py
@@ -1,6 +1,8 @@
from ast import List

from fastapi import APIRouter
from genoss.model.gpt4all_llm import Gpt4AllLLM

from genoss.llm.local.gpt4all import Gpt4AllLLM
from logger import get_logger

logger = get_logger(__name__)
12 changes: 12 additions & 0 deletions genoss/api/misc_routes.py
@@ -0,0 +1,12 @@
from fastapi import APIRouter

from logger import get_logger

logger = get_logger(__name__)

misc_router = APIRouter()


@misc_router.get("/", tags=["Root"])
async def get_root():
return "Genoss API is running!"
20 changes: 20 additions & 0 deletions genoss/auth/auth_handler.py
@@ -0,0 +1,20 @@
from typing import Optional

from fastapi import Header, HTTPException


class AuthHandler:
    @staticmethod
    async def check_auth_header(
        authorization: Optional[str] = Header(None),
    ):
        if authorization is None:
            return None

        components = authorization.split()

        if len(components) != 2 or components[0].lower() != "bearer":
            raise HTTPException(status_code=403, detail="Invalid authorization header")

        api_key = components[1]
        return api_key
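Since the dependency is a plain static coroutine, its parsing rules can be exercised in isolation. A rough sketch (illustrative only, not part of this PR):

```python
# Sketch: check_auth_header returns the key for "Bearer <key>", None when the
# header is missing, and raises a 403 HTTPException for anything else.
import asyncio

from fastapi import HTTPException

from genoss.auth.auth_handler import AuthHandler

assert asyncio.run(AuthHandler.check_auth_header("Bearer sk-test-123")) == "sk-test-123"
assert asyncio.run(AuthHandler.check_auth_header(None)) is None

try:
    asyncio.run(AuthHandler.check_auth_header("malformed-header"))
except HTTPException as exc:
    assert exc.status_code == 403
```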
54 changes: 0 additions & 54 deletions genoss/chat/chat_completion.py

This file was deleted.

57 changes: 57 additions & 0 deletions genoss/entities/chat/chat_completion.py
@@ -0,0 +1,57 @@
import time
import uuid
from typing import Any, Dict

from genoss.entities.chat.message import Message


class ChatCompletion:
    class Choice:
Contributor (author) commented: Enclosing classes make more sense here.

        def __init__(
            self, message: Message, finish_reason: str = "stop", index: int = 0
        ):
            self.message = message
            self.finish_reason = finish_reason
            self.index = index

        def to_dict(self) -> Dict[str, Any]:
            return {
                "message": self.message.to_dict(),
                "finish_reason": self.finish_reason,
                "index": self.index,
            }

    class Usage:
        def __init__(
            self, prompt_tokens: int, completion_tokens: int, total_tokens: int
        ):
            self.prompt_tokens = prompt_tokens
            self.completion_tokens = completion_tokens
            self.total_tokens = total_tokens

        def to_dict(self) -> Dict[str, Any]:
            return {
                "prompt_tokens": self.prompt_tokens,
                "completion_tokens": self.completion_tokens,
                "total_tokens": self.total_tokens,
            }

    def __init__(self, model: str, question: str, answer: str):
        self.id = str(uuid.uuid4())
        self.object = "chat.completion"
        self.created = int(time.time())
        self.model = model
        self.usage = self.Usage(len(question), len(answer), len(question) + len(answer))
        self.choices = [
            self.Choice(Message(role="assistant", content=answer), "stop", 0)
        ]

    def to_dict(self) -> Dict[str, Any]:
        return {
            "id": self.id,
            "object": self.object,
            "created": self.created,
            "model": self.model,
            "usage": self.usage.to_dict(),
            "choices": [choice.to_dict() for choice in self.choices],
        }
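For reference, a sketch of the payload this entity serializes to (the id and created fields vary per call; note that Usage is computed from len(), i.e. character counts rather than real token counts):

```python
# Sketch: the OpenAI-style dict produced by ChatCompletion.to_dict().
from genoss.entities.chat.chat_completion import ChatCompletion

completion = ChatCompletion(model="fake", question="Hi?", answer="Hello from FakeLLM!")
payload = completion.to_dict()

# Roughly:
# {
#     "id": "<uuid4>",
#     "object": "chat.completion",
#     "created": <unix timestamp>,
#     "model": "fake",
#     "usage": {"prompt_tokens": 3, "completion_tokens": 19, "total_tokens": 22},  # len()-based
#     "choices": [
#         {
#             "message": {"role": "assistant", "content": "Hello from FakeLLM!"},
#             "finish_reason": "stop",
#             "index": 0,
#         }
#     ],
# }
assert payload["choices"][0]["message"]["content"] == "Hello from FakeLLM!"
```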
14 changes: 2 additions & 12 deletions genoss/chat/messages.py → genoss/entities/chat/message.py
@@ -1,4 +1,4 @@
from typing import List, Dict, Any
from typing import Any, Dict

from pydantic import BaseModel, Field

@@ -14,14 +14,4 @@ class Message(BaseModel):
    )

    def to_dict(self) -> Dict[str, Any]:
        return {
            "role": self.role,
            "content": self.content
        }


class Messages(BaseModel):
    messages: List[Message]

    def to_dict(self) -> List[Dict[str, Any]]:
        return [message.to_dict() for message in self.messages]
        return {"role": self.role, "content": self.content}
5 changes: 2 additions & 3 deletions genoss/model/base_genoss_llm.py → genoss/llm/base_genoss.py
@@ -1,13 +1,12 @@
from typing import List, Dict
from abc import abstractmethod, abstractproperty
from abc import abstractmethod
from typing import Dict, List

from pydantic import BaseModel


class BaseGenossLLM(BaseModel):
    name: str
    description: str
    model_path: str

    @abstractmethod
    def generate_answer(self, prompt: str) -> Dict:
30 changes: 16 additions & 14 deletions genoss/model/fake_llm.py → genoss/llm/fake_llm.py
@@ -1,35 +1,37 @@
from __future__ import annotations

from typing import Dict

from langchain import PromptTemplate, LLMChain
from langchain.llms import FakeListLLM
from langchain import LLMChain
from langchain.embeddings import FakeEmbeddings
from genoss.model.base_genoss_llm import BaseGenossLLM
from genoss.chat.chat_completion import ChatCompletion
from langchain.llms import FakeListLLM

from genoss.entities.chat.chat_completion import ChatCompletion
from genoss.llm.base_genoss import BaseGenossLLM
from genoss.prompts.prompt_template import prompt_template

FAKE_LLM_NAME = "fake"


class FakeLLM(BaseGenossLLM):
    name: str = FAKE_LLM_NAME
    description: str = "Fake LLM for testing purpose"
    model_path: str = ""

    def generate_answer(self, messages: list) -> Dict:
    def generate_answer(self, question: str) -> Dict:
        print("Generating Answer")
        print(messages)
        last_messages = messages

        llm = FakeListLLM(responses=["Hello from FakeLLM!"])
        prompt_template = "Question from user: {question}?, Answer from bot:"
        llm_chain = LLMChain(
            llm=llm, prompt=PromptTemplate.from_template(prompt_template)
        )
        response_text = llm_chain(last_messages)

        llm_chain = LLMChain(llm=llm, prompt=prompt_template)
        response_text = llm_chain(question)

        print("###################")
Contributor commented: Use the logger instead of these prints.

        print(response_text)

        answer = response_text["text"]
        chat_completion = ChatCompletion(model=self.name, answer=answer, last_messages=last_messages)
        chat_completion = ChatCompletion(
            model=self.name, answer=answer, question=question
        )

        return chat_completion.to_dict()
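A pytest-style sketch of how the refactored FakeLLM could be covered (it assumes FakeLLM is constructible with its defaults and relies only on the canned FakeListLLM response above):

```python
# Sketch: FakeLLM should wrap the canned FakeListLLM response in an OpenAI-style completion dict.
from genoss.llm.fake_llm import FAKE_LLM_NAME, FakeLLM


def test_fake_llm_generate_answer():
    llm = FakeLLM()
    result = llm.generate_answer("What is 2 + 2?")

    assert result["model"] == FAKE_LLM_NAME
    assert result["object"] == "chat.completion"
    assert result["choices"][0]["message"]["content"] == "Hello from FakeLLM!"
```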
