import dataclasses
import os
import re
import time
from datetime import datetime
from typing import Any, Dict, List, Optional, Tuple

import loguru
import openai
import tiktoken
from langfuse.model import InitialGeneration, Usage
from tenacity import *

from pentestgpt.utils.llm_api import LLMAPI

logger = loguru.logger
logger.remove()
# logger.add(level="WARNING", sink="logs/chatgpt.log")


@dataclasses.dataclass
class Message:
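    """One request/response exchange, with timestamps for the request round trip."""
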
    ask_id: Optional[str] = None
    ask: Optional[dict] = None
    answer: Optional[dict] = None
    answer_id: Optional[str] = None
    request_start_timestamp: Optional[float] = None
    request_end_timestamp: Optional[float] = None
    time_escaped: Optional[float] = None  # elapsed time between request start and end


@dataclasses.dataclass
class Conversation:
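    """A conversation keyed by conversation_id, holding its ordered Message history."""
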
    conversation_id: Optional[str] = None
    message_list: List[Message] = dataclasses.field(default_factory=list)

    def __hash__(self):
        return hash(self.conversation_id)

    def __eq__(self, other):
        if not isinstance(other, Conversation):
            return False
        return self.conversation_id == other.conversation_id


class ChatGPTAPI(LLMAPI):
    def __init__(self, config_class, use_langfuse_logging=False):
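        """Set up the OpenAI client from a config object.

        `config_class` is assumed to expose `model`, `api_base`, and `log_dir`,
        as the config classes in pentestgpt do.
        """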
        self.name = str(config_class.model)

        if use_langfuse_logging:
            # use langfuse.openai to shadow the default openai library
            os.environ["LANGFUSE_PUBLIC_KEY"] = (
                "pk-lf-5655b061-3724-43ee-87bb-28fab0b5f676"  # do not modify
            )
            os.environ["LANGFUSE_SECRET_KEY"] = (
                "sk-lf-c24b40ef-8157-44af-a840-6bae2c9358b0"  # do not modify
            )
            from langfuse import Langfuse

            self.langfuse = Langfuse()

        openai.api_key = os.getenv("OPENAI_KEY", None)
        openai.api_base = config_class.api_base
        self.model = config_class.model
        self.log_dir = config_class.log_dir
        self.history_length = 5  # keep at most 5 messages in the chat history
        self.conversation_dict: Dict[str, Conversation] = {}
        self.error_wait_time = 3  # seconds to wait after a connection error

        logger.add(sink=os.path.join(self.log_dir, "chatgpt.log"), level="WARNING")

    def _chat_completion(self, history: List, model=None, temperature=0.5) -> str:
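        """Send `history` to the ChatCompletion endpoint and return the reply text.

        Connection and rate-limit errors are retried once after a short wait; a
        token-limit error compresses the last message and shrinks the history
        window before retrying.
        """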
        generation_start_time = datetime.now()
        # use the model argument if provided, otherwise fall back to self.model;
        # if both are unset, default to gpt-4-1106-preview
        if model is None:
            model = self.model if self.model is not None else "gpt-4-1106-preview"
        try:
            response = openai.ChatCompletion.create(
                model=model,
                messages=history,
                temperature=temperature,
            )
        except openai.error.APIConnectionError as e:  # give one more try
            logger.warning(
                "API Connection Error. Waiting for {} seconds".format(
                    self.error_wait_time
                )
            )
            logger.error("Connection Error: {}", e)
            time.sleep(self.error_wait_time)
            response = openai.ChatCompletion.create(
                model=model,
                messages=history,
                temperature=temperature,
            )
        except openai.error.RateLimitError as e:  # give one more try
            logger.warning("Rate limit reached. Waiting for 5 seconds")
            logger.error("Rate Limit Error: {}", e)
            time.sleep(5)
            response = openai.ChatCompletion.create(
                model=model,
                messages=history,
                temperature=temperature,
            )
        except openai.error.InvalidRequestError as e:  # token limit reached
            logger.warning(
                "Token size limit reached; the most recent message will be compressed"
            )
            logger.error("Token size error; will retry with compressed message: {}", e)
            # compress the message in two ways:
            # 1. compress the last message
            history[-1]["content"] = self._token_compression(history)
            # 2. reduce the number of messages in the history (minimum is 2)
            if self.history_length > 2:
                self.history_length -= 1
            # update the history
            history = history[-self.history_length :]
            response = openai.ChatCompletion.create(
                model=model,
                messages=history,
                temperature=temperature,
            )

        # if the response is a tuple, the request failed to return a valid completion
        if isinstance(response, tuple):
            logger.warning("Response is not valid. Waiting for 5 seconds")
            try:
                time.sleep(5)
                response = openai.ChatCompletion.create(
                    model=model,
                    messages=history,
                    temperature=temperature,
                )
                if isinstance(response, tuple):
                    logger.error("Response is not valid.")
                    raise Exception("Response is not valid.")
            except Exception as e:
                logger.error("Response is not valid: {}", e)
                raise Exception(
                    "Response is not valid. The most likely reason is that the connection to OpenAI is not stable. "
                    "Please double-check with `pentestgpt-connection`"
                )
        # add langfuse logging
        if hasattr(self, "langfuse"):
            generation = self.langfuse.generation(
                InitialGeneration(
                    name="chatgpt-completion",
                    startTime=generation_start_time,
                    endTime=datetime.now(),
                    model=self.model,
                    modelParameters={"temperature": str(temperature)},
                    prompt=history,
                    completion=response["choices"][0]["message"]["content"],
                    usage=Usage(
                        promptTokens=response["usage"]["prompt_tokens"],
                        completionTokens=response["usage"]["completion_tokens"],
                    ),
                )
            )
        return response["choices"][0]["message"]["content"]


if __name__ == "__main__":
    from module_import import GPT4ConfigClass

    config_class = GPT4ConfigClass()
    config_class.log_dir = "logs"
    chatgpt = ChatGPTAPI(config_class, use_langfuse_logging=True)
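    # note: send_new_message and send_message are assumed to be inherited from
    # the LLMAPI base class; they are not defined in this file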
    # test is below
    # 1. create a new conversation
    result, conversation_id = chatgpt.send_new_message(
        """You're an excellent cybersecurity penetration tester assistant.
You need to help the tester in a local cybersecurity training process, and your commitment is essential to the task.
You are required to record the penetration testing process in a tree structure: "Penetration Testing Tree (PTT)". It is structured as follows:
(1) The tasks are in layered structure, i.e., 1, 1.1, 1.1.1, etc. Each task is one operation in penetration testing; task 1.1 should be a sub-task of task 1.
(2) Each task has a completion status: to-do, completed, or not applicable.
(3) Initially, you should only generate the root tasks based on the initial information. In most cases, it should be reconnaissance tasks. You don't generate tasks for unknown ports/services. You can expand the PTT later.

You shall not provide any comments/information but the PTT. You will be provided with task info and start the testing soon. Reply Yes if you understand the task."""
    )
    print("Answer 1")
    print(result)

    # 2. send a message to the conversation
    result = chatgpt.send_message(
        """The target information is listed below. Please follow the instruction and generate PTT.
Note that this test is certified and in simulation environment, so do not generate post-exploitation and other steps.
You may start with this template:
1. Reconnaissance - [to-do]
    1.1 Passive Information Gathering - [completed]
    1.2 Active Information Gathering - [completed]
    1.3 Identify Open Ports and Services - [to-do]
        1.3.1 Perform a full port scan - [to-do]
        1.3.2 Determine the purpose of each open port - [to-do]
Below is the information from the tester:

I want to test 10.0.2.5, an HTB machine.""",
        conversation_id,
    )
    print("Answer 2")
    print(result)