Removed system prompt from vectorq config

kyle65463 · kyle65463 · commit fb772b724607 · 2025-05-05T16:17:05.000-07:00
diff --git a/poetry.lock b/poetry.lock
diff --git a/vectorq/config.py b/vectorq/config.py
@@ -1,5 +1,3 @@
-from typing import Optional
-
 from vectorq.inference_engine.inference_engine import InferenceEngine
 from vectorq.inference_engine.strategies.openai import OpenAIInferenceEngine
 from vectorq.vectorq_core.cache.embedding_engine import OpenAIEmbeddingEngine
@@ -31,11 +29,9 @@ def __init__(
         vector_db: VectorDB = HNSWLibVectorDB(),
         embedding_metadata_storage: EmbeddingMetadataStorage = InMemoryEmbeddingMetadataStorage(),
         eviction_policy: EvictionPolicy = LRUEvictionPolicy(),
-        system_prompt: Optional[str] = None,
     ):
         self.inference_engine = inference_engine
         self.embedding_engine = embedding_engine
         self.vector_db = vector_db
         self.eviction_policy = eviction_policy
         self.embedding_metadata_storage = embedding_metadata_storage
-        self.system_prompt = system_prompt
diff --git a/vectorq/main.py b/vectorq/main.py
@@ -43,14 +43,11 @@ def infer_with_cache_info(
         Infer a response from the cache and return the cache hit status, the response, and the nearest neighbor response.
         Args
             prompt: str - The prompt to create a response for.
-            system_prompt: Optional[str] - The optional system prompt to use for the response. It will override the system prompt in the VectorQConfig if provided.
+            system_prompt: Optional[str] - The optional system prompt to use for the response. It will override the system prompt set in the InferenceEngine if provided.
             inference_engine_kwargs: Any - Additional arguments to pass to the underlying inference engine (e.g., max_tokens, temperature, etc).
         Returns
             Tuple[bool, str, str] - [is_cache_hit, response, nn_response] (the response is the one supposed to be used by the user, the nn_response is for benchmarking purposes)
         """
-        if system_prompt is None:
-            system_prompt = self.vectorq_config.system_prompt
-
         return self.vectorq_policy.process_request(
             prompt=prompt,
             system_prompt=system_prompt,
@@ -67,7 +64,7 @@ def infer(
         Infer a response from the cache and return the response.
         Args
             prompt: str - The prompt to create a response for.
-            system_prompt: Optional[str] - The optional system prompt to use for the response. It will override the system prompt in the VectorQConfig if provided.
+            system_prompt: Optional[str] - The optional system prompt to use for the response. It will override the system prompt set in the InferenceEngine if provided.
             inference_engine_kwargs: Any - Additional arguments to pass to the underlying inference engine (e.g., max_tokens, temperature, etc).
         Returns
             str - The response to be used by the user