fix(prompt-optimizer): switch to built-in system prompt
- Replace the system prompt of the prompt optimization model with a built-in prompt. - Remove system prompt entries from the database. - Remove the API endpoint for managing system prompt configuration.
This commit is contained in:
@@ -1,4 +1,3 @@
|
||||
import json
|
||||
import re
|
||||
import uuid
|
||||
|
||||
@@ -12,13 +11,11 @@ from app.core.models import RedBearModelConfig
|
||||
from app.core.models.llm import RedBearLLM
|
||||
from app.models import ModelConfig, ModelApiKey, ModelType, PromptOptimizerSessionHistory
|
||||
from app.models.prompt_optimizer_model import (
|
||||
PromptOptimizerModelConfig,
|
||||
PromptOptimizerSession,
|
||||
RoleType
|
||||
)
|
||||
from app.repositories.model_repository import ModelConfigRepository
|
||||
from app.repositories.prompt_optimizer_repository import (
|
||||
PromptOptimizerModelConfigRepository,
|
||||
PromptOptimizerSessionRepository
|
||||
)
|
||||
from app.schemas.prompt_optimizer_schema import OptimizePromptResult
|
||||
@@ -34,32 +31,24 @@ class PromptOptimizerService:
|
||||
self,
|
||||
tenant_id: uuid.UUID,
|
||||
model_id: uuid.UUID
|
||||
) -> tuple[PromptOptimizerModelConfig, ModelConfig]:
|
||||
) -> ModelConfig:
|
||||
"""
|
||||
Retrieve the prompt optimizer model configuration and model configuration.
|
||||
Retrieve the model configuration for a specific tenant.
|
||||
|
||||
This method retrieves the prompt optimizer model configuration associated
|
||||
with the specified model ID and tenant. It also fetches the corresponding
|
||||
model configuration.
|
||||
This method fetches the model configuration associated with the given
|
||||
tenant_id and model_id. If no configuration is found, a BusinessException
|
||||
is raised.
|
||||
|
||||
Args:
|
||||
tenant_id (uuid.UUID): The unique identifier of the tenant.
|
||||
model_id (uuid.UUID): The unique identifier of the prompt optimization model.
|
||||
model_id (uuid.UUID): The unique identifier of the model.
|
||||
|
||||
Returns:
|
||||
tuple[PromptOptimzerModelConfig, ModelConfig]:
|
||||
A tuple containing the prompt optimizer model configuration
|
||||
and the corresponding model configuration.
|
||||
ModelConfig: The corresponding model configuration object.
|
||||
|
||||
Raises:
|
||||
BusinessException: If the prompt optimizer model configuration does not exist.
|
||||
BusinessException: If the model configuration does not exist.
|
||||
"""
|
||||
prompt_config = PromptOptimizerModelConfigRepository(self.db).get_by_tenant_id(
|
||||
tenant_id
|
||||
)
|
||||
if not prompt_config:
|
||||
raise BusinessException("提示词模型配置不存在", BizCode.NOT_FOUND)
|
||||
|
||||
model = ModelConfigRepository.get_by_id(
|
||||
self.db, model_id, tenant_id=tenant_id
|
||||
@@ -67,35 +56,7 @@ class PromptOptimizerService:
|
||||
if not model:
|
||||
raise BusinessException("模型配置不存在", BizCode.MODEL_NOT_FOUND)
|
||||
|
||||
return prompt_config, model
|
||||
|
||||
def create_update_model_config(
|
||||
self,
|
||||
tenant_id: uuid.UUID,
|
||||
config_id: uuid.UUID,
|
||||
system_prompt: str,
|
||||
) -> PromptOptimizerModelConfig:
|
||||
"""
|
||||
Create or update a prompt optimizer model configuration.
|
||||
|
||||
This method creates a new prompt optimizer model configuration or updates
|
||||
an existing one identified by the given configuration ID. The configuration
|
||||
defines the system prompt used for prompt optimization.
|
||||
|
||||
Args:
|
||||
tenant_id (uuid.UUID): The unique identifier of the tenant.
|
||||
config_id (uuid.UUID): The unique identifier of the configuration to create or update.
|
||||
system_prompt (str): The system prompt content used for prompt optimization.
|
||||
|
||||
Returns:
|
||||
PromptOptimzerModelConfig: The created or updated prompt optimizer model configuration.
|
||||
"""
|
||||
prompt_config = PromptOptimizerModelConfigRepository(self.db).create_or_update(
|
||||
config_id=config_id,
|
||||
tenant_id=tenant_id,
|
||||
system_prompt=system_prompt,
|
||||
)
|
||||
return prompt_config
|
||||
return model
|
||||
|
||||
def create_session(
|
||||
self,
|
||||
@@ -159,37 +120,46 @@ class PromptOptimizerService:
|
||||
session_id: uuid.UUID,
|
||||
user_id: uuid.UUID,
|
||||
current_prompt: str,
|
||||
message: str
|
||||
user_require: str
|
||||
) -> OptimizePromptResult:
|
||||
"""
|
||||
Optimize a prompt using a prompt optimizer LLM.
|
||||
Optimize a user-provided prompt using a configured prompt optimizer LLM.
|
||||
|
||||
This method uses a configured prompt optimizer model to refine an existing
|
||||
prompt based on the user's requirements. The optimized prompt is generated
|
||||
according to predefined system rules, including Jinja2 variable syntax and
|
||||
a strict JSON output format.
|
||||
This method refines the original prompt according to the user's requirements,
|
||||
generating an optimized version that is directly usable by AI tools. The
|
||||
optimization process follows strict rules, including:
|
||||
- Wrapping user-inserted variables in double curly braces {{}}.
|
||||
- Adhering to Jinja2 variable syntax if applicable.
|
||||
- Ensuring a clear logic flow, explicit instructions, and strong executability.
|
||||
- Producing output in a strict JSON format.
|
||||
|
||||
Steps performed:
|
||||
1. Retrieve the model configuration for the given tenant and model.
|
||||
2. Fetch the session message history for context.
|
||||
3. Instantiate the LLM with the appropriate API key and model configuration.
|
||||
4. Build system messages outlining optimization rules.
|
||||
5. Format the user's original prompt and requirements as a user message.
|
||||
6. Send messages to the LLM to generate the optimized prompt.
|
||||
7. Generate a concise description summarizing the changes made during optimization.
|
||||
|
||||
Args:
|
||||
tenant_id (uuid.UUID): The unique identifier of the tenant.
|
||||
model_id (uuid.UUID): The unique identifier of the prompt optimizer model.
|
||||
session_id (uuid.UUID): The unique identifier of the prompt optimization session.
|
||||
user_id (uuid.UUID): The unique identifier of the user associated with the session.
|
||||
current_prompt (str): The original prompt to be optimized.
|
||||
message (str): The user's requirements or modification instructions.
|
||||
tenant_id (uuid.UUID): Tenant identifier.
|
||||
model_id (uuid.UUID): Prompt optimizer model identifier.
|
||||
session_id (uuid.UUID): Prompt optimization session identifier.
|
||||
user_id (uuid.UUID): Identifier of the user associated with the session.
|
||||
current_prompt (str): Original prompt to optimize.
|
||||
user_require (str): User's requirements or instructions for optimization.
|
||||
|
||||
Returns:
|
||||
dict: A dictionary containing the optimized prompt and the description
|
||||
of changes, in the following format:
|
||||
{
|
||||
"prompt": "<optimized_prompt>",
|
||||
"desc": "<change_description>"
|
||||
}
|
||||
OptimizePromptResult: An object containing:
|
||||
- prompt: The optimized prompt string.
|
||||
- desc: A short description summarizing the changes.
|
||||
|
||||
Raises:
|
||||
BusinessException: If the model response cannot be parsed as valid JSON
|
||||
BusinessException: If the LLM response cannot be parsed as valid JSON
|
||||
or does not conform to the expected output format.
|
||||
"""
|
||||
prompt_config, model_config = self.get_model_config(tenant_id, model_id)
|
||||
model_config = self.get_model_config(tenant_id, model_id)
|
||||
session_history = self.get_session_message_history(session_id=session_id, user_id=user_id)
|
||||
|
||||
# Create LLM instance
|
||||
@@ -204,36 +174,65 @@ class PromptOptimizerService:
|
||||
# build message
|
||||
messages = [
|
||||
# init system_prompt
|
||||
(RoleType.SYSTEM.value, prompt_config.system_prompt),
|
||||
(
|
||||
RoleType.SYSTEM.value,
|
||||
"Your task is to optimize the original prompt provided by the user so that it can be directly used by AI tools,"
|
||||
"and the variables that the user needs to insert must be wrapped in {{}}. "
|
||||
"The optimized prompt should align with the optimization direction specified by the user (if any) and ensure clear logic, explicit instructions, and strong executability. "
|
||||
"Please follow these rules when optimizing: "
|
||||
'1. Ensure variables are wrapped in {{}}, e.g., optimize "Please enter your question" to "Please enter your {{question}}"'
|
||||
"2. Instructions must be specific and operable, avoiding vague expressions"
|
||||
"3. If the original prompt lacks key elements (such as output format requirements), supplement them completely "
|
||||
"4. Keep the language concise and avoid redundancy "
|
||||
"5. If the user does not specify an optimization direction, the default optimization is to make the prompt structurally clear and with explicit instructions"
|
||||
"Please directly output the optimized prompt without additional explanations. The optimized prompt should be directly usable with correct variable positions."
|
||||
),
|
||||
|
||||
# base model limit
|
||||
(RoleType.SYSTEM.value,
|
||||
"Optimization Rules:\n"
|
||||
"1. Fully adjust the prompt content according to the user's requirements.\n"
|
||||
"2. When the user requests the insertion of variables, you must use Jinja2 syntax {{variable_name}} "
|
||||
"(the variable name should be determined based on the user's requirement).\n"
|
||||
"When variables are required, use double curly braces {{variable_name}} as placeholders."
|
||||
"Variable names must be derived from the user's requirements.\n"
|
||||
"3. Keep the prompt logic clear and instructions explicit.\n"
|
||||
"4. Ensure that the modified prompt can be directly used.\n\n"
|
||||
"Output Requirements:\n"
|
||||
"Provide the result in JSON format, containing exactly two fields:\n"
|
||||
" - prompt: The modified prompt (string).\n"
|
||||
" - desc: A response addressing the user's optimization request (string).")
|
||||
"4. Ensure that the modified prompt can be directly used.\n\n")
|
||||
]
|
||||
messages.extend(session_history[:-1]) # last message is current message
|
||||
user_message_template = ChatPromptTemplate.from_messages([
|
||||
(RoleType.USER.value, "[current_prompt]\n{current_prompt}\n[user_require]\n{message}")
|
||||
(RoleType.USER.value, "[original_prompt]\n{current_prompt}\n[user_require]\n{user_require}")
|
||||
])
|
||||
formatted_user_message = user_message_template.format(current_prompt=current_prompt, message=message)
|
||||
formatted_user_message = user_message_template.format(current_prompt=current_prompt, user_require=user_require)
|
||||
messages.extend([(RoleType.USER.value, formatted_user_message)])
|
||||
logger.info(f"Prompt optimization message: {messages}")
|
||||
result = await llm.ainvoke(messages)
|
||||
try:
|
||||
data_dict = json.loads(result.content)
|
||||
model_resp = OptimizePromptResult.model_validate(data_dict)
|
||||
except Exception as e:
|
||||
logger.error(f"Failed to parse model reponse to json - Error: {str(e)}", exc_info=True)
|
||||
raise BusinessException("Failed to parse model response", BizCode.PARSER_NOT_SUPPORTED)
|
||||
return model_resp
|
||||
optim_prompt = await llm.ainvoke(messages)
|
||||
optim_desc = [
|
||||
(
|
||||
RoleType.SYSTEM.value,
|
||||
"You are a prompt optimization assistant.\n"
|
||||
"Compare the original prompt, the user's requirements, "
|
||||
"and the optimized prompt.\n"
|
||||
"Summarize the changes made during optimization.\n\n"
|
||||
"Rules:\n"
|
||||
"1. Output must be a single short sentence.\n"
|
||||
"2. Be concise and factual.\n"
|
||||
"3. Do not explain the prompts themselves.\n"
|
||||
"4. Do not include any extra text."
|
||||
),
|
||||
(
|
||||
"[Original Prompt]\n"
|
||||
f"{current_prompt}\n\n"
|
||||
"[User Requirements]\n"
|
||||
f"{user_require}\n\n"
|
||||
"[Optimized Prompt]\n"
|
||||
f"{optim_prompt.content}"
|
||||
)
|
||||
]
|
||||
optim_desc = await llm.ainvoke(optim_desc)
|
||||
|
||||
return OptimizePromptResult(
|
||||
prompt=optim_prompt.content,
|
||||
desc=optim_desc.content
|
||||
)
|
||||
|
||||
@staticmethod
|
||||
def parser_prompt_variables(prompt: str):
|
||||
@@ -277,4 +276,3 @@ class PromptOptimizerService:
|
||||
content=content
|
||||
)
|
||||
return message
|
||||
|
||||
|
||||
Reference in New Issue
Block a user