botserver/src/basic/compiler/mod.rs

411 lines
14 KiB
Rust
Raw Normal View History

use crate::basic::keywords::set_schedule::execute_set_schedule;
use crate::shared::models::TriggerKind;
use crate::shared::state::AppState;
use diesel::ExpressionMethods;
use diesel::QueryDsl;
use diesel::RunQueryDsl;
use log::warn;
2025-10-18 18:20:02 -03:00
use serde::{Deserialize, Serialize};
use std::collections::HashMap;
use std::collections::HashSet;
2025-10-18 18:20:02 -03:00
use std::error::Error;
use std::fs;
use std::path::Path;
use std::sync::Arc;
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct ParamDeclaration {
pub name: String,
pub param_type: String,
pub example: Option<String>,
pub description: String,
pub required: bool,
}
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct ToolDefinition {
pub name: String,
pub description: String,
pub parameters: Vec<ParamDeclaration>,
pub source_file: String,
}
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct MCPTool {
pub name: String,
pub description: String,
pub input_schema: MCPInputSchema,
}
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct MCPInputSchema {
#[serde(rename = "type")]
pub schema_type: String,
pub properties: HashMap<String, MCPProperty>,
pub required: Vec<String>,
}
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct MCPProperty {
#[serde(rename = "type")]
pub prop_type: String,
pub description: String,
#[serde(skip_serializing_if = "Option::is_none")]
pub example: Option<String>,
}
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct OpenAITool {
#[serde(rename = "type")]
pub tool_type: String,
pub function: OpenAIFunction,
}
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct OpenAIFunction {
pub name: String,
pub description: String,
pub parameters: OpenAIParameters,
}
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct OpenAIParameters {
#[serde(rename = "type")]
pub param_type: String,
pub properties: HashMap<String, OpenAIProperty>,
pub required: Vec<String>,
}
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct OpenAIProperty {
#[serde(rename = "type")]
pub prop_type: String,
pub description: String,
#[serde(skip_serializing_if = "Option::is_none")]
pub example: Option<String>,
}
pub struct BasicCompiler {
state: Arc<AppState>,
bot_id: uuid::Uuid,
previous_schedules: HashSet<String>,
2025-10-18 18:20:02 -03:00
}
impl BasicCompiler {
pub fn new(state: Arc<AppState>, bot_id: uuid::Uuid) -> Self {
Self {
state,
bot_id,
previous_schedules: HashSet::new(),
}
2025-10-18 18:20:02 -03:00
}
pub fn compile_file(
&mut self,
2025-10-18 18:20:02 -03:00
source_path: &str,
output_dir: &str,
) -> Result<CompilationResult, Box<dyn Error + Send + Sync>> {
let source_content = fs::read_to_string(source_path)
.map_err(|e| format!("Failed to read source file: {}", e))?;
let tool_def = self.parse_tool_definition(&source_content, source_path)?;
let file_name = Path::new(source_path)
.file_stem()
.and_then(|s| s.to_str())
.ok_or("Invalid file name")?;
let ast_path = format!("{}/{}.ast", output_dir, file_name);
let ast_content = self.preprocess_basic(&source_content, source_path, self.bot_id)?;
2025-10-18 18:20:02 -03:00
fs::write(&ast_path, &ast_content)
.map_err(|e| format!("Failed to write AST file: {}", e))?;
let (mcp_json, tool_json) = if !tool_def.parameters.is_empty() {
let mcp = self.generate_mcp_tool(&tool_def)?;
let openai = self.generate_openai_tool(&tool_def)?;
let mcp_path = format!("{}/{}.mcp.json", output_dir, file_name);
let tool_path = format!("{}/{}.tool.json", output_dir, file_name);
let mcp_json_str = serde_json::to_string_pretty(&mcp)?;
fs::write(&mcp_path, mcp_json_str)
.map_err(|e| format!("Failed to write MCP JSON: {}", e))?;
let tool_json_str = serde_json::to_string_pretty(&openai)?;
fs::write(&tool_path, tool_json_str)
.map_err(|e| format!("Failed to write tool JSON: {}", e))?;
(Some(mcp), Some(openai))
} else {
(None, None)
};
Ok(CompilationResult {
mcp_tool: mcp_json,
_openai_tool: tool_json,
2025-10-18 18:20:02 -03:00
})
}
pub fn parse_tool_definition(
2025-10-18 18:20:02 -03:00
&self,
source: &str,
source_path: &str,
) -> Result<ToolDefinition, Box<dyn Error + Send + Sync>> {
let mut params = Vec::new();
let mut description = String::new();
let lines: Vec<&str> = source.lines().collect();
let mut i = 0;
while i < lines.len() {
let line = lines[i].trim();
if line.starts_with("PARAM ") {
if let Some(param) = self.parse_param_line(line)? {
params.push(param);
}
}
if line.starts_with("DESCRIPTION ") {
let desc_start = line.find('"').unwrap_or(0);
let desc_end = line.rfind('"').unwrap_or(line.len());
if desc_start < desc_end {
description = line[desc_start + 1..desc_end].to_string();
}
}
i += 1;
}
let tool_name = Path::new(source_path)
.file_stem()
.and_then(|s| s.to_str())
.unwrap_or("unknown")
.to_string();
Ok(ToolDefinition {
name: tool_name,
description,
parameters: params,
source_file: source_path.to_string(),
})
}
fn parse_param_line(
&self,
line: &str,
) -> Result<Option<ParamDeclaration>, Box<dyn Error + Send + Sync>> {
let line = line.trim();
if !line.starts_with("PARAM ") {
return Ok(None);
}
let parts: Vec<&str> = line.split_whitespace().collect();
if parts.len() < 4 {
warn!("Invalid PARAM line: {}", line);
return Ok(None);
}
let name = parts[1].to_string();
let as_index = parts.iter().position(|&p| p == "AS");
let param_type = if let Some(idx) = as_index {
if idx + 1 < parts.len() {
parts[idx + 1].to_lowercase()
} else {
"string".to_string()
}
} else {
"string".to_string()
};
let example = if let Some(like_pos) = line.find("LIKE") {
let rest = &line[like_pos + 4..].trim();
if let Some(start) = rest.find('"') {
if let Some(end) = rest[start + 1..].find('"') {
Some(rest[start + 1..start + 1 + end].to_string())
} else {
None
}
} else {
None
}
} else {
None
};
let description = if let Some(desc_pos) = line.find("DESCRIPTION") {
let rest = &line[desc_pos + 11..].trim();
if let Some(start) = rest.find('"') {
if let Some(end) = rest[start + 1..].rfind('"') {
rest[start + 1..start + 1 + end].to_string()
} else {
"".to_string()
}
} else {
"".to_string()
}
} else {
"".to_string()
};
Ok(Some(ParamDeclaration {
name,
param_type: self.normalize_type(&param_type),
example,
description,
required: true,
2025-10-18 18:20:02 -03:00
}))
}
fn normalize_type(&self, basic_type: &str) -> String {
match basic_type.to_lowercase().as_str() {
"string" | "text" => "string".to_string(),
"integer" | "int" | "number" => "integer".to_string(),
"float" | "double" | "decimal" => "number".to_string(),
"boolean" | "bool" => "boolean".to_string(),
"date" | "datetime" => "string".to_string(),
2025-10-18 18:20:02 -03:00
"array" | "list" => "array".to_string(),
"object" | "map" => "object".to_string(),
_ => "string".to_string(),
2025-10-18 18:20:02 -03:00
}
}
fn generate_mcp_tool(
&self,
tool_def: &ToolDefinition,
) -> Result<MCPTool, Box<dyn Error + Send + Sync>> {
let mut properties = HashMap::new();
let mut required = Vec::new();
for param in &tool_def.parameters {
properties.insert(
param.name.clone(),
MCPProperty {
prop_type: param.param_type.clone(),
description: param.description.clone(),
example: param.example.clone(),
},
);
if param.required {
required.push(param.name.clone());
}
}
Ok(MCPTool {
name: tool_def.name.clone(),
description: tool_def.description.clone(),
input_schema: MCPInputSchema {
schema_type: "object".to_string(),
properties,
required,
},
})
}
fn generate_openai_tool(
&self,
tool_def: &ToolDefinition,
) -> Result<OpenAITool, Box<dyn Error + Send + Sync>> {
let mut properties = HashMap::new();
let mut required = Vec::new();
for param in &tool_def.parameters {
properties.insert(
param.name.clone(),
OpenAIProperty {
prop_type: param.param_type.clone(),
description: param.description.clone(),
example: param.example.clone(),
},
);
if param.required {
required.push(param.name.clone());
}
}
Ok(OpenAITool {
tool_type: "function".to_string(),
function: OpenAIFunction {
name: tool_def.name.clone(),
description: tool_def.description.clone(),
parameters: OpenAIParameters {
param_type: "object".to_string(),
properties,
required,
},
},
})
}
fn preprocess_basic(
&mut self,
source: &str,
source_path: &str,
bot_id: uuid::Uuid,
) -> Result<String, Box<dyn Error + Send + Sync>> {
let bot_uuid = bot_id;
2025-10-18 18:20:02 -03:00
let mut result = String::new();
let mut has_schedule = false;
let script_name = Path::new(source_path)
.file_stem()
.and_then(|s| s.to_str())
.unwrap_or("unknown")
.to_string();
{
let mut conn = self
.state
.conn
.get()
.map_err(|e| format!("Failed to get database connection: {}", e))?;
use crate::shared::models::system_automations::dsl::*;
diesel::delete(
system_automations
.filter(bot_id.eq(bot_uuid))
.filter(kind.eq(TriggerKind::Scheduled as i32))
.filter(param.eq(&script_name)),
)
.execute(&mut conn)
.ok();
}
2025-10-18 18:20:02 -03:00
for line in source.lines() {
let trimmed = line.trim();
if trimmed.is_empty()
|| trimmed.starts_with("'")
|| trimmed.starts_with("//")
|| trimmed.starts_with("REM")
{
2025-10-18 18:20:02 -03:00
continue;
}
let normalized = trimmed
.replace("SET SCHEDULE", "SET_SCHEDULE")
.replace("ADD TOOL", "ADD_TOOL")
.replace("CLEAR TOOLS", "CLEAR_TOOLS")
.replace("LIST TOOLS", "LIST_TOOLS")
.replace("CREATE SITE", "CREATE_SITE")
.replace("FOR EACH", "FOR_EACH")
.replace("EXIT FOR", "EXIT_FOR")
.replace("SET USER", "SET_USER")
.replace("SET CONTEXT", "SET_CONTEXT")
.replace("CLEAR SUGGESTIONS", "CLEAR_SUGGESTIONS")
.replace("ADD SUGGESTION", "ADD_SUGGESTION")
.replace("SET KB", "SET_KB")
.replace("ADD KB", "ADD_KB")
.replace("ADD WEBSITE", "ADD_WEBSITE")
.replace("GET BOT MEMORY", "GET_BOT_MEMORY")
.replace("SET BOT MEMORY", "SET_BOT_MEMORY")
.replace("CREATE DRAFT", "CREATE_DRAFT");
if normalized.starts_with("SET_SCHEDULE") {
has_schedule = true;
let parts: Vec<&str> = normalized.split('"').collect();
if parts.len() >= 3 {
let cron = parts[1];
let mut conn = self
.state
.conn
.get()
.map_err(|e| format!("Failed to get database connection: {}", e))?;
if let Err(e) = execute_set_schedule(&mut conn, cron, &script_name, bot_id) {
log::error!(
"Failed to schedule SET_SCHEDULE during preprocessing: {}",
e
);
}
} else {
log::warn!("Malformed SET_SCHEDULE line ignored: {}", normalized);
}
continue;
}
if normalized.starts_with("PARAM ") || normalized.starts_with("DESCRIPTION ") {
2025-10-18 18:20:02 -03:00
continue;
}
result.push_str(&normalized);
2025-10-18 18:20:02 -03:00
result.push('\n');
}
if self.previous_schedules.contains(&script_name) && !has_schedule {
let mut conn = self
.state
.conn
.get()
.map_err(|e| format!("Failed to get database connection: {}", e))?;
use crate::shared::models::system_automations::dsl::*;
diesel::delete(
system_automations
.filter(bot_id.eq(bot_uuid))
.filter(kind.eq(TriggerKind::Scheduled as i32))
.filter(param.eq(&script_name)),
)
.execute(&mut conn)
.map_err(|e| log::error!("Failed to remove schedule for {}: {}", script_name, e))
.ok();
}
if has_schedule {
self.previous_schedules.insert(script_name);
} else {
self.previous_schedules.remove(&script_name);
}
2025-10-18 18:20:02 -03:00
Ok(result)
}
}
#[derive(Debug)]
pub struct CompilationResult {
pub mcp_tool: Option<MCPTool>,
pub _openai_tool: Option<OpenAITool>,
2025-10-18 18:20:02 -03:00
}