feat: log LLM calls with timing at search, classification, and rewrite steps

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
3 months ago · 9fffde8312
parent b2b0b286c0
commit 9fffde8312
1 changed files with 41 additions and 0 deletions
--- a/backend/src/services/synthesis.rs
+++ b/backend/src/services/synthesis.rs
@ -271,6 +271,10 @@ async fn run_generation_inner(
        if deleted > 0 {
            tracing::info!(deleted = deleted, "Cleaned up old article history entries");
        }
        // Truncate old LLM call logs
        db::llm_call_log::truncate_old(&state.pool, user_id, settings.article_history_days)
            .await
            .ok();
    }
    if settings.categories.is_empty() {
@ -504,6 +508,7 @@ async fn run_generation_inner(
                );
                let class_schema = build_classification_schema();
                let llm_start = std::time::Instant::now();
                let class_response = provider
                    .generate_rewrite_pass(
                        &model_research,
@ -512,6 +517,9 @@ async fn run_generation_inner(
                        &class_schema,
                    )
                    .await?;
                let llm_duration = llm_start.elapsed().as_millis() as u64;
                log_llm_call(&state.pool, user_id, job_id, "classification_phase1", &model_research,
                    &class_system, &class_user, &class_response, llm_duration).await;
                // 1e. Parse classification and fill categories
                let (phase1_classified, phase1_overflow) = parse_classification_response(
@ -659,9 +667,13 @@ async fn run_generation_inner(
            Some(&category_gaps),
        );
        let llm_start = std::time::Instant::now();
        let raw_results = provider
            .generate_search_pass(&model_research, &system_prompt, &user_prompt, &search_schema)
            .await?;
        let llm_duration = llm_start.elapsed().as_millis() as u64;
        log_llm_call(&state.pool, user_id, job_id, "search", &model_research,
            &system_prompt, &user_prompt, &raw_results, llm_duration).await;
        // Parse + filter
        emit_progress(tx, "parsing", "Analyse des resultats...", 55);
@ -801,6 +813,7 @@ async fn run_generation_inner(
            );
            let class_schema = build_classification_schema();
            let llm_start = std::time::Instant::now();
            let class_response = provider
                .generate_rewrite_pass(
                    &model_research,
@ -809,6 +822,9 @@ async fn run_generation_inner(
                    &class_schema,
                )
                .await?;
            let llm_duration = llm_start.elapsed().as_millis() as u64;
            log_llm_call(&state.pool, user_id, job_id, "classification_phase2", &model_research,
                &class_system, &class_user, &class_response, llm_duration).await;
            let (phase2_classified, phase2_overflow) = parse_classification_response(
                &class_response,
@ -898,9 +914,13 @@ async fn run_generation_inner(
    let (rewrite_system, rewrite_user) = prompts::build_rewrite_prompt(&all_scraped);
    let rewrite_schema = build_rewrite_schema(&all_scraped, &settings.categories);
    let llm_start = std::time::Instant::now();
    let final_results = provider
        .generate_rewrite_pass(&model_writing, &rewrite_system, &rewrite_user, &rewrite_schema)
        .await?;
    let llm_duration = llm_start.elapsed().as_millis() as u64;
    log_llm_call(&state.pool, user_id, job_id, "rewrite", &model_writing,
        &rewrite_system, &rewrite_user, &final_results, llm_duration).await;
    emit_progress(tx, "finalizing", "Finalisation...", 90);
    let mut final_sections = build_final_sections(&final_results, &settings.categories)?;
@ -999,6 +1019,27 @@ async fn trace_article(
    db::article_history::insert_entry(pool, &entry).await.ok();
 }
 /// Log an LLM call with full prompt, response, and timing.
 async fn log_llm_call(
    pool: &sqlx::PgPool,
    user_id: Uuid,
    job_id: Uuid,
    call_type: &str,
    model: &str,
    system_prompt: &str,
    user_prompt: &str,
    response: &serde_json::Value,
    duration_ms: u64,
 ) {
    let response_str = serde_json::to_string_pretty(response).unwrap_or_default();
    db::llm_call_log::insert(
        pool, user_id, job_id, call_type, model,
        system_prompt, user_prompt, &response_str, duration_ms as i32,
    )
    .await
    .ok(); // Don't fail synthesis if logging fails
 }
 /// Look up or create a per-user rate limiter stored in AppState.
 ///
 /// Returns `None` if the user has no rate limit overrides, in which case the