feat(cli): Wire --full flag for embed, add sync stage spinners

- Add --full / --no-full flag pair to EmbedArgs with overrides_with semantics matching the existing flag pattern. When active, atomically DELETEs all embedding_metadata and embeddings before re-embedding. - Thread the full flag through run_embed -> run_sync so that 'lore sync --full' triggers a complete re-embed alongside the full re-ingest it already performed. - Add indicatif spinners to sync stages with dynamic stage numbering that adjusts when --no-docs or --no-embed skip stages. Spinners are hidden in robot mode. - Update robot-docs manifest to advertise the new --full flag on the embed command. - Replace hardcoded schema version 9 in health check with the LATEST_SCHEMA_VERSION constant from db.rs. Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
2026-02-03 09:35:22 -05:00
parent 7d07f95d4c
commit aebbe6b795
4 changed files with 82 additions and 18 deletions
--- a/src/cli/commands/embed.rs
+++ b/src/cli/commands/embed.rs
@@ -21,6 +21,7 @@ pub struct EmbedCommandResult {
 /// Run the embed command.
 pub async fn run_embed(
    config: &Config,
+    full: bool,
    retry_failed: bool,
 ) -> Result<EmbedCommandResult> {
    let db_path = get_db_path(config.storage.db_path.as_deref());
@@ -37,8 +38,18 @@ pub async fn run_embed(
    // Health check — fail fast if Ollama is down or model missing
    client.health_check().await?;

-    // If retry_failed, clear errors so they become pending again
-    if retry_failed {
+    if full {
+        // Clear ALL embeddings and metadata atomically for a complete re-embed.
+        // Wrapped in a transaction so a crash between the two DELETEs can't
+        // leave orphaned data.
+        conn.execute_batch(
+            "BEGIN;
+             DELETE FROM embedding_metadata;
+             DELETE FROM embeddings;
+             COMMIT;",
+        )?;
+    } else if retry_failed {
+        // Clear errors so they become pending again
        conn.execute(
            "UPDATE embedding_metadata SET last_error = NULL, attempt_count = 0
             WHERE last_error IS NOT NULL",
--- a/src/cli/commands/sync.rs
+++ b/src/cli/commands/sync.rs
@@ -1,6 +1,7 @@
 //! Sync command: unified orchestrator for ingest -> generate-docs -> embed.

 use console::style;
+use indicatif::{ProgressBar, ProgressStyle};
 use serde::Serialize;
 use tracing::{info, warn};

@@ -31,6 +32,22 @@ pub struct SyncResult {
    pub documents_embedded: usize,
 }

+/// Create a styled spinner for a sync stage.
+fn stage_spinner(stage: u8, total: u8, msg: &str, robot_mode: bool) -> ProgressBar {
+    if robot_mode {
+        return ProgressBar::hidden();
+    }
+    let pb = ProgressBar::new_spinner();
+    pb.set_style(
+        ProgressStyle::default_spinner()
+            .template("{spinner:.blue} {msg}")
+            .expect("valid template"),
+    );
+    pb.enable_steady_tick(std::time::Duration::from_millis(80));
+    pb.set_message(format!("[{stage}/{total}] {msg}"));
+    pb
+}
+
 /// Run the full sync pipeline: ingest -> generate-docs -> embed.
 pub async fn run_sync(config: &Config, options: SyncOptions) -> Result<SyncResult> {
    let mut result = SyncResult::default();
@@ -41,41 +58,70 @@ pub async fn run_sync(config: &Config, options: SyncOptions) -> Result<SyncResul
        IngestDisplay::progress_only()
    };

+    let total_stages: u8 = if options.no_docs && options.no_embed {
+        2
+    } else if options.no_docs || options.no_embed {
+        3
+    } else {
+        4
+    };
+    let mut current_stage: u8 = 0;
+
    // Stage 1: Ingest issues
-    info!("Sync stage 1/4: ingesting issues");
+    current_stage += 1;
+    let spinner = stage_spinner(current_stage, total_stages, "Fetching issues from GitLab...", options.robot_mode);
+    info!("Sync stage {current_stage}/{total_stages}: ingesting issues");
    let issues_result = run_ingest(config, "issues", None, options.force, options.full, ingest_display).await?;
    result.issues_updated = issues_result.issues_upserted;
    result.discussions_fetched += issues_result.discussions_fetched;
+    spinner.finish_and_clear();

    // Stage 2: Ingest MRs
-    info!("Sync stage 2/4: ingesting merge requests");
+    current_stage += 1;
+    let spinner = stage_spinner(current_stage, total_stages, "Fetching merge requests from GitLab...", options.robot_mode);
+    info!("Sync stage {current_stage}/{total_stages}: ingesting merge requests");
    let mrs_result = run_ingest(config, "mrs", None, options.force, options.full, ingest_display).await?;
    result.mrs_updated = mrs_result.mrs_upserted;
    result.discussions_fetched += mrs_result.discussions_fetched;
+    spinner.finish_and_clear();

    // Stage 3: Generate documents (unless --no-docs)
-    if options.no_docs {
-        info!("Sync stage 3/4: skipping document generation (--no-docs)");
-    } else {
-        info!("Sync stage 3/4: generating documents");
+    if !options.no_docs {
+        current_stage += 1;
+        let spinner = stage_spinner(current_stage, total_stages, "Processing documents...", options.robot_mode);
+        info!("Sync stage {current_stage}/{total_stages}: generating documents");
        let docs_result = run_generate_docs(config, false, None)?;
        result.documents_regenerated = docs_result.regenerated;
+        spinner.finish_and_clear();
+    } else {
+        info!("Sync: skipping document generation (--no-docs)");
    }

    // Stage 4: Embed documents (unless --no-embed)
-    if options.no_embed {
-        info!("Sync stage 4/4: skipping embedding (--no-embed)");
-    } else {
-        info!("Sync stage 4/4: embedding documents");
-        match run_embed(config, false).await {
+    if !options.no_embed {
+        current_stage += 1;
+        let spinner = stage_spinner(current_stage, total_stages, "Generating embeddings...", options.robot_mode);
+        info!("Sync stage {current_stage}/{total_stages}: embedding documents");
+        match run_embed(config, options.full, false).await {
            Ok(embed_result) => {
                result.documents_embedded = embed_result.embedded;
+                spinner.finish_and_clear();
            }
            Err(e) => {
                // Graceful degradation: Ollama down is a warning, not an error
+                spinner.finish_and_clear();
+                if !options.robot_mode {
+                    eprintln!(
+                        "  {} Embedding skipped ({})",
+                        style("warn").yellow(),
+                        e
+                    );
+                }
                warn!(error = %e, "Embedding stage failed (Ollama may be unavailable), continuing");
            }
        }
+    } else {
+        info!("Sync: skipping embedding (--no-embed)");
    }

    info!(