mirror of
https://github.com/instructkr/claude-code.git
synced 2026-05-27 07:56:46 +00:00
176 lines
4.7 KiB
Rust
176 lines
4.7 KiB
Rust
//! `claw-rag-service` — HTTP API + `ingest` subcommand.
|
|
|
|
use std::path::PathBuf;
|
|
use std::sync::Arc;
|
|
|
|
use axum::{
|
|
extract::State,
|
|
http::StatusCode,
|
|
response::Html,
|
|
routing::{get, post},
|
|
Json, Router,
|
|
};
|
|
use clap::{Parser, Subcommand};
|
|
use claw_rag_service::{
|
|
chunk_count, open_db, query_index, run_ingest, EmbedConfig, QueryRequest, QueryResponse,
|
|
};
|
|
|
|
#[derive(Parser)]
|
|
#[command(
|
|
name = "claw-rag-service",
|
|
about = "Workspace RAG index + HTTP query API"
|
|
)]
|
|
struct Cli {
|
|
#[command(subcommand)]
|
|
command: Option<Cmd>,
|
|
}
|
|
|
|
#[derive(Subcommand)]
|
|
enum Cmd {
|
|
/// Run HTTP server (default when no subcommand).
|
|
Serve(ServeArgs),
|
|
/// Index a workspace into `SQLite` (calls embedding API).
|
|
Ingest(IngestArgs),
|
|
}
|
|
|
|
#[derive(Parser)]
|
|
struct ServeArgs {
|
|
#[arg(long, env = "CLAW_RAG_DB", default_value = ".claw-rag/index.sqlite")]
|
|
db: PathBuf,
|
|
}
|
|
|
|
#[derive(Parser)]
|
|
struct IngestArgs {
|
|
/// Workspace roots to ingest. Repeat `--workspace` to ingest multiple repos (cross-repo RAG).
|
|
#[arg(short, long)]
|
|
workspace: Vec<PathBuf>,
|
|
#[arg(long, env = "CLAW_RAG_DB", default_value = ".claw-rag/index.sqlite")]
|
|
db: PathBuf,
|
|
}
|
|
|
|
#[derive(Clone)]
|
|
struct AppState {
|
|
db_path: PathBuf,
|
|
client: reqwest::Client,
|
|
cfg: EmbedConfig,
|
|
}
|
|
|
|
/// Single-page UI for phase 3 (served at `GET /`).
|
|
static INDEX_HTML: &str = include_str!(concat!(env!("CARGO_MANIFEST_DIR"), "/static/index.html"));
|
|
|
|
async fn ui_index() -> Html<&'static str> {
|
|
Html(INDEX_HTML)
|
|
}
|
|
|
|
fn rag_router(state: Arc<AppState>) -> Router {
|
|
Router::new()
|
|
.route("/", get(ui_index))
|
|
.route("/health", get(|| async { "ok" }))
|
|
.route("/v1/stats", get(stats))
|
|
.route("/v1/query", post(query))
|
|
.with_state(state)
|
|
}
|
|
|
|
fn resolve_embed_config() -> Result<EmbedConfig, String> {
|
|
if let Some(c) = EmbedConfig::mock_from_env() {
|
|
return Ok(c);
|
|
}
|
|
EmbedConfig::from_env()
|
|
}
|
|
|
|
#[tokio::main]
|
|
async fn main() -> Result<(), Box<dyn std::error::Error + Send + Sync>> {
|
|
// Load `.env` if present (walks up parent directories).
|
|
// This is a convenience for local development; CI/production should set real env vars.
|
|
let _ = dotenvy::dotenv();
|
|
|
|
let cli = Cli::parse();
|
|
|
|
if let Some(Cmd::Ingest(a)) = cli.command {
|
|
let cfg = resolve_embed_config()?;
|
|
let client = reqwest::Client::new();
|
|
let st = run_ingest(&a.workspace, &a.db, &cfg, &client).await?;
|
|
eprintln!(
|
|
"ingest: files={} chunks={} embeddings={}",
|
|
st.files_indexed, st.chunks_total, st.embeddings_written
|
|
);
|
|
return Ok(());
|
|
}
|
|
|
|
let db = if let Some(Cmd::Serve(s)) = cli.command {
|
|
s.db
|
|
} else {
|
|
PathBuf::from(
|
|
std::env::var("CLAW_RAG_DB").unwrap_or_else(|_| ".claw-rag/index.sqlite".into()),
|
|
)
|
|
};
|
|
|
|
let cfg = resolve_embed_config()?;
|
|
let state = Arc::new(AppState {
|
|
db_path: db,
|
|
client: reqwest::Client::new(),
|
|
cfg,
|
|
});
|
|
|
|
let app = rag_router(state.clone());
|
|
|
|
let port: u16 = std::env::var("CLAW_RAG_PORT")
|
|
.ok()
|
|
.and_then(|s| s.parse().ok())
|
|
.unwrap_or(8787);
|
|
let host: std::net::IpAddr = std::env::var("CLAW_RAG_HOST")
|
|
.ok()
|
|
.and_then(|s| s.parse().ok())
|
|
.unwrap_or(std::net::IpAddr::V4(std::net::Ipv4Addr::LOCALHOST));
|
|
let addr = std::net::SocketAddr::from((host, port));
|
|
eprintln!(
|
|
"claw-rag-service db={} listen=http://{addr}",
|
|
state.db_path.display()
|
|
);
|
|
let listener = tokio::net::TcpListener::bind(addr).await?;
|
|
axum::serve(listener, app).await?;
|
|
Ok(())
|
|
}
|
|
|
|
async fn stats(State(state): State<Arc<AppState>>) -> Result<Json<serde_json::Value>, StatusCode> {
|
|
let path = state.db_path.clone();
|
|
if !path.is_file() {
|
|
return Ok(Json(serde_json::json!({
|
|
"chunks": 0,
|
|
"phase": "1-sqlite-no-db"
|
|
})));
|
|
}
|
|
let res = tokio::task::spawn_blocking(move || {
|
|
let conn = open_db(&path).map_err(|_| ())?;
|
|
chunk_count(&conn).map_err(|_| ())
|
|
})
|
|
.await
|
|
.map_err(|_| StatusCode::INTERNAL_SERVER_ERROR)?
|
|
.map_err(|()| StatusCode::INTERNAL_SERVER_ERROR)?;
|
|
Ok(Json(serde_json::json!({
|
|
"chunks": res,
|
|
"phase": "1-sqlite"
|
|
})))
|
|
}
|
|
|
|
async fn query(
|
|
State(state): State<Arc<AppState>>,
|
|
Json(req): Json<QueryRequest>,
|
|
) -> Result<Json<QueryResponse>, (StatusCode, String)> {
|
|
query_index(&state.db_path, &state.client, &state.cfg, &req)
|
|
.await
|
|
.map(Json)
|
|
.map_err(|e| (StatusCode::BAD_REQUEST, e))
|
|
}
|
|
|
|
#[cfg(test)]
|
|
mod tests {
|
|
use super::INDEX_HTML;
|
|
|
|
#[test]
|
|
fn index_html_wires_api_paths() {
|
|
assert!(INDEX_HTML.contains("/v1/stats"));
|
|
assert!(INDEX_HTML.contains("/v1/query"));
|
|
}
|
|
}
|