feat(knowledge): Phase A 知识库可见性隔离 + 结构化数据源 + 蒸馏Worker
Some checks failed
CI / Lint & TypeCheck (push) Has been cancelled
CI / Unit Tests (push) Has been cancelled
CI / Build Frontend (push) Has been cancelled
CI / Rust Check (push) Has been cancelled
CI / Security Scan (push) Has been cancelled
CI / E2E Tests (push) Has been cancelled
Some checks failed
CI / Lint & TypeCheck (push) Has been cancelled
CI / Unit Tests (push) Has been cancelled
CI / Build Frontend (push) Has been cancelled
CI / Rust Check (push) Has been cancelled
CI / Security Scan (push) Has been cancelled
CI / E2E Tests (push) Has been cancelled
- knowledge_items 增加 visibility(public/private) + account_id 字段 - 新建 structured_sources + structured_rows 表 (Excel JSONB 行级存储) - 结构化数据源 CRUD API (5 路由: list/get/rows/delete/query) - 安全查询: JSONB GIN 索引 + 可见性过滤 + 行数限制 - 蒸馏 Worker: 复用 Provider Key Pool 调 DeepSeek/Qwen API - L0 质量过滤: 长度/隐私检测 - create_item 增加 is_admin 参数控制可见性默认值 - generate_embedding: extract_keywords_from_text 改为 pub 复用 Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
@@ -190,7 +190,8 @@ pub async fn create_item(
|
||||
return Err(SaasError::InvalidInput("内容不能超过 100KB".into()));
|
||||
}
|
||||
|
||||
let item = service::create_item(&state.db, &ctx.account_id, &req).await?;
|
||||
let is_admin = ctx.role == "admin" || ctx.role == "super_admin";
|
||||
let item = service::create_item(&state.db, &ctx.account_id, &req, is_admin).await?;
|
||||
|
||||
// 异步触发 embedding 生成
|
||||
if let Err(e) = state.worker_dispatcher.dispatch(
|
||||
@@ -219,6 +220,7 @@ pub async fn batch_create_items(
|
||||
return Err(SaasError::InvalidInput("单次批量创建不能超过 50 条".into()));
|
||||
}
|
||||
|
||||
let is_admin = ctx.role == "admin" || ctx.role == "super_admin";
|
||||
let mut created = Vec::new();
|
||||
for req in &items {
|
||||
if req.title.trim().is_empty() || req.content.trim().is_empty() {
|
||||
@@ -229,7 +231,7 @@ pub async fn batch_create_items(
|
||||
tracing::warn!("Batch create: skipping item '{}' (content too long)", req.title);
|
||||
continue;
|
||||
}
|
||||
match service::create_item(&state.db, &ctx.account_id, req).await {
|
||||
match service::create_item(&state.db, &ctx.account_id, req, is_admin).await {
|
||||
Ok(item) => {
|
||||
if let Err(e) = state.worker_dispatcher.dispatch(
|
||||
"generate_embedding",
|
||||
@@ -534,6 +536,7 @@ pub async fn import_items(
|
||||
return Err(SaasError::InvalidInput("单次导入不能超过 20 个文件".into()));
|
||||
}
|
||||
|
||||
let is_admin = ctx.role == "admin" || ctx.role == "super_admin";
|
||||
let mut created = Vec::new();
|
||||
for file in &req.files {
|
||||
// 内容长度检查(数据库限制 100KB)
|
||||
@@ -561,9 +564,10 @@ pub async fn import_items(
|
||||
related_questions: None,
|
||||
priority: None,
|
||||
tags: file.tags.clone(),
|
||||
visibility: None,
|
||||
};
|
||||
|
||||
match service::create_item(&state.db, &ctx.account_id, &item_req).await {
|
||||
match service::create_item(&state.db, &ctx.account_id, &item_req, is_admin).await {
|
||||
Ok(item) => {
|
||||
if let Err(e) = state.worker_dispatcher.dispatch(
|
||||
"generate_embedding",
|
||||
@@ -590,3 +594,94 @@ pub async fn import_items(
|
||||
fn check_permission(ctx: &AuthContext, permission: &str) -> SaasResult<()> {
|
||||
crate::auth::handlers::check_permission(ctx, permission)
|
||||
}
|
||||
|
||||
fn is_admin(ctx: &AuthContext) -> bool {
|
||||
ctx.role == "admin" || ctx.role == "super_admin"
|
||||
}
|
||||
|
||||
// === 结构化数据源管理 ===
|
||||
|
||||
/// GET /api/v1/structured/sources
|
||||
pub async fn list_structured_sources(
|
||||
State(state): State<AppState>,
|
||||
Extension(ctx): Extension<AuthContext>,
|
||||
Query(query): Query<ListStructuredSourcesQuery>,
|
||||
) -> SaasResult<Json<serde_json::Value>> {
|
||||
check_permission(&ctx, "knowledge:read")?;
|
||||
let page = query.page.unwrap_or(1).max(1);
|
||||
let page_size = query.page_size.unwrap_or(20).max(1).min(100);
|
||||
|
||||
let (sources, total) = service::list_structured_sources(
|
||||
&state.db,
|
||||
Some(&ctx.account_id),
|
||||
query.industry_id.as_deref(),
|
||||
query.status.as_deref(),
|
||||
page,
|
||||
page_size,
|
||||
).await?;
|
||||
|
||||
Ok(Json(serde_json::json!({
|
||||
"items": sources,
|
||||
"total": total,
|
||||
"page": page,
|
||||
"page_size": page_size,
|
||||
})))
|
||||
}
|
||||
|
||||
/// GET /api/v1/structured/sources/:id
|
||||
pub async fn get_structured_source(
|
||||
State(state): State<AppState>,
|
||||
Extension(ctx): Extension<AuthContext>,
|
||||
Path(id): Path<String>,
|
||||
) -> SaasResult<Json<serde_json::Value>> {
|
||||
check_permission(&ctx, "knowledge:read")?;
|
||||
let source = service::get_structured_source(&state.db, &id, Some(&ctx.account_id)).await?
|
||||
.ok_or_else(|| SaasError::NotFound("数据源不存在".into()))?;
|
||||
Ok(Json(serde_json::to_value(source).unwrap_or_default()))
|
||||
}
|
||||
|
||||
/// GET /api/v1/structured/sources/:id/rows
|
||||
pub async fn list_structured_source_rows(
|
||||
State(state): State<AppState>,
|
||||
Extension(ctx): Extension<AuthContext>,
|
||||
Path(id): Path<String>,
|
||||
Query(query): Query<ListStructuredRowsQuery>,
|
||||
) -> SaasResult<Json<serde_json::Value>> {
|
||||
check_permission(&ctx, "knowledge:read")?;
|
||||
let page = query.page.unwrap_or(1).max(1);
|
||||
let page_size = query.page_size.unwrap_or(50).max(1).min(200);
|
||||
|
||||
let (rows, total) = service::list_structured_rows(
|
||||
&state.db, &id, Some(&ctx.account_id),
|
||||
query.sheet_name.as_deref(), page, page_size,
|
||||
).await?;
|
||||
|
||||
Ok(Json(serde_json::json!({
|
||||
"rows": rows,
|
||||
"total": total,
|
||||
"page": page,
|
||||
"page_size": page_size,
|
||||
})))
|
||||
}
|
||||
|
||||
/// DELETE /api/v1/structured/sources/:id
|
||||
pub async fn delete_structured_source(
|
||||
State(state): State<AppState>,
|
||||
Extension(ctx): Extension<AuthContext>,
|
||||
Path(id): Path<String>,
|
||||
) -> SaasResult<Json<serde_json::Value>> {
|
||||
check_permission(&ctx, "knowledge:admin")?;
|
||||
service::delete_structured_source(&state.db, &id).await?;
|
||||
Ok(Json(serde_json::json!({"deleted": true})))
|
||||
}
|
||||
|
||||
/// POST /api/v1/structured/query
|
||||
pub async fn query_structured(
|
||||
State(state): State<AppState>,
|
||||
Extension(ctx): Extension<AuthContext>,
|
||||
Json(req): Json<StructuredQueryRequest>,
|
||||
) -> SaasResult<Json<Vec<StructuredQueryResult>>> {
|
||||
check_permission(&ctx, "knowledge:search")?;
|
||||
let results = service::query_structured(&state.db, &req, Some(&ctx.account_id)).await?;
|
||||
Ok(Json(results))
|
||||
}
|
||||
|
||||
@@ -1,4 +1,4 @@
|
||||
//! 知识库模块 — 行业知识管理、RAG 检索、版本控制
|
||||
//! 知识库模块 — 行业知识管理、RAG 检索、版本控制、结构化数据
|
||||
|
||||
pub mod types;
|
||||
pub mod service;
|
||||
@@ -36,4 +36,10 @@ pub fn routes() -> axum::Router<crate::state::AppState> {
|
||||
.route("/api/v1/knowledge/analytics/top-items", get(handlers::analytics_top_items))
|
||||
.route("/api/v1/knowledge/analytics/quality", get(handlers::analytics_quality))
|
||||
.route("/api/v1/knowledge/analytics/gaps", get(handlers::analytics_gaps))
|
||||
// 结构化数据源管理
|
||||
.route("/api/v1/structured/sources", get(handlers::list_structured_sources))
|
||||
.route("/api/v1/structured/sources/:id", get(handlers::get_structured_source))
|
||||
.route("/api/v1/structured/sources/:id/rows", get(handlers::list_structured_source_rows))
|
||||
.route("/api/v1/structured/sources/:id", delete(handlers::delete_structured_source))
|
||||
.route("/api/v1/structured/query", post(handlers::query_structured))
|
||||
}
|
||||
|
||||
@@ -276,6 +276,7 @@ pub async fn create_item(
|
||||
pool: &PgPool,
|
||||
account_id: &str,
|
||||
req: &CreateItemRequest,
|
||||
is_admin: bool,
|
||||
) -> SaasResult<KnowledgeItem> {
|
||||
let id = uuid::Uuid::new_v4().to_string();
|
||||
let keywords = req.keywords.as_deref().unwrap_or(&[]);
|
||||
@@ -283,6 +284,16 @@ pub async fn create_item(
|
||||
let priority = req.priority.unwrap_or(0);
|
||||
let tags = req.tags.as_deref().unwrap_or(&[]);
|
||||
|
||||
// visibility: Admin 默认 public,普通用户默认 private
|
||||
let visibility = req.visibility.as_deref().unwrap_or_else(|| {
|
||||
if is_admin { "public" } else { "private" }
|
||||
});
|
||||
if !is_admin && visibility == "public" {
|
||||
return Err(crate::error::SaasError::InvalidInput(
|
||||
"普通用户只能创建私有知识条目".into(),
|
||||
));
|
||||
}
|
||||
|
||||
// 验证 category_id 存在性
|
||||
let cat_exists: bool = sqlx::query_scalar(
|
||||
"SELECT EXISTS(SELECT 1 FROM knowledge_categories WHERE id = $1)"
|
||||
@@ -299,10 +310,12 @@ pub async fn create_item(
|
||||
// 使用事务保证 item + version 原子性
|
||||
let mut tx = pool.begin().await?;
|
||||
|
||||
let item_account_id: Option<&str> = if visibility == "public" { None } else { Some(account_id) };
|
||||
|
||||
let item = sqlx::query_as::<_, KnowledgeItem>(
|
||||
"INSERT INTO knowledge_items \
|
||||
(id, category_id, title, content, keywords, related_questions, priority, tags, created_by) \
|
||||
VALUES ($1, $2, $3, $4, $5, $6, $7, $8, $9) \
|
||||
(id, category_id, title, content, keywords, related_questions, priority, tags, created_by, visibility, account_id) \
|
||||
VALUES ($1, $2, $3, $4, $5, $6, $7, $8, $9, $10, $11) \
|
||||
RETURNING *"
|
||||
)
|
||||
.bind(&id)
|
||||
@@ -314,6 +327,8 @@ pub async fn create_item(
|
||||
.bind(priority)
|
||||
.bind(tags)
|
||||
.bind(account_id)
|
||||
.bind(visibility)
|
||||
.bind(item_account_id)
|
||||
.fetch_one(&mut *tx)
|
||||
.await?;
|
||||
|
||||
@@ -781,3 +796,257 @@ pub async fn analytics_gaps(pool: &PgPool) -> SaasResult<serde_json::Value> {
|
||||
"gaps": gaps.into_iter().map(|(v,)| v).collect::<Vec<_>>()
|
||||
}))
|
||||
}
|
||||
|
||||
// === 结构化数据源 CRUD ===
|
||||
|
||||
/// 创建结构化数据源
|
||||
pub async fn create_structured_source(
|
||||
pool: &PgPool,
|
||||
account_id: &str,
|
||||
is_admin: bool,
|
||||
req: &CreateStructuredSourceRequest,
|
||||
) -> SaasResult<StructuredSource> {
|
||||
let id = uuid::Uuid::new_v4().to_string();
|
||||
let visibility = req.visibility.as_deref().unwrap_or_else(|| {
|
||||
if is_admin { "public" } else { "private" }
|
||||
});
|
||||
let source_account_id: Option<&str> = if visibility == "public" { None } else { Some(account_id) };
|
||||
|
||||
let source = sqlx::query_as::<_, StructuredSource>(
|
||||
"INSERT INTO structured_sources \
|
||||
(id, account_id, title, description, original_file_name, sheet_names, column_headers, \
|
||||
visibility, industry_id, created_by) \
|
||||
VALUES ($1, $2, $3, $4, $5, $6, $7, $8, $9, $10) \
|
||||
RETURNING *"
|
||||
)
|
||||
.bind(&id)
|
||||
.bind(source_account_id)
|
||||
.bind(&req.title)
|
||||
.bind(&req.description)
|
||||
.bind(&req.original_file_name)
|
||||
.bind(req.sheet_names.as_deref().unwrap_or(&vec![]))
|
||||
.bind(req.column_headers.as_deref().unwrap_or(&vec![]))
|
||||
.bind(visibility)
|
||||
.bind(&req.industry_id)
|
||||
.bind(account_id)
|
||||
.fetch_one(pool)
|
||||
.await?;
|
||||
|
||||
Ok(source)
|
||||
}
|
||||
|
||||
/// 批量写入结构化数据行
|
||||
pub async fn insert_structured_rows(
|
||||
pool: &PgPool,
|
||||
source_id: &str,
|
||||
rows: &[(Option<String>, i32, Vec<String>, serde_json::Value)],
|
||||
) -> SaasResult<i64> {
|
||||
let mut tx = pool.begin().await?;
|
||||
let mut count: i64 = 0;
|
||||
|
||||
for (sheet_name, row_index, headers, row_data) in rows {
|
||||
let row_id = uuid::Uuid::new_v4().to_string();
|
||||
sqlx::query(
|
||||
"INSERT INTO structured_rows (id, source_id, sheet_name, row_index, headers, row_data) \
|
||||
VALUES ($1, $2, $3, $4, $5, $6)"
|
||||
)
|
||||
.bind(&row_id)
|
||||
.bind(source_id)
|
||||
.bind(sheet_name)
|
||||
.bind(*row_index)
|
||||
.bind(headers)
|
||||
.bind(row_data)
|
||||
.execute(&mut *tx)
|
||||
.await?;
|
||||
count += 1;
|
||||
}
|
||||
|
||||
sqlx::query(
|
||||
"UPDATE structured_sources SET row_count = (SELECT COUNT(*) FROM structured_rows WHERE source_id = $1), \
|
||||
updated_at = NOW() WHERE id = $1"
|
||||
)
|
||||
.bind(source_id)
|
||||
.execute(&mut *tx)
|
||||
.await?;
|
||||
|
||||
tx.commit().await?;
|
||||
Ok(count)
|
||||
}
|
||||
|
||||
/// 列出结构化数据源(分页,含可见性过滤)
|
||||
pub async fn list_structured_sources(
|
||||
pool: &PgPool,
|
||||
viewer_account_id: Option<&str>,
|
||||
industry_id: Option<&str>,
|
||||
status: Option<&str>,
|
||||
page: i64,
|
||||
page_size: i64,
|
||||
) -> SaasResult<(Vec<StructuredSource>, i64)> {
|
||||
let offset = (page - 1) * page_size;
|
||||
|
||||
let items: Vec<StructuredSource> = sqlx::query_as(
|
||||
"SELECT * FROM structured_sources \
|
||||
WHERE (visibility = 'public' OR account_id = $1) \
|
||||
AND ($2::text IS NULL OR industry_id = $2) \
|
||||
AND ($3::text IS NULL OR status = $3) \
|
||||
ORDER BY updated_at DESC \
|
||||
LIMIT $4 OFFSET $5"
|
||||
)
|
||||
.bind(viewer_account_id)
|
||||
.bind(industry_id)
|
||||
.bind(status)
|
||||
.bind(page_size)
|
||||
.bind(offset)
|
||||
.fetch_all(pool)
|
||||
.await?;
|
||||
|
||||
let total: (i64,) = sqlx::query_as(
|
||||
"SELECT COUNT(*) FROM structured_sources \
|
||||
WHERE (visibility = 'public' OR account_id = $1) \
|
||||
AND ($2::text IS NULL OR industry_id = $2) \
|
||||
AND ($3::text IS NULL OR status = $3)"
|
||||
)
|
||||
.bind(viewer_account_id)
|
||||
.bind(industry_id)
|
||||
.bind(status)
|
||||
.fetch_one(pool)
|
||||
.await?;
|
||||
|
||||
Ok((items, total.0))
|
||||
}
|
||||
|
||||
/// 获取结构化数据源详情
|
||||
pub async fn get_structured_source(
|
||||
pool: &PgPool,
|
||||
source_id: &str,
|
||||
viewer_account_id: Option<&str>,
|
||||
) -> SaasResult<Option<StructuredSource>> {
|
||||
let source = sqlx::query_as::<_, StructuredSource>(
|
||||
"SELECT * FROM structured_sources WHERE id = $1 \
|
||||
AND (visibility = 'public' OR account_id = $2)"
|
||||
)
|
||||
.bind(source_id)
|
||||
.bind(viewer_account_id)
|
||||
.fetch_optional(pool)
|
||||
.await?;
|
||||
Ok(source)
|
||||
}
|
||||
|
||||
/// 列出结构化数据源的行数据(分页)
|
||||
pub async fn list_structured_rows(
|
||||
pool: &PgPool,
|
||||
source_id: &str,
|
||||
viewer_account_id: Option<&str>,
|
||||
sheet_name: Option<&str>,
|
||||
page: i64,
|
||||
page_size: i64,
|
||||
) -> SaasResult<(Vec<StructuredRow>, i64)> {
|
||||
let source = get_structured_source(pool, source_id, viewer_account_id).await?;
|
||||
if source.is_none() {
|
||||
return Err(crate::error::SaasError::NotFound("数据源不存在或无权限".into()));
|
||||
}
|
||||
|
||||
let offset = (page - 1) * page_size;
|
||||
let rows: Vec<StructuredRow> = sqlx::query_as(
|
||||
"SELECT * FROM structured_rows \
|
||||
WHERE source_id = $1 \
|
||||
AND ($2::text IS NULL OR sheet_name = $2) \
|
||||
ORDER BY row_index \
|
||||
LIMIT $3 OFFSET $4"
|
||||
)
|
||||
.bind(source_id)
|
||||
.bind(sheet_name)
|
||||
.bind(page_size)
|
||||
.bind(offset)
|
||||
.fetch_all(pool)
|
||||
.await?;
|
||||
|
||||
let total: (i64,) = sqlx::query_as(
|
||||
"SELECT COUNT(*) FROM structured_rows \
|
||||
WHERE source_id = $1 \
|
||||
AND ($2::text IS NULL OR sheet_name = $2)"
|
||||
)
|
||||
.bind(source_id)
|
||||
.bind(sheet_name)
|
||||
.fetch_one(pool)
|
||||
.await?;
|
||||
|
||||
Ok((rows, total.0))
|
||||
}
|
||||
|
||||
/// 删除结构化数据源(级联删除行)
|
||||
pub async fn delete_structured_source(pool: &PgPool, source_id: &str) -> SaasResult<()> {
|
||||
let result = sqlx::query("DELETE FROM structured_sources WHERE id = $1")
|
||||
.bind(source_id)
|
||||
.execute(pool)
|
||||
.await?;
|
||||
if result.rows_affected() == 0 {
|
||||
return Err(crate::error::SaasError::NotFound("数据源不存在".into()));
|
||||
}
|
||||
Ok(())
|
||||
}
|
||||
|
||||
/// 安全的结构化查询(关键词匹配 + 可见性过滤)
|
||||
pub async fn query_structured(
|
||||
pool: &PgPool,
|
||||
request: &StructuredQueryRequest,
|
||||
viewer_account_id: Option<&str>,
|
||||
) -> SaasResult<Vec<StructuredQueryResult>> {
|
||||
let limit = request.limit.unwrap_or(20).min(50);
|
||||
let pattern = format!("%{}%",
|
||||
request.query.replace('\\', "\\\\").replace('%', "\\%").replace('_', "\\_")
|
||||
);
|
||||
|
||||
let source_filter = if let Some(ref sid) = request.source_id {
|
||||
format!("AND ss.id = '{}'", sid.replace('\'', "''"))
|
||||
} else {
|
||||
String::new()
|
||||
};
|
||||
let industry_filter = if let Some(ref iid) = request.industry_id {
|
||||
format!("AND ss.industry_id = '{}'", iid.replace('\'', "''"))
|
||||
} else {
|
||||
String::new()
|
||||
};
|
||||
|
||||
let rows: Vec<(String, String, Vec<String>, serde_json::Value)> = sqlx::query_as(
|
||||
&format!(
|
||||
"SELECT sr.source_id, ss.title, sr.headers, sr.row_data \
|
||||
FROM structured_rows sr \
|
||||
JOIN structured_sources ss ON sr.source_id = ss.id \
|
||||
WHERE (ss.visibility = 'public' OR ss.account_id = $1) \
|
||||
AND ss.status = 'active' \
|
||||
{} {} \
|
||||
AND (sr.row_data::text ILIKE $2 \
|
||||
OR array_to_string(sr.headers, ' ') ILIKE $2) \
|
||||
ORDER BY ss.title, sr.row_index \
|
||||
LIMIT {}",
|
||||
source_filter, industry_filter, limit
|
||||
)
|
||||
)
|
||||
.bind(viewer_account_id)
|
||||
.bind(&pattern)
|
||||
.fetch_all(pool)
|
||||
.await?;
|
||||
|
||||
let mut results_map: std::collections::HashMap<String, StructuredQueryResult> =
|
||||
std::collections::HashMap::new();
|
||||
|
||||
for (source_id, source_title, headers, row_data) in rows {
|
||||
let entry = results_map.entry(source_id.clone())
|
||||
.or_insert_with(|| StructuredQueryResult {
|
||||
source_id: source_id.clone(),
|
||||
source_title: source_title.clone(),
|
||||
headers: headers.clone(),
|
||||
rows: Vec::new(),
|
||||
total_matched: 0,
|
||||
generated_sql: None,
|
||||
});
|
||||
|
||||
if let Ok(map) = serde_json::from_value::<std::collections::HashMap<String, serde_json::Value>>(row_data) {
|
||||
entry.rows.push(map);
|
||||
}
|
||||
entry.total_matched += 1;
|
||||
}
|
||||
|
||||
Ok(results_map.into_values().collect())
|
||||
}
|
||||
|
||||
@@ -2,6 +2,7 @@
|
||||
|
||||
use chrono::{DateTime, Utc};
|
||||
use serde::{Deserialize, Serialize};
|
||||
use std::collections::HashMap;
|
||||
|
||||
// === 分类 ===
|
||||
|
||||
@@ -63,6 +64,8 @@ pub struct KnowledgeItem {
|
||||
pub source: String,
|
||||
pub tags: Vec<String>,
|
||||
pub created_by: String,
|
||||
pub visibility: Option<String>,
|
||||
pub account_id: Option<String>,
|
||||
pub created_at: DateTime<Utc>,
|
||||
pub updated_at: DateTime<Utc>,
|
||||
}
|
||||
@@ -76,6 +79,7 @@ pub struct CreateItemRequest {
|
||||
pub related_questions: Option<Vec<String>>,
|
||||
pub priority: Option<i32>,
|
||||
pub tags: Option<Vec<String>>,
|
||||
pub visibility: Option<String>,
|
||||
}
|
||||
|
||||
#[derive(Debug, Deserialize)]
|
||||
@@ -115,6 +119,7 @@ pub struct ItemResponse {
|
||||
pub source: String,
|
||||
pub tags: Vec<String>,
|
||||
pub created_by: String,
|
||||
pub visibility: Option<String>,
|
||||
pub reference_count: i64,
|
||||
pub created_at: String,
|
||||
pub updated_at: String,
|
||||
@@ -167,14 +172,6 @@ pub struct KnowledgeUsage {
|
||||
|
||||
// === 搜索 ===
|
||||
|
||||
#[derive(Debug, Deserialize)]
|
||||
pub struct SearchRequest {
|
||||
pub query: String,
|
||||
pub category_id: Option<String>,
|
||||
pub limit: Option<i64>,
|
||||
pub min_score: Option<f64>,
|
||||
}
|
||||
|
||||
#[derive(Debug, Serialize)]
|
||||
pub struct SearchResult {
|
||||
pub chunk_id: String,
|
||||
@@ -223,3 +220,114 @@ pub struct ImportRequest {
|
||||
pub category_id: String,
|
||||
pub files: Vec<ImportFile>,
|
||||
}
|
||||
|
||||
// === 搜索增强 ===
|
||||
|
||||
#[derive(Debug, Deserialize)]
|
||||
pub struct SearchRequest {
|
||||
pub query: String,
|
||||
pub category_id: Option<String>,
|
||||
pub industry_id: Option<String>,
|
||||
pub search_structured: Option<bool>,
|
||||
pub search_documents: Option<bool>,
|
||||
pub limit: Option<i64>,
|
||||
pub min_score: Option<f64>,
|
||||
}
|
||||
|
||||
#[derive(Debug, Serialize)]
|
||||
pub struct UnifiedSearchResult {
|
||||
pub documents: Vec<SearchResult>,
|
||||
pub structured: Vec<StructuredQueryResult>,
|
||||
}
|
||||
|
||||
// === 结构化数据源 ===
|
||||
|
||||
#[derive(Debug, Clone, Serialize, Deserialize, sqlx::FromRow)]
|
||||
pub struct StructuredSource {
|
||||
pub id: String,
|
||||
pub account_id: Option<String>,
|
||||
pub title: String,
|
||||
pub description: Option<String>,
|
||||
pub original_file_name: Option<String>,
|
||||
pub sheet_names: Vec<String>,
|
||||
pub row_count: i32,
|
||||
pub column_headers: Vec<String>,
|
||||
pub visibility: Option<String>,
|
||||
pub industry_id: Option<String>,
|
||||
pub status: String,
|
||||
pub created_by: String,
|
||||
pub created_at: DateTime<Utc>,
|
||||
pub updated_at: DateTime<Utc>,
|
||||
}
|
||||
|
||||
#[derive(Debug, Deserialize)]
|
||||
pub struct CreateStructuredSourceRequest {
|
||||
pub title: String,
|
||||
pub description: Option<String>,
|
||||
pub original_file_name: Option<String>,
|
||||
pub sheet_names: Option<Vec<String>>,
|
||||
pub column_headers: Option<Vec<String>>,
|
||||
pub visibility: Option<String>,
|
||||
pub industry_id: Option<String>,
|
||||
}
|
||||
|
||||
#[derive(Debug, Deserialize)]
|
||||
pub struct ListStructuredSourcesQuery {
|
||||
pub page: Option<i64>,
|
||||
pub page_size: Option<i64>,
|
||||
pub industry_id: Option<String>,
|
||||
pub status: Option<String>,
|
||||
}
|
||||
|
||||
#[derive(Debug, Serialize)]
|
||||
pub struct StructuredSourceResponse {
|
||||
pub id: String,
|
||||
pub title: String,
|
||||
pub description: Option<String>,
|
||||
pub original_file_name: Option<String>,
|
||||
pub sheet_names: Vec<String>,
|
||||
pub row_count: i64,
|
||||
pub column_headers: Vec<String>,
|
||||
pub visibility: Option<String>,
|
||||
pub industry_id: Option<String>,
|
||||
pub status: String,
|
||||
pub created_by: String,
|
||||
pub created_at: String,
|
||||
pub updated_at: String,
|
||||
}
|
||||
|
||||
#[derive(Debug, Clone, Serialize, Deserialize, sqlx::FromRow)]
|
||||
pub struct StructuredRow {
|
||||
pub id: String,
|
||||
pub source_id: String,
|
||||
pub sheet_name: Option<String>,
|
||||
pub row_index: i32,
|
||||
pub headers: Vec<String>,
|
||||
pub row_data: serde_json::Value,
|
||||
pub created_at: DateTime<Utc>,
|
||||
}
|
||||
|
||||
#[derive(Debug, Deserialize)]
|
||||
pub struct ListStructuredRowsQuery {
|
||||
pub page: Option<i64>,
|
||||
pub page_size: Option<i64>,
|
||||
pub sheet_name: Option<String>,
|
||||
}
|
||||
|
||||
#[derive(Debug, Deserialize)]
|
||||
pub struct StructuredQueryRequest {
|
||||
pub query: String,
|
||||
pub source_id: Option<String>,
|
||||
pub industry_id: Option<String>,
|
||||
pub limit: Option<i64>,
|
||||
}
|
||||
|
||||
#[derive(Debug, Serialize)]
|
||||
pub struct StructuredQueryResult {
|
||||
pub source_id: String,
|
||||
pub source_title: String,
|
||||
pub headers: Vec<String>,
|
||||
pub rows: Vec<HashMap<String, serde_json::Value>>,
|
||||
pub total_matched: i64,
|
||||
pub generated_sql: Option<String>,
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user