mirror of
https://github.com/perstarkse/minne.git
synced 2026-03-23 01:50:01 +01:00
wip query
This commit is contained in:
@@ -53,6 +53,8 @@ pub enum ApiError {
|
||||
QueryError(String),
|
||||
#[error("RabbitMQ error: {0}")]
|
||||
RabbitMQError(#[from] RabbitMQError),
|
||||
#[error("LLM processing error: {0}")]
|
||||
OpenAIerror(#[from] OpenAIError),
|
||||
}
|
||||
|
||||
impl IntoResponse for ApiError {
|
||||
@@ -61,6 +63,7 @@ impl IntoResponse for ApiError {
|
||||
ApiError::ProcessingError(_) => (StatusCode::INTERNAL_SERVER_ERROR, self.to_string()),
|
||||
ApiError::PublishingError(_) => (StatusCode::INTERNAL_SERVER_ERROR, self.to_string()),
|
||||
ApiError::DatabaseError(_) => (StatusCode::INTERNAL_SERVER_ERROR, self.to_string()),
|
||||
ApiError::OpenAIerror(_) => (StatusCode::INTERNAL_SERVER_ERROR, self.to_string()),
|
||||
ApiError::QueryError(_) => (StatusCode::BAD_REQUEST, self.to_string()),
|
||||
ApiError::IngressContentError(_) => {
|
||||
(StatusCode::INTERNAL_SERVER_ERROR, self.to_string())
|
||||
|
||||
@@ -1,8 +1,8 @@
|
||||
use crate::{
|
||||
error::ProcessingError,
|
||||
ingress::analysis::prompt::{get_ingress_analysis_schema, INGRESS_ANALYSIS_SYSTEM_MESSAGE},
|
||||
retrieval::vector::find_items_by_vector_similarity,
|
||||
storage::types::{knowledge_entity::KnowledgeEntity, StoredObject},
|
||||
retrieval::combined_knowledge_entity_retrieval,
|
||||
storage::types::knowledge_entity::KnowledgeEntity,
|
||||
};
|
||||
use async_openai::types::{
|
||||
ChatCompletionRequestSystemMessage, ChatCompletionRequestUserMessage,
|
||||
@@ -57,14 +57,7 @@ impl<'a> IngressAnalyzer<'a> {
|
||||
text, category, instructions
|
||||
);
|
||||
|
||||
find_items_by_vector_similarity(
|
||||
10,
|
||||
input_text,
|
||||
self.db_client,
|
||||
KnowledgeEntity::table_name().to_string(),
|
||||
self.openai_client,
|
||||
)
|
||||
.await
|
||||
combined_knowledge_entity_retrieval(self.db_client, self.openai_client, input_text).await
|
||||
}
|
||||
|
||||
fn prepare_llm_request(
|
||||
@@ -106,7 +99,7 @@ impl<'a> IngressAnalyzer<'a> {
|
||||
CreateChatCompletionRequestArgs::default()
|
||||
.model("gpt-4o-mini")
|
||||
.temperature(0.2)
|
||||
.max_tokens(2048u32)
|
||||
.max_tokens(3048u32)
|
||||
.messages([
|
||||
ChatCompletionRequestSystemMessage::from(INGRESS_ANALYSIS_SYSTEM_MESSAGE).into(),
|
||||
ChatCompletionRequestUserMessage::from(user_message).into(),
|
||||
|
||||
@@ -5,7 +5,6 @@ use tracing::{debug, info};
|
||||
|
||||
use crate::{
|
||||
error::ProcessingError,
|
||||
retrieval::vector::find_items_by_vector_similarity,
|
||||
storage::{
|
||||
db::{store_item, SurrealDbClient},
|
||||
types::{
|
||||
@@ -39,10 +38,8 @@ impl ContentProcessor {
|
||||
|
||||
let now = Instant::now();
|
||||
// Process in parallel where possible
|
||||
let (analysis, _similar_chunks) = tokio::try_join!(
|
||||
self.perform_semantic_analysis(content),
|
||||
self.find_similar_content(content),
|
||||
)?;
|
||||
let analysis = self.perform_semantic_analysis(content).await?;
|
||||
|
||||
let end = now.elapsed();
|
||||
info!(
|
||||
"{:?} time elapsed during creation of entities and relationships",
|
||||
@@ -74,20 +71,6 @@ impl ContentProcessor {
|
||||
.await
|
||||
}
|
||||
|
||||
async fn find_similar_content(
|
||||
&self,
|
||||
content: &TextContent,
|
||||
) -> Result<Vec<TextChunk>, ProcessingError> {
|
||||
find_items_by_vector_similarity(
|
||||
3,
|
||||
content.text.clone(),
|
||||
&self.db_client,
|
||||
"text_chunk".to_string(),
|
||||
&self.openai_client,
|
||||
)
|
||||
.await
|
||||
}
|
||||
|
||||
async fn store_graph_entities(
|
||||
&self,
|
||||
entities: Vec<KnowledgeEntity>,
|
||||
|
||||
@@ -1,5 +1,5 @@
|
||||
use surrealdb::{engine::remote::ws::Client, Surreal};
|
||||
use tracing::info;
|
||||
use tracing::debug;
|
||||
|
||||
use crate::{error::ProcessingError, storage::types::knowledge_entity::KnowledgeEntity};
|
||||
|
||||
@@ -71,23 +71,21 @@ pub async fn find_entities_by_relationship_by_source_ids(
|
||||
db_client: &Surreal<Client>,
|
||||
source_ids: &[String],
|
||||
) -> Result<Vec<KnowledgeEntity>, ProcessingError> {
|
||||
// Create a comma-separated list of IDs wrapped in backticks
|
||||
let ids = source_ids
|
||||
.iter()
|
||||
// .map(|id| format!("`{}`", id))
|
||||
.map(|id| format!("knowledge_entity:`{}`", id))
|
||||
.collect::<Vec<_>>()
|
||||
.join(", ");
|
||||
|
||||
info!("{:?}", ids);
|
||||
|
||||
// let first = format!("knowledge_entity:`{}`", source_ids.first().unwrap());
|
||||
debug!("{:?}", ids);
|
||||
|
||||
let query = format!(
|
||||
"SELECT *, array::complement(<->relates_to<->knowledge_entity, [id]) AS related FROM [{}] FETCH related",
|
||||
"SELECT *, <-> relates_to <-> knowledge_entity AS related FROM [{}]",
|
||||
ids
|
||||
);
|
||||
|
||||
info!("{}", query);
|
||||
debug!("{}", query);
|
||||
|
||||
let result: Vec<KnowledgeEntity> = db_client.query(query).await?.take(0)?;
|
||||
|
||||
@@ -95,14 +93,14 @@ pub async fn find_entities_by_relationship_by_source_ids(
|
||||
}
|
||||
pub async fn find_entities_by_relationship_by_id(
|
||||
db_client: &Surreal<Client>,
|
||||
source_id: &str,
|
||||
source_id: String,
|
||||
) -> Result<Vec<KnowledgeEntity>, ProcessingError> {
|
||||
let query = format!(
|
||||
"SELECT *, <-> relates_to <-> knowledge_entity AS related FROM knowledge_entity:`{}`",
|
||||
source_id
|
||||
);
|
||||
|
||||
info!("{}", query);
|
||||
debug!("{}", query);
|
||||
|
||||
let result: Vec<KnowledgeEntity> = db_client.query(query).await?.take(0)?;
|
||||
|
||||
|
||||
@@ -1,2 +1,94 @@
|
||||
pub mod graph;
|
||||
pub mod vector;
|
||||
|
||||
use crate::{
|
||||
error::ProcessingError,
|
||||
retrieval::{
|
||||
graph::{find_entities_by_relationship_by_id, find_entities_by_source_ids},
|
||||
vector::find_items_by_vector_similarity,
|
||||
},
|
||||
storage::types::{knowledge_entity::KnowledgeEntity, text_chunk::TextChunk},
|
||||
};
|
||||
use futures::future::{try_join, try_join_all};
|
||||
use std::collections::HashMap;
|
||||
use surrealdb::{engine::remote::ws::Client, Surreal};
|
||||
use tracing::info;
|
||||
|
||||
/// Performs a comprehensive knowledge entity retrieval using multiple search strategies
|
||||
/// to find the most relevant entities for a given query.
|
||||
///
|
||||
/// # Strategy
|
||||
/// The function employs a three-pronged approach to knowledge retrieval:
|
||||
/// 1. Direct vector similarity search on knowledge entities
|
||||
/// 2. Text chunk similarity search with source entity lookup
|
||||
/// 3. Graph relationship traversal from related entities
|
||||
///
|
||||
/// This combined approach ensures both semantic similarity matches and structurally
|
||||
/// related content are included in the results.
|
||||
///
|
||||
/// # Arguments
|
||||
/// * `db_client` - SurrealDB client for database operations
|
||||
/// * `openai_client` - OpenAI client for vector embeddings generation
|
||||
/// * `query` - The search query string to find relevant knowledge entities
|
||||
///
|
||||
/// # Returns
|
||||
/// * `Result<Vec<KnowledgeEntity>, ProcessingError>` - A deduplicated vector of relevant
|
||||
/// knowledge entities, or an error if the retrieval process fails
|
||||
pub async fn combined_knowledge_entity_retrieval(
|
||||
db_client: &Surreal<Client>,
|
||||
openai_client: &async_openai::Client<async_openai::config::OpenAIConfig>,
|
||||
query: String,
|
||||
) -> Result<Vec<KnowledgeEntity>, ProcessingError> {
|
||||
info!("Received input: {:?}", query);
|
||||
|
||||
let (items_from_knowledge_entity_similarity, closest_chunks) = try_join(
|
||||
find_items_by_vector_similarity(
|
||||
10,
|
||||
query.clone(),
|
||||
db_client,
|
||||
"knowledge_entity".to_string(),
|
||||
openai_client,
|
||||
),
|
||||
find_items_by_vector_similarity(
|
||||
5,
|
||||
query,
|
||||
db_client,
|
||||
"text_chunk".to_string(),
|
||||
openai_client,
|
||||
),
|
||||
)
|
||||
.await?;
|
||||
|
||||
let source_ids = closest_chunks
|
||||
.iter()
|
||||
.map(|chunk: &TextChunk| chunk.source_id.clone())
|
||||
.collect::<Vec<String>>();
|
||||
|
||||
let items_from_text_chunk_similarity: Vec<KnowledgeEntity> =
|
||||
find_entities_by_source_ids(source_ids, "knowledge_entity".to_string(), db_client).await?;
|
||||
|
||||
let items_from_relationships_futures: Vec<_> = items_from_text_chunk_similarity
|
||||
.clone()
|
||||
.into_iter()
|
||||
.map(|entity| find_entities_by_relationship_by_id(db_client, entity.id.clone()))
|
||||
.collect();
|
||||
|
||||
let items_from_relationships = try_join_all(items_from_relationships_futures)
|
||||
.await?
|
||||
.into_iter()
|
||||
.flatten()
|
||||
.collect::<Vec<KnowledgeEntity>>();
|
||||
|
||||
let entities: Vec<KnowledgeEntity> = items_from_knowledge_entity_similarity
|
||||
.into_iter()
|
||||
.chain(items_from_text_chunk_similarity.into_iter())
|
||||
.chain(items_from_relationships.into_iter())
|
||||
.fold(HashMap::new(), |mut map, entity| {
|
||||
map.insert(entity.id.clone(), entity);
|
||||
map
|
||||
})
|
||||
.into_values()
|
||||
.collect();
|
||||
|
||||
Ok(entities)
|
||||
}
|
||||
|
||||
@@ -1,21 +1,13 @@
|
||||
use crate::{
|
||||
error::ApiError,
|
||||
retrieval::{
|
||||
graph::{
|
||||
find_entities_by_relationship_by_id, find_entities_by_relationship_by_source_ids,
|
||||
find_entities_by_source_ids,
|
||||
},
|
||||
vector::find_items_by_vector_similarity,
|
||||
},
|
||||
storage::{
|
||||
db::SurrealDbClient,
|
||||
types::{knowledge_entity::KnowledgeEntity, text_chunk::TextChunk},
|
||||
},
|
||||
error::ApiError, retrieval::combined_knowledge_entity_retrieval, storage::db::SurrealDbClient,
|
||||
};
|
||||
use async_openai::types::{
|
||||
ChatCompletionRequestSystemMessage, ChatCompletionRequestUserMessage,
|
||||
CreateChatCompletionRequestArgs,
|
||||
};
|
||||
use axum::{response::IntoResponse, Extension, Json};
|
||||
use serde::Deserialize;
|
||||
use serde_json::json;
|
||||
use std::collections::HashMap;
|
||||
use std::sync::Arc;
|
||||
use tracing::info;
|
||||
|
||||
@@ -31,49 +23,9 @@ pub async fn query_handler(
|
||||
info!("Received input: {:?}", query);
|
||||
let openai_client = async_openai::Client::new();
|
||||
|
||||
let test = find_entities_by_relationship_by_id(&db_client, &query.query).await?;
|
||||
info!("{:?}", test);
|
||||
|
||||
let items_from_knowledge_entity_similarity: Vec<KnowledgeEntity> =
|
||||
find_items_by_vector_similarity(
|
||||
10,
|
||||
query.query.to_string(),
|
||||
&db_client,
|
||||
"knowledge_entity".to_string(),
|
||||
&openai_client,
|
||||
)
|
||||
.await?;
|
||||
|
||||
let closest_chunks: Vec<TextChunk> = find_items_by_vector_similarity(
|
||||
5,
|
||||
query.query,
|
||||
&db_client,
|
||||
"text_chunk".to_string(),
|
||||
&openai_client,
|
||||
)
|
||||
.await?;
|
||||
|
||||
let source_ids = closest_chunks
|
||||
.iter()
|
||||
.map(|chunk| chunk.source_id.clone())
|
||||
.collect::<Vec<String>>();
|
||||
|
||||
let items_from_text_chunk_similarity: Vec<KnowledgeEntity> = find_entities_by_source_ids(
|
||||
source_ids.clone(),
|
||||
"knowledge_entity".to_string(),
|
||||
&db_client,
|
||||
)
|
||||
.await?;
|
||||
|
||||
let entities: Vec<KnowledgeEntity> = items_from_knowledge_entity_similarity
|
||||
.into_iter()
|
||||
.chain(items_from_text_chunk_similarity.into_iter())
|
||||
.fold(HashMap::new(), |mut map, entity| {
|
||||
map.insert(entity.id.clone(), entity);
|
||||
map
|
||||
})
|
||||
.into_values()
|
||||
.collect();
|
||||
let entities =
|
||||
combined_knowledge_entity_retrieval(&db_client, &openai_client, query.query.clone())
|
||||
.await?;
|
||||
|
||||
let entities_json = json!(entities
|
||||
.iter()
|
||||
@@ -88,12 +40,68 @@ pub async fn query_handler(
|
||||
})
|
||||
.collect::<Vec<_>>());
|
||||
|
||||
let graph_retrieval =
|
||||
find_entities_by_relationship_by_source_ids(&db_client, &source_ids).await?;
|
||||
let system_message = r#"
|
||||
You are a knowledgeable assistant with access to a specialized knowledge base. You will be provided with relevant knowledge entities from the database as context. Each knowledge entity contains a name, description, and type, representing different concepts, ideas, and information.
|
||||
|
||||
info!("{:?}", graph_retrieval);
|
||||
Your task is to:
|
||||
1. Carefully analyze the provided knowledge entities in the context
|
||||
2. Answer user questions based on this information
|
||||
3. Provide clear, concise, and accurate responses
|
||||
4. When referencing information, briefly mention which knowledge entity it came from
|
||||
5. If the provided context doesn't contain enough information to answer the question confidently, clearly state this
|
||||
6. If only partial information is available, explain what you can answer and what information is missing
|
||||
7. Avoid making assumptions or providing information not supported by the context
|
||||
|
||||
// info!("{} Entities\n{:#?}", entities.len(), entities_json);
|
||||
Remember:
|
||||
- Be direct and honest about the limitations of your knowledge
|
||||
- Cite the relevant knowledge entities when providing information
|
||||
- If you need to combine information from multiple entities, explain how they connect
|
||||
- Don't speculate beyond what's provided in the context
|
||||
|
||||
Ok("we got some stuff".to_string())
|
||||
Example response formats:
|
||||
"Based on [Entity Name], [answer...]"
|
||||
"I found relevant information in multiple entries: [explanation...]"
|
||||
"I apologize, but the provided context doesn't contain information about [topic]"
|
||||
"#;
|
||||
|
||||
let user_message = format!(
|
||||
r#"
|
||||
Context Information:
|
||||
==================
|
||||
{}
|
||||
|
||||
User Question:
|
||||
==================
|
||||
{}
|
||||
"#,
|
||||
entities_json, query.query
|
||||
);
|
||||
|
||||
info!("{:?}", user_message);
|
||||
|
||||
let request = CreateChatCompletionRequestArgs::default()
|
||||
.model("gpt-4o-mini")
|
||||
.temperature(0.2)
|
||||
.max_tokens(3048u32)
|
||||
.messages([
|
||||
ChatCompletionRequestSystemMessage::from(system_message).into(),
|
||||
ChatCompletionRequestUserMessage::from(user_message).into(),
|
||||
])
|
||||
.build()?;
|
||||
|
||||
let response = openai_client.chat().create(request).await?;
|
||||
|
||||
let answer = response
|
||||
.choices
|
||||
.first()
|
||||
.and_then(|choice| choice.message.content.as_ref())
|
||||
.ok_or(ApiError::QueryError(
|
||||
"No content found in LLM response".to_string(),
|
||||
))?;
|
||||
|
||||
info!("{:?}", answer);
|
||||
|
||||
// info!("{:#?}", entities_json);
|
||||
|
||||
Ok(answer.clone().into_response())
|
||||
}
|
||||
|
||||
@@ -1,6 +1,6 @@
|
||||
use crate::{error::ProcessingError, stored_object};
|
||||
use surrealdb::{engine::remote::ws::Client, Surreal};
|
||||
use tracing::info;
|
||||
use tracing::debug;
|
||||
use uuid::Uuid;
|
||||
|
||||
stored_object!(KnowledgeRelationship, "knowledge_relationship", {
|
||||
@@ -37,7 +37,7 @@ impl KnowledgeRelationship {
|
||||
|
||||
let result = db_client.query(query).await?;
|
||||
|
||||
info!("{:?}", result);
|
||||
debug!("{:?}", result);
|
||||
|
||||
Ok(())
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user