use axum::{extract::State, http::StatusCode, response::IntoResponse, Extension, Json}; use axum_typed_multipart::{FieldData, TryFromMultipart, TypedMultipart}; use common::{ error::AppError, storage::types::{ file_info::FileInfo, ingestion_payload::IngestionPayload, ingestion_task::IngestionTask, user::User, }, utils::ingest_limits::{validate_ingest_input, IngestValidationError}, }; use futures::{future::try_join_all, TryFutureExt}; use serde_json::json; use tempfile::NamedTempFile; use tracing::info; use crate::{api_state::ApiState, error::ApiError}; #[derive(Debug, TryFromMultipart)] pub struct IngestParams { pub content: Option, pub context: String, pub category: String, #[form_data(limit = "20000000")] #[form_data(default)] pub files: Vec>, } pub async fn ingest_data( State(state): State, Extension(user): Extension, TypedMultipart(input): TypedMultipart, ) -> Result { let user_id = user.id; let content_bytes = input.content.as_ref().map_or(0, |c| c.len()); let has_content = input.content.as_ref().is_some_and(|c| !c.trim().is_empty()); let context_bytes = input.context.len(); let category_bytes = input.category.len(); let file_count = input.files.len(); match validate_ingest_input( &state.config, input.content.as_deref(), &input.context, &input.category, file_count, ) { Ok(()) => {} Err(IngestValidationError::PayloadTooLarge(message)) => { return Err(ApiError::PayloadTooLarge(message)); } Err(IngestValidationError::BadRequest(message)) => { return Err(ApiError::ValidationError(message)); } } info!( user_id = %user_id, has_content, content_bytes, context_bytes, category_bytes, file_count, "Received ingest request" ); let file_infos = try_join_all(input.files.into_iter().map(|file| { FileInfo::new_with_storage(file, &state.db, &user_id, &state.storage) .map_err(AppError::from) })) .await?; let payloads = IngestionPayload::create_ingestion_payload( input.content, input.context, input.category, file_infos, &user_id, )?; let futures: Vec<_> = payloads .into_iter() .map(|object| IngestionTask::create_and_add_to_db(object, user_id.clone(), &state.db)) .collect(); try_join_all(futures).await?; Ok((StatusCode::OK, Json(json!({ "status": "success" })))) }