{
  "indexing_technique": "high_quality",
  "user_id": "20250526hongxmguochuang",
  "dataset_info": {
    "dataset_name": "双碳政策",
    "dataset_description": "该知识库里面全是关于双碳政策文件的",
    "data_source_type": "notion_import"
  },
  "process_rule": {
    "rules": {
      "pre_processing_rules": [
        {
          "id": "remove_extra_spaces",
          "enabled": true
        },
        {
          "id": "remove_urls_emails",
          "enabled": false
        }
      ],
      "segmentation": {
        "separator": "\n\n,\n,。,!,?,",
        "max_tokens": 500,
        "chunk_overlap": 50
      }
    },
    "mode": "custom"
  },
  "doc_form": "text_model",
  "doc_language": "Chinese",
  "retrieval_model": {
    "search_method": "hybrid_search",
    "reranking_enable": true,
    "reranking_model": {
      "reranking_provider_name": "LOCAL",
      "reranking_model_name": "gte-rerank"
    },
    "top_k": 3,
    "score_threshold_enabled": true,
    "score_threshold": 0.5,
    "reranking_mode": "reranking_model",
    "weights": {
      "weight_type": "customized",
      "vector_setting": {
        "vector_weight": 0.7,
        "embedding_provider_name": "",
        "embedding_model_name": ""
      },
      "keyword_setting": {
        "keyword_weight": 0.3
      }
    }
  },
  "embedding_model": "Qwen3-Embedding-0.6B",
  "embedding_model_provider": "LOCAL"
}
# Send the JSON payload below to the knowledge_database/init endpoint.
# No explicit --request POST: --data-raw already makes curl issue a POST, and a
# forced method would be reused unchanged on every redirect followed via --location.
curl --location 'http://172.29.50.10:2333/zhixin_agent/knowledge_database/init' \
--header 'Content-Type: application/json' \
--data-raw '{
"indexing_technique": "high_quality",
"user_id": "20250526hongxmguochuang",
"dataset_info": {
"dataset_name": "双碳政策",
"dataset_description": "该知识库里面全是关于双碳政策文件的",
"data_source_type": "notion_import"
},
"process_rule": {
"rules": {
"pre_processing_rules": [
{
"id": "remove_extra_spaces",
"enabled": true
},
{
"id": "remove_urls_emails",
"enabled": false
}
],
"segmentation": {
"separator": "\n\n,\n,。,!,?,",
"max_tokens": 500,
"chunk_overlap": 50
}
},
"mode": "custom"
},
"doc_form": "text_model",
"doc_language": "Chinese",
"retrieval_model": {
"search_method": "hybrid_search",
"reranking_enable": true,
"reranking_model": {
"reranking_provider_name": "LOCAL",
"reranking_model_name": "gte-rerank"
},
"top_k": 3,
"score_threshold_enabled": true,
"score_threshold": 0.5,
"reranking_mode": "reranking_model",
"weights": {
"weight_type": "customized",
"vector_setting": {
"vector_weight": 0.7,
"embedding_provider_name": "",
"embedding_model_name": ""
},
"keyword_setting": {
"keyword_weight": 0.3
}
}
},
"embedding_model": "Qwen3-Embedding-0.6B",
"embedding_model_provider": "LOCAL"
}'
{
  "dataset": {
    "id": "044aecc3-04c3-4a2c-a34a-e43ec146a71b",
    "name": "1",
    "description": "该知识库里面全是关于测试数据库的",
    "permission": "only_me",
    "data_source_type": "notion_import",
    "indexing_technique": "high_quality",
    "created_by": "0001",
    "created_at": 1745913443
  },
  "status": 200
}