xinli/rag-python/app.py

159 lines
4.4 KiB
Python
Raw Normal View History

2025-12-20 12:08:33 +08:00
# -*- coding: utf-8 -*-
"""
RAG 知识库服务 - Flask API
支持与 jar 包同级目录部署
"""
import os
import sys
from flask import Flask, request, jsonify
from flask_cors import CORS
from config import HOST, PORT, KNOWLEDGE_DIR, BASE_DIR
from knowledge_service import knowledge_service
from file_watcher import FileWatcher
app = Flask(__name__)
CORS(app) # 允许跨域请求
# 文件监控器
file_watcher = None
@app.route('/api/health', methods=['GET'])
def health_check():
"""健康检查"""
return jsonify({
'status': 'ok',
'service': 'RAG Knowledge Service',
'knowledge_dir': KNOWLEDGE_DIR,
'base_dir': BASE_DIR
})
@app.route('/api/documents', methods=['GET'])
def list_documents():
"""列出所有文档"""
try:
documents = knowledge_service.list_documents()
return jsonify({
'success': True,
'data': documents
})
except Exception as e:
return jsonify({'success': False, 'error': str(e)}), 500
@app.route('/api/documents/upload', methods=['POST'])
def upload_document():
"""上传文档"""
try:
if 'file' not in request.files:
return jsonify({'success': False, 'error': '没有上传文件'}), 400
file = request.files['file']
if file.filename == '':
return jsonify({'success': False, 'error': '文件名为空'}), 400
result = knowledge_service.upload_and_index(file)
if result['success']:
return jsonify({
'success': True,
'data': result
})
else:
return jsonify({'success': False, 'error': result.get('error')}), 400
except Exception as e:
return jsonify({'success': False, 'error': str(e)}), 500
@app.route('/api/documents/<filename>', methods=['DELETE'])
def delete_document(filename):
"""删除文档"""
try:
result = knowledge_service.delete_document(filename)
return jsonify({
'success': result['success'],
'data': result
})
except Exception as e:
return jsonify({'success': False, 'error': str(e)}), 500
@app.route('/api/search', methods=['POST'])
def search():
"""搜索文档"""
try:
data = request.get_json()
query = data.get('query', '')
top_k = data.get('top_k', 5)
if not query:
return jsonify({'success': False, 'error': '查询内容不能为空'}), 400
results = knowledge_service.search(query, top_k)
return jsonify({
'success': True,
'data': results
})
except Exception as e:
return jsonify({'success': False, 'error': str(e)}), 500
@app.route('/api/stats', methods=['GET'])
def get_stats():
"""获取统计信息"""
try:
stats = knowledge_service.get_stats()
return jsonify({
'success': True,
'data': stats
})
except Exception as e:
return jsonify({'success': False, 'error': str(e)}), 500
@app.route('/api/rebuild', methods=['POST'])
def rebuild_index():
"""重建索引"""
try:
result = knowledge_service.rebuild_index()
return jsonify({
'success': True,
'data': result
})
except Exception as e:
return jsonify({'success': False, 'error': str(e)}), 500
@app.route('/api/scan', methods=['POST'])
def scan_folder():
"""扫描文件夹并索引新文件"""
try:
result = knowledge_service.scan_and_index_folder()
return jsonify({
'success': True,
'data': result
})
except Exception as e:
return jsonify({'success': False, 'error': str(e)}), 500
def init_service():
"""初始化服务"""
print("=" * 50)
print("RAG 知识库服务启动中...")
print("=" * 50)
# 初始化知识库服务
knowledge_service.init()
# 扫描并索引新文件
knowledge_service.scan_and_index_folder()
# 启动文件监控
global file_watcher
file_watcher = FileWatcher(knowledge_service)
file_watcher.start()
print("=" * 50)
print(f"服务已启动: http://{HOST}:{PORT}")
print(f"知识库文件夹: {KNOWLEDGE_DIR}")
print("=" * 50)
if __name__ == '__main__':
init_service()
app.run(host=HOST, port=PORT, debug=False, threaded=True)