一、Dify配置
1.查看或創建知識庫的API
二、下載程序配置
1. 安裝依賴requirements.txt
######requirements.txt#####
flask==2.3.3
psycopg2-binary==2.9.9
requests==2.31.0
python-dotenv==1.0.0
#####安裝依賴
pip3 install -r requirements.txt -i https://pypi.tuna.tsinghua.edu.cn/simple/
2. 主程序代碼app.py
# app.py
"""Flask front end for listing and downloading files of a Dify knowledge base.

Routes:
    /                                         renders ``index.html``
    /api/datasets                             JSON list of knowledge bases
    /api/files/<dataset_id>                   JSON list of documents in one knowledge base
    /api/download/<dataset_id>/<document_id>  one source file as an attachment
    /api/download-dataset/<dataset_id>        every source file of a knowledge base as a ZIP

All upstream calls go to ``BASE_URL`` and authenticate with ``API_KEY``; both
are imported from ``config``.
"""
import io
import logging
import os
import urllib.parse
import zipfile

import requests
from dotenv import load_dotenv
from flask import Flask, render_template, jsonify, Response

from config import API_KEY, BASE_URL

logger = logging.getLogger(__name__)

# Seconds to wait for the upstream API; without a timeout ``requests`` blocks forever.
REQUEST_TIMEOUT = 30
# Page size used for list endpoints (the original dataset request used limit=20).
PAGE_SIZE = 20
# Upper bound on pages fetched per listing so a misbehaving server cannot loop us forever.
MAX_PAGES = 500

app = Flask(__name__)


def _auth_headers():
    """Return the headers sent with every knowledge-base API request."""
    return {
        'Authorization': f'Bearer {API_KEY}',
        'Content-Type': 'application/json',
    }


def _segment(value):
    """Percent-encode *value* so it is safe as a single URL path segment."""
    return urllib.parse.quote(str(value), safe='')


def _fetch_all_pages(path):
    """Collect the ``data`` items of a paginated list endpoint.

    Args:
        path: API path appended to ``BASE_URL`` (for example ``/v1/datasets``).

    Returns:
        ``(items, 200)`` on success, or ``(None, status)`` on failure, where
        ``status`` is the upstream status code, or 502 when the upstream could
        not be reached or did not answer with JSON.
    """
    items = []
    for page in range(1, MAX_PAGES + 1):
        try:
            response = requests.get(
                f'{BASE_URL}{path}',
                headers=_auth_headers(),
                params={'page': page, 'limit': PAGE_SIZE},
                timeout=REQUEST_TIMEOUT,
            )
        except requests.RequestException:
            logger.exception('Request to %s failed', path)
            return None, 502
        if response.status_code != 200:
            return None, response.status_code
        try:
            payload = response.json()
        except ValueError:
            logger.exception('Non-JSON response from %s', path)
            return None, 502
        if not isinstance(payload, dict):
            return None, 502
        items.extend(payload.get('data') or [])
        # NOTE(review): relies on the list response carrying a ``has_more``
        # flag; when the flag is absent only the first page is read, which is
        # what the code did before pagination was added.
        if not payload.get('has_more'):
            break
    return items, 200


def _document_name(item):
    """Pick a display/file name for one document entry.

    Prefers the uploaded file's name, then the document's own ``name`` field
    (if the API supplies one), and finally the document id.
    """
    # ``or {}`` guards against keys that are present but null.
    detail = item.get('data_source_detail_dict') or {}
    upload = detail.get('upload_file') or {}
    return upload.get('name') or item.get('name') or item['id']


def _list_files(dataset_id):
    """Return ``(files, 200)`` or ``(None, status)`` for one knowledge base.

    Each entry of ``files`` is ``{'id': ..., 'name': ...}``.
    """
    items, status = _fetch_all_pages(
        f'/v1/datasets/{_segment(dataset_id)}/documents'
    )
    if items is None:
        return None, status
    files = [{'id': item['id'], 'name': _document_name(item)} for item in items]
    return files, 200


def _fetch_upload_file(dataset_id, document_id):
    """Download the original uploaded file behind a document.

    Returns:
        ``(name, content)`` where ``name`` may be ``None`` if the API did not
        report one, or ``None`` when any step of the download failed.
    """
    headers = _auth_headers()
    meta_url = (
        f'{BASE_URL}/v1/datasets/{_segment(dataset_id)}'
        f'/documents/{_segment(document_id)}/upload-file'
    )
    try:
        # Step 1: ask the API where the file can be downloaded from.
        meta_response = requests.get(
            meta_url, headers=headers, timeout=REQUEST_TIMEOUT
        )
        if meta_response.status_code != 200:
            return None
        meta = meta_response.json()
        if not isinstance(meta, dict):
            return None
        download_url = meta.get('download_url')
        if not download_url:
            return None

        download_url = str(download_url)
        if download_url.startswith(('http://', 'https://')):
            # Already absolute: prepending BASE_URL would produce a broken URL.
            full_url = download_url
            same_host = (
                urllib.parse.urlsplit(full_url).netloc
                == urllib.parse.urlsplit(BASE_URL).netloc
            )
            # Do not hand the API key to a different host.
            file_headers = headers if same_host else None
        else:
            full_url = f'{BASE_URL}{download_url}'
            file_headers = headers

        # Step 2: fetch the file bytes.
        file_response = requests.get(
            full_url, headers=file_headers, timeout=REQUEST_TIMEOUT
        )
    except (requests.RequestException, ValueError):
        logger.exception(
            'Download of document %s in dataset %s failed',
            document_id, dataset_id,
        )
        return None
    if file_response.status_code != 200:
        return None
    return meta.get('name'), file_response.content


def _attachment_header(filename):
    """Build a ``Content-Disposition`` value, adding the file name when known."""
    if not filename:
        return 'attachment'
    # RFC 5987 form keeps the header ASCII-only even for non-ASCII file names.
    return "attachment; filename*=UTF-8''" + urllib.parse.quote(
        str(filename), safe=''
    )


def _unique_archive_name(name, used):
    """Return an archive member name that is flat and not yet in *used*.

    Path separators are replaced so an entry cannot escape the extraction
    directory, and a numeric suffix is added when two documents share a name.
    The chosen name is recorded in *used*.
    """
    safe = str(name).replace('/', '_').replace('\\', '_') or 'unnamed'
    stem, ext = os.path.splitext(safe)
    candidate = safe
    counter = 1
    while candidate in used:
        candidate = f'{stem}_{counter}{ext}'
        counter += 1
    used.add(candidate)
    return candidate


@app.route('/')
def index():
    """Serve the single-page UI."""
    return render_template('index.html')


@app.route('/api/datasets')
def get_datasets():
    """Return ``[{'id', 'name'}, ...]`` for every knowledge base."""
    items, status = _fetch_all_pages('/v1/datasets')
    if items is None:
        return jsonify({'error': '獲取知識庫列表失敗'}), status
    datasets = [{'id': item['id'], 'name': item['name']} for item in items]
    return jsonify(datasets)


@app.route('/api/files/<dataset_id>')
def get_files(dataset_id):
    """Return ``[{'id', 'name'}, ...]`` for every document of *dataset_id*."""
    files, status = _list_files(dataset_id)
    if files is None:
        return jsonify({'error': '獲取文件列表失敗'}), status
    return jsonify(files)


def download_single_file(dataset_id, document_id):
    """Return the raw bytes of a document's uploaded file, or ``None`` on failure."""
    fetched = _fetch_upload_file(dataset_id, document_id)
    return None if fetched is None else fetched[1]


@app.route('/api/download/<dataset_id>/<document_id>')
def download_file(dataset_id, document_id):
    """Send one uploaded file to the browser as an attachment."""
    fetched = _fetch_upload_file(dataset_id, document_id)
    # ``is None`` rather than truthiness: an empty file is still a valid download.
    if fetched is None:
        return jsonify({'error': '文件下載失敗'}), 400
    name, content = fetched
    return Response(
        content,
        mimetype='application/octet-stream',
        headers={'Content-Disposition': _attachment_header(name)},
    )


@app.route('/api/download-dataset/<dataset_id>')
def download_dataset(dataset_id):
    """Bundle every downloadable file of *dataset_id* into an in-memory ZIP.

    Files that cannot be downloaded are skipped (and logged) so one broken
    document does not abort the whole archive.
    """
    files, status = _list_files(dataset_id)
    if files is None:
        return jsonify({'error': '獲取文件列表失敗'}), status

    memory_file = io.BytesIO()
    used_names = set()
    with zipfile.ZipFile(memory_file, 'w') as zf:
        for file in files:
            content = download_single_file(dataset_id, file['id'])
            if content is None:
                logger.warning(
                    'Skipping document %s: download failed', file['id']
                )
                continue
            zf.writestr(_unique_archive_name(file['name'], used_names), content)

    return Response(
        memory_file.getvalue(),
        mimetype='application/zip',
        headers={
            'Content-Disposition':
                f'attachment;filename=dataset_{_segment(dataset_id)}.zip'
        },
    )


if __name__ == '__main__':
    # The interactive debugger allows arbitrary code execution, so it is
    # opt-in: start with FLASK_DEBUG=1 to enable it.
    app.run(debug=os.environ.get('FLASK_DEBUG') == '1')
3. 配置知識庫的Base_URL和API_key
在config.py中配置dify知識庫和數據庫鑒權信息,如下:
# Knowledge base API configuration.
# Both values can be overridden with the DIFY_API_KEY / DIFY_BASE_URL
# environment variables so a real key does not have to live in this file;
# the literals below are used only when the variables are unset.
# NOTE(review): the default key looks like a real credential - confirm it is a
# placeholder, or rotate it.
import os

API_KEY = os.environ.get('DIFY_API_KEY', 'dataset-YNXAxOyNucHoyzVUN6MlPJXT')
# Trailing slashes are stripped because URLs are built as f'{BASE_URL}/v1/...'.
BASE_URL = os.environ.get('DIFY_BASE_URL', 'http://10.1.140.33').rstrip('/')
?
三、啟動服務
#python3 app.py
訪問 http://127.0.0.1:5000/ 進行下載文件或整個知識庫