backend_api.py 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418
  1. from __future__ import annotations
  2. import json
  3. import flask
  4. import os
  5. import logging
  6. import asyncio
  7. import shutil
  8. import random
  9. import datetime
  10. from flask import Flask, Response, request, jsonify, render_template
  11. from typing import Generator
  12. from pathlib import Path
  13. from urllib.parse import quote_plus
  14. from hashlib import sha256
  15. from werkzeug.utils import secure_filename
  16. try:
  17. from flask_limiter import Limiter
  18. from flask_limiter.util import get_remote_address
  19. has_flask_limiter = True
  20. except ImportError:
  21. has_flask_limiter = False
  22. from ...image import is_allowed_extension, to_image
  23. from ...client.service import convert_to_provider
  24. from ...providers.asyncio import to_sync_generator
  25. from ...client.helper import filter_markdown
  26. from ...tools.files import supports_filename, get_streaming, get_bucket_dir, get_buckets
  27. from ...tools.run_tools import iter_run_tools
  28. from ...errors import ProviderNotFoundError
  29. from ...cookies import get_cookies_dir
  30. from ... import ChatCompletion
  31. from ... import models
  32. from .api import Api
  33. logger = logging.getLogger(__name__)
  34. def safe_iter_generator(generator: Generator) -> Generator:
  35. start = next(generator)
  36. def iter_generator():
  37. yield start
  38. yield from generator
  39. return iter_generator()
  40. class Backend_Api(Api):
  41. """
  42. Handles various endpoints in a Flask application for backend operations.
  43. This class provides methods to interact with models, providers, and to handle
  44. various functionalities like conversations, error handling, and version management.
  45. Attributes:
  46. app (Flask): A Flask application instance.
  47. routes (dict): A dictionary mapping API endpoints to their respective handlers.
  48. """
  49. def __init__(self, app: Flask) -> None:
  50. """
  51. Initialize the backend API with the given Flask application.
  52. Args:
  53. app (Flask): Flask application instance to attach routes to.
  54. """
  55. self.app: Flask = app
  56. if has_flask_limiter and app.demo:
  57. limiter = Limiter(
  58. get_remote_address,
  59. app=app,
  60. default_limits=["200 per day", "50 per hour"],
  61. storage_uri="memory://",
  62. auto_check=False,
  63. strategy="moving-window",
  64. )
  65. if has_flask_limiter and app.demo:
  66. @app.route('/', methods=['GET'])
  67. @limiter.exempt
  68. def home():
  69. return render_template('demo.html')
  70. else:
  71. @app.route('/', methods=['GET'])
  72. def home():
  73. return render_template('home.html')
  74. @app.route('/backend-api/v2/models', methods=['GET'])
  75. def jsonify_models(**kwargs):
  76. response = get_demo_models() if app.demo else self.get_models(**kwargs)
  77. if isinstance(response, list):
  78. return jsonify(response)
  79. return response
  80. @app.route('/backend-api/v2/models/<provider>', methods=['GET'])
  81. def jsonify_provider_models(**kwargs):
  82. response = self.get_provider_models(**kwargs)
  83. if isinstance(response, list):
  84. return jsonify(response)
  85. return response
  86. @app.route('/backend-api/v2/providers', methods=['GET'])
  87. def jsonify_providers(**kwargs):
  88. response = self.get_providers(**kwargs)
  89. if isinstance(response, list):
  90. return jsonify(response)
  91. return response
  92. def get_demo_models():
  93. return [{
  94. "name": model.name,
  95. "image": isinstance(model, models.ImageModel),
  96. "vision": isinstance(model, models.VisionModel),
  97. "providers": [
  98. getattr(provider, "parent", provider.__name__)
  99. for provider in providers
  100. ],
  101. "demo": True
  102. }
  103. for model, providers in models.demo_models.values()]
  104. def handle_conversation():
  105. """
  106. Handles conversation requests and streams responses back.
  107. Returns:
  108. Response: A Flask response object for streaming.
  109. """
  110. kwargs = {}
  111. if "files[]" in request.files:
  112. images = []
  113. for file in request.files.getlist('files[]'):
  114. if file.filename != '' and is_allowed_extension(file.filename):
  115. images.append((to_image(file.stream, file.filename.endswith('.svg')), file.filename))
  116. kwargs['images'] = images
  117. if "json" in request.form:
  118. json_data = json.loads(request.form['json'])
  119. else:
  120. json_data = request.json
  121. if app.demo and json_data.get("provider") not in ["Custom", "Feature"]:
  122. model = json_data.get("model")
  123. if model != "default" and model in models.demo_models:
  124. json_data["provider"] = random.choice(models.demo_models[model][1])
  125. else:
  126. json_data["model"] = models.demo_models["default"][0].name
  127. json_data["provider"] = random.choice(models.demo_models["default"][1])
  128. kwargs = self._prepare_conversation_kwargs(json_data, kwargs)
  129. return self.app.response_class(
  130. self._create_response_stream(
  131. kwargs,
  132. json_data.get("conversation_id"),
  133. json_data.get("provider"),
  134. json_data.get("download_images", True),
  135. ),
  136. mimetype='text/event-stream'
  137. )
  138. if has_flask_limiter and app.demo:
  139. @app.route('/backend-api/v2/conversation', methods=['POST'])
  140. @limiter.limit("4 per minute") # 1 request in 15 seconds
  141. def _handle_conversation():
  142. limiter.check()
  143. return handle_conversation()
  144. else:
  145. @app.route('/backend-api/v2/conversation', methods=['POST'])
  146. def _handle_conversation():
  147. return handle_conversation()
  148. @app.route('/backend-api/v2/usage', methods=['POST'])
  149. def add_usage():
  150. cache_dir = Path(get_cookies_dir()) / ".usage"
  151. cache_file = cache_dir / f"{datetime.date.today()}.jsonl"
  152. cache_dir.mkdir(parents=True, exist_ok=True)
  153. with cache_file.open("a" if cache_file.exists() else "w") as f:
  154. f.write(f"{json.dumps(request.json)}\n")
  155. return {}
  156. @app.route('/backend-api/v2/log', methods=['POST'])
  157. def add_log():
  158. cache_dir = Path(get_cookies_dir()) / ".logging"
  159. cache_file = cache_dir / f"{datetime.date.today()}.jsonl"
  160. cache_dir.mkdir(parents=True, exist_ok=True)
  161. data = {"origin": request.headers.get("origin"), **request.json}
  162. with cache_file.open("a" if cache_file.exists() else "w") as f:
  163. f.write(f"{json.dumps(data)}\n")
  164. return {}
  165. @app.route('/backend-api/v2/memory/<user_id>', methods=['POST'])
  166. def add_memory(user_id: str):
  167. api_key = request.headers.get("x_api_key")
  168. json_data = request.json
  169. from mem0 import MemoryClient
  170. client = MemoryClient(api_key=api_key)
  171. client.add(
  172. [{"role": item["role"], "content": item["content"]} for item in json_data.get("items")],
  173. user_id=user_id,
  174. metadata={"conversation_id": json_data.get("id")}
  175. )
  176. return {"count": len(json_data.get("items"))}
  177. @app.route('/backend-api/v2/memory/<user_id>', methods=['GET'])
  178. def read_memory(user_id: str):
  179. api_key = request.headers.get("x_api_key")
  180. from mem0 import MemoryClient
  181. client = MemoryClient(api_key=api_key)
  182. if request.args.get("search"):
  183. return client.search(
  184. request.args.get("search"),
  185. user_id=user_id,
  186. filters=json.loads(request.args.get("filters", "null")),
  187. metadata=json.loads(request.args.get("metadata", "null"))
  188. )
  189. return client.get_all(
  190. user_id=user_id,
  191. page=request.args.get("page", 1),
  192. page_size=request.args.get("page_size", 100),
  193. filters=json.loads(request.args.get("filters", "null")),
  194. )
  195. self.routes = {
  196. '/backend-api/v2/version': {
  197. 'function': self.get_version,
  198. 'methods': ['GET']
  199. },
  200. '/backend-api/v2/synthesize/<provider>': {
  201. 'function': self.handle_synthesize,
  202. 'methods': ['GET']
  203. },
  204. '/images/<path:name>': {
  205. 'function': self.serve_images,
  206. 'methods': ['GET']
  207. }
  208. }
  209. @app.route('/backend-api/v2/create', methods=['GET', 'POST'])
  210. def create():
  211. try:
  212. tool_calls = [{
  213. "function": {
  214. "name": "bucket_tool"
  215. },
  216. "type": "function"
  217. }]
  218. web_search = request.args.get("web_search")
  219. if web_search:
  220. tool_calls.append({
  221. "function": {
  222. "name": "search_tool",
  223. "arguments": {"query": web_search, "instructions": "", "max_words": 1000} if web_search != "true" else {}
  224. },
  225. "type": "function"
  226. })
  227. do_filter_markdown = request.args.get("filter_markdown")
  228. cache_id = request.args.get('cache')
  229. parameters = {
  230. "model": request.args.get("model"),
  231. "messages": [{"role": "user", "content": request.args.get("prompt")}],
  232. "provider": request.args.get("provider", None),
  233. "stream": not do_filter_markdown and not cache_id,
  234. "ignore_stream": not request.args.get("stream"),
  235. "tool_calls": tool_calls,
  236. }
  237. if cache_id:
  238. cache_id = sha256(cache_id.encode() + json.dumps(parameters, sort_keys=True).encode()).hexdigest()
  239. cache_dir = Path(get_cookies_dir()) / ".scrape_cache" / "create"
  240. cache_file = cache_dir / f"{quote_plus(request.args.get('prompt').strip()[:20])}.{cache_id}.txt"
  241. if cache_file.exists():
  242. with cache_file.open("r") as f:
  243. response = f.read()
  244. else:
  245. response = iter_run_tools(ChatCompletion.create, **parameters)
  246. cache_dir.mkdir(parents=True, exist_ok=True)
  247. with cache_file.open("w") as f:
  248. f.write(response)
  249. else:
  250. response = iter_run_tools(ChatCompletion.create, **parameters)
  251. if do_filter_markdown:
  252. return Response(filter_markdown(response, do_filter_markdown), mimetype='text/plain')
  253. def cast_str():
  254. for chunk in response:
  255. if not isinstance(chunk, Exception):
  256. yield str(chunk)
  257. return Response(cast_str(), mimetype='text/plain')
  258. except Exception as e:
  259. logger.exception(e)
  260. return jsonify({"error": {"message": f"{type(e).__name__}: {e}"}}), 500
  261. @app.route('/backend-api/v2/buckets', methods=['GET'])
  262. def list_buckets():
  263. try:
  264. buckets = get_buckets()
  265. if buckets is None:
  266. return jsonify({"error": {"message": "Error accessing bucket directory"}}), 500
  267. sanitized_buckets = [secure_filename(b) for b in buckets]
  268. return jsonify(sanitized_buckets), 200
  269. except Exception as e:
  270. return jsonify({"error": {"message": str(e)}}), 500
  271. @app.route('/backend-api/v2/files/<bucket_id>', methods=['GET', 'DELETE'])
  272. def manage_files(bucket_id: str):
  273. bucket_id = secure_filename(bucket_id)
  274. bucket_dir = get_bucket_dir(bucket_id)
  275. if not os.path.isdir(bucket_dir):
  276. return jsonify({"error": {"message": "Bucket directory not found"}}), 404
  277. if request.method == 'DELETE':
  278. try:
  279. shutil.rmtree(bucket_dir)
  280. return jsonify({"message": "Bucket deleted successfully"}), 200
  281. except OSError as e:
  282. return jsonify({"error": {"message": f"Error deleting bucket: {str(e)}"}}), 500
  283. except Exception as e:
  284. return jsonify({"error": {"message": str(e)}}), 500
  285. delete_files = request.args.get('delete_files', True)
  286. refine_chunks_with_spacy = request.args.get('refine_chunks_with_spacy', False)
  287. event_stream = 'text/event-stream' in request.headers.get('Accept', '')
  288. mimetype = "text/event-stream" if event_stream else "text/plain";
  289. return Response(get_streaming(bucket_dir, delete_files, refine_chunks_with_spacy, event_stream), mimetype=mimetype)
  290. @self.app.route('/backend-api/v2/files/<bucket_id>', methods=['POST'])
  291. def upload_files(bucket_id: str):
  292. bucket_id = secure_filename(bucket_id)
  293. bucket_dir = get_bucket_dir(bucket_id)
  294. os.makedirs(bucket_dir, exist_ok=True)
  295. filenames = []
  296. for file in request.files.getlist('files[]'):
  297. try:
  298. filename = secure_filename(file.filename)
  299. if supports_filename(filename):
  300. with open(os.path.join(bucket_dir, filename), 'wb') as f:
  301. shutil.copyfileobj(file.stream, f)
  302. filenames.append(filename)
  303. finally:
  304. file.stream.close()
  305. with open(os.path.join(bucket_dir, "files.txt"), 'w') as f:
  306. [f.write(f"{filename}\n") for filename in filenames]
  307. return {"bucket_id": bucket_id, "files": filenames}
  308. @app.route('/backend-api/v2/files/<bucket_id>/<filename>', methods=['PUT'])
  309. def upload_file(bucket_id, filename):
  310. bucket_id = secure_filename(bucket_id)
  311. bucket_dir = get_bucket_dir(bucket_id)
  312. filename = secure_filename(filename)
  313. bucket_path = Path(bucket_dir)
  314. if not supports_filename(filename):
  315. return jsonify({"error": {"message": f"File type not allowed"}}), 400
  316. if not bucket_path.exists():
  317. bucket_path.mkdir(parents=True, exist_ok=True)
  318. try:
  319. file_path = bucket_path / filename
  320. file_data = request.get_data()
  321. if not file_data:
  322. return jsonify({"error": {"message": "No file data received"}}), 400
  323. with file_path.open('wb') as f:
  324. f.write(file_data)
  325. return jsonify({"message": f"File '{filename}' uploaded successfully to bucket '{bucket_id}'"}), 201
  326. except Exception as e:
  327. return jsonify({"error": {"message": f"Error uploading file: {str(e)}"}}), 500
  328. @app.route('/backend-api/v2/upload_cookies', methods=['POST'])
  329. def upload_cookies(self):
  330. file = None
  331. if "file" in request.files:
  332. file = request.files['file']
  333. if file.filename == '':
  334. return 'No selected file', 400
  335. if file and file.filename.endswith(".json") or file.filename.endswith(".har"):
  336. filename = secure_filename(file.filename)
  337. file.save(os.path.join(get_cookies_dir(), filename))
  338. return "File saved", 200
  339. return 'Not supported file', 400
  340. def handle_synthesize(self, provider: str):
  341. try:
  342. provider_handler = convert_to_provider(provider)
  343. except ProviderNotFoundError:
  344. return "Provider not found", 404
  345. if not hasattr(provider_handler, "synthesize"):
  346. return "Provider doesn't support synthesize", 500
  347. response_data = provider_handler.synthesize({**request.args})
  348. if asyncio.iscoroutinefunction(provider_handler.synthesize):
  349. response_data = asyncio.run(response_data)
  350. else:
  351. if hasattr(response_data, "__aiter__"):
  352. response_data = to_sync_generator(response_data)
  353. response_data = safe_iter_generator(response_data)
  354. content_type = getattr(provider_handler, "synthesize_content_type", "application/octet-stream")
  355. response = flask.Response(response_data, content_type=content_type)
  356. response.headers['Cache-Control'] = "max-age=604800"
  357. return response
  358. def get_provider_models(self, provider: str):
  359. api_key = request.headers.get("x_api_key")
  360. api_base = request.headers.get("x_api_base")
  361. models = super().get_provider_models(provider, api_key, api_base)
  362. if models is None:
  363. return "Provider not found", 404
  364. return models
  365. def _format_json(self, response_type: str, content = None, **kwargs) -> str:
  366. """
  367. Formats and returns a JSON response.
  368. Args:
  369. response_type (str): The type of the response.
  370. content: The content to be included in the response.
  371. Returns:
  372. str: A JSON formatted string.
  373. """
  374. return json.dumps(super()._format_json(response_type, content, **kwargs)) + "\n"