helper.py 3.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105
  1. from __future__ import annotations
  2. import random
  3. import string
  4. from ..typing import Messages, Cookies, AsyncIterator, Iterator
  5. from .. import debug
  6. def format_prompt(messages: Messages, add_special_tokens: bool = False, do_continue: bool = False) -> str:
  7. """
  8. Format a series of messages into a single string, optionally adding special tokens.
  9. Args:
  10. messages (Messages): A list of message dictionaries, each containing 'role' and 'content'.
  11. add_special_tokens (bool): Whether to add special formatting tokens.
  12. Returns:
  13. str: A formatted string containing all messages.
  14. """
  15. if not add_special_tokens and len(messages) <= 1:
  16. return messages[0]["content"]
  17. formatted = "\n".join([
  18. f'{message["role"].capitalize()}: {message["content"]}'
  19. for message in messages
  20. ])
  21. if do_continue:
  22. return formatted
  23. return f"{formatted}\nAssistant:"
  24. def get_last_user_message(messages: Messages) -> str:
  25. user_messages = []
  26. last_message = None if len(messages) == 0 else messages[-1]
  27. while last_message is not None and messages:
  28. last_message = messages.pop()
  29. if last_message["role"] == "user":
  30. if isinstance(last_message["content"], str):
  31. user_messages.append(last_message["content"].strip())
  32. else:
  33. return "\n".join(user_messages[::-1])
  34. return "\n".join(user_messages[::-1])
  35. def format_image_prompt(messages, prompt: str = None) -> str:
  36. if prompt is None:
  37. return get_last_user_message(messages)
  38. return prompt
  39. def format_prompt_max_length(messages: Messages, max_lenght: int) -> str:
  40. prompt = format_prompt(messages)
  41. start = len(prompt)
  42. if start > max_lenght:
  43. if len(messages) > 6:
  44. prompt = format_prompt(messages[:3] + messages[-3:])
  45. if len(prompt) > max_lenght:
  46. if len(messages) > 2:
  47. prompt = format_prompt([m for m in messages if m["role"] == "system"] + messages[-1:])
  48. if len(prompt) > max_lenght:
  49. prompt = messages[-1]["content"]
  50. debug.log(f"Messages trimmed from: {start} to: {len(prompt)}")
  51. return prompt
  52. def get_random_string(length: int = 10) -> str:
  53. """
  54. Generate a random string of specified length, containing lowercase letters and digits.
  55. Args:
  56. length (int, optional): Length of the random string to generate. Defaults to 10.
  57. Returns:
  58. str: A random string of the specified length.
  59. """
  60. return ''.join(
  61. random.choice(string.ascii_lowercase + string.digits)
  62. for _ in range(length)
  63. )
  64. def get_random_hex(length: int = 32) -> str:
  65. """
  66. Generate a random hexadecimal string with n length.
  67. Returns:
  68. str: A random hexadecimal string of n characters.
  69. """
  70. return ''.join(
  71. random.choice("abcdef" + string.digits)
  72. for _ in range(length)
  73. )
  74. def filter_none(**kwargs) -> dict:
  75. return {
  76. key: value
  77. for key, value in kwargs.items()
  78. if value is not None
  79. }
  80. async def async_concat_chunks(chunks: AsyncIterator) -> str:
  81. return concat_chunks([chunk async for chunk in chunks])
  82. def concat_chunks(chunks: Iterator) -> str:
  83. return "".join([
  84. str(chunk) for chunk in chunks
  85. if chunk and not isinstance(chunk, Exception)
  86. ])
  87. def format_cookies(cookies: Cookies) -> str:
  88. return "; ".join([f"{k}={v}" for k, v in cookies.items()])