Copilot.py 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272
  1. from __future__ import annotations
  2. import os
  3. import json
  4. import asyncio
  5. import base64
  6. from urllib.parse import quote
  7. try:
  8. from curl_cffi.requests import Session
  9. from curl_cffi import CurlWsFlag
  10. has_curl_cffi = True
  11. except ImportError:
  12. has_curl_cffi = False
  13. try:
  14. import nodriver
  15. has_nodriver = True
  16. except ImportError:
  17. has_nodriver = False
  18. from .base_provider import AbstractProvider, ProviderModelMixin
  19. from .helper import format_prompt_max_length
  20. from .openai.har_file import get_headers, get_har_files
  21. from ..typing import CreateResult, Messages, MediaListType
  22. from ..errors import MissingRequirementsError, NoValidHarFileError, MissingAuthError
  23. from ..requests.raise_for_status import raise_for_status
  24. from ..providers.response import BaseConversation, JsonConversation, RequestLogin, ImageResponse, FinishReason, SuggestedFollowups
  25. from ..providers.asyncio import get_running_loop
  26. from ..tools.media import merge_media
  27. from ..requests import get_nodriver
  28. from ..image import to_bytes, is_accepted_format
  29. from .helper import get_last_user_message
  30. from .. import debug
  31. class Conversation(JsonConversation):
  32. conversation_id: str
  33. def __init__(self, conversation_id: str):
  34. self.conversation_id = conversation_id
  35. class Copilot(AbstractProvider, ProviderModelMixin):
  36. label = "Microsoft Copilot"
  37. url = "https://copilot.microsoft.com"
  38. working = True
  39. supports_stream = True
  40. default_model = "Copilot"
  41. models = [default_model, "Think Deeper"]
  42. model_aliases = {
  43. "gpt-4": default_model,
  44. "gpt-4o": default_model,
  45. "o1": "Think Deeper",
  46. "reasoning": "Think Deeper",
  47. "dall-e-3": default_model
  48. }
  49. websocket_url = "wss://copilot.microsoft.com/c/api/chat?api-version=2"
  50. conversation_url = f"{url}/c/api/conversations"
  51. _access_token: str = None
  52. _cookies: dict = None
  53. @classmethod
  54. def create_completion(
  55. cls,
  56. model: str,
  57. messages: Messages,
  58. stream: bool = False,
  59. proxy: str = None,
  60. timeout: int = 900,
  61. prompt: str = None,
  62. media: MediaListType = None,
  63. conversation: BaseConversation = None,
  64. return_conversation: bool = False,
  65. api_key: str = None,
  66. **kwargs
  67. ) -> CreateResult:
  68. if not has_curl_cffi:
  69. raise MissingRequirementsError('Install or update "curl_cffi" package | pip install -U curl_cffi')
  70. model = cls.get_model(model)
  71. websocket_url = cls.websocket_url
  72. headers = None
  73. if cls._access_token:
  74. if api_key is not None:
  75. cls._access_token = api_key
  76. if cls._access_token is None:
  77. try:
  78. cls._access_token, cls._cookies = readHAR(cls.url)
  79. except NoValidHarFileError as h:
  80. debug.log(f"Copilot: {h}")
  81. if has_nodriver:
  82. yield RequestLogin(cls.label, os.environ.get("G4F_LOGIN_URL", ""))
  83. get_running_loop(check_nested=True)
  84. cls._access_token, cls._cookies = asyncio.run(get_access_token_and_cookies(cls.url, proxy))
  85. else:
  86. raise h
  87. websocket_url = f"{websocket_url}&accessToken={quote(cls._access_token)}"
  88. headers = {"authorization": f"Bearer {cls._access_token}"}
  89. with Session(
  90. timeout=timeout,
  91. proxy=proxy,
  92. impersonate="chrome",
  93. headers=headers,
  94. cookies=cls._cookies,
  95. ) as session:
  96. if cls._access_token is not None:
  97. cls._cookies = session.cookies.jar if hasattr(session.cookies, "jar") else session.cookies
  98. # if cls._access_token is None:
  99. # try:
  100. # url = "https://copilot.microsoft.com/cl/eus-sc/collect"
  101. # headers = {
  102. # "Accept": "application/x-clarity-gzip",
  103. # "referrer": "https://copilot.microsoft.com/onboarding"
  104. # }
  105. # response = session.post(url, headers=headers, data=get_clarity())
  106. # clarity_token = json.loads(response.text.split(" ", maxsplit=1)[-1])[0]["value"]
  107. # debug.log(f"Copilot: Clarity Token: ...{clarity_token[-12:]}")
  108. # except Exception as e:
  109. # debug.log(f"Copilot: {e}")
  110. # else:
  111. # clarity_token = None
  112. response = session.get("https://copilot.microsoft.com/c/api/user")
  113. if response.status_code == 401:
  114. raise MissingAuthError("Status 401: Invalid access token")
  115. raise_for_status(response)
  116. user = response.json().get('firstName')
  117. if user is None:
  118. cls._access_token = None
  119. debug.log(f"Copilot: User: {user or 'null'}")
  120. if conversation is None:
  121. response = session.post(cls.conversation_url)
  122. raise_for_status(response)
  123. conversation_id = response.json().get("id")
  124. conversation = Conversation(conversation_id)
  125. if return_conversation:
  126. yield conversation
  127. if prompt is None:
  128. prompt = format_prompt_max_length(messages, 10000)
  129. debug.log(f"Copilot: Created conversation: {conversation_id}")
  130. else:
  131. conversation_id = conversation.conversation_id
  132. if prompt is None:
  133. prompt = get_last_user_message(messages)
  134. debug.log(f"Copilot: Use conversation: {conversation_id}")
  135. uploaded_images = []
  136. media, _ = [(None, None), *merge_media(media, messages)].pop()
  137. if media:
  138. if not isinstance(media, str):
  139. data = to_bytes(media)
  140. response = session.post(
  141. "https://copilot.microsoft.com/c/api/attachments",
  142. headers={"content-type": is_accepted_format(data)},
  143. data=data
  144. )
  145. raise_for_status(response)
  146. media = response.json().get("url")
  147. uploaded_images.append({"type":"image", "url": media})
  148. wss = session.ws_connect(cls.websocket_url)
  149. # if clarity_token is not None:
  150. # wss.send(json.dumps({
  151. # "event": "challengeResponse",
  152. # "token": clarity_token,
  153. # "method":"clarity"
  154. # }).encode(), CurlWsFlag.TEXT)
  155. wss.send(json.dumps({"event":"setOptions","supportedCards":["weather","local","image","sports","video","ads","finance"],"ads":{"supportedTypes":["multimedia","product","tourActivity","propertyPromotion","text"]}}));
  156. wss.send(json.dumps({
  157. "event": "send",
  158. "conversationId": conversation_id,
  159. "content": [*uploaded_images, {
  160. "type": "text",
  161. "text": prompt,
  162. }],
  163. "mode": "reasoning" if "Think" in model else "chat",
  164. }).encode(), CurlWsFlag.TEXT)
  165. is_started = False
  166. msg = None
  167. image_prompt: str = None
  168. last_msg = None
  169. try:
  170. while True:
  171. try:
  172. msg = wss.recv()[0]
  173. msg = json.loads(msg)
  174. except:
  175. break
  176. last_msg = msg
  177. if msg.get("event") == "appendText":
  178. is_started = True
  179. yield msg.get("text")
  180. elif msg.get("event") == "generatingImage":
  181. image_prompt = msg.get("prompt")
  182. elif msg.get("event") == "imageGenerated":
  183. yield ImageResponse(msg.get("url"), image_prompt, {"preview": msg.get("thumbnailUrl")})
  184. elif msg.get("event") == "done":
  185. yield FinishReason("stop")
  186. break
  187. elif msg.get("event") == "suggestedFollowups":
  188. yield SuggestedFollowups(msg.get("suggestions"))
  189. break
  190. elif msg.get("event") == "replaceText":
  191. yield msg.get("text")
  192. elif msg.get("event") == "error":
  193. raise RuntimeError(f"Error: {msg}")
  194. elif msg.get("event") not in ["received", "startMessage", "citation", "partCompleted"]:
  195. debug.log(f"Copilot Message: {msg}")
  196. if not is_started:
  197. raise RuntimeError(f"Invalid response: {last_msg}")
  198. finally:
  199. wss.close()
  200. async def get_access_token_and_cookies(url: str, proxy: str = None, target: str = "ChatAI",):
  201. browser, stop_browser = await get_nodriver(proxy=proxy, user_data_dir="copilot")
  202. try:
  203. page = await browser.get(url)
  204. access_token = None
  205. while access_token is None:
  206. access_token = await page.evaluate("""
  207. (() => {
  208. for (var i = 0; i < localStorage.length; i++) {
  209. try {
  210. item = JSON.parse(localStorage.getItem(localStorage.key(i)));
  211. if (item.credentialType == "AccessToken"
  212. && item.expiresOn > Math.floor(Date.now() / 1000)
  213. && item.target.includes("target")) {
  214. return item.secret;
  215. }
  216. } catch(e) {}
  217. }
  218. })()
  219. """.replace('"target"', json.dumps(target)))
  220. if access_token is None:
  221. await asyncio.sleep(1)
  222. cookies = {}
  223. for c in await page.send(nodriver.cdp.network.get_cookies([url])):
  224. cookies[c.name] = c.value
  225. await page.close()
  226. return access_token, cookies
  227. finally:
  228. stop_browser()
  229. def readHAR(url: str):
  230. api_key = None
  231. cookies = None
  232. for path in get_har_files():
  233. with open(path, 'rb') as file:
  234. try:
  235. harFile = json.loads(file.read())
  236. except json.JSONDecodeError:
  237. # Error: not a HAR file!
  238. continue
  239. for v in harFile['log']['entries']:
  240. if v['request']['url'].startswith(url):
  241. v_headers = get_headers(v)
  242. if "authorization" in v_headers:
  243. api_key = v_headers["authorization"].split(maxsplit=1).pop()
  244. if v['request']['cookies']:
  245. cookies = {c['name']: c['value'] for c in v['request']['cookies']}
  246. if api_key is None:
  247. raise NoValidHarFileError("No access token found in .har files")
  248. return api_key, cookies
  249. def get_clarity() -> bytes:
  250. #{"e":["0.7.58",5,7284,4779,"n59ae4ieqq","aln5en","1upufhz",1,0,0],"a":[[7323,12,65,217,324],[7344,12,65,214,329],[7385,12,65,211,334],[7407,12,65,210,337],[7428,12,65,209,338],[7461,12,65,209,339],[7497,12,65,209,339],[7531,12,65,208,340],[7545,12,65,208,342],[11654,13,65,208,342],[11728,14,65,208,342],[11728,9,65,208,342,17535,19455,0,0,0,"Annehmen",null,"52w7wqv1r.8ovjfyrpu",1],[7284,4,1,393,968,393,968,0,0,231,310,939,0],[12063,0,2,147,3,4,4,18,5,1,10,79,25,15],[12063,36,6,[11938,0]]]}
  251. body = base64.b64decode("H4sIAAAAAAAAA23RwU7DMAwG4HfJ2aqS2E5ibjxH1cMOnQYqYZvUTQPx7vyJRGGAemj01XWcP+9udg+j80MetDhSyrEISc5GrqrtZnmaTydHbrdUnSsWYT2u+8Obo0Ce/IQvaDBmjkwhUlKKIRNHmQgosqEArWPRDQMx90rxeUMPzB1j+UJvwNIxhTvsPcXyX1T+rizE4juK3mEEhpAUg/JvzW1/+U/tB1LATmhqotoiweMea50PLy2vui4LOY3XfD1dwnkor5fn/e18XBFgm6fHjSzZmCyV7d3aRByAEYextaTHEH3i5pgKGVP/s+DScE5PuLKIpW6FnCi1gY3Rbpqmj0/DI/+L7QEAAA==")
  252. return body