You.py 8.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222
  1. from __future__ import annotations
  2. import re
  3. import json
  4. import base64
  5. import uuid
  6. from ..typing import AsyncResult, Messages, ImageType, Cookies
  7. from .base_provider import AsyncGeneratorProvider, ProviderModelMixin
  8. from .helper import format_prompt
  9. from ..image import ImageResponse, ImagePreview, EXTENSIONS_MAP, to_bytes, is_accepted_format
  10. from ..requests import StreamSession, FormData, raise_for_status
  11. from .you.har_file import get_telemetry_ids
  12. from .. import debug
  class You(AsyncGeneratorProvider, ProviderModelMixin):
      """Async streaming provider for You.com chat and image generation.

      Requests go to ``{url}/api/streamingSearch`` and the event-stream
      response is translated into text chunks and image objects. Every chat
      mode other than ``"default"`` is sent with session cookies obtained by
      registering a throw-away account through the Stytch password endpoint.
      """

      label = "You.com"
      url = "https://you.com"
      working = True
      supports_gpt_35_turbo = True
      supports_gpt_4 = True
      default_model = "gpt-4o-mini"
      default_vision_model = "agent"
      image_models = ["dall-e"]
      models = [
          default_model,
          "gpt-4o",
          "gpt-4-turbo",
          "gpt-4",
          "claude-3.5-sonnet",
          "claude-3-opus",
          "claude-3-sonnet",
          "claude-3-haiku",
          "claude-2",
          "llama-3.1-70b",
          "llama-3",
          "gemini-1-5-flash",
          "gemini-1-5-pro",
          "gemini-1-0-pro",
          "databricks-dbrx-instruct",
          "command-r",
          "command-r-plus",
          "dolphin-2.5",
          default_vision_model,
          *image_models
      ]
      # Cookie jar shared by all calls; replaced by get_cookies() once it has
      # been handed out five times.
      _cookies = None
      # How many times the current cookie jar has been handed out.
      _cookies_used = 0
      # Pool of telemetry ids; create_cookies() pops one per new account and
      # refills the pool from get_telemetry_ids() when it is empty.
      _telemetry_ids = []

      @classmethod
      async def create_async_generator(
          cls,
          model: str,
          messages: Messages,
          stream: bool = True,
          image: ImageType = None,
          image_name: str = None,
          proxy: str = None,
          timeout: int = 240,
          chat_mode: str = "default",
          **kwargs,
      ) -> AsyncResult:
          """Stream a You.com answer for ``messages``.

          The chat mode is derived from the arguments:

          * an ``image`` or the vision model -> ``"agent"``
          * no model or the default model -> the caller's ``chat_mode``
          * a model starting with ``"dall-e"`` -> ``"create"``; only the last
            message is sent
          * anything else -> ``"custom"``, with the model resolved through
            ``cls.get_model``

          Args:
              model: Requested model name; may be empty.
              messages: Conversation history, rendered with ``format_prompt``.
              stream: Accepted for interface compatibility; not read here.
              image: Optional image to upload and attach to the request.
              image_name: Optional file name for the uploaded image.
              proxy: Optional proxy passed to ``StreamSession``.
              timeout: Second element of the ``(30, timeout)`` tuple given to
                  ``StreamSession`` (presumably the read timeout - confirm
                  against ``StreamSession``).
              chat_mode: Mode used when none of the overrides above applies.
              **kwargs: Ignored.

          Yields:
              Text chunks (``str``), plus ``ImagePreview`` / ``ImageResponse``
              objects when a markdown image is found in ``"create"`` mode.
          """
          if image is not None or model == cls.default_vision_model:
              chat_mode = "agent"
          elif not model or model == cls.default_model:
              # Keep whatever chat_mode the caller passed in.
              pass
          elif model.startswith("dall-e"):
              chat_mode = "create"
              messages = [messages[-1]]
          else:
              chat_mode = "custom"
              model = cls.get_model(model)

          async with StreamSession(
              proxy=proxy,
              impersonate="chrome",
              timeout=(30, timeout)
          ) as session:
              # Only the default mode is requested without session cookies.
              cookies = await cls.get_cookies(session) if chat_mode != "default" else None
              upload = ""
              if image is not None:
                  upload_file = await cls.upload_file(
                      session, cookies,
                      to_bytes(image), image_name
                  )
                  upload = json.dumps([upload_file])
              headers = {
                  "Accept": "text/event-stream",
                  "Referer": f"{cls.url}/search?fromSearchBar=true&tbm=youchat",
              }
              data = {
                  "userFiles": upload,
                  "q": format_prompt(messages),
                  "domain": "youchat",
                  "selectedChatMode": chat_mode,
                  "conversationTurnId": str(uuid.uuid4()),
                  "chatId": str(uuid.uuid4()),
              }
              params = {
                  "userFiles": upload,
                  "selectedChatMode": chat_mode,
              }
              if chat_mode == "custom":
                  if debug.logging:
                      print(f"You model: {model}")
                  selected_model = model.replace("-", "_")
                  params["selectedAiModel"] = selected_model
                  # Non-default modes send `data` as the query string (see the
                  # request below), so the model has to be present there too;
                  # otherwise the selection never reaches the server.
                  data["selectedAiModel"] = selected_model

              # Default mode: POST with `data` as body and `params` as query.
              # Every other mode: GET with `data` as the query string.
              async with (session.post if chat_mode == "default" else session.get)(
                  f"{cls.url}/api/streamingSearch",
                  data=data if chat_mode == "default" else None,
                  params=params if chat_mode == "default" else data,
                  headers=headers,
                  cookies=cookies
              ) as response:
                  await raise_for_status(response)
                  # Name of the most recent "event: " line. Starts as None so a
                  # "data: " line that arrives first is skipped instead of
                  # raising UnboundLocalError.
                  event = None
                  async for line in response.iter_lines():
                      if line.startswith(b'event: '):
                          event = line[7:].decode()
                      elif line.startswith(b'data: '):
                          if event not in ["youChatUpdate", "youChatToken"]:
                              continue
                          payload = json.loads(line[6:])
                          if event == "youChatToken" and event in payload and payload[event]:
                              yield payload[event]
                          elif event == "youChatUpdate" and "t" in payload and payload["t"]:
                              if chat_mode != "create":
                                  yield payload["t"]
                                  continue
                              # In "create" mode look for a markdown image:
                              # ![alt](url)
                              match = re.search(r"!\[(.+?)\]\((.+?)\)", payload["t"])
                              if not match:
                                  yield payload["t"]
                              elif match.group(1) == "fig":
                                  yield ImagePreview(match.group(2), messages[-1]["content"])
                              else:
                                  yield ImageResponse(match.group(2), match.group(1))

      @classmethod
      async def upload_file(cls, client: StreamSession, cookies: Cookies, file: bytes, filename: str = None) -> dict:
          """Upload ``file`` to You.com and return the upload description.

          A nonce is fetched from ``/api/get_nonce`` and sent back as the
          ``X-Upload-Nonce`` header of the multipart POST to ``/api/upload``.

          Args:
              client: Open session used for both requests.
              cookies: Cookies sent with both requests.
              file: Raw file content.
              filename: Name to upload under; defaults to ``image.<ext>`` with
                  the extension looked up in ``EXTENSIONS_MAP``.

          Returns:
              The JSON body of the upload response, extended with
              ``user_filename`` and ``size`` (byte length of ``file``).
          """
          async with client.get(
              f"{cls.url}/api/get_nonce",
              cookies=cookies,
          ) as response:
              await raise_for_status(response)
              upload_nonce = await response.text()
          data = FormData()
          content_type = is_accepted_format(file)
          filename = f"image.{EXTENSIONS_MAP[content_type]}" if filename is None else filename
          data.add_field('file', file, content_type=content_type, filename=filename)
          async with client.post(
              f"{cls.url}/api/upload",
              data=data,
              headers={
                  "X-Upload-Nonce": upload_nonce,
              },
              cookies=cookies
          ) as response:
              await raise_for_status(response)
              result = await response.json()
          result["user_filename"] = filename
          result["size"] = len(file)
          return result

      @classmethod
      async def get_cookies(cls, client: StreamSession) -> Cookies:
          """Return the cached session cookies, renewing them when needed.

          New cookies are created when none are cached or when the cached ones
          have already been handed out five times.
          """
          if not cls._cookies or cls._cookies_used >= 5:
              cls._cookies = await cls.create_cookies(client)
              cls._cookies_used = 0
          cls._cookies_used += 1
          return cls._cookies

      @classmethod
      def get_sdk(cls) -> str:
          """Return a base64-encoded JSON blob for the ``X-SDK-Client`` header.

          All identifiers in the blob are freshly generated random UUIDs.
          """
          payload = {
              "event_id": f"event-id-{uuid.uuid4()}",
              "app_session_id": f"app-session-id-{uuid.uuid4()}",
              "persistent_id": f"persistent-id-{uuid.uuid4()}",
              "client_sent_at": "",
              "timezone": "",
              "stytch_user_id": f"user-live-{uuid.uuid4()}",
              "stytch_session_id": f"session-live-{uuid.uuid4()}",
              "app": {"identifier": "you.com"},
              "sdk": {"identifier": "Stytch.js Javascript SDK", "version": "3.3.0"},
          }
          return base64.standard_b64encode(json.dumps(payload).encode()).decode()

      @staticmethod
      def get_auth() -> str:
          """Return the HTTP Basic ``Authorization`` value for the Stytch call.

          Declared as a static method so it can be called through the class
          (``cls.get_auth()``) as well as through an instance.
          """
          auth_uuid = "507a52ad-7e69-496b-aee0-1c9863c7c819"
          auth_token = f"public-token-live-{auth_uuid}:public-token-live-{auth_uuid}"
          auth = base64.standard_b64encode(auth_token.encode()).decode()
          return f"Basic {auth}"

      @classmethod
      async def create_cookies(cls, client: StreamSession) -> Cookies:
          """Register a throw-away account and return its session cookies.

          One telemetry id is taken from the class-level pool, which is
          refilled through ``get_telemetry_ids()`` when empty. The account uses
          a random UUID for both the e-mail local part and the password.

          Returns:
              A dict with the session token and session JWT, each stored under
              a plain and a ``ydc_``-prefixed cookie name.
          """
          if not cls._telemetry_ids:
              cls._telemetry_ids = await get_telemetry_ids()
          user_uuid = str(uuid.uuid4())
          telemetry_id = cls._telemetry_ids.pop()
          if debug.logging:
              print(f"Use telemetry_id: {telemetry_id}")
          async with client.post(
              "https://web.stytch.com/sdk/v1/passwords",
              headers={
                  "Authorization": cls.get_auth(),
                  "X-SDK-Client": cls.get_sdk(),
                  "X-SDK-Parent-Host": cls.url,
                  "Origin": "https://you.com",
                  "Referer": "https://you.com/"
              },
              json={
                  "dfp_telemetry_id": telemetry_id,
                  "email": f"{user_uuid}@gmail.com",
                  "password": f"{user_uuid}#{user_uuid}",
                  "session_duration_minutes": 129600
              }
          ) as response:
              await raise_for_status(response)
              session = (await response.json())["data"]
          return {
              "stytch_session": session["session_token"],
              'stytch_session_jwt': session["session_jwt"],
              'ydc_stytch_session': session["session_token"],
              'ydc_stytch_session_jwt': session["session_jwt"],
          }
  211. }