2023-04-26 18:20:18 +00:00
|
|
|
import re
|
|
|
|
from json import loads
|
|
|
|
from uuid import uuid4
|
|
|
|
|
|
|
|
from fake_useragent import UserAgent
|
|
|
|
from tls_client import Session
|
2023-04-09 23:03:55 +00:00
|
|
|
|
|
|
|
|
|
|
|
class Completion:
    """Client for the ``https://you.com/api/streamingSearch`` endpoint.

    The endpoint answers with an event stream made of
    ``event: <name>`` / ``data: <payload>`` pairs. ``create`` performs one
    request and folds the stream into a plain ``dict``.
    """

    # Matches one ``{"youChatToken": "<text>"}`` payload and captures the raw
    # (still JSON-escaped) text. Escape sequences are consumed as a unit so an
    # escaped quote inside the text cannot terminate the capture early.
    __TOKEN_RE = re.compile(r'\{"youChatToken": "((?:[^"\\\n]|\\.)*)"\}')

    @staticmethod
    def create(
        prompt: str,
        page: int = 1,
        count: int = 10,
        safe_search: str = 'Moderate',
        on_shopping_page: bool = False,
        mkt: str = '',
        response_filter: str = 'WebPages,Translations,TimeZone,Computation,RelatedSearches',
        domain: str = 'youchat',
        query_trace_id: str = None,
        chat: list = None,
        include_links: bool = False,
        detailed: bool = False,
        debug: bool = False,
    ) -> dict:
        """Send *prompt* to the streaming search endpoint and collect the reply.

        Args:
            prompt: Sent as the ``q`` query parameter.
            page: Sent as ``page``.
            count: Sent as ``count``.
            safe_search: Sent as ``safeSearch``.
            on_shopping_page: Sent as ``onShoppingPage``.
            mkt: Sent as ``mkt``.
            response_filter: Sent as ``responseFilter``.
            domain: Sent as ``domain``.
            query_trace_id: Sent as ``queryTraceId``; a fresh UUID4 string is
                generated when omitted.
            chat: Earlier conversation turns; defaults to an empty list.
            include_links: When true, ``links`` in the result holds the
                third-party search results found in the stream.
            detailed: When true, ``extra`` in the result holds the decoded
                ``youChatSerpResults`` payload.
            debug: When true, print the raw response body to stdout.

        Returns:
            A dict with the keys ``response`` (the concatenated, unescaped
            ``youChatToken`` texts), ``links`` and ``extra``. ``links`` and
            ``extra`` are ``None`` unless requested. When the body contains no
            ``youChatToken`` at all, the fixed failure dict is returned.

        Raises:
            ValueError: If a requested event payload is not valid JSON
                (``json.JSONDecodeError`` is a ``ValueError`` subclass).
            KeyError: If the third-party results payload lacks the
                ``search`` / ``third_party_search_results`` keys.
        """
        if chat is None:
            chat = []

        client = Session(client_identifier='chrome_108')
        client.headers = Completion.__get_headers()

        response = client.get(
            'https://you.com/api/streamingSearch',
            params={
                'q': prompt,
                'page': page,
                'count': count,
                'safeSearch': safe_search,
                'onShoppingPage': on_shopping_page,
                'mkt': mkt,
                'responseFilter': response_filter,
                'domain': domain,
                'queryTraceId': str(uuid4()) if query_trace_id is None else query_trace_id,
                # NOTE(review): this sends the Python repr of the list; entries
                # presumably look like {'question': ..., 'answer': ...} --
                # confirm against the API before changing the encoding.
                'chat': str(chat),
            },
        )

        body = response.text

        if debug:
            print('\n\n------------------\n\n')
            print(body)
            print('\n\n------------------\n\n')

        if 'youChatToken' not in body:
            return Completion.__get_failure_response()

        # Optional sections are parsed only on request, so a stream that lacks
        # them no longer breaks callers that never asked for them.
        links = None
        if include_links:
            payload = Completion.__extract_event_data('thirdPartySearchResults', body)
            # Event absent from the stream: report "no links" instead of crashing.
            links = [] if payload is None else payload['search']['third_party_search_results']

        extra = None
        if detailed:
            # The value is None when the stream carries no youChatSerpResults event.
            extra = {
                'youChatSerpResults': Completion.__extract_event_data('youChatSerpResults', body),
            }

        return {
            'response': Completion.__read_tokens(body),
            'links': links,
            'extra': extra,
        }

    @staticmethod
    def __extract_event_data(event: str, body: str):
        """Return the decoded JSON payload of the first *event* in *body*.

        The payload is everything between ``event: <event>\\ndata:`` and the
        next ``event: `` marker. Returns ``None`` when no such span exists;
        JSON decoding errors propagate to the caller.
        """
        match = re.search(
            rf'(?<=event: {re.escape(event)}\ndata:)(.*\n)*?(?=event: )', body
        )
        if match is None:
            return None
        return loads(match.group())

    @staticmethod
    def __read_tokens(body: str) -> str:
        """Concatenate and unescape every ``youChatToken`` text in *body*."""
        raw = ''.join(Completion.__TOKEN_RE.findall(body))
        try:
            # The captured pieces are the insides of JSON string literals, so
            # the JSON decoder resolves \n, \", \\ and \uXXXX in one pass.
            return loads(f'"{raw}"')
        except ValueError:
            # Not decodable as a JSON string (e.g. a raw control character):
            # fall back to the minimal historical unescaping.
            return raw.replace('\\n', '\n').replace('\\\\', '\\')

    @classmethod
    def __get_headers(cls) -> dict:
        """Build the request headers, with a fresh guest UUID and a random user agent."""
        return {
            'authority': 'you.com',
            'accept': 'text/event-stream',
            'accept-language': 'en,fr-FR;q=0.9,fr;q=0.8,es-ES;q=0.7,es;q=0.6,en-US;q=0.5,am;q=0.4,de;q=0.3',
            'cache-control': 'no-cache',
            'referer': 'https://you.com/search?q=who+are+you&tbm=youchat',
            'sec-ch-ua': '"Not_A Brand";v="99", "Google Chrome";v="109", "Chromium";v="109"',
            'sec-ch-ua-mobile': '?0',
            'sec-ch-ua-platform': '"Windows"',
            'sec-fetch-dest': 'empty',
            'sec-fetch-mode': 'cors',
            'sec-fetch-site': 'same-origin',
            'cookie': f'safesearch_guest=Moderate; uuid_guest={str(uuid4())}',
            'user-agent': UserAgent().random,
        }

    @classmethod
    def __get_failure_response(cls) -> dict:
        """Return the fixed result used when the body contains no ``youChatToken``."""
        return dict(response='Unable to fetch the response, Please try again.', links=[], extra={})
|