Raju Komati
refactored you code added error handling and updated regex for parsing response
f43107a
unverified
import re | |
from json import loads | |
from uuid import uuid4 | |
from fake_useragent import UserAgent | |
from tls_client import Session | |
class Completion: | |
def create( | |
prompt: str, | |
page: int = 1, | |
count: int = 10, | |
safe_search: str = 'Moderate', | |
on_shopping_page: bool = False, | |
mkt: str = '', | |
response_filter: str = 'WebPages,Translations,TimeZone,Computation,RelatedSearches', | |
domain: str = 'youchat', | |
query_trace_id: str = None, | |
chat: list = None, | |
include_links: bool = False, | |
detailed: bool = False, | |
debug: bool = False, | |
) -> dict: | |
if chat is None: | |
chat = [] | |
client = Session(client_identifier='chrome_108') | |
client.headers = Completion.__get_headers() | |
response = client.get( | |
f'https://you.com/api/streamingSearch', | |
params={ | |
'q': prompt, | |
'page': page, | |
'count': count, | |
'safeSearch': safe_search, | |
'onShoppingPage': on_shopping_page, | |
'mkt': mkt, | |
'responseFilter': response_filter, | |
'domain': domain, | |
'queryTraceId': str(uuid4()) if query_trace_id is None else query_trace_id, | |
'chat': str(chat), # {'question':'','answer':' ''} | |
}, | |
) | |
if debug: | |
print('\n\n------------------\n\n') | |
print(response.text) | |
print('\n\n------------------\n\n') | |
if 'youChatToken' not in response.text: | |
return Completion.__get_failure_response() | |
you_chat_serp_results = re.search( | |
r'(?<=event: youChatSerpResults\ndata:)(.*\n)*?(?=event: )', response.text | |
).group() | |
third_party_search_results = re.search( | |
r'(?<=event: thirdPartySearchResults\ndata:)(.*\n)*?(?=event: )', response.text | |
).group() | |
# slots = findall(r"slots\ndata: (.*)\n\nevent", response.text)[0] | |
text = ''.join(re.findall(r'{\"youChatToken\": \"(.*?)\"}', response.text)) | |
extra = { | |
'youChatSerpResults': loads(you_chat_serp_results), | |
# 'slots' : loads(slots) | |
} | |
return { | |
'response': text.replace('\\n', '\n').replace('\\\\', '\\'), | |
'links': loads(third_party_search_results)['search']['third_party_search_results'] | |
if include_links | |
else None, | |
'extra': extra if detailed else None, | |
} | |
def __get_headers(cls) -> dict: | |
return { | |
'authority': 'you.com', | |
'accept': 'text/event-stream', | |
'accept-language': 'en,fr-FR;q=0.9,fr;q=0.8,es-ES;q=0.7,es;q=0.6,en-US;q=0.5,am;q=0.4,de;q=0.3', | |
'cache-control': 'no-cache', | |
'referer': 'https://you.com/search?q=who+are+you&tbm=youchat', | |
'sec-ch-ua': '"Not_A Brand";v="99", "Google Chrome";v="109", "Chromium";v="109"', | |
'sec-ch-ua-mobile': '?0', | |
'sec-ch-ua-platform': '"Windows"', | |
'sec-fetch-dest': 'empty', | |
'sec-fetch-mode': 'cors', | |
'sec-fetch-site': 'same-origin', | |
'cookie': f'safesearch_guest=Moderate; uuid_guest={str(uuid4())}', | |
'user-agent': UserAgent().random, | |
} | |
def __get_failure_response(cls) -> dict: | |
return dict(response='Unable to fetch the response, Please try again.', links=[], extra={}) | |