-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathbingchat_async_v2.py
142 lines (102 loc) · 4.01 KB
/
bingchat_async_v2.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
import os
import sys
import asyncio
from queue import Queue
from threading import Thread
from playwright.sync_api import sync_playwright
from playwright.async_api import async_playwright
import requests
from bs4 import BeautifulSoup
import openai
from dotenv import load_dotenv
from multiple import compose_metric
import tiktoken
sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
import openai_api
# Load settings from a .env file into the environment
# (presumably including the OpenAI API key -- confirm against openai_api).
load_dotenv()

# Model identifiers that can be passed to the OpenAI wrapper.
chatgpt = "gpt-3.5-turbo"
gpt4 = 'gpt-4'

# NOTE: this rebinds the name ``openai_api`` from the imported module to a
# client instance; after this line the module itself is no longer reachable
# under that name. The rest of this file calls ``openai_api.chatgpt(...)`` on
# the instance.
openai_api = openai_api.OpenAI_API(model=gpt4)  # client configured for gpt-4
# Set up the OpenAI API key
def clean_webtext(rawtext):
    """Return ``rawtext`` with every newline character removed.

    Lines are glued together directly; no separator is inserted where a
    newline used to be.
    """
    return "".join(rawtext.split("\n"))
def get_webpage_text(page, link):
    """Navigate ``page`` to ``link`` and return the text content of that URL.

    The browser page is only navigated; the returned text comes from a
    separate ``requests`` download of the same URL, parsed with BeautifulSoup.

    Args:
        page: Object exposing ``goto(url, timeout=...)`` (a Playwright page
            in this file).
        link: URL to visit and download.

    Returns:
        The text inside the document's ``<body>``. When the response has no
        ``<body>`` element, the text of the whole parsed document is returned
        instead of failing.
    """
    # timeout=0 disables Playwright's navigation timeout.
    page.goto(link, timeout=0)

    # NOTE(review): verify=False disables TLS certificate verification and no
    # request timeout is set, so a stalled server blocks this call forever.
    # Both are kept as-is to preserve existing behavior; revisit deliberately.
    response = requests.get(link, verify=False)
    soup = BeautifulSoup(response.text, 'html.parser')

    # html.parser does not synthesize a <body>; non-HTML or fragmentary
    # responses leave soup.body as None, which previously raised
    # AttributeError on .get_text().
    container = soup.body if soup.body is not None else soup
    return container.get_text()
async def playwright_init():
    """Start async Playwright and open a Chromium browser, context and page.

    Previously the created objects were discarded, which left the browser
    running with no way for the caller to use or close it.

    Returns:
        A tuple ``(playwright, browser, context, page)``. The caller owns
        these handles and is responsible for closing the browser and stopping
        Playwright when done.

    Raises:
        Whatever Playwright raises while launching; Playwright is stopped
        before the error propagates so the driver process is not leaked.
    """
    playwright = await async_playwright().start()
    try:
        browser = await playwright.chromium.launch()
        context = await browser.new_context()
        page = await context.new_page()
    except Exception:
        # Do not leave the Playwright driver running if setup fails midway.
        await playwright.stop()
        raise
    return playwright, browser, context, page
def get_bingchat_result(query, k=2):
    """Search Google for ``query`` and return the text of the top result pages.

    Despite the name, this drives a Google search in a visible (non-headless)
    Chromium window, collects the first link of each ``.g`` result element,
    and downloads each linked page.

    Args:
        query: Search terms. They are URL-encoded before being placed in the
            query string, so spaces and non-ASCII text are safe.
        k: Maximum number of result pages to retrieve (default 2, the value
            that was previously hard-coded).

    Returns:
        A list of at most ``k`` strings, one per result page, with newlines
        removed by ``clean_webtext``.
    """
    from urllib.parse import quote_plus

    with sync_playwright() as p:
        browser = p.chromium.launch(headless=False)
        try:
            page = browser.new_page()
            google_query_url = f"https://www.google.com/search?q={quote_plus(query)}"
            page.goto(google_query_url)
            print(f"went to {google_query_url}")
            # timeout=0 waits indefinitely for the first result element.
            page.wait_for_selector('.g', timeout=0)
            # Result elements without a usable <a href> are skipped; the
            # previous script dereferenced a null anchor for them.
            links = page.eval_on_selector_all('.g', '''(results, k) => {
                return Array.from(results)
                    .map(result => result.querySelector('a'))
                    .filter(anchor => anchor && anchor.href)
                    .slice(0, k)
                    .map(anchor => ({
                        title: anchor.textContent,
                        href: anchor.href
                    }));
            }''', k)
            return [
                clean_webtext(get_webpage_text(page, link['href']))
                for link in links
            ]
        finally:
            # Close the browser even when navigation or a download fails.
            browser.close()
def main():
    """Prompt for company names and print a stock-impact prediction for each.

    For every company returned by ``compose_metric(query, 5)`` the pipeline
    retrieves news text, summarizes it with the GPT model, and asks the model
    for a prediction, which is printed. Companies are processed concurrently
    in the default thread-pool executor.

    The previous version used ``await`` inside this non-async function (a
    SyntaxError) and created tasks on an event loop that was never run; the
    coroutine is now driven explicitly with ``asyncio.run``.
    """
    query = input("Enter Company names: ")
    comp_names = compose_metric(query, 5)

    def func(comp):
        """Run the blocking retrieve -> summarize -> predict pipeline for one company."""
        textList = get_bingchat_result(comp + " 뉴스")
        enc = tiktoken.encoding_for_model("gpt-4")
        joined = "\n".join(textList)
        # When everything is under 6000 tokens, summarize it in one request
        # instead of one request per page.
        if len(enc.encode(joined)) < 6000:
            textList = [joined]
        print('asking to GPT model ...')
        summary = get_summary(comp, textList)
        prompt = f"아래는 {comp}에 대한 최신 정보입니다. 정보를 바탕으로 이 기업의 주식에 어떤 영향을 줄지 예측해주세요. \n\nInfo: \n{summary} \n\n 예측:"
        response = openai_api.chatgpt(prompt)
        print(response)

    async def run_all():
        """Fan the blocking per-company jobs out to worker threads and wait for all."""
        loop = asyncio.get_running_loop()
        jobs = [loop.run_in_executor(None, func, comp) for comp in comp_names]
        await asyncio.gather(*jobs)

    asyncio.run(run_all())
def get_summary(comp, text_list) -> str:
    """Summarize ``text_list`` for company ``comp`` and return the joined summaries.

    ``gpt_async`` is run on a fresh event loop in a helper thread, so this
    function can be called from synchronous code regardless of whether the
    calling thread already has an event loop. The call blocks until the
    summaries are ready.

    Args:
        comp: Company name inserted into the summary prompt.
        text_list: Texts to summarize, one model request per element.

    Returns:
        The summaries concatenated into a single string.

    Raises:
        Any exception raised by ``gpt_async``. Previously a failure in the
        helper thread left the queue empty and this call blocked forever.
    """
    queue = Queue()

    def thread_func(queue):
        # asyncio.run creates a new loop for this thread and closes it
        # afterwards, so the loop is no longer leaked.
        try:
            result = asyncio.run(gpt_async(comp, text_list))
        except BaseException as exc:
            # Hand every failure to the waiting caller; swallowing it here
            # would leave queue.get() blocked indefinitely.
            queue.put((False, exc))
        else:
            queue.put((True, result))

    Thread(target=thread_func, args=(queue,)).start()
    succeeded, payload = queue.get()
    if not succeeded:
        raise payload
    return payload
async def gpt_async(comp, text_list) -> str:
    """Request one summary per element of ``text_list`` and concatenate them.

    Each text is wrapped in the summary prompt for company ``comp`` and sent
    through ``ask_to_gpt`` as its own task; all tasks are awaited together and
    the answers are joined, in input order, with no separator.
    """
    loop = asyncio.get_event_loop()
    pending = [
        loop.create_task(
            ask_to_gpt(
                f"아래는 {comp}에 대한 최신 정보입니다. 정보의 내용에 대해 긍정 부정을 판단하고, 아래의 요약문을 작성해주세요. \n\nInfo: \n{chunk} \n\n 요약문:"
            )
        )
        for chunk in text_list
    ]
    answers = await asyncio.gather(*pending)
    return ''.join(answers)
async def ask_to_gpt(prompt):
    """Send ``prompt`` to ``openai_api.chatgpt`` on the default executor and return its result.

    The call is handed to the event loop's default executor so the loop is
    not blocked while the request is in flight.
    """
    loop = asyncio.get_event_loop()
    return await loop.run_in_executor(None, openai_api.chatgpt, prompt)
# Run the pipeline only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()