Spaces:
Running
Running
add topic, qa answer
Browse files- app.py +96 -83
- prompts/__pycache__/__init__.cpython-38.pyc +0 -0
- prompts/chat_combine_prompt.txt +2 -2
app.py
CHANGED
@@ -14,9 +14,10 @@ from langchain.prompts.chat import (
|
|
14 |
)
|
15 |
|
16 |
# Streaming endpoint
|
17 |
-
API_URL = "https://api.openai.com/v1/chat/completions"
|
18 |
cohere_key = '5IRbILAbjTI0VcqTsktBfKsr13Lych9iBAFbLpkj'
|
19 |
-
faiss_store = './indexer'
|
|
|
20 |
|
21 |
def gen_conversation(conversations):
|
22 |
messages = []
|
@@ -32,22 +33,28 @@ def gen_conversation(conversations):
|
|
32 |
return messages
|
33 |
|
34 |
|
35 |
-
def predict(inputs, top_p, temperature, openai_api_key, enable_index, max_tokens, model,
|
36 |
chat_counter, chatbot=[], history=[]):
|
37 |
model = model[0]
|
|
|
38 |
headers = {
|
39 |
"Content-Type": "application/json",
|
40 |
"Authorization": f"Bearer {openai_api_key}"
|
41 |
}
|
42 |
|
43 |
print(f"chat_counter - {chat_counter}")
|
44 |
-
#
|
|
|
|
|
|
|
|
|
45 |
if enable_index:
|
46 |
# Faiss 检索最近的embedding
|
47 |
-
|
48 |
-
|
|
|
49 |
else:
|
50 |
-
docsearch = FAISS.load_local(
|
51 |
# 构建模板
|
52 |
llm = ChatOpenAI(openai_api_key=openai_api_key, max_tokens=max_tokens)
|
53 |
messages_combine = [
|
@@ -67,66 +74,62 @@ def predict(inputs, top_p, temperature, openai_api_key, enable_index, max_tokens
|
|
67 |
)
|
68 |
result = chain({"query": inputs})
|
69 |
print(result)
|
70 |
-
|
71 |
-
|
72 |
-
|
73 |
-
|
|
|
|
|
74 |
else:
|
75 |
-
|
76 |
-
|
77 |
-
|
78 |
-
|
79 |
-
|
80 |
-
|
81 |
-
messages
|
82 |
-
|
83 |
-
|
84 |
-
|
85 |
-
|
86 |
-
|
87 |
-
|
88 |
-
|
89 |
-
|
90 |
-
|
91 |
-
|
92 |
-
"
|
93 |
-
|
94 |
-
|
95 |
-
|
96 |
-
|
97 |
-
|
98 |
-
|
99 |
-
|
100 |
-
|
101 |
-
|
102 |
-
|
103 |
-
|
104 |
-
|
105 |
-
|
106 |
-
|
107 |
-
|
108 |
-
# 逐字返回
|
109 |
-
counter = 0
|
110 |
-
for chunk in response.iter_lines():
|
111 |
-
if counter == 0:
|
112 |
counter += 1
|
113 |
-
|
114 |
-
|
115 |
-
|
116 |
-
|
117 |
-
|
118 |
-
|
119 |
-
|
120 |
-
|
121 |
-
|
122 |
-
|
123 |
-
|
124 |
-
|
125 |
-
|
126 |
-
|
127 |
-
|
128 |
-
|
129 |
-
yield chat, history, chat_counter
|
130 |
|
131 |
|
132 |
def reset_textbox():
|
@@ -138,30 +141,40 @@ with gr.Blocks(css="""#col_container {width: 1000px; margin-left: auto; margin-r
|
|
138 |
gr.HTML("""<h1 align="center">🚀Finance ChatBot🚀</h1>""")
|
139 |
with gr.Column(elem_id="col_container"):
|
140 |
openai_api_key = gr.Textbox(type='password', label="输入OPEN API Key")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
141 |
chatbot = gr.Chatbot(elem_id='chatbot')
|
142 |
inputs = gr.Textbox(placeholder="您有什么问题可以问我", label="输入数字经济,两会,硅谷银行相关的提问")
|
143 |
state = gr.State([])
|
144 |
|
145 |
-
|
146 |
-
|
|
|
147 |
|
148 |
-
|
149 |
-
|
150 |
-
|
151 |
-
label="Top-p (nucleus sampling)", )
|
152 |
-
max_tokens = gr.Slider(minimum=512, maximum=3000, value=3000, step=100, interactive=True,
|
153 |
-
label="Max Tokens", )
|
154 |
-
temperature = gr.Slider(minimum=-0, maximum=5.0, value=1.0, step=0.1, interactive=True,
|
155 |
-
label="Temperature", )
|
156 |
-
model = gr.CheckboxGroup(["cohere", "openai", "mpnet"])
|
157 |
-
chat_counter = gr.Number(value=0, precision=0)
|
158 |
-
enable_index = gr.Checkbox(label='是', info='是否使用研报等金融数据')
|
159 |
-
# 后续考虑加入搜索结果
|
160 |
-
enable_search = gr.Checkbox(label='是', info='是否使用搜索结果')
|
161 |
-
|
162 |
-
inputs.submit(predict, [inputs, top_p, temperature, openai_api_key, enable_index, max_tokens, model, chat_counter, chatbot, state],
|
163 |
[chatbot, state, chat_counter], )
|
164 |
-
run.click(predict,
|
|
|
|
|
165 |
[chatbot, state, chat_counter], )
|
166 |
|
167 |
# 每次对话结束都重置对话
|
|
|
14 |
)
|
15 |
|
16 |
# Streaming endpoint
|
17 |
+
API_URL = "https://api.openai.com/v1/chat/completions"
|
18 |
cohere_key = '5IRbILAbjTI0VcqTsktBfKsr13Lych9iBAFbLpkj'
|
19 |
+
faiss_store = './indexer/{}'
|
20 |
+
|
21 |
|
22 |
def gen_conversation(conversations):
|
23 |
messages = []
|
|
|
33 |
return messages
|
34 |
|
35 |
|
36 |
+
def predict(inputs, top_p, temperature, openai_api_key, enable_index, max_tokens, model, topic,
|
37 |
chat_counter, chatbot=[], history=[]):
|
38 |
model = model[0]
|
39 |
+
topic = topic[0]
|
40 |
headers = {
|
41 |
"Content-Type": "application/json",
|
42 |
"Authorization": f"Bearer {openai_api_key}"
|
43 |
}
|
44 |
|
45 |
print(f"chat_counter - {chat_counter}")
|
46 |
+
print(f'Histroy - {history}') # History: Original Input and Output in flatten list
|
47 |
+
print(f'chatbot - {chatbot}') # Chat Bot: 上一轮回复的[[user, AI]]
|
48 |
+
|
49 |
+
history.append(inputs)
|
50 |
+
# Debugging
|
51 |
if enable_index:
|
52 |
# Faiss 检索最近的embedding
|
53 |
+
store = faiss_store.format(topic)
|
54 |
+
if model == 'openai':
|
55 |
+
docsearch = FAISS.load_local(store, OpenAIEmbeddings(openai_api_key=openai_api_key))
|
56 |
else:
|
57 |
+
docsearch = FAISS.load_local(store, CohereEmbeddings(cohere_api_key=cohere_key))
|
58 |
# 构建模板
|
59 |
llm = ChatOpenAI(openai_api_key=openai_api_key, max_tokens=max_tokens)
|
60 |
messages_combine = [
|
|
|
74 |
)
|
75 |
result = chain({"query": inputs})
|
76 |
print(result)
|
77 |
+
result = result['result']
|
78 |
+
# 生成返回值
|
79 |
+
history.append(result)
|
80 |
+
chat = [(history[i], history[i + 1]) for i in range(0, len(history) - 1, 2)]
|
81 |
+
chat_counter += 1
|
82 |
+
yield chat, history, chat_counter
|
83 |
else:
|
84 |
+
if chat_counter == 0:
|
85 |
+
messages = [{"role": "user", "content": f"{inputs}"}]
|
86 |
+
else:
|
87 |
+
# 如果有历史对话,把对话拼接进入上下文
|
88 |
+
messages = gen_conversation(chatbot)
|
89 |
+
messages.append({'role': 'user', 'content': inputs})
|
90 |
+
# messages
|
91 |
+
payload = {
|
92 |
+
"model": "gpt-3.5-turbo",
|
93 |
+
"messages": messages, # [{"role": "user", "content": f"{inputs}"}],
|
94 |
+
"temperature": temperature, # 1.0,
|
95 |
+
"top_p": top_p, # 1.0,
|
96 |
+
"n": 1,
|
97 |
+
"stream": True,
|
98 |
+
"presence_penalty": 0,
|
99 |
+
"frequency_penalty": 0,
|
100 |
+
}
|
101 |
+
print(f"payload is - {payload}")
|
102 |
+
|
103 |
+
chat_counter += 1
|
104 |
+
|
105 |
+
# 请求OpenAI
|
106 |
+
response = requests.post(API_URL, headers=headers, json=payload, stream=True)
|
107 |
+
token_counter = 0
|
108 |
+
partial_words = ""
|
109 |
+
|
110 |
+
# 逐字返回
|
111 |
+
counter = 0
|
112 |
+
for chunk in response.iter_lines():
|
113 |
+
if counter == 0:
|
114 |
+
counter += 1
|
115 |
+
continue
|
|
|
|
|
|
|
|
|
|
|
116 |
counter += 1
|
117 |
+
# check whether each line is non-empty
|
118 |
+
if chunk:
|
119 |
+
# decode each line as response data is in bytes
|
120 |
+
delta = json.loads(chunk.decode()[6:])['choices'][0]["delta"]
|
121 |
+
if len(delta) == 0:
|
122 |
+
break
|
123 |
+
partial_words += delta["content"]
|
124 |
+
# Keep Updating history
|
125 |
+
if token_counter == 0:
|
126 |
+
history.append(" " + partial_words)
|
127 |
+
else:
|
128 |
+
history[-1] = partial_words
|
129 |
+
chat = [(history[i], history[i + 1]) for i in
|
130 |
+
range(0, len(history) - 1, 2)] # convert to tuples of list
|
131 |
+
token_counter += 1
|
132 |
+
yield chat, history, chat_counter
|
|
|
133 |
|
134 |
|
135 |
def reset_textbox():
|
|
|
141 |
gr.HTML("""<h1 align="center">🚀Finance ChatBot🚀</h1>""")
|
142 |
with gr.Column(elem_id="col_container"):
|
143 |
openai_api_key = gr.Textbox(type='password', label="输入OPEN API Key")
|
144 |
+
|
145 |
+
# inputs, top_p, temperature, top_k, repetition_penalty
|
146 |
+
with gr.Accordion("Parameters", open=True):
|
147 |
+
with gr.Row():
|
148 |
+
top_p = gr.Slider(minimum=-0, maximum=1.0, value=0.9, step=0.05, interactive=True,
|
149 |
+
label="Top-p (nucleus sampling)", )
|
150 |
+
|
151 |
+
temperature = gr.Slider(minimum=-0, maximum=5.0, value=0.8, step=0.1, interactive=True,
|
152 |
+
label="Temperature", )
|
153 |
+
with gr.Row():
|
154 |
+
model = gr.CheckboxGroup(["cohere", "openai", "mpnet"])
|
155 |
+
max_tokens = gr.Slider(minimum=100, maximum=2000, value=200, step=100, interactive=True,
|
156 |
+
label="Max Tokens", )
|
157 |
+
chat_counter = gr.Number(value=0, precision=0, label='对话轮数')
|
158 |
+
with gr.Row():
|
159 |
+
enable_index = gr.Checkbox(label='是', info='开启基于文档问答模式/关闭为聊天模式')
|
160 |
+
enable_search = gr.Checkbox(label='是', info='是否使用搜索结果')
|
161 |
+
topic = gr.CheckboxGroup(["两会", "数字经济", "硅谷银行"])
|
162 |
+
|
163 |
chatbot = gr.Chatbot(elem_id='chatbot')
|
164 |
inputs = gr.Textbox(placeholder="您有什么问题可以问我", label="输入数字经济,两会,硅谷银行相关的提问")
|
165 |
state = gr.State([])
|
166 |
|
167 |
+
with gr.Row():
|
168 |
+
clear = gr.Button("Clear Conversation")
|
169 |
+
run = gr.Button("Run")
|
170 |
|
171 |
+
inputs.submit(predict,
|
172 |
+
[inputs, top_p, temperature, openai_api_key, enable_index, max_tokens, model, topic, chat_counter, chatbot,
|
173 |
+
state],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
174 |
[chatbot, state, chat_counter], )
|
175 |
+
run.click(predict,
|
176 |
+
[inputs, top_p, temperature, openai_api_key, enable_index, max_tokens, model, topic, chat_counter, chatbot,
|
177 |
+
state],
|
178 |
[chatbot, state, chat_counter], )
|
179 |
|
180 |
# 每次对话结束都重置对话
|
prompts/__pycache__/__init__.cpython-38.pyc
ADDED
Binary file (545 Bytes). View file
|
|
prompts/chat_combine_prompt.txt
CHANGED
@@ -1,4 +1,4 @@
|
|
1 |
-
You are a DocsGPT, friendly and helpful AI assistant by
|
2 |
-
Use the following pieces of context to help answer the users question.
|
3 |
----------------
|
4 |
{summaries}
|
|
|
1 |
+
You are a DocsGPT, friendly and helpful AI assistant by TianHong Asset Managementthat provides help with documents and financial news. You give thorough answers with detail number and illustrated examples if possible.
|
2 |
+
Use the following pieces of context to help answer the users question, always answer in chinese.
|
3 |
----------------
|
4 |
{summaries}
|