Pinecone
Browse files
app.py
CHANGED
@@ -9,6 +9,8 @@ import time
|
|
9 |
from cnocr import CnOcr
|
10 |
import pinecone
|
11 |
|
|
|
|
|
12 |
|
13 |
# from langchain.document_loaders import PyPDFLoader
|
14 |
from langchain.document_loaders import UnstructuredWordDocumentLoader
|
@@ -39,6 +41,24 @@ pinecone.init(api_key="ffb1f594-0915-4ebf-835f-c1eaa62fdcdc",environment = "us-w
|
|
39 |
index = pinecone.Index(index_name="test")
|
40 |
|
41 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
42 |
def get_emb(text):
|
43 |
emb_url = 'https://Raghav001-API.hf.space/embeddings'
|
44 |
data = {"content": text}
|
@@ -251,7 +271,7 @@ with gr.Blocks() as demo:
|
|
251 |
chat_bu = gr.Button(value='Clear', visible=False)
|
252 |
|
253 |
file.change(up_file, [file], [txt, doc_bu, md]) #hiding the text
|
254 |
-
doc_bu.click(doc_emb, [txt], [doc_text_state, doc_emb_state, msg_txt, chat_bu, md, chat_bot])
|
255 |
msg_txt.submit(get_response, [msg_txt, chat_bot,doc_text_state, doc_emb_state], [chat_bot],queue=False)
|
256 |
chat_bu.click(lambda: None, None, chat_bot, queue=False)
|
257 |
|
|
|
9 |
from cnocr import CnOcr
|
10 |
import pinecone
|
11 |
|
12 |
+
from langchain.vectorstores import Pinecone
|
13 |
+
from langchain.embeddings.openai import OpenAIEmbeddings
|
14 |
|
15 |
# from langchain.document_loaders import PyPDFLoader
|
16 |
from langchain.document_loaders import UnstructuredWordDocumentLoader
|
|
|
41 |
index = pinecone.Index(index_name="test")
|
42 |
|
43 |
|
44 |
+
def pine(data):
    """Chunk *data*, embed the chunks with OpenAI and upload them to Pinecone.

    The documents are split with ``CharacterTextSplitter`` (1000-character
    chunks, no overlap) and the ``page_content`` of every chunk is written to
    the Pinecone index ``"test"`` under namespace ``"a1"``.

    Args:
        data: Passed directly to ``split_documents``; presumably a list of
            LangChain ``Document`` objects (verify against the caller).

    Returns:
        None. The function is called for its side effect of populating the
        Pinecone index.

    Raises:
        RuntimeError: If ``OPENAI_API_KEY`` or ``PINECONE_API_KEY`` is not set
            in the environment.
    """
    import os

    def _require_env(name):
        # Fail early with an actionable message instead of a bare KeyError.
        value = os.environ.get(name)
        if not value:
            raise RuntimeError(
                f"Environment variable {name} must be set before calling pine()"
            )
        return value

    # SECURITY: credentials were previously hard-coded in this function. They
    # are now read from the environment; the keys that were committed should
    # be treated as leaked and rotated.
    openai_api_key = _require_env("OPENAI_API_KEY")
    pinecone_api_key = _require_env("PINECONE_API_KEY")
    # The environment keeps its former value unless explicitly overridden.
    pinecone_environment = os.environ.get(
        "PINECONE_ENVIRONMENT", "us-west4-gcp-free"
    )

    splitter = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0)
    chunks = splitter.split_documents(data)

    # The original assigned an unused "text-embedding-ada-002" local and never
    # passed it on, so the embedding model is left at the library default here
    # as well.
    embeddings = OpenAIEmbeddings(openai_api_key=openai_api_key)

    pinecone.init(api_key=pinecone_api_key, environment=pinecone_environment)

    index_name = "test"
    Pinecone.from_texts(
        [chunk.page_content for chunk in chunks],
        embeddings,
        index_name=index_name,
        namespace="a1",
    )
|
57 |
+
|
58 |
+
|
59 |
+
|
60 |
+
|
61 |
+
|
62 |
def get_emb(text):
|
63 |
emb_url = 'https://Raghav001-API.hf.space/embeddings'
|
64 |
data = {"content": text}
|
|
|
271 |
chat_bu = gr.Button(value='Clear', visible=False)
|
272 |
|
273 |
file.change(up_file, [file], [txt, doc_bu, md]) #hiding the text
|
274 |
+
doc_bu.click([doc_emb,pine], [txt], [doc_text_state, doc_emb_state, msg_txt, chat_bu, md, chat_bot])
|
275 |
msg_txt.submit(get_response, [msg_txt, chat_bot,doc_text_state, doc_emb_state], [chat_bot],queue=False)
|
276 |
chat_bu.click(lambda: None, None, chat_bot, queue=False)
|
277 |
|