Raghav001 committed on
Commit
4a36a2e
·
1 Parent(s): 1a036c0
Files changed (1) hide show
  1. app.py +21 -1
app.py CHANGED
@@ -9,6 +9,8 @@ import time
9
  from cnocr import CnOcr
10
  import pinecone
11
 
 
 
12
 
13
  # from langchain.document_loaders import PyPDFLoader
14
  from langchain.document_loaders import UnstructuredWordDocumentLoader
@@ -39,6 +41,24 @@ pinecone.init(api_key="ffb1f594-0915-4ebf-835f-c1eaa62fdcdc",environment = "us-w
39
  index = pinecone.Index(index_name="test")
40
 
41
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
42
  def get_emb(text):
43
  emb_url = 'https://Raghav001-API.hf.space/embeddings'
44
  data = {"content": text}
@@ -251,7 +271,7 @@ with gr.Blocks() as demo:
251
  chat_bu = gr.Button(value='Clear', visible=False)
252
 
253
  file.change(up_file, [file], [txt, doc_bu, md]) #hiding the text
254
- doc_bu.click(doc_emb, [txt], [doc_text_state, doc_emb_state, msg_txt, chat_bu, md, chat_bot])
255
  msg_txt.submit(get_response, [msg_txt, chat_bot,doc_text_state, doc_emb_state], [chat_bot],queue=False)
256
  chat_bu.click(lambda: None, None, chat_bot, queue=False)
257
 
 
9
  from cnocr import CnOcr
10
  import pinecone
11
 
12
+ from langchain.vectorstores import Pinecone
13
+ from langchain.embeddings.openai import OpenAIEmbeddings
14
 
15
  # from langchain.document_loaders import PyPDFLoader
16
  from langchain.document_loaders import UnstructuredWordDocumentLoader
 
41
  index = pinecone.Index(index_name="test")
42
 
43
 
44
def pine(data):
    """Split documents into chunks and store their embeddings in Pinecone.

    The documents are cut into chunks of 1000 characters with no overlap, and
    the text of every chunk is embedded with OpenAI embeddings and written to
    the ``test`` index under the ``a1`` namespace.

    Credentials are read from the environment instead of being hard-coded, so
    that secrets never end up in version control:

    * ``OPENAI_API_KEY`` -- key passed to ``OpenAIEmbeddings``.
    * ``PINECONE_API_KEY`` -- key passed to ``pinecone.init``.
    * ``PINECONE_ENVIRONMENT`` -- optional; falls back to
      ``us-west4-gcp-free``, the value previously hard-coded here.

    Args:
        data: Documents accepted by ``CharacterTextSplitter.split_documents``;
            every resulting chunk must expose a ``page_content`` attribute.

    Returns:
        None. The function is used for its side effect of writing to Pinecone.

    Raises:
        KeyError: If ``OPENAI_API_KEY`` or ``PINECONE_API_KEY`` is not set.
    """
    # Function-scope import keeps this block self-contained; the module's
    # import section is not fully visible from here.
    import os

    splitter = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0)
    chunks = splitter.split_documents(data)
    if not chunks:
        # Nothing to embed: skip the OpenAI and Pinecone round-trips entirely.
        return

    # NOTE(review): the keys that used to be written literally in this
    # function were published with the commit and should be revoked.
    embeddings = OpenAIEmbeddings(openai_api_key=os.environ["OPENAI_API_KEY"])

    pinecone.init(
        api_key=os.environ["PINECONE_API_KEY"],
        environment=os.environ.get("PINECONE_ENVIRONMENT", "us-west4-gcp-free"),
    )

    Pinecone.from_texts(
        [chunk.page_content for chunk in chunks],
        embeddings,
        index_name="test",
        namespace="a1",
    )
57
+
58
+
59
+
60
+
61
+
62
  def get_emb(text):
63
  emb_url = 'https://Raghav001-API.hf.space/embeddings'
64
  data = {"content": text}
 
271
  chat_bu = gr.Button(value='Clear', visible=False)
272
 
273
  file.change(up_file, [file], [txt, doc_bu, md]) #hiding the text
274
+ doc_bu.click([doc_emb,pine], [txt], [doc_text_state, doc_emb_state, msg_txt, chat_bu, md, chat_bot])
275
  msg_txt.submit(get_response, [msg_txt, chat_bot,doc_text_state, doc_emb_state], [chat_bot],queue=False)
276
  chat_bu.click(lambda: None, None, chat_bot, queue=False)
277