JuanKO committed on
Commit
d4ecaa1
·
1 Parent(s): 75916f6

Add application file

Browse files
Files changed (1) hide show
  1. app.py +57 -0
app.py ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!pip install openai langchain -q
2
+
3
+ import os
4
+ import openai
5
+
6
+ openai.api_key = "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"
7
+
8
+ os.environ["OPENAI_API_KEY"] = openai.api_key
9
+
10
+ from IPython.display import display, Markdown
11
+
12
+ def disp_markdown(text: str) -> None:
13
+ display(Markdown(text))
14
+
15
+
16
+ from langchain.chat_models import ChatOpenAI
17
+ from langchain.schema import HumanMessage
18
+
19
+ chat_model = ChatOpenAI(model_name="gpt-3.5-turbo")  # NOTE(review): not referenced again in the visible code
20
+
21
+ #!wget https://huggingface.co/spaces/JuanKO/question_my_doc/resolve/main/thelittleprince.txt
22
+
23
+ with open("thelittleprince.txt") as f:
24
+ thelittleprince = f.read()
25
+
26
+ from langchain.text_splitter import CharacterTextSplitter
27
+
28
+ text_splitter = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0, separator = ".")  # split on "." with chunk_size=1000 and no overlap between chunks
29
+ texts = text_splitter.split_text(thelittleprince)  # chunks of the book text
30
+
31
+ from langchain.embeddings.openai import OpenAIEmbeddings
32
+
33
+ os.environ["OPENAI_API_KEY"] = openai.api_key  # same assignment as earlier in the file, repeated here
34
+
35
+ embeddings = OpenAIEmbeddings()  # constructed with defaults; presumably picks the key up from OPENAI_API_KEY — confirm
36
+
37
+ #!pip install tiktoken -q
38
+ #!pip install chromadb tiktoken -q
39
+
40
+ from langchain.vectorstores import Chroma
41
+
42
+ docsearch = Chroma.from_texts(texts, embeddings, metadatas=[{"source": str(i)} for i in range(len(texts))]).as_retriever() # index the chunks in Chroma, tagging each with its position as "source", and expose the store as a retriever
43
+
44
+
45
+
46
+ from langchain.chains.question_answering import load_qa_chain
47
+ from langchain.llms import OpenAI
48
+
49
+
50
+ query = "Who was the little prince?"
51
+ docs = docsearch.get_relevant_documents(query) # YOUR CODE HERE
52
+ chain =load_qa_chain(OpenAI(temperature=0), chain_type="stuff")
53
+
54
+ # run the chain
55
+ # YOUR CODE HERE
56
+ chain.run(input_documents=docs, question=query)
57
+