chat

Sleeping

App Files Files Community

sujitb committed on Apr 1

Commit

c5c24fb

•

1 Parent(s): fa30792

Update app.py

Browse files

Files changed (1) hide show

app.py +63 -7

app.py CHANGED Viewed

@@ -56,7 +56,42 @@ system_instructions_text='''
           If you are unable to answer the question from the text provided, please respond " Sorry. I do not have enough information to answer this"
            Do repeat the question. Do not make a pointed reference to the text provided. Directly answer the question
           '''
 def query_from_pinecone(index,namespace, question_embedding, top_k=3):
     # get embedding from THE SAME embedder as the documents
@@ -142,19 +177,40 @@ if QUESTION:
         score=resp[0]['score']
         title=resp[0]['metadata']['title']
         #+ '\n*************\n'+  resp[1]['metadata']['text'] + '\n*************\n'+ resp[2]['metadata']['text']
         if score>.5:
             client = OpenAI()
-            content="""
-            <text>
-            {}
-            </text>
-            """.format(out)
             response = client.chat.completions.create(
               model="gpt-3.5-turbo",
               messages=[
-                {"role": "system", "content":system_instructions_text },
                 {"role": "user", "content": content},
                 {"role": "user", "content": "Question:"+QUESTION}
               ]

           If you are unable to answer the question from the text provided, please respond " Sorry. I do not have enough information to answer this"
            Do repeat the question. Do not make a pointed reference to the text provided. Directly answer the question
           '''
+json_instructions='''
+          Your task is to extract the answer to a question from a body of text provided to you in a json array.
+          The json will contain two pieces of content in this format:
+          [
+              {"id":1 , "content": " first content"},
+              {"id":2 , "content": " second content"}
+          ]
+          You need to check which content is most appropriate to answer the question and prepare
+          an answer based on the content
+          For example,
+          [
+          { "id":1 , "content" : "General Preparation Tips for Verbal Section:\n
+          You need to develop an incessant habit of speed reading.
+          Start with reading newspapers, editorials, fiction and nonfiction novels and simple passages.
+          The more you read, the faster you read. Learn the basic grammar concepts like parts of speech, articles,verbs, adjectives, tenses, auxiliary verbs, modifiers, modals etc.
+          Revise at least 50 new words every day"},
+          { "id":2 , "content" : "General Preparation Tips for Quantitative Section:\n
+          You need to develop an speed in solving math problems.
+          Start with reading funda books,  math text books.
+          Learn the basic  concepts like arithmetic, geometry, numbers, probability,  etc.
+          Solve at least 50 new problems every day"}
+          ]
+          Question: What are some tips for preparing for Verbal exam?
+          Here are some tips for preparing for the VARC section:
+          1. develop an incessant habit of speed reading
+          2. Start reading newspapers, editorials, fiction and nonfiction novels
+          3. Learn basic grammar concepts\n
+          4. Revise at least 50 new words a day
+          Your response should be based on the information contained in the provided content in the json and should not included any other sources.
+          If you are unable to answer the question from the content provided, please respond " Sorry. I do not have enough information to answer this"
+           Do repeat the question. Do not make a pointed reference to the content provided. Directly answer the question
+          '''
 def query_from_pinecone(index,namespace, question_embedding, top_k=3):
     # get embedding from THE SAME embedder as the documents
         score=resp[0]['score']
         title=resp[0]['metadata']['title']
         #+ '\n*************\n'+  resp[1]['metadata']['text'] + '\n*************\n'+ resp[2]['metadata']['text']
+        d={}
+        d['id']=1
+        d['content']=resp[0]['metadata']['data']
+        if len(resp)>1:
+            d['id']=2
+            d['content']=resp[1]['metadata']['data']
+        # convert to array
+        json_array = [{'id': key, 'content': value} for key, value in d.items()]
+        json_data = json.dumps(json_array)
         if score>.5:
+            mode = "two"  # two passages
             client = OpenAI()
+            if mode=="one":
+                instr=system_instructions_text
+                content="""
+                <text>
+                {}
+                </text>
+                """.format(out)
+            if mode=="two":
+                instr=json_instructions
+                content=json_data
             response = client.chat.completions.create(
               model="gpt-3.5-turbo",
               messages=[
+                {"role": "system", "content":instr },
                 {"role": "user", "content": content},
                 {"role": "user", "content": "Question:"+QUESTION}
               ]