hari-huynh committed
Commit dfc4889 • Parent(s): fe81246

Update ReAct Agent with Web-search Tool

Files changed:
- prompts/react_prompt_v2.txt +6 -4
- react_agent_v2.py +29 -21
- requirements.txt +1 -1
- tools/tavily_search.py +100 -0
- tools/tavily_search_v2.py +68 -0
prompts/react_prompt_v2.txt
CHANGED
@@ -1,6 +1,6 @@
-
-
-
+You are an assistant who helps users find suitable jobs by answering questions related to recruitment information from companies' job postings.
+You MUST answer briefly but with complete information, in Markdown format.
+You MUST bold phrases related to jobs, skills, companies, etc.

 TOOLS:

@@ -19,7 +19,9 @@ Action Input: the input to the action
 Observation: the result of the action
 ```

-If knowledge graph
+You MUST prioritize searching the Knowledge Graph. If the Knowledge Graph does not have enough information, you MUST search the web.
+You MUST NOT duplicate queries.
+If neither source provides enough information, you must answer "I cannot answer this question."
 When you have a response to say to the Human, or if you do not need to use a tool, you MUST use the format:

 ```
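For context, a minimal sketch of how a template like this gets its tool slots filled before the agent sees it. It assumes the file uses the standard react-chat placeholders ({tools}, {tool_names}, {chat_history}, {input}, {agent_scratchpad}); those placeholder lines are outside the hunks shown above, and the stand-in tool functions below are illustrative, not code from this commit.

# Illustrative only: render the prompt with dummy tools to inspect what the
# agent actually receives. Assumes react-chat style placeholders in the file.
from langchain.agents import Tool
from langchain.tools.render import render_text_description
from langchain_core.prompts import PromptTemplate

def fake_kg(q: str) -> str:       # stand-in for tools.kg_search.lookup_kg
    return "no results"

def fake_web(q: str) -> str:      # stand-in for tools.tavily_search_v2.tavily_qna_search
    return "no results"

tools = [
    Tool(name="Query Knowledge Graph", func=fake_kg,
         description="Search the job knowledge graph."),
    Tool(name="Web Search", func=fake_web,
         description="Useful for when you need to search for external information."),
]

with open("prompts/react_prompt_v2.txt", "r") as file:
    react_template = file.read()

prompt = PromptTemplate.from_template(react_template).partial(
    tools=render_text_description(tools),
    tool_names=", ".join(t.name for t in tools),
)

print(prompt.format(input="Have any company recruit Machine Learning jobs?",
                    chat_history="", agent_scratchpad=""))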
react_agent_v2.py
CHANGED
@@ -1,13 +1,17 @@
 from langchain.agents import Tool, AgentType, initialize_agent
 from langchain.memory import ConversationBufferMemory
+# from langchain.utilities import DuckDuckGoSearchAPIWrapper
 from langchain_google_genai import ChatGoogleGenerativeAI
 from langchain.agents import AgentExecutor
-
+from langchain import hub
 from langchain.agents.format_scratchpad import format_log_to_str
 from langchain.agents.output_parsers import ReActSingleInputOutputParser
 from langchain.tools.render import render_text_description
 import os
 from tools.kg_search import lookup_kg
+from tools.tavily_search import tavily_search
+from tools.tavily_search_v2 import tavily_search, tavily_qna_search
+
 from dotenv import load_dotenv
 from langchain.agents import Tool
 from langchain_core.prompts import PromptTemplate
@@ -19,6 +23,12 @@ llm = ChatGoogleGenerativeAI(
     temperature = 0
 )

+# search = DuckDuckGoSearchAPIWrapper()
+#
+# search_tool = Tool(name="Current Search",
+#                    func=search.run,
+#                    description="Useful when you need to answer questions about detail jobs information or search a job."
+#                    )

 kg_query = Tool(
     name = 'Query Knowledge Graph',
@@ -27,16 +37,14 @@ kg_query = Tool(
 )


-
-
-
-
-
-
-
-# verbose=True)
+web_search = Tool(
+    name = 'Web Search',
+    func = tavily_qna_search,
+    description = "Useful for when you need to search for external information."
+)
+
+tools = [kg_query, web_search]

-# agent_prompt = hub.pull("hwchase17/react-chat")

 with open("prompts/react_prompt_v2.txt", "r") as file:
     react_template = file.read()
@@ -68,6 +76,17 @@ memory = ConversationBufferMemory(memory_key="chat_history")

 agent_executor = AgentExecutor(agent=agent, tools=tools, verbose=True, memory=memory)

+
+def get_react_agent(memory):
+    agent_executor = AgentExecutor(
+        agent=agent,
+        tools=tools,
+        verbose=True,
+        memory=memory
+    )
+
+    return agent_executor
+
 # result = agent_executor.invoke({"input": "Have any company recruit Machine Learning jobs?"})
 # print(result)

@@ -81,17 +100,6 @@ agent_executor = AgentExecutor(agent=agent, tools=tools, verbose=True, memory=me
 # result = agent_executor.invoke(question)
 # print(result)

-def get_react_agent(memory):
-    agent_executor = AgentExecutor(
-        agent = agent,
-        tools = tools,
-        verbose = True,
-        memory = memory
-    )
-
-    return agent_executor
-
-
 if __name__ == "__main__":
     while True:
         try:
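A hypothetical usage sketch for the new get_react_agent helper (not part of the commit); it mirrors the commented-out invoke example in the diff. Note that importing the module also runs the top-level agent construction, and that the tavily_search imported from tools.tavily_search is immediately shadowed by the one from tools.tavily_search_v2.

# Hypothetical caller (not in the commit): build an executor with fresh memory
# and ask the same kind of question the commented-out examples use.
from langchain.memory import ConversationBufferMemory
from react_agent_v2 import get_react_agent

memory = ConversationBufferMemory(memory_key="chat_history")
executor = get_react_agent(memory)

result = executor.invoke({"input": "Have any company recruit Machine Learning jobs?"})
print(result["output"])   # AgentExecutor.invoke returns a dict; "output" holds the final answer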
requirements.txt
CHANGED
@@ -6,4 +6,4 @@ langchain-core
 faiss-cpu
 neo4j
 langchainhub
-
+tavily-python
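tavily-python backs the two new tool modules below; both call load_dotenv() and then read TAVILY_API_KEY and GEMINI_API_KEY. A small, illustrative startup check for those variables (not part of the commit):

# Illustrative only: fail fast if the keys the new Tavily tools expect are
# missing from .env or the Space secrets.
import os
from dotenv import load_dotenv

load_dotenv()
for key in ("TAVILY_API_KEY", "GEMINI_API_KEY"):
    if not os.getenv(key):
        raise RuntimeError(f"{key} is not set; add it to .env or the Space secrets")

Checking up front gives a clearer error than the tool modules themselves, where os.environ["TAVILY_API_KEY"] = os.getenv("TAVILY_API_KEY") raises a TypeError if the variable is missing.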
tools/tavily_search.py
ADDED
@@ -0,0 +1,100 @@
+import os
+from dotenv import load_dotenv
+from langchain_google_genai import ChatGoogleGenerativeAI
+from langchain_community.tools.tavily_search import TavilySearchResults
+from langchain.tools import BaseTool, StructuredTool, tool
+
+load_dotenv()
+
+os.environ["TAVILY_API_KEY"] = os.getenv("TAVILY_API_KEY")
+os.environ["GOOGLE_API_KEY"] = os.getenv("GEMINI_API_KEY")
+
+
+def tavily_search(question: str) -> str:
+    """
+    Useful for when you need to search relevant information such as jobs and companies from Web sites.
+    """
+
+    # setup prompt
+    # prompt = [{
+    #     "role": "system",
+    #     "content": f'You are an AI critical thinker research assistant. ' \
+    #                f'Your sole purpose is to write well written, critically acclaimed,' \
+    #                f'objective and structured reports on given text.'
+    # }, {
+    #     "role": "user",
+    #     "content": f'Information: """{content}"""\n\n' \
+    #                f'Using the above information, answer the following' \
+    #                f'query: "{query}" in a detailed report --' \
+    #                f'Please use MLA format and markdown syntax.'
+    # }]
+
+    tool_search = TavilySearchResults(
+        max_results = 3,
+        include_raw_content = True
+    )
+
+    # prompt_search = f"""You are an expert at finding information about the job,
+    # the company, and the skills required for that job.
+    # Try to find out what is relevant to the company, the job, and the skills required for that job.
+    # If the questions are not relevant, answer them in your own words.
+    #
+    # Query: {question}
+    # """
+
+    # Search for information on Web sites: Indeed, LinkedIn, TopCV by using
+    # entities in the user question (Job Titles, Company, Location, etc.).
+    # Using search pattern: site:indeed
+
+    search_prompt = f"""
+    Respond to the user question by searching job descriptions, including: job titles, company, required skills, education, etc. related to job recruitment posts in Vietnam.
+
+    Query: {question}
+    """
+
+    result = tool_search.invoke({"query": search_prompt})
+
+    # llm_chat = ChatGoogleGenerativeAI(
+    #     model = "gemini-1.5-flash-latest",
+    #     temperature = 0
+    # )
+
+    # content = []
+    # for i in result:
+    #     content.append(i['content'])
+
+    # prompt = f"""
+    #
+    # You are a career consultant, based on the information you have contents: {content},
+    # consider yourself an expert to summarize summary details not too short the content and
+    # highlight the content related to the company's job and the necessary skills and return must 1 URL
+    #
+    # You can add information you know about the question {question}
+    # """
+
+    # response_prompt = f"""
+    # Generate a concise and informative summary of the results in a polite and easy-to-understand manner based on question and Tavily search results.
+    # Returns URLs at the end of the summary for proof.
+    #
+    # Question: {question}
+    # Search Results: {str(result)}
+    #
+    # Answer:
+    # """
+
+    # response = llm_chat.invoke(response_prompt)
+
+    return result
+
+
+if __name__ == "__main__":
+    question = "Recruitment information for the position of Software Engineer?"
+    result = tavily_search(question)
+    print(result)
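A hypothetical post-processing sketch (not in the commit). It assumes, as the LangChain community documentation describes, that TavilySearchResults returns a list of dicts carrying "url" and "content" keys, which is also what the commented-out summarization block above iterates over.

# Illustrative only: print a compact view of what tavily_search() returns.
from tools.tavily_search import tavily_search

results = tavily_search("Recruitment information for the position of Software Engineer?")
for item in results:
    print(item["url"])
    print(" ", item["content"][:120], "...")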
tools/tavily_search_v2.py
ADDED
@@ -0,0 +1,68 @@
+import os
+from dotenv import load_dotenv
+from langchain_google_genai import ChatGoogleGenerativeAI
+from tavily import TavilyClient
+from langchain.tools import BaseTool, StructuredTool, tool
+
+load_dotenv()
+
+os.environ["TAVILY_API_KEY"] = os.getenv("TAVILY_API_KEY")
+os.environ["GOOGLE_API_KEY"] = os.getenv("GEMINI_API_KEY")
+
+def tavily_search(question: str) -> str:
+    """
+    Useful for when you need to search relevant information such as jobs and companies from Web sites.
+    """
+
+    search_prompt = f"""
+    Respond to the user question by searching job descriptions, including: job titles, company, required skills, education, etc. related to job recruitment posts in Vietnam.
+
+    Query: {question}
+    """
+
+    tavily = TavilyClient(
+        api_key = os.environ["TAVILY_API_KEY"],
+    )
+
+    response = tavily.search(
+        query = question,
+        include_raw_content = True,
+        max_results = 5
+    )
+
+    search_results = ""
+    for obj in response["results"]:
+        search_results += f"""
+        - Page content: {obj["raw_content"]}
+          Source: {obj["url"]}

+        """
+
+    print(search_results)
+
+    response_prompt = f"""
+    Generate a concise and informative summary of the results in a polite and easy-to-understand manner based on the question and Tavily search results.
+    Return URLs at the end of the summary for proof.
+
+    Question: {question}
+    Search Results:
+    {search_results}
+
+    Answer:
+    """
+
+    # return context
+
+def tavily_qna_search(question: str) -> str:
+    tavily = TavilyClient(
+        api_key=os.environ["TAVILY_API_KEY"],
+    )
+
+    response = tavily.qna_search(query=question)
+    return response
+
+if __name__ == "__main__":
+    question = "Software Engineer job postings in Vietnam"
+
+    result = tavily_search(question)
+    print(result)
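As written, tavily_search above assembles response_prompt but never returns anything (the return is commented out), so the __main__ block prints None; only tavily_qna_search is wired into the agent. A hypothetical completion (an assumption, not committed code), reusing the Gemini model name and temperature from the commented-out block in tools/tavily_search.py:

# Hypothetical helper (not in the commit): summarize the collected
# search_results with the Gemini chat model already imported above.
from langchain_google_genai import ChatGoogleGenerativeAI

def summarize_results(question: str, search_results: str) -> str:
    llm_chat = ChatGoogleGenerativeAI(model="gemini-1.5-flash-latest", temperature=0)
    response_prompt = f"""
    Generate a concise and informative summary of the results based on the question and Tavily search results.
    Return URLs at the end of the summary for proof.

    Question: {question}
    Search Results:
    {search_results}

    Answer:
    """
    # .invoke returns a chat message; .content holds the generated text
    return llm_chat.invoke(response_prompt).content

With such a helper, tavily_search could end with return summarize_results(question, search_results) instead of falling through and returning None.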