Spaces:
No application file
No application file
Priyanka-Balivada
committed on
Commit
β’
6cc785b
1
Parent(s):
73d84aa
Upload 2 files
Browse files- docapp.py +72 -0
- requirements.txt +81 -0
docapp.py
ADDED
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import streamlit as st
|
2 |
+
from langchain.text_splitter import CharacterTextSplitter
|
3 |
+
from langchain.docstore.document import Document
|
4 |
+
from langchain.chains.summarize import load_summarize_chain
|
5 |
+
from langchain_community.llms import CTransformers
|
6 |
+
from langchain.callbacks.manager import CallbackManager
|
7 |
+
from langchain.callbacks.streaming_stdout import StreamingStdOutCallbackHandler
|
8 |
+
from pypdf import PdfReader
|
9 |
+
|
10 |
+
# Page title
# Configure the browser tab title, then render the matching in-page heading.
# NOTE(review): the emoji in both title strings appear mojibake-mangled in
# this copy of the file — confirm the intended characters upstream.
st.set_page_config(page_title='π¦π Text Summarization App')
st.title('π¦π Text Summarization App')
|
13 |
+
|
14 |
+
# Function to read all PDF files and return text
|
15 |
+
# Function to read all PDF files and return text
def get_pdf_text(pdf_docs):
    """Concatenate the extracted text of every page of every uploaded PDF.

    Parameters
    ----------
    pdf_docs : iterable
        File-like objects (e.g. Streamlit ``UploadedFile``) accepted by
        ``pypdf.PdfReader``.

    Returns
    -------
    str
        All page texts joined in order; empty string for no files/pages.
    """
    # Collect per-page strings and join once: repeated ``text += ...`` is
    # quadratic in the total text length.
    page_texts = []
    for pdf in pdf_docs:
        pdf_reader = PdfReader(pdf)
        for page in pdf_reader.pages:
            # ``extract_text()`` can yield an empty result (and None in some
            # pypdf versions) for image-only pages — guard so join never
            # receives None.
            page_texts.append(page.extract_text() or "")
    return "".join(page_texts)
|
22 |
+
|
23 |
+
# Function to split the text into smaller chunks and convert it into document format
|
24 |
+
# Function to split the text into smaller chunks and convert it into document format
def chunks_and_document(txt):
    """Split *txt* into chunks and wrap each one as a LangChain ``Document``.

    Parameters
    ----------
    txt : str
        Raw text extracted from the uploaded PDFs.

    Returns
    -------
    list[Document]
        One ``Document`` per chunk, in original order.
    """
    splitter = CharacterTextSplitter()
    return [Document(page_content=chunk) for chunk in splitter.split_text(txt)]
|
29 |
+
|
30 |
+
# Loading the Llama 2's LLM
|
31 |
+
# Loading the Llama 2's LLM
def load_llm():
    """Instantiate the quantized Llama 2 7B chat model via CTransformers.

    Returns
    -------
    CTransformers
        The configured LLM, streaming generated tokens to stdout.
    """
    # We instantiate the callback with a streaming stdout handler
    callback_manager = CallbackManager([StreamingStdOutCallbackHandler()])

    # Loading the LLM model
    # BUG FIX: ``callback_manager`` was created but never attached to the
    # model, so token streaming never happened; attach it via ``callbacks``
    # (LangChain LLMs accept a BaseCallbackManager there).
    llm = CTransformers(
        model="llama-2-7b-chat.ggmlv3.q2_K.bin",
        model_type="llama",
        config={'max_new_tokens': 600,
                'temperature': 0.5,
                'context_length': 700},
        callbacks=callback_manager,
    )

    return llm
|
45 |
+
|
46 |
+
# Function to apply the LLM model with our document
|
47 |
+
# Function to apply the LLM model with our document
def chains_and_response(docs):
    """Summarize *docs* with a map-reduce chain over the local Llama 2 model.

    Parameters
    ----------
    docs : list[Document]
        Chunked documents produced by ``chunks_and_document``.

    Returns
    -------
    The result of ``Chain.invoke`` on the summarize chain.
    """
    summarize_chain = load_summarize_chain(load_llm(), chain_type='map_reduce')
    return summarize_chain.invoke(docs)
|
51 |
+
|
52 |
+
def main():
    """Streamlit entry point: upload PDFs, run summarization, show results."""
    # Initialize messages if not already present.
    # Idiomatic membership test — ``in st.session_state`` (no ``.keys()``).
    if "messages" not in st.session_state:
        st.session_state.messages = []

    # Sidebar for uploading PDF files
    with st.sidebar:
        st.title("Menu:")
        pdf_docs = st.file_uploader(
            "Upload your PDF Files and Click on the Submit & Process Button", accept_multiple_files=True
        )
        if st.button("Submit & Process"):
            if not pdf_docs:
                # Don't run the pipeline on an empty upload list.
                st.warning("Please upload at least one PDF file first.")
            else:
                with st.spinner("Processing..."):
                    txt_input = get_pdf_text(pdf_docs)
                    docs = chunks_and_document(txt_input)
                    response = chains_and_response(docs)
                    # NOTE(review): the emoji in this title appears
                    # mojibake-mangled in this copy — confirm upstream.
                    st.title('πβ Summarization Result')
                    # NOTE(review): ``chain.invoke`` returns a mapping, so this
                    # loop iterates its keys; confirm whether the summary text
                    # itself (e.g. response["output_text"]) should be shown.
                    for res in response:
                        st.info(res)


if __name__ == "__main__":
    main()
|
requirements.txt
ADDED
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
aiohttp==3.9.3
|
2 |
+
aiosignal==1.3.1
|
3 |
+
altair==5.2.0
|
4 |
+
annotated-types==0.6.0
|
5 |
+
anyio==4.2.0
|
6 |
+
async-timeout==4.0.3
|
7 |
+
attrs==23.2.0
|
8 |
+
blinker==1.7.0
|
9 |
+
cachetools==5.3.2
|
10 |
+
certifi==2024.2.2
|
11 |
+
charset-normalizer==3.3.2
|
12 |
+
click==8.1.7
|
13 |
+
colorama==0.4.6
|
14 |
+
ctransformers==0.2.27
|
15 |
+
dataclasses-json==0.6.4
|
16 |
+
exceptiongroup==1.2.0
|
17 |
+
filelock==3.13.1
|
18 |
+
frozenlist==1.4.1
|
19 |
+
fsspec==2024.2.0
|
20 |
+
gitdb==4.0.11
|
21 |
+
GitPython==3.1.41
|
22 |
+
greenlet==3.0.3
|
23 |
+
huggingface-hub==0.20.3
|
24 |
+
idna==3.6
|
25 |
+
importlib-metadata==7.0.1
|
26 |
+
Jinja2==3.1.3
|
27 |
+
jsonpatch==1.33
|
28 |
+
jsonpointer==2.4
|
29 |
+
jsonschema==4.21.1
|
30 |
+
jsonschema-specifications==2023.12.1
|
31 |
+
langchain==0.1.6
|
32 |
+
langchain-community==0.0.19
|
33 |
+
langchain-core==0.1.22
|
34 |
+
langsmith==0.0.87
|
35 |
+
markdown-it-py==3.0.0
|
36 |
+
MarkupSafe==2.1.5
|
37 |
+
marshmallow==3.20.2
|
38 |
+
mdurl==0.1.2
|
39 |
+
multidict==6.0.5
|
40 |
+
mypy-extensions==1.0.0
|
41 |
+
numpy==1.26.4
|
42 |
+
packaging==23.2
|
43 |
+
pandas==2.2.0
|
44 |
+
pillow==10.2.0
|
45 |
+
protobuf==4.25.2
|
46 |
+
py-cpuinfo==9.0.0
|
47 |
+
pyarrow==15.0.0
|
48 |
+
pydantic==2.6.1
|
49 |
+
pydantic_core==2.16.2
|
50 |
+
pydeck==0.8.1b0
|
51 |
+
Pygments==2.17.2
|
52 |
+
python-dateutil==2.8.2
|
53 |
+
pytz==2024.1
|
54 |
+
PyYAML==6.0.1
|
55 |
+
referencing==0.33.0
|
56 |
+
regex==2023.12.25
|
57 |
+
requests==2.31.0
|
58 |
+
rich==13.7.0
|
59 |
+
rpds-py==0.17.1
|
60 |
+
safetensors==0.4.2
|
61 |
+
six==1.16.0
|
62 |
+
smmap==5.0.1
|
63 |
+
sniffio==1.3.0
|
64 |
+
SQLAlchemy==2.0.25
|
65 |
+
streamlit==1.31.0
|
66 |
+
tenacity==8.2.3
|
67 |
+
tokenizers==0.15.1
|
68 |
+
toml==0.10.2
|
69 |
+
toolz==0.12.1
|
70 |
+
tornado==6.4
|
71 |
+
tqdm==4.66.2
|
72 |
+
transformers==4.37.2
|
73 |
+
typing-inspect==0.9.0
|
74 |
+
typing_extensions==4.9.0
|
75 |
+
tzdata==2023.4
|
76 |
+
tzlocal==5.2
|
77 |
+
urllib3==2.2.0
|
78 |
+
validators==0.22.0
|
79 |
+
watchdog==4.0.0
|
80 |
+
yarl==1.9.4
|
81 |
+
zipp==3.17.0
|