FESG1234 committed on
Commit
1d5f072
·
verified ·
1 Parent(s): 1919a0e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +62 -46
app.py CHANGED
@@ -6,40 +6,53 @@ import os
6
  from huggingface_hub import login, HfFolder
7
  from getpass import getpass
8
 
 
 
 
9
  # Load and preprocess the PDF content
10
- with open('./LTDOCS.pdf', 'rb') as file:
11
- pdf_reader = PyPDF2.PdfReader(file)
12
- pdf_content = ' '.join([page.extract_text() for page in pdf_reader.pages])
13
- pdf_content = pdf_content.lower().strip()
 
 
 
 
 
14
 
15
  def init_huggingface_auth():
16
- """Initialize Hugging Face authentication"""
17
- if HfFolder.get_token():
18
- print("Already logged in to Hugging Face!")
19
- return True
20
 
21
- token = os.getenv('HUGGINGFACE_TOKEN') or getpass("Enter Hugging Face Token: ")
 
 
22
 
23
- if token:
24
- try:
25
- login(token=token, add_to_git_credential=True)
26
- print("Successfully logged in!")
27
- return True
28
- except Exception as e:
29
- print(f"Login error: {e}")
30
- return False
31
- return False
32
 
33
  if not init_huggingface_auth():
34
  print("Warning: Authentication failed")
35
 
36
- # Initialize the pipeline
37
- pipe = pipeline(
38
- "text-generation",
39
- model="google/gemma-2-2b-jpn-it",
40
- model_kwargs={"torch_dtype": torch.bfloat16},
41
- device="cpu",
42
- )
 
 
 
 
 
 
 
43
 
44
  SYSTEM_PROMPT = f"""You are Foton, Swahili AI assistant. Tasks:
45
  1. Swahili translations
@@ -67,22 +80,26 @@ def format_messages(history):
67
 
68
  def generate_response(message, history):
69
  """Generate AI response"""
70
- formatted_history = format_messages(history)
71
- formatted_history.append({"role": "user", "content": message})
72
-
73
- prompt = "\n".join([f"{m['role']}: {m['content']}" for m in formatted_history])
74
-
75
- output = pipe(
76
- prompt,
77
- max_new_tokens=256,
78
- temperature=0.1,
79
- top_p=0.9,
80
- do_sample=True,
81
- return_full_text=False
82
- )
83
- return output[0]["generated_text"].strip()
 
 
 
 
84
 
85
- # Create Gradio interface with corrected settings
86
  with gr.Blocks(theme=gr.themes.Soft()) as demo:
87
  gr.Markdown("# Lugha Tausi - Swahili Assistant")
88
 
@@ -90,9 +107,10 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
90
  value=[[None, WELCOME_MESSAGE]],
91
  height=600,
92
  show_label=False,
93
- avatar_images=(
94
- None, (os.path.join(os.path.dirname(__file__),"user.png"))
95
- )
 
96
  )
97
 
98
  msg = gr.Textbox(placeholder="Andika ujumbe wako hapa...", show_label=False)
@@ -108,10 +126,8 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
108
 
109
  if __name__ == "__main__":
110
  demo.launch(
111
- inline=False, # Required for Spaces
112
- share=True, # Required for Spaces
113
- debug=True,
114
  server_name="0.0.0.0",
115
  server_port=7860,
 
116
  show_error=True
117
  )
 
6
  from huggingface_hub import login, HfFolder
7
  from getpass import getpass
8
 
9
# Space configuration
SPACE_DIR = os.environ.get("HF_HOME", os.getcwd())

# Load and preprocess the PDF content so it can be injected into prompts.
# Best-effort: on any failure the app still starts, just with empty context.
try:
    pdf_path = os.path.join(SPACE_DIR, "LTDOCS.pdf")
    with open(pdf_path, 'rb') as file:
        pdf_reader = PyPDF2.PdfReader(file)
        # extract_text() can return None/"" for image-only pages (PyPDF2);
        # guard with `or ''` so one bad page doesn't raise TypeError in join
        # and silently discard the whole document via the except below.
        pdf_content = ' '.join([(page.extract_text() or '') for page in pdf_reader.pages])
        pdf_content = pdf_content.lower().strip()
except Exception as e:
    pdf_content = ""
    print(f"Error loading PDF: {e}")
22
 
23
def init_huggingface_auth():
    """Space-friendly authentication.

    Reads the HUGGINGFACE_TOKEN environment variable and logs in with it.
    Returns True on successful login, False when the token is missing or
    the login call fails.
    """
    hf_token = os.getenv("HUGGINGFACE_TOKEN")
    if hf_token:
        try:
            # Spaces containers are ephemeral, so skip the git credential store.
            login(token=hf_token, add_to_git_credential=False)
        except Exception as e:
            print(f"Login error: {e}")
            return False
        print("HF authentication successful")
        return True
    print("No HF token found in environment")
    return False
 
 
38
 
39
  if not init_huggingface_auth():
40
  print("Warning: Authentication failed")
41
 
42
# Initialize the pipeline with CPU optimization.
# NOTE(review): float16 is poorly supported on CPU backends; bfloat16 may be
# safer if this Space runs without a GPU — confirm target hardware.
try:
    _model_kwargs = {
        "torch_dtype": torch.float16,
        "low_cpu_mem_usage": True,
    }
    pipe = pipeline(
        "text-generation",
        model="google/gemma-2-2b-jpn-it",
        device_map="auto",
        model_kwargs=_model_kwargs,
    )
except Exception as e:
    # Without a model the app is useless — log and abort startup.
    print(f"Model loading error: {e}")
    raise
56
 
57
  SYSTEM_PROMPT = f"""You are Foton, Swahili AI assistant. Tasks:
58
  1. Swahili translations
 
80
 
81
  def generate_response(message, history):
82
  """Generate AI response"""
83
+ try:
84
+ formatted_history = format_messages(history)
85
+ formatted_history.append({"role": "user", "content": message})
86
+
87
+ prompt = "\n".join([f"{m['role']}: {m['content']}" for m in formatted_history])
88
+
89
+ output = pipe(
90
+ prompt,
91
+ max_new_tokens=256,
92
+ temperature=0.1,
93
+ top_p=0.9,
94
+ do_sample=True,
95
+ return_full_text=False
96
+ )
97
+ return output[0]["generated_text"].strip()
98
+ except Exception as e:
99
+ print(f"Generation error: {e}")
100
+ return "Samahani, nimekutana na tatizo. Tafadhali jaribu tena baadaye."
101
 
102
+ # Create Gradio interface with Space optimizations
103
  with gr.Blocks(theme=gr.themes.Soft()) as demo:
104
  gr.Markdown("# Lugha Tausi - Swahili Assistant")
105
 
 
107
  value=[[None, WELCOME_MESSAGE]],
108
  height=600,
109
  show_label=False,
110
+ avatar_images=(None, "user.png"),
111
+ bubble_full_width=False,
112
+ show_share_button=False,
113
+ type="messages"
114
  )
115
 
116
  msg = gr.Textbox(placeholder="Andika ujumbe wako hapa...", show_label=False)
 
126
 
127
if __name__ == "__main__":
    # Gradio's launch(auth=...) accepts a (username, password) tuple, a list
    # of tuples, or a callable — NOT a raw string.  Parse an optional
    # "user:pass" value from the SPACE_AUTH env var; anything else means no auth.
    _space_auth = os.getenv("SPACE_AUTH")
    _auth = tuple(_space_auth.split(":", 1)) if _space_auth and ":" in _space_auth else None
    demo.launch(
        server_name="0.0.0.0",
        server_port=7860,
        auth=_auth,
        show_error=True
    )