Spaces:

Luciferalive
/

RAG_db

Runtime error

Luciferalive committed on Jun 2, 2024

Commit

2e3e738

verified ·

1 Parent(s): 5d9b48f

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -17,12 +17,12 @@ import os
 import boto3
 # AWS access credentials
-access_key = os.getenv("access_key")
-secret_key =  os.getenv("secret_key")
 # S3 bucket details
-bucket_name = os.getenv("bucket_name")
-prefix = os.getenv("prefix")
 HUGGINGFACEHUB_API_TOKEN = os.getenv("HUGGINGFACEHUB_API_TOKEN")
@@ -59,18 +59,22 @@ def compute_cosine_similarity_scores(query, retrieved_docs):
     readable_scores = [{"doc": doc, "score": float(score)} for doc, score in zip(retrieved_docs, cosine_scores.flatten())]
     return readable_scores
 def answer_query_with_similarity(query):
     try:
         # Fetch files from S3
-        s3 = boto3.client('s3', aws_access_key_id=access_key, aws_secret_access_key=secret_key)
-        objects = s3.list_objects_v2(Bucket=bucket_name, Prefix=prefix)
-        file_contents = []
-        for obj in objects.get('Contents', []):
-            if not obj['Key'].endswith('/'):  # Skip directories
-                response = s3.get_object(Bucket=bucket_name, Key=obj['Key'])
-                file_content = response['Body'].read()
-                file_contents.append(file_content)
         all_text = process_files(file_contents)

 import boto3
 # AWS access credentials
+access_key = os.getenv("ACCESS_KEY")
+secret_key = os.getenv("SECRET_KEY")
 # S3 bucket details
+bucket_name = os.getenv("BUCKET_NAME")
+prefix = os.getenv("PREFIX")
 HUGGINGFACEHUB_API_TOKEN = os.getenv("HUGGINGFACEHUB_API_TOKEN")
     readable_scores = [{"doc": doc, "score": float(score)} for doc, score in zip(retrieved_docs, cosine_scores.flatten())]
     return readable_scores
+def fetch_files_from_s3():
+    s3 = boto3.client('s3', aws_access_key_id=access_key, aws_secret_access_key=secret_key)
+    objects = s3.list_objects_v2(Bucket=bucket_name, Prefix=prefix)
+    file_contents = []
+    for obj in objects.get('Contents', []):
+        if not obj['Key'].endswith('/'):  # Skip directories
+            response = s3.get_object(Bucket=bucket_name, Key=obj['Key'])
+            file_content = response['Body'].read()
+            file_contents.append(file_content)
+    return file_contents
 def answer_query_with_similarity(query):
     try:
         # Fetch files from S3
+        file_contents = fetch_files_from_s3()
         all_text = process_files(file_contents)