Bijoy09 committed on
Commit 473261b
1 Parent(s): 2688a7f

Update app.py

Files changed (1):
  1. app.py +29 -47
app.py CHANGED
@@ -3,9 +3,14 @@ from pydantic import BaseModel
 import torch
 from transformers import AutoModelForSequenceClassification, AutoTokenizer
 import os
+import logging
 
 app = FastAPI()
 
+# Configure logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+
 # Set the cache directory for Hugging Face
 os.environ['TRANSFORMERS_CACHE'] = os.getenv('TRANSFORMERS_CACHE', '/app/cache')
 
@@ -14,7 +19,9 @@ model_name = "Bijoy09/MObilebert"
 try:
     model = AutoModelForSequenceClassification.from_pretrained(model_name)
     tokenizer = AutoTokenizer.from_pretrained(model_name)
+    logger.info("Model and tokenizer loaded successfully")
 except Exception as e:
+    logger.error(f"Failed to load model or tokenizer: {e}")
     raise RuntimeError(f"Failed to load model or tokenizer: {e}")
 
 class TextRequest(BaseModel):
@@ -42,6 +49,7 @@ async def predict(request: TextRequest):
         prediction = torch.argmax(logits, dim=1).item()
         return {"prediction": "Spam" if prediction == 1 else "Ham"}
     except Exception as e:
+        logger.error(f"Prediction failed: {e}")
         raise HTTPException(status_code=500, detail=f"Prediction failed: {e}")
 
 
@@ -49,56 +57,30 @@ async def predict(request: TextRequest):
 async def batch_predict(request: BatchTextRequest):
     try:
         model.eval()
-        results = []
-        for idx, text in enumerate(request.texts):
-            inputs = tokenizer.encode_plus(
-                text,
-                add_special_tokens=True,
-                max_length=64,
-                truncation=True,
-                padding='max_length',
-                return_attention_mask=True,
-                return_tensors='pt'
-            )
-            with torch.no_grad():
-                logits = model(inputs['input_ids'], attention_mask=inputs['attention_mask']).logits
-            prediction = torch.argmax(logits, dim=1).item()
-            results.append({"id": idx + 1, "text": text, "prediction": "Spam" if prediction == 1 else "Ham"})
+        logger.info(f"Received batch prediction request for {len(request.texts)} texts")
+        inputs = tokenizer(
+            request.texts,
+            add_special_tokens=True,
+            max_length=64,
+            truncation=True,
+            padding='max_length',
+            return_attention_mask=True,
+            return_tensors='pt'
+        )
+
+        with torch.no_grad():
+            logits = model(inputs['input_ids'], attention_mask=inputs['attention_mask']).logits
+        predictions = torch.argmax(logits, dim=1).tolist()
+
+        results = [
+            {"id": idx + 1, "text": text, "prediction": "Spam" if pred == 1 else "Ham"}
+            for idx, (text, pred) in enumerate(zip(request.texts, predictions))
+        ]
+        logger.info(f"Batch prediction results: {results}")
         return {"results": results}
     except Exception as e:
+        logger.error(f"Batch prediction failed: {e}")
         raise HTTPException(status_code=500, detail=f"Batch prediction failed: {e}")
-# @app.post("/batch_predict")
-# async def batch_predict(request: BatchTextRequest):
-#     try:
-#         model.eval()
-
-#         # Batch encode all texts in the request at once
-#         inputs = tokenizer(
-#             request.texts,
-#             add_special_tokens=True,
-#             max_length=64,
-#             truncation=True,
-#             padding='max_length',
-#             return_attention_mask=True,
-#             return_tensors='pt'
-#         )
-
-#         # Run batch inference
-#         with torch.no_grad():
-#             logits = model(inputs['input_ids'], attention_mask=inputs['attention_mask']).logits
-#         predictions = torch.argmax(logits, dim=1).tolist()
-
-#         # Format results
-#         results = [
-#             {"id": idx + 1, "text": text, "prediction": "Spam" if pred == 1 else "Ham"}
-#             for idx, (text, pred) in enumerate(zip(request.texts, predictions))
-#         ]
-
-#         return {"results": results}
-
-#     except Exception as e:
-#         logging.error(f"Batch prediction failed: {e}")
-#         raise HTTPException(status_code=500, detail="Batch prediction failed. Please try again.")
 
 
 @app.get("/")
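
For context on the main change: the old handler encoded and scored each text in a Python loop, while the new one relies on the tokenizer's batch mode, which pads every text to the same length and stacks the tensors so a single forward pass scores the whole batch. A minimal sketch of that behaviour outside the app (the sample texts are made up; the settings mirror those in the diff):

# Sketch: calling the tokenizer on a list pads/stacks the texts into one
# tensor, so one no_grad forward pass scores the entire batch.
import torch
from transformers import AutoModelForSequenceClassification, AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("Bijoy09/MObilebert")
model = AutoModelForSequenceClassification.from_pretrained("Bijoy09/MObilebert")

texts = ["Win a free prize now!", "Lunch at noon?"]  # hypothetical samples
inputs = tokenizer(
    texts,
    add_special_tokens=True,
    max_length=64,
    truncation=True,
    padding='max_length',
    return_attention_mask=True,
    return_tensors='pt'
)
print(inputs['input_ids'].shape)  # torch.Size([2, 64]) -- one row per text

with torch.no_grad():
    logits = model(inputs['input_ids'], attention_mask=inputs['attention_mask']).logits
print(torch.argmax(logits, dim=1).tolist())  # e.g. [1, 0] -> Spam, Ham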
 
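A hedged smoke test for the two endpoints. The /predict route path and the text/texts field names are inferred from the handler signatures and request models visible in the diff, not confirmed by it (/batch_predict does appear in the removed comments); fastapi's TestClient needs httpx installed.

# Assumed: app.py is importable, /predict accepts {"text": ...} and
# /batch_predict accepts {"texts": [...]} -- field names inferred from the diff.
from fastapi.testclient import TestClient
from app import app

client = TestClient(app)

single = client.post("/predict", json={"text": "Win a free prize now!"})
print(single.json())  # e.g. {"prediction": "Spam"}

batch = client.post(
    "/batch_predict",
    json={"texts": ["Win a free prize now!", "Lunch at noon?"]},
)
print(batch.json())  # {"results": [{"id": 1, ...}, {"id": 2, ...}]}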