Update main.py
main.py (CHANGED)
@@ -47,70 +47,100 @@ def get_translator():

Old (main.py lines 47-116):

 # Optimized QA Model Loading
 @lru_cache()
 def get_qa_model():
     model_name = "deepset/roberta-base-squad2"
     tokenizer = AutoTokenizer.from_pretrained(model_name)
     model = AutoModelForQuestionAnswering.from_pretrained(model_name)
     return tokenizer, model

 def answer_question(question: str, context: str) -> dict:
     """
-    ...
     """
     tokenizer, model = get_qa_model()

-    ...
-    answer_end = torch.argmax(end_logits) + 1
-
-    # Skip invalid answers
-    if answer_start >= answer_end:
-        continue
-
-    # Get the answer text
     answer = tokenizer.decode(
-        inputs["input_ids"][
         skip_special_tokens=True
     ).strip()

-    # Calculate confidence
-    start_score = torch.nn.functional.softmax(start_logits, dim=
-    end_score = torch.nn.functional.softmax(end_logits, dim=
     confidence = float((start_score + end_score) / 2)

-    ...

 # Home Route

New (main.py lines 47-146):

 # Optimized QA Model Loading
 @lru_cache()
 def get_qa_model():
+    """Simplified model loading without unexpected parameters"""
     model_name = "deepset/roberta-base-squad2"
     tokenizer = AutoTokenizer.from_pretrained(model_name)
     model = AutoModelForQuestionAnswering.from_pretrained(model_name)
     return tokenizer, model
+
 def answer_question(question: str, context: str) -> dict:
     """
+    Robust QA function with minimal parameters
     """
     tokenizer, model = get_qa_model()

+    try:
+        # Simple tokenization without problematic parameters
+        inputs = tokenizer(
+            question,
+            context,
+            max_length=512,
+            truncation="only_second",
+            padding="max_length",
+            return_tensors="pt"
+        )
+
+        # Filter inputs to only include what the model expects
+        model_inputs = {
+            "input_ids": inputs["input_ids"],
+            "attention_mask": inputs["attention_mask"]
+        }
+
+        with torch.no_grad():
+            outputs = model(**model_inputs)
+
+        # Get the most probable answer
+        answer_start = torch.argmax(outputs.start_logits)
+        answer_end = torch.argmax(outputs.end_logits) + 1
+
         answer = tokenizer.decode(
+            inputs["input_ids"][0][answer_start:answer_end],
             skip_special_tokens=True
         ).strip()

+        # Calculate confidence
+        start_score = torch.nn.functional.softmax(outputs.start_logits, dim=1)[0][answer_start]
+        end_score = torch.nn.functional.softmax(outputs.end_logits, dim=1)[0][answer_end-1]
         confidence = float((start_score + end_score) / 2)

+        return {
+            "answer": answer if answer else "No answer found",
+            "confidence": confidence
+        }
+
+    except Exception as e:
+        return {
+            "answer": f"Error processing answer: {str(e)}",
+            "confidence": 0.0
+        }
+
+@app.post("/ask")
+async def ask_question(
+    question: str = Form(...),
+    file: Optional[UploadFile] = File(None),
+    text: Optional[str] = Form(None)
+):
+    """
+    Final robust QA endpoint
+    """
+    try:
+        # [Keep your existing context extraction code here]
+        # ...
+
+        if not context.strip():
+            raise HTTPException(status_code=400, detail="No extractable content found.")
+
+        # Clean context
+        context = " ".join(context.split())
+
+        # Get answer with error handling
+        result = answer_question(question, context)
+
+        if result["confidence"] < 0.1:
+            # [Keep your fallback semantic search if you want]
+            pass
+
+        return {
+            "answer": result["answer"],
+            "confidence": result["confidence"],
+            "context_used": context[:500] + "..." if len(context) > 500 else context
+        }
+
+    except Exception as e:
+        raise HTTPException(
+            status_code=500,
+            detail=f"Error processing question: {str(e)}"
+        )

# Home Route
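
For a quick local check of the updated answer_question() helper, it can be called directly from a Python shell. This is a minimal sketch, assuming main.py is importable as a module named main and that its dependencies (torch, transformers) are installed; the question and context strings are made-up illustration data, not part of the commit.

    # Sketch only: exercising the updated answer_question() helper directly.
    # Assumes main.py is importable as `main` and its dependencies are installed.
    from main import answer_question

    context = (
        "The Eiffel Tower is a wrought-iron lattice tower in Paris. "
        "It was completed in 1889 as the entrance arch to the World's Fair."
    )
    result = answer_question("When was the Eiffel Tower completed?", context)

    # The function returns a dict with "answer" and "confidence" keys.
    print(result["answer"], result["confidence"])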
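
The new /ask route takes the question as a form field plus either an uploaded file or raw text. Below is a minimal sketch of exercising it with the requests library; the base URL is a placeholder for wherever the FastAPI app is actually served (for example a local uvicorn run) and is not part of the commit.

    # Sketch only: posting to the /ask endpoint added in this change.
    # BASE_URL is a placeholder; point it at your running FastAPI app.
    import requests

    BASE_URL = "http://localhost:8000"

    resp = requests.post(
        f"{BASE_URL}/ask",
        data={
            "question": "When was the Eiffel Tower completed?",
            "text": "The Eiffel Tower was completed in 1889 in Paris.",
        },
    )
    resp.raise_for_status()
    print(resp.json())  # {"answer": ..., "confidence": ..., "context_used": ...}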