rahat15
diff --git a/apps/api/routers/interview_v2.py b/apps/api/routers/interview_v2.py
Lines changed: 52 additions & 6 deletions
diff --git a/docs/COMPLETION_SUMMARY.md b/docs/COMPLETION_SUMMARY.md
Lines changed: 203 additions & 0 deletions
@@ -109,7 +109,7 @@ async def fetch_jd_content(jd_id: str) -> str:
 
 
 async def extract_text_from_file(file: UploadFile) -> str:
-    """Extract text from uploaded file (PDF, DOCX, TXT)"""
+    """Extract text from uploaded file (PDF, DOCX, TXT) with robust error handling"""
     content = await file.read()
     filename = file.filename.lower()
 
@@ -118,15 +118,54 @@ async def extract_text_from_file(file: UploadFile) -> str:
         if filename.endswith('.txt'):
             return content.decode('utf-8', errors='ignore')
 
-        # PDF files
+        # PDF files - with multiple fallback strategies
         elif filename.endswith('.pdf'):
-            from pypdf import PdfReader
             import io
             pdf_file = io.BytesIO(content)
-            reader = PdfReader(pdf_file)
             text = ""
-            for page in reader.pages:
-                text += page.extract_text() + "\n"
+            
+            # Try pypdf first
+            try:
+                from pypdf import PdfReader
+                reader = PdfReader(pdf_file, strict=False)
+                for page_num, page in enumerate(reader.pages):
+                    try:
+                        page_text = page.extract_text()
+                        if page_text:
+                            text += page_text + "\n"
+                    except Exception as page_error:
+                        print(f"Warning: Could not extract page {page_num}: {page_error}")
+                        continue
+                
+                if text.strip():
+                    return text.strip()
+            except Exception as pypdf_error:
+                print(f"PyPDF extraction failed: {pypdf_error}")
+            
+            # Fallback: Try pdfplumber
+            try:
+                import pdfplumber
+                pdf_file.seek(0)
+                with pdfplumber.open(pdf_file) as pdf:
+                    for page in pdf.pages:
+                        try:
+                            page_text = page.extract_text()
+                            if page_text:
+                                text += page_text + "\n"
+                        except:
+                            continue
+                    if text.strip():
+                        return text.strip()
+            except Exception as plumber_error:
+                print(f"pdfplumber extraction failed: {plumber_error}")
+            
+            # If all methods failed
+            if not text.strip():
+                raise HTTPException(
+                    status_code=400,
+                    detail=f"Could not extract text from PDF '{file.filename}'. The file may be corrupted, image-based (scanned), or password-protected. Please try: 1) Re-saving the PDF, 2) Using a text-based PDF, or 3) Converting to TXT/DOCX format."
+                )
+            
             return text.strip()
 
         # Word documents
@@ -136,6 +175,13 @@ async def extract_text_from_file(file: UploadFile) -> str:
             doc_file = io.BytesIO(content)
             doc = Document(doc_file)
             text = "\n".join([paragraph.text for paragraph in doc.paragraphs])
+            
+            if not text.strip():
+                raise HTTPException(
+                    status_code=400,
+                    detail=f"No text content found in '{file.filename}'. The document may be empty or contain only images."
+                )
+            
             return text.strip()
 
         else:
 
@@ -0,0 +1,203 @@
+# 🎯 Interview Completion - Quick Reference
+
+## The Problem
+- ❌ The interview said "thank you for your time" but didn't actually end
+- ❌ Users didn't know when to call the `/complete` endpoint
+
+## The Solution
+- ✅ **Auto-completion detection** - interviews now end automatically in 3 ways
+- ✅ **Clear status signals** - `"status": "completed"` in the response
+- ✅ **Comprehensive docs** - full guide to the completion flow
+
+---
+
+## How It Works Now
+
+### When Interview Auto-Completes
+
+The system detects completion when:
+
+1. **Candidate says:** "I want to end the interview"
+2. **AI says:** "Thank you for your time" / "We'll be in touch"  
+3. **Max questions reached:** The interview hits 10 questions (safety limit)
+
+### Response Changes
+
+**Before (OLD):**
+```jsonc
+{
+  "status": "active",
+  "question": "Thank you for your time!"  // ❌ Confusing!
+}
+```
+
+**After (NEW):**
+```jsonc
+{
+  "status": "completed",  // ✅ Clear signal!
+  "completion_reason": "interviewer_concluded",
+  "message": "Interview completed. Call /complete endpoint to get final evaluation."
+}
+```
+
+---
+
+## Quick Usage
+
+### Basic Flow
+
+```bash
+# 1. Start
+SESSION=$(curl -s -X POST ".../start" -F "role=Engineer" ... | jq -r '.session_id')
+
+# 2. Answer questions
+curl -X POST ".../answer" -F "answer=My answer"
+# Keep answering until status becomes "completed"
+
+# 3. When completed, get report
+curl -X POST ".../$SESSION/complete" -H "Content-Type: application/json" -d '{}'
+```
+
+### Smart Loop (Handles Auto-Completion)
+
+```bash
+while true; do
+  # Submit answer (ANSWER must already hold your reply to the current question before the first iteration)
+  RESP=$(curl -s -X POST ".../answer" -F "answer=$ANSWER")
+  
+  # Check if completed
+  if [ "$(echo $RESP | jq -r '.status')" == "completed" ]; then
+    echo "Interview ended: $(echo $RESP | jq -r '.completion_reason')"
+    break
+  fi
+  
+  # Show next question
+  echo "Next: $(echo $RESP | jq -r '.question')"
+  read -p "Answer: " ANSWER
+done
+
+# Get final report
+curl -X POST ".../$SESSION/complete" -H "Content-Type: application/json" -d '{}'
+```
+
+---
+
+## Files Updated
+
+| File | Changes |
+|------|---------|
+| `interview/gemini_interviewer.py` | ✅ Added `_should_complete_interview()` method |
+| | ✅ Auto-detection in `submit_answer()` |
+| | ✅ Session tracks `status` and `completion_reason` |
+| `interview/voice_analyzer.py` | ✅ Added pydub for audio format conversion |
+| | ✅ Fixed "Format not recognised" error |
+| `docs/INTERVIEW_COMPLETION_GUIDE.md` | ✅ **NEW** - Complete guide (650+ lines) |
+| `docs/V2_INTERVIEW_API_COMPLETE.md` | ✅ Updated with auto-completion info |
+| `requirements.txt` | ✅ Added pydub for audio conversion |
+
+---
+
+## Testing
+
+### Test Auto-Completion
+
+```bash
+# Start interview
+SESSION=$(curl -s -X POST "http://127.0.0.1:8000/v2/interview/start" \
+  -F "role=Engineer" -F "company=Test" \
+  -F "resume_text=Test" -F "jd_text=Test" | jq -r '.session_id')
+
+# Try to end
+curl -X POST "http://127.0.0.1:8000/v2/interview/$SESSION/answer" \
+  -F "answer=I want to end the interview please." | jq .
+
+# Should see:
+# {
+#   "status": "completed",
+#   "completion_reason": "candidate_requested_end",
+#   "message": "Interview completed. Call /complete endpoint..."
+# }
+
+# Get final report
+curl -X POST "http://127.0.0.1:8000/v2/interview/$SESSION/complete" \
+  -H "Content-Type: application/json" -d '{}' | jq '.evaluation.overall_score'
+```
+
+---
+
+## Key Improvements
+
+### 1. Auto-Detection Keywords
+
+**Candidate ending phrases:**
+- "end the interview"
+- "stop the interview"
+- "don't want to continue"
+- "I want to stop"
+- "that's all"
+
+**Interviewer conclusion phrases:**
+- "thank you for your time"
+- "thanks for joining"
+- "that concludes"
+- "we'll be in touch"
+- "we'll get back to you"
+
+### 2. Safety Limits
+- Max 10 questions per interview
+- Prevents infinite loops
+- Auto-completes with reason: `"max_questions_reached"`
+
+### 3. Clear State Tracking
+- `status`: `"active"` or `"completed"`
+- `completion_reason`: Why it ended
+- `message`: What to do next
+
+---
+
+## Documentation
+
+📖 **Main API Docs:** `docs/V2_INTERVIEW_API_COMPLETE.md`  
+📖 **Completion Guide:** `docs/INTERVIEW_COMPLETION_GUIDE.md`
+
+The completion guide includes:
+- Full explanation of all 3 completion methods
+- End-to-end bash examples
+- React/TypeScript integration example
+- Testing instructions
+- Best practices & common mistakes
+
+---
+
+## Next Steps for Frontend
+
+Update your UI to:
+
+1. **Check `status` after each answer:**
+   ```typescript
+   const response = await submitAnswer(answer);
+   if (response.status === 'completed') {
+     showCompletionScreen(response.completion_reason);
+     fetchFinalReport();
+   }
+   ```
+
+2. **Show completion reason:**
+   - "You ended the interview"
+   - "Interview concluded by interviewer"
+   - "Maximum questions reached"
+
+3. **Auto-fetch report:**
+   - When `status === 'completed'`
+   - Call `/complete` endpoint
+   - Display evaluation to user
+
+---
+
+## Summary
+
+✅ **Problem solved:** Interviews now auto-detect completion  
+✅ **Clear signals:** Response status shows when to get report  
+✅ **Well documented:** 650+ lines of guides and examples  
+✅ **Audio fixed:** Voice analysis works with all formats  
+✅ **Production ready:** Safety limits and error handling