Fix: multiple file upload issue resolved

2025-10-07 00:22:57 +05:00
parent 6e648c2282
commit 38a0929865
1 changed files with 176 additions and 0 deletions
--- a/main.py
+++ b/main.py
@@ -0,0 +1,176 @@
 from fastapi import FastAPI, File, UploadFile, HTTPException
 from fastapi.responses import JSONResponse
 from fastapi.middleware.cors import CORSMiddleware
 from doctr.models import ocr_predictor
 from doctr.io import DocumentFile
 import tempfile
 import os
 from typing import List
 import uvicorn
 # FastAPI application object carrying the service title, description and version.
 app = FastAPI(title="OCR API", description="Extract text from images using DocTR", version="1.0.0")

 # CORS: every origin, method and header is accepted, and credentials are allowed.
 # NOTE(review): wildcard origins together with allow_credentials=True is very
 # permissive -- confirm this is intended before exposing the service publicly.
 app.add_middleware(
     CORSMiddleware,
     allow_headers=["*"],
     allow_methods=["*"],
     allow_credentials=True,
     allow_origins=["*"],
 )

 # Module-level slot for the OCR predictor; it stays None until the startup
 # handler below assigns the loaded model.
 model = None
@app.on_event("startup")
async def load_model():
    """Build the DocTR OCR predictor on application startup.

    The predictor is stored in the module-level ``model`` variable so that
    request handlers can reuse it instead of constructing it per request.
    """
    global model
    print("Loading OCR model...")
    predictor = ocr_predictor(
        det_arch='db_resnet50',
        reco_arch='crnn_vgg16_bn',
        pretrained=True,
    )
    model = predictor
    print("Model loaded successfully!")
@app.get("/")
async def root():
    """Return a status message together with a short map of the OCR endpoints."""
    endpoints = {
        "POST /ocr": "Extract text from a single image",
        "POST /ocr/batch": "Extract text from multiple images",
    }
    return {"message": "OCR API is running", "endpoints": endpoints}
# Upper bound on the number of uploads accepted by a single /ocr/batch call.
_MAX_BATCH_FILES = 10


def _is_image_upload(file: UploadFile) -> bool:
    """Return True when the upload declares an ``image/*`` content type.

    A missing content type (``None`` or empty) is treated as "not an image"
    so callers can reject it cleanly instead of failing on ``None.startswith``.
    """
    content_type = file.content_type
    return bool(content_type) and content_type.startswith('image/')


def _collect_words(result):
    """Flatten an OCR result (pages -> blocks -> lines -> words) into a list of word strings."""
    return [
        word.value
        for page in result.pages
        for block in page.blocks
        for line in block.lines
        for word in line.words
    ]


async def _ocr_upload(file: UploadFile):
    """Run OCR on a single upload.

    The upload is written to a temporary file, handed to DocTR, and the
    temporary file is always removed afterwards -- including when reading,
    writing or inference fails.

    Returns:
        A ``(text, word_count)`` tuple: the recognized words joined by single
        spaces, and the number of words.

    Raises:
        Any exception raised while reading the upload or running the model;
        callers decide how to report it.
    """
    # The filename may be absent; fall back to no suffix rather than failing.
    suffix = os.path.splitext(file.filename or "")[1]
    tmp_path = None
    try:
        with tempfile.NamedTemporaryFile(delete=False, suffix=suffix) as tmp:
            # Record the path before anything can fail so cleanup never misses it.
            tmp_path = tmp.name
            tmp.write(await file.read())
        doc = DocumentFile.from_images(tmp_path)
        # NOTE(review): this call is synchronous inside an async handler, so it
        # occupies the event loop while it runs -- consider offloading it.
        result = model(doc)
    finally:
        if tmp_path is not None:
            try:
                os.unlink(tmp_path)
            except OSError:
                # Best-effort cleanup: a failed delete must not mask the OCR
                # outcome (success or the original error).
                pass
    words = _collect_words(result)
    return ' '.join(words), len(words)


@app.post("/ocr")
async def extract_text(file: UploadFile = File(...)):
    """
    Extract text from a single image file.
    Returns:
        - text: Extracted text as a single line
        - word_count: Number of words extracted
    Raises:
        - 400 if the upload does not declare an image content type
        - 500 if reading the upload or running OCR fails
    """
    if not _is_image_upload(file):
        raise HTTPException(status_code=400, detail="File must be an image")
    try:
        single_line, word_count = await _ocr_upload(file)
    except Exception as e:
        raise HTTPException(status_code=500, detail=f"Error processing image: {str(e)}") from e
    return JSONResponse({
        "success": True,
        "text": single_line,
        "word_count": word_count
    })


@app.post("/ocr/batch")
async def extract_text_batch(files: List[UploadFile] = File(...)):
    """
    Extract text from multiple image files.
    Returns:
        - results: List of extracted texts with metadata; each entry carries
          the filename, a success flag, and either text/word_count or an error
    Raises:
        - 400 if more than 10 files are submitted
    """
    if len(files) > _MAX_BATCH_FILES:
        raise HTTPException(status_code=400, detail="Maximum 10 files allowed per batch")
    results = []
    for file in files:
        if not _is_image_upload(file):
            results.append({
                "filename": file.filename,
                "success": False,
                "error": "File must be an image"
            })
            continue
        try:
            single_line, word_count = await _ocr_upload(file)
        except Exception as e:
            # One bad file must not abort the batch; report it and move on.
            results.append({
                "filename": file.filename,
                "success": False,
                "error": str(e)
            })
        else:
            results.append({
                "filename": file.filename,
                "success": True,
                "text": single_line,
                "word_count": word_count
            })
    return JSONResponse({"results": results})
@app.get("/health")
async def health_check():
    """Report a fixed healthy status plus whether the OCR model has been assigned."""
    model_loaded = model is not None
    return {"status": "healthy", "model_loaded": model_loaded}
 # Script entry point: serve the app with uvicorn on all interfaces, port 8999.
 if __name__ == "__main__":
     uvicorn.run(
         app,
         port=8999,
         host="0.0.0.0",
     )