Spaces:

asdfasdfdsafdsa
/

czech-correction

Paused

App Files Files Community

asdfasdfdsafdsa committed on Oct 3

Commit

bf696db

verified ·

1 Parent(s): 508f678

Upload api.py

Browse files

Files changed (1) hide show

api.py +15 -0

api.py CHANGED Viewed

@@ -364,11 +364,14 @@ async def correct_text(request: CorrectionRequest):
         if len(request.text) > 100000:
             raise HTTPException(status_code=400, detail="Text too long (max 100000 characters)")
         # Process text
         corrected = process_text(request.text)
         # Calculate processing time
         processing_time = (time.time() - start_time) * 1000
         # Include timing if requested
         response = CorrectionResponse(
@@ -401,6 +404,8 @@ async def correct_batch(request: BatchCorrectionRequest):
         if not request.texts:
             raise HTTPException(status_code=400, detail="No texts provided")
         # Validate text lengths
         validated_texts = []
         for text in request.texts:
@@ -411,10 +416,18 @@ async def correct_batch(request: BatchCorrectionRequest):
         # Process all texts in batch (GPU efficient!)
         # Step 1: Grammar correction (batched)
         gec_corrected_texts = apply_gec_correction_batch(validated_texts)
         # Step 2: Punctuation and capitalization (batched)
         final_texts = apply_punctuation_batch(gec_corrected_texts)
         # Mark texts that were too long
         corrected_texts = []
@@ -427,6 +440,8 @@ async def correct_batch(request: BatchCorrectionRequest):
         # Calculate processing time
         processing_time = (time.time() - start_time) * 1000
         response = BatchCorrectionResponse(
             success=True,
             corrected_texts=corrected_texts

         if len(request.text) > 100000:
             raise HTTPException(status_code=400, detail="Text too long (max 100000 characters)")
+        logger.info(f"📝 Single text request received ({len(request.text)} chars)")
         # Process text
         corrected = process_text(request.text)
         # Calculate processing time
         processing_time = (time.time() - start_time) * 1000
+        logger.info(f"✅ Completed in {processing_time:.1f}ms")
         # Include timing if requested
         response = CorrectionResponse(
         if not request.texts:
             raise HTTPException(status_code=400, detail="No texts provided")
+        logger.info(f"📦 Batch request received: {len(request.texts)} texts")
         # Validate text lengths
         validated_texts = []
         for text in request.texts:
         # Process all texts in batch (GPU efficient!)
         # Step 1: Grammar correction (batched)
+        logger.info(f"🔧 Starting GEC batch processing ({len(validated_texts)} texts)...")
+        gec_start = time.time()
         gec_corrected_texts = apply_gec_correction_batch(validated_texts)
+        gec_time = (time.time() - gec_start) * 1000
+        logger.info(f"✓ GEC completed in {gec_time:.1f}ms")
         # Step 2: Punctuation and capitalization (batched)
+        logger.info(f"📝 Starting punctuation batch processing...")
+        punct_start = time.time()
         final_texts = apply_punctuation_batch(gec_corrected_texts)
+        punct_time = (time.time() - punct_start) * 1000
+        logger.info(f"✓ Punctuation completed in {punct_time:.1f}ms")
         # Mark texts that were too long
         corrected_texts = []
         # Calculate processing time
         processing_time = (time.time() - start_time) * 1000
+        logger.info(f"✅ Batch completed: {len(corrected_texts)} texts in {processing_time:.1f}ms (avg {processing_time/len(corrected_texts):.1f}ms/text)")
         response = BatchCorrectionResponse(
             success=True,
             corrected_texts=corrected_texts