ming committed
Commit · db3b809
1 Parent(s): 45b6536
chore: code formatting improvements and update gitignore
- Format structured_summarizer.py with proper line breaks
- Add test output files to .gitignore
- Update V4_TESTING_LEARNINGS.md
- .gitignore +4 -0
- V4_TESTING_LEARNINGS.md +3 -0
- app/services/structured_summarizer.py +9 -5
.gitignore
CHANGED
@@ -59,3 +59,7 @@ Thumbs.db
 
 # Docker
 .dockerignore
+
+# Test output files
+*_test_output.txt
+*_scraping_test.txt
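
Both new entries are basename globs that require a stem before the underscore. A minimal sketch of what they do and do not catch, using hypothetical file names (Python's fnmatch behaves like git's glob for slash-free names):

from fnmatch import fnmatch

# The two patterns added to .gitignore above.
patterns = ["*_test_output.txt", "*_scraping_test.txt"]

# Hypothetical file names, not taken from the repo.
candidates = [
    "ndjson_test_output.txt",  # stem before "_test_output" -> ignored
    "hn_scraping_test.txt",    # stem before "_scraping_test" -> ignored
    "test_output.txt",         # no stem, suffix alone doesn't match -> tracked
]

for name in candidates:
    ignored = any(fnmatch(name, p) for p in patterns)
    print(f"{name}: {'ignored' if ignored else 'tracked'}")
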
V4_TESTING_LEARNINGS.md
CHANGED
@@ -252,3 +252,6 @@ ENABLE_V4_WARMUP=true
 **Best Overall**: 3B + NDJSON (once streaming issues resolved)
 **Most Reliable**: 3B + Outlines JSON (slower but works)
 
+
+
+
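
The "streaming issues" noted against the NDJSON variant are the classic failure mode of newline-delimited JSON over a chunked transport: a record can be split across chunks, and the final line may arrive without a terminating newline. A minimal, library-free sketch of defensive buffering, not code from this repo (function and variable names are illustrative):

import json

def parse_ndjson_stream(chunks):
    """Yield one dict per complete JSON line; tolerate a truncated tail."""
    buffer = ""
    for chunk in chunks:
        buffer += chunk
        # Emit every newline-terminated record as soon as it is complete.
        while "\n" in buffer:
            line, buffer = buffer.split("\n", 1)
            if line.strip():
                yield json.loads(line)
    # Whatever remains has no terminating newline; only emit it if it
    # parses cleanly, since it may be a cut-off record.
    if buffer.strip():
        try:
            yield json.loads(buffer)
        except json.JSONDecodeError:
            pass  # incomplete final record: drop rather than crash

# Example: two complete records split awkwardly across chunks.
chunks = ['{"title": "A"}\n{"sco', 're": 1}\n']
print(list(parse_ndjson_stream(chunks)))  # [{'title': 'A'}, {'score': 1}]
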
app/services/structured_summarizer.py
CHANGED
@@ -90,14 +90,20 @@ class StructuredSummarizer:
 
         # Decide device / quantization strategy
         use_cuda = torch.cuda.is_available()
-        use_mps = torch.backends.mps.is_available() if hasattr(torch.backends, "mps") else False
+        use_mps = (
+            torch.backends.mps.is_available()
+            if hasattr(torch.backends, "mps")
+            else False
+        )
         use_gpu = use_cuda or use_mps
         quantization_desc = "None"
 
         if use_cuda:
             logger.info("CUDA is available. Using NVIDIA GPU for V4 model.")
         elif use_mps:
-            logger.info("MPS (Metal Performance Shaders) is available. Using Apple Silicon GPU for V4 model.")
+            logger.info(
+                "MPS (Metal Performance Shaders) is available. Using Apple Silicon GPU for V4 model."
+            )
         else:
             logger.info("No GPU available. V4 model will run on CPU.")
 
@@ -170,9 +176,7 @@ class StructuredSummarizer:
 
         if use_mps:
             # MPS fallback: Load without device_map, manually move to MPS
-            logger.info(
-                f"Loading V4 model for MPS with dtype={base_dtype}"
-            )
+            logger.info(f"Loading V4 model for MPS with dtype={base_dtype}")
             self.model = AutoModelForCausalLM.from_pretrained(
                 settings.v4_model_id,
                 torch_dtype=base_dtype,
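
Taken together, the two hunks implement a detect-then-fallback pattern: probe for CUDA first, then MPS (guarded with hasattr for older torch builds that predate the backend), and on MPS load the model without device_map and move it to the device manually. A standalone sketch of that pattern, not the repo's code (the model id and dtype are placeholder assumptions standing in for settings.v4_model_id and base_dtype):

import torch
from transformers import AutoModelForCausalLM

use_cuda = torch.cuda.is_available()
# hasattr guard: torch.backends.mps does not exist on older torch builds.
use_mps = (
    torch.backends.mps.is_available()
    if hasattr(torch.backends, "mps")
    else False
)

model = AutoModelForCausalLM.from_pretrained(
    "placeholder/model-id",     # assumption: stands in for settings.v4_model_id
    torch_dtype=torch.float16,  # assumption: stands in for base_dtype
)
if use_mps:
    # MPS path: skip device_map and move the loaded model to Metal manually,
    # mirroring the fallback in the diff above.
    model = model.to("mps")
elif use_cuda:
    model = model.to("cuda")
# Otherwise the model stays on CPU.
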