Spaces:

ziem-io
/

whisky-wheel

Running on CPU Upgrade

App Files Files

ziem-io committed on Sep 29

Commit

ba84108

1 Parent(s): ec632c7

Update: Codestyle

Browse files

Files changed (1) hide show

app.py +31 -35

app.py CHANGED Viewed

@@ -1,42 +1,38 @@
 # Standardbibliotheken
-import os        # Umgebungsvariablen (z.B. HF_TOKEN)
-import types     # für Instanz-Monkeypatch (fastText .predict)
-import html      # HTML-Escaping für Ausgabe/Gradio
-import numpy as np  # Numerik (z.B. für Wahrscheinlichkeiten)
-import time
-import random
 # Machine Learning / NLP
-import torch                      # PyTorch (Model, Tensor, Device)
-import fasttext                   # Sprach-ID (lid.176)
-# Diese beiden werden oft nicht direkt aufgerufen, müssen aber installiert sein,
-# damit Hugging Face/Tokenizer korrekt funktionieren (SentencePiece-Backends, Converter).
-import sentencepiece              # Required für SentencePiece-basierte Tokenizer (DeBERTa v3)
-import tiktoken                   # Optionaler Converter; verhindert Fallback-Fehler/Warnungen
-from langid.langid import LanguageIdentifier, model
-# Hugging Face / Ökosystem
-import spaces
-from transformers import AutoTokenizer   # Tokenizer-Lader (mit use_fast=False für SentencePiece)
-from huggingface_hub import hf_hub_download  # Dateien/Weights aus dem HF Hub laden
-from safetensors.torch import load_file      # Sicheres & schnelles Laden von Weights (.safetensors)
 # UI / Serving
-import gradio as gr               # Web-UI für Demo/Spaces
-import deepl
 # Projektspezifische Module
 from lib.bert_regressor import BertMultiHeadRegressor
 from lib.bert_regressor_utils import (
-    #load_model_and_tokenizer,
-    predict_flavours,
-    #predict_is_review,
-    #TARGET_COLUMNS,
-    #ICONS
 )
-from lib.wheel import build_svg_with_values
-from lib.examples import EXAMPLES
 ### Settings ####################################################################
@@ -76,14 +72,14 @@ model_flavours.to(device).eval()
 ID = LanguageIdentifier.from_modelstring(model, norm_probs=True)
-def is_eng(text: str, min_chars: int = 6, threshold: float = 0.1):
     t = (text or "").strip()
     if len(t) < min_chars:
         return True, 0.0
     lang, prob = ID.classify(t)  # prob ∈ [0,1]
     return (lang == "en" and prob >= threshold), float(prob)
-def translate_en(text: str, target_lang: str = "EN-GB"):
     deepl_client = deepl.Translator(DEEPL_API_KEY)
     result = deepl_client.translate_text(text, target_lang=target_lang)
     return result.text
@@ -102,11 +98,11 @@ def predict(review: str):
         return "Please enter a review.", {}
     # Check for lang of text
-    review_is_eng, review_lang_prob = is_eng(review)
     # Translate the text to English if it is not already English
     if not review_is_eng:
-        review = translate_en(review)
         html_out += f"""<div style='border-radius: 2px; padding: 1px 5px; background-color: rgb(255, 237, 213);'>Your text has been automatically translated</div>
         <p>{review}</p>
         """
@@ -146,7 +142,7 @@ def predict(review: str):
 def random_text():
     return random.choice(EXAMPLES)
-def get_device_info():
     if torch.cuda.is_available():
         return f"<span style='border-radius: 2px; padding: 1px 5px; background-color: rgb(220, 252, 231);'>Runs on GPU: {torch.cuda.get_device_name(0)}</span>"
     else:
@@ -167,7 +163,7 @@ with gr.Blocks(css=custom_css) as demo:
     <h3>Automatically turns Whisky Tasting Notes into Flavour Wheels.</h3>
     <p>This model is a fine-tuned version of <a href='https://huggingface.co/microsoft/deberta-v3-base'>microsoft/deberta-v3-base</a> designed to analyze English whisky tasting notes. It predicts the intensity of eight sensory categories — <strong>grainy</strong>, <strong>grassy</strong>, <strong>fragrant</strong>, <strong>fruity</strong>, <strong>peated</strong>, <strong>woody</strong>, <strong>winey</strong> and <strong>off-notes</strong> — on a continuous scale from 0 (none) to 4 (extreme).</p>
 """)
-    gr.HTML(f"<span style='color: var(--block-title-text-color)'>{get_device_info()}</span>")
     with gr.Row():  # alles nebeneinander
         with gr.Column(scale=1):  # linke Seite: Input

 # Standardbibliotheken
+import os          # Umgebungsvariablen (z.B. HF_TOKEN)
+import time        # Timing / Performance-Messung
+import random      # Zufallswerte (z.B. Beispiel-Reviews)
+import html        # HTML-Escaping für sichere Ausgabe in Gradio
+import types       # Monkeypatching von Instanzen (fastText .predict)
+import numpy as np # Numerische Arrays und Wahrscheinlichkeiten
 # Machine Learning / NLP
+import torch       # PyTorch: Modelle, Tensoren, Devices
+import fasttext    # Sprach-ID-Modell (lid.176)
+# Folgende sind notwendig, auch wenn sie nicht explizit genutzt werden:
+import sentencepiece  # Pflicht für SentencePiece-basierte Tokenizer (z.B. DeBERTa v3)
+import tiktoken       # Optionaler Converter (verhindert Fallback-Fehler bei Tokenizer)
+from langid.langid import LanguageIdentifier, model  # Alternative Sprach-ID
+# Hugging Face Ökosystem
+import spaces                                     # HF Spaces-Dekoratoren (@spaces.GPU)
+from transformers import AutoTokenizer            # Tokenizer laden (use_fast=False für DeBERTa v3)
+from huggingface_hub import hf_hub_download       # Download von Dateien/Weights aus dem HF Hub
+from safetensors.torch import load_file           # Sicheres & schnelles Laden von Weights (.safetensors)
+# Übersetzung
+import deepl  # DeepL API für automatische Übersetzung
 # UI / Serving
+import gradio as gr  # Web-UI für Demo/Spaces
 # Projektspezifische Module
 from lib.bert_regressor import BertMultiHeadRegressor
 from lib.bert_regressor_utils import (
+    predict_flavours,  # Hauptfunktion: Vorhersage der 8 Aromenachsen
 )
+from lib.wheel import build_svg_with_values       # SVG-Rendering für Flavour Wheel
+from lib.examples import EXAMPLES                 # Beispiel-Reviews (vordefiniert)
 ### Settings ####################################################################
 ID = LanguageIdentifier.from_modelstring(model, norm_probs=True)
+def _is_eng(text: str, min_chars: int = 6, threshold: float = 0.1):
     t = (text or "").strip()
     if len(t) < min_chars:
         return True, 0.0
     lang, prob = ID.classify(t)  # prob ∈ [0,1]
     return (lang == "en" and prob >= threshold), float(prob)
+def _translate_en(text: str, target_lang: str = "EN-GB"):
     deepl_client = deepl.Translator(DEEPL_API_KEY)
     result = deepl_client.translate_text(text, target_lang=target_lang)
     return result.text
         return "Please enter a review.", {}
     # Check for lang of text
+    review_is_eng, review_lang_prob = _is_eng(review)
     # Translate the text to English if it is not already English
     if not review_is_eng:
+        review = _translate_en(review)
         html_out += f"""<div style='border-radius: 2px; padding: 1px 5px; background-color: rgb(255, 237, 213);'>Your text has been automatically translated</div>
         <p>{review}</p>
         """
 def random_text():
     return random.choice(EXAMPLES)
+def _get_device_info():
     if torch.cuda.is_available():
         return f"<span style='border-radius: 2px; padding: 1px 5px; background-color: rgb(220, 252, 231);'>Runs on GPU: {torch.cuda.get_device_name(0)}</span>"
     else:
     <h3>Automatically turns Whisky Tasting Notes into Flavour Wheels.</h3>
     <p>This model is a fine-tuned version of <a href='https://huggingface.co/microsoft/deberta-v3-base'>microsoft/deberta-v3-base</a> designed to analyze English whisky tasting notes. It predicts the intensity of eight sensory categories — <strong>grainy</strong>, <strong>grassy</strong>, <strong>fragrant</strong>, <strong>fruity</strong>, <strong>peated</strong>, <strong>woody</strong>, <strong>winey</strong> and <strong>off-notes</strong> — on a continuous scale from 0 (none) to 4 (extreme).</p>
 """)
+    gr.HTML(f"<span style='color: var(--block-title-text-color)'>{_get_device_info()}</span>")
     with gr.Row():  # alles nebeneinander
         with gr.Column(scale=1):  # linke Seite: Input