Spaces:

omer15699
/

tweet-UI

Sleeping

App Files Community

omer15699 committed on Sep 5

Commit

a54bd7b

verified ·

1 Parent(s): 450b693

Update app.py

Browse files

Files changed (1) hide show

app.py +1 -4

app.py CHANGED Viewed

@@ -34,25 +34,23 @@ def _l2norm(x: np.ndarray) -> np.ndarray:
         x = x.reshape(1, -1)
     return x / (np.linalg.norm(x, axis=1, keepdims=True) + 1e-12)
 # -------- Load sample data once (FAST: only a slice) --------
 @functools.lru_cache(maxsize=1)
 def load_sample_df():
     import pandas as pd
-    # 1) נסיון ראשון: sentiment140 קטן מראש
     try:
         from datasets import load_dataset
         ds = load_dataset("sentiment140", split=f"train[:{SAMPLE_SIZE}]")
         df = ds.to_pandas()
     except Exception:
-        # 2) נסיון שני: tweet_eval (עוד יותר קטן/אמין)
         try:
             from datasets import load_dataset
             ds = load_dataset("tweet_eval", "sentiment", split=f"train[:{SAMPLE_SIZE}]")
             df = ds.to_pandas().rename(columns={"text": "text"})
         except Exception:
-            # 3) פולבאק אחרון: רשימת טקסטים קטנה מקומית (כדי שה-UI ירוץ בכל מקרה)
             fallback_texts = [
                 "I love this product!", "This is terrible...", "Best purchase ever",
                 "Pretty good overall", "I am not happy with the service",
@@ -61,7 +59,6 @@ def load_sample_df():
             ]
             return pd.DataFrame({"text": fallback_texts, "clean_text": fallback_texts})
-    # ניקוי קל ושימור רק טקסט
     df = df.dropna(subset=["text"]).copy()
     df["text_length"] = df["text"].astype(str).str.len()
     df = df[(df["text_length"] >= 5) & (df["text_length"] <= 280)].copy()

         x = x.reshape(1, -1)
     return x / (np.linalg.norm(x, axis=1, keepdims=True) + 1e-12)
 # -------- Load sample data once (FAST: only a slice) --------
 @functools.lru_cache(maxsize=1)
 def load_sample_df():
     import pandas as pd
     try:
         from datasets import load_dataset
         ds = load_dataset("sentiment140", split=f"train[:{SAMPLE_SIZE}]")
         df = ds.to_pandas()
     except Exception:
         try:
             from datasets import load_dataset
             ds = load_dataset("tweet_eval", "sentiment", split=f"train[:{SAMPLE_SIZE}]")
             df = ds.to_pandas().rename(columns={"text": "text"})
         except Exception:
             fallback_texts = [
                 "I love this product!", "This is terrible...", "Best purchase ever",
                 "Pretty good overall", "I am not happy with the service",
             ]
             return pd.DataFrame({"text": fallback_texts, "clean_text": fallback_texts})
     df = df.dropna(subset=["text"]).copy()
     df["text_length"] = df["text"].astype(str).str.len()
     df = df[(df["text_length"] >= 5) & (df["text_length"] <= 280)].copy()