kusa04 commited on
Commit
1d43e3c
·
verified ·
1 Parent(s): 2a185f2

Update functions.py

Browse files
Files changed (1) hide show
  1. functions.py +12 -5
functions.py CHANGED
@@ -16,8 +16,6 @@ from transformers import (
16
  )
17
  from transformers.pipelines import AggregationStrategy
18
 
19
-
20
-
21
  # Function to normalize text by replacing multiple spaces/newlines with a single space
22
  def normalize_text(text):
23
  if not isinstance(text, str):
@@ -78,15 +76,24 @@ def safe_sentiment(sentiment_pipeline, text):
78
  return result
79
 
80
 
 
 
 
 
 
 
 
81
  def analyze_detail(text, tokenizer, sentiment_pipeline, max_tokens):
82
  text = preprocess_text(text)
83
  chunks = split_text_by_token_limit(text, tokenizer, max_tokens)
84
  if not chunks:
85
  return None
86
- # Initialize accumulated scores for each sentiment category
 
 
 
87
  scores = {"POSITIVE": 0, "NEGATIVE": 0, "NEUTRAL": 0}
88
- for chunk in chunks:
89
- result = safe_sentiment(chunk)
90
  if result is not None:
91
  label = result['label'].upper()
92
  if label in scores:
 
16
  )
17
  from transformers.pipelines import AggregationStrategy
18
 
 
 
19
  # Function to normalize text by replacing multiple spaces/newlines with a single space
20
  def normalize_text(text):
21
  if not isinstance(text, str):
 
76
  return result
77
 
78
 
79
def safe_sentiment_batch(sentiment_pipeline, texts):
    """Run the sentiment pipeline on a batch of texts without raising.

    Parameters:
        sentiment_pipeline: callable applied to the whole list of texts
            (e.g. a transformers text-classification pipeline).
        texts: list of text chunks to classify in a single batched call.

    Returns:
        The pipeline's per-text results on success, or ``[None] * len(texts)``
        when the batched call raises — callers are expected to skip ``None``
        entries, so a whole-batch failure degrades gracefully instead of
        aborting the analysis.
    """
    try:
        return sentiment_pipeline(texts)
    except Exception:
        # Deliberate best-effort: any pipeline failure (tokenization, OOM,
        # model error) yields placeholders rather than propagating.
        # Original bound the exception as `e` but never used it.
        return [None] * len(texts)
86
  def analyze_detail(text, tokenizer, sentiment_pipeline, max_tokens):
87
  text = preprocess_text(text)
88
  chunks = split_text_by_token_limit(text, tokenizer, max_tokens)
89
  if not chunks:
90
  return None
91
+ # ここでバッチ処理を実行(チャンク全体を一括推論)
92
+ results = safe_sentiment_batch(sentiment_pipeline, chunks)
93
+
94
+ # 各チャンクの結果を集計
95
  scores = {"POSITIVE": 0, "NEGATIVE": 0, "NEUTRAL": 0}
96
+ for result in results:
 
97
  if result is not None:
98
  label = result['label'].upper()
99
  if label in scores: