Spaces:

ngrigg
/

test

Sleeping

ngrigg committed on Jul 24, 2024

Commit

cfa4436

1 Parent(s): 8270298

Fix processing to handle subset of descriptions and match DataFrame length

Files changed (1) hide show

app.py CHANGED Viewed

@@ -12,15 +12,18 @@ async def process_csv(file):
     df = pd.read_csv(file, header=None)  # Read the CSV file without a header
     descriptions = df[0].tolist()  # Access the first column directly
     SAMPLE_SIZE = min(5, len(descriptions))  # Adjust sample size as needed
-    descriptions = descriptions[:SAMPLE_SIZE]
-    model_name = "instruction-pretrain/finance-Llama3-8B"  # Ensure this is the correct model name
     results = []
-    for desc in descriptions:
         result = await process_text(model_name, desc)
         results.append(result)
     df['predictions'] = results
     return df

     df = pd.read_csv(file, header=None)  # Read the CSV file without a header
     descriptions = df[0].tolist()  # Access the first column directly
     SAMPLE_SIZE = min(5, len(descriptions))  # Adjust sample size as needed
+    descriptions_subset = descriptions[:SAMPLE_SIZE]
+    model_name = "instruction-pretrain/finance-Llama3-8B"  # or any other model you want to use
     results = []
+    for desc in descriptions_subset:
         result = await process_text(model_name, desc)
         results.append(result)
+    # Fill the rest of the results with empty strings to match the length of the DataFrame
+    results.extend([''] * (len(descriptions) - SAMPLE_SIZE))
     df['predictions'] = results
     return df