TEST-GIZ-Project-Search

Sleeping

annikwag committed on Mar 4

Commit

ba7bdf1

verified ·

1 Parent(s): 8598201

Update appStore/prep_data.py

Files changed (1) hide show

appStore/prep_data.py CHANGED Viewed

@@ -100,8 +100,12 @@ def process_giz_worldwide():
     giz_df['url'] = ''
     # Convert CRS value to numeric then to integer if possible.
     if 'crs_key' in giz_df.columns:
-        giz_df['crs_key'] = giz_df['crs_key'].apply(lambda x: str(int(float(x))) if pd.notnull(x) and str(x).strip() != "" else x)
     # Compute text_size based on merged_text and assign full text to the 'chunks' column
     giz_df['text_size'] = giz_df['merged_text'].apply(lambda text: len(text.split()) if isinstance(text, str) else 0)

     giz_df['url'] = ''
     # Convert CRS value to numeric then to integer if possible.
+    # After reading the JSON file into giz_df, convert the crs_key column:
     if 'crs_key' in giz_df.columns:
+        giz_df['crs_key'] = giz_df['crs_key'].apply(
+            lambda x: str(int(float(x))).replace('.0', '') if pd.notnull(x) and str(x).strip() != "" else x
+        )
     # Compute text_size based on merged_text and assign full text to the 'chunks' column
     giz_df['text_size'] = giz_df['merged_text'].apply(lambda text: len(text.split()) if isinstance(text, str) else 0)