GMARTINEZMILLA committed on
Commit
8541c9c
·
1 Parent(s): a383324

feat: generated files

Browse files
Files changed (1) hide show
  1. app.py +13 -4
app.py CHANGED
@@ -125,11 +125,20 @@ elif page == "Customer Analysis":
125
  # Ensure all values are numeric
126
  sales_data_filtered = sales_data_filtered.apply(pd.to_numeric, errors='coerce')
127
 
128
- # Combine manufacturers data
 
 
 
 
 
 
 
 
 
129
  combined_data = pd.DataFrame({
130
- 'units': all_manufacturers[all_manufacturers.columns[0]],
131
- 'sales': sales_data_filtered[sales_data_filtered.columns[0]]
132
- })
133
 
134
  # Sort by units, then by sales
135
  combined_data_sorted = combined_data.sort_values(by=['units', 'sales'], ascending=False)
 
125
  # Ensure all values are numeric
126
  sales_data_filtered = sales_data_filtered.apply(pd.to_numeric, errors='coerce')
127
 
128
+ # Sort manufacturers by percentage of units and get top 10
129
+ top_units = all_manufacturers.sort_values(by=all_manufacturers.columns[0], ascending=False).head(10)
130
+
131
+ # Sort manufacturers by total sales and get top 10
132
+ top_sales = sales_data_filtered.sort_values(by=sales_data_filtered.columns[0], ascending=False).head(10)
133
+
134
+ # Combine top manufacturers from both lists and get up to 20 unique manufacturers
135
+ combined_top = pd.concat([top_units, top_sales]).index.unique()[:20]
136
+
137
+ # Create a DataFrame with combined data for these top manufacturers
138
  combined_data = pd.DataFrame({
139
+ 'units': all_manufacturers.loc[combined_top, all_manufacturers.columns[0]],
140
+ 'sales': sales_data_filtered.loc[combined_top, sales_data_filtered.columns[0]]
141
+ }).fillna(0)
142
 
143
  # Sort by units, then by sales
144
  combined_data_sorted = combined_data.sort_values(by=['units', 'sales'], ascending=False)