Spaces:

SonFox2920
/

CV-resume_scoring

Sleeping

App Files Community

SonFox2920 committed on Mar 11

Commit

9cde47b

verified ·

1 Parent(s): 7827c20

Update analyze.py

Browse files

Files changed (1) hide show

analyze.py +182 -42

analyze.py CHANGED Viewed

@@ -3,6 +3,7 @@ import pandas as pd
 import plotly.express as px
 import plotly.graph_objects as go
 from plotly.subplots import make_subplots
 # Hàm để tải và xử lý dữ liệu
 @st.cache_data
@@ -65,11 +66,42 @@ def plot_criteria_comparison(df):
 # Hàm tạo biểu đồ phân bố ứng viên theo khoảng điểm
 def plot_score_range_distribution(df):
     df['Khoảng điểm'] = pd.cut(df['Điểm tổng quát'], bins=[0, 2, 4, 6, 8, 10], labels=['0-2', '2-4', '4-6', '6-8', '8-10'])
-    fig = px.bar(df['Khoảng điểm'].value_counts().sort_index(), title="Phân bố ứng viên theo khoảng điểm")
     fig.update_xaxes(title="Khoảng điểm")
     fig.update_yaxes(title="Số lượng ứng viên")
     return fig
 def dashboard():
     # Tiêu đề ứng dụng
     st.header("📈 Dashboard Phân tích Ứng viên")
@@ -81,63 +113,171 @@ def dashboard():
         # Tải dữ liệu
         df = load_data(uploaded_file)
         # Thông tin tổng quan
         st.header("📊 Thông tin tổng quan")
         col1, col2, col3, col4 = st.columns(4)
         col1.metric("Tổng số ứng viên", len(df))
-        col2.metric("Điểm trung bình", f"{df['Điểm tổng quát'].mean():.2f}")
-        col3.metric("Điểm cao nhất", df['Điểm tổng quát'].max())
-        col4.metric("Điểm thấp nhất", df['Điểm tổng quát'].min())
-        # Phân phối điểm và Ma trận tương quan
-        st.header("📈 Phân tích điểm số")
-        col1, col2 = st.columns(2)
-        with col1:
-            st.plotly_chart(plot_score_distribution(df, 'Điểm tổng quát'), use_container_width=True)
-        with col2:
-            st.plotly_chart(plot_correlation_heatmap(df), use_container_width=True)
-        # Phân tích đánh giá theo tiêu chí
-        st.header("🔬 Phân tích đánh giá theo tiêu chí")
-        st.plotly_chart(plot_criteria_comparison(df), use_container_width=True)
-        # Phân bố ứng viên theo khoảng điểm
-        st.plotly_chart(plot_score_range_distribution(df), use_container_width=True)
         # Biểu đồ radar cho từng ứng viên
-        st.header("🎯 Biểu đồ kỹ năng ứng viên")
-        col1, col2 = st.columns([1, 3])
-        with col1:
-            selected_candidate = st.selectbox("Chọn ứng viên", df['Tên ứng viên'].tolist())
-            candidate_summary = df[df['Tên ứng viên'] == selected_candidate]['Tóm tắt'].values[0]
-            st.subheader("Tóm tắt ứng viên")
-            st.write(candidate_summary)
-        with col2:
-            st.plotly_chart(plot_candidate_radar(df, selected_candidate), use_container_width=True)
         # Lọc và sắp xếp ứng viên
         st.header("🔍 Lọc và sắp xếp ứng viên")
-        col1, col2 = st.columns(2)
-        with col1:
-            min_score = st.slider("Điểm tổng quát tối thiểu", 0.0, 10.0, 0.0)
-        with col2:
-            sort_by = st.selectbox("Sắp xếp theo", ['Điểm tổng quát', 'Mức độ phù hợp', 'Kỹ năng kỹ thuật', 'Kinh nghiệm', 'Trình độ học vấn', 'Kỹ năng mềm'])
-        filtered_df = df[df['Điểm tổng quát'] >= min_score].sort_values(sort_by, ascending=False)
-        st.dataframe(filtered_df[['Tên ứng viên', 'Điểm tổng quát', 'Mức độ phù hợp', 'Kỹ năng kỹ thuật', 'Kinh nghiệm', 'Trình độ học vấn', 'Kỹ năng mềm', 'Link ứng viên']], column_config={
-        "Link ứng viên": st.column_config.LinkColumn()
-                }
-            )
         # Top ứng viên
-        st.header("🏆 Top ứng viên theo điểm tổng quát")
-        top_n = st.slider("Số lượng ứng viên hàng đầu", 1, 20, 5)
-        top_candidates = df.sort_values('Điểm tổng quát', ascending=False).head(top_n)
-        st.table(top_candidates[['Tên ứng viên', 'Điểm tổng quát', 'Mức độ phù hợp', 'Kỹ năng kỹ thuật', 'Kinh nghiệm', 'Trình độ học vấn', 'Kỹ năng mềm', 'Link ứng viên']])
         # Dữ liệu chi tiết
-        st.header("📋 Dữ liệu chi tiết")
-        st.dataframe(df)
     else:
         st.info("Vui lòng upload file CSV để bắt đầu phân tích.")

 import plotly.express as px
 import plotly.graph_objects as go
 from plotly.subplots import make_subplots
+import numpy as np
 # Hàm để tải và xử lý dữ liệu
 @st.cache_data
 # Hàm tạo biểu đồ phân bố ứng viên theo khoảng điểm
 def plot_score_range_distribution(df):
     df['Khoảng điểm'] = pd.cut(df['Điểm tổng quát'], bins=[0, 2, 4, 6, 8, 10], labels=['0-2', '2-4', '4-6', '6-8', '8-10'])
+    counts = df['Khoảng điểm'].value_counts().sort_index()
+    fig = px.bar(counts, title="Phân bố ứng viên theo khoảng điểm")
     fig.update_xaxes(title="Khoảng điểm")
     fig.update_yaxes(title="Số lượng ứng viên")
     return fig
+# Hàm tạo biểu đồ phân bố ứng viên theo giai đoạn
+def plot_stage_distribution(df):
+    if 'Giai đoạn' in df.columns:
+        fig = px.bar(df['Giai đoạn'].value_counts().sort_index(),
+                    title="Phân bố ứng viên theo giai đoạn tuyển dụng")
+        fig.update_xaxes(title="Giai đoạn")
+        fig.update_yaxes(title="Số lượng ứng viên")
+        return fig
+    return None
+# Hàm tạo biểu đồ điểm trung bình theo giai đoạn
+def plot_avg_score_by_stage(df):
+    if 'Giai đoạn' in df.columns:
+        avg_scores = df.groupby('Giai đoạn')['Điểm tổng quát'].mean().sort_values(ascending=False)
+        fig = px.bar(avg_scores, title="Điểm trung bình theo giai đoạn tuyển dụng")
+        fig.update_xaxes(title="Giai đoạn")
+        fig.update_yaxes(title="Điểm trung bình")
+        return fig
+    return None
+# Hàm tạo biểu đồ heatmap so sánh điểm trung bình các tiêu chí theo giai đoạn
+def plot_criteria_by_stage_heatmap(df):
+    if 'Giai đoạn' in df.columns:
+        criteria = ['Mức độ phù hợp', 'Kỹ năng kỹ thuật', 'Kinh nghiệm', 'Trình độ học vấn', 'Kỹ năng mềm']
+        pivot_df = df.pivot_table(index='Giai đoạn', values=criteria)
+        fig = px.imshow(pivot_df, text_auto=True, aspect="auto", color_continuous_scale="Blues",
+                        title="Điểm trung bình các tiêu chí theo giai đoạn")
+        return fig
+    return None
 def dashboard():
     # Tiêu đề ứng dụng
     st.header("📈 Dashboard Phân tích Ứng viên")
         # Tải dữ liệu
         df = load_data(uploaded_file)
+        # Kiểm tra và chuyển đổi các cột số nếu cần
+        numeric_columns = ['Mức độ phù hợp', 'Kỹ năng kỹ thuật', 'Kinh nghiệm',
+                          'Trình độ học vấn', 'Kỹ năng mềm', 'Điểm tổng quát']
+        for col in numeric_columns:
+            if col in df.columns:
+                df[col] = pd.to_numeric(df[col], errors='coerce')
         # Thông tin tổng quan
         st.header("📊 Thông tin tổng quan")
         col1, col2, col3, col4 = st.columns(4)
         col1.metric("Tổng số ứng viên", len(df))
+        if 'Điểm tổng quát' in df.columns:
+            avg_score = df['Điểm tổng quát'].mean()
+            max_score = df['Điểm tổng quát'].max()
+            min_score = df['Điểm tổng quát'].min()
+            col2.metric("Điểm trung bình", f"{avg_score:.2f}")
+            col3.metric("Điểm cao nhất", f"{max_score:.2f}")
+            col4.metric("Điểm thấp nhất", f"{min_score:.2f}")
+        # Phân tích theo giai đoạn (mới)
+        if 'Giai đoạn' in df.columns:
+            st.header("🔄 Phân tích theo giai đoạn tuyển dụng")
+            col1, col2 = st.columns(2)
+            with col1:
+                stage_chart = plot_stage_distribution(df)
+                if stage_chart:
+                    st.plotly_chart(stage_chart, use_container_width=True)
+            with col2:
+                avg_score_chart = plot_avg_score_by_stage(df)
+                if avg_score_chart:
+                    st.plotly_chart(avg_score_chart, use_container_width=True)
+            # Biểu đồ heatmap các tiêu chí theo giai đoạn
+            criteria_stage_chart = plot_criteria_by_stage_heatmap(df)
+            if criteria_stage_chart:
+                st.plotly_chart(criteria_stage_chart, use_container_width=True)
+        # Phân phối điểm và Ma trận tương quan
+        if 'Điểm tổng quát' in df.columns:
+            st.header("📈 Phân tích điểm số")
+            col1, col2 = st.columns(2)
+            with col1:
+                st.plotly_chart(plot_score_distribution(df, 'Điểm tổng quát'), use_container_width=True)
+            with col2:
+                try:
+                    st.plotly_chart(plot_correlation_heatmap(df), use_container_width=True)
+                except Exception as e:
+                    st.warning(f"Không thể tạo ma trận tương quan: {e}")
+            # Phân tích đánh giá theo tiêu chí
+            st.header("🔬 Phân tích đánh giá theo tiêu chí")
+            try:
+                st.plotly_chart(plot_criteria_comparison(df), use_container_width=True)
+            except Exception as e:
+                st.warning(f"Không thể tạo biểu đồ so sánh tiêu chí: {e}")
+            # Phân bố ứng viên theo khoảng điểm
+            try:
+                st.plotly_chart(plot_score_range_distribution(df), use_container_width=True)
+            except Exception as e:
+                st.warning(f"Không thể tạo biểu đồ phân bố khoảng điểm: {e}")
         # Biểu đồ radar cho từng ứng viên
+        if 'Tên ứng viên' in df.columns:
+            st.header("🎯 Biểu đồ kỹ năng ứng viên")
+            col1, col2 = st.columns([1, 3])
+            with col1:
+                selected_candidate = st.selectbox("Chọn ứng viên", df['Tên ứng viên'].tolist())
+                if 'Tóm tắt' in df.columns:
+                    candidate_summary = df[df['Tên ứng viên'] == selected_candidate]['Tóm tắt'].values[0]
+                    st.subheader("Tóm tắt ứng viên")
+                    st.write(candidate_summary)
+            with col2:
+                try:
+                    st.plotly_chart(plot_candidate_radar(df, selected_candidate), use_container_width=True)
+                except Exception as e:
+                    st.warning(f"Không thể tạo biểu đồ radar: {e}")
         # Lọc và sắp xếp ứng viên
         st.header("🔍 Lọc và sắp xếp ứng viên")
+        # Cấu hình các bộ lọc
+        filter_columns = st.columns(3)
+        with filter_columns[0]:
+            # Tùy chọn lọc theo điểm
+            if 'Điểm tổng quát' in df.columns:
+                min_score = st.slider("Điểm tổng quát tối thiểu",
+                                     float(df['Điểm tổng quát'].min()),
+                                     float(df['Điểm tổng quát'].max()),
+                                     float(df['Điểm tổng quát'].min()))
+            else:
+                min_score = 0
+        with filter_columns[1]:
+            # Sắp xếp theo
+            sort_options = [col for col in df.columns if col in
+                          ['Điểm tổng quát', 'Mức độ phù hợp', 'Kỹ năng kỹ thuật',
+                           'Kinh nghiệm', 'Trình độ học vấn', 'Kỹ năng mềm']]
+            if sort_options:
+                sort_by = st.selectbox("Sắp xếp theo", sort_options)
+            else:
+                sort_by = None
+        with filter_columns[2]:
+            # Lọc theo giai đoạn
+            if 'Giai đoạn' in df.columns and not df['Giai đoạn'].isna().all():
+                stages = ['Tất cả'] + list(df['Giai đoạn'].dropna().unique())
+                selected_stage = st.selectbox("Giai đoạn", stages)
+            else:
+                selected_stage = 'Tất cả'
+        # Áp dụng các bộ lọc
+        filtered_df = df.copy()
+        if 'Điểm tổng quát' in filtered_df.columns:
+            filtered_df = filtered_df[filtered_df['Điểm tổng quát'] >= min_score]
+        if selected_stage != 'Tất cả' and 'Giai đoạn' in filtered_df.columns:
+            filtered_df = filtered_df[filtered_df['Giai đoạn'] == selected_stage]
+        if sort_by and sort_by in filtered_df.columns:
+            filtered_df = filtered_df.sort_values(sort_by, ascending=False)
+        # Hiển thị dữ liệu đã lọc
+        display_columns = ['Tên ứng viên']
+        if 'Điểm tổng quát' in df.columns:
+            display_columns.append('Điểm tổng quát')
+        score_columns = [col for col in df.columns if col in
+                       ['Mức độ phù hợp', 'Kỹ năng kỹ thuật', 'Kinh nghiệm',
+                        'Trình độ học vấn', 'Kỹ năng mềm']]
+        display_columns.extend(score_columns)
+        if 'Giai đoạn' in df.columns:
+            display_columns.append('Giai đoạn')
+        if 'Link ứng viên' in df.columns:
+            display_columns.append('Link ứng viên')
+        # Chỉ hiển thị các cột có trong DataFrame
+        display_columns = [col for col in display_columns if col in filtered_df.columns]
+        column_config = {}
+        if 'Link ứng viên' in display_columns:
+            column_config["Link ứng viên"] = st.column_config.LinkColumn()
+        st.dataframe(filtered_df[display_columns], column_config=column_config)
         # Top ứng viên
+        if 'Điểm tổng quát' in df.columns:
+            st.header("🏆 Top ứng viên theo điểm tổng quát")
+            top_n = st.slider("Số lượng ứng viên hàng đầu", 1, min(20, len(df)), 5)
+            top_candidates = df.sort_values('Điểm tổng quát', ascending=False).head(top_n)
+            st.table(top_candidates[display_columns])
         # Dữ liệu chi tiết
+        with st.expander("📋 Xem tất cả dữ liệu chi tiết"):
+            st.dataframe(df)
     else:
         st.info("Vui lòng upload file CSV để bắt đầu phân tích.")