Spaces:

Edenhuang
/

Home_work_for_0330

Sleeping

App Files Files Community

Edenhuang commited on 25 days ago

Commit

1529727

verified ·

1 Parent(s): 28477e1

Update app.py

Browse files

Files changed (1) hide show

app.py +197 -318

app.py CHANGED Viewed

@@ -3,354 +3,233 @@ import requests
 from bs4 import BeautifulSoup
 import pandas as pd
 import time
-import random
-from datetime import datetime
-import io
-# Set page configuration
 st.set_page_config(
-    page_title="台灣證券交易所公告擷取工具",
     page_icon="📊",
     layout="wide"
 )
-# App title and description
-st.title("台灣證券交易所公告擷取工具")
-st.markdown("這個應用程式可以擷取台灣證券交易所的公司公告資訊")
-def extract_data_from_html(html_content):
-    """Extract data from HTML content and return as DataFrame"""
-    # Parse HTML content
-    soup = BeautifulSoup(html_content, 'html.parser')
-    # Find the table
-    table = soup.find('table', {'class': 'hasBorder'})
-    # Lists to store data
-    company_codes = []
-    company_names = []
-    announcement_dates = []
-    announcement_times = []
-    subjects = []
-    # If table exists, extract rows
-    if table:
-        # Find all rows in tbody (skip header)
-        tbody = table.find('tbody')
-        if tbody:
-            rows = tbody.find_all('tr')
-        else:
-            rows = table.find_all('tr')[1:] if len(table.find_all('tr')) > 1 else []
-        for row in rows:
-            # Extract cells
-            cells = row.find_all('td')
-            if len(cells) >= 5:
-                # Extract cell data
-                company_codes.append(cells[0].text.strip())
-                company_names.append(cells[1].text.strip())
-                announcement_dates.append(cells[2].text.strip())
-                announcement_times.append(cells[3].text.strip())
-                # Get subject from button title attribute if available
-                subject_cell = cells[4]
-                subject_button = subject_cell.find('button')
-                if subject_button and 'title' in subject_button.attrs:
-                    subjects.append(subject_button['title'].strip())
-                else:
-                    subjects.append(subject_cell.text.strip())
-    # Create DataFrame
-    df = pd.DataFrame({
-        '公司代號': company_codes,
-        '公司簡稱': company_names,
-        '發言日期': announcement_dates,
-        '發言時間': announcement_times,
-        '主旨': subjects
-    })
-    return df
-# Function to extract data from the actual website
-@st.cache_data(ttl=1800)  # Cache data for 30 minutes
-def extract_data_from_website(url="https://mopsov.twse.com.tw/mops/web/t05sr01_1", retries=3):
-    # Rotating User-Agents to avoid detection
-    user_agents = [
-        'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36',
-        'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/15.0 Safari/605.1.15',
-        'Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:90.0) Gecko/20100101 Firefox/90.0',
-        'Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/92.0.4515.107 Safari/537.36'
-    ]
-    # More comprehensive headers
     headers = {
-        'User-Agent': random.choice(user_agents),
-        'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8',
-        'Accept-Language': 'zh-TW,zh;q=0.9,en-US;q=0.8,en;q=0.7',
-        'Accept-Encoding': 'gzip, deflate, br',
-        'Connection': 'keep-alive',
-        'Upgrade-Insecure-Requests': '1',
-        'Sec-Fetch-Dest': 'document',
-        'Sec-Fetch-Mode': 'navigate',
-        'Sec-Fetch-Site': 'none',
-        'Sec-Fetch-User': '?1',
-        'Cache-Control': 'max-age=0'
     }
-    # Get current date in Taiwan format (ROC calendar)
-    now = datetime.now()
-    roc_year = now.year - 1911
-    current_date = f"{roc_year}/{now.month:02d}/{now.day:02d}"
-    for attempt in range(retries):
         try:
-            with st.spinner(f'正在從網站擷取資料... (嘗試 {attempt+1}/{retries})'):
-                # Create a session to maintain cookies
-                session = requests.Session()
-                # Initial visit to homepage to get cookies
-                session.get("https://mopsov.twse.com.tw/mops/web/index", headers=headers, timeout=15)
-                # Small delay to avoid triggering anti-scraping measures
-                time.sleep(random.uniform(1, 3))
-                # Visit the announcements page to get the form structure
-                response = session.get(url, headers=headers, timeout=15)
-                # Another small delay
-                time.sleep(random.uniform(1, 2))
-                # Create form data for POST request to get the announcements
-                # Enhanced form data with more parameters
-                form_data = {
-                    'step': '1',
-                    'firstin': '1',
-                    'off': '1',
-                    'keyword4': '',
-                    'code1': '',
-                    'TYPEK2': '',
-                    'checkbtn': '',
-                    'queryName': 'co_id',
-                    'inpuType': 'co_id',
-                    'TYPEK': 'all',
-                    'co_id': '',
-                    'year': str(roc_year),  # Current ROC year
-                    'month': str(now.month),  # Current month
-                    'day': str(now.day),  # Current day
-                    'b_date': '',
-                    'e_date': '',
-                    'skey': '',
-                    'date1': '',
-                    'date2': '',
-                }
-                # Make POST request
-                post_headers = headers.copy()
-                post_headers['Content-Type'] = 'application/x-www-form-urlencoded'
-                post_headers['Origin'] = 'https://mopsov.twse.com.tw'
-                post_headers['Referer'] = url
-                post_response = session.post(
-                    url,
-                    data=form_data,
-                    headers=post_headers,
-                    timeout=20
-                )
-                # Check if the response seems valid
-                if "hasBorder" in post_response.text and post_response.status_code == 200:
-                    # Parse the HTML content
-                    df = extract_data_from_html(post_response.text)
-                    if not df.empty:
-                        st.success(f'成功擷取 {len(df)} 筆公告資料!')
-                        return df
                     else:
-                        st.info(f'網站回應成功，但找不到公告資料。可能是當日({current_date})尚無公告。')
-                        # Attempt to look for other messages in the response
-                        soup = BeautifulSoup(post_response.text, 'html.parser')
-                        messages = soup.find_all('td', {'class': 'compName'})
-                        if messages:
-                            st.info(f"網站訊息: {messages[0].text.strip()}")
-                        continue
-                else:
-                    st.warning(f'網站返回狀態碼: {post_response.status_code}。嘗試重新連接...')
-                    continue
-        except requests.exceptions.RequestException as e:
-            st.warning(f'請求錯誤 (嘗試 {attempt+1}/{retries}): {str(e)}')
-            time.sleep(2)  # Wait before retrying
         except Exception as e:
-            st.warning(f'處理錯誤 (嘗試 {attempt+1}/{retries}): {str(e)}')
-            time.sleep(2)  # Wait before retrying
-    st.warning(f'嘗試 {retries} 次後仍無法從網站擷取資料，切換到範例資料')
-    return None
-# Example provided in the original code
-default_html_content = """
-<table class="hasBorder"><thead><tr class="tblHead_2"><th width="10%" nowrap="">公司代號</th><th width="10%" nowrap="">公司簡稱</th><th nowrap="">發言日期</th><th width="10%" nowrap="">發言時間</th><th>主旨</th></tr></thead><tbody id="tab2"><tr class="even_2" onmouseover="this.className='mouseOn_2';" onmouseout="this.className='even_2';"><td>7724</td><td>諾亞克</td><td>114/04/01</td><td>00:06:30</td><td class="table02"><button style="width:300px;height:28px;text-align:left;background-color:transparent;border:0;cursor:pointer;" onclick="document.fm_t05sr01_1.step.value='1';document.fm_t05sr01_1.SEQ_NO.value='1';document.fm_t05sr01_1.SPOKE_TIME.value='630';document.fm_t05sr01_1.SPOKE_DATE.value='20250401';document.fm_t05sr01_1.COMPANY_NAME.value='諾亞克';document.fm_t05sr01_1.COMPANY_ID.value='7724';document.fm_t05sr01_1.skey.value='7724202504011';document.fm_t05sr01_1.hhc_co_name.value='諾亞克';openWindow(document.fm_t05sr01_1 ,'');" title="公告本公司董事會決議不分配113年度董事及員工酬勞">公告本公司董事會決議不分配113年度董事......</button></td></tr><tr class="odd_2" onmouseover="this.className='mouseOn_2';" onmouseout="this.className='odd_2';"><td>4117</td><td>普生</td><td>114/04/01</td><td>00:04:31</td><td class="table02"><button style="width:300px;height:28px;text-align:left;background-color:transparent;border:0;cursor:pointer;" onclick="document.fm_t05sr01_1.step.value='1';document.fm_t05sr01_1.SEQ_NO.value='7';document.fm_t05sr01_1.SPOKE_TIME.value='431';document.fm_t05sr01_1.SPOKE_DATE.value='20250401';document.fm_t05sr01_1.COMPANY_NAME.value='普生';document.fm_t05sr01_1.COMPANY_ID.value='4117';document.fm_t05sr01_1.skey.value='4117202503317';document.fm_t05sr01_1.hhc_co_name.value='普生';openWindow(document.fm_t05sr01_1 ,'');" title="公告本公司董事會決議不發放股利">公告本公司董事會決議不發放股利</button></td></tr></tbody></table>
-"""
-# Add date range picker to sidebar
-st.sidebar.header("資料來源選項")
-data_source = st.sidebar.radio(
-    "選擇資料來源",
-    ["從網站擷取資料", "使用範例資料", "貼上HTML代碼"]
-)
-# Date range selector (only visible when fetching from website)
-if data_source == "從網站擷取資料":
-    st.sidebar.subheader("日期選擇")
-    # Calculate ROC year (Taiwan calendar)
-    current_year = datetime.now().year
-    roc_year = current_year - 1911
-    # Date inputs
-    col1, col2 = st.sidebar.columns(2)
-    with col1:
-        year = st.number_input("年度(民國)", min_value=100, max_value=roc_year, value=roc_year)
-    with col2:
-        month = st.number_input("月份", min_value=1, max_value=12, value=datetime.now().month)
-    custom_date = st.sidebar.checkbox("指定日期範圍")
-    if custom_date:
-        start_date = st.sidebar.date_input("起始日期")
-        end_date = st.sidebar.date_input("結束日期")
-# Initialize data frame
-df = None
-# Add progress
-if data_source == "從網站擷取資料":
-    with st.expander("網路連線診斷", expanded=False):
-        st.write("檢查台灣證券交易所網站連線...")
-        try:
-            check_response = requests.get("https://mopsov.twse.com.tw/", timeout=5)
-            st.write(f"網站狀態: {'可連線 ✅' if check_response.status_code == 200 else '無法連線 ❌'}")
-            st.write(f"HTTP 狀態碼: {check_response.status_code}")
-        except Exception as e:
-            st.write(f"網站連線檢查失敗: {e}")
-    fetch_data = st.button("開始擷取資料", type="primary")
-    if fetch_data:
-        # This will be enhanced to use the date parameters when implemented
-        df = extract_data_from_website()
-        if df is None:
-            st.sidebar.warning("從網站擷取資料失敗，切換到範例資料")
-            df = extract_data_from_html(default_html_content)
-elif data_source == "使用範例資料":
-    df = extract_data_from_html(default_html_content)
-else:  # "貼上HTML代碼"
-    html_input = st.sidebar.text_area("貼上HTML代碼", value=default_html_content, height=300)
-    if st.sidebar.button("解析HTML"):
-        df = extract_data_from_html(html_input)
-        st.sidebar.success("HTML解析完成!")
-# Display and filter data
-if df is not None and not df.empty:
-    st.subheader("台灣證券交易所公告資料")
-    # Add search filters
-    col1, col2, col3 = st.columns(3)
     with col1:
-        search_code = st.text_input("依公司代號篩選")
-    with col2:
-        search_name = st.text_input("依公司名稱篩選")
-    with col3:
-        search_subject = st.text_input("依主旨關鍵字篩選")
-    # Apply filters if provided
-    filtered_df = df.copy()
-    if search_code:
-        filtered_df = filtered_df[filtered_df['公司代號'].str.contains(search_code)]
-    if search_name:
-        filtered_df = filtered_df[filtered_df['公司簡稱'].str.contains(search_name)]
-    if search_subject:
-        filtered_df = filtered_df[filtered_df['主旨'].str.contains(search_subject)]
-    # Display the data
-    st.dataframe(filtered_df, use_container_width=True)
-    # Download as CSV
-    csv = filtered_df.to_csv(index=False).encode('utf-8-sig')
-    st.download_button(
-        label="下載為CSV",
-        data=csv,
-        file_name="twse_announcements.csv",
-        mime="text/csv",
     )
-    # Display statistics
-    st.subheader("資料統計")
-    col1, col2, col3 = st.columns(3)
-    with col1:
-        st.metric("公告總數", len(filtered_df))
-    with col2:
-        company_count = filtered_df['公司代號'].nunique()
-        st.metric("公司數量", company_count)
-    with col3:
-        date_counts = filtered_df['發言日期'].value_counts()
-        if not date_counts.empty:
-            latest_date = date_counts.index[0]
-            latest_count = date_counts.iloc[0]
-            st.metric(f"最新日期 ({latest_date})", latest_count)
-    # Show announcement details on selection
-    if not filtered_df.empty:
-        st.subheader("選擇公告以查看詳情")
-        selected_indices = st.multiselect(
-            "選擇公告",
-            options=list(range(len(filtered_df))),
-            format_func=lambda i: f"{filtered_df.iloc[i]['公司簡稱']} ({filtered_df.iloc[i]['公司代號']}) - {filtered_df.iloc[i]['主旨'][:20]}..."
-        )
-        if selected_indices:
-            for idx in selected_indices:
-                with st.expander(f"{filtered_df.iloc[idx]['公司簡稱']} ({filtered_df.iloc[idx]['公司代號']}) - {filtered_df.iloc[idx]['發言日期']}"):
-                    st.write(f"**公司代號:** {filtered_df.iloc[idx]['公司代號']}")
-                    st.write(f"**公司簡稱:** {filtered_df.iloc[idx]['公司簡稱']}")
-                    st.write(f"**發言日期:** {filtered_df.iloc[idx]['發言日期']}")
-                    st.write(f"**發言時間:** {filtered_df.iloc[idx]['發言時間']}")
-                    st.write(f"**主旨內容:** {filtered_df.iloc[idx]['主旨']}")
-else:
-    st.warning("沒有可顯示的資料")
-# Footer
-st.markdown("---")
-st.markdown("台灣證券交易所公告擷取工具 | 資料來源: [台灣證券交易所](https://mopsov.twse.com.tw/mops/web/index)")
-# Add FAQ section at the bottom
-with st.expander("常見問題", expanded=False):
-    st.subheader("常見問題")
-    st.markdown("""
-    **Q: 為什麼無法從網站擷取資料？**
-    A: 可能原因包括：
-    - 台灣證券交易所網站暫時無法連接
-    - 當日尚無公告資料
-    - 網站結構可能有所變更
-    - 網路連線問題
-    **Q: 資料顯示的日期格式是什麼？**
-    A: 發言日期採用中華民國紀年（民國紀年），例如「114/04/01」表示西元2025年4月1日。
-    **Q: 為什麼有些公告的主旨只顯示部分內容？**
-    A: 當主旨內容過長時，網站顯示會自動截斷。點選公告查看詳情可能會顯示完整主旨。
-    **Q: 如何取得更多歷史公告？**
-    A: 本工具目前僅擷取當前頁面資料。若需查詢歷史資料，建議直接前往[台灣證券交易所](https://mopsov.twse.com.tw/mops/web/index)官方網站搜尋。
-    """)
-# Add version info
-st.sidebar.markdown("---")
-st.sidebar.caption("版本: 1.1.1")
-st.sidebar.caption("最後更新: 2025-04-01")

 from bs4 import BeautifulSoup
 import pandas as pd
 import time
+import base64
+from io import BytesIO
+# Configure the Streamlit page: browser-tab title, icon and wide layout.
 st.set_page_config(
+    page_title="台灣證券交易所重大訊息爬蟲",
     page_icon="📊",
     layout="wide"
 )
+# Page heading and a one-line description of the app.
+st.title("台灣證券交易所重大訊息爬蟲")
+st.markdown("這個應用程式會從台灣證券交易所網站爬取上市公司的重大訊息公告。")
+# Sidebar controls. The names assigned here are module-level and are read
+# later by main().
+with st.sidebar:
+    st.header("設定")
+    auto_refresh = st.checkbox("啟用自動刷新", value=False)
+    # The interval slider (1-60, default 15; labelled in minutes) is only
+    # rendered when auto-refresh is ticked; otherwise the interval is 0.
+    refresh_interval = st.slider("刷新間隔 (分鐘)", 1, 60, 15) if auto_refresh else 0
+    # Maximum number of rows shown in the table (5-50, default 20).
+    max_results = st.slider("顯示結果數量", 5, 50, 20)
+    st.header("篩選器")
+    # The keyword box is only rendered when filtering is enabled; otherwise
+    # the keyword is the empty string.
+    filter_enabled = st.checkbox("啟用關鍵字篩選", value=False)
+    filter_keyword = st.text_input("關鍵字") if filter_enabled else ""
+    st.header("關於")
+    st.info("此應用程式從台灣證券交易所獲取重大訊息公告，僅供參考用途。")
+# CSV download helper
+def get_csv_download_link(df, filename="data.csv"):
+    """Return an HTML ``<a>`` tag that downloads *df* as a CSV file.
+
+    The CSV is embedded in the link as a base64 ``data:`` URI, so no file is
+    written on the server.
+
+    Args:
+        df: DataFrame to export; the index is not written.
+        filename: Name suggested to the browser via the ``download`` attribute.
+
+    Returns:
+        The anchor markup as a string, intended for ``st.markdown`` with
+        ``unsafe_allow_html=True``.
+    """
+    # to_csv() with no target returns a str, so an ``encoding`` argument there
+    # never produces a BOM. Encode the bytes as utf-8-sig here instead so that
+    # spreadsheet programs detect UTF-8 and show the Chinese text correctly.
+    csv_bytes = df.to_csv(index=False).encode('utf-8-sig')
+    b64 = base64.b64encode(csv_bytes).decode()
+    # text/csv is the registered media type for CSV ("file/csv" is not one).
+    href = f'<a href="data:text/csv;charset=utf-8;base64,{b64}" download="{filename}">下載 CSV 檔案</a>'
+    return href
+# Scraper
+def fetch_mops_announcements():
+    """Fetch the announcement table from the TWSE page and return a DataFrame.
+
+    Sends one GET request, locates ``table.hasBorder`` in the response and
+    turns every row that has at least five cells into a record with the
+    columns 公司代號, 公司簡稱, 發言日期, 發言時間 and 主旨.
+
+    Progress, warnings and errors are reported through Streamlit widgets.
+    On a non-200 status, a missing table, no rows, no usable rows, or any
+    exception, the result of ``parse_example_data()`` is returned instead.
+    """
+    # Target URL
+    url = "https://mopsov.twse.com.tw/mops/web/t05sr01_1"
+    # Request headers that imitate a desktop browser
     headers = {
+        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36",
+        "Accept-Language": "zh-TW,zh;q=0.9,en-US;q=0.8,en;q=0.7",
+        "Referer": "https://mopsov.twse.com.tw/mops/web/index"
     }
+    with st.spinner('正在獲取資料...'):
         try:
+            # Fetch the page with a GET request
+            response = requests.get(url, headers=headers, timeout=10)
+            response.encoding = 'utf-8'  # force UTF-8 when decoding response.text
+            if response.status_code != 200:
+                st.error(f"請求失敗，狀態碼：{response.status_code}")
+                return parse_example_data()
+            # Parse the HTML
+            soup = BeautifulSoup(response.text, 'html.parser')
+            # Locate the results table
+            table = soup.find('table', class_='hasBorder')
+            if not table:
+                st.warning("找不到目標表格，使用範例數據")
+                return parse_example_data()
+            # Locate the table body
+            tbody = table.find('tbody', id='tab2')
+            if not tbody:
+                st.warning("找不到tbody#tab2，嘗試直接查找tr元素")
+                rows = table.find_all('tr')[1:]  # skip the header row
+            else:
+                rows = tbody.find_all('tr')
+            # Make sure at least one row was found
+            if not rows:
+                st.warning("找不到任何資料行，使用範例數據")
+                return parse_example_data()
+            # Collected records
+            data = []
+            # Parse each row; rows with fewer than five cells are ignored
+            for row in rows:
+                cols = row.find_all('td')
+                if len(cols) >= 5:
+                    company_code = cols[0].text.strip()
+                    company_name = cols[1].text.strip()
+                    announce_date = cols[2].text.strip()
+                    announce_time = cols[3].text.strip()
+                    # Subject: prefer the button's title attribute when present
+                    subject_btn = cols[4].find('button')
+                    if subject_btn and 'title' in subject_btn.attrs:
+                        subject = subject_btn['title'].strip()
                     else:
+                        # No button or no title attribute: use the cell text
+                        subject = cols[4].text.strip()
+                    # Append the record
+                    data.append({
+                        '公司代號': company_code,
+                        '公司簡稱': company_name,
+                        '發言日期': announce_date,
+                        '發言時間': announce_time,
+                        '主旨': subject
+                    })
+            # Nothing collected: fall back to the example data
+            if not data:
+                st.warning("未收集到任何數據，使用範例數據")
+                return parse_example_data()
+            # Build the DataFrame
+            df = pd.DataFrame(data)
+            st.success(f"成功獲取 {len(df)} 筆資料")
+            return df
         except Exception as e:
+            # Any failure above (network, parsing, ...) is shown to the user
+            # and replaced by the example data.
+            st.error(f"爬取過程發生錯誤: {str(e)}")
+            return parse_example_data()
+def parse_example_data():
+    """Return a DataFrame built from eight hard-coded example announcements.
+
+    The columns are 公司代號, 公司簡稱, 發言日期, 發言時間 and 主旨, the same
+    keys that fetch_mops_announcements() uses for scraped rows.
+    """
+    # Hard-coded example rows
+    data = [
+        {'公司代號': '1419', '公司簡稱': '新紡', '發言日期': '114/04/01', '發言時間': '12:36:37', '主旨': '公告本公司財務主管變動'},
+        {'公司代號': '1419', '公司簡稱': '新紡', '發言日期': '114/04/01', '發言時間': '12:36:00', '主旨': '公告本公司發言人及代理發言人異動'},
+        {'公司代號': '6277', '公司簡稱': '宏正', '發言日期': '114/04/01', '發言時間': '12:03:45', '主旨': '澄清媒體報導'},
+        {'公司代號': '2215', '公司簡稱': '匯豐汽車', '發言日期': '114/04/01', '發言時間': '12:03:03', '主旨': '公告本公司財務暨會計主管異動'},
+        {'公司代號': '2215', '公司簡稱': '匯豐汽車', '發言日期': '114/04/01', '發言時間': '12:00:20', '主旨': '公告本公司新任董事長'},
+        {'公司代號': '6414', '公司簡稱': '樺漢', '發言日期': '114/04/01', '發言時間': '11:42:52', '主旨': '澄清工商時報有關本公司之報導'},
+        {'公司代號': '8916', '公司簡稱': '光隆', '發言日期': '114/04/01', '發言時間': '10:56:03', '主旨': '更正公告〔113年度股利分派情形申報作業〕(含普通股及特別股)可分配盈餘及分配後期末未分配盈餘誤植(原114/3/11董事會決議無異動)'},
+        {'公司代號': '6597', '公司簡稱': '立誠', '發言日期': '114/04/01', '發言時間': '10:55:35', '主旨': '澄清媒體報導'}
+    ]
+    return pd.DataFrame(data)
+# Main application logic
+def main():
+    """Render the main page: refresh controls, table, download link, charts.
+
+    Reads the sidebar settings defined at module level (``auto_refresh``,
+    ``refresh_interval``, ``max_results``, ``filter_enabled``,
+    ``filter_keyword``) and keeps the fetched DataFrame and its fetch time in
+    ``st.session_state`` so that reruns reuse the data instead of refetching.
+    """
+    # Refresh button and "last updated" box share the top row; the third,
+    # wider column is left empty.
+    col1, col2, _ = st.columns([1, 1, 2])
     with col1:
+        refresh_button = st.button("刷新資料")
+    # Session defaults for the cached data and its timestamp
+    if 'last_update' not in st.session_state:
+        st.session_state.last_update = None
+    if 'data' not in st.session_state:
+        st.session_state.data = None
+    # Decide whether the data has to be (re)fetched.
+    # NOTE(review): nothing in this function schedules a rerun, so the
+    # auto-refresh interval is only checked when the script runs again.
+    current_time = time.time()
+    auto_refresh_needed = (
+        auto_refresh and
+        st.session_state.last_update is not None and
+        current_time - st.session_state.last_update > refresh_interval * 60
     )
+    if refresh_button or auto_refresh_needed or st.session_state.data is None:
+        # Fetch and cache the data
+        df = fetch_mops_announcements()
+        st.session_state.data = df
+        st.session_state.last_update = current_time
+    # Show the time of the last fetch
+    with col2:
+        if st.session_state.last_update is not None:
+            last_update_str = time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(st.session_state.last_update))
+            st.info(f"最後更新: {last_update_str}")
+    # Work on the cached data
+    df = st.session_state.data
+    # Apply the keyword filter. regex=False makes the keyword a literal
+    # substring, so input such as "(" or "*" cannot raise a regex error.
+    if filter_enabled and filter_keyword:
+        filtered_df = df[
+            df['公司代號'].str.contains(filter_keyword, case=False, na=False, regex=False) |
+            df['公司簡稱'].str.contains(filter_keyword, case=False, na=False, regex=False) |
+            df['主旨'].str.contains(filter_keyword, case=False, na=False, regex=False)
+        ]
+        if len(filtered_df) > 0:
+            st.success(f"找到 {len(filtered_df)} 筆符合 '{filter_keyword}' 的資料")
+            df = filtered_df
+        else:
+            # No match: warn and keep showing the unfiltered data.
+            st.warning(f"沒有找到包含 '{filter_keyword}' 的資料")
+    # Limit the number of rows shown in the table
+    df_display = df.head(max_results)
+    # Data table
+    st.subheader("重大訊息公告")
+    st.dataframe(df_display, use_container_width=True)
+    # Download link; it exports every row of df, not only the rows displayed
+    st.markdown(get_csv_download_link(df, "重大訊息公告.csv"), unsafe_allow_html=True)
+    # Statistics
+    st.subheader("統計資訊")
+    col1, col2 = st.columns(2)
+    with col1:
+        # Announcements per date
+        date_counts = df['發言日期'].value_counts().reset_index()
+        date_counts.columns = ['日期', '公告數量']
+        st.bar_chart(date_counts.set_index('日期'))
+    with col2:
+        # Announcements per company (ten most frequent)
+        company_counts = df['公司簡稱'].value_counts().head(10).reset_index()
+        company_counts.columns = ['公司', '公告數量']
+        st.bar_chart(company_counts.set_index('公司'))
+    # How many subjects contain each of a fixed list of keywords
+    st.subheader("主旨關鍵詞分析")
+    keywords = ['董事長', '財務', '主管', '澄清', '媒體', '股利', '董事會', '異動', '收購']
+    keyword_counts = []
+    for keyword in keywords:
+        # Literal substring match, with missing subjects counted as no match
+        count = df['主旨'].str.contains(keyword, regex=False, na=False).sum()
+        keyword_counts.append({'關鍵詞': keyword, '出現次數': count})
+    keyword_df = pd.DataFrame(keyword_counts)
+    st.bar_chart(keyword_df.set_index('關鍵詞'))
+# Call main() only when this file is the entry-point module.
+if __name__ == "__main__":
+    main()