seawolf2357 committed on
Commit
c1c1dea
•
1 Parent(s): 6eaab32

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -5
app.py CHANGED
@@ -7,9 +7,6 @@ import subprocess
7
  from datasets import load_dataset
8
  import pandas as pd
9
  from fuzzywuzzy import process
10
-
11
-
12
-
13
  # 현재 작업 디렉토리 출력
14
  print("Current Working Directory:", os.getcwd())
15
 
@@ -30,12 +27,17 @@ else:
30
  def load_optimized_dataset(data_files):
31
  data_frames = [pd.read_csv(file) for file in data_files]
32
  full_data = pd.concat(data_frames, ignore_index=True)
 
33
  # 확인을 위한 데이터 샘플 출력
34
- logging.debug(f"Data sample: {full_data[['사건λͺ…', 'μ‚¬κ±΄λ²ˆν˜Έ', 'νŒμ‹œμ‚¬ν•­']].head()}")
 
 
 
35
  # 사건명을 키로 하고 사건번호와 전문을 저장하는 딕셔너리 생성
36
  name_to_number = full_data.groupby('사건λͺ…')['μ‚¬κ±΄λ²ˆν˜Έ'].apply(list).to_dict()
37
  summary_to_number = full_data.groupby('νŒμ‹œμ‚¬ν•­')['μ‚¬κ±΄λ²ˆν˜Έ'].apply(list).to_dict()
38
  number_to_fulltext = full_data.set_index('μ‚¬κ±΄λ²ˆν˜Έ')['μ „λ¬Έ'].to_dict()
 
39
  return name_to_number, summary_to_number, number_to_fulltext
40
 
41
  name_to_number, summary_to_number, number_to_fulltext = load_optimized_dataset(data_files)
@@ -147,4 +149,4 @@ async def generate_response(message):
147
 
148
  if __name__ == "__main__":
149
  discord_client = MyClient(intents=intents)
150
- discord_client.run(os.getenv('DISCORD_TOKEN'))
 
7
  from datasets import load_dataset
8
  import pandas as pd
9
  from fuzzywuzzy import process
 
 
 
10
  # 현재 작업 디렉토리 출력
11
  print("Current Working Directory:", os.getcwd())
12
 
 
27
  def load_optimized_dataset(data_files):
28
  data_frames = [pd.read_csv(file) for file in data_files]
29
  full_data = pd.concat(data_frames, ignore_index=True)
30
+
31
  # 확인을 위한 데이터 샘플 출력
32
+ print(full_data[['사건λͺ…', 'μ‚¬κ±΄λ²ˆν˜Έ', 'νŒμ‹œμ‚¬ν•­']].head()) # 'νŒμ‹œμ‚¬ν•­' ν•„λ“œμ˜ 데이터 μƒ˜ν”Œ 좜λ ₯
33
+ logging.debug(f"Columns in dataset: {full_data.columns}")
34
+ logging.debug(f"Sample data from 'νŒμ‹œμ‚¬ν•­': {full_data['νŒμ‹œμ‚¬ν•­'].dropna().head()}")
35
+
36
  # 사건명을 키로 하고 사건번호와 전문을 저장하는 딕셔너리 생성
37
  name_to_number = full_data.groupby('사건λͺ…')['μ‚¬κ±΄λ²ˆν˜Έ'].apply(list).to_dict()
38
  summary_to_number = full_data.groupby('νŒμ‹œμ‚¬ν•­')['μ‚¬κ±΄λ²ˆν˜Έ'].apply(list).to_dict()
39
  number_to_fulltext = full_data.set_index('μ‚¬κ±΄λ²ˆν˜Έ')['μ „λ¬Έ'].to_dict()
40
+
41
  return name_to_number, summary_to_number, number_to_fulltext
42
 
43
  name_to_number, summary_to_number, number_to_fulltext = load_optimized_dataset(data_files)
 
149
 
150
  if __name__ == "__main__":
151
  discord_client = MyClient(intents=intents)
152
+ discord_client.run(os.getenv('DISCORD_TOKEN'))