awacke1 commited on
Commit
4a66f10
·
1 Parent(s): 1428628

Update backupapp.py

Browse files
Files changed (1) hide show
  1. backupapp.py +51 -8
backupapp.py CHANGED
@@ -4,6 +4,13 @@ import pandas as pd
4
  import plotly.express as px
5
  import seaborn as sns
6
  import matplotlib.pyplot as plt
 
 
 
 
 
 
 
7
 
8
  # Function to load JSONL file into a DataFrame
9
  def load_jsonl(file_path):
@@ -17,17 +24,43 @@ def load_jsonl(file_path):
17
  def filter_by_keyword(df, keyword):
18
  return df[df.apply(lambda row: row.astype(str).str.contains(keyword).any(), axis=1)]
19
 
20
- # Load the data
21
- small_data = load_jsonl("usmle_16.2MB.jsonl")
22
- large_data = load_jsonl("usmle_2.08MB.jsonl")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
23
 
24
  # Streamlit App
25
- st.title("EDA with Plotly and Seaborn 📊")
26
 
27
  # Dropdown for file selection
28
  file_option = st.selectbox("Select file:", ["small_file.jsonl", "large_file.jsonl"])
29
  st.write(f"You selected: {file_option}")
30
 
 
 
 
 
31
  # Show filtered data grid
32
  if file_option == "small_file.jsonl":
33
  data = small_data
@@ -41,12 +74,22 @@ search_keyword = st.text_input("Enter a keyword to filter data (e.g., Heart, Lun
41
  if st.button("Search"):
42
  filtered_data = filter_by_keyword(data, search_keyword)
43
  st.write(f"Filtered Dataset by '{search_keyword}'")
44
- st.dataframe(filtered_data)
45
-
 
 
 
 
 
 
 
 
 
 
 
46
 
47
  # Plotly and Seaborn charts for EDA
48
  if st.button("Generate Charts"):
49
-
50
  st.subheader("Plotly Charts 📈")
51
 
52
  # 1. Scatter Plot
@@ -93,4 +136,4 @@ if st.button("Generate Charts"):
93
  # 10. Regplot (Regression Plot)
94
  fig, ax = plt.subplots()
95
  sns.regplot(x=data.columns[0], y=data.columns[1], data=data)
96
- st.pyplot(fig)
 
4
  import plotly.express as px
5
  import seaborn as sns
6
  import matplotlib.pyplot as plt
7
+ import streamlit.components.v1 as components
8
+
9
+ # Global variable to hold selected row index
10
+ selected_row_index = None
11
+
12
+ # Initialize an empty DataFrame
13
+ filtered_data = pd.DataFrame()
14
 
15
  # Function to load JSONL file into a DataFrame
16
  def load_jsonl(file_path):
 
24
  def filter_by_keyword(df, keyword):
25
  return df[df.apply(lambda row: row.astype(str).str.contains(keyword).any(), axis=1)]
26
 
27
+
28
+ # Function to generate HTML5 code with embedded text
29
+ def generate_html(question_text, answer_text):
30
+ return f'''
31
+ <!DOCTYPE html>
32
+ <html>
33
+ <head>
34
+ <title>Read It Aloud</title>
35
+ <script type="text/javascript">
36
+ function readAloud(id) {{
37
+ const text = document.getElementById(id).innerText;
38
+ const speech = new SpeechSynthesisUtterance(text);
39
+ window.speechSynthesis.speak(speech);
40
+ }}
41
+ </script>
42
+ </head>
43
+ <body>
44
+ <h1>🔊 Read It Aloud</h1>
45
+ <p id="questionArea">{question_text}</p>
46
+ <button onclick="readAloud('questionArea')">🔊 Read Question Aloud</button>
47
+ <p id="answerArea">{answer_text}</p>
48
+ <button onclick="readAloud('answerArea')">🔊 Read Answer Aloud</button>
49
+ </body>
50
+ </html>
51
+ '''
52
 
53
  # Streamlit App
54
+ st.title("Medical Licensing Exam Explorer with Speech Synthesis, Plotly and Seaborn 📊")
55
 
56
  # Dropdown for file selection
57
  file_option = st.selectbox("Select file:", ["small_file.jsonl", "large_file.jsonl"])
58
  st.write(f"You selected: {file_option}")
59
 
60
+ # Load the data
61
+ small_data = load_jsonl("usmle_16.2MB.jsonl")
62
+ large_data = load_jsonl("usmle_2.08MB.jsonl")
63
+
64
  # Show filtered data grid
65
  if file_option == "small_file.jsonl":
66
  data = small_data
 
74
  if st.button("Search"):
75
  filtered_data = filter_by_keyword(data, search_keyword)
76
  st.write(f"Filtered Dataset by '{search_keyword}'")
77
+ selected_data = st.dataframe(filtered_data)
78
+
79
+ # Button to read selected row aloud
80
+ if st.button("Read Selected Row"):
81
+ if selected_row_index is not None:
82
+ selected_row = filtered_data.loc[selected_row_index]
83
+ question_text = selected_row.get("question", "No question field")
84
+ answer_text = selected_row.get("answer", "No answer field")
85
+
86
+ documentHTML5 = generate_html(question_text, answer_text)
87
+ components.html(documentHTML5, width=1280, height=1024)
88
+ else:
89
+ st.warning("Please select a row first.")
90
 
91
  # Plotly and Seaborn charts for EDA
92
  if st.button("Generate Charts"):
 
93
  st.subheader("Plotly Charts 📈")
94
 
95
  # 1. Scatter Plot
 
136
  # 10. Regplot (Regression Plot)
137
  fig, ax = plt.subplots()
138
  sns.regplot(x=data.columns[0], y=data.columns[1], data=data)
139
+ st.pyplot(fig)