Update backupapp.py
Browse files- backupapp.py +51 -8
backupapp.py
CHANGED
@@ -4,6 +4,13 @@ import pandas as pd
|
|
4 |
import plotly.express as px
|
5 |
import seaborn as sns
|
6 |
import matplotlib.pyplot as plt
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
7 |
|
8 |
# Function to load JSONL file into a DataFrame
|
9 |
def load_jsonl(file_path):
|
@@ -17,17 +24,43 @@ def load_jsonl(file_path):
|
|
17 |
def filter_by_keyword(df, keyword):
|
18 |
return df[df.apply(lambda row: row.astype(str).str.contains(keyword).any(), axis=1)]
|
19 |
|
20 |
-
|
21 |
-
|
22 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
23 |
|
24 |
# Streamlit App
|
25 |
-
st.title("
|
26 |
|
27 |
# Dropdown for file selection
|
28 |
file_option = st.selectbox("Select file:", ["small_file.jsonl", "large_file.jsonl"])
|
29 |
st.write(f"You selected: {file_option}")
|
30 |
|
|
|
|
|
|
|
|
|
31 |
# Show filtered data grid
|
32 |
if file_option == "small_file.jsonl":
|
33 |
data = small_data
|
@@ -41,12 +74,22 @@ search_keyword = st.text_input("Enter a keyword to filter data (e.g., Heart, Lun
|
|
41 |
if st.button("Search"):
|
42 |
filtered_data = filter_by_keyword(data, search_keyword)
|
43 |
st.write(f"Filtered Dataset by '{search_keyword}'")
|
44 |
-
st.dataframe(filtered_data)
|
45 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
46 |
|
47 |
# Plotly and Seaborn charts for EDA
|
48 |
if st.button("Generate Charts"):
|
49 |
-
|
50 |
st.subheader("Plotly Charts 📈")
|
51 |
|
52 |
# 1. Scatter Plot
|
@@ -93,4 +136,4 @@ if st.button("Generate Charts"):
|
|
93 |
# 10. Regplot (Regression Plot)
|
94 |
fig, ax = plt.subplots()
|
95 |
sns.regplot(x=data.columns[0], y=data.columns[1], data=data)
|
96 |
-
st.pyplot(fig)
|
|
|
4 |
import plotly.express as px
|
5 |
import seaborn as sns
|
6 |
import matplotlib.pyplot as plt
|
7 |
+
import streamlit.components.v1 as components
|
8 |
+
|
9 |
+
# Global variable to hold selected row index
|
10 |
+
selected_row_index = None
|
11 |
+
|
12 |
+
# Initialize an empty DataFrame
|
13 |
+
filtered_data = pd.DataFrame()
|
14 |
|
15 |
# Function to load JSONL file into a DataFrame
|
16 |
def load_jsonl(file_path):
|
|
|
24 |
def filter_by_keyword(df, keyword):
|
25 |
return df[df.apply(lambda row: row.astype(str).str.contains(keyword).any(), axis=1)]
|
26 |
|
27 |
+
|
28 |
+
# Function to generate HTML5 code with embedded text
|
29 |
+
def generate_html(question_text, answer_text):
|
30 |
+
return f'''
|
31 |
+
<!DOCTYPE html>
|
32 |
+
<html>
|
33 |
+
<head>
|
34 |
+
<title>Read It Aloud</title>
|
35 |
+
<script type="text/javascript">
|
36 |
+
function readAloud(id) {{
|
37 |
+
const text = document.getElementById(id).innerText;
|
38 |
+
const speech = new SpeechSynthesisUtterance(text);
|
39 |
+
window.speechSynthesis.speak(speech);
|
40 |
+
}}
|
41 |
+
</script>
|
42 |
+
</head>
|
43 |
+
<body>
|
44 |
+
<h1>🔊 Read It Aloud</h1>
|
45 |
+
<p id="questionArea">{question_text}</p>
|
46 |
+
<button onclick="readAloud('questionArea')">🔊 Read Question Aloud</button>
|
47 |
+
<p id="answerArea">{answer_text}</p>
|
48 |
+
<button onclick="readAloud('answerArea')">🔊 Read Answer Aloud</button>
|
49 |
+
</body>
|
50 |
+
</html>
|
51 |
+
'''
|
52 |
|
53 |
# Streamlit App
|
54 |
+
st.title("Medical Licensing Exam Explorer with Speech Synthesis, Plotly and Seaborn 📊")
|
55 |
|
56 |
# Dropdown for file selection
|
57 |
file_option = st.selectbox("Select file:", ["small_file.jsonl", "large_file.jsonl"])
|
58 |
st.write(f"You selected: {file_option}")
|
59 |
|
60 |
+
# Load the data
|
61 |
+
small_data = load_jsonl("usmle_16.2MB.jsonl")
|
62 |
+
large_data = load_jsonl("usmle_2.08MB.jsonl")
|
63 |
+
|
64 |
# Show filtered data grid
|
65 |
if file_option == "small_file.jsonl":
|
66 |
data = small_data
|
|
|
74 |
if st.button("Search"):
|
75 |
filtered_data = filter_by_keyword(data, search_keyword)
|
76 |
st.write(f"Filtered Dataset by '{search_keyword}'")
|
77 |
+
selected_data = st.dataframe(filtered_data)
|
78 |
+
|
79 |
+
# Button to read selected row aloud
|
80 |
+
if st.button("Read Selected Row"):
|
81 |
+
if selected_row_index is not None:
|
82 |
+
selected_row = filtered_data.loc[selected_row_index]
|
83 |
+
question_text = selected_row.get("question", "No question field")
|
84 |
+
answer_text = selected_row.get("answer", "No answer field")
|
85 |
+
|
86 |
+
documentHTML5 = generate_html(question_text, answer_text)
|
87 |
+
components.html(documentHTML5, width=1280, height=1024)
|
88 |
+
else:
|
89 |
+
st.warning("Please select a row first.")
|
90 |
|
91 |
# Plotly and Seaborn charts for EDA
|
92 |
if st.button("Generate Charts"):
|
|
|
93 |
st.subheader("Plotly Charts 📈")
|
94 |
|
95 |
# 1. Scatter Plot
|
|
|
136 |
# 10. Regplot (Regression Plot)
|
137 |
fig, ax = plt.subplots()
|
138 |
sns.regplot(x=data.columns[0], y=data.columns[1], data=data)
|
139 |
+
st.pyplot(fig)
|