Hasan Iqbal
commited on
Custom developed metric card
Browse files
src/openfactcheck/app/evaluate_response.py
CHANGED
@@ -4,7 +4,7 @@ import pandas as pd
|
|
4 |
import streamlit as st
|
5 |
|
6 |
from openfactcheck.core.base import OpenFactCheck
|
7 |
-
from openfactcheck.app.utils import
|
8 |
|
9 |
# Create a function to check a LLM response
|
10 |
def evaluate_response(ofc: OpenFactCheck):
|
@@ -38,6 +38,7 @@ def evaluate_response(ofc: OpenFactCheck):
|
|
38 |
|
39 |
# Button to check factuality
|
40 |
if st.button("Check Factuality"):
|
|
|
41 |
with st.status("Checking factuality...", expanded=True) as status:
|
42 |
# Configure the pipeline
|
43 |
st.write("Configuring pipeline...")
|
@@ -90,8 +91,8 @@ def evaluate_response(ofc: OpenFactCheck):
|
|
90 |
formatted_text = "#### Detected Claims\n" + "\n".join(f"{i}. {extract_text(claim)}" for i, claim in enumerate(detected_claims, start=1)) + "\n"
|
91 |
|
92 |
with col2:
|
93 |
-
st.
|
94 |
-
|
95 |
|
96 |
# Yield each word with a space and simulate typing by sleeping
|
97 |
for word in formatted_text.split(" "):
|
@@ -113,8 +114,8 @@ def evaluate_response(ofc: OpenFactCheck):
|
|
113 |
formatted_text = "#### Retrieved Evidences\n" + "\n".join(f"{i}. {evidence}" for i, evidence in enumerate(evidences, start=1))
|
114 |
|
115 |
with col2:
|
116 |
-
st.
|
117 |
-
|
118 |
|
119 |
# Yield each word with a space and simulate typing by sleeping
|
120 |
for word in formatted_text.split(" "):
|
@@ -140,15 +141,8 @@ def evaluate_response(ofc: OpenFactCheck):
|
|
140 |
if final_response is not None:
|
141 |
overall_factuality = final_response.get("label", "Unknown")
|
142 |
with col2:
|
143 |
-
|
144 |
-
|
145 |
-
|
146 |
-
|
147 |
-
|
148 |
-
style_metric_cards(background_color="#F8D7DA", border_color="#F8D7DA", border_radius_px=0, border_left_color="#DC3545")
|
149 |
-
|
150 |
-
# Button to reset
|
151 |
-
if st.session_state.response is not None:
|
152 |
-
if st.button("Reset"):
|
153 |
-
st.session_state.response = None
|
154 |
-
st.rerun()
|
|
|
4 |
import streamlit as st
|
5 |
|
6 |
from openfactcheck.core.base import OpenFactCheck
|
7 |
+
from openfactcheck.app.utils import metric_card
|
8 |
|
9 |
# Create a function to check a LLM response
|
10 |
def evaluate_response(ofc: OpenFactCheck):
|
|
|
38 |
|
39 |
# Button to check factuality
|
40 |
if st.button("Check Factuality"):
|
41 |
+
|
42 |
with st.status("Checking factuality...", expanded=True) as status:
|
43 |
# Configure the pipeline
|
44 |
st.write("Configuring pipeline...")
|
|
|
91 |
formatted_text = "#### Detected Claims\n" + "\n".join(f"{i}. {extract_text(claim)}" for i, claim in enumerate(detected_claims, start=1)) + "\n"
|
92 |
|
93 |
with col2:
|
94 |
+
with st.container():
|
95 |
+
metric_card(label="Detected Claims", value=len(detected_claims))
|
96 |
|
97 |
# Yield each word with a space and simulate typing by sleeping
|
98 |
for word in formatted_text.split(" "):
|
|
|
114 |
formatted_text = "#### Retrieved Evidences\n" + "\n".join(f"{i}. {evidence}" for i, evidence in enumerate(evidences, start=1))
|
115 |
|
116 |
with col2:
|
117 |
+
with st.container():
|
118 |
+
metric_card(label="Retrieved Evidences", value=len(evidences))
|
119 |
|
120 |
# Yield each word with a space and simulate typing by sleeping
|
121 |
for word in formatted_text.split(" "):
|
|
|
141 |
if final_response is not None:
|
142 |
overall_factuality = final_response.get("label", "Unknown")
|
143 |
with col2:
|
144 |
+
with st.container():
|
145 |
+
if overall_factuality == True:
|
146 |
+
metric_card(label="Overall Factuality", value="True", background_color="#D4EDDA", border_left_color="#28A745")
|
147 |
+
elif overall_factuality == False:
|
148 |
+
metric_card(label="Overall Factuality", value="False", background_color="#F8D7DA", border_left_color="#DC3545")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
src/openfactcheck/app/utils.py
CHANGED
@@ -1,35 +1,35 @@
|
|
1 |
import streamlit as st
|
2 |
|
3 |
-
def
|
4 |
-
|
5 |
-
|
6 |
-
|
7 |
-
|
8 |
-
|
9 |
-
|
10 |
-
|
11 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
12 |
|
13 |
-
|
14 |
-
|
15 |
-
border_size_px (int, optional): Border size in pixels. Defaults to 1.
|
16 |
-
border_color (str, optional): Border color. Defaults to "#CCC".
|
17 |
-
border_radius_px (int, optional): Border radius in pixels. Defaults to 5.
|
18 |
-
border_left_color (str, optional): Borfer left color. Defaults to "#9AD8E1".
|
19 |
-
box_shadow (bool, optional): Whether a box shadow is applied. Defaults to True.
|
20 |
-
"""
|
21 |
-
st.markdown(
|
22 |
-
f"""
|
23 |
-
<style>
|
24 |
-
div[data-testid="stMetric"],
|
25 |
-
div[data-testid="metric-container"] {{
|
26 |
-
background-color: {background_color};
|
27 |
-
border: {border_size_px}px solid {border_color};
|
28 |
-
padding: 5% 5% 5% 10%;
|
29 |
-
border-radius: {border_radius_px}px;
|
30 |
-
border-left: 0.5rem solid {border_left_color} !important;
|
31 |
-
}}
|
32 |
-
</style>
|
33 |
-
""",
|
34 |
-
unsafe_allow_html=True,
|
35 |
-
)
|
|
|
1 |
import streamlit as st
|
2 |
|
3 |
+
def metric_card(
|
4 |
+
background_color: str = "#FFF",
|
5 |
+
border_size_px: int = 1,
|
6 |
+
border_color: str = "#CCC",
|
7 |
+
border_radius_px: int = 5,
|
8 |
+
border_left_color: str = "#9AD8E1",
|
9 |
+
label: str = "Label",
|
10 |
+
value: str = "Value",
|
11 |
+
) -> None:
|
12 |
+
|
13 |
+
html_str = f"""<div><p style='font-size: 14px;
|
14 |
+
color: rgb(49, 51, 63);
|
15 |
+
height: auto;
|
16 |
+
min-height: 1.5rem;
|
17 |
+
vertical-align: middle;
|
18 |
+
flex-direction: row;
|
19 |
+
-webkit-box-align: center;
|
20 |
+
align-items: center;
|
21 |
+
margin-bottom: 0px;
|
22 |
+
display: grid;
|
23 |
+
background-color: {background_color};
|
24 |
+
border: {border_size_px}px solid {border_color};
|
25 |
+
padding: 5% 5% 5% 10%;
|
26 |
+
border-radius: {border_radius_px}px;
|
27 |
+
border-left: 0.5rem solid {border_left_color};'>
|
28 |
+
{label}
|
29 |
+
</style><br>
|
30 |
+
<span style='font-size: 2.25rem;
|
31 |
+
padding-bottom: 0.25rem;'>{value}</span>
|
32 |
+
</p></div>"""
|
33 |
|
34 |
+
st.markdown(html_str, unsafe_allow_html=True)
|
35 |
+
st.markdown('######')
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|