alfraser committed
Commit ab87be2 · 1 Parent(s): c0f0676

Added a test runner page which allows you to run a batch of tests from the UI

Files changed (1)
  1. pages/030_Test_Runner.py +45 -0
pages/030_Test_Runner.py ADDED
@@ -0,0 +1,45 @@
+import streamlit as st
+
+from src.architectures import *
+from src.common import generate_group_tag
+from src.testing import TestGenerator
+from src.st_helpers import st_setup
+
+
+if Architecture.architectures is None:
+    Architecture.load_architectures()
+
+if st_setup('LLM Arch'):
+    summary = st.container()
+    with summary:
+        st.write("# Test Runner")
+        st.write("## Run a new test")
+        st.write("### Comment:")
+        comment = st.text_input("Optional comment for the test")
+
+        st.write("### Architectures to include:")
+        selected_archs = st.multiselect(label="Architectures", options=[a.name for a in Architecture.architectures])
+
+        st.write("### Number of questions to ask:")
+        q_count = st.slider(label="Number of questions", min_value=1, max_value=TestGenerator.question_count(), step=1)
+
+        st.write("### Tag:")
+        tag = generate_group_tag()
+        st.write(f'Test will be tagged as "{tag}" - record this for easy searching later')
+
+        total_tests = len(selected_archs) * q_count
+        st.write("### Run:")
+        st.write(f"**{total_tests}** total tests will be run")
+        if st.button("**Run**", disabled=(total_tests==0)):
+            progress = st.progress(0.0, text="Running tests...")
+            questions = TestGenerator.get_random_questions(q_count)
+            num_complete = 0
+            for arch_name in selected_archs:
+                architecture = Architecture.get_architecture(arch_name)
+                for q in questions:
+                    architecture(ArchitectureRequest(q), trace_tags=[tag, "TestRunner"], trace_comment=comment)
+                    num_complete += 1
+                    if num_complete == total_tests:
+                        progress.empty()
+                    else:
+                        progress.progress(num_complete/total_tests, f"Run {num_complete} of {total_tests} tests...")
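Note: the page depends on two TestGenerator class methods that are not part of this commit: question_count() (used to bound the "Number of questions" slider) and get_random_questions(q_count) (used to build the batch). A minimal stand-in, inferred only from how the page calls them and not from the real src.testing implementation, might look like this:

    # Hypothetical stand-in for src.testing.TestGenerator, inferred from the calls
    # in pages/030_Test_Runner.py above; the real class is not part of this commit.
    import random


    class TestGenerator:
        # Placeholder question pool; where the real questions come from is not shown in this diff.
        _questions = [
            "Example question 1?",
            "Example question 2?",
            "Example question 3?",
        ]

        @classmethod
        def question_count(cls) -> int:
            # Upper bound for the "Number of questions" slider on the page
            return len(cls._questions)

        @classmethod
        def get_random_questions(cls, n: int) -> list[str]:
            # Sample without replacement so a single batch never repeats a question
            return random.sample(cls._questions, n)

With a stand-in like this, every selected architecture is asked the same sampled questions, so the generated tag groups len(selected_archs) * q_count traced runs.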