Spaces:

alfraser
/

llm-arch

Runtime error

App Files Files Community

llm-arch / pages /030_Test_Runner.py

alfraser

Added a test runner page which allows you to run a batch of test from the UI

ab87be2 over 1 year ago

raw

history blame

1.9 kB

	import streamlit as st

	from src.architectures import *
	from src.common import generate_group_tag
	from src.testing import TestGenerator
	from src.st_helpers import st_setup


	if Architecture.architectures is None:
	Architecture.load_architectures()

	if st_setup('LLM Arch'):
	summary = st.container()
	with summary:
	st.write("# Test Runner")
	st.write("## Run a new test")
	st.write("### Comment:")
	comment = st.text_input("Optional comment for the test")

	st.write("### Architectures to include:")
	selected_archs = st.multiselect(label="Architectures", options=[a.name for a in Architecture.architectures])

	st.write("### Number of questions to ask:")
	q_count = st.slider(label="Number of questions", min_value=1, max_value=TestGenerator.question_count(), step=1)

	st.write("### Tag:")
	tag = generate_group_tag()
	st.write(f'Test will be tagged as "{tag}" - record this for easy searching later')

	total_tests = len(selected_archs) * q_count
	st.write("### Run:")
	st.write(f"{total_tests} total tests will be run")
	if st.button("Run", disabled=(total_tests==0)):
	progress = st.progress(0.0, text="Running tests...")
	questions = TestGenerator.get_random_questions(q_count)
	num_complete = 0
	for arch_name in selected_archs:
	architecture = Architecture.get_architecture(arch_name)
	for q in questions:
	architecture(ArchitectureRequest(q), trace_tags=[tag, "TestRunner"], trace_comment=comment)
	num_complete += 1
	if num_complete == total_tests:
	progress.empty()
	else:
	progress.progress(num_complete/total_tests, f"Run {num_complete} of {total_tests} tests...")