Spaces:

alfraser
/

llm-arch

Runtime error

llm-arch / pages /010_LLM_Architectures.py

Removed decimals from group tag and moved where it is called in the side by side flow so they actually share the same ID

2f008c2 over 1 year ago

raw

history blame

5.41 kB

	import pandas as pd
	import streamlit as st

	from time import time

	from src.st_helpers import st_setup
	from src.common import img_dir, escape_dollars, generate_group_tag
	from src.architectures import *


	def show_side_by_side() -> None:
	"""
	Streamlit render a prompt and the boxes to show each architecture
	:return:
	"""
	# Build the layout structure
	st.divider()
	header_container = st.container()
	arch_outer_container = st.container()
	with arch_outer_container:
	arch_cols = st.columns(len(Architecture.architectures))

	# Build header
	with header_container:
	st.write("### Side by side comparison of architectures")
	st.write('Enter a question below to have it sent to all available architectures to compare timing and response.')
	prompt = st.chat_input("Ask a question")
	if prompt:
	st.write(f"Question: {prompt}")

	# Now build the columns
	with arch_outer_container:
	if prompt:
	# Build columns per architecture
	for i, a in enumerate(Architecture.architectures):
	with arch_cols[i]:
	st.write(f'#### {a.name}')

	# Now dispatch the messages per architecture
	group_tag = generate_group_tag()
	for i, a in enumerate(Architecture.architectures):
	request = ArchitectureRequest(query=prompt)
	with arch_cols[i]:
	with st.spinner('Architecture processing request'):
	start = time()
	a(request, trace_tags=["UI", "SideBySideCompare", group_tag])
	elapsed_in_s = (int((time() - start) * 10))/10 # round to 1dp in seconds
	st.write('##### Timing')
	st.write(f'Request took {elapsed_in_s}s')
	st.write('##### Response')
	st.write(request.response)
	else:
	# Build columns per architecture for display only
	for i, a in enumerate(Architecture.architectures):
	with arch_cols[i]:
	st.write(f'#### {a.name}')


	def show_architecture(architecture: str) -> None:
	"""
	Streamlit render an architecture details and the
	ability to interact with the architecture
	:param architecture: the name of the architecture to output
	"""
	arch = Architecture.get_architecture(architecture)

	# Segment into two containers for organisation
	arch_container = st.container()
	chat_container = st.container()

	with arch_container:
	st.divider()
	st.write(f'### {arch.name}')
	st.write('#### Architecture description')
	st.write(arch.description)
	if arch.img is not None:
	img = os.path.join(img_dir, arch.img)
	st.image(img, caption=f'Protypical {arch.name} Under Test', width=1000)
	table_data = []
	for j, s in enumerate(arch.steps, start=1):
	table_data.append(
	[j, s.__class__.__name__, s.description, s.config_description()]
	)
	table_cols = ['Step', 'Name', 'Description', 'Config details']
	st.write('#### Architecture pipeline steps')
	st.table(pd.DataFrame(table_data, columns=table_cols))

	with chat_container:
	st.write(f"### Chat with {arch.name}")
	st.write("Note this is a simple single query through the relevant architecture. This is just a sample so you can interact with it and does not manage a chat session history.")

	chat_col, trace_col, request_col = st.columns([3, 2, 2])

	with chat_col:
	with st.chat_message("assistant"):
	st.write("Chat with me in the box below")
	if prompt := st.chat_input("Ask a question"):
	with chat_col:
	with st.chat_message("user"):
	st.write(prompt)
	request = ArchitectureRequest(query=prompt)
	trace = arch(request, trace_tags=["UI", "SingleArchTest"])
	with st.chat_message("assistant"):
	st.write(escape_dollars(request.response))
	with trace_col:
	st.write("#### Architecture Trace")
	st.markdown(trace.as_markdown())
	with request_col:
	st.write("#### Full Request/Response")
	st.markdown(request.as_markdown())


	if st_setup('LLM Arch'):
	st.write("# LLM Architectures")
	Architecture.load_architectures()

	# Display the available architectures
	arch_count = len(Architecture.architectures)
	if arch_count == 1:
	st.write('### 1 Architecture available')
	else:
	st.write(f'### {arch_count} Architectures available')

	if st.button("Force reload of architecture configs"):
	Architecture.load_architectures(force_reload=True)

	arch_names = [a.name for a in Architecture.architectures]
	compare = 'Side by side comparison'
	arch_names.append(compare)
	selected_arch = st.radio(label="Available architectures", label_visibility="hidden", options=arch_names, index=None)
	if selected_arch is None:
	st.info('Select an architecture from above to see details and interact with it')
	elif selected_arch == compare:
	show_side_by_side()
	else:
	show_architecture(selected_arch)