Spaces:

alfraser
/

llm-arch

Runtime error

App Files Files Community

alfraser committed on Jan 25, 2024

Commit

57b94ca

1 Parent(s): 79f35e2

Added ability to select which models to compare side by side, allowing for more flexibility in testing my fine-tuned llamas

Browse files

Files changed (1) hide show

pages/010_LLM_Architectures.py +40 -31

pages/010_LLM_Architectures.py CHANGED Viewed

@@ -17,43 +17,52 @@ def show_side_by_side() -> None:
     st.divider()
     header_container = st.container()
     arch_outer_container = st.container()
-    with arch_outer_container:
-        arch_cols = st.columns(len(Architecture.architectures))
     # Build header
     with header_container:
         st.write("### Side by side comparison of architectures")
-        st.write('Enter a question below to have it sent to all available architectures to compare timing and response.')
-        prompt = st.chat_input("Ask a question")
-        if prompt:
-            st.write(f"**Question:** {prompt}")
-    # Now build the columns
-    with arch_outer_container:
-        if prompt:
-            # Build columns per architecture
-            for i, a in enumerate(Architecture.architectures):
-                with arch_cols[i]:
-                    st.write(f'#### {a.name}')
-            # Now dispatch the messages per architecture
-            group_tag = generate_group_tag()
-            for i, a in enumerate(Architecture.architectures):
-                request = ArchitectureRequest(query=prompt)
-                with arch_cols[i]:
-                    with st.spinner('Architecture processing request'):
-                        start = time()
-                        a(request, trace_tags=["UI", "SideBySideCompare", group_tag])
-                        elapsed_in_s = (int((time() - start) * 10))/10  # round to 1dp in seconds
-                        st.write('##### Timing')
-                        st.write(f'Request took **{elapsed_in_s}s**')
-                        st.write('##### Response')
-                        st.write(request.response)
         else:
-            # Build columns per architecture for display only
-            for i, a in enumerate(Architecture.architectures):
-                with arch_cols[i]:
-                    st.write(f'#### {a.name}')
 def show_architecture(architecture: str) -> None:

     st.divider()
     header_container = st.container()
     arch_outer_container = st.container()
     # Build header
     with header_container:
         st.write("### Side by side comparison of architectures")
+        st.write('Enter a question below to have it sent to the selected architectures to compare timing and response.')
+        options = [a.name for a in Architecture.architectures]
+        selected_archs = st.multiselect("Select architectures to use", options=options, default=options)
+        if len(selected_archs) == 0:
+            st.write("To get started select some architectures to compare")
         else:
+            prompt = st.chat_input("Ask a question")
+            if prompt:
+                st.write(f"**Question:** {prompt}")
+    # Now build the columns
+    if len(selected_archs) > 0:
+        with arch_outer_container:
+            arch_cols = st.columns(len(selected_archs))
+            if prompt:
+                # Build columns per architecture
+                for i, a in enumerate(selected_archs):
+                    with arch_cols[i]:
+                        st.write(f'#### {a}')
+                # Now dispatch the messages per architecture
+                group_tag = generate_group_tag()
+                for i, a in enumerate(selected_archs):
+                    request = ArchitectureRequest(query=prompt)
+                    arch = Architecture.get_architecture(a)
+                    with arch_cols[i]:
+                        with st.spinner('Architecture processing request'):
+                            start = time()
+                            arch(request, trace_tags=["UI", "SideBySideCompare", group_tag])
+                            elapsed_in_s = (int((time() - start) * 10))/10  # round to 1dp in seconds
+                            st.write('##### Timing')
+                            st.write(f'Request took **{elapsed_in_s}s**')
+                            st.write('##### Response')
+                            st.write(request.response)
+            else:
+                # Build columns per architecture for display only
+                for i, a in enumerate(selected_archs):
+                    with arch_cols[i]:
+                        st.write(f'#### {a}')
 def show_architecture(architecture: str) -> None: