|
import streamlit as st |
|
import os |
|
import json |
|
def is_new_file_upload(uploaded_file): |
|
if 'last_uploaded_file' in st.session_state: |
|
|
|
if (uploaded_file.name != st.session_state.last_uploaded_file['name'] or |
|
uploaded_file.size != st.session_state.last_uploaded_file['size']): |
|
st.session_state.last_uploaded_file = {'name': uploaded_file.name, 'size': uploaded_file.size} |
|
|
|
return True |
|
else: |
|
|
|
return False |
|
else: |
|
|
|
st.session_state.last_uploaded_file = {'name': uploaded_file.name, 'size': uploaded_file.size} |
|
return True |
|
big_text = """ |
|
<div style='text-align: center;'> |
|
<h1 style='font-size: 30x;'>Knowledge Extraction 1</h1> |
|
</div> |
|
""" |
|
|
|
st.markdown(big_text, unsafe_allow_html=True) |
|
|
|
uploaded_json_file = st.file_uploader("Upload a pre-processed file", |
|
type=['json']) |
|
st.markdown( |
|
f'<a href="https://ikmtechnology.github.io/ikmtechnology/untethered_extracted_paragraphs.json" target="_blank">Sample 1 download and then upload to above</a>', |
|
unsafe_allow_html=True) |
|
|
|
if uploaded_json_file is not None: |
|
if is_new_file_upload(uploaded_json_file): |
|
print("is new file uploaded") |
|
save_path = './uploaded_files' |
|
if not os.path.exists(save_path): |
|
os.makedirs(save_path) |
|
with open(os.path.join(save_path, uploaded_json_file.name), "wb") as f: |
|
f.write(uploaded_json_file.getbuffer()) |
|
st.success(f'Saved file temp_{uploaded_json_file.name} in {save_path}') |
|
st.session_state.uploaded_path=os.path.join(save_path, uploaded_json_file.name) |
|
|
|
|
|
content = uploaded_json_file.read() |
|
try: |
|
data = json.loads(content) |
|
|
|
|
|
if isinstance(data, list): |
|
|
|
st.session_state.list_count = len(data) |
|
st.write(f'The number of elements at the top level of the hierarchy: {st.session_state.list_count }') |
|
else: |
|
st.write('The JSON content is not a dictionary.') |
|
except json.JSONDecodeError: |
|
st.write('Invalid JSON file.') |
|
st.rerun() |
|
|
|
if 'list_count' in st.session_state: |
|
st.write(f'The number of elements at the top level of the hierarchy: {st.session_state.list_count }') |