From 530d86fe1d492ab2995a9dcf439a6721af70d6eb Mon Sep 17 00:00:00 2001 From: George Tay <73705042+asdfghjkxd@users.noreply.github.com> Date: Wed, 2 Feb 2022 11:20:13 +0800 Subject: [PATCH] Compact Printouts --- pyfiles/pages/toolkit_nlp.py | 151 +++++++++++++++++++++++++---------- utils/helper.py | 16 +++- 2 files changed, 120 insertions(+), 47 deletions(-) diff --git a/pyfiles/pages/toolkit_nlp.py b/pyfiles/pages/toolkit_nlp.py index f2388f3..8b36312 100644 --- a/pyfiles/pages/toolkit_nlp.py +++ b/pyfiles/pages/toolkit_nlp.py @@ -1154,23 +1154,44 @@ def score2subject(score: int or float): st.markdown('---') st.markdown('### Save Data\n' '#### Topics') + collda, collda2 = st.columns(2) for index, data in enumerate(toolkit['TOPIC_TEXT']): if toolkit['OVERRIDE_FORMAT'] is not None: - st.markdown(prettyDownload( - object_to_download=data, - download_filename=f'lda_topics_{index}.{toolkit["OVERRIDE_FORMAT"].lower()}', - button_text=f'Download Topic List Data Entry {index}', - override_index=False, - format_=toolkit['OVERRIDE_FORMAT']), - unsafe_allow_html=True) + if (index + 1) % 2 != 0: + collda.markdown(prettyDownload( + object_to_download=data, + download_filename=f'lda_topics_{index + 1}.' + f'{toolkit["OVERRIDE_FORMAT"].lower()}', + button_text=f'Download Topic List Data Entry {index + 1}', + override_index=False, + format_=toolkit['OVERRIDE_FORMAT']), + unsafe_allow_html=True) + else: + collda2.markdown(prettyDownload( + object_to_download=data, + download_filename=f'lda_topics_{index + 1}.' + f'{toolkit["OVERRIDE_FORMAT"].lower()}', + button_text=f'Download Topic List Data Entry {index + 1}', + override_index=False, + format_=toolkit['OVERRIDE_FORMAT']), + unsafe_allow_html=True) else: - st.markdown(prettyDownload( - object_to_download=data, - download_filename=f'lda_topics_{index}.{toolkit["MODE"].lower()}', - button_text=f'Download Topic List Data Entry {index}', - override_index=False, - format_=toolkit['MODE']), - unsafe_allow_html=True) + if (index + 1) % 2 != 0: + collda.markdown(prettyDownload( + object_to_download=data, + download_filename=f'lda_topics_{index + 1}.{toolkit["MODE"].lower()}', + button_text=f'Download Topic List Data Entry {index + 1}', + override_index=False, + format_=toolkit['MODE']), + unsafe_allow_html=True) + else: + collda2.markdown(prettyDownload( + object_to_download=data, + download_filename=f'lda_topics_{index + 1}.{toolkit["MODE"].lower()}', + button_text=f'Download Topic List Data Entry {index + 1}', + override_index=False, + format_=toolkit['MODE']), + unsafe_allow_html=True) st.markdown('#### Topic/Word List') if toolkit['OVERRIDE_FORMAT'] is not None: @@ -1215,7 +1236,7 @@ def score2subject(score: int or float): l1_ratio=toolkit['L1_RATIO']).fit(toolkit['TFIDF_VECTORISED']) if toolkit['VERBOSE']: - st.markdown('### Model Data') + st.markdown('## Model Data') toolkit['TOPIC_TEXT'] = modelIterator(toolkit['NMF_MODEL'], toolkit['TFIDF_MODEL'], top_n=toolkit['NUM_TOPICS']) else: @@ -1240,23 +1261,44 @@ def score2subject(score: int or float): st.markdown('---') st.markdown('### Save Data\n' '#### Topics') + colnmf, colnmf2 = st.columns(2) for index, data in enumerate(toolkit['TOPIC_TEXT']): if toolkit['OVERRIDE_FORMAT'] is not None: - st.markdown(prettyDownload( - object_to_download=data, - download_filename=f'nmf_topics_{index}.{toolkit["OVERRIDE_FORMAT"].lower()}', - button_text=f'Download Topic List Data Entry {index}', - override_index=False, - format_=toolkit['OVERRIDE_FORMAT']), - unsafe_allow_html=True) + if (index + 1) % 2 != 0: + colnmf.markdown(prettyDownload( + object_to_download=data, + download_filename=f'nmf_topics_{index + 1}.' + f'{toolkit["OVERRIDE_FORMAT"].lower()}', + button_text=f'Download Topic List Data Entry {index + 1}', + override_index=False, + format_=toolkit['OVERRIDE_FORMAT']), + unsafe_allow_html=True) + else: + colnmf2.markdown(prettyDownload( + object_to_download=data, + download_filename=f'nmf_topics_{index + 1}.' + f'{toolkit["OVERRIDE_FORMAT"].lower()}', + button_text=f'Download Topic List Data Entry {index + 1}', + override_index=False, + format_=toolkit['OVERRIDE_FORMAT']), + unsafe_allow_html=True) else: - st.markdown(prettyDownload( - object_to_download=data, - download_filename=f'nmf_topics_{index}.{toolkit["MODE"].lower()}', - button_text=f'Download Topic List Data Entry {index}', - override_index=False, - format_=toolkit['MODE']), - unsafe_allow_html=True) + if (index + 1) % 2 != 0: + colnmf.markdown(prettyDownload( + object_to_download=data, + download_filename=f'nmf_topics_{index + 1}.{toolkit["MODE"].lower()}', + button_text=f'Download Topic List Data Entry {index + 1}', + override_index=False, + format_=toolkit['MODE']), + unsafe_allow_html=True) + else: + colnmf2.markdown(prettyDownload( + object_to_download=data, + download_filename=f'nmf_topics_{index + 1}.{toolkit["MODE"].lower()}', + button_text=f'Download Topic List Data Entry {index + 1}', + override_index=False, + format_=toolkit['MODE']), + unsafe_allow_html = True) st.markdown('#### Topic/Word List') if toolkit['OVERRIDE_FORMAT'] is not None: @@ -1283,7 +1325,7 @@ def score2subject(score: int or float): toolkit['LSI_DATA'] = toolkit['LSI_MODEL'].fit_transform(toolkit['VECTORISED']) if toolkit['VERBOSE']: - st.markdown('### Model Data') + st.markdown('## Model Data') toolkit['TOPIC_TEXT'] = modelIterator(toolkit['LSI_MODEL'], toolkit['CV'], top_n=toolkit['NUM_TOPICS']) else: @@ -1354,23 +1396,44 @@ def score2subject(score: int or float): st.markdown('---') st.markdown('### Save Data\n' '#### Topics') + collis, collis2 = st.columns(2) for index, data in enumerate(toolkit['TOPIC_TEXT']): if toolkit['OVERRIDE_FORMAT'] is not None: - st.markdown(prettyDownload( - object_to_download=data, - download_filename=f'lsi_topics_{index}.{toolkit["OVERRIDE_FORMAT"].lower()}', - button_text=f'Download Topic List Data Entry {index}', - override_index=False, - format_=toolkit['OVERRIDE_FORMAT']), - unsafe_allow_html=True) + if (index + 1) % 2 != 0: + collis.markdown(prettyDownload( + object_to_download=data, + download_filename=f'lsi_topics_{index + 1}.' + f'{toolkit["OVERRIDE_FORMAT"].lower()}', + button_text=f'Download Topic List Data Entry {index + 1}', + override_index=False, + format_=toolkit['OVERRIDE_FORMAT']), + unsafe_allow_html=True) + else: + collis2.markdown(prettyDownload( + object_to_download=data, + download_filename=f'lsi_topics_{index + 1}.' + f'{toolkit["OVERRIDE_FORMAT"].lower()}', + button_text=f'Download Topic List Data Entry {index + 1}', + override_index=False, + format_=toolkit['OVERRIDE_FORMAT']), + unsafe_allow_html=True) else: - st.markdown(prettyDownload( - object_to_download=data, - download_filename=f'lsi_topics_{index}.{toolkit["MODE"].lower()}', - button_text=f'Download Topic List Data Entry {index}', - override_index=False, - format_=toolkit['MODE']), - unsafe_allow_html=True) + if (index + 1) % 2 != 0: + collis.markdown(prettyDownload( + object_to_download=data, + download_filename=f'lsi_topics_{index + 1}.{toolkit["MODE"].lower()}', + button_text=f'Download Topic List Data Entry {index + 1}', + override_index=False, + format_=toolkit['MODE']), + unsafe_allow_html=True) + else: + collis2.markdown(prettyDownload( + object_to_download=data, + download_filename=f'lsi_topics_{index + 1}.{toolkit["MODE"].lower()}', + button_text=f'Download Topic List Data Entry {index + 1}', + override_index=False, + format_=toolkit['MODE']), + unsafe_allow_html=True) st.markdown('#### Topic/Word List') if toolkit['OVERRIDE_FORMAT'] is not None: diff --git a/utils/helper.py b/utils/helper.py index a75013e..03709a6 100644 --- a/utils/helper.py +++ b/utils/helper.py @@ -149,12 +149,22 @@ def modelIterator(model, vectoriser, top_n, vb=True): index=range(len(lister)), columns=['word', 'weight']) - if vb: - st.markdown(f'### Topic {id_}') - st.dataframe(df) + # if vb: + # st.markdown(f'### Topic {id_}') + # st.dataframe(df) frame_list.append(df) + if vb: + colx, coly = st.columns(2) + for order, data in enumerate(frame_list): + if (order + 1) % 2 != 0: + colx.markdown(f'### Topic {order + 1}') + colx.dataframe(data) + else: + coly.markdown(f'### Topic {order + 1}') + coly.dataframe(data) + return frame_list