Spaces:

awacke1
/

BERTopic-Topic-Modeler-NLP-ML

Runtime error

App Files Community

awacke1 committed on Mar 20, 2023

Commit

06e9888

1 Parent(s): 09d04b2

Update app.py

Browse files

Files changed (1) hide show

app.py +14 -9

app.py CHANGED Viewed

@@ -9,15 +9,15 @@ from hdbscan import HDBSCAN
 from sklearn.feature_extraction.text import CountVectorizer
 st.set_page_config(page_title="HF-BERTopic")
-st.title("HF-BERTopic A front end for BERTopic")
-st.caption("By Allen Roush")
-st.caption("github: https://github.com/Hellisotherpeople")
-st.caption("Linkedin: https://www.linkedin.com/in/allen-roush-27721011b/")
-st.image("https://raw.githubusercontent.com/MaartenGr/BERTopic/master/images/logo.png", width = 380)
-st.caption("By Maarten Grootendorst")
-st.caption("github: https://github.com/MaartenGr/BERTopic")
-st.caption("Linkedin: https://www.linkedin.com/in/mgrootendorst/")
-st.image("https://maartengr.github.io/BERTopic/img/algorithm.png")
 form = st.sidebar.form("Main Settings")
@@ -28,10 +28,15 @@ form.header("Main Settings")
 dataset_name = form.text_area("Enter the name of the huggingface dataset to do analysis of:", value = "Hellisotherpeople/DebateSum")
 dataset_name_2 = form.text_area("Enter the name of the config for the dataset if it has one", value = "")
 split_name = form.text_area("Enter the name of the split of the dataset that you want to use", value = "train")
 number_of_records = form.number_input("Enter the number of documents that you want to analyze from the dataset", value = 200)
 column_name = form.text_area("Enter the name of the column that we are doing analysis on (the X value)", value = "Full-Document")
 labels = form.checkbox("Does this dataset have labels that you want to use?", value = True)
 if labels == True:
     labels_column_name = form.text_area("Enter the name of the column that we are using for labels doing analysis on (the Y value)", value = "OriginalDebateFileName")

 from sklearn.feature_extraction.text import CountVectorizer
 st.set_page_config(page_title="HF-BERTopic")
+#st.title("HF-BERTopic A front end for BERTopic")
+#st.caption("By Allen Roush")
+#st.caption("github: https://github.com/Hellisotherpeople")
+#st.caption("Linkedin: https://www.linkedin.com/in/allen-roush-27721011b/")
+#st.image("https://raw.githubusercontent.com/MaartenGr/BERTopic/master/images/logo.png", width = 380)
+#st.caption("By Maarten Grootendorst")
+#st.caption("github: https://github.com/MaartenGr/BERTopic")
+#st.caption("Linkedin: https://www.linkedin.com/in/mgrootendorst/")
+#st.image("https://maartengr.github.io/BERTopic/img/algorithm.png")
 form = st.sidebar.form("Main Settings")
 dataset_name = form.text_area("Enter the name of the huggingface dataset to do analysis of:", value = "Hellisotherpeople/DebateSum")
 dataset_name_2 = form.text_area("Enter the name of the config for the dataset if it has one", value = "")
 split_name = form.text_area("Enter the name of the split of the dataset that you want to use", value = "train")
 number_of_records = form.number_input("Enter the number of documents that you want to analyze from the dataset", value = 200)
 column_name = form.text_area("Enter the name of the column that we are doing analysis on (the X value)", value = "Full-Document")
 labels = form.checkbox("Does this dataset have labels that you want to use?", value = True)
 if labels == True:
     labels_column_name = form.text_area("Enter the name of the column that we are using for labels doing analysis on (the Y value)", value = "OriginalDebateFileName")