Spaces:

green
/

TopicDig

Runtime error

App Files Files Community

m. polinsky committed on Mar 28, 2022

Commit

9604970

unverified ·

1 Parent(s): e037e33

Update streamlit_app.py

Browse files

Files changed (1) hide show

streamlit_app.py +58 -62

streamlit_app.py CHANGED Viewed

@@ -15,10 +15,7 @@ from source import Source
 from scrape_sources import NPRLite, CNNText, stub
 import random
-# EDIT: before doing NER check time of last scrape and just read in from JSON store instead of rescraping
-# can force rescrape
-# This may take a config to get sources as input
-@st.cache()
 def initialize(limit, rando, use_cache=True):
     clusters: dict[str:List[namedtuple]] = dict()
     # This is a container for the source classes.
@@ -157,7 +154,7 @@ def ner_results(ner_object, groups=True, NER_THRESHOLD=0.5) -> List[str]:
 NER_API_URL =  "https://api-inference.huggingface.co/models/dbmdz/bert-large-cased-finetuned-conll03-english"
 headers = {"Authorization": f"""Bearer {st.secrets['ato']}"""}
-LIMIT = None # Controls time and number of clusters.
 USE_CACHE = True
 if not USE_CACHE:
@@ -176,60 +173,59 @@ article_dict, clusters = initialize(LIMIT, USE_CACHE)
 # We now have clusters and cluster data.  Redundancy.
 # We call a display function and get the user input.
 # For this its still streamlit.
-loop_control = 'y'
-while loop_control == 'y':
-    selections = []
-    choices = list(clusters.keys())
-    choices.insert(0,'None')
-    # Form used to take 3 menu inputs
-    with st.form(key='columns_in_form'):
-        cols = st.columns(3)
-        for i, col in enumerate(cols):
-            selections.append(col.selectbox(f'Make a Selection', choices, key=i))
-        submitted = st.form_submit_button('Submit')
-        if submitted:
-            selections = [i for i in selections if i is not None]
-            with st.spinner(text="Digesting...please wait, this will take a few moments...Maybe check some messages or start reading the latest papers on summarization with transformers...."):
-                found = False
-                # Check if we already have this digest.
-                for i in digests:
-                    if set(selections) == set(list(i)):
-                        digestor = digests[i]
-                        found = True
-                        break
-                # If we need a new digest
-                if not found:
-                    chosen = []
-                    # Why not just use answers.values()?
-                    for i in selections: # i is supposed to be a list of stubs, mostly one
-                        if i != 'None':
-                            for j in clusters[i]:
-                                if j not in chosen:
-                                    chosen.append(j) # j is supposed to be a stub.
-                    # Article dict contains stubs for unprocessed articles and lists of summarized chunks for processed ones.
-                    # Here we put together a list of article stubs and/or summary chunks and let the digestor sort out what it does with them,
-                    chosen = [i if isinstance(article_dict[i.hed], stub) else article_dict[i.hed] for i in chosen]
-                    # Digestor uses 'chosen', passed through 'stubs' to create digest.
-                    # 'user_choicese' is passed for reference.
-                    #    Passing list(answers.values()) includes 'None' choices.
-                    digestor = Digestor(timer=Timer(), cache = USE_CACHE, stubs=chosen, user_choices=list(selections))
-                    # happens internally but may be used differently so it isn't automatic upon digestor creation.
-                    # Easily turn caching off for testing.
-                    digestor.digest() # creates summaries and stores them associated with the digest
-                # Get displayable digest and digest data
-                digestor.build_digest()# only returns for data collection
-                digests[tuple(digestor.user_choices)] = digestor
-            if len(digestor.text) == 0:
-                st.write("You didn't select a topic!")
-            else:
-                st.write("Your digest is ready:\n")
-            st.write(digestor.text)
-    loop_control = input('Y to continue...')

 from scrape_sources import NPRLite, CNNText, stub
 import random
 def initialize(limit, rando, use_cache=True):
     clusters: dict[str:List[namedtuple]] = dict()
     # This is a container for the source classes.
 NER_API_URL =  "https://api-inference.huggingface.co/models/dbmdz/bert-large-cased-finetuned-conll03-english"
 headers = {"Authorization": f"""Bearer {st.secrets['ato']}"""}
+LIMIT = 20 # Controls time and number of clusters.
 USE_CACHE = True
 if not USE_CACHE:
 # We now have clusters and cluster data.  Redundancy.
 # We call a display function and get the user input.
 # For this it's still Streamlit.
+selections = []
+choices = list(clusters.keys())
+choices.insert(0,'None')
+# Form used to take 3 menu inputs
+with st.form(key='columns_in_form'):
+    cols = st.columns(3)
+    for i, col in enumerate(cols):
+        selections.append(col.selectbox(f'Make a Selection', choices, key=i))
+    submitted = st.form_submit_button('Submit')
+    if submitted:
+        selections = [i for i in selections if i is not None]
+        with st.spinner(text="Digesting...please wait, this will take a few moments...Maybe check some messages or start reading the latest papers on summarization with transformers...."):
+            found = False
+            # Check if we already have this digest.
+            for i in digests:
+                if set(selections) == set(list(i)):
+                    digestor = digests[i]
+                    found = True
+                    break
+            # If we need a new digest
+            if not found:
+                chosen = []
+                # Why not just use answers.values()?
+                for i in selections: # i is supposed to be a list of stubs, mostly one
+                    if i != 'None':
+                        for j in clusters[i]:
+                            if j not in chosen:
+                                chosen.append(j) # j is supposed to be a stub.
+                # Article dict contains stubs for unprocessed articles and lists of summarized chunks for processed ones.
+                # Here we put together a list of article stubs and/or summary chunks and let the digestor sort out what it does with them.
+                chosen = [i if isinstance(article_dict[i.hed], stub) else article_dict[i.hed] for i in chosen]
+                # Digestor uses 'chosen', passed through 'stubs' to create digest.
+                # 'user_choices' is passed for reference.
+                #    Passing list(answers.values()) includes 'None' choices.
+                digestor = Digestor(timer=Timer(), cache = USE_CACHE, stubs=chosen, user_choices=list(selections))
+                # happens internally but may be used differently so it isn't automatic upon digestor creation.
+                # Easily turn caching off for testing.
+                digestor.digest() # creates summaries and stores them associated with the digest
+            # Get displayable digest and digest data
+            digestor.build_digest()# only returns for data collection
+            digests[tuple(digestor.user_choices)] = digestor
+        if len(digestor.text) == 0:
+            st.write("You didn't select a topic!")
+        else:
+            st.write("Your digest is ready:\n")
+        st.write(digestor.text)