Update digestor.py
Browse files- digestor.py +2 -2
digestor.py
CHANGED
@@ -41,7 +41,7 @@ class Digestor:
     ]) = None

     # Summarization params:
-    token_limit: int =
+    token_limit: int = 1024
     word_limit: int = 400
     SUMMARIZATION_PARAMETERS = {
         "do_sample": False,
@@ -139,7 +139,7 @@ class Digestor:
         """Breaks articles into chunks that will fit the desired token length limit"""
         # Get approximate word count
         words = len(piece.split(' ')) # rough estimate of words. # words <= number tokens generally.
-        # get number of chunks by
+        # get number of chunks by dividing number of words by chunk size (word limit)
         # Create list of ints to create rangelist from
         base_range = [i*limit for i in range(words//limit+1)]
         # For articles less than limit in length base_range will only contain zero.
|