green committed on
Commit
63010fb
1 Parent(s): 7348b09

Update digestor.py

Browse files
Files changed (1) hide show
  1. digestor.py +1 -1
digestor.py CHANGED
@@ -136,7 +136,7 @@ class Digestor:
136
  return json.loads(response.content.decode("utf-8"))
137
 
138
 
139
- def chunk_piece(self, piece, limit, tokenizer_checkpoint, include_tail=True):
140
  """Breaks articles into chunks that will fit the desired token length limit"""
141
  # Get approximate word count
142
  words = len(piece.split(' ')) # rough estimate of words. # words <= number tokens generally.
136
  return json.loads(response.content.decode("utf-8"))
137
 
138
 
139
+ def chunk_piece(self, piece, limit, tokenizer_checkpoint, include_tail=False):
140
  """Breaks articles into chunks that will fit the desired token length limit"""
141
  # Get approximate word count
142
  words = len(piece.split(' ')) # rough estimate of words. # words <= number tokens generally.