Update digestor.py
Browse files
- digestor.py +1 -1
digestor.py
CHANGED
|
@@ -136,7 +136,7 @@ class Digestor:
|
|
| 136 |
return json.loads(response.content.decode("utf-8"))
|
| 137 |
|
| 138 |
|
| 139 |
-
def chunk_piece(self, piece, limit, tokenizer_checkpoint, include_tail=
|
| 140 |
"""Breaks articles into chunks that will fit the desired token length limit"""
|
| 141 |
# Get approximate word count
|
| 142 |
words = len(piece.split(' ')) # rough estimate of words. # words <= number tokens generally.
|
|
|
|
| 136 |
return json.loads(response.content.decode("utf-8"))
|
| 137 |
|
| 138 |
|
| 139 |
+
def chunk_piece(self, piece, limit, tokenizer_checkpoint, include_tail=False):
|
| 140 |
"""Breaks articles into chunks that will fit the desired token length limit"""
|
| 141 |
# Get approximate word count
|
| 142 |
words = len(piece.split(' ')) # rough estimate of words. # words <= number tokens generally.
|