Step... (186000/250000 | Loss: 1.7381113767623901, Acc: 0.6502522826194763): 74%|█████████████████ | 186090/250000 [2:39:06<32:58:04, 1.86s/it]
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- flax_model.msgpack +1 -1
- mc4/mc4.py +12 -9
- outputs/checkpoints/checkpoint-140001/training_state.json +0 -1
- outputs/checkpoints/checkpoint-150001/training_state.json +0 -1
- outputs/checkpoints/checkpoint-160001/training_state.json +0 -1
- outputs/checkpoints/checkpoint-170001/training_state.json +0 -1
- outputs/checkpoints/checkpoint-180001/data_collator.joblib +0 -3
- outputs/checkpoints/checkpoint-180001/flax_model.msgpack +0 -3
- outputs/checkpoints/checkpoint-180001/optimizer_state.msgpack +0 -3
- outputs/checkpoints/checkpoint-180001/training_args.joblib +0 -3
- outputs/checkpoints/checkpoint-180001/training_state.json +0 -1
- outputs/checkpoints/{checkpoint-140001 → checkpoint-182000}/config.json +0 -0
- outputs/checkpoints/{checkpoint-140001 → checkpoint-182000}/data_collator.joblib +2 -2
- outputs/checkpoints/{checkpoint-150001 → checkpoint-182000}/flax_model.msgpack +1 -1
- outputs/checkpoints/{checkpoint-150001 → checkpoint-182000}/optimizer_state.msgpack +1 -1
- outputs/checkpoints/{checkpoint-160001 → checkpoint-182000}/training_args.joblib +2 -2
- outputs/checkpoints/checkpoint-182000/training_state.json +1 -0
- outputs/checkpoints/{checkpoint-150001 → checkpoint-183000}/config.json +0 -0
- outputs/checkpoints/{checkpoint-150001 → checkpoint-183000}/data_collator.joblib +2 -2
- outputs/checkpoints/{checkpoint-140001 → checkpoint-183000}/flax_model.msgpack +1 -1
- outputs/checkpoints/{checkpoint-160001 → checkpoint-183000}/optimizer_state.msgpack +1 -1
- outputs/checkpoints/{checkpoint-170001 → checkpoint-183000}/training_args.joblib +2 -2
- outputs/checkpoints/checkpoint-183000/training_state.json +1 -0
- outputs/checkpoints/{checkpoint-160001 → checkpoint-184000}/config.json +0 -0
- outputs/checkpoints/{checkpoint-160001 → checkpoint-184000}/data_collator.joblib +2 -2
- outputs/checkpoints/{checkpoint-160001 → checkpoint-184000}/flax_model.msgpack +1 -1
- outputs/checkpoints/{checkpoint-140001 → checkpoint-184000}/optimizer_state.msgpack +1 -1
- outputs/checkpoints/{checkpoint-150001 → checkpoint-184000}/training_args.joblib +2 -2
- outputs/checkpoints/checkpoint-184000/training_state.json +1 -0
- outputs/checkpoints/{checkpoint-170001 → checkpoint-185000}/config.json +0 -0
- outputs/checkpoints/{checkpoint-170001 → checkpoint-185000}/data_collator.joblib +2 -2
- outputs/checkpoints/{checkpoint-170001 → checkpoint-185000}/flax_model.msgpack +1 -1
- outputs/checkpoints/{checkpoint-170001 → checkpoint-185000}/optimizer_state.msgpack +1 -1
- outputs/checkpoints/{checkpoint-140001 → checkpoint-185000}/training_args.joblib +2 -2
- outputs/checkpoints/checkpoint-185000/training_state.json +1 -0
- outputs/checkpoints/{checkpoint-180001 → checkpoint-186000}/config.json +0 -0
- outputs/checkpoints/checkpoint-186000/data_collator.joblib +3 -0
- outputs/checkpoints/checkpoint-186000/flax_model.msgpack +3 -0
- outputs/checkpoints/checkpoint-186000/optimizer_state.msgpack +3 -0
- outputs/checkpoints/checkpoint-186000/training_args.joblib +3 -0
- outputs/checkpoints/checkpoint-186000/training_state.json +1 -0
- outputs/data_collator.joblib +2 -2
- outputs/events.out.tfevents.1627122688.tablespoon.2185269.3.v2 +3 -0
- outputs/events.out.tfevents.1627122817.tablespoon.2191003.3.v2 +3 -0
- outputs/events.out.tfevents.1627125745.tablespoon.2266135.3.v2 +3 -0
- outputs/events.out.tfevents.1627128247.tablespoon.2330108.3.v2 +3 -0
- outputs/flax_model.msgpack +1 -1
- outputs/optimizer_state.msgpack +1 -1
- outputs/training_args.joblib +2 -2
- outputs/training_state.json +1 -1
flax_model.msgpack
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 249750019
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3362fadd5306539e1775600df59349acf0fd260751129abaa45b997091d089ce
|
3 |
size 249750019
|
mc4/mc4.py
CHANGED
@@ -1,11 +1,11 @@
|
|
1 |
-
"""mC4 dataset based on Common Crawl."""
|
2 |
|
3 |
|
4 |
import gzip
|
5 |
import json
|
6 |
|
7 |
import datasets
|
8 |
-
import kenlm
|
9 |
import numpy as np
|
10 |
from numpy.random import default_rng
|
11 |
|
@@ -289,6 +289,7 @@ class Mc4(datasets.GeneratorBasedBuilder):
|
|
289 |
self.sampling_factor = kwargs.pop("sampling_factor", None)
|
290 |
self.boundaries = kwargs.pop("boundaries", None)
|
291 |
self.seed = kwargs.pop("seed", None)
|
|
|
292 |
if self.sampling_method:
|
293 |
if self.seed is not None:
|
294 |
self.rng = default_rng(self.seed)
|
@@ -316,7 +317,7 @@ class Mc4(datasets.GeneratorBasedBuilder):
|
|
316 |
doc_length += length
|
317 |
return 10.0 ** (-doc_log_score / doc_length)
|
318 |
|
319 |
-
def _should_keep_doc_step(self, doc, factor=1.5e5, boundaries=None):
|
320 |
perplexity = self.get_perplexity(doc)
|
321 |
if boundaries is None:
|
322 |
boundaries = [536394.99320948, 662247.50212365, 919250.87225178]
|
@@ -331,17 +332,18 @@ class Mc4(datasets.GeneratorBasedBuilder):
|
|
331 |
probability = factor / quartile_range
|
332 |
return self.rng.uniform() < probability
|
333 |
|
334 |
-
def _should_keep_doc_gaussian(self, doc, factor=0.78, boundaries=None):
|
|
|
335 |
perplexity = self.get_perplexity(doc)
|
336 |
if boundaries is not None:
|
337 |
m = boundaries[1]
|
338 |
else:
|
339 |
m = 662247.50212365
|
340 |
-
exponential = np.exp(-
|
341 |
weighted_perplexity = factor * exponential
|
342 |
return self.rng.uniform() < weighted_perplexity
|
343 |
|
344 |
-
def _should_keep_doc_random(self, doc, factor=None, boundaries=None):
|
345 |
if factor is None:
|
346 |
factor = 0.5
|
347 |
return self.rng.uniform() <= factor
|
@@ -374,13 +376,13 @@ class Mc4(datasets.GeneratorBasedBuilder):
|
|
374 |
for lang in self.config.languages
|
375 |
for index in range(_N_SHARDS_PER_SPLIT[lang][split])
|
376 |
]
|
377 |
-
if "train" in self.data_files:
|
378 |
train_downloaded_files = self.data_files["train"]
|
379 |
if not isinstance(train_downloaded_files, (tuple, list)):
|
380 |
train_downloaded_files = [train_downloaded_files]
|
381 |
else:
|
382 |
train_downloaded_files = dl_manager.download(data_urls["train"])
|
383 |
-
if "validation" in self.data_files:
|
384 |
validation_downloaded_files = self.data_files["validation"]
|
385 |
if not isinstance(validation_downloaded_files, (tuple, list)):
|
386 |
validation_downloaded_files = [validation_downloaded_files]
|
@@ -415,7 +417,8 @@ class Mc4(datasets.GeneratorBasedBuilder):
|
|
415 |
if self.should_keep_doc(
|
416 |
example["text"],
|
417 |
factor=self.sampling_factor,
|
418 |
-
boundaries=self.boundaries):
|
|
|
419 |
yield id_, example
|
420 |
id_ += 1
|
421 |
else:
|
|
|
1 |
+
"""Perplexity Sampled mC4 dataset based on Common Crawl."""
|
2 |
|
3 |
|
4 |
import gzip
|
5 |
import json
|
6 |
|
7 |
import datasets
|
8 |
+
import kenlm # pip install https://github.com/kpu/kenlm/archive/master.zip
|
9 |
import numpy as np
|
10 |
from numpy.random import default_rng
|
11 |
|
|
|
289 |
self.sampling_factor = kwargs.pop("sampling_factor", None)
|
290 |
self.boundaries = kwargs.pop("boundaries", None)
|
291 |
self.seed = kwargs.pop("seed", None)
|
292 |
+
self.kwargs = kwargs
|
293 |
if self.sampling_method:
|
294 |
if self.seed is not None:
|
295 |
self.rng = default_rng(self.seed)
|
|
|
317 |
doc_length += length
|
318 |
return 10.0 ** (-doc_log_score / doc_length)
|
319 |
|
320 |
+
def _should_keep_doc_step(self, doc, factor=1.5e5, boundaries=None, **kwargs):
|
321 |
perplexity = self.get_perplexity(doc)
|
322 |
if boundaries is None:
|
323 |
boundaries = [536394.99320948, 662247.50212365, 919250.87225178]
|
|
|
332 |
probability = factor / quartile_range
|
333 |
return self.rng.uniform() < probability
|
334 |
|
335 |
+
def _should_keep_doc_gaussian(self, doc, factor=0.78, boundaries=None, **kwargs):
|
336 |
+
width = kwargs.get("width", 9 / 2) # width (spread) of the exponential curve
|
337 |
perplexity = self.get_perplexity(doc)
|
338 |
if boundaries is not None:
|
339 |
m = boundaries[1]
|
340 |
else:
|
341 |
m = 662247.50212365
|
342 |
+
exponential = np.exp((-1 / width) * ((perplexity - m) / m) ** 2)
|
343 |
weighted_perplexity = factor * exponential
|
344 |
return self.rng.uniform() < weighted_perplexity
|
345 |
|
346 |
+
def _should_keep_doc_random(self, doc, factor=None, boundaries=None, **kwargs):
|
347 |
if factor is None:
|
348 |
factor = 0.5
|
349 |
return self.rng.uniform() <= factor
|
|
|
376 |
for lang in self.config.languages
|
377 |
for index in range(_N_SHARDS_PER_SPLIT[lang][split])
|
378 |
]
|
379 |
+
if self.data_files and "train" in self.data_files:
|
380 |
train_downloaded_files = self.data_files["train"]
|
381 |
if not isinstance(train_downloaded_files, (tuple, list)):
|
382 |
train_downloaded_files = [train_downloaded_files]
|
383 |
else:
|
384 |
train_downloaded_files = dl_manager.download(data_urls["train"])
|
385 |
+
if self.data_files and "validation" in self.data_files:
|
386 |
validation_downloaded_files = self.data_files["validation"]
|
387 |
if not isinstance(validation_downloaded_files, (tuple, list)):
|
388 |
validation_downloaded_files = [validation_downloaded_files]
|
|
|
417 |
if self.should_keep_doc(
|
418 |
example["text"],
|
419 |
factor=self.sampling_factor,
|
420 |
+
boundaries=self.boundaries,
|
421 |
+
**self.kwargs):
|
422 |
yield id_, example
|
423 |
id_ += 1
|
424 |
else:
|
outputs/checkpoints/checkpoint-140001/training_state.json
DELETED
@@ -1 +0,0 @@
|
|
1 |
-
{"step": 140001}
|
|
|
|
outputs/checkpoints/checkpoint-150001/training_state.json
DELETED
@@ -1 +0,0 @@
|
|
1 |
-
{"step": 150001}
|
|
|
|
outputs/checkpoints/checkpoint-160001/training_state.json
DELETED
@@ -1 +0,0 @@
|
|
1 |
-
{"step": 160001}
|
|
|
|
outputs/checkpoints/checkpoint-170001/training_state.json
DELETED
@@ -1 +0,0 @@
|
|
1 |
-
{"step": 170001}
|
|
|
|
outputs/checkpoints/checkpoint-180001/data_collator.joblib
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:e02a6e9cfa63cb321cac9402efd29841b652999fcbf787800ae050e747b161ee
|
3 |
-
size 1471394
|
|
|
|
|
|
|
|
outputs/checkpoints/checkpoint-180001/flax_model.msgpack
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:393c37966461709fe51a3b3f84befb7fa7e5030025856d171308efd40dbbc7da
|
3 |
-
size 249750019
|
|
|
|
|
|
|
|
outputs/checkpoints/checkpoint-180001/optimizer_state.msgpack
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:3a33cad417a7e78eaafc1c041f93fd54ad9f63869d01e1351bac4abcd58e4eeb
|
3 |
-
size 499500278
|
|
|
|
|
|
|
|
outputs/checkpoints/checkpoint-180001/training_args.joblib
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:8bc14fe16573d318dd510c7cfb42ebb7cc87b4dcf77e99247a2d1605cffd772b
|
3 |
-
size 1876
|
|
|
|
|
|
|
|
outputs/checkpoints/checkpoint-180001/training_state.json
DELETED
@@ -1 +0,0 @@
|
|
1 |
-
{"step": 180001}
|
|
|
|
outputs/checkpoints/{checkpoint-140001 → checkpoint-182000}/config.json
RENAMED
File without changes
|
outputs/checkpoints/{checkpoint-140001 → checkpoint-182000}/data_collator.joblib
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0321b1a9629e1be122045cd72470365a63c8496fec109fdeec34827f01ffbb9e
|
3 |
+
size 1471424
|
outputs/checkpoints/{checkpoint-150001 → checkpoint-182000}/flax_model.msgpack
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 249750019
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73b385f39d585a15aeee595103523252872a4277da8c21c9bc9bbfd0232a72c9
|
3 |
size 249750019
|
outputs/checkpoints/{checkpoint-150001 → checkpoint-182000}/optimizer_state.msgpack
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 499500278
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6c074f7bc1330f514d95eb6277f0232abc85b0ec2f8c1c5972fd46af01985d4
|
3 |
size 499500278
|
outputs/checkpoints/{checkpoint-160001 → checkpoint-182000}/training_args.joblib
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79196d5f797a7527e60287e48f716fd4626c5d57186661d6a214a2027998c86d
|
3 |
+
size 1873
|
outputs/checkpoints/checkpoint-182000/training_state.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"step": 182001}
|
outputs/checkpoints/{checkpoint-150001 → checkpoint-183000}/config.json
RENAMED
File without changes
|
outputs/checkpoints/{checkpoint-150001 → checkpoint-183000}/data_collator.joblib
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0321b1a9629e1be122045cd72470365a63c8496fec109fdeec34827f01ffbb9e
|
3 |
+
size 1471424
|
outputs/checkpoints/{checkpoint-140001 → checkpoint-183000}/flax_model.msgpack
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 249750019
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0059f1c021d4be233f41fc29384c42e8844d69c44e1d31806620a38d76d6aa00
|
3 |
size 249750019
|
outputs/checkpoints/{checkpoint-160001 → checkpoint-183000}/optimizer_state.msgpack
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 499500278
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e99296d552d436c722721d611be2ed7cf4862c4b6a40abbc3464f7a75ca25c58
|
3 |
size 499500278
|
outputs/checkpoints/{checkpoint-170001 → checkpoint-183000}/training_args.joblib
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79196d5f797a7527e60287e48f716fd4626c5d57186661d6a214a2027998c86d
|
3 |
+
size 1873
|
outputs/checkpoints/checkpoint-183000/training_state.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"step": 183001}
|
outputs/checkpoints/{checkpoint-160001 → checkpoint-184000}/config.json
RENAMED
File without changes
|
outputs/checkpoints/{checkpoint-160001 → checkpoint-184000}/data_collator.joblib
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0321b1a9629e1be122045cd72470365a63c8496fec109fdeec34827f01ffbb9e
|
3 |
+
size 1471424
|
outputs/checkpoints/{checkpoint-160001 → checkpoint-184000}/flax_model.msgpack
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 249750019
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5063b47bd0228e701c1cbc12f4ce305c577868d34589323f88eb3ca2057b322d
|
3 |
size 249750019
|
outputs/checkpoints/{checkpoint-140001 → checkpoint-184000}/optimizer_state.msgpack
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 499500278
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03b1a223244cdeec59f4a501edcc3e29d75fa5a7467d514c3c30d9a2fcb49401
|
3 |
size 499500278
|
outputs/checkpoints/{checkpoint-150001 → checkpoint-184000}/training_args.joblib
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79196d5f797a7527e60287e48f716fd4626c5d57186661d6a214a2027998c86d
|
3 |
+
size 1873
|
outputs/checkpoints/checkpoint-184000/training_state.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"step": 184001}
|
outputs/checkpoints/{checkpoint-170001 → checkpoint-185000}/config.json
RENAMED
File without changes
|
outputs/checkpoints/{checkpoint-170001 → checkpoint-185000}/data_collator.joblib
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0321b1a9629e1be122045cd72470365a63c8496fec109fdeec34827f01ffbb9e
|
3 |
+
size 1471424
|
outputs/checkpoints/{checkpoint-170001 → checkpoint-185000}/flax_model.msgpack
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 249750019
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53e61bbf07baa76be1c67dcb57fd59f87d0171d7ce5ebdff16e054e5e4c547fe
|
3 |
size 249750019
|
outputs/checkpoints/{checkpoint-170001 → checkpoint-185000}/optimizer_state.msgpack
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 499500278
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a2a3d946f859ac106a7ede9530e200364d0850a98d8c958672d441c57ab89bd
|
3 |
size 499500278
|
outputs/checkpoints/{checkpoint-140001 → checkpoint-185000}/training_args.joblib
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79196d5f797a7527e60287e48f716fd4626c5d57186661d6a214a2027998c86d
|
3 |
+
size 1873
|
outputs/checkpoints/checkpoint-185000/training_state.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"step": 185001}
|
outputs/checkpoints/{checkpoint-180001 → checkpoint-186000}/config.json
RENAMED
File without changes
|
outputs/checkpoints/checkpoint-186000/data_collator.joblib
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0321b1a9629e1be122045cd72470365a63c8496fec109fdeec34827f01ffbb9e
|
3 |
+
size 1471424
|
outputs/checkpoints/checkpoint-186000/flax_model.msgpack
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3362fadd5306539e1775600df59349acf0fd260751129abaa45b997091d089ce
|
3 |
+
size 249750019
|
outputs/checkpoints/checkpoint-186000/optimizer_state.msgpack
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e08084e7879de2059bc4fd38ff876b0bd1e987a646397956dd4bef19bb2dd1bf
|
3 |
+
size 499500278
|
outputs/checkpoints/checkpoint-186000/training_args.joblib
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79196d5f797a7527e60287e48f716fd4626c5d57186661d6a214a2027998c86d
|
3 |
+
size 1873
|
outputs/checkpoints/checkpoint-186000/training_state.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"step": 186001}
|
outputs/data_collator.joblib
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0321b1a9629e1be122045cd72470365a63c8496fec109fdeec34827f01ffbb9e
|
3 |
+
size 1471424
|
outputs/events.out.tfevents.1627122688.tablespoon.2185269.3.v2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96e9ae0a574bba9629f3ffc65a3b0714cef7fb3ee796573b1d132a3c80f25fc3
|
3 |
+
size 40
|
outputs/events.out.tfevents.1627122817.tablespoon.2191003.3.v2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8351632f70e7465eea0642599fff77709273a7fc9a50b607543f49754c6d694e
|
3 |
+
size 149322
|
outputs/events.out.tfevents.1627125745.tablespoon.2266135.3.v2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca4fd9200f1731b7b75feb068806b3d69d179f8e5d467282752c6a8efac760c0
|
3 |
+
size 149322
|
outputs/events.out.tfevents.1627128247.tablespoon.2330108.3.v2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8afd683918d2323382c5b27888561ecb6d879ebe3f6360a1c6ac02435d2f2122
|
3 |
+
size 746450
|
outputs/flax_model.msgpack
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 249750019
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3362fadd5306539e1775600df59349acf0fd260751129abaa45b997091d089ce
|
3 |
size 249750019
|
outputs/optimizer_state.msgpack
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 499500278
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e08084e7879de2059bc4fd38ff876b0bd1e987a646397956dd4bef19bb2dd1bf
|
3 |
size 499500278
|
outputs/training_args.joblib
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79196d5f797a7527e60287e48f716fd4626c5d57186661d6a214a2027998c86d
|
3 |
+
size 1873
|
outputs/training_state.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"step":
|
|
|
1 |
+
{"step": 186001}
|