Imcf1Y3FSatM commited on
Commit
7209ebe
1 Parent(s): e3993e6

Upload tokenizer

Browse files
Files changed (2) hide show
  1. tokenizer.json +184 -184
  2. tokenizer_config.json +1 -4
tokenizer.json CHANGED
@@ -2237,7 +2237,7 @@
2237
  ],
2238
  [
2239
  "ce",
2240
- -7.480814933776856
2241
  ],
2242
  [
2243
  "▁board",
@@ -2273,7 +2273,7 @@
2273
  ],
2274
  [
2275
  "ive",
2276
- -7.513410091400147
2277
  ],
2278
  [
2279
  "▁where",
@@ -2365,7 +2365,7 @@
2365
  ],
2366
  [
2367
  "▁myself",
2368
- -7.600685596466064
2369
  ],
2370
  [
2371
  "▁yen",
@@ -2433,7 +2433,7 @@
2433
  ],
2434
  [
2435
  "▁hav",
2436
- -7.641457080841064
2437
  ],
2438
  [
2439
  "▁As",
@@ -2549,7 +2549,7 @@
2549
  ],
2550
  [
2551
  "That",
2552
- -7.752362728118896
2553
  ],
2554
  [
2555
  "M",
@@ -2589,7 +2589,7 @@
2589
  ],
2590
  [
2591
  "T",
2592
- -7.786305427551269
2593
  ],
2594
  [
2595
  "▁read",
@@ -2693,11 +2693,11 @@
2693
  ],
2694
  [
2695
  "ng",
2696
- -7.874188899993896
2697
  ],
2698
  [
2699
  "▁mind",
2700
- -7.876381397247315
2701
  ],
2702
  [
2703
  "▁cannot",
@@ -2713,7 +2713,7 @@
2713
  ],
2714
  [
2715
  "▁hard",
2716
- -7.87647533416748
2717
  ],
2718
  [
2719
  "▁nothing",
@@ -2789,7 +2789,7 @@
2789
  ],
2790
  [
2791
  "The",
2792
- -7.928972721099853
2793
  ],
2794
  [
2795
  "▁sp",
@@ -2857,7 +2857,7 @@
2857
  ],
2858
  [
2859
  "▁put",
2860
- -7.977669239044189
2861
  ],
2862
  [
2863
  "▁line",
@@ -5041,7 +5041,7 @@
5041
  ],
5042
  [
5043
  "ian",
5044
- -9.022007942199709
5045
  ],
5046
  [
5047
  "rew",
@@ -5049,11 +5049,11 @@
5049
  ],
5050
  [
5051
  "rate",
5052
- -9.027299880981444
5053
  ],
5054
  [
5055
  "▁fai",
5056
- -9.028965950012209
5057
  ],
5058
  [
5059
  "▁Hi",
@@ -5065,19 +5065,19 @@
5065
  ],
5066
  [
5067
  "▁sw",
5068
- -9.040364265441896
5069
  ],
5070
  [
5071
  "ight",
5072
- -9.05210781097412
5073
  ],
5074
  [
5075
  "▁pass",
5076
- -9.059226036071776
5077
  ],
5078
  [
5079
  "▁accept",
5080
- -9.06157684326172
5081
  ],
5082
  [
5083
  "▁expect",
@@ -5085,7 +5085,7 @@
5085
  ],
5086
  [
5087
  "▁Be",
5088
- -9.062178611755373
5089
  ],
5090
  [
5091
  "▁meet",
@@ -5185,11 +5185,11 @@
5185
  ],
5186
  [
5187
  "▁sword",
5188
- -9.074662208557127
5189
  ],
5190
  [
5191
  "▁world",
5192
- -9.074662208557127
5193
  ],
5194
  [
5195
  "▁style",
@@ -5197,7 +5197,7 @@
5197
  ],
5198
  [
5199
  "▁death",
5200
- -9.074671745300291
5201
  ],
5202
  [
5203
  "▁push",
@@ -5205,7 +5205,7 @@
5205
  ],
5206
  [
5207
  "▁early",
5208
- -9.07468605041504
5209
  ],
5210
  [
5211
  "▁history",
@@ -5233,11 +5233,11 @@
5233
  ],
5234
  [
5235
  "stead",
5236
- -9.074742317199709
5237
  ],
5238
  [
5239
  "▁added",
5240
- -9.074756622314451
5241
  ],
5242
  [
5243
  "▁stuff",
@@ -5249,7 +5249,7 @@
5249
  ],
5250
  [
5251
  "▁temple",
5252
- -9.074835777282717
5253
  ],
5254
  [
5255
  "▁mention",
@@ -5273,11 +5273,11 @@
5273
  ],
5274
  [
5275
  "▁post",
5276
- -9.075267791748049
5277
  ],
5278
  [
5279
  "▁catch",
5280
- -9.075643539428713
5281
  ],
5282
  [
5283
  "▁leg",
@@ -5297,11 +5297,11 @@
5297
  ],
5298
  [
5299
  "▁arm",
5300
- -9.08041286468506
5301
  ],
5302
  [
5303
  "▁plan",
5304
- -9.081151008605955
5305
  ],
5306
  [
5307
  "▁pale",
@@ -5313,7 +5313,7 @@
5313
  ],
5314
  [
5315
  "▁efforts",
5316
- -9.086438179016112
5317
  ],
5318
  [
5319
  "▁accepted",
@@ -5337,11 +5337,11 @@
5337
  ],
5338
  [
5339
  "▁forty",
5340
- -9.09645652770996
5341
  ],
5342
  [
5343
  "▁walking",
5344
- -9.09681797027588
5345
  ],
5346
  [
5347
  "▁opened",
@@ -5349,7 +5349,7 @@
5349
  ],
5350
  [
5351
  "Don",
5352
- -9.100522994995115
5353
  ],
5354
  [
5355
  "position",
@@ -5361,11 +5361,11 @@
5361
  ],
5362
  [
5363
  "pri",
5364
- -9.103438377380373
5365
  ],
5366
  [
5367
  "▁forth",
5368
- -9.11118507385254
5369
  ],
5370
  [
5371
  "▁notice",
@@ -5373,7 +5373,7 @@
5373
  ],
5374
  [
5375
  "▁play",
5376
- -9.123631477355955
5377
  ],
5378
  [
5379
  "raw",
@@ -5381,7 +5381,7 @@
5381
  ],
5382
  [
5383
  "▁year",
5384
- -9.166281700134276
5385
  ],
5386
  [
5387
  "▁step",
@@ -5389,7 +5389,7 @@
5389
  ],
5390
  [
5391
  "▁fin",
5392
- -9.175487518310549
5393
  ],
5394
  [
5395
  "▁direct",
@@ -5397,19 +5397,19 @@
5397
  ],
5398
  [
5399
  "▁insist",
5400
- -9.185338020324709
5401
  ],
5402
  [
5403
  "▁enjoy",
5404
- -9.185760498046877
5405
  ],
5406
  [
5407
  "▁fashion",
5408
- -9.185760498046877
5409
  ],
5410
  [
5411
  "▁supper",
5412
- -9.185760498046877
5413
  ],
5414
  [
5415
  "Besides",
@@ -5493,11 +5493,11 @@
5493
  ],
5494
  [
5495
  "▁trick",
5496
- -9.185766220092772
5497
  ],
5498
  [
5499
  "▁sharp",
5500
- -9.18577480316162
5501
  ],
5502
  [
5503
  "▁married",
@@ -5505,7 +5505,7 @@
5505
  ],
5506
  [
5507
  "▁print",
5508
- -9.185812950134276
5509
  ],
5510
  [
5511
  "▁weak",
@@ -5513,7 +5513,7 @@
5513
  ],
5514
  [
5515
  "▁wife",
5516
- -9.185831069946287
5517
  ],
5518
  [
5519
  "▁translation",
@@ -5529,7 +5529,7 @@
5529
  ],
5530
  [
5531
  "▁below",
5532
- -9.185887336730955
5533
  ],
5534
  [
5535
  "▁smile",
@@ -5549,11 +5549,11 @@
5549
  ],
5550
  [
5551
  "▁noise",
5552
- -9.186004638671877
5553
  ],
5554
  [
5555
  "▁intention",
5556
- -9.186009407043455
5557
  ],
5558
  [
5559
  "▁coward",
@@ -5573,7 +5573,7 @@
5573
  ],
5574
  [
5575
  "▁loca",
5576
- -9.186867713928224
5577
  ],
5578
  [
5579
  "▁Ch",
@@ -5581,7 +5581,7 @@
5581
  ],
5582
  [
5583
  "▁perform",
5584
- -9.188361167907717
5585
  ],
5586
  [
5587
  "ike",
@@ -5597,7 +5597,7 @@
5597
  ],
5598
  [
5599
  "▁shot",
5600
- -9.188958168029783
5601
  ],
5602
  [
5603
  "▁display",
@@ -5605,7 +5605,7 @@
5605
  ],
5606
  [
5607
  "machi",
5608
- -9.190868377685549
5609
  ],
5610
  [
5611
  "▁mental",
@@ -5613,7 +5613,7 @@
5613
  ],
5614
  [
5615
  "▁sur",
5616
- -9.19241428375244
5617
  ],
5618
  [
5619
  "▁comply",
@@ -5629,11 +5629,11 @@
5629
  ],
5630
  [
5631
  "▁distribute",
5632
- -9.193628311157228
5633
  ],
5634
  [
5635
  "▁sooner",
5636
- -9.193878173828123
5637
  ],
5638
  [
5639
  "▁provide",
@@ -5645,7 +5645,7 @@
5645
  ],
5646
  [
5647
  "▁bor",
5648
- -9.203582763671877
5649
  ],
5650
  [
5651
  "▁standing",
@@ -5653,11 +5653,11 @@
5653
  ],
5654
  [
5655
  "▁drawing",
5656
- -9.20570945739746
5657
  ],
5658
  [
5659
  "▁fast",
5660
- -9.211029052734377
5661
  ],
5662
  [
5663
  "▁cur",
@@ -5665,7 +5665,7 @@
5665
  ],
5666
  [
5667
  "gen",
5668
- -9.213075637817385
5669
  ],
5670
  [
5671
  "etc",
@@ -5689,15 +5689,15 @@
5689
  ],
5690
  [
5691
  "Pro",
5692
- -9.220240592956545
5693
  ],
5694
  [
5695
  "▁nose",
5696
- -9.221141815185549
5697
  ],
5698
  [
5699
  "▁Re",
5700
- -9.246124267578123
5701
  ],
5702
  [
5703
  "light",
@@ -5705,7 +5705,7 @@
5705
  ],
5706
  [
5707
  "▁da",
5708
- -9.274735450744627
5709
  ],
5710
  [
5711
  "till",
@@ -5729,7 +5729,7 @@
5729
  ],
5730
  [
5731
  "▁TH",
5732
- -9.305097579956056
5733
  ],
5734
  [
5735
  "becom",
@@ -5737,27 +5737,27 @@
5737
  ],
5738
  [
5739
  "▁transfer",
5740
- -9.310699462890623
5741
  ],
5742
  [
5743
  "▁thir",
5744
- -9.310746192932127
5745
  ],
5746
  [
5747
  "sque",
5748
- -9.310760498046877
5749
  ],
5750
  [
5751
  "▁appeal",
5752
- -9.310760498046877
5753
  ],
5754
  [
5755
  "▁devil",
5756
- -9.310760498046877
5757
  ],
5758
  [
5759
  "▁judg",
5760
- -9.310760498046877
5761
  ],
5762
  [
5763
  "▁character",
@@ -5849,15 +5849,15 @@
5849
  ],
5850
  [
5851
  "▁Russ",
5852
- -9.310765266418455
5853
  ],
5854
  [
5855
  "▁plain",
5856
- -9.310769081115724
5857
  ],
5858
  [
5859
  "▁glad",
5860
- -9.31077003479004
5861
  ],
5862
  [
5863
  "▁Section",
@@ -5869,7 +5869,7 @@
5869
  ],
5870
  [
5871
  "▁deserv",
5872
- -9.310778617858888
5873
  ],
5874
  [
5875
  "▁credit",
@@ -5941,7 +5941,7 @@
5941
  ],
5942
  [
5943
  "▁refus",
5944
- -9.311113357543944
5945
  ],
5946
  [
5947
  "▁drum",
@@ -5957,7 +5957,7 @@
5957
  ],
5958
  [
5959
  "ordina",
5960
- -9.311413764953612
5961
  ],
5962
  [
5963
  "ware",
@@ -5977,7 +5977,7 @@
5977
  ],
5978
  [
5979
  "running",
5980
- -9.31202793121338
5981
  ],
5982
  [
5983
  "▁mark",
@@ -6001,7 +6001,7 @@
6001
  ],
6002
  [
6003
  "▁Ko",
6004
- -9.31403350830078
6005
  ],
6006
  [
6007
  "▁anybody",
@@ -6033,7 +6033,7 @@
6033
  ],
6034
  [
6035
  "▁shoo",
6036
- -9.320408821105955
6037
  ],
6038
  [
6039
  "▁buy",
@@ -6041,7 +6041,7 @@
6041
  ],
6042
  [
6043
  "dition",
6044
- -9.32142734527588
6045
  ],
6046
  [
6047
  "▁laws",
@@ -6113,7 +6113,7 @@
6113
  ],
6114
  [
6115
  "IT",
6116
- -9.397068977355955
6117
  ],
6118
  [
6119
  "ward",
@@ -6125,7 +6125,7 @@
6125
  ],
6126
  [
6127
  "▁simpl",
6128
- -9.40804958343506
6129
  ],
6130
  [
6131
  "uff",
@@ -6153,7 +6153,7 @@
6153
  ],
6154
  [
6155
  "▁late",
6156
- -9.451498031616213
6157
  ],
6158
  [
6159
  "▁gentle",
@@ -6249,19 +6249,19 @@
6249
  ],
6250
  [
6251
  "▁above",
6252
- -9.453619956970217
6253
  ],
6254
  [
6255
  "▁glance",
6256
- -9.453619956970217
6257
  ],
6258
  [
6259
  "▁shadow",
6260
- -9.453619956970217
6261
  ],
6262
  [
6263
  "▁unusual",
6264
- -9.453619956970217
6265
  ],
6266
  [
6267
  "▁gentlemen",
@@ -6297,7 +6297,7 @@
6297
  ],
6298
  [
6299
  "▁repeat",
6300
- -9.453625679016112
6301
  ],
6302
  [
6303
  "▁decent",
@@ -6325,7 +6325,7 @@
6325
  ],
6326
  [
6327
  "▁slip",
6328
- -9.453635215759276
6329
  ],
6330
  [
6331
  "doubt",
@@ -6337,7 +6337,7 @@
6337
  ],
6338
  [
6339
  "▁instructor",
6340
- -9.453639030456545
6341
  ],
6342
  [
6343
  "▁education",
@@ -6357,11 +6357,11 @@
6357
  ],
6358
  [
6359
  "▁demand",
6360
- -9.453653335571287
6361
  ],
6362
  [
6363
  "▁court",
6364
- -9.453690528869627
6365
  ],
6366
  [
6367
  "▁stuck",
@@ -6389,15 +6389,15 @@
6389
  ],
6390
  [
6391
  "▁Con",
6392
- -9.454066276550291
6393
  ],
6394
  [
6395
  "▁boatman",
6396
- -9.454066276550291
6397
  ],
6398
  [
6399
  "▁type",
6400
- -9.45411777496338
6401
  ],
6402
  [
6403
  "promise",
@@ -6413,11 +6413,11 @@
6413
  ],
6414
  [
6415
  "▁Up",
6416
- -9.454395294189451
6417
  ],
6418
  [
6419
  "▁yard",
6420
- -9.454404830932615
6421
  ],
6422
  [
6423
  "▁worth",
@@ -6437,7 +6437,7 @@
6437
  ],
6438
  [
6439
  "SE",
6440
- -9.455034255981444
6441
  ],
6442
  [
6443
  "▁peep",
@@ -6449,7 +6449,7 @@
6449
  ],
6450
  [
6451
  "▁subject",
6452
- -9.455371856689451
6453
  ],
6454
  [
6455
  "▁careful",
@@ -6457,7 +6457,7 @@
6457
  ],
6458
  [
6459
  "▁nonsense",
6460
- -9.455403327941896
6461
  ],
6462
  [
6463
  "▁pine",
@@ -6469,15 +6469,15 @@
6469
  ],
6470
  [
6471
  "▁ran",
6472
- -9.456183433532717
6473
  ],
6474
  [
6475
  "▁sometime",
6476
- -9.456221580505373
6477
  ],
6478
  [
6479
  "▁compar",
6480
- -9.456564903259276
6481
  ],
6482
  [
6483
  "▁Once",
@@ -6497,7 +6497,7 @@
6497
  ],
6498
  [
6499
  "▁table",
6500
- -9.461024284362791
6501
  ],
6502
  [
6503
  "▁prove",
@@ -6525,11 +6525,11 @@
6525
  ],
6526
  [
6527
  "paper",
6528
- -9.531177520751951
6529
  ],
6530
  [
6531
  "upon",
6532
- -9.53188133239746
6533
  ],
6534
  [
6535
  "some",
@@ -6537,7 +6537,7 @@
6537
  ],
6538
  [
6539
  "▁favor",
6540
- -9.538238525390623
6541
  ],
6542
  [
6543
  "named",
@@ -6545,7 +6545,7 @@
6545
  ],
6546
  [
6547
  "ode",
6548
- -9.582578659057615
6549
  ],
6550
  [
6551
  "cked",
@@ -6561,7 +6561,7 @@
6561
  ],
6562
  [
6563
  "▁stat",
6564
- -9.59182834625244
6565
  ],
6566
  [
6567
  "▁effort",
@@ -6569,7 +6569,7 @@
6569
  ],
6570
  [
6571
  "▁enter",
6572
- -9.609453201293944
6573
  ],
6574
  [
6575
  "▁surprise",
@@ -6581,11 +6581,11 @@
6581
  ],
6582
  [
6583
  "▁rikisha",
6584
- -9.61831760406494
6585
  ],
6586
  [
6587
  "▁whi",
6588
- -9.61833953857422
6589
  ],
6590
  [
6591
  "ency",
@@ -6601,7 +6601,7 @@
6601
  ],
6602
  [
6603
  "▁prefer",
6604
- -9.62006378173828
6605
  ],
6606
  [
6607
  "▁fun",
@@ -6609,15 +6609,15 @@
6609
  ],
6610
  [
6611
  "▁require",
6612
- -9.620274543762209
6613
  ],
6614
  [
6615
  "▁imagin",
6616
- -9.620284080505373
6617
  ],
6618
  [
6619
  "▁vigor",
6620
- -9.620284080505373
6621
  ],
6622
  [
6623
  "Botchan",
@@ -6797,7 +6797,7 @@
6797
  ],
6798
  [
6799
  "▁rattl",
6800
- -9.620288848876951
6801
  ],
6802
  [
6803
  "▁attention",
@@ -6805,7 +6805,7 @@
6805
  ],
6806
  [
6807
  "▁New",
6808
- -9.62029266357422
6809
  ],
6810
  [
6811
  "claim",
@@ -6837,11 +6837,11 @@
6837
  ],
6838
  [
6839
  "▁orange",
6840
- -9.620302200317385
6841
  ],
6842
  [
6843
  "▁dull",
6844
- -9.620311737060549
6845
  ],
6846
  [
6847
  "▁river",
@@ -6849,7 +6849,7 @@
6849
  ],
6850
  [
6851
  "▁fuss",
6852
- -9.620326042175291
6853
  ],
6854
  [
6855
  "▁cap",
@@ -6885,7 +6885,7 @@
6885
  ],
6886
  [
6887
  "nosu",
6888
- -9.62045192718506
6889
  ],
6890
  [
6891
  "▁flat",
@@ -6925,7 +6925,7 @@
6925
  ],
6926
  [
6927
  "▁sauc",
6928
- -9.620758056640623
6929
  ],
6930
  [
6931
  "▁rice",
@@ -6949,11 +6949,11 @@
6949
  ],
6950
  [
6951
  "▁treatment",
6952
- -9.621350288391112
6953
  ],
6954
  [
6955
  "▁favorit",
6956
- -9.621603965759276
6957
  ],
6958
  [
6959
  "▁glo",
@@ -6977,11 +6977,11 @@
6977
  ],
6978
  [
6979
  "▁file",
6980
- -9.623125076293944
6981
  ],
6982
  [
6983
  "▁reasonable",
6984
- -9.623706817626951
6985
  ],
6986
  [
6987
  "▁anyone",
@@ -7009,11 +7009,11 @@
7009
  ],
7010
  [
7011
  "▁hall",
7012
- -9.627115249633787
7013
  ],
7014
  [
7015
  "▁ice",
7016
- -9.63064670562744
7017
  ],
7018
  [
7019
  "ctual",
@@ -7041,7 +7041,7 @@
7041
  ],
7042
  [
7043
  "site",
7044
- -9.645623207092283
7045
  ],
7046
  [
7047
  "you",
@@ -7061,7 +7061,7 @@
7061
  ],
7062
  [
7063
  "duced",
7064
- -9.689046859741213
7065
  ],
7066
  [
7067
  "▁format",
@@ -7073,7 +7073,7 @@
7073
  ],
7074
  [
7075
  "▁dar",
7076
- -9.69410800933838
7077
  ],
7078
  [
7079
  "pic",
@@ -7101,7 +7101,7 @@
7101
  ],
7102
  [
7103
  "mats",
7104
- -9.743086814880373
7105
  ],
7106
  [
7107
  "knee",
@@ -7113,7 +7113,7 @@
7113
  ],
7114
  [
7115
  "goo",
7116
- -9.794201850891112
7117
  ],
7118
  [
7119
  "▁necessar",
@@ -7125,7 +7125,7 @@
7125
  ],
7126
  [
7127
  "▁law",
7128
- -9.801798820495604
7129
  ],
7130
  [
7131
  "▁decid",
@@ -7133,7 +7133,7 @@
7133
  ],
7134
  [
7135
  "trict",
7136
- -9.808300018310549
7137
  ],
7138
  [
7139
  "▁settl",
@@ -7153,11 +7153,11 @@
7153
  ],
7154
  [
7155
  "ould",
7156
- -9.819173812866213
7157
  ],
7158
  [
7159
  "pping",
7160
- -9.81940460205078
7161
  ],
7162
  [
7163
  "uck",
@@ -7165,7 +7165,7 @@
7165
  ],
7166
  [
7167
  "awn",
7168
- -9.819780349731444
7169
  ],
7170
  [
7171
  "▁compli",
@@ -7177,7 +7177,7 @@
7177
  ],
7178
  [
7179
  "eneral",
7180
- -9.820164680480955
7181
  ],
7182
  [
7183
  "mitted",
@@ -7385,51 +7385,51 @@
7385
  ],
7386
  [
7387
  "approv",
7388
- -9.820286750793455
7389
  ],
7390
  [
7391
  "nounc",
7392
- -9.820286750793455
7393
  ],
7394
  [
7395
  "▁everywhere",
7396
- -9.820286750793455
7397
  ],
7398
  [
7399
  "▁snap",
7400
- -9.820286750793455
7401
  ],
7402
  [
7403
  "Suppos",
7404
- -9.820287704467772
7405
  ],
7406
  [
7407
  "▁begun",
7408
- -9.820287704467772
7409
  ],
7410
  [
7411
  "▁fix",
7412
- -9.820287704467772
7413
  ],
7414
  [
7415
  "▁respectfully",
7416
- -9.820287704467772
7417
  ],
7418
  [
7419
  "▁result",
7420
- -9.820287704467772
7421
  ],
7422
  [
7423
  "▁yellow",
7424
- -9.820287704467772
7425
  ],
7426
  [
7427
  "umbling",
7428
- -9.820290565490724
7429
  ],
7430
  [
7431
  "▁official",
7432
- -9.820290565490724
7433
  ],
7434
  [
7435
  "▁group",
@@ -7449,15 +7449,15 @@
7449
  ],
7450
  [
7451
  "▁firm",
7452
- -9.820300102233888
7453
  ],
7454
  [
7455
  "▁gramma",
7456
- -9.820300102233888
7457
  ],
7458
  [
7459
  "▁panel",
7460
- -9.820300102233888
7461
  ],
7462
  [
7463
  "▁itself",
@@ -7501,7 +7501,7 @@
7501
  ],
7502
  [
7503
  "▁slap",
7504
- -9.82034397125244
7505
  ],
7506
  [
7507
  "▁noisy",
@@ -7517,11 +7517,11 @@
7517
  ],
7518
  [
7519
  "chief",
7520
- -9.820390701293944
7521
  ],
7522
  [
7523
  "▁shouted",
7524
- -9.820408821105955
7525
  ],
7526
  [
7527
  "▁ball",
@@ -7541,7 +7541,7 @@
7541
  ],
7542
  [
7543
  "▁edge",
7544
- -9.820578575134276
7545
  ],
7546
  [
7547
  "▁shak",
@@ -7549,7 +7549,7 @@
7549
  ],
7550
  [
7551
  "▁pride",
7552
- -9.820841789245604
7553
  ],
7554
  [
7555
  "▁expenses",
@@ -7561,11 +7561,11 @@
7561
  ],
7562
  [
7563
  "▁Tak",
7564
- -9.820967674255373
7565
  ],
7566
  [
7567
  "▁broke",
7568
- -9.821123123168944
7569
  ],
7570
  [
7571
  "struck",
@@ -7609,11 +7609,11 @@
7609
  ],
7610
  [
7611
  "▁tight",
7612
- -9.821817398071287
7613
  ],
7614
  [
7615
  "▁Every",
7616
- -9.821944236755373
7617
  ],
7618
  [
7619
  "reafter",
@@ -7621,7 +7621,7 @@
7621
  ],
7622
  [
7623
  "▁brain",
7624
- -9.822479248046877
7625
  ],
7626
  [
7627
  "▁manage",
@@ -7633,7 +7633,7 @@
7633
  ],
7634
  [
7635
  "grace",
7636
- -9.829718589782717
7637
  ],
7638
  [
7639
  "formed",
@@ -7669,7 +7669,7 @@
7669
  ],
7670
  [
7671
  "empt",
7672
- -9.88385772705078
7673
  ],
7674
  [
7675
  "dog",
@@ -7677,7 +7677,7 @@
7677
  ],
7678
  [
7679
  "Here",
7680
- -9.904093742370604
7681
  ],
7682
  [
7683
  "▁prais",
@@ -7697,7 +7697,7 @@
7697
  ],
7698
  [
7699
  "face",
7700
- -9.97946071624756
7701
  ],
7702
  [
7703
  "▁punish",
@@ -7733,7 +7733,7 @@
7733
  ],
7734
  [
7735
  "aka",
7736
- -10.034581184387209
7737
  ],
7738
  [
7739
  "pecul",
@@ -7745,7 +7745,7 @@
7745
  ],
7746
  [
7747
  "▁advis",
7748
- -10.064568519592283
7749
  ],
7750
  [
7751
  "educat",
@@ -7757,7 +7757,7 @@
7757
  ],
7758
  [
7759
  "▁respon",
7760
- -10.070267677307127
7761
  ],
7762
  [
7763
  "▁express",
@@ -8117,35 +8117,35 @@
8117
  ],
8118
  [
8119
  "version",
8120
- -10.070286750793455
8121
  ],
8122
  [
8123
  "▁engage",
8124
- -10.070286750793455
8125
  ],
8126
  [
8127
  "▁hobby",
8128
- -10.070286750793455
8129
  ],
8130
  [
8131
  "▁length",
8132
- -10.070286750793455
8133
  ],
8134
  [
8135
  "▁logic",
8136
- -10.070286750793455
8137
  ],
8138
  [
8139
  "▁midnight",
8140
- -10.070286750793455
8141
  ],
8142
  [
8143
  "▁polish",
8144
- -10.070286750793455
8145
  ],
8146
  [
8147
  "(",
8148
- -10.312033653259276
8149
  ],
8150
  [
8151
  "*",
@@ -8157,7 +8157,7 @@
8157
  ],
8158
  [
8159
  "q",
8160
- -11.903417587280272
8161
  ],
8162
  [
8163
  "j",
@@ -8165,7 +8165,7 @@
8165
  ],
8166
  [
8167
  "v",
8168
- -11.90361785888672
8169
  ]
8170
  ],
8171
  "byte_fallback": false
 
2237
  ],
2238
  [
2239
  "ce",
2240
+ -7.4808149337768555
2241
  ],
2242
  [
2243
  "▁board",
 
2273
  ],
2274
  [
2275
  "ive",
2276
+ -7.5134100914001465
2277
  ],
2278
  [
2279
  "▁where",
 
2365
  ],
2366
  [
2367
  "▁myself",
2368
+ -7.6006855964660645
2369
  ],
2370
  [
2371
  "▁yen",
 
2433
  ],
2434
  [
2435
  "▁hav",
2436
+ -7.6414570808410645
2437
  ],
2438
  [
2439
  "▁As",
 
2549
  ],
2550
  [
2551
  "That",
2552
+ -7.7523627281188965
2553
  ],
2554
  [
2555
  "M",
 
2589
  ],
2590
  [
2591
  "T",
2592
+ -7.7863054275512695
2593
  ],
2594
  [
2595
  "▁read",
 
2693
  ],
2694
  [
2695
  "ng",
2696
+ -7.8741888999938965
2697
  ],
2698
  [
2699
  "▁mind",
2700
+ -7.8763813972473145
2701
  ],
2702
  [
2703
  "▁cannot",
 
2713
  ],
2714
  [
2715
  "▁hard",
2716
+ -7.8764753341674805
2717
  ],
2718
  [
2719
  "▁nothing",
 
2789
  ],
2790
  [
2791
  "The",
2792
+ -7.9289727210998535
2793
  ],
2794
  [
2795
  "▁sp",
 
2857
  ],
2858
  [
2859
  "▁put",
2860
+ -7.9776692390441895
2861
  ],
2862
  [
2863
  "▁line",
 
5041
  ],
5042
  [
5043
  "ian",
5044
+ -9.022007942199707
5045
  ],
5046
  [
5047
  "rew",
 
5049
  ],
5050
  [
5051
  "rate",
5052
+ -9.027299880981445
5053
  ],
5054
  [
5055
  "▁fai",
5056
+ -9.028965950012207
5057
  ],
5058
  [
5059
  "▁Hi",
 
5065
  ],
5066
  [
5067
  "▁sw",
5068
+ -9.040364265441895
5069
  ],
5070
  [
5071
  "ight",
5072
+ -9.052107810974121
5073
  ],
5074
  [
5075
  "▁pass",
5076
+ -9.059226036071777
5077
  ],
5078
  [
5079
  "▁accept",
5080
+ -9.061576843261719
5081
  ],
5082
  [
5083
  "▁expect",
 
5085
  ],
5086
  [
5087
  "▁Be",
5088
+ -9.062178611755371
5089
  ],
5090
  [
5091
  "▁meet",
 
5185
  ],
5186
  [
5187
  "▁sword",
5188
+ -9.074662208557129
5189
  ],
5190
  [
5191
  "▁world",
5192
+ -9.074662208557129
5193
  ],
5194
  [
5195
  "▁style",
 
5197
  ],
5198
  [
5199
  "▁death",
5200
+ -9.074671745300293
5201
  ],
5202
  [
5203
  "▁push",
 
5205
  ],
5206
  [
5207
  "▁early",
5208
+ -9.074686050415039
5209
  ],
5210
  [
5211
  "▁history",
 
5233
  ],
5234
  [
5235
  "stead",
5236
+ -9.074742317199707
5237
  ],
5238
  [
5239
  "▁added",
5240
+ -9.074756622314453
5241
  ],
5242
  [
5243
  "▁stuff",
 
5249
  ],
5250
  [
5251
  "▁temple",
5252
+ -9.074835777282715
5253
  ],
5254
  [
5255
  "▁mention",
 
5273
  ],
5274
  [
5275
  "▁post",
5276
+ -9.075267791748047
5277
  ],
5278
  [
5279
  "▁catch",
5280
+ -9.075643539428711
5281
  ],
5282
  [
5283
  "▁leg",
 
5297
  ],
5298
  [
5299
  "▁arm",
5300
+ -9.080412864685059
5301
  ],
5302
  [
5303
  "▁plan",
5304
+ -9.081151008605957
5305
  ],
5306
  [
5307
  "▁pale",
 
5313
  ],
5314
  [
5315
  "▁efforts",
5316
+ -9.086438179016113
5317
  ],
5318
  [
5319
  "▁accepted",
 
5337
  ],
5338
  [
5339
  "▁forty",
5340
+ -9.096456527709961
5341
  ],
5342
  [
5343
  "▁walking",
5344
+ -9.096817970275879
5345
  ],
5346
  [
5347
  "▁opened",
 
5349
  ],
5350
  [
5351
  "Don",
5352
+ -9.100522994995117
5353
  ],
5354
  [
5355
  "position",
 
5361
  ],
5362
  [
5363
  "pri",
5364
+ -9.103438377380371
5365
  ],
5366
  [
5367
  "▁forth",
5368
+ -9.111185073852539
5369
  ],
5370
  [
5371
  "▁notice",
 
5373
  ],
5374
  [
5375
  "▁play",
5376
+ -9.123631477355957
5377
  ],
5378
  [
5379
  "raw",
 
5381
  ],
5382
  [
5383
  "▁year",
5384
+ -9.166281700134277
5385
  ],
5386
  [
5387
  "▁step",
 
5389
  ],
5390
  [
5391
  "▁fin",
5392
+ -9.175487518310547
5393
  ],
5394
  [
5395
  "▁direct",
 
5397
  ],
5398
  [
5399
  "▁insist",
5400
+ -9.185338020324707
5401
  ],
5402
  [
5403
  "▁enjoy",
5404
+ -9.185760498046875
5405
  ],
5406
  [
5407
  "▁fashion",
5408
+ -9.185760498046875
5409
  ],
5410
  [
5411
  "▁supper",
5412
+ -9.185760498046875
5413
  ],
5414
  [
5415
  "Besides",
 
5493
  ],
5494
  [
5495
  "▁trick",
5496
+ -9.185766220092773
5497
  ],
5498
  [
5499
  "▁sharp",
5500
+ -9.185774803161621
5501
  ],
5502
  [
5503
  "▁married",
 
5505
  ],
5506
  [
5507
  "▁print",
5508
+ -9.185812950134277
5509
  ],
5510
  [
5511
  "▁weak",
 
5513
  ],
5514
  [
5515
  "▁wife",
5516
+ -9.185831069946289
5517
  ],
5518
  [
5519
  "▁translation",
 
5529
  ],
5530
  [
5531
  "▁below",
5532
+ -9.185887336730957
5533
  ],
5534
  [
5535
  "▁smile",
 
5549
  ],
5550
  [
5551
  "▁noise",
5552
+ -9.186004638671875
5553
  ],
5554
  [
5555
  "▁intention",
5556
+ -9.186009407043457
5557
  ],
5558
  [
5559
  "▁coward",
 
5573
  ],
5574
  [
5575
  "▁loca",
5576
+ -9.186867713928223
5577
  ],
5578
  [
5579
  "▁Ch",
 
5581
  ],
5582
  [
5583
  "▁perform",
5584
+ -9.188361167907715
5585
  ],
5586
  [
5587
  "ike",
 
5597
  ],
5598
  [
5599
  "▁shot",
5600
+ -9.188958168029785
5601
  ],
5602
  [
5603
  "▁display",
 
5605
  ],
5606
  [
5607
  "machi",
5608
+ -9.190868377685547
5609
  ],
5610
  [
5611
  "▁mental",
 
5613
  ],
5614
  [
5615
  "▁sur",
5616
+ -9.192414283752441
5617
  ],
5618
  [
5619
  "▁comply",
 
5629
  ],
5630
  [
5631
  "▁distribute",
5632
+ -9.193628311157227
5633
  ],
5634
  [
5635
  "▁sooner",
5636
+ -9.193878173828125
5637
  ],
5638
  [
5639
  "▁provide",
 
5645
  ],
5646
  [
5647
  "▁bor",
5648
+ -9.203582763671875
5649
  ],
5650
  [
5651
  "▁standing",
 
5653
  ],
5654
  [
5655
  "▁drawing",
5656
+ -9.205709457397461
5657
  ],
5658
  [
5659
  "▁fast",
5660
+ -9.211029052734375
5661
  ],
5662
  [
5663
  "▁cur",
 
5665
  ],
5666
  [
5667
  "gen",
5668
+ -9.213075637817383
5669
  ],
5670
  [
5671
  "etc",
 
5689
  ],
5690
  [
5691
  "Pro",
5692
+ -9.220240592956543
5693
  ],
5694
  [
5695
  "▁nose",
5696
+ -9.221141815185547
5697
  ],
5698
  [
5699
  "▁Re",
5700
+ -9.246124267578125
5701
  ],
5702
  [
5703
  "light",
 
5705
  ],
5706
  [
5707
  "▁da",
5708
+ -9.274735450744629
5709
  ],
5710
  [
5711
  "till",
 
5729
  ],
5730
  [
5731
  "▁TH",
5732
+ -9.305097579956055
5733
  ],
5734
  [
5735
  "becom",
 
5737
  ],
5738
  [
5739
  "▁transfer",
5740
+ -9.310699462890625
5741
  ],
5742
  [
5743
  "▁thir",
5744
+ -9.310746192932129
5745
  ],
5746
  [
5747
  "sque",
5748
+ -9.310760498046875
5749
  ],
5750
  [
5751
  "▁appeal",
5752
+ -9.310760498046875
5753
  ],
5754
  [
5755
  "▁devil",
5756
+ -9.310760498046875
5757
  ],
5758
  [
5759
  "▁judg",
5760
+ -9.310760498046875
5761
  ],
5762
  [
5763
  "▁character",
 
5849
  ],
5850
  [
5851
  "▁Russ",
5852
+ -9.310765266418457
5853
  ],
5854
  [
5855
  "▁plain",
5856
+ -9.310769081115723
5857
  ],
5858
  [
5859
  "▁glad",
5860
+ -9.310770034790039
5861
  ],
5862
  [
5863
  "▁Section",
 
5869
  ],
5870
  [
5871
  "▁deserv",
5872
+ -9.310778617858887
5873
  ],
5874
  [
5875
  "▁credit",
 
5941
  ],
5942
  [
5943
  "▁refus",
5944
+ -9.311113357543945
5945
  ],
5946
  [
5947
  "▁drum",
 
5957
  ],
5958
  [
5959
  "ordina",
5960
+ -9.311413764953613
5961
  ],
5962
  [
5963
  "ware",
 
5977
  ],
5978
  [
5979
  "running",
5980
+ -9.312027931213379
5981
  ],
5982
  [
5983
  "▁mark",
 
6001
  ],
6002
  [
6003
  "▁Ko",
6004
+ -9.314033508300781
6005
  ],
6006
  [
6007
  "▁anybody",
 
6033
  ],
6034
  [
6035
  "▁shoo",
6036
+ -9.320408821105957
6037
  ],
6038
  [
6039
  "▁buy",
 
6041
  ],
6042
  [
6043
  "dition",
6044
+ -9.321427345275879
6045
  ],
6046
  [
6047
  "▁laws",
 
6113
  ],
6114
  [
6115
  "IT",
6116
+ -9.397068977355957
6117
  ],
6118
  [
6119
  "ward",
 
6125
  ],
6126
  [
6127
  "▁simpl",
6128
+ -9.408049583435059
6129
  ],
6130
  [
6131
  "uff",
 
6153
  ],
6154
  [
6155
  "▁late",
6156
+ -9.451498031616211
6157
  ],
6158
  [
6159
  "▁gentle",
 
6249
  ],
6250
  [
6251
  "▁above",
6252
+ -9.453619956970215
6253
  ],
6254
  [
6255
  "▁glance",
6256
+ -9.453619956970215
6257
  ],
6258
  [
6259
  "▁shadow",
6260
+ -9.453619956970215
6261
  ],
6262
  [
6263
  "▁unusual",
6264
+ -9.453619956970215
6265
  ],
6266
  [
6267
  "▁gentlemen",
 
6297
  ],
6298
  [
6299
  "▁repeat",
6300
+ -9.453625679016113
6301
  ],
6302
  [
6303
  "▁decent",
 
6325
  ],
6326
  [
6327
  "▁slip",
6328
+ -9.453635215759277
6329
  ],
6330
  [
6331
  "doubt",
 
6337
  ],
6338
  [
6339
  "▁instructor",
6340
+ -9.453639030456543
6341
  ],
6342
  [
6343
  "▁education",
 
6357
  ],
6358
  [
6359
  "▁demand",
6360
+ -9.453653335571289
6361
  ],
6362
  [
6363
  "▁court",
6364
+ -9.453690528869629
6365
  ],
6366
  [
6367
  "▁stuck",
 
6389
  ],
6390
  [
6391
  "▁Con",
6392
+ -9.454066276550293
6393
  ],
6394
  [
6395
  "▁boatman",
6396
+ -9.454066276550293
6397
  ],
6398
  [
6399
  "▁type",
6400
+ -9.454117774963379
6401
  ],
6402
  [
6403
  "promise",
 
6413
  ],
6414
  [
6415
  "▁Up",
6416
+ -9.454395294189453
6417
  ],
6418
  [
6419
  "▁yard",
6420
+ -9.454404830932617
6421
  ],
6422
  [
6423
  "▁worth",
 
6437
  ],
6438
  [
6439
  "SE",
6440
+ -9.455034255981445
6441
  ],
6442
  [
6443
  "▁peep",
 
6449
  ],
6450
  [
6451
  "▁subject",
6452
+ -9.455371856689453
6453
  ],
6454
  [
6455
  "▁careful",
 
6457
  ],
6458
  [
6459
  "▁nonsense",
6460
+ -9.455403327941895
6461
  ],
6462
  [
6463
  "▁pine",
 
6469
  ],
6470
  [
6471
  "▁ran",
6472
+ -9.456183433532715
6473
  ],
6474
  [
6475
  "▁sometime",
6476
+ -9.456221580505371
6477
  ],
6478
  [
6479
  "▁compar",
6480
+ -9.456564903259277
6481
  ],
6482
  [
6483
  "▁Once",
 
6497
  ],
6498
  [
6499
  "▁table",
6500
+ -9.461024284362793
6501
  ],
6502
  [
6503
  "▁prove",
 
6525
  ],
6526
  [
6527
  "paper",
6528
+ -9.531177520751953
6529
  ],
6530
  [
6531
  "upon",
6532
+ -9.531881332397461
6533
  ],
6534
  [
6535
  "some",
 
6537
  ],
6538
  [
6539
  "▁favor",
6540
+ -9.538238525390625
6541
  ],
6542
  [
6543
  "named",
 
6545
  ],
6546
  [
6547
  "ode",
6548
+ -9.582578659057617
6549
  ],
6550
  [
6551
  "cked",
 
6561
  ],
6562
  [
6563
  "▁stat",
6564
+ -9.591828346252441
6565
  ],
6566
  [
6567
  "▁effort",
 
6569
  ],
6570
  [
6571
  "▁enter",
6572
+ -9.609453201293945
6573
  ],
6574
  [
6575
  "▁surprise",
 
6581
  ],
6582
  [
6583
  "▁rikisha",
6584
+ -9.618317604064941
6585
  ],
6586
  [
6587
  "▁whi",
6588
+ -9.618339538574219
6589
  ],
6590
  [
6591
  "ency",
 
6601
  ],
6602
  [
6603
  "▁prefer",
6604
+ -9.620063781738281
6605
  ],
6606
  [
6607
  "▁fun",
 
6609
  ],
6610
  [
6611
  "▁require",
6612
+ -9.620274543762207
6613
  ],
6614
  [
6615
  "▁imagin",
6616
+ -9.620284080505371
6617
  ],
6618
  [
6619
  "▁vigor",
6620
+ -9.620284080505371
6621
  ],
6622
  [
6623
  "Botchan",
 
6797
  ],
6798
  [
6799
  "▁rattl",
6800
+ -9.620288848876953
6801
  ],
6802
  [
6803
  "▁attention",
 
6805
  ],
6806
  [
6807
  "▁New",
6808
+ -9.620292663574219
6809
  ],
6810
  [
6811
  "claim",
 
6837
  ],
6838
  [
6839
  "▁orange",
6840
+ -9.620302200317383
6841
  ],
6842
  [
6843
  "▁dull",
6844
+ -9.620311737060547
6845
  ],
6846
  [
6847
  "▁river",
 
6849
  ],
6850
  [
6851
  "▁fuss",
6852
+ -9.620326042175293
6853
  ],
6854
  [
6855
  "▁cap",
 
6885
  ],
6886
  [
6887
  "nosu",
6888
+ -9.620451927185059
6889
  ],
6890
  [
6891
  "▁flat",
 
6925
  ],
6926
  [
6927
  "▁sauc",
6928
+ -9.620758056640625
6929
  ],
6930
  [
6931
  "▁rice",
 
6949
  ],
6950
  [
6951
  "▁treatment",
6952
+ -9.621350288391113
6953
  ],
6954
  [
6955
  "▁favorit",
6956
+ -9.621603965759277
6957
  ],
6958
  [
6959
  "▁glo",
 
6977
  ],
6978
  [
6979
  "▁file",
6980
+ -9.623125076293945
6981
  ],
6982
  [
6983
  "▁reasonable",
6984
+ -9.623706817626953
6985
  ],
6986
  [
6987
  "▁anyone",
 
7009
  ],
7010
  [
7011
  "▁hall",
7012
+ -9.627115249633789
7013
  ],
7014
  [
7015
  "▁ice",
7016
+ -9.630646705627441
7017
  ],
7018
  [
7019
  "ctual",
 
7041
  ],
7042
  [
7043
  "site",
7044
+ -9.645623207092285
7045
  ],
7046
  [
7047
  "you",
 
7061
  ],
7062
  [
7063
  "duced",
7064
+ -9.689046859741211
7065
  ],
7066
  [
7067
  "▁format",
 
7073
  ],
7074
  [
7075
  "▁dar",
7076
+ -9.694108009338379
7077
  ],
7078
  [
7079
  "pic",
 
7101
  ],
7102
  [
7103
  "mats",
7104
+ -9.743086814880371
7105
  ],
7106
  [
7107
  "knee",
 
7113
  ],
7114
  [
7115
  "goo",
7116
+ -9.794201850891113
7117
  ],
7118
  [
7119
  "▁necessar",
 
7125
  ],
7126
  [
7127
  "▁law",
7128
+ -9.801798820495605
7129
  ],
7130
  [
7131
  "▁decid",
 
7133
  ],
7134
  [
7135
  "trict",
7136
+ -9.808300018310547
7137
  ],
7138
  [
7139
  "▁settl",
 
7153
  ],
7154
  [
7155
  "ould",
7156
+ -9.819173812866211
7157
  ],
7158
  [
7159
  "pping",
7160
+ -9.819404602050781
7161
  ],
7162
  [
7163
  "uck",
 
7165
  ],
7166
  [
7167
  "awn",
7168
+ -9.819780349731445
7169
  ],
7170
  [
7171
  "▁compli",
 
7177
  ],
7178
  [
7179
  "eneral",
7180
+ -9.820164680480957
7181
  ],
7182
  [
7183
  "mitted",
 
7385
  ],
7386
  [
7387
  "approv",
7388
+ -9.820286750793457
7389
  ],
7390
  [
7391
  "nounc",
7392
+ -9.820286750793457
7393
  ],
7394
  [
7395
  "▁everywhere",
7396
+ -9.820286750793457
7397
  ],
7398
  [
7399
  "▁snap",
7400
+ -9.820286750793457
7401
  ],
7402
  [
7403
  "Suppos",
7404
+ -9.820287704467773
7405
  ],
7406
  [
7407
  "▁begun",
7408
+ -9.820287704467773
7409
  ],
7410
  [
7411
  "▁fix",
7412
+ -9.820287704467773
7413
  ],
7414
  [
7415
  "▁respectfully",
7416
+ -9.820287704467773
7417
  ],
7418
  [
7419
  "▁result",
7420
+ -9.820287704467773
7421
  ],
7422
  [
7423
  "▁yellow",
7424
+ -9.820287704467773
7425
  ],
7426
  [
7427
  "umbling",
7428
+ -9.820290565490723
7429
  ],
7430
  [
7431
  "▁official",
7432
+ -9.820290565490723
7433
  ],
7434
  [
7435
  "▁group",
 
7449
  ],
7450
  [
7451
  "▁firm",
7452
+ -9.820300102233887
7453
  ],
7454
  [
7455
  "▁gramma",
7456
+ -9.820300102233887
7457
  ],
7458
  [
7459
  "▁panel",
7460
+ -9.820300102233887
7461
  ],
7462
  [
7463
  "▁itself",
 
7501
  ],
7502
  [
7503
  "▁slap",
7504
+ -9.820343971252441
7505
  ],
7506
  [
7507
  "▁noisy",
 
7517
  ],
7518
  [
7519
  "chief",
7520
+ -9.820390701293945
7521
  ],
7522
  [
7523
  "▁shouted",
7524
+ -9.820408821105957
7525
  ],
7526
  [
7527
  "▁ball",
 
7541
  ],
7542
  [
7543
  "▁edge",
7544
+ -9.820578575134277
7545
  ],
7546
  [
7547
  "▁shak",
 
7549
  ],
7550
  [
7551
  "▁pride",
7552
+ -9.820841789245605
7553
  ],
7554
  [
7555
  "▁expenses",
 
7561
  ],
7562
  [
7563
  "▁Tak",
7564
+ -9.820967674255371
7565
  ],
7566
  [
7567
  "▁broke",
7568
+ -9.821123123168945
7569
  ],
7570
  [
7571
  "struck",
 
7609
  ],
7610
  [
7611
  "▁tight",
7612
+ -9.821817398071289
7613
  ],
7614
  [
7615
  "▁Every",
7616
+ -9.821944236755371
7617
  ],
7618
  [
7619
  "reafter",
 
7621
  ],
7622
  [
7623
  "▁brain",
7624
+ -9.822479248046875
7625
  ],
7626
  [
7627
  "▁manage",
 
7633
  ],
7634
  [
7635
  "grace",
7636
+ -9.829718589782715
7637
  ],
7638
  [
7639
  "formed",
 
7669
  ],
7670
  [
7671
  "empt",
7672
+ -9.883857727050781
7673
  ],
7674
  [
7675
  "dog",
 
7677
  ],
7678
  [
7679
  "Here",
7680
+ -9.904093742370605
7681
  ],
7682
  [
7683
  "▁prais",
 
7697
  ],
7698
  [
7699
  "face",
7700
+ -9.979460716247559
7701
  ],
7702
  [
7703
  "▁punish",
 
7733
  ],
7734
  [
7735
  "aka",
7736
+ -10.034581184387207
7737
  ],
7738
  [
7739
  "pecul",
 
7745
  ],
7746
  [
7747
  "▁advis",
7748
+ -10.064568519592285
7749
  ],
7750
  [
7751
  "educat",
 
7757
  ],
7758
  [
7759
  "▁respon",
7760
+ -10.070267677307129
7761
  ],
7762
  [
7763
  "▁express",
 
8117
  ],
8118
  [
8119
  "version",
8120
+ -10.070286750793457
8121
  ],
8122
  [
8123
  "▁engage",
8124
+ -10.070286750793457
8125
  ],
8126
  [
8127
  "▁hobby",
8128
+ -10.070286750793457
8129
  ],
8130
  [
8131
  "▁length",
8132
+ -10.070286750793457
8133
  ],
8134
  [
8135
  "▁logic",
8136
+ -10.070286750793457
8137
  ],
8138
  [
8139
  "▁midnight",
8140
+ -10.070286750793457
8141
  ],
8142
  [
8143
  "▁polish",
8144
+ -10.070286750793457
8145
  ],
8146
  [
8147
  "(",
8148
+ -10.312033653259277
8149
  ],
8150
  [
8151
  "*",
 
8157
  ],
8158
  [
8159
  "q",
8160
+ -11.903417587280273
8161
  ],
8162
  [
8163
  "j",
 
8165
  ],
8166
  [
8167
  "v",
8168
+ -11.903617858886719
8169
  ]
8170
  ],
8171
  "byte_fallback": false
tokenizer_config.json CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "added_tokens_decoder": {
3
  "0": {
4
  "content": "<unk>",
@@ -73,15 +74,11 @@
73
  "extra_ids": 0,
74
  "legacy": true,
75
  "mask_token": "<MASK>",
76
- "max_length": 2048,
77
  "model_max_length": 2048,
78
  "pad_token": "<pad>",
79
  "sep_token": "<SEP>",
80
  "sp_model_kwargs": {},
81
  "split_special_tokens": true,
82
- "stride": 0,
83
  "tokenizer_class": "T5Tokenizer",
84
- "truncation_side": "right",
85
- "truncation_strategy": "longest_first",
86
  "unk_token": "<unk>"
87
  }
 
1
  {
2
+ "add_prefix_space": true,
3
  "added_tokens_decoder": {
4
  "0": {
5
  "content": "<unk>",
 
74
  "extra_ids": 0,
75
  "legacy": true,
76
  "mask_token": "<MASK>",
 
77
  "model_max_length": 2048,
78
  "pad_token": "<pad>",
79
  "sep_token": "<SEP>",
80
  "sp_model_kwargs": {},
81
  "split_special_tokens": true,
 
82
  "tokenizer_class": "T5Tokenizer",
 
 
83
  "unk_token": "<unk>"
84
  }