MCOD-4.7M / tokenizer.json
Harley-ml's picture
Upload 4 files
3006ff4 verified
{
"version": "1.0",
"truncation": null,
"padding": null,
"added_tokens": [
{
"id": 0,
"content": "<unk>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
}
],
"normalizer": null,
"pre_tokenizer": {
"type": "ByteLevel",
"add_prefix_space": true,
"trim_offsets": true,
"use_regex": true
},
"post_processor": {
"type": "ByteLevel",
"add_prefix_space": true,
"trim_offsets": true,
"use_regex": true
},
"decoder": {
"type": "ByteLevel",
"add_prefix_space": true,
"trim_offsets": true,
"use_regex": true
},
"model": {
"type": "BPE",
"dropout": null,
"unk_token": "<unk>",
"continuing_subword_prefix": null,
"end_of_word_suffix": null,
"fuse_unk": false,
"byte_fallback": false,
"ignore_merges": false,
"vocab": {
"<unk>": 0,
"!": 1,
"\"": 2,
"#": 3,
"$": 4,
"%": 5,
"&": 6,
"'": 7,
"(": 8,
")": 9,
"*": 10,
"+": 11,
",": 12,
"-": 13,
".": 14,
"/": 15,
"0": 16,
"1": 17,
"2": 18,
"3": 19,
"4": 20,
"5": 21,
"6": 22,
"7": 23,
"8": 24,
"9": 25,
":": 26,
";": 27,
"<": 28,
"=": 29,
">": 30,
"?": 31,
"@": 32,
"A": 33,
"B": 34,
"C": 35,
"D": 36,
"E": 37,
"F": 38,
"G": 39,
"H": 40,
"I": 41,
"J": 42,
"K": 43,
"L": 44,
"M": 45,
"N": 46,
"O": 47,
"P": 48,
"Q": 49,
"R": 50,
"S": 51,
"T": 52,
"U": 53,
"V": 54,
"W": 55,
"X": 56,
"Y": 57,
"Z": 58,
"[": 59,
"\\": 60,
"]": 61,
"^": 62,
"_": 63,
"`": 64,
"a": 65,
"b": 66,
"c": 67,
"d": 68,
"e": 69,
"f": 70,
"g": 71,
"h": 72,
"i": 73,
"j": 74,
"k": 75,
"l": 76,
"m": 77,
"n": 78,
"o": 79,
"p": 80,
"q": 81,
"r": 82,
"s": 83,
"t": 84,
"u": 85,
"v": 86,
"w": 87,
"x": 88,
"y": 89,
"z": 90,
"{": 91,
"|": 92,
"}": 93,
"~": 94,
"Ċ": 95,
"č": 96,
"Ġ": 97,
"\\\"": 98,
"Ġ\\\"": 99,
"\\\":": 100,
"er": 101,
"en": 102,
"ti": 103,
"on": 104,
"\\\",": 105,
"si": 106,
"at": 107,
"in": 108,
"ro": 109,
"tion": 110,
"id": 111,
"Ġ1": 112,
"Ġ0": 113,
"or": 114,
"la": 115,
"po": 116,
"al": 117,
"el": 118,
"tr": 119,
"ut": 120,
"nu": 121,
"od": 122,
"se": 123,
"pe": 124,
"ch": 125,
"ze": 126,
"ty": 127,
"ar": 128,
"ad": 129,
"size": 130,
"dro": 131,
"ed": 132,
"ec": 133,
"Ġ2": 134,
"to": 135,
"type": 136,
"num": 137,
"lay": 138,
"att": 139,
"layer": 140,
"an": 141,
"ca": 142,
"den": 143,
"pout": 144,
"dropout": 145,
"hid": 146,
"hidden": 147,
"ken": 148,
"ention": 149,
"attention": 150,
"ing": 151,
"token": 152,
"ue": 153,
"ma": 154,
"Ġ{": 155,
"Ġ3": 156,
"re": 157,
"em": 158,
"Ġ5": 159,
"true": 160,
"Ġtrue": 161,
"pro": 162,
"orm": 163,
"ac": 164,
"12": 165,
"emb": 166,
"02": 167,
"Ġf": 168,
"alse": 169,
"Ġfalse": 170,
"prob": 171,
"ex": 172,
"oder": 173,
"embed": 174,
"ding": 175,
"Ġ[": 176,
"],": 177,
"embedding": 178,
"am": 179,
"Ġ12": 180,
"odel": 181,
"00": 182,
"fi": 183,
"he": 184,
"di": 185,
"os": 186,
"it": 187,
"layers": 188,
"model": 189,
"vo": 190,
"cab": 191,
"vocab": 192,
"head": 193,
"Ġ{\\\"": 194,
"ure": 195,
"Ġ512": 196,
"st": 197,
"posi": 198,
"ect": 199,
"position": 200,
"max": 201,
"norm": 202,
"sk": 203,
"ll": 204,
"EL": 205,
"ert": 206,
"lo": 207,
"LA": 208,
"},": 209,
"BEL": 210,
"LABEL": 211,
"act": 212,
"heads": 213,
"ans": 214,
"ext": 215,
"las": 216,
"iz": 217,
"text": 218,
"trans": 219,
"ate": 220,
"th": 221,
"ver": 222,
"ation": 223,
"ge": 224,
"lassi": 225,
"sion": 226,
"embeddings": 227,
"ep": 228,
"{\\\"": 229,
"\":": 230,
"\"}": 231,
"\"{\\\"": 232,
"}\"}": 233,
"čĊ": 234,
"Ġ\"{\\\"": 235,
"Ġ{\"": 236,
"dec": 237,
"Ġ[\\\"": 238,
"\\\"],": 239,
"enc": 240,
"decoder": 241,
"lab": 242,
"ter": 243,
"ini": 244,
"izer": 245,
"label": 246,
"elu": 247,
"use": 248,
"tiv": 249,
"arch": 250,
"form": 251,
"ures": 252,
"len": 253,
"itect": 254,
"architect": 255,
"architectures": 256,
"su": 257,
"Ġ4": 258,
"pat": 259,
"transform": 260,
"gth": 261,
"ers": 262,
"tial": 263,
"lassifi": 264,
"length": 265,
"gelu": 266,
"ame": 267,
"version": 268,
"mask": 269,
"transformers": 270,
"Ġ7": 271,
"initial": 272,
"bert": 273,
"initializer": 274,
"path": 275,
"pad": 276,
"null": 277,
"Ġnull": 278,
"con": 279,
"fe": 280,
"name": 281,
"sum": 282,
"Ġ6": 283,
"ng": 284,
"For": 285,
"ran": 286,
"Ġ\"{\\\"_": 287,
"dim": 288,
"range": 289,
"le": 290,
"68": 291,
"flo": 292,
"05": 293,
"float": 294,
"tor": 295,
"32": 296,
"dtype": 297,
"torch": 298,
"mar": 299,
"Ġ768": 300,
"ent": 301,
"eos": 302,
"encoder": 303,
"feat": 304,
"eps": 305,
"che": 306,
"edi": 307,
"cache": 308,
"inter": 309,
"is": 310,
"summar": 311,
"fu": 312,
"medi": 313,
"ol": 314,
"activ": 315,
"activation": 316,
"mediate": 317,
"intermediate": 318,
"classifi": 319,
"me": 320,
"07": 321,
"bos": 322,
"conv": 323,
"drop": 324,
"ev": 325,
"proj": 326,
"ear": 327,
"072": 328,
"summary": 329,
"Ġ102": 330,
"ab": 331,
"be": 332,
"Ġ1024": 333,
"Ġ3072": 334,
"Ġ16": 335,
"Ġ32": 336,
"cation": 337,
"56": 338,
"classifier": 339,
"eck": 340,
"nel": 341,
"probs": 342,
"ams": 343,
"check": 344,
"out": 345,
"ting": 346,
"put": 347,
"\\\"},": 348,
"sc": 349,
"poin": 350,
"checkpoin": 351,
"as": 352,
"Ġ128": 353,
"ne": 354,
"ff": 355,
"ase": 356,
"gr": 357,
"full": 358,
"ta": 359,
"Ġ502": 360,
"qu": 361,
"output": 362,
"ient": 363,
"time": 364,
"ig": 365,
"art": 366,
"up": 367,
"ap": 368,
"grad": 369,
"gradient": 370,
"Ġ8": 371,
"un": 372,
"checkpointing": 373,
"per": 374,
"sol": 375,
"tive": 376,
"lin": 377,
"96": 378,
"extr": 379,
"min": 380,
"scal": 381,
"bi": 382,
"16": 383,
"berta": 384,
"ForC": 385,
"ute": 386,
"absol": 387,
"absolute": 388,
"ck": 389,
"LM": 390,
"linear": 391,
"ts": 392,
"for": 393,
"av": 394,
"ction": 395,
"igh": 396,
"base": 397,
"ector": 398,
"do": 399,
"ly": 400,
"Ġ10": 401,
"48": 402,
"Ġ40": 403,
"extract": 404,
"Bert": 405,
"ct": 406,
"beams": 407,
"we": 408,
"gro": 409,
"Classifi": 410,
"scale": 411,
"Classification": 412,
"pt": 413,
"layerdrop": 414,
"group": 415,
"sil": 416,
"22": 417,
"ence": 418,
"weigh": 419,
"pos": 420,
"pre": 421,
"attn": 422,
"Ġ20": 423,
"spe": 424,
"cod": 425,
"au": 426,
"10": 427,
"fin": 428,
"ener": 429,
"Ġ4096": 430,
"pool": 431,
"par": 432,
"bias": 433,
"chan": 434,
"task": 435,
"channel": 436,
"evector": 437,
"codevector": 438,
"rate": 439,
"BertFor": 440,
"Ġ256": 441,
"start": 442,
"spec": 443,
"top": 444,
"pooler": 445,
"ord": 446,
"ali": 447,
"pdrop": 448,
"feature": 449,
"quence": 450,
"eneration": 451,
"Model": 452,
"0000": 453,
"Ġ15": 454,
"dev": 455,
"embd": 456,
"adap": 457,
"adapter": 458,
"add": 459,
"ffn": 460,
"Ġ24": 461,
"Se": 462,
"14": 463,
"str": 464,
"ker": 465,
"Sequence": 466,
"SequenceClassification": 467,
"dition": 468,
"Ġ64": 469,
"pa": 470,
"epsil": 471,
"epsilon": 472,
"Ġ2048": 473,
"de": 474,
"fun": 475,
"til": 476,
"tra": 477,
"kernel": 478,
"tie": 479,
"oss": 480,
"rope": 481,
"function": 482,
"ce": 483,
"ping": 484,
"fix": 485,
"loss": 486,
"roberta": 487,
"no": 488,
"its": 489,
"stop": 490,
"word": 491,
"lation": 492,
"early": 493,
"stopping": 494,
"}},": 495,
"pen": 496,
"000": 497,
"positions": 498,
"tic": 499,
"ple": 500,
"ditional": 501,
"past": 502,
"nn": 503,
"fic": 504,
"Ġ305": 505,
"\\\\": 506,
"alize": 507,
"normalize": 508,
"ment": 509,
"prefix": 510,
"lative": 511,
"relative": 512,
"Generation": 513,
"lem": 514,
"ide": 515,
"groups": 516,
"onditional": 517,
"onditionalGeneration": 518,
"ForConditionalGeneration": 519,
"li": 520,
"fact": 521,
"speci": 522,
"final": 523,
"problem": 524,
"06": 525,
"alty": 526,
"log": 527,
"penalty": 528,
"Ġ30522": 529,
"factor": 530,
"labels": 531,
"classification": 532,
"ish": 533,
"sl": 534,
"ctc": 535,
"val": 536,
"fir": 537,
"ace": 538,
"first": 539,
"iding": 540,
"sliding": 541,
"new": 542,
"Ro": 543,
"sing": 544,
"sam": 545,
"params": 546,
"et": 547,
"zer": 548,
"weight": 549,
"bu": 550,
"single": 551,
"specific": 552,
"sed": 553,
"logits": 554,
"Ġ50256": 555,
"19": 556,
"ls": 557,
"cased": 558,
"sta": 559,
"td": 560,
"ection": 561,
"init": 562,
"stride": 563,
"dir": 564,
"tdnn": 565,
"ke": 566,
"dis": 567,
"so": 568,
"gpt": 569,
"57": 570,
"wav": 571,
"classi": 572,
"ization": 573,
"train": 574,
"able": 575,
"classif": 576,
"sh": 577,
"sample": 578,
"To": 579,
"512": 580,
"vec": 581,
"11": 582,
"weights": 583,
"ri": 584,
"war": 585,
"ER": 586,
"BertForSequenceClassification": 587,
"dat": 588,
"static": 589,
"dow": 590,
"ind": 591,
"Token": 592,
"fig": 593,
"sal": 594,
"vi": 595,
"Ġ514": 596,
"summarization": 597,
"oo": 598,
"kv": 599,
"distil": 600,
"std": 601,
"edu": 602,
"index": 603,
"Ġ50": 604,
"Roberta": 605,
"tem": 606,
"masks": 607,
"late": 608,
"set": 609,
"65": 610,
"ga": 611,
"buck": 612,
"ced": 613,
"key": 614,
"atch": 615,
"ets": 616,
"ic": 617,
"ian": 618,
"15": 619,
"forced": 620,
"buckets": 621,
"PT": 622,
"ner": 623,
"lish": 624,
"value": 625,
"18": 626,
"ode": 627,
"win": 628,
"Ma": 629,
"25": 630,
"lar": 631,
"Ġto": 632,
"fc": 633,
"distilbert": 634,
"inf": 635,
"ĠE": 636,
"translation": 637,
"poch": 638,
"Ġ300": 639,
"ward": 640,
"36": 641,
"ated": 642,
"epoch": 643,
"Ġ50257": 644,
"ve": 645,
"clas": 646,
"OR": 647,
"translate": 648,
"ckpt": 649,
"ss": 650,
"finet": 651,
"17": 652,
"GPT": 653,
"ature": 654,
"sp": 655,
"ĠEng": 656,
"Mask": 657,
"ausal": 658,
"ausalLM": 659,
"ForCausalLM": 660,
"lock": 661,
"ĠEnglish": 662,
"Ġ\\\"},": 663,
"resi": 664,
"Ġ\\\"/": 665,
"Masked": 666,
"quan": 667,
"finetun": 668,
"sel": 669,
"ram": 670,
"mage": 671,
"MaskedLM": 672,
"repe": 673,
"resid": 674,
"co": 675,
"24": 676,
"window": 677,
"large": 678,
"inner": 679,
"21": 680,
"sw": 681,
"lm": 682,
"ur": 683,
"perature": 684,
"temperature": 685,
"app": 686,
"Ġ100": 687,
"13": 688,
"gment": 689,
"config": 690,
"Ġ10000": 691,
"feed": 692,
"RobertaFor": 693,
"forward": 694,
"all": 695,
"uncased": 696,
"the": 697,
"relu": 698,
"ids": 699,
"AR": 700,
"20": 701,
"man": 702,
"ON": 703,
"Ġ25": 704,
"apply": 705,
"cls": 706,
"fore": 707,
"before": 708,
"augment": 709,
"Ġ14": 710,
"Ġ50265": 711,
"Ġ9": 712,
"ngram": 713,
"gative": 714,
"quanti": 715,
"repeat": 716,
"Di": 717,
"uto": 718,
"class": 719,
"ms": 720,
"zero": 721,
"bfloat": 722,
"pu": 723,
"He": 724,
"tar": 725,
"redu": 726,
"negative": 727,
"arn": 728,
"reduction": 729,
"ther": 730,
"net": 731,
"Ġ28": 732,
"wen": 733,
"Wav": 734,
"Vec": 735,
"Ġ11": 736,
"contr": 737,
"silu": 738,
"inity": 739,
"ai": 740,
"other": 741,
"infinity": 742,
"mt": 743,
"rms": 744,
"batch": 745,
"stable": 746,
"image": 747,
"selection": 748,
"and": 749,
"Head": 750,
"patch": 751,
"TC": 752,
"Ġ1500": 753,
"space": 754,
"ft": 755,
"finetuning": 756,
"setting": 757,
"learn": 758,
"128": 759,
"settings": 760,
"tokenizer": 761,
"theta": 762,
"DP": 763,
"face": 764,
"fr": 765,
"ook": 766,
"mean": 767,
"qa": 768,
"LMHead": 769,
"mu": 770,
"ctx": 771,
"DE": 772,
"book": 773,
"LMHeadModel": 774,
"bart": 775,
"sity": 776,
"Ġ320": 777,
"exp": 778,
"OC": 779,
"seq": 780,
"learning": 781,
"ra": 782,
"weighted": 783,
"gated": 784,
"0002": 785,
"Ġ\\\"_": 786,
"lama": 787,
"lt": 788,
"TI": 789,
"vision": 790,
"channels": 791,
"ForCTC": 792,
"ub": 793,
"84": 794,
"PR": 795,
"versity": 796,
"block": 797,
"LOC": 798,
"Bad": 799,
"diversity": 800,
"BadDi": 801,
"PER": 802,
"facebook": 803,
"epochs": 804,
"ORG": 805,
"steps": 806,
"mp": 807,
"Ġ1516": 808,
"negatives": 809,
"quantizer": 810,
"codevectors": 811,
"astive": 812,
"contrastive": 813,
"cal": 814,
"generation": 815,
"DDP": 816,
"DDPM": 817,
"TokenClassification": 818,
"data": 819,
"Dis": 820,
"pr": 821,
"datase": 822,
"An": 823,
"Tokenizer": 824,
"idal": 825,
"soidal": 826,
"sinu": 827,
"shar": 828,
"sinusoidal": 829,
"04": 830,
"Ġ-": 831,
"embds": 832,
"_\\\":": 833,
"mo": 834,
"tral": 835,
"Distil": 836,
"es": 837,
"CI": 838,
"Ġ13": 839,
"get": 840,
"ues": 841,
"checkpoint": 842,
"Auto": 843,
"Ġ\\\".": 844,
"ED": 845,
"ality": 846,
"pretrain": 847,
"26": 848,
"BertForMaskedLM": 849,
"uestion": 850,
"by": 851,
"SC": 852,
"ance": 853,
"FAR": 854,
"ates": 855,
"28": 856,
"CIFAR": 857,
"35": 858,
"local": 859,
"seed": 860,
"models": 861,
"over": 862,
"fusion": 863,
"mode": 864,
"Question": 865,
"dilation": 866,
"ering": 867,
"100": 868,
"ison": 869,
"UN": 870,
"ectra": 871,
"glo": 872,
"sch": 873,
"idi": 874,
"Answ": 875,
"Ġ248": 876,
"Answering": 877,
"QuestionAnswering": 878,
"scaling": 879,
"bal": 880,
"sav": 881,
"env": 882,
"95": 883,
"mb": 884,
"ho": 885,
"xlm": 886,
"\\\"}\"}": 887,
"global": 888,
"mem": 889,
"lp": 890,
"sm": 891,
"soft": 892,
"ize": 893,
"MT": 894,
"23": 895,
"Ġ30": 896,
"bidi": 897,
"Ġ32128": 898,
"cu": 899,
"Ġ200": 900,
"vector": 901,
"tokens": 902,
"Po": 903,
"save": 904,
"input": 905,
"Ġ[[": 906,
"xvector": 907,
"]],": 908,
"order": 909,
"dataset": 910,
"qwen": 911,
"hy": 912,
"gle": 913,
"cast": 914,
"Ġ32000": 915,
"wor": 916,
"upcast": 917,
"inver": 918,
"direction": 919,
"idx": 920,
"res": 921,
"directionality": 922,
"/\\\",": 923,
"inverse": 924,
"reorder": 925,
"Bart": 926,
"target": 927,
"AD": 928,
"small": 929,
"mul": 930,
"Con": 931,
"stance": 932,
"his": 933,
"AT": 934,
"256": 935,
"ameter": 936,
"parameter": 937,
"Ġ26": 938,
"NL": 939,
"xls": 940,
"goo": 941,
"share": 942,
"words": 943,
"lip": 944,
"google": 945,
"def": 946,
"bad": 947,
"mlp": 948,
"27": 949,
"99": 950,
"resu": 951,
"distance": 952,
"bo": 953,
"hisper": 954,
"NLP": 955,
"Ġ\\\"}},": 956,
"pretraining": 957,
"arian": 958,
"Ġ\\\"./": 959,
"Ġ[],": 960,
"33": 961,
"lr": 962,
"work": 963,
"Ġ{},": 964,
"ice": 965,
"por": 966,
"eval": 967,
"Ġ15164": 968,
"ault": 969,
"ODE": 970,
"ack": 971,
"ForSequenceClassification": 972,
"BadDiff": 973,
"op": 974,
"ory": 975,
"RobertaForSequenceClassification": 976,
"ger": 977,
"load": 978,
"ki": 979,
"parameters": 980,
"fre": 981,
"default": 982,
"53": 983,
"uct": 984,
"llama": 985,
"ren": 986,
"ĠF": 987,
"hyper": 988,
"Rates": 989,
"fn": 990,
"Poison": 991,
"BertForTokenClassification": 992,
"Ġ56": 993,
"ĠG": 994,
"mic": 995,
"tary": 996,
"memory": 997,
"rotary": 998,
"Ġ18": 999,
"expert": 1000,
"dense": 1001,
"ef": 1002,
"gener": 1003,
"marian": 1004,
"erman": 1005,
"MI": 1006,
"54": 1007,
"Marian": 1008,
"SI": 1009,
"996": 1010,
"rel": 1011,
"gg": 1012,
"hub": 1013,
"map": 1014,
"MTModel": 1015,
"MarianMTModel": 1016,
"34": 1017,
"one": 1018,
"summarize": 1019,
"schedu": 1020,
"rive": 1021,
"ual": 1022,
"ail": 1023,
"rench": 1024,
"BartForConditionalGeneration": 1025,
"ĠFrench": 1026,
"sin": 1027,
"bin": 1028,
"01": 1029,
"scr": 1030,
"swish": 1031,
"Ġ19": 1032,
"Roman": 1033,
"scratch": 1034,
"29": 1035,
"ine": 1036,
"Ġ50000": 1037,
"ST": 1038,
"XLM": 1039,
"go": 1040,
"Ġ28996": 1041,
"Gen": 1042,
"Qwen": 1043,
"ĠRoman": 1044,
"ĠGerman": 1045,
"ĠRomanian": 1046,
"tp": 1047,
"Ġ224": 1048,
"pri": 1049,
"types": 1050,
"DistilBertForSequenceClassification": 1051,
"64": 1052,
"ite": 1053,
"58": 1054,
"cf": 1055,
"mini": 1056,
"Ġ60": 1057,
"us": 1058,
"Llama": 1059,
"mi": 1060,
"pus": 1061,
"MISC": 1062,
"spar": 1063,
"fp": 1064,
"vit": 1065,
"schedule": 1066,
"Block": 1067,
"end": 1068,
"Ġ384": 1069,
"mm": 1070,
"utral": 1071,
"Config": 1072,
"NE": 1073,
"te": 1074,
"CPR": 1075,
"rain": 1076,
"restart": 1077,
"restarts": 1078,
"electra": 1079,
"wr": 1080,
"micro": 1081,
"opus": 1082,
"ffusion": 1083,
"Ġ1000": 1084,
"beta": 1085,
"mple": 1086,
"sparse": 1087,
"microsoft": 1088,
"last": 1089,
"BertModel": 1090,
"down": 1091,
"Hel": 1092,
"Ġ21": 1093,
"SM": 1094,
"um": 1095,
"sinki": 1096,
"Helsinki": 1097,
"entail": 1098,
"entailment": 1099,
"age": 1100,
"device": 1101,
"ay": 1102,
"sup": 1103,
"cnn": 1104,
"experts": 1105,
"xsum": 1106,
"ip": 1107,
"Ġ24805": 1108,
"uc": 1109,
"Ġ5120": 1110,
"50": 1111,
"write": 1112,
"press": 1113,
"Ġ62": 1114,
"overwrite": 1115,
"768": 1116,
"Ġ36": 1117,
"Ġ142": 1118,
"moe": 1119,
"VE": 1120,
"Train": 1121,
"psi": 1122,
"BadDiffusion": 1123,
"GenBadDiffusion": 1124,
"BertForQuestionAnswering": 1125,
"cfg": 1126,
"OP": 1127,
"AL": 1128,
"Ġ448": 1129,
"vp": 1130,
"AutoModel": 1131,
"ary": 1132,
"001": 1133,
"ES": 1134,
"Ġ500": 1135,
"Ġ1536": 1136,
"Ġ250002": 1137,
"infer": 1138,
"TION": 1139,
"force": 1140,
"reg": 1141,
"suppress": 1142,
"30": 1143,
"whisper": 1144,
"cro": 1145,
"neutral": 1146,
"tmp": 1147,
"meas": 1148,
"mit": 1149,
"dep": 1150,
"condition": 1151,
"measure": 1152,
"cl": 1153,
"network": 1154,
"extra": 1155,
"31": 1156,
"144": 1157,
"former": 1158,
"scri": 1159,
"nli": 1160,
"multi": 1161,
"bj": 1162,
"RobertaForMaskedLM": 1163,
"08": 1164,
"ness": 1165,
"avi": 1166,
"sequence": 1167,
"depth": 1168,
"IN": 1169,
"Ġ17": 1170,
"units": 1171,
"192": 1172,
"ech": 1173,
"lts": 1174,
"stic": 1175,
"conditioning": 1176,
"simple": 1177,
"tt": 1178,
"results": 1179,
"ph": 1180,
"Ġ1000000": 1181,
"freq": 1182,
"mrope": 1183,
"modeling": 1184,
"Ġ48": 1185,
"struct": 1186,
"94": 1187,
"termini": 1188,
"determini": 1189,
"LlamaForCausalLM": 1190,
"deterministic": 1191,
"cc": 1192,
"vis": 1193,
"Ġ\\\"\\\\": 1194,
"frame": 1195,
"hu": 1196,
"rout": 1197,
"home": 1198,
"encode": 1199,
"Ne": 1200,
"py": 1201,
"goal": 1202,
"TIVE": 1203,
"gu": 1204,
"post": 1205,
"hic": 1206,
"om": 1207,
"EN": 1208,
"cle": 1209,
"Ġ\\\\": 1210,
"Ġ1280": 1211,
"cont": 1212,
"tc": 1213,
"Ġ32768": 1214,
"istral": 1215,
"75": 1216,
"wn": 1217,
"Ġ23": 1218,
"slo": 1219,
"Ġ30000": 1220,
"limit": 1221,
"back": 1222,
"Ġ8192": 1223,
"finetuned": 1224,
"Ġ80": 1225,
"auto": 1226,
"ight": 1227,
"cau": 1228,
"not": 1229,
"CON": 1230,
"PAR": 1231,
"il": 1232,
"202": 1233,
"Do": 1234,
"ast": 1235,
"causal": 1236,
"El": 1237,
"sent": 1238,
"mel": 1239,
"sig": 1240,
"In": 1241,
"qkv": 1242,
"bins": 1243,
"Ġ27": 1244,
"eng": 1245,
"Ġ84": 1246,
"300": 1247,
"entable": 1248,
"checkpoints": 1249,
"opentable": 1250,
"Electra": 1251,
"lamb": 1252,
"Image": 1253,
"TR": 1254,
"tur": 1255,
"Ġ35": 1256,
"mod": 1257,
"lambd": 1258,
"cel": 1259,
"interval": 1260,
"Ġ151643": 1261,
"havi": 1262,
"rati": 1263,
"PO": 1264,
"behavi": 1265,
"66": 1266,
"eci": 1267,
"behavior": 1268,
"224": 1269,
"OF": 1270,
"ong": 1271,
"lang": 1272,
"content": 1273,
"tan": 1274,
"causalm": 1275,
"AN": 1276,
"envs": 1277,
"38": 1278,
"384": 1279,
"mtp": 1280,
"}}\"}": 1281,
"project": 1282,
"clip": 1283,
"uration": 1284,
"uth": 1285,
"quad": 1286,
"positive": 1287,
"NO": 1288,
"De": 1289,
"ses": 1290,
"ForImage": 1291,
"ical": 1292,
"37": 1293,
"ule": 1294,
"BO": 1295,
"unk": 1296,
"xlsr": 1297,
"pl": 1298,
"peri": 1299,
"sentence": 1300,
"tanh": 1301,
"Pro": 1302,
"sus": 1303,
"sour": 1304,
"router": 1305,
"ForImageClassification": 1306,
"98": 1307,
"BER": 1308,
"albert": 1309,
"sci": 1310,
"ideo": 1311,
"Ch": 1312,
"fro": 1313,
"Ġ65": 1314,
"backb": 1315,
"blocks": 1316,
"BOX": 1317,
"backbone": 1318,
"mup": 1319,
"Ġ119": 1320,
"deberta": 1321,
"port": 1322,
"trig": 1323,
"embert": 1324,
"gasus": 1325,
"source": 1326,
"mix": 1327,
"partial": 1328,
"trigger": 1329,
"Ġ22": 1330,
"states": 1331,
"Ġ262": 1332,
"structure": 1333,
"hi": 1334,
"classes": 1335,
"effic": 1336,
"aux": 1337,
"OD": 1338,
"step": 1339,
"efficient": 1340,
"tin": 1341,
"drive": 1342,
"jo": 1343,
"ingual": 1344,
"GN": 1345,
"fl": 1346,
"fo": 1347,
"are": 1348,
"warmup": 1349,
"Ġ262144": 1350,
"pytorch": 1351,
"90": 1352,
"adi": 1353,
"mamb": 1354,
"mamba": 1355,
"idth": 1356,
"97": 1357,
"BERT": 1358,
"wer": 1359,
"Ġ50258": 1360,
"RobertaModel": 1361,
"quantiz": 1362,
"clean": 1363,
"tri": 1364,
"Down": 1365,
"Ġ151645": 1366,
"SDE": 1367,
"gs": 1368,
"run": 1369,
"generate": 1370,
"turn": 1371,
"padding": 1372,
"predi": 1373,
"ME": 1374,
"Pre": 1375,
"sizes": 1376,
">\\\",": 1377,
"width": 1378,
"gin": 1379,
"ore": 1380,
"ATE": 1381,
"quantization": 1382,
"Vi": 1383,
"CO": 1384,
"My": 1385,
"only": 1386,
"outputs": 1387,
"tilingual": 1388,
"547": 1389,
"UM": 1390,
"of": 1391,
"ron": 1392,
"return": 1393,
"shared": 1394,
"Ġ31": 1395,
"multilingual": 1396,
"SIGN": 1397,
"ForMaskedLM": 1398,
"Drive": 1399,
"PC": 1400,
"sde": 1401,
"Ġ58": 1402,
"gam": 1403,
"FI": 1404,
"video": 1405,
"ratio": 1406,
"Ġand": 1407,
"adapters": 1408,
"AI": 1409,
"UR": 1410,
"Ġ131": 1411,
"77": 1412,
"Net": 1413,
"spa": 1414,
"lap": 1415,
"UNC": 1416,
"CONJ": 1417,
"result": 1418,
"open": 1419,
"inal": 1420,
"squad": 1421,
"Ġ<": 1422,
"ator": 1423,
"datasets": 1424,
"HE": 1425,
"bits": 1426,
"eb": 1427,
"Ġ131072": 1428,
"tiny": 1429,
"dio": 1430,
"special": 1431,
"com": 1432,
"repo": 1433,
"Training": 1434,
"PART": 1435,
"Ġ119547": 1436,
"spatial": 1437,
"__": 1438,
"read": 1439,
"auth": 1440,
"begin": 1441,
"ecision": 1442,
"MyDrive": 1443,
"mer": 1444,
"AutoConfig": 1445,
"STOP": 1446,
"Ġ503": 1447,
"agg": 1448,
"sual": 1449,
"keep": 1450,
"precision": 1451,
"mixed": 1452,
"del": 1453,
"ery": 1454,
"poison": 1455,
"acc": 1456,
"gpu": 1457,
"generated": 1458,
"Up": 1459,
"Ġ21128": 1460,
"YM": 1461,
"ak": 1462,
"005": 1463,
"self": 1464,
"RobertaForTokenClassification": 1465,
"ux": 1466,
"fil": 1467,
"priv": 1468,
"cell": 1469,
"unslo": 1470,
"from": 1471,
"private": 1472,
"unsloth": 1473,
"46": 1474,
"42": 1475,
"push": 1476,
"VP": 1477,
"accu": 1478,
"der": 1479,
"attentions": 1480,
"336": 1481,
"overlap": 1482,
"car": 1483,
"ul": 1484,
"cross": 1485,
"accumu": 1486,
"table": 1487,
"vl": 1488,
"stage": 1489,
"Al": 1490,
"NEG": 1491,
"40": 1492,
"NUM": 1493,
"gen": 1494,
"ith": 1495,
"accumulation": 1496,
"hor": 1497,
"solver": 1498,
"has": 1499,
"UNI": 1500,
"sign": 1501,
"gamma": 1502,
"eze": 1503,
"sad": 1504,
"uned": 1505,
"postfix": 1506,
"FOR": 1507,
"ball": 1508,
"visual": 1509,
"fclip": 1510,
"Ġ24804": 1511,
"regation": 1512,
"aggregation": 1513,
"im": 1514,
"Ġ96": 1515,
"lan": 1516,
"sched": 1517,
"bott": 1518,
"int": 1519,
"section": 1520,
"main": 1521,
"adiction": 1522,
"obj": 1523,
"Ġ\\\"<": 1524,
"emical": 1525,
"Ġ518": 1526,
"module": 1527,
"ci": 1528,
"ot": 1529,
"Ġ16384": 1530,
"220": 1531,
"ength": 1532,
"layernorm": 1533,
"./": 1534,
"Whisper": 1535,
"erson": 1536,
"leav": 1537,
"grap": 1538,
"contradiction": 1539,
"orig": 1540,
"life": 1541,
"Ġ5026": 1542,
"WhisperForConditionalGeneration": 1543,
"AS": 1544,
"Mo": 1545,
"Re": 1546,
"strength": 1547,
"ru": 1548,
"Ġ57": 1549,
"&_": 1550,
"_&_": 1551,
"ational": 1552,
"leneck": 1553,
"residual": 1554,
"script": 1555,
"ViT": 1556,
"COM": 1557,
"ae": 1558,
"vel": 1559,
"Ġ1519": 1560,
"deep": 1561,
"bottleneck": 1562,
"thod": 1563,
"medium": 1564,
"viron": 1565,
"configuration": 1566,
"pruned": 1567,
"softmax": 1568,
"HED": 1569,
"MED": 1570,
"af": 1571,
"play": 1572,
"quant": 1573,
"SCHED": 1574,
"DownBlock": 1575,
"modules": 1576,
"Py": 1577,
"sic": 1578,
"Ġ29": 1579,
"vironment": 1580,
"bit": 1581,
"ud": 1582,
"neo": 1583,
"duct": 1584,
"ko": 1585,
"ort": 1586,
"sha": 1587,
"XED": 1588,
"sampl": 1589,
"Ġ14336": 1590,
"inference": 1591,
"Albert": 1592,
"tok": 1593,
"torchscript": 1594,
"FIXED": 1595,
"Mistral": 1596,
"tition": 1597,
"VER": 1598,
"mis": 1599,
"anger": 1600,
"tal": 1601,
"fear": 1602,
"\\\\\\\\": 1603,
"als": 1604,
"ased": 1605,
"Ġ250": 1606,
"period": 1607,
"food": 1608,
"gan": 1609,
"En": 1610,
"Hu": 1611,
"gate": 1612,
"008": 1613,
"pretrained": 1614,
"ign": 1615,
"repetition": 1616,
"Ġ500000": 1617,
"UNIPC": 1618,
"sadness": 1619,
"Ġ151936": 1620,
"44": 1621,
"revision": 1622,
"audio": 1623,
"AU": 1624,
"col": 1625,
"interleav": 1626,
"biased": 1627,
"sy": 1628,
"vers": 1629,
"now": 1630,
"55": 1631,
"long": 1632,
"Ġthe": 1633,
"original": 1634,
"args": 1635,
"2000": 1636,
"enti": 1637,
"tom": 1638,
"level": 1639,
"Ġ2501": 1640,
"ODEL": 1641,
"PreTraining": 1642,
"ser": 1643,
"ForQuestionAnswering": 1644,
"Tar": 1645,
"way": 1646,
"lic": 1647,
"ViTForImageClassification": 1648,
"MODEL": 1649,
"mnli": 1650,
"mpnet": 1651,
"crop": 1652,
"POSI": 1653,
"Ġ51865": 1654,
"cam": 1655,
"emo": 1656,
"ffer": 1657,
"joy": 1658,
"filter": 1659,
"52": 1660,
"training": 1661,
"poral": 1662,
"NEGA": 1663,
"person": 1664,
"method": 1665,
"shi": 1666,
"convers": 1667,
"152": 1668,
"Target": 1669,
"ie": 1670,
"ard": 1671,
"code": 1672,
"RobertaForQuestionAnswering": 1673,
"resnet": 1674,
"freeze": 1675,
"Snow": 1676,
"Tr": 1677,
"ili": 1678,
"pegasus": 1679,
"sur": 1680,
"bug": 1681,
"temporal": 1682,
"hics": 1683,
"ballTarget": 1684,
"POSITIVE": 1685,
"SnowballTarget": 1686,
"ity": 1687,
"mbart": 1688,
"ant": 1689,
"izon": 1690,
"merge": 1691,
"horizon": 1692,
"Ġ43": 1693,
"ramids": 1694,
"Pyramids": 1695,
"Ġ250112": 1696,
"NEGATIVE": 1697,
"environment": 1698,
"best": 1699,
"camembert": 1700,
"xl": 1701,
"verage": 1702,
"quality": 1703,
"debug": 1704,
"graphics": 1705,
"conversational": 1706,
"43": 1707,
"59": 1708,
"gap": 1709,
"peech": 1710,
"bio": 1711,
"ADJ": 1712,
"hicle": 1713,
"sume": 1714,
"qui": 1715,
"ssm": 1716,
"resume": 1717,
"trainer": 1718,
"ĠS": 1719,
"UpBlock": 1720,
"ora": 1721,
"lambda": 1722,
"ise": 1723,
"vehicle": 1724,
"surpri": 1725,
"reward": 1726,
"320": 1727,
"buffer": 1728,
"ENT": 1729,
"uction": 1730,
"alo": 1731,
"initialize": 1732,
"ForTokenClassification": 1733,
"langu": 1734,
"gem": 1735,
"answer": 1736,
"speech": 1737,
"fixed": 1738,
"interleaved": 1739,
"language": 1740,
"hf": 1741,
"oning": 1742,
"height": 1743,
"Ġ248044": 1744,
"79": 1745,
"80": 1746,
"qk": 1747,
"tern": 1748,
"query": 1749,
"Ġ2560": 1750,
"cus": 1751,
"mistral": 1752,
"pla": 1753,
"thread": 1754,
"Ġ5036": 1755,
"accep": 1756,
"average": 1757,
"Ġ33": 1758,
"location": 1759,
"AutoModelForCausalLM": 1760,
"engine": 1761,
"surprise": 1762,
"minator": 1763,
"ADV": 1764,
"Ġ192": 1765,
"AUX": 1766,
"\\\"}}\"}": 1767,
"pture": 1768,
"hyperparameters": 1769,
"behavioral": 1770,
"QU": 1771,
"lue": 1772,
"insic": 1773,
"extrinsic": 1774,
"span": 1775,
"Ġ\\\"../": 1776,
"Ġ5005": 1777,
"behaviors": 1778,
"signals": 1779,
"70": 1780,
"gi": 1781,
"capture": 1782,
"Ġ310": 1783,
"cloning": 1784,
"Deberta": 1785,
"areas": 1786,
"lifetime": 1787,
"threaded": 1788,
"72": 1789,
"ecut": 1790,
"execut": 1791,
"comm": 1792,
"NOUN": 1793,
"Bi": 1794,
"HI": 1795,
"ables": 1796,
"phm": 1797,
"Mini": 1798,
"Ġ20000": 1799,
"discri": 1800,
"temp": 1801,
"discriminator": 1802,
"DistilBertForMaskedLM": 1803,
"openai": 1804,
"shape": 1805,
"acceptable": 1806,
"llm": 1807,
"constr": 1808,
"BertTokenizer": 1809,
"executables": 1810,
"Ġof": 1811,
"additional": 1812,
"delta": 1813,
"custom": 1814,
"cos": 1815,
"indexes": 1816,
"Ġ11008": 1817,
"60": 1818,
"88": 1819,
"Ġ\\\",": 1820,
"Ġ1152": 1821,
"bile": 1822,
"cap": 1823,
"low": 1824,
"DET": 1825,
"sequences": 1826,
"topk": 1827,
"/.": 1828,
"OT": 1829,
"pct": 1830,
"Ġ10000000": 1831,
"flat": 1832,
"IS": 1833,
"ln": 1834,
"0003": 1835,
"39": 1836,
"cor": 1837,
"sers": 1838,
"gging": 1839,
"tu": 1840,
"Ġ5035": 1841,
"opti": 1842,
"predict": 1843,
"construction": 1844,
"lora": 1845,
"mr": 1846,
"qg": 1847,
"tas": 1848,
"PRON": 1849,
"PROP": 1850,
"EX": 1851,
"off": 1852,
"sease": 1853,
"Ġ128000": 1854,
"103": 1855,
"bot": 1856,
"equi": 1857,
"sian": 1858,
"valent": 1859,
"VERB": 1860,
"equivalent": 1861,
"09": 1862,
"coder": 1863,
"sep": 1864,
"RO": 1865,
"stack": 1866,
"subj": 1867,
"US": 1868,
"Ġ595": 1869,
"cola": 1870,
"ADP": 1871,
"big": 1872,
"lu": 1873,
"ForPreTraining": 1874,
"sampling": 1875,
"PROPN": 1876,
"Co": 1877,
"ba": 1878,
"cated": 1879,
"rd": 1880,
"trained": 1881,
"AutoTrain": 1882,
"template": 1883,
"51": 1884,
"SYM": 1885,
"ni": 1886,
"features": 1887,
"XLMRobertaForTokenClassification": 1888,
"PUNC": 1889,
"sa": 1890,
"product": 1891,
"binary": 1892,
"Chemical": 1893,
"MistralForCausalLM": 1894,
"chunk": 1895,
"loom": 1896,
"vice": 1897,
"Ġ2304": 1898,
"Att": 1899,
"CCONJ": 1900,
"mon": 1901,
"dent": 1902,
"linux": 1903,
"ignore": 1904,
"mlm": 1905,
"sv": 1906,
"101": 1907,
"ebd": 1908,
"NC": 1909,
"bm": 1910,
"}}},": 1911,
"288": 1912,
"hugging": 1913,
"PUNCT": 1914,
"74": 1915,
"EV": 1916,
"ix": 1917,
"ppo": 1918,
"Ġ34": 1919,
"coefficient": 1920,
"cen": 1921,
"ou": 1922,
"sst": 1923,
"und": 1924,
"0001": 1925,
"depths": 1926,
"INT": 1927,
"non": 1928,
"FE": 1929,
"imp": 1930,
"ous": 1931,
"stem": 1932,
"skip": 1933,
"ATUR": 1934,
"Attn": 1935,
"So": 1936,
"Ġ59": 1937,
"Fast": 1938,
"alth": 1939,
"XLMRobertaForSequenceClassification": 1940,
"umn": 1941,
"HEAD": 1942,
"column": 1943,
"DATE": 1944,
"Mul": 1945,
"mail": 1946,
"vox": 1947,
"love": 1948,
"coef": 1949,
"deepstack": 1950,
"br": 1951,
"du": 1952,
"Ġst": 1953,
"Ġ{}},": 1954,
"news": 1955,
"comp": 1956,
"Ġ248320": 1957,
"ggy": 1958,
"Cam": 1959,
"fast": 1960,
"english": 1961,
"spanish": 1962,
"49": 1963,
"ATION": 1964,
"layout": 1965,
"dedi": 1966,
"ust": 1967,
"stu": 1968,
"ORA": 1969,
"auxili": 1970,
"Multi": 1971,
"dedicated": 1972,
"auxiliary": 1973,
"YP": 1974,
"tec": 1975,
"normal": 1976,
"Neo": 1977,
"ElectraForSequenceClassification": 1978,
"FEATUR": 1979,
"FT": 1980,
"Ġ39": 1981,
"Ġ46": 1982,
"repla": 1983,
"berts": 1984,
"GE": 1985,
"\\\"]": 1986,
"Huggy": 1987,
"Ġ4304": 1988,
"--": 1989,
"824": 1990,
"HAT": 1991,
"ber": 1992,
"false": 1993,
"Ġ\\\"[": 1994,
"total": 1995,
"Name": 1996,
"ane": 1997,
"NEU": 1998,
"FED": 1999,
"ws": 2000,
"tron": 2001,
"ement": 2002,
"ression": 2003,
"FEDORA": 2004,
"73": 2005,
"Ġ12288": 2006,
"sts": 2007,
"Encoder": 2008,
"DebertaV": 2009,
"45": 2010,
"78": 2011,
"dict": 2012,
"Ġ50264": 2013,
"GPTNeo": 2014,
"gust": 2015,
"student": 2016,
"IC": 2017,
"MP": 2018,
"bs": 2019,
"Ġre": 2020,
"valid": 2021,
"layoutlm": 2022,
"Or": 2023,
"cy": 2024,
"nl": 2025,
"xi": 2026,
"search": 2027,
"action": 2028,
"lender": 2029,
"architecture": 2030,
"appro": 2031,
"noise": 2032,
"center": 2033,
"AC": 2034,
"Pe": 2035,
"projector": 2036,
"longformer": 2037,
"76": 2038,
"chine": 2039,
"ang": 2040,
"fusions": 2041,
"INTJ": 2042,
"lenderbot": 2043,
"VL": 2044,
"fer": 2045,
"075": 2046,
"line": 2047
},
"merges": [
[
"\\",
"\""
],
[
"Ġ",
"\\\""
],
[
"\\\"",
":"
],
[
"e",
"r"
],
[
"e",
"n"
],
[
"t",
"i"
],
[
"o",
"n"
],
[
"\\\"",
","
],
[
"s",
"i"
],
[
"a",
"t"
],
[
"i",
"n"
],
[
"r",
"o"
],
[
"ti",
"on"
],
[
"i",
"d"
],
[
"Ġ",
"1"
],
[
"Ġ",
"0"
],
[
"o",
"r"
],
[
"l",
"a"
],
[
"p",
"o"
],
[
"a",
"l"
],
[
"e",
"l"
],
[
"t",
"r"
],
[
"u",
"t"
],
[
"n",
"u"
],
[
"o",
"d"
],
[
"s",
"e"
],
[
"p",
"e"
],
[
"c",
"h"
],
[
"z",
"e"
],
[
"t",
"y"
],
[
"a",
"r"
],
[
"a",
"d"
],
[
"si",
"ze"
],
[
"d",
"ro"
],
[
"e",
"d"
],
[
"e",
"c"
],
[
"Ġ",
"2"
],
[
"t",
"o"
],
[
"ty",
"pe"
],
[
"nu",
"m"
],
[
"la",
"y"
],
[
"at",
"t"
],
[
"lay",
"er"
],
[
"a",
"n"
],
[
"c",
"a"
],
[
"d",
"en"
],
[
"po",
"ut"
],
[
"dro",
"pout"
],
[
"h",
"id"
],
[
"hid",
"den"
],
[
"k",
"en"
],
[
"en",
"tion"
],
[
"att",
"ention"
],
[
"in",
"g"
],
[
"to",
"ken"
],
[
"u",
"e"
],
[
"m",
"a"
],
[
"Ġ",
"{"
],
[
"Ġ",
"3"
],
[
"r",
"e"
],
[
"e",
"m"
],
[
"Ġ",
"5"
],
[
"tr",
"ue"
],
[
"Ġ",
"true"
],
[
"p",
"ro"
],
[
"or",
"m"
],
[
"a",
"c"
],
[
"1",
"2"
],
[
"em",
"b"
],
[
"0",
"2"
],
[
"Ġ",
"f"
],
[
"al",
"se"
],
[
"Ġf",
"alse"
],
[
"pro",
"b"
],
[
"e",
"x"
],
[
"od",
"er"
],
[
"emb",
"ed"
],
[
"d",
"ing"
],
[
"Ġ",
"["
],
[
"]",
","
],
[
"embed",
"ding"
],
[
"a",
"m"
],
[
"Ġ1",
"2"
],
[
"od",
"el"
],
[
"0",
"0"
],
[
"f",
"i"
],
[
"h",
"e"
],
[
"d",
"i"
],
[
"o",
"s"
],
[
"i",
"t"
],
[
"layer",
"s"
],
[
"m",
"odel"
],
[
"v",
"o"
],
[
"ca",
"b"
],
[
"vo",
"cab"
],
[
"he",
"ad"
],
[
"Ġ{",
"\\\""
],
[
"u",
"re"
],
[
"Ġ5",
"12"
],
[
"s",
"t"
],
[
"po",
"si"
],
[
"ec",
"t"
],
[
"posi",
"tion"
],
[
"ma",
"x"
],
[
"n",
"orm"
],
[
"s",
"k"
],
[
"l",
"l"
],
[
"E",
"L"
],
[
"er",
"t"
],
[
"l",
"o"
],
[
"L",
"A"
],
[
"}",
","
],
[
"B",
"EL"
],
[
"LA",
"BEL"
],
[
"ac",
"t"
],
[
"head",
"s"
],
[
"an",
"s"
],
[
"ex",
"t"
],
[
"la",
"s"
],
[
"i",
"z"
],
[
"t",
"ext"
],
[
"tr",
"ans"
],
[
"at",
"e"
],
[
"t",
"h"
],
[
"v",
"er"
],
[
"a",
"tion"
],
[
"g",
"e"
],
[
"las",
"si"
],
[
"si",
"on"
],
[
"embedding",
"s"
],
[
"e",
"p"
],
[
"{",
"\\\""
],
[
"\"",
":"
],
[
"\"",
"}"
],
[
"\"",
"{\\\""
],
[
"}",
"\"}"
],
[
"č",
"Ċ"
],
[
"Ġ",
"\"{\\\""
],
[
"Ġ{",
"\""
],
[
"d",
"ec"
],
[
"Ġ[",
"\\\""
],
[
"\\\"",
"],"
],
[
"en",
"c"
],
[
"dec",
"oder"
],
[
"la",
"b"
],
[
"t",
"er"
],
[
"in",
"i"
],
[
"iz",
"er"
],
[
"lab",
"el"
],
[
"el",
"u"
],
[
"u",
"se"
],
[
"ti",
"v"
],
[
"ar",
"ch"
],
[
"f",
"orm"
],
[
"ure",
"s"
],
[
"l",
"en"
],
[
"it",
"ect"
],
[
"arch",
"itect"
],
[
"architect",
"ures"
],
[
"s",
"u"
],
[
"Ġ",
"4"
],
[
"p",
"at"
],
[
"trans",
"form"
],
[
"g",
"th"
],
[
"er",
"s"
],
[
"ti",
"al"
],
[
"lassi",
"fi"
],
[
"len",
"gth"
],
[
"g",
"elu"
],
[
"am",
"e"
],
[
"ver",
"sion"
],
[
"ma",
"sk"
],
[
"transform",
"ers"
],
[
"Ġ",
"7"
],
[
"ini",
"tial"
],
[
"b",
"ert"
],
[
"initial",
"izer"
],
[
"pat",
"h"
],
[
"p",
"ad"
],
[
"nu",
"ll"
],
[
"Ġ",
"null"
],
[
"c",
"on"
],
[
"f",
"e"
],
[
"n",
"ame"
],
[
"su",
"m"
],
[
"Ġ",
"6"
],
[
"n",
"g"
],
[
"F",
"or"
],
[
"r",
"an"
],
[
"Ġ\"{\\\"",
"_"
],
[
"di",
"m"
],
[
"ran",
"ge"
],
[
"l",
"e"
],
[
"6",
"8"
],
[
"f",
"lo"
],
[
"0",
"5"
],
[
"flo",
"at"
],
[
"t",
"or"
],
[
"3",
"2"
],
[
"d",
"type"
],
[
"tor",
"ch"
],
[
"m",
"ar"
],
[
"Ġ7",
"68"
],
[
"en",
"t"
],
[
"e",
"os"
],
[
"enc",
"oder"
],
[
"fe",
"at"
],
[
"ep",
"s"
],
[
"ch",
"e"
],
[
"ed",
"i"
],
[
"ca",
"che"
],
[
"in",
"ter"
],
[
"i",
"s"
],
[
"sum",
"mar"
],
[
"f",
"u"
],
[
"m",
"edi"
],
[
"o",
"l"
],
[
"ac",
"tiv"
],
[
"activ",
"ation"
],
[
"medi",
"ate"
],
[
"inter",
"mediate"
],
[
"c",
"lassifi"
],
[
"m",
"e"
],
[
"0",
"7"
],
[
"b",
"os"
],
[
"con",
"v"
],
[
"dro",
"p"
],
[
"e",
"v"
],
[
"pro",
"j"
],
[
"e",
"ar"
],
[
"07",
"2"
],
[
"summar",
"y"
],
[
"Ġ1",
"02"
],
[
"a",
"b"
],
[
"b",
"e"
],
[
"Ġ102",
"4"
],
[
"Ġ3",
"072"
],
[
"Ġ1",
"6"
],
[
"Ġ3",
"2"
],
[
"ca",
"tion"
],
[
"5",
"6"
],
[
"classifi",
"er"
],
[
"ec",
"k"
],
[
"n",
"el"
],
[
"prob",
"s"
],
[
"am",
"s"
],
[
"ch",
"eck"
],
[
"o",
"ut"
],
[
"ti",
"ng"
],
[
"p",
"ut"
],
[
"\\\"",
"},"
],
[
"s",
"c"
],
[
"po",
"in"
],
[
"check",
"poin"
],
[
"a",
"s"
],
[
"Ġ12",
"8"
],
[
"n",
"e"
],
[
"f",
"f"
],
[
"a",
"se"
],
[
"g",
"r"
],
[
"fu",
"ll"
],
[
"t",
"a"
],
[
"Ġ5",
"02"
],
[
"q",
"u"
],
[
"out",
"put"
],
[
"i",
"ent"
],
[
"ti",
"me"
],
[
"i",
"g"
],
[
"ar",
"t"
],
[
"u",
"p"
],
[
"a",
"p"
],
[
"gr",
"ad"
],
[
"grad",
"ient"
],
[
"Ġ",
"8"
],
[
"u",
"n"
],
[
"checkpoin",
"ting"
],
[
"p",
"er"
],
[
"s",
"ol"
],
[
"tiv",
"e"
],
[
"l",
"in"
],
[
"9",
"6"
],
[
"ex",
"tr"
],
[
"m",
"in"
],
[
"sc",
"al"
],
[
"b",
"i"
],
[
"1",
"6"
],
[
"bert",
"a"
],
[
"For",
"C"
],
[
"ut",
"e"
],
[
"ab",
"sol"
],
[
"absol",
"ute"
],
[
"c",
"k"
],
[
"L",
"M"
],
[
"lin",
"ear"
],
[
"t",
"s"
],
[
"f",
"or"
],
[
"a",
"v"
],
[
"c",
"tion"
],
[
"ig",
"h"
],
[
"b",
"ase"
],
[
"ect",
"or"
],
[
"d",
"o"
],
[
"l",
"y"
],
[
"Ġ1",
"0"
],
[
"4",
"8"
],
[
"Ġ4",
"0"
],
[
"extr",
"act"
],
[
"B",
"ert"
],
[
"c",
"t"
],
[
"be",
"ams"
],
[
"w",
"e"
],
[
"g",
"ro"
],
[
"C",
"lassifi"
],
[
"scal",
"e"
],
[
"Classifi",
"cation"
],
[
"p",
"t"
],
[
"layer",
"drop"
],
[
"gro",
"up"
],
[
"si",
"l"
],
[
"2",
"2"
],
[
"enc",
"e"
],
[
"we",
"igh"
],
[
"po",
"s"
],
[
"p",
"re"
],
[
"att",
"n"
],
[
"Ġ2",
"0"
],
[
"s",
"pe"
],
[
"c",
"od"
],
[
"a",
"u"
],
[
"1",
"0"
],
[
"f",
"in"
],
[
"en",
"er"
],
[
"Ġ40",
"96"
],
[
"po",
"ol"
],
[
"p",
"ar"
],
[
"bi",
"as"
],
[
"ch",
"an"
],
[
"ta",
"sk"
],
[
"chan",
"nel"
],
[
"ev",
"ector"
],
[
"cod",
"evector"
],
[
"r",
"ate"
],
[
"Bert",
"For"
],
[
"Ġ2",
"56"
],
[
"st",
"art"
],
[
"spe",
"c"
],
[
"to",
"p"
],
[
"pool",
"er"
],
[
"or",
"d"
],
[
"al",
"i"
],
[
"p",
"drop"
],
[
"feat",
"ure"
],
[
"qu",
"ence"
],
[
"ener",
"ation"
],
[
"M",
"odel"
],
[
"00",
"00"
],
[
"Ġ1",
"5"
],
[
"d",
"ev"
],
[
"emb",
"d"
],
[
"ad",
"ap"
],
[
"adap",
"ter"
],
[
"ad",
"d"
],
[
"ff",
"n"
],
[
"Ġ2",
"4"
],
[
"S",
"e"
],
[
"1",
"4"
],
[
"s",
"tr"
],
[
"k",
"er"
],
[
"Se",
"quence"
],
[
"Sequence",
"Classification"
],
[
"di",
"tion"
],
[
"Ġ6",
"4"
],
[
"p",
"a"
],
[
"ep",
"sil"
],
[
"epsil",
"on"
],
[
"Ġ20",
"48"
],
[
"d",
"e"
],
[
"fu",
"n"
],
[
"ti",
"l"
],
[
"tr",
"a"
],
[
"ker",
"nel"
],
[
"ti",
"e"
],
[
"os",
"s"
],
[
"ro",
"pe"
],
[
"fun",
"ction"
],
[
"c",
"e"
],
[
"p",
"ing"
],
[
"fi",
"x"
],
[
"l",
"oss"
],
[
"ro",
"berta"
],
[
"n",
"o"
],
[
"it",
"s"
],
[
"s",
"top"
],
[
"w",
"ord"
],
[
"la",
"tion"
],
[
"ear",
"ly"
],
[
"stop",
"ping"
],
[
"}",
"},"
],
[
"p",
"en"
],
[
"00",
"0"
],
[
"position",
"s"
],
[
"ti",
"c"
],
[
"p",
"le"
],
[
"dition",
"al"
],
[
"pa",
"st"
],
[
"n",
"n"
],
[
"fi",
"c"
],
[
"Ġ3",
"05"
],
[
"\\",
"\\"
],
[
"ali",
"ze"
],
[
"norm",
"alize"
],
[
"m",
"ent"
],
[
"pre",
"fix"
],
[
"la",
"tive"
],
[
"re",
"lative"
],
[
"G",
"eneration"
],
[
"l",
"em"
],
[
"id",
"e"
],
[
"group",
"s"
],
[
"on",
"ditional"
],
[
"onditional",
"Generation"
],
[
"ForC",
"onditionalGeneration"
],
[
"l",
"i"
],
[
"f",
"act"
],
[
"spec",
"i"
],
[
"fin",
"al"
],
[
"prob",
"lem"
],
[
"0",
"6"
],
[
"al",
"ty"
],
[
"lo",
"g"
],
[
"pen",
"alty"
],
[
"Ġ305",
"22"
],
[
"fact",
"or"
],
[
"label",
"s"
],
[
"classifi",
"cation"
],
[
"is",
"h"
],
[
"s",
"l"
],
[
"ct",
"c"
],
[
"v",
"al"
],
[
"fi",
"r"
],
[
"ac",
"e"
],
[
"fir",
"st"
],
[
"id",
"ing"
],
[
"sl",
"iding"
],
[
"ne",
"w"
],
[
"R",
"o"
],
[
"si",
"ng"
],
[
"s",
"am"
],
[
"par",
"ams"
],
[
"e",
"t"
],
[
"z",
"er"
],
[
"weigh",
"t"
],
[
"b",
"u"
],
[
"sing",
"le"
],
[
"speci",
"fic"
],
[
"se",
"d"
],
[
"log",
"its"
],
[
"Ġ502",
"56"
],
[
"1",
"9"
],
[
"l",
"s"
],
[
"ca",
"sed"
],
[
"st",
"a"
],
[
"t",
"d"
],
[
"ec",
"tion"
],
[
"in",
"it"
],
[
"str",
"ide"
],
[
"di",
"r"
],
[
"td",
"nn"
],
[
"k",
"e"
],
[
"di",
"s"
],
[
"s",
"o"
],
[
"g",
"pt"
],
[
"5",
"7"
],
[
"w",
"av"
],
[
"c",
"lassi"
],
[
"iz",
"ation"
],
[
"tra",
"in"
],
[
"ab",
"le"
],
[
"classi",
"f"
],
[
"s",
"h"
],
[
"sam",
"ple"
],
[
"T",
"o"
],
[
"5",
"12"
],
[
"v",
"ec"
],
[
"1",
"1"
],
[
"weigh",
"ts"
],
[
"r",
"i"
],
[
"w",
"ar"
],
[
"E",
"R"
],
[
"BertFor",
"SequenceClassification"
],
[
"d",
"at"
],
[
"sta",
"tic"
],
[
"do",
"w"
],
[
"in",
"d"
],
[
"To",
"ken"
],
[
"fi",
"g"
],
[
"s",
"al"
],
[
"v",
"i"
],
[
"Ġ5",
"14"
],
[
"summar",
"ization"
],
[
"o",
"o"
],
[
"k",
"v"
],
[
"dis",
"til"
],
[
"st",
"d"
],
[
"ed",
"u"
],
[
"ind",
"ex"
],
[
"Ġ5",
"0"
],
[
"Ro",
"berta"
],
[
"t",
"em"
],
[
"mask",
"s"
],
[
"l",
"ate"
],
[
"se",
"t"
],
[
"6",
"5"
],
[
"g",
"a"
],
[
"bu",
"ck"
],
[
"c",
"ed"
],
[
"ke",
"y"
],
[
"at",
"ch"
],
[
"e",
"ts"
],
[
"i",
"c"
],
[
"i",
"an"
],
[
"1",
"5"
],
[
"for",
"ced"
],
[
"buck",
"ets"
],
[
"P",
"T"
],
[
"n",
"er"
],
[
"l",
"ish"
],
[
"val",
"ue"
],
[
"1",
"8"
],
[
"od",
"e"
],
[
"w",
"in"
],
[
"M",
"a"
],
[
"2",
"5"
],
[
"la",
"r"
],
[
"Ġ",
"to"
],
[
"f",
"c"
],
[
"distil",
"bert"
],
[
"in",
"f"
],
[
"Ġ",
"E"
],
[
"trans",
"lation"
],
[
"po",
"ch"
],
[
"Ġ3",
"00"
],
[
"war",
"d"
],
[
"3",
"6"
],
[
"at",
"ed"
],
[
"e",
"poch"
],
[
"Ġ502",
"57"
],
[
"v",
"e"
],
[
"c",
"las"
],
[
"O",
"R"
],
[
"trans",
"late"
],
[
"ck",
"pt"
],
[
"s",
"s"
],
[
"fin",
"et"
],
[
"1",
"7"
],
[
"G",
"PT"
],
[
"at",
"ure"
],
[
"s",
"p"
],
[
"ĠE",
"ng"
],
[
"Ma",
"sk"
],
[
"au",
"sal"
],
[
"ausal",
"LM"
],
[
"ForC",
"ausalLM"
],
[
"lo",
"ck"
],
[
"ĠEng",
"lish"
],
[
"Ġ\\\"",
"},"
],
[
"re",
"si"
],
[
"Ġ\\\"",
"/"
],
[
"Mask",
"ed"
],
[
"qu",
"an"
],
[
"finet",
"un"
],
[
"s",
"el"
],
[
"r",
"am"
],
[
"ma",
"ge"
],
[
"Masked",
"LM"
],
[
"re",
"pe"
],
[
"resi",
"d"
],
[
"c",
"o"
],
[
"2",
"4"
],
[
"win",
"dow"
],
[
"lar",
"ge"
],
[
"in",
"ner"
],
[
"2",
"1"
],
[
"s",
"w"
],
[
"l",
"m"
],
[
"u",
"r"
],
[
"per",
"ature"
],
[
"tem",
"perature"
],
[
"ap",
"p"
],
[
"Ġ1",
"00"
],
[
"1",
"3"
],
[
"g",
"ment"
],
[
"con",
"fig"
],
[
"Ġ1",
"0000"
],
[
"fe",
"ed"
],
[
"Roberta",
"For"
],
[
"for",
"ward"
],
[
"al",
"l"
],
[
"un",
"cased"
],
[
"t",
"he"
],
[
"r",
"elu"
],
[
"id",
"s"
],
[
"A",
"R"
],
[
"2",
"0"
],
[
"m",
"an"
],
[
"O",
"N"
],
[
"Ġ2",
"5"
],
[
"app",
"ly"
],
[
"c",
"ls"
],
[
"for",
"e"
],
[
"be",
"fore"
],
[
"au",
"gment"
],
[
"Ġ1",
"4"
],
[
"Ġ502",
"65"
],
[
"Ġ",
"9"
],
[
"ng",
"ram"
],
[
"ga",
"tive"
],
[
"quan",
"ti"
],
[
"repe",
"at"
],
[
"D",
"i"
],
[
"ut",
"o"
],
[
"clas",
"s"
],
[
"m",
"s"
],
[
"zer",
"o"
],
[
"b",
"float"
],
[
"p",
"u"
],
[
"H",
"e"
],
[
"t",
"ar"
],
[
"r",
"edu"
],
[
"ne",
"gative"
],
[
"ar",
"n"
],
[
"redu",
"ction"
],
[
"th",
"er"
],
[
"ne",
"t"
],
[
"Ġ2",
"8"
],
[
"w",
"en"
],
[
"W",
"av"
],
[
"V",
"ec"
],
[
"Ġ1",
"1"
],
[
"con",
"tr"
],
[
"sil",
"u"
],
[
"ini",
"ty"
],
[
"a",
"i"
],
[
"o",
"ther"
],
[
"inf",
"inity"
],
[
"m",
"t"
],
[
"r",
"ms"
],
[
"b",
"atch"
],
[
"st",
"able"
],
[
"i",
"mage"
],
[
"sel",
"ection"
],
[
"an",
"d"
],
[
"He",
"ad"
],
[
"pat",
"ch"
],
[
"T",
"C"
],
[
"Ġ15",
"00"
],
[
"sp",
"ace"
],
[
"f",
"t"
],
[
"finetun",
"ing"
],
[
"set",
"ting"
],
[
"le",
"arn"
],
[
"12",
"8"
],
[
"setting",
"s"
],
[
"token",
"izer"
],
[
"the",
"ta"
],
[
"D",
"P"
],
[
"f",
"ace"
],
[
"f",
"r"
],
[
"oo",
"k"
],
[
"me",
"an"
],
[
"q",
"a"
],
[
"LM",
"Head"
],
[
"m",
"u"
],
[
"ct",
"x"
],
[
"D",
"E"
],
[
"b",
"ook"
],
[
"LMHead",
"Model"
],
[
"b",
"art"
],
[
"si",
"ty"
],
[
"Ġ32",
"0"
],
[
"ex",
"p"
],
[
"O",
"C"
],
[
"se",
"q"
],
[
"learn",
"ing"
],
[
"r",
"a"
],
[
"weight",
"ed"
],
[
"g",
"ated"
],
[
"00",
"02"
],
[
"Ġ\\\"",
"_"
],
[
"la",
"ma"
],
[
"l",
"t"
],
[
"T",
"I"
],
[
"vi",
"sion"
],
[
"channel",
"s"
],
[
"ForC",
"TC"
],
[
"u",
"b"
],
[
"8",
"4"
],
[
"P",
"R"
],
[
"ver",
"sity"
],
[
"b",
"lock"
],
[
"L",
"OC"
],
[
"B",
"ad"
],
[
"di",
"versity"
],
[
"Bad",
"Di"
],
[
"P",
"ER"
],
[
"face",
"book"
],
[
"epoch",
"s"
],
[
"OR",
"G"
],
[
"st",
"eps"
],
[
"m",
"p"
],
[
"Ġ15",
"16"
],
[
"negative",
"s"
],
[
"quanti",
"zer"
],
[
"codevector",
"s"
],
[
"as",
"tive"
],
[
"contr",
"astive"
],
[
"c",
"al"
],
[
"g",
"eneration"
],
[
"D",
"DP"
],
[
"DDP",
"M"
],
[
"Token",
"Classification"
],
[
"dat",
"a"
],
[
"D",
"is"
],
[
"p",
"r"
],
[
"dat",
"ase"
],
[
"A",
"n"
],
[
"Token",
"izer"
],
[
"id",
"al"
],
[
"so",
"idal"
],
[
"si",
"nu"
],
[
"sh",
"ar"
],
[
"sinu",
"soidal"
],
[
"0",
"4"
],
[
"Ġ",
"-"
],
[
"embd",
"s"
],
[
"_",
"\\\":"
],
[
"m",
"o"
],
[
"tr",
"al"
],
[
"Dis",
"til"
],
[
"e",
"s"
],
[
"C",
"I"
],
[
"Ġ1",
"3"
],
[
"ge",
"t"
],
[
"ue",
"s"
],
[
"checkpoin",
"t"
],
[
"A",
"uto"
],
[
"Ġ\\\"",
"."
],
[
"E",
"D"
],
[
"ali",
"ty"
],
[
"pre",
"train"
],
[
"2",
"6"
],
[
"BertFor",
"MaskedLM"
],
[
"ues",
"tion"
],
[
"b",
"y"
],
[
"S",
"C"
],
[
"an",
"ce"
],
[
"F",
"AR"
],
[
"ate",
"s"
],
[
"2",
"8"
],
[
"CI",
"FAR"
],
[
"3",
"5"
],
[
"lo",
"cal"
],
[
"se",
"ed"
],
[
"model",
"s"
],
[
"o",
"ver"
],
[
"fu",
"sion"
],
[
"m",
"ode"
],
[
"Q",
"uestion"
],
[
"di",
"lation"
],
[
"er",
"ing"
],
[
"1",
"00"
],
[
"is",
"on"
],
[
"U",
"N"
],
[
"ec",
"tra"
],
[
"g",
"lo"
],
[
"s",
"ch"
],
[
"id",
"i"
],
[
"An",
"sw"
],
[
"Ġ2",
"48"
],
[
"Answ",
"ering"
],
[
"Question",
"Answering"
],
[
"scal",
"ing"
],
[
"b",
"al"
],
[
"s",
"av"
],
[
"en",
"v"
],
[
"9",
"5"
],
[
"m",
"b"
],
[
"h",
"o"
],
[
"x",
"lm"
],
[
"\\\"",
"}\"}"
],
[
"glo",
"bal"
],
[
"m",
"em"
],
[
"l",
"p"
],
[
"s",
"m"
],
[
"so",
"ft"
],
[
"i",
"ze"
],
[
"M",
"T"
],
[
"2",
"3"
],
[
"Ġ3",
"0"
],
[
"b",
"idi"
],
[
"Ġ32",
"128"
],
[
"c",
"u"
],
[
"Ġ2",
"00"
],
[
"v",
"ector"
],
[
"token",
"s"
],
[
"P",
"o"
],
[
"sav",
"e"
],
[
"in",
"put"
],
[
"Ġ[",
"["
],
[
"x",
"vector"
],
[
"]",
"],"
],
[
"ord",
"er"
],
[
"datase",
"t"
],
[
"q",
"wen"
],
[
"h",
"y"
],
[
"g",
"le"
],
[
"ca",
"st"
],
[
"Ġ32",
"000"
],
[
"w",
"or"
],
[
"up",
"cast"
],
[
"in",
"ver"
],
[
"dir",
"ection"
],
[
"id",
"x"
],
[
"re",
"s"
],
[
"direction",
"ality"
],
[
"/",
"\\\","
],
[
"inver",
"se"
],
[
"re",
"order"
],
[
"B",
"art"
],
[
"tar",
"get"
],
[
"A",
"D"
],
[
"sm",
"all"
],
[
"mu",
"l"
],
[
"C",
"on"
],
[
"st",
"ance"
],
[
"h",
"is"
],
[
"A",
"T"
],
[
"2",
"56"
],
[
"ame",
"ter"
],
[
"par",
"ameter"
],
[
"Ġ2",
"6"
],
[
"N",
"L"
],
[
"x",
"ls"
],
[
"g",
"oo"
],
[
"shar",
"e"
],
[
"word",
"s"
],
[
"li",
"p"
],
[
"goo",
"gle"
],
[
"de",
"f"
],
[
"b",
"ad"
],
[
"m",
"lp"
],
[
"2",
"7"
],
[
"9",
"9"
],
[
"re",
"su"
],
[
"di",
"stance"
],
[
"b",
"o"
],
[
"his",
"per"
],
[
"NL",
"P"
],
[
"Ġ\\\"",
"}},"
],
[
"pretrain",
"ing"
],
[
"ar",
"ian"
],
[
"Ġ\\\".",
"/"
],
[
"Ġ[",
"],"
],
[
"3",
"3"
],
[
"l",
"r"
],
[
"wor",
"k"
],
[
"Ġ{",
"},"
],
[
"i",
"ce"
],
[
"p",
"or"
],
[
"ev",
"al"
],
[
"Ġ1516",
"4"
],
[
"au",
"lt"
],
[
"O",
"DE"
],
[
"ac",
"k"
],
[
"For",
"SequenceClassification"
],
[
"BadDi",
"ff"
],
[
"o",
"p"
],
[
"or",
"y"
],
[
"RobertaFor",
"SequenceClassification"
],
[
"g",
"er"
],
[
"lo",
"ad"
],
[
"k",
"i"
],
[
"parameter",
"s"
],
[
"f",
"re"
],
[
"def",
"ault"
],
[
"5",
"3"
],
[
"u",
"ct"
],
[
"l",
"lama"
],
[
"r",
"en"
],
[
"Ġ",
"F"
],
[
"hy",
"per"
],
[
"R",
"ates"
],
[
"f",
"n"
],
[
"Po",
"ison"
],
[
"BertFor",
"TokenClassification"
],
[
"Ġ5",
"6"
],
[
"Ġ",
"G"
],
[
"m",
"ic"
],
[
"tar",
"y"
],
[
"mem",
"ory"
],
[
"ro",
"tary"
],
[
"Ġ1",
"8"
],
[
"exp",
"ert"
],
[
"den",
"se"
],
[
"e",
"f"
],
[
"g",
"ener"
],
[
"mar",
"ian"
],
[
"er",
"man"
],
[
"M",
"I"
],
[
"5",
"4"
],
[
"M",
"arian"
],
[
"S",
"I"
],
[
"9",
"96"
],
[
"r",
"el"
],
[
"g",
"g"
],
[
"h",
"ub"
],
[
"ma",
"p"
],
[
"MT",
"Model"
],
[
"Marian",
"MTModel"
],
[
"3",
"4"
],
[
"on",
"e"
],
[
"summar",
"ize"
],
[
"sch",
"edu"
],
[
"ri",
"ve"
],
[
"u",
"al"
],
[
"ai",
"l"
],
[
"ren",
"ch"
],
[
"Bart",
"ForConditionalGeneration"
],
[
"ĠF",
"rench"
],
[
"si",
"n"
],
[
"b",
"in"
],
[
"0",
"1"
],
[
"sc",
"r"
],
[
"sw",
"ish"
],
[
"Ġ1",
"9"
],
[
"Ro",
"man"
],
[
"scr",
"atch"
],
[
"2",
"9"
],
[
"in",
"e"
],
[
"Ġ5",
"0000"
],
[
"S",
"T"
],
[
"X",
"LM"
],
[
"g",
"o"
],
[
"Ġ28",
"996"
],
[
"G",
"en"
],
[
"Q",
"wen"
],
[
"Ġ",
"Roman"
],
[
"ĠG",
"erman"
],
[
"ĠRoman",
"ian"
],
[
"t",
"p"
],
[
"Ġ2",
"24"
],
[
"p",
"ri"
],
[
"type",
"s"
],
[
"Distil",
"BertForSequenceClassification"
],
[
"6",
"4"
],
[
"it",
"e"
],
[
"5",
"8"
],
[
"c",
"f"
],
[
"m",
"ini"
],
[
"Ġ6",
"0"
],
[
"u",
"s"
],
[
"L",
"lama"
],
[
"m",
"i"
],
[
"pu",
"s"
],
[
"MI",
"SC"
],
[
"s",
"par"
],
[
"f",
"p"
],
[
"v",
"it"
],
[
"schedu",
"le"
],
[
"B",
"lock"
],
[
"en",
"d"
],
[
"Ġ3",
"84"
],
[
"m",
"m"
],
[
"u",
"tral"
],
[
"Con",
"fig"
],
[
"N",
"E"
],
[
"t",
"e"
],
[
"C",
"PR"
],
[
"ra",
"in"
],
[
"re",
"start"
],
[
"restart",
"s"
],
[
"el",
"ectra"
],
[
"w",
"r"
],
[
"mic",
"ro"
],
[
"o",
"pus"
],
[
"f",
"fusion"
],
[
"Ġ1",
"000"
],
[
"be",
"ta"
],
[
"m",
"ple"
],
[
"spar",
"se"
],
[
"micro",
"soft"
],
[
"la",
"st"
],
[
"Bert",
"Model"
],
[
"dow",
"n"
],
[
"H",
"el"
],
[
"Ġ2",
"1"
],
[
"S",
"M"
],
[
"u",
"m"
],
[
"sin",
"ki"
],
[
"Hel",
"sinki"
],
[
"ent",
"ail"
],
[
"entail",
"ment"
],
[
"a",
"ge"
],
[
"dev",
"ice"
],
[
"a",
"y"
],
[
"su",
"p"
],
[
"c",
"nn"
],
[
"expert",
"s"
],
[
"x",
"sum"
],
[
"i",
"p"
],
[
"Ġ248",
"05"
],
[
"u",
"c"
],
[
"Ġ512",
"0"
],
[
"5",
"0"
],
[
"wr",
"ite"
],
[
"pre",
"ss"
],
[
"Ġ6",
"2"
],
[
"over",
"write"
],
[
"7",
"68"
],
[
"Ġ3",
"6"
],
[
"Ġ14",
"2"
],
[
"mo",
"e"
],
[
"V",
"E"
],
[
"T",
"rain"
],
[
"p",
"si"
],
[
"BadDi",
"ffusion"
],
[
"Gen",
"BadDiffusion"
],
[
"BertFor",
"QuestionAnswering"
],
[
"cf",
"g"
],
[
"O",
"P"
],
[
"A",
"L"
],
[
"Ġ4",
"48"
],
[
"v",
"p"
],
[
"Auto",
"Model"
],
[
"ar",
"y"
],
[
"00",
"1"
],
[
"E",
"S"
],
[
"Ġ5",
"00"
],
[
"Ġ15",
"36"
],
[
"Ġ25",
"0002"
],
[
"inf",
"er"
],
[
"TI",
"ON"
],
[
"for",
"ce"
],
[
"re",
"g"
],
[
"sup",
"press"
],
[
"3",
"0"
],
[
"w",
"hisper"
],
[
"c",
"ro"
],
[
"ne",
"utral"
],
[
"t",
"mp"
],
[
"me",
"as"
],
[
"m",
"it"
],
[
"d",
"ep"
],
[
"con",
"dition"
],
[
"meas",
"ure"
],
[
"c",
"l"
],
[
"net",
"work"
],
[
"extr",
"a"
],
[
"3",
"1"
],
[
"14",
"4"
],
[
"form",
"er"
],
[
"sc",
"ri"
],
[
"n",
"li"
],
[
"mul",
"ti"
],
[
"b",
"j"
],
[
"RobertaFor",
"MaskedLM"
],
[
"0",
"8"
],
[
"ne",
"ss"
],
[
"av",
"i"
],
[
"se",
"quence"
],
[
"dep",
"th"
],
[
"I",
"N"
],
[
"Ġ1",
"7"
],
[
"un",
"its"
],
[
"19",
"2"
],
[
"e",
"ch"
],
[
"l",
"ts"
],
[
"s",
"tic"
],
[
"condition",
"ing"
],
[
"si",
"mple"
],
[
"t",
"t"
],
[
"resu",
"lts"
],
[
"p",
"h"
],
[
"Ġ10000",
"00"
],
[
"fre",
"q"
],
[
"m",
"rope"
],
[
"model",
"ing"
],
[
"Ġ4",
"8"
],
[
"str",
"uct"
],
[
"9",
"4"
],
[
"ter",
"mini"
],
[
"de",
"termini"
],
[
"Llama",
"ForCausalLM"
],
[
"determini",
"stic"
],
[
"c",
"c"
],
[
"v",
"is"
],
[
"Ġ\\\"",
"\\\\"
],
[
"fr",
"ame"
],
[
"h",
"u"
],
[
"ro",
"ut"
],
[
"ho",
"me"
],
[
"enc",
"ode"
],
[
"N",
"e"
],
[
"p",
"y"
],
[
"go",
"al"
],
[
"TI",
"VE"
],
[
"g",
"u"
],
[
"po",
"st"
],
[
"h",
"ic"
],
[
"o",
"m"
],
[
"E",
"N"
],
[
"c",
"le"
],
[
"Ġ",
"\\\\"
],
[
"Ġ128",
"0"
],
[
"con",
"t"
],
[
"t",
"c"
],
[
"Ġ32",
"768"
],
[
"is",
"tral"
],
[
"7",
"5"
],
[
"w",
"n"
],
[
"Ġ2",
"3"
],
[
"s",
"lo"
],
[
"Ġ3",
"0000"
],
[
"li",
"mit"
],
[
"b",
"ack"
],
[
"Ġ8",
"192"
],
[
"finetun",
"ed"
],
[
"Ġ8",
"0"
],
[
"a",
"uto"
],
[
"igh",
"t"
],
[
"ca",
"u"
],
[
"no",
"t"
],
[
"C",
"ON"
],
[
"P",
"AR"
],
[
"i",
"l"
],
[
"2",
"02"
],
[
"D",
"o"
],
[
"a",
"st"
],
[
"cau",
"sal"
],
[
"E",
"l"
],
[
"s",
"ent"
],
[
"m",
"el"
],
[
"si",
"g"
],
[
"I",
"n"
],
[
"q",
"kv"
],
[
"bin",
"s"
],
[
"Ġ2",
"7"
],
[
"en",
"g"
],
[
"Ġ8",
"4"
],
[
"3",
"00"
],
[
"ent",
"able"
],
[
"checkpoin",
"ts"
],
[
"op",
"entable"
],
[
"El",
"ectra"
],
[
"la",
"mb"
],
[
"I",
"mage"
],
[
"T",
"R"
],
[
"t",
"ur"
],
[
"Ġ3",
"5"
],
[
"m",
"od"
],
[
"lamb",
"d"
],
[
"c",
"el"
],
[
"inter",
"val"
],
[
"Ġ15164",
"3"
],
[
"h",
"avi"
],
[
"ra",
"ti"
],
[
"P",
"O"
],
[
"be",
"havi"
],
[
"6",
"6"
],
[
"ec",
"i"
],
[
"behavi",
"or"
],
[
"22",
"4"
],
[
"O",
"F"
],
[
"on",
"g"
],
[
"la",
"ng"
],
[
"cont",
"ent"
],
[
"t",
"an"
],
[
"causal",
"m"
],
[
"A",
"N"
],
[
"env",
"s"
],
[
"3",
"8"
],
[
"3",
"84"
],
[
"mt",
"p"
],
[
"}",
"}\"}"
],
[
"proj",
"ect"
],
[
"c",
"lip"
],
[
"ur",
"ation"
],
[
"ut",
"h"
],
[
"qu",
"ad"
],
[
"posi",
"tive"
],
[
"N",
"O"
],
[
"D",
"e"
],
[
"se",
"s"
],
[
"For",
"Image"
],
[
"ic",
"al"
],
[
"3",
"7"
],
[
"u",
"le"
],
[
"B",
"O"
],
[
"un",
"k"
],
[
"xls",
"r"
],
[
"p",
"l"
],
[
"per",
"i"
],
[
"sent",
"ence"
],
[
"tan",
"h"
],
[
"P",
"ro"
],
[
"su",
"s"
],
[
"so",
"ur"
],
[
"rout",
"er"
],
[
"ForImage",
"Classification"
],
[
"9",
"8"
],
[
"B",
"ER"
],
[
"al",
"bert"
],
[
"sc",
"i"
],
[
"ide",
"o"
],
[
"C",
"h"
],
[
"f",
"ro"
],
[
"Ġ6",
"5"
],
[
"back",
"b"
],
[
"block",
"s"
],
[
"BO",
"X"
],
[
"backb",
"one"
],
[
"m",
"up"
],
[
"Ġ1",
"19"
],
[
"de",
"berta"
],
[
"por",
"t"
],
[
"tr",
"ig"
],
[
"emb",
"ert"
],
[
"ga",
"sus"
],
[
"sour",
"ce"
],
[
"mi",
"x"
],
[
"par",
"tial"
],
[
"trig",
"ger"
],
[
"Ġ2",
"2"
],
[
"st",
"ates"
],
[
"Ġ26",
"2"
],
[
"struct",
"ure"
],
[
"h",
"i"
],
[
"clas",
"ses"
],
[
"ef",
"fic"
],
[
"au",
"x"
],
[
"O",
"D"
],
[
"st",
"ep"
],
[
"effic",
"ient"
],
[
"ti",
"n"
],
[
"d",
"rive"
],
[
"j",
"o"
],
[
"ing",
"ual"
],
[
"G",
"N"
],
[
"f",
"l"
],
[
"f",
"o"
],
[
"ar",
"e"
],
[
"war",
"mup"
],
[
"Ġ262",
"144"
],
[
"py",
"torch"
],
[
"9",
"0"
],
[
"ad",
"i"
],
[
"ma",
"mb"
],
[
"mamb",
"a"
],
[
"id",
"th"
],
[
"9",
"7"
],
[
"BER",
"T"
],
[
"w",
"er"
],
[
"Ġ502",
"58"
],
[
"Roberta",
"Model"
],
[
"quanti",
"z"
],
[
"cle",
"an"
],
[
"tr",
"i"
],
[
"Do",
"wn"
],
[
"Ġ15164",
"5"
],
[
"S",
"DE"
],
[
"g",
"s"
],
[
"r",
"un"
],
[
"gener",
"ate"
],
[
"tur",
"n"
],
[
"pad",
"ding"
],
[
"pr",
"edi"
],
[
"M",
"E"
],
[
"P",
"re"
],
[
"size",
"s"
],
[
">",
"\\\","
],
[
"w",
"idth"
],
[
"g",
"in"
],
[
"or",
"e"
],
[
"AT",
"E"
],
[
"quantiz",
"ation"
],
[
"V",
"i"
],
[
"C",
"O"
],
[
"M",
"y"
],
[
"on",
"ly"
],
[
"output",
"s"
],
[
"til",
"ingual"
],
[
"54",
"7"
],
[
"U",
"M"
],
[
"o",
"f"
],
[
"r",
"on"
],
[
"re",
"turn"
],
[
"shar",
"ed"
],
[
"Ġ3",
"1"
],
[
"mul",
"tilingual"
],
[
"SI",
"GN"
],
[
"For",
"MaskedLM"
],
[
"D",
"rive"
],
[
"P",
"C"
],
[
"s",
"de"
],
[
"Ġ5",
"8"
],
[
"g",
"am"
],
[
"F",
"I"
],
[
"v",
"ideo"
],
[
"rati",
"o"
],
[
"Ġ",
"and"
],
[
"adapter",
"s"
],
[
"A",
"I"
],
[
"U",
"R"
],
[
"Ġ13",
"1"
],
[
"7",
"7"
],
[
"N",
"et"
],
[
"s",
"pa"
],
[
"la",
"p"
],
[
"UN",
"C"
],
[
"CON",
"J"
],
[
"resu",
"lt"
],
[
"o",
"pen"
],
[
"in",
"al"
],
[
"s",
"quad"
],
[
"Ġ",
"<"
],
[
"at",
"or"
],
[
"datase",
"ts"
],
[
"H",
"E"
],
[
"b",
"its"
],
[
"e",
"b"
],
[
"Ġ131",
"072"
],
[
"tin",
"y"
],
[
"di",
"o"
],
[
"speci",
"al"
],
[
"co",
"m"
],
[
"re",
"po"
],
[
"Train",
"ing"
],
[
"PAR",
"T"
],
[
"Ġ119",
"547"
],
[
"spa",
"tial"
],
[
"_",
"_"
],
[
"re",
"ad"
],
[
"a",
"uth"
],
[
"be",
"gin"
],
[
"eci",
"sion"
],
[
"My",
"Drive"
],
[
"m",
"er"
],
[
"Auto",
"Config"
],
[
"ST",
"OP"
],
[
"Ġ50",
"3"
],
[
"a",
"gg"
],
[
"su",
"al"
],
[
"ke",
"ep"
],
[
"pr",
"ecision"
],
[
"mix",
"ed"
],
[
"d",
"el"
],
[
"er",
"y"
],
[
"po",
"ison"
],
[
"ac",
"c"
],
[
"g",
"pu"
],
[
"gener",
"ated"
],
[
"U",
"p"
],
[
"Ġ21",
"128"
],
[
"Y",
"M"
],
[
"a",
"k"
],
[
"00",
"5"
],
[
"sel",
"f"
],
[
"RobertaFor",
"TokenClassification"
],
[
"u",
"x"
],
[
"fi",
"l"
],
[
"pri",
"v"
],
[
"cel",
"l"
],
[
"un",
"slo"
],
[
"fro",
"m"
],
[
"priv",
"ate"
],
[
"unslo",
"th"
],
[
"4",
"6"
],
[
"4",
"2"
],
[
"pu",
"sh"
],
[
"V",
"P"
],
[
"ac",
"cu"
],
[
"d",
"er"
],
[
"attention",
"s"
],
[
"3",
"36"
],
[
"over",
"lap"
],
[
"c",
"ar"
],
[
"u",
"l"
],
[
"cro",
"ss"
],
[
"accu",
"mu"
],
[
"t",
"able"
],
[
"v",
"l"
],
[
"sta",
"ge"
],
[
"A",
"l"
],
[
"NE",
"G"
],
[
"4",
"0"
],
[
"N",
"UM"
],
[
"g",
"en"
],
[
"it",
"h"
],
[
"accumu",
"lation"
],
[
"h",
"or"
],
[
"sol",
"ver"
],
[
"h",
"as"
],
[
"UN",
"I"
],
[
"sig",
"n"
],
[
"gam",
"ma"
],
[
"e",
"ze"
],
[
"s",
"ad"
],
[
"un",
"ed"
],
[
"post",
"fix"
],
[
"F",
"OR"
],
[
"b",
"all"
],
[
"vi",
"sual"
],
[
"fc",
"lip"
],
[
"Ġ248",
"04"
],
[
"reg",
"ation"
],
[
"agg",
"regation"
],
[
"i",
"m"
],
[
"Ġ",
"96"
],
[
"la",
"n"
],
[
"sch",
"ed"
],
[
"bo",
"tt"
],
[
"in",
"t"
],
[
"se",
"ction"
],
[
"ma",
"in"
],
[
"adi",
"ction"
],
[
"o",
"bj"
],
[
"Ġ\\\"",
"<"
],
[
"em",
"ical"
],
[
"Ġ5",
"18"
],
[
"mod",
"ule"
],
[
"c",
"i"
],
[
"o",
"t"
],
[
"Ġ16",
"384"
],
[
"22",
"0"
],
[
"en",
"gth"
],
[
"layer",
"norm"
],
[
".",
"/"
],
[
"W",
"hisper"
],
[
"ers",
"on"
],
[
"le",
"av"
],
[
"gr",
"ap"
],
[
"contr",
"adiction"
],
[
"or",
"ig"
],
[
"li",
"fe"
],
[
"Ġ502",
"6"
],
[
"Whisper",
"ForConditionalGeneration"
],
[
"A",
"S"
],
[
"M",
"o"
],
[
"R",
"e"
],
[
"str",
"ength"
],
[
"r",
"u"
],
[
"Ġ5",
"7"
],
[
"&",
"_"
],
[
"_",
"&_"
],
[
"ation",
"al"
],
[
"len",
"eck"
],
[
"resid",
"ual"
],
[
"scri",
"pt"
],
[
"Vi",
"T"
],
[
"CO",
"M"
],
[
"a",
"e"
],
[
"v",
"el"
],
[
"Ġ15",
"19"
],
[
"de",
"ep"
],
[
"bott",
"leneck"
],
[
"th",
"od"
],
[
"medi",
"um"
],
[
"vi",
"ron"
],
[
"config",
"uration"
],
[
"pr",
"uned"
],
[
"soft",
"max"
],
[
"H",
"ED"
],
[
"M",
"ED"
],
[
"a",
"f"
],
[
"p",
"lay"
],
[
"quan",
"t"
],
[
"SC",
"HED"
],
[
"Down",
"Block"
],
[
"module",
"s"
],
[
"P",
"y"
],
[
"si",
"c"
],
[
"Ġ2",
"9"
],
[
"viron",
"ment"
],
[
"b",
"it"
],
[
"u",
"d"
],
[
"ne",
"o"
],
[
"d",
"uct"
],
[
"k",
"o"
],
[
"or",
"t"
],
[
"sh",
"a"
],
[
"X",
"ED"
],
[
"sam",
"pl"
],
[
"Ġ14",
"336"
],
[
"infer",
"ence"
],
[
"Al",
"bert"
],
[
"to",
"k"
],
[
"torch",
"script"
],
[
"FI",
"XED"
],
[
"M",
"istral"
],
[
"ti",
"tion"
],
[
"V",
"ER"
],
[
"m",
"is"
],
[
"an",
"ger"
],
[
"t",
"al"
],
[
"fe",
"ar"
],
[
"\\\\",
"\\\\"
],
[
"al",
"s"
],
[
"ase",
"d"
],
[
"Ġ25",
"0"
],
[
"peri",
"od"
],
[
"fo",
"od"
],
[
"g",
"an"
],
[
"E",
"n"
],
[
"H",
"u"
],
[
"g",
"ate"
],
[
"00",
"8"
],
[
"pretrain",
"ed"
],
[
"ig",
"n"
],
[
"repe",
"tition"
],
[
"Ġ50000",
"0"
],
[
"UNI",
"PC"
],
[
"sad",
"ness"
],
[
"Ġ1519",
"36"
],
[
"4",
"4"
],
[
"re",
"vision"
],
[
"au",
"dio"
],
[
"A",
"U"
],
[
"c",
"ol"
],
[
"inter",
"leav"
],
[
"bi",
"ased"
],
[
"s",
"y"
],
[
"ver",
"s"
],
[
"no",
"w"
],
[
"5",
"5"
],
[
"l",
"ong"
],
[
"Ġ",
"the"
],
[
"orig",
"inal"
],
[
"ar",
"gs"
],
[
"2",
"000"
],
[
"en",
"ti"
],
[
"to",
"m"
],
[
"le",
"vel"
],
[
"Ġ25",
"01"
],
[
"OD",
"EL"
],
[
"Pre",
"Training"
],
[
"s",
"er"
],
[
"For",
"QuestionAnswering"
],
[
"T",
"ar"
],
[
"w",
"ay"
],
[
"li",
"c"
],
[
"ViT",
"ForImageClassification"
],
[
"M",
"ODEL"
],
[
"m",
"nli"
],
[
"mp",
"net"
],
[
"cro",
"p"
],
[
"PO",
"SI"
],
[
"Ġ518",
"65"
],
[
"ca",
"m"
],
[
"em",
"o"
],
[
"ff",
"er"
],
[
"jo",
"y"
],
[
"fil",
"ter"
],
[
"5",
"2"
],
[
"train",
"ing"
],
[
"por",
"al"
],
[
"NEG",
"A"
],
[
"p",
"erson"
],
[
"me",
"thod"
],
[
"sh",
"i"
],
[
"con",
"vers"
],
[
"15",
"2"
],
[
"Tar",
"get"
],
[
"i",
"e"
],
[
"ar",
"d"
],
[
"cod",
"e"
],
[
"RobertaFor",
"QuestionAnswering"
],
[
"res",
"net"
],
[
"fre",
"eze"
],
[
"S",
"now"
],
[
"T",
"r"
],
[
"i",
"li"
],
[
"pe",
"gasus"
],
[
"su",
"r"
],
[
"bu",
"g"
],
[
"tem",
"poral"
],
[
"hic",
"s"
],
[
"ball",
"Target"
],
[
"POSI",
"TIVE"
],
[
"Snow",
"ballTarget"
],
[
"i",
"ty"
],
[
"m",
"bart"
],
[
"an",
"t"
],
[
"iz",
"on"
],
[
"mer",
"ge"
],
[
"hor",
"izon"
],
[
"Ġ4",
"3"
],
[
"ram",
"ids"
],
[
"Py",
"ramids"
],
[
"Ġ2501",
"12"
],
[
"NEGA",
"TIVE"
],
[
"en",
"vironment"
],
[
"be",
"st"
],
[
"cam",
"embert"
],
[
"x",
"l"
],
[
"ver",
"age"
],
[
"qu",
"ality"
],
[
"de",
"bug"
],
[
"grap",
"hics"
],
[
"convers",
"ational"
],
[
"4",
"3"
],
[
"5",
"9"
],
[
"g",
"ap"
],
[
"pe",
"ech"
],
[
"bi",
"o"
],
[
"AD",
"J"
],
[
"hic",
"le"
],
[
"sum",
"e"
],
[
"qu",
"i"
],
[
"ss",
"m"
],
[
"re",
"sume"
],
[
"train",
"er"
],
[
"Ġ",
"S"
],
[
"Up",
"Block"
],
[
"or",
"a"
],
[
"lambd",
"a"
],
[
"i",
"se"
],
[
"ve",
"hicle"
],
[
"sur",
"pri"
],
[
"re",
"ward"
],
[
"32",
"0"
],
[
"bu",
"ffer"
],
[
"EN",
"T"
],
[
"u",
"ction"
],
[
"al",
"o"
],
[
"initial",
"ize"
],
[
"For",
"TokenClassification"
],
[
"lang",
"u"
],
[
"g",
"em"
],
[
"ans",
"wer"
],
[
"spe",
"ech"
],
[
"fix",
"ed"
],
[
"interleav",
"ed"
],
[
"langu",
"age"
],
[
"h",
"f"
],
[
"on",
"ing"
],
[
"he",
"ight"
],
[
"Ġ24804",
"4"
],
[
"7",
"9"
],
[
"8",
"0"
],
[
"q",
"k"
],
[
"ter",
"n"
],
[
"qu",
"ery"
],
[
"Ġ256",
"0"
],
[
"cu",
"s"
],
[
"m",
"istral"
],
[
"p",
"la"
],
[
"th",
"read"
],
[
"Ġ50",
"36"
],
[
"acc",
"ep"
],
[
"a",
"verage"
],
[
"Ġ3",
"3"
],
[
"lo",
"cation"
],
[
"AutoModel",
"ForCausalLM"
],
[
"eng",
"ine"
],
[
"surpri",
"se"
],
[
"min",
"ator"
],
[
"AD",
"V"
],
[
"Ġ19",
"2"
],
[
"AU",
"X"
],
[
"\\\"",
"}}\"}"
],
[
"pt",
"ure"
],
[
"hyper",
"parameters"
],
[
"behavior",
"al"
],
[
"Q",
"U"
],
[
"l",
"ue"
],
[
"in",
"sic"
],
[
"extr",
"insic"
],
[
"sp",
"an"
],
[
"Ġ\\\".",
"./"
],
[
"Ġ500",
"5"
],
[
"behavior",
"s"
],
[
"sign",
"als"
],
[
"7",
"0"
],
[
"g",
"i"
],
[
"ca",
"pture"
],
[
"Ġ3",
"10"
],
[
"cl",
"oning"
],
[
"De",
"berta"
],
[
"are",
"as"
],
[
"life",
"time"
],
[
"thread",
"ed"
],
[
"7",
"2"
],
[
"ec",
"ut"
],
[
"ex",
"ecut"
],
[
"co",
"mm"
],
[
"NO",
"UN"
],
[
"B",
"i"
],
[
"H",
"I"
],
[
"able",
"s"
],
[
"ph",
"m"
],
[
"M",
"ini"
],
[
"Ġ2",
"0000"
],
[
"di",
"scri"
],
[
"tem",
"p"
],
[
"discri",
"minator"
],
[
"Distil",
"BertForMaskedLM"
],
[
"open",
"ai"
],
[
"sha",
"pe"
],
[
"accep",
"table"
],
[
"ll",
"m"
],
[
"con",
"str"
],
[
"Bert",
"Tokenizer"
],
[
"execut",
"ables"
],
[
"Ġ",
"of"
],
[
"ad",
"ditional"
],
[
"del",
"ta"
],
[
"cus",
"tom"
],
[
"c",
"os"
],
[
"index",
"es"
],
[
"Ġ11",
"008"
],
[
"6",
"0"
],
[
"8",
"8"
],
[
"Ġ\\\"",
","
],
[
"Ġ1",
"152"
],
[
"bi",
"le"
],
[
"ca",
"p"
],
[
"lo",
"w"
],
[
"DE",
"T"
],
[
"sequence",
"s"
],
[
"top",
"k"
],
[
"/",
"."
],
[
"O",
"T"
],
[
"p",
"ct"
],
[
"Ġ10000",
"000"
],
[
"fl",
"at"
],
[
"I",
"S"
],
[
"l",
"n"
],
[
"000",
"3"
],
[
"3",
"9"
],
[
"c",
"or"
],
[
"s",
"ers"
],
[
"gg",
"ing"
],
[
"t",
"u"
],
[
"Ġ50",
"35"
],
[
"op",
"ti"
],
[
"predi",
"ct"
],
[
"constr",
"uction"
],
[
"l",
"ora"
],
[
"m",
"r"
],
[
"q",
"g"
],
[
"t",
"as"
],
[
"PR",
"ON"
],
[
"PR",
"OP"
],
[
"E",
"X"
],
[
"o",
"ff"
],
[
"se",
"ase"
],
[
"Ġ128",
"000"
],
[
"10",
"3"
],
[
"bo",
"t"
],
[
"e",
"qui"
],
[
"si",
"an"
],
[
"val",
"ent"
],
[
"VER",
"B"
],
[
"equi",
"valent"
],
[
"0",
"9"
],
[
"c",
"oder"
],
[
"se",
"p"
],
[
"R",
"O"
],
[
"st",
"ack"
],
[
"su",
"bj"
],
[
"U",
"S"
],
[
"Ġ5",
"95"
],
[
"co",
"la"
],
[
"A",
"DP"
],
[
"b",
"ig"
],
[
"l",
"u"
],
[
"For",
"PreTraining"
],
[
"sampl",
"ing"
],
[
"PROP",
"N"
],
[
"C",
"o"
],
[
"b",
"a"
],
[
"c",
"ated"
],
[
"r",
"d"
],
[
"train",
"ed"
],
[
"Auto",
"Train"
],
[
"temp",
"late"
],
[
"5",
"1"
],
[
"S",
"YM"
],
[
"n",
"i"
],
[
"feat",
"ures"
],
[
"XLM",
"RobertaForTokenClassification"
],
[
"P",
"UNC"
],
[
"s",
"a"
],
[
"pro",
"duct"
],
[
"bin",
"ary"
],
[
"Ch",
"emical"
],
[
"Mistral",
"ForCausalLM"
],
[
"ch",
"unk"
],
[
"lo",
"om"
],
[
"vi",
"ce"
],
[
"Ġ23",
"04"
],
[
"A",
"tt"
],
[
"C",
"CONJ"
],
[
"m",
"on"
],
[
"den",
"t"
],
[
"lin",
"ux"
],
[
"ign",
"ore"
],
[
"m",
"lm"
],
[
"s",
"v"
],
[
"10",
"1"
],
[
"eb",
"d"
],
[
"N",
"C"
],
[
"b",
"m"
],
[
"}",
"}},"
],
[
"28",
"8"
],
[
"hu",
"gging"
],
[
"PUNC",
"T"
],
[
"7",
"4"
],
[
"E",
"V"
],
[
"i",
"x"
],
[
"p",
"po"
],
[
"Ġ3",
"4"
],
[
"co",
"efficient"
],
[
"c",
"en"
],
[
"o",
"u"
],
[
"s",
"st"
],
[
"un",
"d"
],
[
"000",
"1"
],
[
"depth",
"s"
],
[
"IN",
"T"
],
[
"n",
"on"
],
[
"F",
"E"
],
[
"i",
"mp"
],
[
"o",
"us"
],
[
"st",
"em"
],
[
"sk",
"ip"
],
[
"AT",
"UR"
],
[
"Att",
"n"
],
[
"S",
"o"
],
[
"Ġ5",
"9"
],
[
"F",
"ast"
],
[
"al",
"th"
],
[
"XLM",
"RobertaForSequenceClassification"
],
[
"um",
"n"
],
[
"HE",
"AD"
],
[
"col",
"umn"
],
[
"D",
"ATE"
],
[
"M",
"ul"
],
[
"ma",
"il"
],
[
"vo",
"x"
],
[
"lo",
"ve"
],
[
"co",
"ef"
],
[
"deep",
"stack"
],
[
"b",
"r"
],
[
"d",
"u"
],
[
"Ġ",
"st"
],
[
"Ġ{",
"}},"
],
[
"new",
"s"
],
[
"co",
"mp"
],
[
"Ġ248",
"320"
],
[
"gg",
"y"
],
[
"C",
"am"
],
[
"f",
"ast"
],
[
"eng",
"lish"
],
[
"span",
"ish"
],
[
"4",
"9"
],
[
"A",
"TION"
],
[
"lay",
"out"
],
[
"d",
"edi"
],
[
"u",
"st"
],
[
"st",
"u"
],
[
"OR",
"A"
],
[
"aux",
"ili"
],
[
"Mul",
"ti"
],
[
"dedi",
"cated"
],
[
"auxili",
"ary"
],
[
"Y",
"P"
],
[
"t",
"ec"
],
[
"norm",
"al"
],
[
"Ne",
"o"
],
[
"Electra",
"ForSequenceClassification"
],
[
"FE",
"ATUR"
],
[
"F",
"T"
],
[
"Ġ3",
"9"
],
[
"Ġ4",
"6"
],
[
"re",
"pla"
],
[
"bert",
"s"
],
[
"G",
"E"
],
[
"\\\"",
"]"
],
[
"Hu",
"ggy"
],
[
"Ġ43",
"04"
],
[
"-",
"-"
],
[
"8",
"24"
],
[
"H",
"AT"
],
[
"b",
"er"
],
[
"f",
"alse"
],
[
"Ġ\\\"",
"["
],
[
"to",
"tal"
],
[
"N",
"ame"
],
[
"an",
"e"
],
[
"NE",
"U"
],
[
"F",
"ED"
],
[
"w",
"s"
],
[
"tr",
"on"
],
[
"em",
"ent"
],
[
"res",
"sion"
],
[
"FED",
"ORA"
],
[
"7",
"3"
],
[
"Ġ12",
"288"
],
[
"st",
"s"
],
[
"En",
"coder"
],
[
"Deberta",
"V"
],
[
"4",
"5"
],
[
"7",
"8"
],
[
"di",
"ct"
],
[
"Ġ502",
"64"
],
[
"GPT",
"Neo"
],
[
"gu",
"st"
],
[
"stu",
"dent"
],
[
"I",
"C"
],
[
"M",
"P"
],
[
"b",
"s"
],
[
"Ġ",
"re"
],
[
"val",
"id"
],
[
"layout",
"lm"
],
[
"O",
"r"
],
[
"c",
"y"
],
[
"n",
"l"
],
[
"x",
"i"
],
[
"se",
"arch"
],
[
"ac",
"tion"
],
[
"len",
"der"
],
[
"architect",
"ure"
],
[
"ap",
"pro"
],
[
"no",
"ise"
],
[
"cen",
"ter"
],
[
"A",
"C"
],
[
"P",
"e"
],
[
"proj",
"ector"
],
[
"long",
"former"
],
[
"7",
"6"
],
[
"ch",
"ine"
],
[
"an",
"g"
],
[
"fusion",
"s"
],
[
"INT",
"J"
],
[
"lender",
"bot"
],
[
"V",
"L"
],
[
"f",
"er"
],
[
"07",
"5"
],
[
"lin",
"e"
]
]
}
}