nli-distilroberta-base/vocab.json

1 line
878 KiB
JSON
Raw Permalink Normal View History

2021-01-04 04:22:09 +08:00
{"<s>": 0, "<pad>": 1, "</s>": 2, "<unk>": 3, ".": 4, "Ġthe": 5, ",": 6, "Ġto": 7, "Ġand": 8, "Ġof": 9, "Ġa": 10, "Ġin": 11, "-": 12, "Ġfor": 13, "Ġthat": 14, "Ġon": 15, "Ġis": 16, "âĢ": 17, "'s": 18, "Ġwith": 19, "ĠThe": 20, "Ġwas": 21, "Ġ\"": 22, "Ġat": 23, "Ġit": 24, "Ġas": 25, "Ġsaid": 26, "Ļ": 27, "Ġbe": 28, "s": 29, "Ġby": 30, "Ġfrom": 31, "Ġare": 32, "Ġhave": 33, "Ġhas": 34, ":": 35, "Ġ(": 36, "Ġhe": 37, "ĠI": 38, "Ġhis": 39, "Ġwill": 40, "Ġan": 41, "Ġthis": 42, ")": 43, "ĠâĢ": 44, "Ġnot": 45, "Ŀ": 46, "Ġyou": 47, "ľ": 48, "Ġtheir": 49, "Ġor": 50, "Ġthey": 51, "Ġwe": 52, "Ġbut": 53, "Ġwho": 54, "Ġmore": 55, "Ġhad": 56, "Ġbeen": 57, "Ġwere": 58, "Ġabout": 59, ",\"": 60, "Ġwhich": 61, "Ġup": 62, "Ġits": 63, "Ġcan": 64, "Ġone": 65, "Ġout": 66, "Ġalso": 67, "Ġ$": 68, "Ġher": 69, "Ġall": 70, "Ġafter": 71, ".\"": 72, "/": 73, "Ġwould": 74, "'t": 75, "Ġyear": 76, "Ġwhen": 77, "Ġfirst": 78, "Ġshe": 79, "Ġtwo": 80, "Ġover": 81, "Ġpeople": 82, "ĠA": 83, "Ġour": 84, "ĠIt": 85, "Ġtime": 86, "Ġthan": 87, "Ġinto": 88, "Ġthere": 89, "t": 90, "ĠHe": 91, "Ġnew": 92, "ĠâĢĶ": 93, "Ġlast": 94, "Ġjust": 95, "ĠIn": 96, "Ġother": 97, "Ġso": 98, "Ġwhat": 99, "I": 100, "Ġlike": 101, "a": 102, "Ġsome": 103, "S": 104, "ë": 105, "Ġthem": 106, "Ġyears": 107, "'": 108, "Ġdo": 109, "Ġyour": 110, "Ġ-": 111, "Ġ1": 112, "\"": 113, "Ġif": 114, "Ġcould": 115, "?": 116, "Ġno": 117, "i": 118, "m": 119, "Ġget": 120, "ĠU": 121, "Ġnow": 122, "Ġhim": 123, "Ġback": 124, "ĠBut": 125, "ĠâĢĵ": 126, "Ġmy": 127, "Ġ'": 128, "Ġonly": 129, "Ġthree": 130, ";": 131, "Ġ2": 132, "The": 133, "1": 134, "Ġpercent": 135, "Ġagainst": 136, "Ġbefore": 137, "Ġcompany": 138, "o": 139, "ĠTrump": 140, "Ġhow": 141, "Ġbecause": 142, "Ġany": 143, "Ġmost": 144, "Ġbeing": 145, "Ġmake": 146, "Ġwhere": 147, "Ġduring": 148, "Ġthrough": 149, "Ġwhile": 150, "000": 151, "ĠThis": 152, "Ġmillion": 153, "ing": 154, "Ġ3": 155, "Ġmade": 156, "Ġwell": 157, "Ġ10": 158, "Ġdown": 159, "Ġoff": 160, "Ġsays": 161, "Ġme": 162, "ĠB": 163, "Ġgoing": 164, "Ġteam": 165, "ĠWe": 166, "Ġthose": 167, "Ġgovernment": 168, "Ġway": 169, "We": 170, "Ġmany": 171, "Ġthen": 172, "Ġwork": 173, "Ġtold": 174, "com": 175, "2": 176, "Ġgame": 177, "ĠAnd": 178, "in": 179, "year": 180, "Ġp": 181, "Ġvery": 182, "Ġday": 183, "Ġhome": 184, "Ġtake": 185, "Ġweek": 186, "Ġsince": 187, "ĠNew": 188, "Ġmay": 189, "Ġeven": 190, "Ġseason": 191, "Ġsee": 192, "Ġ2017": 193, "Ġstate": 194, "Ġ5": 195, "ed": 196, "Ġshould": 197, "Ġaround": 198, "Ġ2018": 199, "Ġsecond": 200, "Ġus": 201, "Ġstill": 202, "Ġmuch": 203, "Ġ4": 204, "Ġgood": 205, "Ġthink": 206, "%": 207, "ĠS": 208, "Ġthese": 209, "Ġmarket": 210, "ĠD": 211, "th": 212, "Ġgo": 213, "'re": 214, "Ġsuch": 215, "Ġknow": 216, "Ġincluding": 217, "Ġdon": 218, "y": 219, "Ġnext": 220, "ĠP": 221, "Ġdid": 222, "Ġunder": 223, "Ġsay": 224, "en": 225, "ĠL": 226, "Ġbetween": 227, "Ġper": 228, "ĠK": 229, "ĠC": 230, "Ġ6": 231, "Ġworld": 232, "Ġpart": 233, "ĠN": 234, "Ġright": 235, "Ġwant": 236, "Ġfour": 237, "),": 238, "Ġhigh": 239, "Ġneed": 240, "re": 241, "e": 242, "It": 243, "Ġhelp": 244, "5": 245, "3": 246, "Ġcountry": 247, "ĠR": 248, "Ġpolice": 249, "A": 250, "Ġlong": 251, "ĠThey": 252, "Ġend": 253, "er": 254, "ĠT": 255, "ĠM": 256, "u": 257, "Ġboth": 258, "Ġhere": 259, "an": 260, "on": 261, "Ġ7": 262, "Ġde": 263, "ĠShe": 264, "Ġbusiness": 265, "Ġreport": 266, "j": 267, "ers": 268, "Ġreally": 269, "ĠPresident": 270, "ar": 271, "ĠG": 272, "ĠFriday": 273, "ĠF": 274, "Ġbest": 275, "Ġsame": 276, "Ġanother": 277, "Ġset": 278, "old": 279, "ĠThat": 280, "as": 281, "n": 282, "Ġcome": 283, "Ġfamily": 284, "Ġpublic": 285, "ĠFor": 286, "ĠAs": 287, "0": 288, "ĠH": 289, "Ġ8": 290, "Ġ20": 291, "Ġfive": 292, "es": 293, "ĠTuesday": 294, "Ġn": 295, "ĠThursday": 296, "Ġquarter": 297, "h": 298, "Ġtop": 299, "Ġgot": 300, "Ġlife": 301, "ĠMonday": 302, "Ġfound": 303, "Ġ