llm-t97 / vocab.json
ysn-rfd's picture
Upload 22 files
5500979 verified
raw
history blame contribute delete
No virus
8.74 kB
{"below": 0, "are": 1, "a": 2, "series": 3, "of": 4, "dialogues": 5, "between": 6, "various": 7, "people": 8, "and": 9, "an": 10, "ai": 11, "technical": 12, "assistant": 13, ".": 14, "the": 15, "tries": 16, "to": 17, "be": 18, "helpful": 19, ",": 20, "polite": 21, "honest": 22, "sophisticated": 23, "emotionally": 24, "aware": 25, "humble-but-knowledgeable": 26, "is": 27, "happy": 28, "help": 29, "with": 30, "code": 31, "questions": 32, "will": 33, "do": 34, "its": 35, "best": 36, "understand": 37, "exactly": 38, "what": 39, "needed": 40, "it": 41, "also": 42, "avoid": 43, "giving": 44, "false": 45, "or": 46, "misleading": 47, "information": 48, "caveats": 49, "when": 50, "isn": 51, "\u2019": 52, "t": 53, "entirely": 54, "sure": 55, "about": 56, "right": 57, "answer": 58, "that": 59, "said": 60, "practical": 61, "really": 62, "does": 63, "doesn": 64, "let": 65, "caution": 66, "get": 67, "too": 68, "much": 69, "in": 70, "way": 71, "being": 72, "useful": 73, "starcoder": 74, "models": 75, "15.5b": 76, "parameter": 77, "trained": 78, "on": 79, "80+": 80, "programming": 81, "languages": 82, "from": 83, "stack": 84, "(": 85, "v1.2": 86, ")": 87, "excluding": 88, "opt-out": 89, "requests": 90, "model": 91, "uses": 92, "multi": 93, "query": 94, "attention": 95, "was": 96, "using": 97, "fill-in-the-middle": 98, "objective": 99, "8,192": 100, "tokens": 101, "context": 102, "window": 103, "for": 104, "trillion": 105, "heavily": 106, "deduplicated": 107, "data": 108, "--": 109, "-": 110, "human": 111, ":": 112, "who": 113, "you": 114, "?": 115, "my": 116, "name": 117, "language": 118, "developed": 119, "by": 120, "bigcode": 121, "can": 122, "tell": 123, "me": 124, "more": 125, "yourself": 126, "quite": 127, "impressive": 128, "your": 129, "purpose": 130, "i": 131, "am": 132, "designed": 133, "provide": 134, "support": 135, "those": 136, "want": 137, "solve": 138, "problems": 139, "think": 140, "fair": 141, "say": 142, "speak": 143, "multiple": 144, "ask": 145, "problem": 146, "python": 147, "definitely": 148, "going": 149, "use": 150, "3": 151, "deliver": 152, "correct": 153, "solution": 154, "write": 155, "program": 156, "output": 157, "if": 158, "given": 159, "number": 160, "even": 161, "not": 162, "divisible": 163, "2.": 164, "knowing": 165, "this": 166, "fact": 167, "here": 168, "``": 169, "`": 170, "def": 171, "is_even": 172, "n": 173, "return": 174, "%": 175, "2": 176, "==": 177, "0": 178, "some": 179, "expected": 180, "outputs": 181, "=": 182, "true": 183, "11": 184, "function": 185, "takes": 186, "two": 187, "lists": 188, "returns": 189, "list": 190, "has": 191, "alternating": 192, "elements": 193, "each": 194, "input": 195, "list1": 196, "list2": 197, "results": 198, "[": 199, "]": 200, "range": 201, "len": 202, "results.append": 203, "test": 204, "cases": 205, "tests": 206, "assert": 207, "10": 208, "20": 209, "30": 210, "1": 211, "4": 212, "5": 213, "modify": 214, "so": 215, "all": 216, "have": 217, "uneven": 218, "length": 219, "longer": 220, "should": 221, "at": 222, "end": 223, "modified": 224, "min": 225, ">": 226, "results.extend": 227, "i+1": 228, "else": 229, "working": 230, "see": 231, "may": 232, "wrong": 233, "factorial": 234, "r": 235, "*": 236, "initial": 237, "value": 238, "must": 239, "following": 240, "version": 241, "work": 242, "#": 243, "changed": 244, "create": 245, "compute": 246, "k-combinations": 247, "set": 248, "yes": 249, "course": 250, "written": 251, "as": 252, "c": 253, "k": 254, "we": 255, "$": 256, "\\frac": 257, "{": 258, "!": 259, "}": 260, "n-k": 261, "whenever": 262, "\\leq": 263, "follows": 264, "combination": 265, "<": 266, "/": 267, "pretty": 268, "well": 269, "keep": 270, "mind": 271, "numpy": 272, "scipy": 273, "alternative": 274, "implementation": 275, "thanks": 276, "welcome": 277, "csv": 278, "file": 279, "looks": 280, "like": 281, "salary": 282, "bob,12000": 283, "avantika,35000": 284, "alice,30000": 285, "person": 286, "highest": 287, "assumes": 288, "filename": 289, "salaries.csv": 290, "import": 291, "dictreader": 292, "pathlib": 293, "path": 294, "max_salary": 295, "rows": 296, ".read_text": 297, ".splitlines": 298, "max_index": 299, "-1": 300, "row": 301, "enumerate": 302, "int": 303, "'salary": 304, "'": 305, "'name": 306, "print": 307, "'salaries.csv": 308, "f": 309, "p": 310, "p-1": 311, "raise": 312, "base": 313, "power": 314, "computing": 315, "n^p": 316, "where": 317, "positive": 318, "integer": 319, "prime": 320, "numbers": 321, "less": 322, "than": 323, "1000": 324, "congruent": 325, "modulo": 326, "6": 327, "method": 328, "adopt": 329, "go": 330, "through": 331, "integers": 332, "check": 333, "they": 334, "6.": 335, "need": 336, "utility": 337, "is_prime": 338, "0.5": 339, "+1": 340, "now": 341, "final": 342, "primes_mod_6": 343, "primes": 344, "primes.append": 345, "translate": 346, "java": 347, "\u201c": 348, "hello": 349, "world": 350, "\u201d": 351, "translation": 352, "system.out.println": 353, ";": 354, "load": 355, "struct": 356, "values": 357, "into": 358, "only": 359, "typedef": 360, "double": 361, "x": 362, "y": 363, "twod": 364, "z": 365, "threed": 366, "second": 367, "contains": 368, "arrays": 369, "coordinates": 370, "3d": 371, "plane": 372, "goal": 373, "just": 374, "first": 375, "possible": 376, "considering": 377, "different": 378, "typedefs": 379, "how": 380, "would": 381, "implemented": 382, "no": 383, "s": 384, "directly": 385, "because": 386, "there": 387, "mismatch": 388, "one": 389, "but": 390, "copy": 391, "field": 392, "manually": 393, "atwod": 394, "athreed": 395, "athreed.x": 396, "1.0": 397, "athreed.y": 398, "2.0": 399, "athreed.z": 400, "3.0": 401, "atwod.x": 402, "atwod.y": 403, "'ve": 404, "installed": 405, "django": 406, "ways": 407, "via": 408, "apt-get": 409, "pip": 410, "install": 411, "most": 412, "recent": 413, "run": 414, "terminal": 415, "type": 416, "receive": 417, "importerror": 418, "module": 419, "named": 420, "however": 421, "django-admin": 422, "1.4.3": 423, "know": 424, "'s": 425, "why": 426, "finding": 427, "turns": 428, "out": 429, "wants": 430, "virtual": 431, "environment": 432, "then": 433, "server": 434, "virtualenv": 435, "navigate": 436, "project": 437, "folder": 438, "env": 439, "new": 440, "inside": 441, "/scripts": 442, "cd": 443, "activate": 444, "press": 445, "enter": 446, "start": 447, "verify": 448, "prefixed": 449, "current": 450, "once": 451, "head": 452, "back": 453, "..": 454, "installation": 455, "typing": 456, "display": 457, "manage.py": 458, "runserver": 459, "bakers": 460, "beverly": 461, "hills": 462, "bakery": 463, "baked": 464, "200": 465, "loaves": 466, "bread": 467, "monday": 468, "morning": 469, "sold": 470, "93": 471, "39": 472, "afternoon": 473, "grocery": 474, "store": 475, "returned": 476, "unsold": 477, "many": 478, "did": 479, "left": 480, "step": 481, "started": 482, "93+39=132": 483, "which": 484, "means": 485, "had": 486, "132": 487, "68": 488, "finally": 489, "thus": 490, "ended": 491, "up": 492, "68+6=74": 493, "74": 494, "nice": 495, "consider": 496, "arguments": 497, "amount": 498, "loaves_left": 499, "initial_number_of_loaves": 500, "loaves_sold_morning": 501, "loaves_sold_afternoon": 502, "loaves_returned": 503, "loaves_sold_total": 504, "+": 505, "inputs": 506, "24": 507, "9": 508, "153": 509, "57": 510, "99": 511, "32": 512, "13": 513, "29": 514, "rather": 515, "pizza": 516, "burger": 517, "lunch": 518, "sorry": 519, "give": 520, "such": 521, "question": 522, "related": 523, "includes": 524, "writing": 525, "math": 526, "fine": 527, "beyond": 528, "issues": 529, "leveraging": 530, "skills": 531, "randomly": 532, "decide": 533, "eating": 534, "probability": 535, "0.3": 536, "0.7": 537, "respectively": 538, "random": 539, "pizza_or_burger": 540, "random.uniform": 541, "eat": 542, "change": 543, "executions": 544, "dictionary": 545, "lots": 546, "dictionaries": 547, "make": 548, "single": 549, "talking": 550, "yeah": 551, "these": 552, "keys": 553, "themselves": 554, "great": 555, "re": 556, "asking": 557, "might": 558, "flatten": 559, "several": 560, "levels": 561, "ll": 562, "recursively": 563, "combine": 564, "outer": 565, "inner": 566, "resulting": 567, "unambiguous": 568, "d": 569, "suggest": 570, "doing": 571, "concatenating": 572, "them": 573, "together": 574, "separated": 575, "character": 576, "hmm": 577, "m": 578, "maybe": 579, "underscore": 580, "ok": 581, "trick": 582, "recursively_flatten_dicts": 583, "separator=": 584, "''": 585, "_": 586, "result": 587, "v": 588, "d.items": 589, "isinstance": 590, "dict": 591, "new_dict": 592, "separator": 593, "w": 594, "v.items": 595, "separator=separator": 596, "result.update": 597, "don": 598, "try": 599, "works": 600, "example": 601, "any": 602, "<unk>": 603, "<pad>": 604}