| { |
| "version": "1.0", |
| "truncation": null, |
| "padding": null, |
| "added_tokens": [ |
| { |
| "id": 0, |
| "content": "<pad>", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 1, |
| "content": "<eos>", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 2, |
| "content": "<bos>", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 3, |
| "content": "<unk>", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 4, |
| "content": "<mask>", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 822, |
| "content": "[PAD]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 823, |
| "content": "[EOS]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 824, |
| "content": "[BOS]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 825, |
| "content": "[UNK]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 826, |
| "content": "[MASK]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 827, |
| "content": "[CLS]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 828, |
| "content": "[SEP]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 829, |
| "content": "[PROMPT]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 830, |
| "content": "[TIMESTAMP]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| } |
| ], |
| "normalizer": null, |
| "pre_tokenizer": { |
| "type": "Sequence", |
| "pretokenizers": [ |
| { |
| "type": "Split", |
| "pattern": { |
| "Regex": "<[^>]+>|\\.\\d+,\\d+|[1-9]{2}\\-[a-z]\\]|[0-9]\\-[a-z]\\]|[1-9]{2}[a-z]|[1-9]{2}'[a-z]|[0-9]'[a-z]|[0-9][a-z]|\\([0-9]\\+\\)|\\([0-9]\\-\\)|[1-9]{2}|[0-9]|-|\\s|\\(|\\)|S|R|E|Z|N|C|O|'|\\\"|;|λ|H|,|\\.|\\[[a-z]{2}\\]|\\[[a-z]\\]|\\[|\\]|indolizin|arsindol|indol|furan|furo|piperazin|pyrrolidin|pyrrolizin|thiophen|thiolo|imidazolidin|imidazol|pyrimidin|pyridin|piperidin|morpholin|pyrazol|pyridazin|oxocinnolin|cinnolin|pyrrol|thiochromen|oxochromen|chromen|quinazolin|phthalazin|quinoxalin|carbazol|xanthen|pyrazin|purin|indazol|naphthyridin|quinolizin|guanidin|pyranthren|pyran|thianthren|thian|acridin|acrido|yohimban|porphyrin|pteridin|tetramin|pentamin|borinin|borino|boriran|borolan|borol|borinan|phenanthridin|quinolin|perimidin|corrin|phenanthrolin|phosphinolin|indacen|silonin|borepin|naphthalen|naphthal|inden|adamant|fluoren|thiourea|urea|anthracen|acenaphthylen|carbohydrazide|annulen|aniline|acetaldehyde|benzaldehyde|formaldehyde|phthalaldehyde|acephenanthrylen|phenanthren|chrysen|carbanid|chloroform|fulleren|cumen|formonitril|fluoranthen|terephthalaldehyde|azulen|picen|pyren|pleiaden|coronen|tetracen|pentacen|perylen|pentalen|heptalen|cuban|hexacen|oxanthren|ovalen|aceanthrylen|acid|ether|hydrogen|helium|lithium|beryllium|nitrogen|oxygen|fluorine|neon|sodium|magnesium|aluminum|silicon|phosphorus|sulfur|chlorine|argon|potassium|calcium|scandium|titanium|vanadium|chromium|manganese|iron|cobalt|nickel|copper|zinc|gallium|germanium|arsenic|selenium|bromine|krypton|rubidium|yttrium|zirconium|niobium|molybdenum|technetium|ruthenium|rhodium|palladium|silver|cadmium|indium|antimony|tellurium|iodine|xenon|cesium|barium|lanthanum|cerium|praseodymium|neodymium|latinum|promethium|samarium|europium|gadolinium|terbium|dysprosium|holmium|erbium|thulium|ytterbium|lutetium|hafnium|tantalum|tungsten|rhenium|osmium|iridium|platinum|gold|aurum|mercury|thallium|lead|bismuth|polonium|astatine|radon|francium|radium|actinium|thorium|protactinium|uranium|neptunium|plutonium|americium|curium|berkelium|einsteinium|fermium|californium|mendelevium|nobelium|lawrencium|rutherfordium|dubnium|seaborgium|bohrium|hassium|meitnerium|tin|protio|deuterio|tritio|perchlorate|perbromate|periodate|hypofluorite|hypochlorite|hypobromite|hypoiodite|nitrate|silicate|hydride|methane|methanoyl|methan|ethane|ethanoyl|ethan|propanoyl|propane|propan|propa|butane|butanoyl|butan|buta|pentane|pentanoyl|pentan|hexane|hexanoyl|hexan|heptane|heptanoyl|heptan|octane|octanoyl|octan|nonane|nonanoyl|nonan|decane|decanoyl|decan|icosane|icosan|cosane|cosan|contane|contan|mono|un|bis|bi|dicta|di|tetraza|tetraz|tetra|tetr|pentaza|pentaz|penta|hexaza|hexa|heptaza|hepta|octaza|octa|nonaza|nona|decaza|deca|kis|hydroxide|hydroxyl|hydroxy|hydrate|hydro|cyclo|spiro|iso|methylidene|methyl|ethyl|isopropyl|propyl|isobutyl|sec-butyl|tert-butyl|butyl|pentyl|hexyl|heptyl|octyl|meth|eth|prop|but|pent|hex|hept|oct|non|dec|icosa|icos|cosa|cos|icon|conta|cont|con|heni|hene|hen|hecta|hect|silanide|silane|silole|silanyl|silyloxy|silylo|silyl|sila|hydrazono|hydrazino|nitroso|nitrous|nitro|formamido|amino|amido|imino|imido|anilino|anilin|thiocyanato|cyanato|cyano|azido|azanidyl|azanyl|azanide|azanida|azonia|azonio|amidino|nitramido|diazo|sulfanylidene|sulfinamoyl|sulfonimidoyl|sulfinimidoyl|sulfamoyl|sulfonyl|sulfanyl|sulfinyl|sulfinato|sulfenato|sulfonato|sulfonio|sulfino|sulfono|sulfido|carboxylate|carboxylato|carboxylic|carboxy|halocarbonyl|carbamoyl|carbonyl|carbamo|thioformyl|formyl|alumanyl|gallanyl|stannyl|plumbyl|tellanyl|germanyl|germyl|benzhydryl|benzoxaza|benzoxaz|benzoxa|benzox|benzo|benzyl|benz|phenacyl|phenanthro|phenyl|phenoxaza|phenoxaz|phenoxy|phenox|phenol|pheno|phen|acetyl|aceto|acet|peroxy|oxido|oxino|oxalo|oxolo|oxocyclo|oxol|oxoc|oxon|oxo|oxy|pyrido|pyrimido|imidazo|naphtho|stiboryl|stibolo|fluoro|fluoranyl|fluoridoyl|fluorido|chloro|chloranyl|chloridoyl|chlorido|bromo|bromanyl|bromidoyl|bromido|iodo|iodanyl|iodidoyl|iodanuidyl|iodido|phosphonato|phosphoroso|phosphonia|phosphoryl|phosphanyl|arsono|arsanyl|stiba|carbonitrile|carboxamide|carbamimidothioate|carbodithioate|carbohydrazonate|carbonimidoyl|carboximidoyl|carbamimidoyl|carbamimidate|carbamimid|carbaldehyde|carbamate|carbothioyl|carboximidothioate|carbonate|carboximidamide|carboximidate|carbamic|carbonochloridate|carbothialdehyde|carbothioate|carbothioic|carbono|carbon|carbo|formate|formic|ammonium|hydrazide|hydrazine|hydrazin|amine|imine|oxamide|nitramide|formamide|cyanamide|amide|imide|amidine|isocyanide|azanium|thiocyanate|cyanate|cyanic|cyanatidoyl|cyanide|nitrile|nitrite|hydrazonate|sulfonamide|sulfinamide|sulfonamido|sulfonic|sulfamic|sulfinic|sulfuric|thial|thione|thiol|sulfonate|sulfite|sulfate|sulfide|sulfinate|sulfanium|sulfamate|sulfane|sulfo|fluoride|chloride|chloridic|perchloric|bromide|iodide|iodane|hypoiodous|hypochlorous|phosphanium|phosphate|phosphite|phosphane|phosphanide|phosphonamidic|phosphonous|phosphinous|phosphinite|phosphono|arsonic|stibane|chromium|stannane|gallane|alumane|aluminane|aluminan|germane|germa|ane|ano|an|ene|enoxy|eno|en|yne|yn|yl|peroxol|peroxo|terephthalate|terephthalic|phthalic|phthalate|oxide|oate|ol|oic|ic|al|ate|ium|one|ir|et|olo|ol|ino|in|ep|oc|on|ec|protide|boranyl|boranuide|boronamidic|boranuida|boranide|borinic|borate|borane|boran|borono|boron|bora|selanyl|seleno|thiaz|oxaza|oxaz|oxan|oxa|ox|aza|az|thia|thioc|thion|thio|thi|telluro|phospha|phosph|selen|bor|sil|alum|ars|germ|tellur|imid|idine|idene|idin|ane|an|ine|in|id|e|do|trisodium|tris|triacetyl|triamine|triaza|triaz|tria|trityl|tri|o" |
| }, |
| "behavior": "Isolated", |
| "invert": false |
| }, |
| { |
| "type": "Split", |
| "pattern": { |
| "Regex": "\\[|\\]|\\(|\\)|<[^>]+>|0|1|2|3|4|5|6|7|8|9|-|meth|ane|eth|prop|but|pent|hex|hept|oct|non|dec|cos|cont|icos|benz|phen|amine|cyan|imine|amide|cyan|imid|nitril|nitr|ane|ano|ene|en|ox|per|ol|on|oic|oate|tris|iso|yl|ate|az|hypo|sil|bor|thio|carb|ferrum|sulf|chlor|brom|phosph|hydr|fluor" |
| }, |
| "behavior": "Isolated", |
| "invert": false |
| } |
| ] |
| }, |
| "post_processor": { |
| "type": "TemplateProcessing", |
| "single": [ |
| { |
| "SpecialToken": { |
| "id": "[CLS]", |
| "type_id": 0 |
| } |
| }, |
| { |
| "SpecialToken": { |
| "id": "[PROMPT]", |
| "type_id": 0 |
| } |
| }, |
| { |
| "SpecialToken": { |
| "id": "[TIMESTAMP]", |
| "type_id": 0 |
| } |
| }, |
| { |
| "SpecialToken": { |
| "id": "[BOS]", |
| "type_id": 0 |
| } |
| }, |
| { |
| "Sequence": { |
| "id": "A", |
| "type_id": 0 |
| } |
| }, |
| { |
| "SpecialToken": { |
| "id": "[EOS]", |
| "type_id": 0 |
| } |
| } |
| ], |
| "pair": [ |
| { |
| "SpecialToken": { |
| "id": "[CLS]", |
| "type_id": 0 |
| } |
| }, |
| { |
| "SpecialToken": { |
| "id": "[PROMPT]", |
| "type_id": 0 |
| } |
| }, |
| { |
| "SpecialToken": { |
| "id": "[TIMESTAMP]", |
| "type_id": 0 |
| } |
| }, |
| { |
| "SpecialToken": { |
| "id": "[BOS]", |
| "type_id": 0 |
| } |
| }, |
| { |
| "Sequence": { |
| "id": "A", |
| "type_id": 0 |
| } |
| }, |
| { |
| "SpecialToken": { |
| "id": "[SEP]", |
| "type_id": 0 |
| } |
| }, |
| { |
| "Sequence": { |
| "id": "B", |
| "type_id": 0 |
| } |
| }, |
| { |
| "SpecialToken": { |
| "id": "[EOS]", |
| "type_id": 0 |
| } |
| } |
| ], |
| "special_tokens": { |
| "[BOS]": { |
| "id": "[BOS]", |
| "ids": [ |
| 824 |
| ], |
| "tokens": [ |
| "[BOS]" |
| ] |
| }, |
| "[CLS]": { |
| "id": "[CLS]", |
| "ids": [ |
| 827 |
| ], |
| "tokens": [ |
| "[CLS]" |
| ] |
| }, |
| "[EOS]": { |
| "id": "[EOS]", |
| "ids": [ |
| 823 |
| ], |
| "tokens": [ |
| "[EOS]" |
| ] |
| }, |
| "[PROMPT]": { |
| "id": "[PROMPT]", |
| "ids": [ |
| 829 |
| ], |
| "tokens": [ |
| "[PROMPT]" |
| ] |
| }, |
| "[SEP]": { |
| "id": "[SEP]", |
| "ids": [ |
| 828 |
| ], |
| "tokens": [ |
| "[SEP]" |
| ] |
| }, |
| "[TIMESTAMP]": { |
| "id": "[TIMESTAMP]", |
| "ids": [ |
| 830 |
| ], |
| "tokens": [ |
| "[TIMESTAMP]" |
| ] |
| } |
| } |
| }, |
| "decoder": { |
| "type": "BPEDecoder", |
| "suffix": "</w>" |
| }, |
| "model": { |
| "type": "WordLevel", |
| "vocab": { |
| "<pad>": 0, |
| "<eos>": 1, |
| "<bos>": 2, |
| "<unk>": 3, |
| "<mask>": 4, |
| "-": 5, |
| "yl": 6, |
| "2": 7, |
| ",": 8, |
| "1": 9, |
| "(": 10, |
| ")": 11, |
| "[": 12, |
| "]": 13, |
| "3": 14, |
| "4": 15, |
| "meth": 16, |
| "ox": 17, |
| "o": 18, |
| "5": 19, |
| "phen": 20, |
| "an": 21, |
| "ol": 22, |
| "y": 23, |
| "az": 24, |
| "e": 25, |
| "di": 26, |
| "6": 27, |
| "eth": 28, |
| "N": 29, |
| "a": 30, |
| "prop": 31, |
| "amino": 32, |
| " ": 33, |
| "on": 34, |
| "carb": 35, |
| "hydr": 36, |
| "in": 37, |
| "id": 38, |
| "7": 39, |
| "S": 40, |
| "benz": 41, |
| "amide": 42, |
| "R": 43, |
| "fluor": 44, |
| ".": 45, |
| "0": 46, |
| "cyclo": 47, |
| "en": 48, |
| "ene": 49, |
| "tri": 50, |
| "8": 51, |
| "but": 52, |
| "chlor": 53, |
| "pyr": 54, |
| "9": 55, |
| ";": 56, |
| "idin": 57, |
| "imid": 58, |
| "H": 59, |
| "sulf": 60, |
| "acid": 61, |
| "per": 62, |
| "hex": 63, |
| "pi": 64, |
| "ic": 65, |
| "pent": 66, |
| "pyridin": 67, |
| "amine": 68, |
| "pyrr": 69, |
| "ane": 70, |
| "tetra": 71, |
| "acet": 72, |
| "thio": 73, |
| "thi": 74, |
| "ate": 75, |
| "et": 76, |
| "dec": 77, |
| "brom": 78, |
| "Z": 79, |
| "bis": 80, |
| "r": 81, |
| "k": 82, |
| "E": 83, |
| "ind": 84, |
| "iso": 85, |
| "ano": 86, |
| "quin": 87, |
| "'": 88, |
| "tert": 89, |
| "st": 90, |
| "b": 91, |
| "amo": 92, |
| "furan": 93, |
| "hept": 94, |
| "oct": 95, |
| "nitr": 96, |
| "cyan": 97, |
| "ide": 98, |
| "oic": 99, |
| "c": 100, |
| "morph": 101, |
| "oate": 102, |
| "l": 103, |
| "phosph": 104, |
| "d": 105, |
| "i": 106, |
| "spiro": 107, |
| "anilino": 108, |
| "bi": 109, |
| "ep": 110, |
| "naphthal": 111, |
| "thia": 112, |
| "t": 113, |
| "ium": 114, |
| "n": 115, |
| "non": 116, |
| "am": 117, |
| "cos": 118, |
| "ino": 119, |
| "sil": 120, |
| "do": 121, |
| "yn": 122, |
| "pyran": 123, |
| "al": 124, |
| "urea": 125, |
| "m": 126, |
| "itrile": 127, |
| "tris": 128, |
| "guanidin": 129, |
| "tetr": 130, |
| "qu": 131, |
| "pip": 132, |
| "p": 133, |
| "imino": 134, |
| "pyrid": 135, |
| "s": 136, |
| "nitril": 137, |
| "v": 138, |
| "chrom": 139, |
| "amido": 140, |
| "or": 141, |
| "pyrido": 142, |
| "yr": 143, |
| "x": 144, |
| "iodide": 145, |
| "iodo": 146, |
| "bor": 147, |
| "aniline": 148, |
| "h": 149, |
| "un": 150, |
| "anium": 151, |
| "amic": 152, |
| "cont": 153, |
| "anthr": 154, |
| "deuterio": 155, |
| "acr": 156, |
| "furo": 157, |
| "purin": 158, |
| "icos": 159, |
| "naphth": 160, |
| "fur": 161, |
| "idine": 162, |
| "ec": 163, |
| "tria": 164, |
| "aldehyde": 165, |
| "O": 166, |
| "kis": 167, |
| "f": 168, |
| "ido": 169, |
| "tin": 170, |
| "alin": 171, |
| "adamant": 172, |
| "iodan": 173, |
| "aceto": 174, |
| "ambda": 175, |
| "naphthyridin": 176, |
| "ir": 177, |
| "form": 178, |
| "anthrac": 179, |
| "og": 180, |
| "nip": 181, |
| "rt": 182, |
| "amm": 183, |
| "is": 184, |
| "ne": 185, |
| "lambda": 186, |
| "+": 187, |
| "imine": 188, |
| "g": 189, |
| "amidine": 190, |
| "naphtho": 191, |
| "furfur": 192, |
| "oc": 193, |
| "xy": 194, |
| "sodium": 195, |
| "C": 196, |
| "xanth": 197, |
| "ato": 198, |
| "ine": 199, |
| "thian": 200, |
| "izin": 201, |
| "ia": 202, |
| "chr": 203, |
| "phthal": 204, |
| "ur": 205, |
| "umar": 206, |
| "thr": 207, |
| "acridin": 208, |
| "amidino": 209, |
| "anide": 210, |
| "rcapt": 211, |
| "sec": 212, |
| "lo": 213, |
| "ular": 214, |
| "cum": 215, |
| "u": 216, |
| "arbam": 217, |
| "pr": 218, |
| "oso": 219, |
| "yne": 220, |
| "phth": 221, |
| "iridium": 222, |
| "hyd": 223, |
| "potassium": 224, |
| "succ": 225, |
| "platinum": 226, |
| "tetrac": 227, |
| "rg": 228, |
| "glyc": 229, |
| "anid": 230, |
| "capr": 231, |
| "chrys": 232, |
| "ratr": 233, |
| "yttrium": 234, |
| "pteridin": 235, |
| "ochrom": 236, |
| "laur": 237, |
| "ac": 238, |
| "pic": 239, |
| "ocyclo": 240, |
| "sel": 241, |
| "anthridin": 242, |
| "styril": 243, |
| "lithium": 244, |
| "formic": 245, |
| "formamido": 246, |
| "acetaldehyde": 247, |
| "trit": 248, |
| "sit": 249, |
| "ar": 250, |
| "ch": 251, |
| "anuide": 252, |
| "ite": 253, |
| "zirc": 254, |
| "'a": 255, |
| "glutar": 256, |
| "rm": 257, |
| "zinc": 258, |
| "cinn": 259, |
| "stann": 260, |
| "triacet": 261, |
| "annul": 262, |
| "inic": 263, |
| "titanium": 264, |
| "ul": 265, |
| "im": 266, |
| "us": 267, |
| "hypo": 268, |
| "porphyrin": 269, |
| "anth": 270, |
| "ad": 271, |
| "ucl": 272, |
| "xam": 273, |
| "piv": 274, |
| "nam": 275, |
| "cop": 276, |
| "de": 277, |
| "magnesium": 278, |
| "umaril": 279, |
| "fl": 280, |
| "ycl": 281, |
| "styr": 282, |
| "tungst": 283, |
| "tritio": 284, |
| "palladium": 285, |
| "anthro": 286, |
| "indac": 287, |
| "nickel": 288, |
| "aphth": 289, |
| "vanadium": 290, |
| "germ": 291, |
| "th": 292, |
| "cobalt": 293, |
| "myrist": 294, |
| "hr": 295, |
| "anida": 296, |
| "ruth": 297, |
| "selan": 298, |
| "bar": 299, |
| "tur": 300, |
| "inin": 301, |
| "arg": 302, |
| "iz": 303, |
| "cd": 304, |
| "xim": 305, |
| "calcium": 306, |
| "inato": 307, |
| "chl": 308, |
| "hyp": 309, |
| "formaldehyde": 310, |
| "rph": 311, |
| "ni": 312, |
| "mit": 313, |
| "anuida": 314, |
| "br": 315, |
| "phthalic": 316, |
| "iodanuid": 317, |
| "ous": 318, |
| "uracil": 319, |
| "oroso": 320, |
| "inan": 321, |
| "arach": 322, |
| "fg": 323, |
| "mang": 324, |
| "se": 325, |
| "F": 326, |
| "chromium": 327, |
| "um": 328, |
| "il": 329, |
| "rc": 330, |
| "amidic": 331, |
| "uranium": 332, |
| "alum": 333, |
| "yg": 334, |
| "ulf": 335, |
| "hafnium": 336, |
| "ver": 337, |
| "rp": 338, |
| "ars": 339, |
| "odium": 340, |
| "inamo": 341, |
| "tra": 342, |
| "da": 343, |
| "mercury": 344, |
| "iodite": 345, |
| "ybd": 346, |
| "rhodium": 347, |
| "cupr": 348, |
| "lign": 349, |
| "iodine": 350, |
| "aluman": 351, |
| "actinium": 352, |
| "rcar": 353, |
| "thraqu": 354, |
| "odi": 355, |
| "hth": 356, |
| "io": 357, |
| "aluminum": 358, |
| "thianthr": 359, |
| "ill": 360, |
| "barium": 361, |
| "iod": 362, |
| "isa": 363, |
| "rubidium": 364, |
| "cesium": 365, |
| "ut": 366, |
| "osmium": 367, |
| "rr": 368, |
| "terephthalic": 369, |
| "fumar": 370, |
| "rh": 371, |
| "'b": 372, |
| "apht": 373, |
| "telluro": 374, |
| "lut": 375, |
| "inous": 376, |
| "tellan": 377, |
| "iodous": 378, |
| "pim": 379, |
| "liz": 380, |
| "j": 381, |
| "gad": 382, |
| "inium": 383, |
| "at": 384, |
| "I": 385, |
| "cadmium": 386, |
| "bismuth": 387, |
| "asar": 388, |
| "ph": 389, |
| "arb": 390, |
| "tetramin": 391, |
| "corrin": 392, |
| "bac": 393, |
| "rutherfordium": 394, |
| "cerium": 395, |
| "sub": 396, |
| "cy": 397, |
| "itr": 398, |
| "hecta": 399, |
| "sar": 400, |
| "tyr": 401, |
| "cuban": 402, |
| "stiba": 403, |
| "europium": 404, |
| "gly": 405, |
| "germa": 406, |
| "thallium": 407, |
| "technetium": 408, |
| "lanthanum": 409, |
| "la": 410, |
| "na": 411, |
| "tellur": 412, |
| "lact": 413, |
| "thial": 414, |
| "str": 415, |
| "arsan": 416, |
| "chu": 417, |
| "antim": 418, |
| "oform": 419, |
| "itril": 420, |
| "sti": 421, |
| "neodymium": 422, |
| "tantalum": 423, |
| "plumb": 424, |
| "yohimban": 425, |
| "cym": 426, |
| "niobium": 427, |
| "ld": 428, |
| "alo": 429, |
| "praseodymium": 430, |
| "ocinn": 431, |
| "hy": 432, |
| "lead": 433, |
| "inite": 434, |
| "liss": 435, |
| "cr": 436, |
| "ci": 437, |
| "rth": 438, |
| "ytterbium": 439, |
| "ra": 440, |
| "\"": 441, |
| "z": 442, |
| "ps": 443, |
| "samarium": 444, |
| "naph": 445, |
| "terbium": 446, |
| "othialdehyde": 447, |
| "scandium": 448, |
| "tartar": 449, |
| "pyruv": 450, |
| "as": 451, |
| "ber": 452, |
| "lium": 453, |
| "ll": 454, |
| "nu": 455, |
| "za": 456, |
| "phthalaldehyde": 457, |
| "llit": 458, |
| "tassi": 459, |
| "dysprosium": 460, |
| "epin": 461, |
| "lutetium": 462, |
| "ct": 463, |
| "acrido": 464, |
| "ij": 465, |
| "nthr": 466, |
| "indium": 467, |
| "fermium": 468, |
| "pha": 469, |
| "thra": 470, |
| "gallium": 471, |
| "erbium": 472, |
| "gamma": 473, |
| "flu": 474, |
| "sam": 475, |
| "hl": 476, |
| "thorium": 477, |
| "ma": 478, |
| "terephthal": 479, |
| "gallan": 480, |
| "lum": 481, |
| "mium": 482, |
| "lacc": 483, |
| "rs": 484, |
| "cor": 485, |
| "gall": 486, |
| "hippur": 487, |
| "taur": 488, |
| "caff": 489, |
| "nia": 490, |
| "ip": 491, |
| "pia": 492, |
| "dur": 493, |
| "glutam": 494, |
| "fuller": 495, |
| "atr": 496, |
| "plast": 497, |
| "terephthalaldehyde": 498, |
| "gluc": 499, |
| "phl": 500, |
| "thulium": 501, |
| "apr": 502, |
| "mu": 503, |
| "iran": 504, |
| "jap": 505, |
| "Tc": 506, |
| "stib": 507, |
| "citra": 508, |
| "astatine": 509, |
| "rcuri": 510, |
| "it": 511, |
| "iodido": 512, |
| "brass": 513, |
| "rcur": 514, |
| "rchl": 515, |
| "idic": 516, |
| "citr": 517, |
| "Br": 518, |
| "aceanthr": 519, |
| "rit": 520, |
| "mim": 521, |
| "rul": 522, |
| "tit": 523, |
| "pyranthr": 524, |
| "Ih": 525, |
| "protio": 526, |
| "stilb": 527, |
| "ypr": 528, |
| "dicta": 529, |
| "curium": 530, |
| "sg": 531, |
| "amin": 532, |
| "mi": 533, |
| "cta": 534, |
| ":": 535, |
| "ila": 536, |
| "mm": 537, |
| "neptunium": 538, |
| "ulfit": 539, |
| "aur": 540, |
| "cac": 541, |
| "orus": 542, |
| "pp": 543, |
| "cium": 544, |
| "lawr": 545, |
| "dd": 546, |
| "ri": 547, |
| "skat": 548, |
| "thaps": 549, |
| "hygr": 550, |
| "parab": 551, |
| "tartr": 552, |
| "yv": 553, |
| "germanium": 554, |
| "plut": 555, |
| "ita": 556, |
| "wn": 557, |
| "rphyr": 558, |
| "ace": 559, |
| "thym": 560, |
| "apth": 561, |
| "At": 562, |
| "buckm": 563, |
| "einsteinium": 564, |
| "americium": 565, |
| "pro": 566, |
| "nobelium": 567, |
| "T": 568, |
| "xysucc": 569, |
| "plumba": 570, |
| "helium": 571, |
| "w": 572, |
| "P": 573, |
| "mad": 574, |
| "guaiac": 575, |
| "gu": 576, |
| "cadav": 577, |
| "californium": 578, |
| "tr": 579, |
| "hnit": 580, |
| "ilv": 581, |
| "pla": 582, |
| "ti": 583, |
| "thyr": 584, |
| "ru": 585, |
| "sc": 586, |
| "B": 587, |
| "atido": 588, |
| "protactinium": 589, |
| "xyv": 590, |
| "lup": 591, |
| "pleiad": 592, |
| "aluminan": 593, |
| "ulfat": 594, |
| "arsind": 595, |
| "lmn": 596, |
| "gium": 597, |
| "rcura": 598, |
| "sea": 599, |
| "syr": 600, |
| "li": 601, |
| "camph": 602, |
| "ychr": 603, |
| "hect": 604, |
| "flav": 605, |
| "ybda": 606, |
| "yp": 607, |
| "rsa": 608, |
| "ug": 609, |
| "dubnium": 610, |
| "oval": 611, |
| "tis": 612, |
| "yc": 613, |
| "krypt": 614, |
| "vi": 615, |
| "berkelium": 616, |
| "ign": 617, |
| "fulm": 618, |
| "xyst": 619, |
| "tim": 620, |
| "meitnerium": 621, |
| "tellurium": 622, |
| "nil": 623, |
| "carvacr": 624, |
| "D": 625, |
| "hafna": 626, |
| "ymyrist": 627, |
| "llur": 628, |
| "german": 629, |
| "prism": 630, |
| "rad": 631, |
| "bohrium": 632, |
| "rb": 633, |
| "hassium": 634, |
| "astat": 635, |
| "delevium": 636, |
| "symcl": 637, |
| "umb": 638, |
| "rach": 639, |
| "llif": 640, |
| "xycapr": 641, |
| "xyp": 642, |
| "ulfam": 643, |
| "lat": 644, |
| "gsta": 645, |
| "hym": 646, |
| "nti": 647, |
| "yqu": 648, |
| "sa": 649, |
| "plum": 650, |
| "xa": 651, |
| "astata": 652, |
| "xyacr": 653, |
| "xym": 654, |
| "ada": 655, |
| "adm": 656, |
| "fulv": 657, |
| "ba": 658, |
| "warfar": 659, |
| "ycapr": 660, |
| "rri": 661, |
| "tipyr": 662, |
| "ypip": 663, |
| "hrys": 664, |
| "ast": 665, |
| "xyb": 666, |
| "xyi": 667, |
| "ruc": 668, |
| "alumin": 669, |
| "xymyrist": 670, |
| "rut": 671, |
| "jugl": 672, |
| "ysucc": 673, |
| "aci": 674, |
| "radium": 675, |
| "xypr": 676, |
| "yacr": 677, |
| "xychr": 678, |
| "uvit": 679, |
| "'c": 680, |
| "ub": 681, |
| "scul": 682, |
| "xyarach": 683, |
| "yt": 684, |
| "safr": 685, |
| "dymi": 686, |
| "protide": 687, |
| "rbr": 688, |
| "sma": 689, |
| "xychl": 690, |
| "fusar": 691, |
| "ga": 692, |
| "As": 693, |
| "In": 694, |
| "pras": 695, |
| "xyqu": 696, |
| "abas": 697, |
| "acc": 698, |
| "yphth": 699, |
| "xyc": 700, |
| "ascl": 701, |
| "gst": 702, |
| "plumbag": 703, |
| "yfur": 704, |
| "xyglutar": 705, |
| "Ga": 706, |
| "asti": 707, |
| "sux": 708, |
| "xya": 709, |
| "yb": 710, |
| "ata": 711, |
| "parax": 712, |
| "G": 713, |
| "Li": 714, |
| "francium": 715, |
| "rsaplumb": 716, |
| "rv": 717, |
| "daphn": 718, |
| "ag": 719, |
| "guai": 720, |
| "ychl": 721, |
| "yf": 722, |
| "ym": 723, |
| "samari": 724, |
| "si": 725, |
| "ucc": 726, |
| "full": 727, |
| "ib": 728, |
| "nthrac": 729, |
| "sap": 730, |
| "ypyr": 731, |
| "hn": 732, |
| "sm": 733, |
| "ta": 734, |
| "ud": 735, |
| "llura": 736, |
| "yglutar": 737, |
| "yst": 738, |
| "btu": 739, |
| "M": 740, |
| "U": 741, |
| "dyma": 742, |
| "lad": 743, |
| "magn": 744, |
| "vacc": 745, |
| "ya": 746, |
| "ntim": 747, |
| "rsast": 748, |
| "ap": 749, |
| "par": 750, |
| "xypip": 751, |
| "xysti": 752, |
| "yamm": 753, |
| "Pt": 754, |
| "Y": 755, |
| "aplumb": 756, |
| "auri": 757, |
| "bara": 758, |
| "dyspr": 759, |
| "frax": 760, |
| "lada": 761, |
| "purpur": 762, |
| "sp": 763, |
| "xysub": 764, |
| "yisa": 765, |
| "xyac": 766, |
| "xyphth": 767, |
| "yx": 768, |
| "astib": 769, |
| "chav": 770, |
| "fursulti": 771, |
| "hist": 772, |
| "mast": 773, |
| "rfull": 774, |
| "uramil": 775, |
| "usn": 776, |
| "xypim": 777, |
| "xyth": 778, |
| "yhyd": 779, |
| "Bi": 780, |
| "Bk": 781, |
| "Tl": 782, |
| "thuli": 783, |
| "tiba": 784, |
| "xybr": 785, |
| "xyim": 786, |
| "ypim": 787, |
| "ys": 788, |
| "ytt": 789, |
| "cyt": 790, |
| "dr": 791, |
| "ilast": 792, |
| "nag": 793, |
| "xypyr": 794, |
| "xys": 795, |
| "yarach": 796, |
| "ybar": 797, |
| "yfurfur": 798, |
| "ysub": 799, |
| "yuracil": 800, |
| "aph": 801, |
| "cad": 802, |
| "cham": 803, |
| "dym": 804, |
| "laws": 805, |
| "phys": 806, |
| "rsam": 807, |
| "stat": 808, |
| "tsuzu": 809, |
| "xymu": 810, |
| "xystib": 811, |
| "yac": 812, |
| "yh": 813, |
| "yhyp": 814, |
| "yi": 815, |
| "yim": 816, |
| "yphl": 817, |
| "ypi": 818, |
| "yru": 819, |
| "ystib": 820, |
| "yur": 821 |
| }, |
| "unk_token": "<unk>" |
| } |
| } |