| { | |
| "version": "1.0", | |
| "truncation": null, | |
| "padding": null, | |
| "added_tokens": [ | |
| { | |
| "id": 0, | |
| "content": "<pad>", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 1, | |
| "content": "<eos>", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 2, | |
| "content": "<bos>", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 3, | |
| "content": "<unk>", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 4, | |
| "content": "<mask>", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 822, | |
| "content": "[PAD]", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 823, | |
| "content": "[EOS]", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 824, | |
| "content": "[BOS]", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 825, | |
| "content": "[UNK]", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 826, | |
| "content": "[MASK]", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 827, | |
| "content": "[CLS]", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 828, | |
| "content": "[SEP]", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 829, | |
| "content": "[PROMPT]", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| }, | |
| { | |
| "id": 830, | |
| "content": "[TIMESTAMP]", | |
| "single_word": false, | |
| "lstrip": false, | |
| "rstrip": false, | |
| "normalized": false, | |
| "special": true | |
| } | |
| ], | |
| "normalizer": null, | |
| "pre_tokenizer": { | |
| "type": "Sequence", | |
| "pretokenizers": [ | |
| { | |
| "type": "Split", | |
| "pattern": { | |
| "Regex": "<[^>]+>|\\.\\d+,\\d+|[1-9]{2}\\-[a-z]\\]|[0-9]\\-[a-z]\\]|[1-9]{2}[a-z]|[1-9]{2}'[a-z]|[0-9]'[a-z]|[0-9][a-z]|\\([0-9]\\+\\)|\\([0-9]\\-\\)|[1-9]{2}|[0-9]|-|\\s|\\(|\\)|S|R|E|Z|N|C|O|'|\\\"|;|λ|H|,|\\.|\\[[a-z]{2}\\]|\\[[a-z]\\]|\\[|\\]|indolizin|arsindol|indol|furan|furo|piperazin|pyrrolidin|pyrrolizin|thiophen|thiolo|imidazolidin|imidazol|pyrimidin|pyridin|piperidin|morpholin|pyrazol|pyridazin|oxocinnolin|cinnolin|pyrrol|thiochromen|oxochromen|chromen|quinazolin|phthalazin|quinoxalin|carbazol|xanthen|pyrazin|purin|indazol|naphthyridin|quinolizin|guanidin|pyranthren|pyran|thianthren|thian|acridin|acrido|yohimban|porphyrin|pteridin|tetramin|pentamin|borinin|borino|boriran|borolan|borol|borinan|phenanthridin|quinolin|perimidin|corrin|phenanthrolin|phosphinolin|indacen|silonin|borepin|naphthalen|naphthal|inden|adamant|fluoren|thiourea|urea|anthracen|acenaphthylen|carbohydrazide|annulen|aniline|acetaldehyde|benzaldehyde|formaldehyde|phthalaldehyde|acephenanthrylen|phenanthren|chrysen|carbanid|chloroform|fulleren|cumen|formonitril|fluoranthen|terephthalaldehyde|azulen|picen|pyren|pleiaden|coronen|tetracen|pentacen|perylen|pentalen|heptalen|cuban|hexacen|oxanthren|ovalen|aceanthrylen|acid|ether|hydrogen|helium|lithium|beryllium|nitrogen|oxygen|fluorine|neon|sodium|magnesium|aluminum|silicon|phosphorus|sulfur|chlorine|argon|potassium|calcium|scandium|titanium|vanadium|chromium|manganese|iron|cobalt|nickel|copper|zinc|gallium|germanium|arsenic|selenium|bromine|krypton|rubidium|yttrium|zirconium|niobium|molybdenum|technetium|ruthenium|rhodium|palladium|silver|cadmium|indium|antimony|tellurium|iodine|xenon|cesium|barium|lanthanum|cerium|praseodymium|neodymium|latinum|promethium|samarium|europium|gadolinium|terbium|dysprosium|holmium|erbium|thulium|ytterbium|lutetium|hafnium|tantalum|tungsten|rhenium|osmium|iridium|platinum|gold|aurum|mercury|thallium|lead|bismuth|polonium|astatine|radon|francium|radium|actinium|thorium|protactinium|uranium|neptunium|plutonium|americium|curium|berkelium|einsteinium|fermium|californium|mendelevium|nobelium|lawrencium|rutherfordium|dubnium|seaborgium|bohrium|hassium|meitnerium|tin|protio|deuterio|tritio|perchlorate|perbromate|periodate|hypofluorite|hypochlorite|hypobromite|hypoiodite|nitrate|silicate|hydride|methane|methanoyl|methan|ethane|ethanoyl|ethan|propanoyl|propane|propan|propa|butane|butanoyl|butan|buta|pentane|pentanoyl|pentan|hexane|hexanoyl|hexan|heptane|heptanoyl|heptan|octane|octanoyl|octan|nonane|nonanoyl|nonan|decane|decanoyl|decan|icosane|icosan|cosane|cosan|contane|contan|mono|un|bis|bi|dicta|di|tetraza|tetraz|tetra|tetr|pentaza|pentaz|penta|hexaza|hexa|heptaza|hepta|octaza|octa|nonaza|nona|decaza|deca|kis|hydroxide|hydroxyl|hydroxy|hydrate|hydro|cyclo|spiro|iso|methylidene|methyl|ethyl|isopropyl|propyl|isobutyl|sec-butyl|tert-butyl|butyl|pentyl|hexyl|heptyl|octyl|meth|eth|prop|but|pent|hex|hept|oct|non|dec|icosa|icos|cosa|cos|icon|conta|cont|con|heni|hene|hen|hecta|hect|silanide|silane|silole|silanyl|silyloxy|silylo|silyl|sila|hydrazono|hydrazino|nitroso|nitrous|nitro|formamido|amino|amido|imino|imido|anilino|anilin|thiocyanato|cyanato|cyano|azido|azanidyl|azanyl|azanide|azanida|azonia|azonio|amidino|nitramido|diazo|sulfanylidene|sulfinamoyl|sulfonimidoyl|sulfinimidoyl|sulfamoyl|sulfonyl|sulfanyl|sulfinyl|sulfinato|sulfenato|sulfonato|sulfonio|sulfino|sulfono|sulfido|carboxylate|carboxylato|carboxylic|carboxy|halocarbonyl|carbamoyl|carbonyl|carbamo|thioformyl|formyl|alumanyl|gallanyl|stannyl|plumbyl|tellanyl|germanyl|germyl|benzhydryl|benzoxaza|benzoxaz|benzoxa|benzox|benzo|benzyl|benz|phenacyl|phenanthro|phenyl|phenoxaza|phenoxaz|phenoxy|phenox|phenol|pheno|phen|acetyl|aceto|acet|peroxy|oxido|oxino|oxalo|oxolo|oxocyclo|oxol|oxoc|oxon|oxo|oxy|pyrido|pyrimido|imidazo|naphtho|stiboryl|stibolo|fluoro|fluoranyl|fluoridoyl|fluorido|chloro|chloranyl|chloridoyl|chlorido|bromo|bromanyl|bromidoyl|bromido|iodo|iodanyl|iodidoyl|iodanuidyl|iodido|phosphonato|phosphoroso|phosphonia|phosphoryl|phosphanyl|arsono|arsanyl|stiba|carbonitrile|carboxamide|carbamimidothioate|carbodithioate|carbohydrazonate|carbonimidoyl|carboximidoyl|carbamimidoyl|carbamimidate|carbamimid|carbaldehyde|carbamate|carbothioyl|carboximidothioate|carbonate|carboximidamide|carboximidate|carbamic|carbonochloridate|carbothialdehyde|carbothioate|carbothioic|carbono|carbon|carbo|formate|formic|ammonium|hydrazide|hydrazine|hydrazin|amine|imine|oxamide|nitramide|formamide|cyanamide|amide|imide|amidine|isocyanide|azanium|thiocyanate|cyanate|cyanic|cyanatidoyl|cyanide|nitrile|nitrite|hydrazonate|sulfonamide|sulfinamide|sulfonamido|sulfonic|sulfamic|sulfinic|sulfuric|thial|thione|thiol|sulfonate|sulfite|sulfate|sulfide|sulfinate|sulfanium|sulfamate|sulfane|sulfo|fluoride|chloride|chloridic|perchloric|bromide|iodide|iodane|hypoiodous|hypochlorous|phosphanium|phosphate|phosphite|phosphane|phosphanide|phosphonamidic|phosphonous|phosphinous|phosphinite|phosphono|arsonic|stibane|chromium|stannane|gallane|alumane|aluminane|aluminan|germane|germa|ane|ano|an|ene|enoxy|eno|en|yne|yn|yl|peroxol|peroxo|terephthalate|terephthalic|phthalic|phthalate|oxide|oate|ol|oic|ic|al|ate|ium|one|ir|et|olo|ol|ino|in|ep|oc|on|ec|protide|boranyl|boranuide|boronamidic|boranuida|boranide|borinic|borate|borane|boran|borono|boron|bora|selanyl|seleno|thiaz|oxaza|oxaz|oxan|oxa|ox|aza|az|thia|thioc|thion|thio|thi|telluro|phospha|phosph|selen|bor|sil|alum|ars|germ|tellur|imid|idine|idene|idin|ane|an|ine|in|id|e|do|trisodium|tris|triacetyl|triamine|triaza|triaz|tria|trityl|tri|o" | |
| }, | |
| "behavior": "Isolated", | |
| "invert": false | |
| }, | |
| { | |
| "type": "Split", | |
| "pattern": { | |
| "Regex": "\\[|\\]|\\(|\\)|<[^>]+>|0|1|2|3|4|5|6|7|8|9|-|meth|ane|eth|prop|but|pent|hex|hept|oct|non|dec|cos|cont|icos|benz|phen|amine|cyan|imine|amide|cyan|imid|nitril|nitr|ane|ano|ene|en|ox|per|ol|on|oic|oate|tris|iso|yl|ate|az|hypo|sil|bor|thio|carb|ferrum|sulf|chlor|brom|phosph|hydr|fluor" | |
| }, | |
| "behavior": "Isolated", | |
| "invert": false | |
| } | |
| ] | |
| }, | |
| "post_processor": { | |
| "type": "TemplateProcessing", | |
| "single": [ | |
| { | |
| "SpecialToken": { | |
| "id": "[CLS]", | |
| "type_id": 0 | |
| } | |
| }, | |
| { | |
| "SpecialToken": { | |
| "id": "[PROMPT]", | |
| "type_id": 0 | |
| } | |
| }, | |
| { | |
| "SpecialToken": { | |
| "id": "[TIMESTAMP]", | |
| "type_id": 0 | |
| } | |
| }, | |
| { | |
| "SpecialToken": { | |
| "id": "[BOS]", | |
| "type_id": 0 | |
| } | |
| }, | |
| { | |
| "Sequence": { | |
| "id": "A", | |
| "type_id": 0 | |
| } | |
| }, | |
| { | |
| "SpecialToken": { | |
| "id": "[EOS]", | |
| "type_id": 0 | |
| } | |
| } | |
| ], | |
| "pair": [ | |
| { | |
| "SpecialToken": { | |
| "id": "[CLS]", | |
| "type_id": 0 | |
| } | |
| }, | |
| { | |
| "SpecialToken": { | |
| "id": "[PROMPT]", | |
| "type_id": 0 | |
| } | |
| }, | |
| { | |
| "SpecialToken": { | |
| "id": "[TIMESTAMP]", | |
| "type_id": 0 | |
| } | |
| }, | |
| { | |
| "SpecialToken": { | |
| "id": "[BOS]", | |
| "type_id": 0 | |
| } | |
| }, | |
| { | |
| "Sequence": { | |
| "id": "A", | |
| "type_id": 0 | |
| } | |
| }, | |
| { | |
| "SpecialToken": { | |
| "id": "[SEP]", | |
| "type_id": 0 | |
| } | |
| }, | |
| { | |
| "Sequence": { | |
| "id": "B", | |
| "type_id": 0 | |
| } | |
| }, | |
| { | |
| "SpecialToken": { | |
| "id": "[EOS]", | |
| "type_id": 0 | |
| } | |
| } | |
| ], | |
| "special_tokens": { | |
| "[BOS]": { | |
| "id": "[BOS]", | |
| "ids": [ | |
| 824 | |
| ], | |
| "tokens": [ | |
| "[BOS]" | |
| ] | |
| }, | |
| "[CLS]": { | |
| "id": "[CLS]", | |
| "ids": [ | |
| 827 | |
| ], | |
| "tokens": [ | |
| "[CLS]" | |
| ] | |
| }, | |
| "[EOS]": { | |
| "id": "[EOS]", | |
| "ids": [ | |
| 823 | |
| ], | |
| "tokens": [ | |
| "[EOS]" | |
| ] | |
| }, | |
| "[PROMPT]": { | |
| "id": "[PROMPT]", | |
| "ids": [ | |
| 829 | |
| ], | |
| "tokens": [ | |
| "[PROMPT]" | |
| ] | |
| }, | |
| "[SEP]": { | |
| "id": "[SEP]", | |
| "ids": [ | |
| 828 | |
| ], | |
| "tokens": [ | |
| "[SEP]" | |
| ] | |
| }, | |
| "[TIMESTAMP]": { | |
| "id": "[TIMESTAMP]", | |
| "ids": [ | |
| 830 | |
| ], | |
| "tokens": [ | |
| "[TIMESTAMP]" | |
| ] | |
| } | |
| } | |
| }, | |
| "decoder": { | |
| "type": "BPEDecoder", | |
| "suffix": "</w>" | |
| }, | |
| "model": { | |
| "type": "WordLevel", | |
| "vocab": { | |
| "<pad>": 0, | |
| "<eos>": 1, | |
| "<bos>": 2, | |
| "<unk>": 3, | |
| "<mask>": 4, | |
| "-": 5, | |
| "yl": 6, | |
| "2": 7, | |
| ",": 8, | |
| "1": 9, | |
| "(": 10, | |
| ")": 11, | |
| "[": 12, | |
| "]": 13, | |
| "3": 14, | |
| "4": 15, | |
| "meth": 16, | |
| "ox": 17, | |
| "o": 18, | |
| "5": 19, | |
| "phen": 20, | |
| "an": 21, | |
| "ol": 22, | |
| "y": 23, | |
| "az": 24, | |
| "e": 25, | |
| "di": 26, | |
| "6": 27, | |
| "eth": 28, | |
| "N": 29, | |
| "a": 30, | |
| "prop": 31, | |
| "amino": 32, | |
| " ": 33, | |
| "on": 34, | |
| "carb": 35, | |
| "hydr": 36, | |
| "in": 37, | |
| "id": 38, | |
| "7": 39, | |
| "S": 40, | |
| "benz": 41, | |
| "amide": 42, | |
| "R": 43, | |
| "fluor": 44, | |
| ".": 45, | |
| "0": 46, | |
| "cyclo": 47, | |
| "en": 48, | |
| "ene": 49, | |
| "tri": 50, | |
| "8": 51, | |
| "but": 52, | |
| "chlor": 53, | |
| "pyr": 54, | |
| "9": 55, | |
| ";": 56, | |
| "idin": 57, | |
| "imid": 58, | |
| "H": 59, | |
| "sulf": 60, | |
| "acid": 61, | |
| "per": 62, | |
| "hex": 63, | |
| "pi": 64, | |
| "ic": 65, | |
| "pent": 66, | |
| "pyridin": 67, | |
| "amine": 68, | |
| "pyrr": 69, | |
| "ane": 70, | |
| "tetra": 71, | |
| "acet": 72, | |
| "thio": 73, | |
| "thi": 74, | |
| "ate": 75, | |
| "et": 76, | |
| "dec": 77, | |
| "brom": 78, | |
| "Z": 79, | |
| "bis": 80, | |
| "r": 81, | |
| "k": 82, | |
| "E": 83, | |
| "ind": 84, | |
| "iso": 85, | |
| "ano": 86, | |
| "quin": 87, | |
| "'": 88, | |
| "tert": 89, | |
| "st": 90, | |
| "b": 91, | |
| "amo": 92, | |
| "furan": 93, | |
| "hept": 94, | |
| "oct": 95, | |
| "nitr": 96, | |
| "cyan": 97, | |
| "ide": 98, | |
| "oic": 99, | |
| "c": 100, | |
| "morph": 101, | |
| "oate": 102, | |
| "l": 103, | |
| "phosph": 104, | |
| "d": 105, | |
| "i": 106, | |
| "spiro": 107, | |
| "anilino": 108, | |
| "bi": 109, | |
| "ep": 110, | |
| "naphthal": 111, | |
| "thia": 112, | |
| "t": 113, | |
| "ium": 114, | |
| "n": 115, | |
| "non": 116, | |
| "am": 117, | |
| "cos": 118, | |
| "ino": 119, | |
| "sil": 120, | |
| "do": 121, | |
| "yn": 122, | |
| "pyran": 123, | |
| "al": 124, | |
| "urea": 125, | |
| "m": 126, | |
| "itrile": 127, | |
| "tris": 128, | |
| "guanidin": 129, | |
| "tetr": 130, | |
| "qu": 131, | |
| "pip": 132, | |
| "p": 133, | |
| "imino": 134, | |
| "pyrid": 135, | |
| "s": 136, | |
| "nitril": 137, | |
| "v": 138, | |
| "chrom": 139, | |
| "amido": 140, | |
| "or": 141, | |
| "pyrido": 142, | |
| "yr": 143, | |
| "x": 144, | |
| "iodide": 145, | |
| "iodo": 146, | |
| "bor": 147, | |
| "aniline": 148, | |
| "h": 149, | |
| "un": 150, | |
| "anium": 151, | |
| "amic": 152, | |
| "cont": 153, | |
| "anthr": 154, | |
| "deuterio": 155, | |
| "acr": 156, | |
| "furo": 157, | |
| "purin": 158, | |
| "icos": 159, | |
| "naphth": 160, | |
| "fur": 161, | |
| "idine": 162, | |
| "ec": 163, | |
| "tria": 164, | |
| "aldehyde": 165, | |
| "O": 166, | |
| "kis": 167, | |
| "f": 168, | |
| "ido": 169, | |
| "tin": 170, | |
| "alin": 171, | |
| "adamant": 172, | |
| "iodan": 173, | |
| "aceto": 174, | |
| "ambda": 175, | |
| "naphthyridin": 176, | |
| "ir": 177, | |
| "form": 178, | |
| "anthrac": 179, | |
| "og": 180, | |
| "nip": 181, | |
| "rt": 182, | |
| "amm": 183, | |
| "is": 184, | |
| "ne": 185, | |
| "lambda": 186, | |
| "+": 187, | |
| "imine": 188, | |
| "g": 189, | |
| "amidine": 190, | |
| "naphtho": 191, | |
| "furfur": 192, | |
| "oc": 193, | |
| "xy": 194, | |
| "sodium": 195, | |
| "C": 196, | |
| "xanth": 197, | |
| "ato": 198, | |
| "ine": 199, | |
| "thian": 200, | |
| "izin": 201, | |
| "ia": 202, | |
| "chr": 203, | |
| "phthal": 204, | |
| "ur": 205, | |
| "umar": 206, | |
| "thr": 207, | |
| "acridin": 208, | |
| "amidino": 209, | |
| "anide": 210, | |
| "rcapt": 211, | |
| "sec": 212, | |
| "lo": 213, | |
| "ular": 214, | |
| "cum": 215, | |
| "u": 216, | |
| "arbam": 217, | |
| "pr": 218, | |
| "oso": 219, | |
| "yne": 220, | |
| "phth": 221, | |
| "iridium": 222, | |
| "hyd": 223, | |
| "potassium": 224, | |
| "succ": 225, | |
| "platinum": 226, | |
| "tetrac": 227, | |
| "rg": 228, | |
| "glyc": 229, | |
| "anid": 230, | |
| "capr": 231, | |
| "chrys": 232, | |
| "ratr": 233, | |
| "yttrium": 234, | |
| "pteridin": 235, | |
| "ochrom": 236, | |
| "laur": 237, | |
| "ac": 238, | |
| "pic": 239, | |
| "ocyclo": 240, | |
| "sel": 241, | |
| "anthridin": 242, | |
| "styril": 243, | |
| "lithium": 244, | |
| "formic": 245, | |
| "formamido": 246, | |
| "acetaldehyde": 247, | |
| "trit": 248, | |
| "sit": 249, | |
| "ar": 250, | |
| "ch": 251, | |
| "anuide": 252, | |
| "ite": 253, | |
| "zirc": 254, | |
| "'a": 255, | |
| "glutar": 256, | |
| "rm": 257, | |
| "zinc": 258, | |
| "cinn": 259, | |
| "stann": 260, | |
| "triacet": 261, | |
| "annul": 262, | |
| "inic": 263, | |
| "titanium": 264, | |
| "ul": 265, | |
| "im": 266, | |
| "us": 267, | |
| "hypo": 268, | |
| "porphyrin": 269, | |
| "anth": 270, | |
| "ad": 271, | |
| "ucl": 272, | |
| "xam": 273, | |
| "piv": 274, | |
| "nam": 275, | |
| "cop": 276, | |
| "de": 277, | |
| "magnesium": 278, | |
| "umaril": 279, | |
| "fl": 280, | |
| "ycl": 281, | |
| "styr": 282, | |
| "tungst": 283, | |
| "tritio": 284, | |
| "palladium": 285, | |
| "anthro": 286, | |
| "indac": 287, | |
| "nickel": 288, | |
| "aphth": 289, | |
| "vanadium": 290, | |
| "germ": 291, | |
| "th": 292, | |
| "cobalt": 293, | |
| "myrist": 294, | |
| "hr": 295, | |
| "anida": 296, | |
| "ruth": 297, | |
| "selan": 298, | |
| "bar": 299, | |
| "tur": 300, | |
| "inin": 301, | |
| "arg": 302, | |
| "iz": 303, | |
| "cd": 304, | |
| "xim": 305, | |
| "calcium": 306, | |
| "inato": 307, | |
| "chl": 308, | |
| "hyp": 309, | |
| "formaldehyde": 310, | |
| "rph": 311, | |
| "ni": 312, | |
| "mit": 313, | |
| "anuida": 314, | |
| "br": 315, | |
| "phthalic": 316, | |
| "iodanuid": 317, | |
| "ous": 318, | |
| "uracil": 319, | |
| "oroso": 320, | |
| "inan": 321, | |
| "arach": 322, | |
| "fg": 323, | |
| "mang": 324, | |
| "se": 325, | |
| "F": 326, | |
| "chromium": 327, | |
| "um": 328, | |
| "il": 329, | |
| "rc": 330, | |
| "amidic": 331, | |
| "uranium": 332, | |
| "alum": 333, | |
| "yg": 334, | |
| "ulf": 335, | |
| "hafnium": 336, | |
| "ver": 337, | |
| "rp": 338, | |
| "ars": 339, | |
| "odium": 340, | |
| "inamo": 341, | |
| "tra": 342, | |
| "da": 343, | |
| "mercury": 344, | |
| "iodite": 345, | |
| "ybd": 346, | |
| "rhodium": 347, | |
| "cupr": 348, | |
| "lign": 349, | |
| "iodine": 350, | |
| "aluman": 351, | |
| "actinium": 352, | |
| "rcar": 353, | |
| "thraqu": 354, | |
| "odi": 355, | |
| "hth": 356, | |
| "io": 357, | |
| "aluminum": 358, | |
| "thianthr": 359, | |
| "ill": 360, | |
| "barium": 361, | |
| "iod": 362, | |
| "isa": 363, | |
| "rubidium": 364, | |
| "cesium": 365, | |
| "ut": 366, | |
| "osmium": 367, | |
| "rr": 368, | |
| "terephthalic": 369, | |
| "fumar": 370, | |
| "rh": 371, | |
| "'b": 372, | |
| "apht": 373, | |
| "telluro": 374, | |
| "lut": 375, | |
| "inous": 376, | |
| "tellan": 377, | |
| "iodous": 378, | |
| "pim": 379, | |
| "liz": 380, | |
| "j": 381, | |
| "gad": 382, | |
| "inium": 383, | |
| "at": 384, | |
| "I": 385, | |
| "cadmium": 386, | |
| "bismuth": 387, | |
| "asar": 388, | |
| "ph": 389, | |
| "arb": 390, | |
| "tetramin": 391, | |
| "corrin": 392, | |
| "bac": 393, | |
| "rutherfordium": 394, | |
| "cerium": 395, | |
| "sub": 396, | |
| "cy": 397, | |
| "itr": 398, | |
| "hecta": 399, | |
| "sar": 400, | |
| "tyr": 401, | |
| "cuban": 402, | |
| "stiba": 403, | |
| "europium": 404, | |
| "gly": 405, | |
| "germa": 406, | |
| "thallium": 407, | |
| "technetium": 408, | |
| "lanthanum": 409, | |
| "la": 410, | |
| "na": 411, | |
| "tellur": 412, | |
| "lact": 413, | |
| "thial": 414, | |
| "str": 415, | |
| "arsan": 416, | |
| "chu": 417, | |
| "antim": 418, | |
| "oform": 419, | |
| "itril": 420, | |
| "sti": 421, | |
| "neodymium": 422, | |
| "tantalum": 423, | |
| "plumb": 424, | |
| "yohimban": 425, | |
| "cym": 426, | |
| "niobium": 427, | |
| "ld": 428, | |
| "alo": 429, | |
| "praseodymium": 430, | |
| "ocinn": 431, | |
| "hy": 432, | |
| "lead": 433, | |
| "inite": 434, | |
| "liss": 435, | |
| "cr": 436, | |
| "ci": 437, | |
| "rth": 438, | |
| "ytterbium": 439, | |
| "ra": 440, | |
| "\"": 441, | |
| "z": 442, | |
| "ps": 443, | |
| "samarium": 444, | |
| "naph": 445, | |
| "terbium": 446, | |
| "othialdehyde": 447, | |
| "scandium": 448, | |
| "tartar": 449, | |
| "pyruv": 450, | |
| "as": 451, | |
| "ber": 452, | |
| "lium": 453, | |
| "ll": 454, | |
| "nu": 455, | |
| "za": 456, | |
| "phthalaldehyde": 457, | |
| "llit": 458, | |
| "tassi": 459, | |
| "dysprosium": 460, | |
| "epin": 461, | |
| "lutetium": 462, | |
| "ct": 463, | |
| "acrido": 464, | |
| "ij": 465, | |
| "nthr": 466, | |
| "indium": 467, | |
| "fermium": 468, | |
| "pha": 469, | |
| "thra": 470, | |
| "gallium": 471, | |
| "erbium": 472, | |
| "gamma": 473, | |
| "flu": 474, | |
| "sam": 475, | |
| "hl": 476, | |
| "thorium": 477, | |
| "ma": 478, | |
| "terephthal": 479, | |
| "gallan": 480, | |
| "lum": 481, | |
| "mium": 482, | |
| "lacc": 483, | |
| "rs": 484, | |
| "cor": 485, | |
| "gall": 486, | |
| "hippur": 487, | |
| "taur": 488, | |
| "caff": 489, | |
| "nia": 490, | |
| "ip": 491, | |
| "pia": 492, | |
| "dur": 493, | |
| "glutam": 494, | |
| "fuller": 495, | |
| "atr": 496, | |
| "plast": 497, | |
| "terephthalaldehyde": 498, | |
| "gluc": 499, | |
| "phl": 500, | |
| "thulium": 501, | |
| "apr": 502, | |
| "mu": 503, | |
| "iran": 504, | |
| "jap": 505, | |
| "Tc": 506, | |
| "stib": 507, | |
| "citra": 508, | |
| "astatine": 509, | |
| "rcuri": 510, | |
| "it": 511, | |
| "iodido": 512, | |
| "brass": 513, | |
| "rcur": 514, | |
| "rchl": 515, | |
| "idic": 516, | |
| "citr": 517, | |
| "Br": 518, | |
| "aceanthr": 519, | |
| "rit": 520, | |
| "mim": 521, | |
| "rul": 522, | |
| "tit": 523, | |
| "pyranthr": 524, | |
| "Ih": 525, | |
| "protio": 526, | |
| "stilb": 527, | |
| "ypr": 528, | |
| "dicta": 529, | |
| "curium": 530, | |
| "sg": 531, | |
| "amin": 532, | |
| "mi": 533, | |
| "cta": 534, | |
| ":": 535, | |
| "ila": 536, | |
| "mm": 537, | |
| "neptunium": 538, | |
| "ulfit": 539, | |
| "aur": 540, | |
| "cac": 541, | |
| "orus": 542, | |
| "pp": 543, | |
| "cium": 544, | |
| "lawr": 545, | |
| "dd": 546, | |
| "ri": 547, | |
| "skat": 548, | |
| "thaps": 549, | |
| "hygr": 550, | |
| "parab": 551, | |
| "tartr": 552, | |
| "yv": 553, | |
| "germanium": 554, | |
| "plut": 555, | |
| "ita": 556, | |
| "wn": 557, | |
| "rphyr": 558, | |
| "ace": 559, | |
| "thym": 560, | |
| "apth": 561, | |
| "At": 562, | |
| "buckm": 563, | |
| "einsteinium": 564, | |
| "americium": 565, | |
| "pro": 566, | |
| "nobelium": 567, | |
| "T": 568, | |
| "xysucc": 569, | |
| "plumba": 570, | |
| "helium": 571, | |
| "w": 572, | |
| "P": 573, | |
| "mad": 574, | |
| "guaiac": 575, | |
| "gu": 576, | |
| "cadav": 577, | |
| "californium": 578, | |
| "tr": 579, | |
| "hnit": 580, | |
| "ilv": 581, | |
| "pla": 582, | |
| "ti": 583, | |
| "thyr": 584, | |
| "ru": 585, | |
| "sc": 586, | |
| "B": 587, | |
| "atido": 588, | |
| "protactinium": 589, | |
| "xyv": 590, | |
| "lup": 591, | |
| "pleiad": 592, | |
| "aluminan": 593, | |
| "ulfat": 594, | |
| "arsind": 595, | |
| "lmn": 596, | |
| "gium": 597, | |
| "rcura": 598, | |
| "sea": 599, | |
| "syr": 600, | |
| "li": 601, | |
| "camph": 602, | |
| "ychr": 603, | |
| "hect": 604, | |
| "flav": 605, | |
| "ybda": 606, | |
| "yp": 607, | |
| "rsa": 608, | |
| "ug": 609, | |
| "dubnium": 610, | |
| "oval": 611, | |
| "tis": 612, | |
| "yc": 613, | |
| "krypt": 614, | |
| "vi": 615, | |
| "berkelium": 616, | |
| "ign": 617, | |
| "fulm": 618, | |
| "xyst": 619, | |
| "tim": 620, | |
| "meitnerium": 621, | |
| "tellurium": 622, | |
| "nil": 623, | |
| "carvacr": 624, | |
| "D": 625, | |
| "hafna": 626, | |
| "ymyrist": 627, | |
| "llur": 628, | |
| "german": 629, | |
| "prism": 630, | |
| "rad": 631, | |
| "bohrium": 632, | |
| "rb": 633, | |
| "hassium": 634, | |
| "astat": 635, | |
| "delevium": 636, | |
| "symcl": 637, | |
| "umb": 638, | |
| "rach": 639, | |
| "llif": 640, | |
| "xycapr": 641, | |
| "xyp": 642, | |
| "ulfam": 643, | |
| "lat": 644, | |
| "gsta": 645, | |
| "hym": 646, | |
| "nti": 647, | |
| "yqu": 648, | |
| "sa": 649, | |
| "plum": 650, | |
| "xa": 651, | |
| "astata": 652, | |
| "xyacr": 653, | |
| "xym": 654, | |
| "ada": 655, | |
| "adm": 656, | |
| "fulv": 657, | |
| "ba": 658, | |
| "warfar": 659, | |
| "ycapr": 660, | |
| "rri": 661, | |
| "tipyr": 662, | |
| "ypip": 663, | |
| "hrys": 664, | |
| "ast": 665, | |
| "xyb": 666, | |
| "xyi": 667, | |
| "ruc": 668, | |
| "alumin": 669, | |
| "xymyrist": 670, | |
| "rut": 671, | |
| "jugl": 672, | |
| "ysucc": 673, | |
| "aci": 674, | |
| "radium": 675, | |
| "xypr": 676, | |
| "yacr": 677, | |
| "xychr": 678, | |
| "uvit": 679, | |
| "'c": 680, | |
| "ub": 681, | |
| "scul": 682, | |
| "xyarach": 683, | |
| "yt": 684, | |
| "safr": 685, | |
| "dymi": 686, | |
| "protide": 687, | |
| "rbr": 688, | |
| "sma": 689, | |
| "xychl": 690, | |
| "fusar": 691, | |
| "ga": 692, | |
| "As": 693, | |
| "In": 694, | |
| "pras": 695, | |
| "xyqu": 696, | |
| "abas": 697, | |
| "acc": 698, | |
| "yphth": 699, | |
| "xyc": 700, | |
| "ascl": 701, | |
| "gst": 702, | |
| "plumbag": 703, | |
| "yfur": 704, | |
| "xyglutar": 705, | |
| "Ga": 706, | |
| "asti": 707, | |
| "sux": 708, | |
| "xya": 709, | |
| "yb": 710, | |
| "ata": 711, | |
| "parax": 712, | |
| "G": 713, | |
| "Li": 714, | |
| "francium": 715, | |
| "rsaplumb": 716, | |
| "rv": 717, | |
| "daphn": 718, | |
| "ag": 719, | |
| "guai": 720, | |
| "ychl": 721, | |
| "yf": 722, | |
| "ym": 723, | |
| "samari": 724, | |
| "si": 725, | |
| "ucc": 726, | |
| "full": 727, | |
| "ib": 728, | |
| "nthrac": 729, | |
| "sap": 730, | |
| "ypyr": 731, | |
| "hn": 732, | |
| "sm": 733, | |
| "ta": 734, | |
| "ud": 735, | |
| "llura": 736, | |
| "yglutar": 737, | |
| "yst": 738, | |
| "btu": 739, | |
| "M": 740, | |
| "U": 741, | |
| "dyma": 742, | |
| "lad": 743, | |
| "magn": 744, | |
| "vacc": 745, | |
| "ya": 746, | |
| "ntim": 747, | |
| "rsast": 748, | |
| "ap": 749, | |
| "par": 750, | |
| "xypip": 751, | |
| "xysti": 752, | |
| "yamm": 753, | |
| "Pt": 754, | |
| "Y": 755, | |
| "aplumb": 756, | |
| "auri": 757, | |
| "bara": 758, | |
| "dyspr": 759, | |
| "frax": 760, | |
| "lada": 761, | |
| "purpur": 762, | |
| "sp": 763, | |
| "xysub": 764, | |
| "yisa": 765, | |
| "xyac": 766, | |
| "xyphth": 767, | |
| "yx": 768, | |
| "astib": 769, | |
| "chav": 770, | |
| "fursulti": 771, | |
| "hist": 772, | |
| "mast": 773, | |
| "rfull": 774, | |
| "uramil": 775, | |
| "usn": 776, | |
| "xypim": 777, | |
| "xyth": 778, | |
| "yhyd": 779, | |
| "Bi": 780, | |
| "Bk": 781, | |
| "Tl": 782, | |
| "thuli": 783, | |
| "tiba": 784, | |
| "xybr": 785, | |
| "xyim": 786, | |
| "ypim": 787, | |
| "ys": 788, | |
| "ytt": 789, | |
| "cyt": 790, | |
| "dr": 791, | |
| "ilast": 792, | |
| "nag": 793, | |
| "xypyr": 794, | |
| "xys": 795, | |
| "yarach": 796, | |
| "ybar": 797, | |
| "yfurfur": 798, | |
| "ysub": 799, | |
| "yuracil": 800, | |
| "aph": 801, | |
| "cad": 802, | |
| "cham": 803, | |
| "dym": 804, | |
| "laws": 805, | |
| "phys": 806, | |
| "rsam": 807, | |
| "stat": 808, | |
| "tsuzu": 809, | |
| "xymu": 810, | |
| "xystib": 811, | |
| "yac": 812, | |
| "yh": 813, | |
| "yhyp": 814, | |
| "yi": 815, | |
| "yim": 816, | |
| "yphl": 817, | |
| "ypi": 818, | |
| "yru": 819, | |
| "ystib": 820, | |
| "yur": 821 | |
| }, | |
| "unk_token": "<unk>" | |
| } | |
| } |