# Compact SELFIES token vocabulary. Entries are kept in ASCII-sorted order and
# grouped below by the character that follows the opening bracket.
SELFIES_VOCAB_SMALL = [
    # tokens prefixed with '#'
    '[#Branch1]', '[#Branch2]', '[#C]', '[#N]',
    # tokens prefixed with '='
    '[=Branch1]', '[=Branch2]', '[=C]', '[=N]', '[=O]', '[=Ring1]', '[=Ring2]', '[=S]',
    # tokens without a prefix character
    '[B]', '[Br]', '[Branch1]', '[Branch2]', '[C]', '[Cl]', '[F]', '[NH1]', '[N]', '[O]',
    '[P]', '[Ring1]', '[Ring2]', '[S]',
]
# len(SELFIES_VOCAB_SMALL) == 26
# Removed charged tokens: '[N+1]', '[O-1]' (from NO2 groups) and '[B-1]', '[=N+1]' (from BODIPYs).


# Extended SELFIES token vocabulary. Entries are kept in ASCII-sorted order and
# grouped below by the character that follows the opening bracket. Tokens that
# contain a backslash are written as raw strings, so each holds exactly one
# literal backslash character.
SELFIES_VOCAB_LARGE = [
    # tokens prefixed with '#'
    '[#Branch1]', '[#Branch2]', '[#C]', '[#N]',
    # tokens prefixed with '-'
    '[-/Ring1]', r'[-\Ring1]',
    # tokens prefixed with '/'
    '[/Br]', '[/C@@H1]', '[/C@@]', '[/C@H1]', '[/C@]', '[/C]', '[/Cl]', '[/F]', '[/NH1]',
    '[/N]', '[/O]', '[/S@]', '[/S]',
    # tokens prefixed with '='
    '[=Branch1]', '[=Branch2]', '[=C]', '[=O]', '[=P@@]', '[=P@]', '[=PH2]', '[=P]',
    '[=Ring1]', '[=Ring2]', '[=S@@]', '[=S@]', '[=S]',
    # tokens without a prefix character
    '[Br]', '[Branch1]', '[Branch2]', '[C@@H1]', '[C@@]', '[C@H1]', '[C@]', '[C]', '[Cl]',
    '[F]', '[I]', '[NH1]', '[N]', '[O]', '[P@@H1]', '[P@@]', '[P@]', '[PH1]', '[P]',
    '[Ring1]', '[Ring2]', '[S@@]', '[S@]', '[S]',
    # tokens prefixed with a backslash
    r'[\Br]', r'[\C@@H1]', r'[\C@H1]', r'[\C]', r'[\Cl]', r'[\F]', r'[\I]', r'[\NH1]',
    r'[\N]', r'[\O]', r'[\S@]', r'[\S]',
]
# len = 68
# removed: '[/N-1]', '[/S-1]', '[=N-1]', '[/NH1-1]', '[/O-1]', '[CH1-1]', '[CH2-1]', '[N-1]', '[NH1-1]', '[O-1]', '[S-1]',
# '[\\N-1]', '[\\O-1]', '[\\S-1]', '[#N+1]', '[/N+1]', '[/NH1+1]', '[/NH2+1]', '[/O+1]', '[=N+1]', '[=NH1+1]',
# '[=NH2+1]', '[=N]', '[=O+1]', '[=OH1+1]', '[=S+1]', '[=SH1+1]', '[N+1]', '[NH1+1]','[NH2+1]', '[NH3+1]', '[S+1]',
#  '[S@@+1]',  '[PH1+1]','[P+1]', '[\\N+1]', '[\\NH1+1]', '[\\NH2+1]',