modules/pymol/parsing.py (474 lines of code) (raw):

#A* ------------------------------------------------------------------- #B* This file contains source code for the PyMOL computer program #C* Copyright (c) Schrodinger, LLC. #D* ------------------------------------------------------------------- #E* It is unlawful to modify or remove this copyright notice. #F* ------------------------------------------------------------------- #G* Please see the accompanying LICENSE file for further information. #H* ------------------------------------------------------------------- #I* Additional authors of this source file include: #-* #-* #-* #Z* ------------------------------------------------------------------- # parser2.py # An improved command parser for PyMOL, but still a terrible kluuge # PyMOL needs to migrate to a real parser soon! # === Goals: # 1. improved 1to1 mapping between pymol "cmd" API and command language # 2. support for named arguments # 3. support for calling arbitrary python functions via this mapping # === Syntatic Examples # * simple commands # command # * commands with arguments # # command value1 # command value1,value2 # command value1,value2,value3 # * commands with named arguments # # command argument1=value1 # command argument1=value1,argument2=value2,argument3=value3 # command argument3=value1,argument2=value2,argument1=value1 # * mixed... # # command value1,argument3=value3,arg # * commands with legacy '=' support for first argument # # command string1=value1 # * which should map to # command string1,value1 # * legacy '=' combined as above # # command string1=value1,value2 # command string1=value1,value2,value3,... # command string1=value1,argument3=value3 # === Burdens placed on API functions... # # None. However, function must have real arguments for error checking. # from __future__ import absolute_import # Don't import __future__.print_function if __name__=='pymol.parsing': import re import sys import threading import types import traceback import inspect from . import colorprinting class QuietException(BaseException): pass # constants for keyword modes SIMPLE = 0 # original pymol parsing (deprecated) MOVIE = 1 # ignore ";", treat entire line as a single command RUN = 2 # run command SPAWN = 3 # for spawn and fork commands ABORT = 4 # terminates command script PYTHON = 5 # pass entire line to python EMBED = 6 # embedded data PYTHON_BLOCK = 7 # embedded python block SKIP = 8 # skipping commands NO_CHECK = 10 # no error checking STRICT = 11 # strict name->argument checking SECURE = 12 # command not available in "secure" mode LEGACY = 13 # support legacy construct str1=val1,... -> str1,val1,... LITERAL = 20 # argument is to be treated as a literal string LITERAL1 = 21 # one regular argument, followed by literal string LITERAL2 = 22 # two regular argument, followed by literal string # key regular expressions arg_name_re = re.compile(r"[A-Za-z0-9_]+\s*\=") nester_char_re = re.compile(r"\(|\)|\[|\]") nester_re = re.compile(r"[^,;]*[\(\[]") arg_pre_nester_re = re.compile(r"([^,;\(\[]+)[\(\[]") arg_post_nester_re = re.compile(r"[^,;\(\[]*") arg_easy_nester_re = re.compile(r"\([^,]*\)|\[[^,]*\]") arg_hard_nester_re = re.compile(r"\(.*\)|\[.*\]") # NOTE '''sdf'sdfs''' doesn't work in below. arg_value_re = re.compile(r"'''[^']*'''|'[^']*'|"+r'"[^"]*"|[^,;]+') def trim_nester(st): # utility routine, returns single instance of a nested string # should be modified to handle quotes too pc = 1 l = len(st) c = 1 while c<l: if st[c] in ('(','['): pc = pc + 1 if st[c] in (')',']'): pc = pc - 1 c = c + 1 if not pc: break if pc: return None return st[0:c] def apply_arg(inp_arg,par=(),def_dict={}): n_inp = len(inp_arg) n_req = n_inp - len(def_dict) result = [] inp_dict = {} for a in inp_arg: if a[0] != None: inp_dict[a[0]] = a[1]; c = 0 for p in par: if c<n_inp: a = inp_arg[c] if a[0] == None: result.append(a[1]) c = c + 1 continue if p in inp_dict: result.append(inp_dict[p]) del inp_dict[p] elif p in def_dict: result.append(def_dict[p]) elif c<n_req: raise QuietException("Error: invalid argument(s).") c = c + 1 if len(inp_dict): raise QuietException("Error: invalid argument(s).") return result def parse_arg(st,mode=STRICT,_self=None): ''' parse_arg(st) expects entire command to be passed in returns list of tuples of strings: [(None,value),(name,value)...] ''' result = [] # current character cc = 0 a = st.split(None, 1) if len(a) == 2: st = a[1] while 1: if mode>=LITERAL: # LITERAL argument handling if (mode-LITERAL)==len(result): result.append((None, st[cc:].strip())) return result # clean whitespace st = st.lstrip() if st == '': break # read argument name, if any mo = arg_name_re.match(st) if mo: nam = mo.group(0)[:-1].strip() st = st[mo.end(0):].lstrip() else: nam = None # is one or more nesters present? skip_flag = 0 if nester_re.match(st[cc:]): skip_flag = 1 nest_flag = 1 nest_str = '' while nest_flag: # parse all the nesters nest_flag = 0 # text before nester? mo = arg_pre_nester_re.match(st[cc:]) if mo: nest_str = nest_str + mo.group(1) cc=cc+mo.end(1) # special handling for nesters (selections, lists, tuples, etc.) mo = arg_easy_nester_re.match(st[cc:]) # no internal commas if mo: cnt = len(nester_char_re.findall(mo.group(0))) if cnt % 2 == 1: # make sure nesters are matched in count mo = None if mo: nest_str = nest_str + mo.group(0) cc=cc+mo.end(0) # text after nester? mo = arg_post_nester_re.match(st[cc:]) if mo: post_nester = mo.group(0) cc=cc+mo.end(0) nest_str = nest_str + post_nester nest_flag = 1 # one more cycle else: mo = arg_hard_nester_re.match(st[cc:]) if mo: se = trim_nester(mo.group(0)) if se==None: colorprinting.error("Error: "+st) colorprinting.error("Error: "+" "*cc+"^ syntax error (type 1).") raise QuietException else: cc = cc + len(se) nest_str = nest_str + se # text after nester? mo = arg_post_nester_re.match(st[cc:]) if mo: nest_str = nest_str + mo.group(0) cc=cc+mo.end(0) nest_flag = 1 # one more cycle if not len(nest_str): # we must have failed to parse... skip_flag = 0 else: result.append((nam, nest_str.strip())) if not skip_flag: # no nester, so just read normal argument value argval = None mo = arg_value_re.match(st[cc:]) if not mo: if(st[cc:cc+1]!=','): colorprinting.error("Error: "+st) colorprinting.error("Error: "+" "*cc+"^ syntax error (type 2).") raise QuietException else: # allow blank arguments result.append((nam,None)) else: argval = mo.group(0) cc=cc+mo.end(0) while 1: # pickup unqouted characters after quotes mo = arg_value_re.match(st[cc:]) if not mo: break argval = argval + mo.group(0) cc=cc+mo.end(0) if argval!=None: result.append((nam, argval.strip())) # clean whitespace st = st[cc:].lstrip() cc = 0 # skip over comma if st != '': if st.startswith(','): st = st[1:].lstrip() else: colorprinting.error("Error: "+st) colorprinting.error("Error: "+" "*cc+"^ syntax error (type 3).") raise QuietException if __name__!='__main__': if _self._feedback(_self.fb_module.parser, _self.fb_mask.debugging): _self.fb_debug.write(" parsing-DEBUG: tup: "+str(result)+"\n") return result def dump_str_list(list): lst = list_to_str_list(list) for a in lst: print(a) def list_to_str_list(list,width=77,margin=2): # format strings into a list result = [] ll=len(list) if ll>0: mxln = 1 for a in list: if len(a)>mxln: mxln = len(a) n_col = width//mxln width = width - margin while (n_col * mxln + n_col*2)>width: n_col = n_col - 1 if n_col < 1: n_col = 1 ll = len(list) n_row = len(list)//n_col while (n_row*n_col)<ll: n_row = n_row + 1 rows = [] for a in range(n_row): rows.append([]) row = 0 pad_list = [] for a in list: pad_list.append(("%-"+str(mxln)+"s")%a) for a in pad_list: rows[row].append(a) row = row + 1 if row >= n_row: row = 0 for a in rows: st = margin*' ' row = 0 st = st + ' '.join(a) result.append(st) return result def dump_arg(name,arg_lst,nreq): ac = 0 pc = 0 st = "Usage: "+name if '_self' in arg_lst: arg_lst = list(arg_lst) arg_lst.remove('_self') for a in arg_lst: if ac>=nreq: st = st + " [" pc = pc + 1 if ac: st = st + ", " + a else: st = st + " " + a ac = ac + 1 print(st + " " + "]"*pc) def prepare_call(fn,lst,mode=STRICT,name=None,_self=None): # returns tuple of arg,kw or excepts if error if name==None: name=fn.__name__ result = (None,None) arg = [] kw = {} co = fn.__code__ if (co.co_flags & 0xC): # disable error checking for *arg or **kw functions mode = NO_CHECK offset = 1 if inspect.ismethod(fn) else 0 arg_nam = co.co_varnames[offset:co.co_argcount] narg = len(arg_nam) if fn.__defaults__: ndef = len(fn.__defaults__) else: ndef = 0 nreq = narg-ndef if len(lst)==1: if lst[0]==(None,'?'): dump_arg(name,arg_nam,nreq) raise QuietException if mode==NO_CHECK: # no error checking for a in lst: if a[0]==None: arg.append(a[1]) else: kw[a[0]]=a[1] # set feedback argument (quiet), if extant, results enabled, and not overridden if "quiet" in arg_nam: if "quiet" not in kw: if __name__!='__main__': if _self._feedback(_self.fb_module.cmd, _self.fb_mask.results): kw["quiet"] = 0 if "_self" not in kw: # always send _self in the dictionary kw["_self"]=_self else: # error checking enabled # build name dictionary, with required flag arg_dct={} c = 0 for a in arg_nam: arg_dct[a]=c<nreq c = c + 1 if mode==LEGACY: # handle legacy string=value transformation tmp_lst = [] for a in lst: if(a[0]!=None): if a[0] not in arg_dct: tmp_lst.extend([(None,a[0]),(None,a[1])]) else: tmp_lst.append(a) else: tmp_lst.append(a) lst = tmp_lst # make sure we don't have too many arguments if len(lst)>narg: if not narg: colorprinting.error("Error: too many arguments for %s; None expected."%(name)) elif narg==nreq: colorprinting.error("Error: too many arguments for %s; %d expected, %d found."%( name,nreq,len(lst))) dump_arg(name,arg_nam,nreq) else: colorprinting.error("Error: too many arguments for %s; %d to %d expected, %d found."%( name,nreq,narg,len(lst))) dump_arg(name,arg_nam,nreq) raise QuietException # match names to unnamed arguments to create argument dictionary ac = 0 val_dct = {} for a in lst: if a[0]==None: if ac>=narg: raise QuietException("Parsing-Error: ambiguous argument: '"+str(a[1])+"'") else: val_dct[arg_nam[ac]]=a[1] else: val_dct[a[0]]=a[1] ac = ac + 1 # now check to make sure we don't have any missing arguments for a in arg_nam: if arg_dct[a]: if a not in val_dct: raise QuietException("Parsing-Error: missing required argument in function %s : %s" % (name, a)) # return all arguments as keyword arguments kw = val_dct # set feedback argument (quiet), if extant, results enabled, and not overridden if "quiet" in arg_dct: if "quiet" not in kw: if _self._feedback(_self.fb_module.cmd, _self.fb_mask.results): kw["quiet"] = 0 # make sure command knows which PyMOL instance to message if "_self" in arg_nam: if "_self" not in kw: kw["_self"]=_self if __name__!='__main__': if _self._feedback(_self.fb_module.parser, _self.fb_mask.debugging): _self.fb_debug.write(" parsing-DEBUG: kw: "+str(kw)+"\n") return (arg,kw) # launching routines def run(filename, namespace='global', _spawn=0, _self=None): ''' DESCRIPTION "run" executes an external Python script in a local name space, the main Python namespace, the global PyMOL namespace, or in its own namespace (as a module). USAGE run file [, namespace ] ARGUMENTS file = string: a Python program, typically ending in .py or .pym. namespace = local, global, module, main, or private {default: global} NOTES Due to an idiosyncracy in Pickle, you can not pickle objects directly created at the main level in a script run as "module", (because the pickled object becomes dependent on that module). Workaround: delegate construction to an imported module. SEE ALSO spawn ''' from __main__ import __dict__ as ns_main from pymol import __dict__ as ns_pymol if not _self: from pymol import cmd as _self if filename.endswith('.pml'): return _self.load(filename) path = _self.exp_path(filename) spawn = int(_spawn) run_ = spawn_file if spawn else run_file if namespace == 'global': run_(path, ns_pymol, ns_pymol) elif namespace == 'local': run_(path, ns_pymol, {}) elif namespace == 'main': run_(path, ns_main, ns_main) elif namespace == 'private': run_(path, ns_main, {}) elif namespace == 'module': run_file_as_module(path, spawn=spawn) else: raise ValueError('invalid namespace "%s"' % namespace) def spawn(filename, namespace='module', _self=None): ''' DESCRIPTION "spawn" launches a Python script in a new thread which will run concurrently with the PyMOL interpreter. It can be run in its own namespace (like a Python module, default), a local name space, or in the global namespace. USAGE spawn file [, namespace ] NOTES The default namespace for spawn is "module". The best way to spawn processes at startup is to use the -l option (see "help launching"). SEE ALSO run ''' return run(filename, namespace, 1, _self) def _print_exc(): colorprinting.print_exc([__file__]) def execfile(filename, global_ns, local_ns): import pymol.internal as pi co = compile(pi.file_read(filename), filename, 'exec') exec(co, global_ns, local_ns) def run_file(file,global_ns,local_ns): global_ns['__script__'] = file try: execfile(file,global_ns,local_ns) except pymol.CmdException: # so the idea here is to print the traceback here and then # cascade all the way back up to the interactive level # without any further output _print_exc() raise QuietException def run_file_as_module(file,spawn=0): name = re.sub('[^A-Za-z0-9]','_',file) if not isinstance(name, str): # Python 2 only name = name.encode('ascii', errors='ignore') mod = types.ModuleType(name) mod.__file__ = file mod.__script__ = file sys.modules[name]=mod if spawn: t = threading.Thread(target=execfile, args=(file,mod.__dict__,mod.__dict__)) t.setDaemon(1) t.start() else: try: execfile(file,mod.__dict__,mod.__dict__) except pymol.CmdException: _print_exc() raise QuietException del sys.modules[name] del mod def spawn_file(args,global_ns,local_ns): local_ns['__script__'] = args t = threading.Thread(target=execfile,args=(args,global_ns,local_ns)) t.setDaemon(1) t.start() def split(*arg,**kw): # custom split-and-trim ''' split(string,token[,count]) -> list of strings UTILITY FUNCTION, NOT PART OF THE API Breaks strings up by tokens but preserves quoted strings and parenthetical groups (such as atom selections). USAGE OF THIS FUNCTION IS DISCOURAGED - THE GOAL IS TO MAKE IT UNNECESSARY BY IMPROVING THE BUILT-IN PARSER ''' str = arg[0] tok = arg[1] if len(arg)>2: mx=arg[2] else: mx=0 pair = { '(':')','[':']','{':'}',"'":"'",'"':'"' } plst = list(pair.keys()) stack = [] lst = [] c = 0 nf = 0 l = len(str) wd = "" while str[c]==tok: c = c + 1 while c<l: ch = str[c] if (ch in tok) and (len(stack)==0): lst.append(wd.strip()) nf = nf + 1 if mx: if nf==mx: wd = str[c+1:].strip() break; wd = '' w = 0 else: if len(stack): if ch==stack[0]: stack = stack[1:] elif (ch in plst): stack[:0]=[pair[ch]] elif (ch in plst): stack[:0]=[pair[ch]] wd = wd + ch c = c + 1 if len(wd): lst.append(wd.strip()) return lst import pymol