Show More
@@ -1,313 +1,316 b'' | |||
|
1 | 1 | # -*- coding: utf-8 -*- |
|
2 | 2 | """ |
|
3 | 3 | Classes and functions for prefiltering (transforming) a line of user input. |
|
4 | 4 | This module is responsible, primarily, for breaking the line up into useful |
|
5 | 5 | pieces and triggering the appropriate handlers in iplib to do the actual |
|
6 | 6 | transforming work. |
|
7 | 7 | """ |
|
8 | 8 | __docformat__ = "restructuredtext en" |
|
9 | 9 | |
|
10 | 10 | import re |
|
11 | 11 | import IPython.ipapi |
|
12 | 12 | |
|
13 | 13 | class LineInfo(object): |
|
14 | 14 | """A single line of input and associated info. |
|
15 | 15 | |
|
16 | 16 | Includes the following as properties: |
|
17 | 17 | |
|
18 | 18 | line |
|
19 | 19 | The original, raw line |
|
20 | 20 | |
|
21 | 21 | continue_prompt |
|
22 | 22 | Is this line a continuation in a sequence of multiline input? |
|
23 | 23 | |
|
24 | 24 | pre |
|
25 | 25 | The initial esc character or whitespace. |
|
26 | 26 | |
|
27 | 27 | preChar |
|
28 | 28 | The escape character(s) in pre or the empty string if there isn't one. |
|
29 | 29 | Note that '!!' is a possible value for preChar. Otherwise it will |
|
30 | 30 | always be a single character. |
|
31 | 31 | |
|
32 | 32 | preWhitespace |
|
33 | 33 | The leading whitespace from pre if it exists. If there is a preChar, |
|
34 | 34 | this is just ''. |
|
35 | 35 | |
|
36 | 36 | iFun |
|
37 | 37 | The 'function part', which is basically the maximal initial sequence |
|
38 | 38 | of valid python identifiers and the '.' character. This is what is |
|
39 | 39 | checked for alias and magic transformations, used for auto-calling, |
|
40 | 40 | etc. |
|
41 | 41 | |
|
42 | 42 | theRest |
|
43 | 43 | Everything else on the line. |
|
44 | 44 | """ |
|
45 | 45 | def __init__(self, line, continue_prompt): |
|
46 | 46 | self.line = line |
|
47 | 47 | self.continue_prompt = continue_prompt |
|
48 | 48 | self.pre, self.iFun, self.theRest = splitUserInput(line) |
|
49 | 49 | |
|
50 | 50 | self.preChar = self.pre.strip() |
|
51 | 51 | if self.preChar: |
|
52 | 52 | self.preWhitespace = '' # No whitespace allowd before esc chars |
|
53 | 53 | else: |
|
54 | 54 | self.preWhitespace = self.pre |
|
55 | 55 | |
|
56 | 56 | self._oinfo = None |
|
57 | 57 | |
|
58 | 58 | def ofind(self, ip): |
|
59 | 59 | """Do a full, attribute-walking lookup of the iFun in the various |
|
60 | 60 | namespaces for the given IPython InteractiveShell instance. |
|
61 | 61 | |
|
62 | 62 | Return a dict with keys: found,obj,ospace,ismagic |
|
63 | 63 | |
|
64 | 64 | Note: can cause state changes because of calling getattr, but should |
|
65 | 65 | only be run if autocall is on and if the line hasn't matched any |
|
66 | 66 | other, less dangerous handlers. |
|
67 | 67 | |
|
68 | 68 | Does cache the results of the call, so can be called multiple times |
|
69 | 69 | without worrying about *further* damaging state. |
|
70 | 70 | """ |
|
71 | 71 | if not self._oinfo: |
|
72 | 72 | self._oinfo = ip._ofind(self.iFun) |
|
73 | 73 | return self._oinfo |
|
74 | ||
|
74 | def __str__(self): | |
|
75 | return "Lineinfo [%s|%s|%s]" %(self.pre,self.iFun,self.theRest) | |
|
75 | 76 | |
|
76 | 77 | def splitUserInput(line, pattern=None): |
|
77 | 78 | """Split user input into pre-char/whitespace, function part and rest. |
|
78 | 79 | |
|
79 | 80 | Mostly internal to this module, but also used by iplib.expand_aliases, |
|
80 | 81 | which passes in a shell pattern. |
|
81 | 82 | """ |
|
82 | 83 | # It seems to me that the shell splitting should be a separate method. |
|
83 | 84 | |
|
84 | 85 | if not pattern: |
|
85 | 86 | pattern = line_split |
|
86 | 87 | match = pattern.match(line) |
|
87 | 88 | if not match: |
|
88 | 89 | #print "match failed for line '%s'" % line |
|
89 | 90 | try: |
|
90 | 91 | iFun,theRest = line.split(None,1) |
|
91 | 92 | except ValueError: |
|
92 | 93 | #print "split failed for line '%s'" % line |
|
93 | 94 | iFun,theRest = line,'' |
|
94 | 95 | pre = re.match('^(\s*)(.*)',line).groups()[0] |
|
95 | 96 | else: |
|
96 | 97 | pre,iFun,theRest = match.groups() |
|
97 | 98 | |
|
98 | 99 | # iFun has to be a valid python identifier, so it better be only pure |
|
99 | 100 | # ascii, no unicode: |
|
100 | 101 | try: |
|
101 | 102 | iFun = iFun.encode('ascii') |
|
102 | 103 | except UnicodeEncodeError: |
|
103 | 104 | theRest = iFun + u' ' + theRest |
|
104 | 105 | iFun = u'' |
|
105 | 106 | |
|
106 | 107 | #print 'line:<%s>' % line # dbg |
|
107 | 108 | #print 'pre <%s> iFun <%s> rest <%s>' % (pre,iFun.strip(),theRest) # dbg |
|
108 | 109 | return pre,iFun.strip(),theRest.lstrip() |
|
109 | 110 | |
|
110 | 111 | |
|
111 | 112 | # RegExp for splitting line contents into pre-char//first word-method//rest. |
|
112 | 113 | # For clarity, each group in on one line. |
|
113 | 114 | |
|
114 | 115 | # WARNING: update the regexp if the escapes in iplib are changed, as they |
|
115 | 116 | # are hardwired in. |
|
116 | 117 | |
|
117 | 118 | # Although it's not solely driven by the regex, note that: |
|
118 | 119 | # ,;/% only trigger if they are the first character on the line |
|
119 | 120 | # ! and !! trigger if they are first char(s) *or* follow an indent |
|
120 | 121 | # ? triggers as first or last char. |
|
121 | 122 | |
|
122 | 123 | # The three parts of the regex are: |
|
123 | 124 | # 1) pre: pre_char *or* initial whitespace |
|
124 | 125 | # 2) iFun: first word/method (mix of \w and '.') |
|
125 | 126 | # 3) theRest: rest of line (separated from iFun by space if non-empty) |
|
126 | 127 | line_split = re.compile(r'^([,;/%?]|!!?|\s*)' |
|
127 | 128 | r'\s*([\w\.]+)' |
|
128 | 129 | r'(\s+.*$|$)') |
|
129 | 130 | |
|
130 | 131 | shell_line_split = re.compile(r'^(\s*)(\S*\s*)(.*$)') |
|
131 | 132 | |
|
132 | 133 | def prefilter(line_info, ip): |
|
133 | 134 | """Call one of the passed-in InteractiveShell's handler preprocessors, |
|
134 | 135 | depending on the form of the line. Return the results, which must be a |
|
135 | 136 | value, even if it's a blank ('').""" |
|
136 | 137 | # Note: the order of these checks does matter. |
|
137 | 138 | for check in [ checkEmacs, |
|
138 | 139 | checkIPyAutocall, |
|
139 | 140 | checkMultiLineShell, |
|
140 | 141 | checkEscChars, |
|
141 | 142 | checkAssignment, |
|
142 | 143 | checkAutomagic, |
|
143 | 144 | checkAlias, |
|
144 | 145 | checkPythonOps, |
|
145 | 146 | checkAutocall, |
|
146 | 147 | ]: |
|
147 | 148 | handler = check(line_info, ip) |
|
148 | 149 | if handler: |
|
149 | 150 | return handler(line_info) |
|
150 | 151 | |
|
151 | 152 | return ip.handle_normal(line_info) |
|
152 | 153 | |
|
153 | 154 | # Handler checks |
|
154 | 155 | # |
|
155 | 156 | # All have the same interface: they take a LineInfo object and a ref to the |
|
156 | 157 | # iplib.InteractiveShell object. They check the line to see if a particular |
|
157 | 158 | # handler should be called, and return either a handler or None. The |
|
158 | 159 | # handlers which they return are *bound* methods of the InteractiveShell |
|
159 | 160 | # object. |
|
160 | 161 | # |
|
161 | 162 | # In general, these checks should only take responsibility for their 'own' |
|
162 | 163 | # handler. If it doesn't get triggered, they should just return None and |
|
163 | 164 | # let the rest of the check sequence run. |
|
164 | 165 | def checkEmacs(l_info,ip): |
|
165 | 166 | "Emacs ipython-mode tags certain input lines." |
|
166 | 167 | if l_info.line.endswith('# PYTHON-MODE'): |
|
167 | 168 | return ip.handle_emacs |
|
168 | 169 | else: |
|
169 | 170 | return None |
|
170 | 171 | |
|
171 | 172 | def checkIPyAutocall(l_info,ip): |
|
172 | 173 | "Instances of IPyAutocall in user_ns get autocalled immediately" |
|
173 | 174 | obj = ip.user_ns.get(l_info.iFun, None) |
|
174 | 175 | if isinstance(obj, IPython.ipapi.IPyAutocall): |
|
175 | 176 | obj.set_ip(ip.api) |
|
176 | 177 | return ip.handle_auto |
|
177 | 178 | else: |
|
178 | 179 | return None |
|
179 | 180 | |
|
180 | 181 | |
|
181 | 182 | def checkMultiLineShell(l_info,ip): |
|
182 | 183 | "Allow ! and !! in multi-line statements if multi_line_specials is on" |
|
183 | 184 | # Note that this one of the only places we check the first character of |
|
184 | 185 | # iFun and *not* the preChar. Also note that the below test matches |
|
185 | 186 | # both ! and !!. |
|
186 | 187 | if l_info.continue_prompt \ |
|
187 |
|
|
|
188 |
|
|
|
188 | and ip.rc.multi_line_specials: | |
|
189 | if l_info.iFun.startswith(ip.ESC_SHELL): | |
|
189 | 190 | return ip.handle_shell_escape |
|
191 | if l_info.iFun.startswith(ip.ESC_MAGIC): | |
|
192 | return ip.handle_magic | |
|
190 | 193 | else: |
|
191 | 194 | return None |
|
192 | 195 | |
|
193 | 196 | def checkEscChars(l_info,ip): |
|
194 | 197 | """Check for escape character and return either a handler to handle it, |
|
195 | 198 | or None if there is no escape char.""" |
|
196 | 199 | if l_info.line[-1] == ip.ESC_HELP \ |
|
197 | 200 | and l_info.preChar != ip.ESC_SHELL \ |
|
198 | 201 | and l_info.preChar != ip.ESC_SH_CAP: |
|
199 | 202 | # the ? can be at the end, but *not* for either kind of shell escape, |
|
200 | 203 | # because a ? can be a vaild final char in a shell cmd |
|
201 | 204 | return ip.handle_help |
|
202 | 205 | elif l_info.preChar in ip.esc_handlers: |
|
203 | 206 | return ip.esc_handlers[l_info.preChar] |
|
204 | 207 | else: |
|
205 | 208 | return None |
|
206 | 209 | |
|
207 | 210 | |
|
208 | 211 | def checkAssignment(l_info,ip): |
|
209 | 212 | """Check to see if user is assigning to a var for the first time, in |
|
210 | 213 | which case we want to avoid any sort of automagic / autocall games. |
|
211 | 214 | |
|
212 | 215 | This allows users to assign to either alias or magic names true python |
|
213 | 216 | variables (the magic/alias systems always take second seat to true |
|
214 | 217 | python code). E.g. ls='hi', or ls,that=1,2""" |
|
215 | 218 | if l_info.theRest and l_info.theRest[0] in '=,': |
|
216 | 219 | return ip.handle_normal |
|
217 | 220 | else: |
|
218 | 221 | return None |
|
219 | 222 | |
|
220 | 223 | |
|
221 | 224 | def checkAutomagic(l_info,ip): |
|
222 | 225 | """If the iFun is magic, and automagic is on, run it. Note: normal, |
|
223 | 226 | non-auto magic would already have been triggered via '%' in |
|
224 | 227 | check_esc_chars. This just checks for automagic. Also, before |
|
225 | 228 | triggering the magic handler, make sure that there is nothing in the |
|
226 | 229 | user namespace which could shadow it.""" |
|
227 | 230 | if not ip.rc.automagic or not hasattr(ip,'magic_'+l_info.iFun): |
|
228 | 231 | return None |
|
229 | 232 | |
|
230 | 233 | # We have a likely magic method. Make sure we should actually call it. |
|
231 | 234 | if l_info.continue_prompt and not ip.rc.multi_line_specials: |
|
232 | 235 | return None |
|
233 | 236 | |
|
234 | 237 | head = l_info.iFun.split('.',1)[0] |
|
235 | 238 | if isShadowed(head,ip): |
|
236 | 239 | return None |
|
237 | 240 | |
|
238 | 241 | return ip.handle_magic |
|
239 | 242 | |
|
240 | 243 | |
|
241 | 244 | def checkAlias(l_info,ip): |
|
242 | 245 | "Check if the initital identifier on the line is an alias." |
|
243 | 246 | # Note: aliases can not contain '.' |
|
244 | 247 | head = l_info.iFun.split('.',1)[0] |
|
245 | 248 | |
|
246 | 249 | if l_info.iFun not in ip.alias_table \ |
|
247 | 250 | or head not in ip.alias_table \ |
|
248 | 251 | or isShadowed(head,ip): |
|
249 | 252 | return None |
|
250 | 253 | |
|
251 | 254 | return ip.handle_alias |
|
252 | 255 | |
|
253 | 256 | |
|
254 | 257 | def checkPythonOps(l_info,ip): |
|
255 | 258 | """If the 'rest' of the line begins with a function call or pretty much |
|
256 | 259 | any python operator, we should simply execute the line (regardless of |
|
257 | 260 | whether or not there's a possible autocall expansion). This avoids |
|
258 | 261 | spurious (and very confusing) geattr() accesses.""" |
|
259 | 262 | if l_info.theRest and l_info.theRest[0] in '!=()<>,+*/%^&|': |
|
260 | 263 | return ip.handle_normal |
|
261 | 264 | else: |
|
262 | 265 | return None |
|
263 | 266 | |
|
264 | 267 | |
|
265 | 268 | def checkAutocall(l_info,ip): |
|
266 | 269 | "Check if the initial word/function is callable and autocall is on." |
|
267 | 270 | if not ip.rc.autocall: |
|
268 | 271 | return None |
|
269 | 272 | |
|
270 | 273 | oinfo = l_info.ofind(ip) # This can mutate state via getattr |
|
271 | 274 | if not oinfo['found']: |
|
272 | 275 | return None |
|
273 | 276 | |
|
274 | 277 | if callable(oinfo['obj']) \ |
|
275 | 278 | and (not re_exclude_auto.match(l_info.theRest)) \ |
|
276 | 279 | and re_fun_name.match(l_info.iFun): |
|
277 | 280 | #print 'going auto' # dbg |
|
278 | 281 | return ip.handle_auto |
|
279 | 282 | else: |
|
280 | 283 | #print 'was callable?', callable(l_info.oinfo['obj']) # dbg |
|
281 | 284 | return None |
|
282 | 285 | |
|
283 | 286 | # RegExp to identify potential function names |
|
284 | 287 | re_fun_name = re.compile(r'[a-zA-Z_]([a-zA-Z0-9_.]*) *$') |
|
285 | 288 | |
|
286 | 289 | # RegExp to exclude strings with this start from autocalling. In |
|
287 | 290 | # particular, all binary operators should be excluded, so that if foo is |
|
288 | 291 | # callable, foo OP bar doesn't become foo(OP bar), which is invalid. The |
|
289 | 292 | # characters '!=()' don't need to be checked for, as the checkPythonChars |
|
290 | 293 | # routine explicitely does so, to catch direct calls and rebindings of |
|
291 | 294 | # existing names. |
|
292 | 295 | |
|
293 | 296 | # Warning: the '-' HAS TO BE AT THE END of the first group, otherwise |
|
294 | 297 | # it affects the rest of the group in square brackets. |
|
295 | 298 | re_exclude_auto = re.compile(r'^[,&^\|\*/\+-]' |
|
296 | 299 | r'|^is |^not |^in |^and |^or ') |
|
297 | 300 | |
|
298 | 301 | # try to catch also methods for stuff in lists/tuples/dicts: off |
|
299 | 302 | # (experimental). For this to work, the line_split regexp would need |
|
300 | 303 | # to be modified so it wouldn't break things at '['. That line is |
|
301 | 304 | # nasty enough that I shouldn't change it until I can test it _well_. |
|
302 | 305 | #self.re_fun_name = re.compile (r'[a-zA-Z_]([a-zA-Z0-9_.\[\]]*) ?$') |
|
303 | 306 | |
|
304 | 307 | # Handler Check Utilities |
|
305 | 308 | def isShadowed(identifier,ip): |
|
306 | 309 | """Is the given identifier defined in one of the namespaces which shadow |
|
307 | 310 | the alias and magic namespaces? Note that an identifier is different |
|
308 | 311 | than iFun, because it can not contain a '.' character.""" |
|
309 | 312 | # This is much safer than calling ofind, which can change state |
|
310 | 313 | return (identifier in ip.user_ns \ |
|
311 | 314 | or identifier in ip.internal_ns \ |
|
312 | 315 | or identifier in ip.ns_table['builtin']) |
|
313 | 316 |
General Comments 0
You need to be logged in to leave comments.
Login now