Coverage for local/lib/python2.7/site-packages/sage/repl/preparse.py: 94%

sage: dep_regex = r'^ *(?:(?:cimport +([\w\. ,]+))|(?:from +(\w+) +cimport)|(?:include *[\'"]([^\'"]+)[\'"])|(?:cdef *extern *from *[\'"]([^\'"]+)[\'"]))' # Ticket 5821

"""

new_code = []

literals = {}

counter = 0

start = q = 0

if state is None:

in_quote = False

raw = False

else:

in_quote, raw = state

while True:

sig_q = code.find("'", q)

dbl_q = code.find('"', q)

hash_q = code.find('#', q)

q = min(sig_q, dbl_q)

if q == -1: q = max(sig_q, dbl_q)

if not in_quote and hash_q != -1 and (q == -1 or hash_q < q):

# it's a comment

newline = code.find('\n', hash_q)

if newline == -1: newline = len(code)

counter += 1

label = "L%s" % counter

literals[label] = code[hash_q+1:newline]

new_code.append(code[start:hash_q].replace('%','%%'))

new_code.append("#%%(%s)s" % label)

start = q = newline

elif q == -1:

if in_quote:

counter += 1

label = "L%s" % counter

literals[label] = code[start:]

new_code.append("%%(%s)s" % label)

else:

new_code.append(code[start:].replace('%','%%'))

break

elif in_quote:

if code[q-1] == '\\':

k = 2

while code[q-k] == '\\':

k += 1

if k % 2 == 0:

q += 1

if code[q:q+len(in_quote)] == in_quote:

counter += 1

label = "L%s" % counter

literals[label] = code[start:q+len(in_quote)]

new_code.append("%%(%s)s" % label)

q += len(in_quote)

start = q

in_quote = False

else:

q += 1

else:

raw = q>0 and code[q-1] in 'rR'

if len(code) >= q+3 and (code[q+1] == code[q] == code[q+2]):

in_quote = code[q]*3

else:

in_quote = code[q]

new_code.append(code[start:q].replace('%', '%%'))

start = q

q += len(in_quote)

return "".join(new_code), literals, (in_quote, raw)

def containing_block(code, idx, delimiters=['()','[]','{}'], require_delim=True):

"""

Find the code block given by balanced delimiters that contains the position ``idx``.

INPUT:

- ``code`` - a string

- ``idx`` - an integer; a starting position

- ``delimiters`` - a list of strings (default: ['()', '[]',

'{}']); the delimiters to balance. A delimiter must be a single

character and no character can at the same time be opening and

closing delimiter.

- ``require_delim`` - a boolean (default: True); whether to raise

a SyntaxError if delimiters are present. If the delimiters are

unbalanced, an error will be raised in any case.

OUTPUT:

- a 2-tuple ``(a,b)`` of integers, such that ``code[a:b]`` is

delimited by balanced delimiters, ``a<=idx<b``, and ``a``

is maximal and ``b`` is minimal with that property. If that

does not exist, a ``SyntaxError`` is raised.

- If ``require_delim`` is false and ``a,b`` as above can not be

found, then ``0, len(code)`` is returned.

EXAMPLES::

sage: from sage.repl.preparse import containing_block

sage: s = "factor(next_prime(L[5]+1))"

sage: s[22]

'+'

sage: start, end = containing_block(s, 22)

sage: start, end

(17, 25)

sage: s[start:end]

'(L[5]+1)'

sage: s[20]

'5'

sage: start, end = containing_block(s, 20); s[start:end]

'[5]'

sage: start, end = containing_block(s, 20, delimiters=['()']); s[start:end]

'(L[5]+1)'

sage: start, end = containing_block(s, 10); s[start:end]

'(next_prime(L[5]+1))'

TESTS::

sage: containing_block('((a{))',0)

Traceback (most recent call last):

...

SyntaxError: Unbalanced delimiters

sage: containing_block('((a{))',1)

Traceback (most recent call last):

...

SyntaxError: Unbalanced delimiters

sage: containing_block('((a{))',2)

Traceback (most recent call last):

...

SyntaxError: Unbalanced delimiters

sage: containing_block('((a{))',3)

Traceback (most recent call last):

...

SyntaxError: Unbalanced delimiters

sage: containing_block('((a{))',4)

Traceback (most recent call last):

...

SyntaxError: Unbalanced delimiters

sage: containing_block('((a{))',5)

Traceback (most recent call last):

...

SyntaxError: Unbalanced delimiters

sage: containing_block('(()()',1)

(1, 3)

sage: containing_block('(()()',3)

(3, 5)

sage: containing_block('(()()',4)

(3, 5)

sage: containing_block('(()()',0)

Traceback (most recent call last):

...

SyntaxError: Unbalanced delimiters

sage: containing_block('(()()',0, require_delim=False)

(0, 5)

sage: containing_block('((})()',1, require_delim=False)

(0, 6)

sage: containing_block('abc',1, require_delim=False)

(0, 3)

"""

openings = "".join([d[0] for d in delimiters])

closings = "".join([d[-1] for d in delimiters])

levels = [0] * len(openings)

p = 0

start = idx

while start >= 0:

if code[start] in openings:

p = openings.index(code[start])

levels[p] -= 1

if levels[p] == -1:

break

elif code[start] in closings and start < idx:

p = closings.index(code[start])

levels[p] += 1

start -= 1

if start == -1:

if require_delim:

raise SyntaxError("Unbalanced or missing delimiters")

else:

return 0, len(code)

if levels.count(0) != len(levels)-1:

if require_delim:

raise SyntaxError("Unbalanced delimiters")

else:

return 0, len(code)

p0 = p

# We now have levels[p0]==-1. We go to the right hand side

# till we find a closing delimiter of type p0 that makes

# levels[p0]==0.

end = idx

while end < len(code):

if code[end] in closings:

p = closings.index(code[end])

levels[p] += 1

if p==p0 and levels[p] == 0:

break

elif code[end] in openings and end > idx:

p = openings.index(code[end])

levels[p] -= 1

end += 1

if levels.count(0) != len(levels):

# This also occurs when end==len(code) without finding a closing delimiter

if require_delim:

raise SyntaxError("Unbalanced delimiters")

else:

return 0, len(code)

return start, end+1

def parse_ellipsis(code, preparse_step=True):

"""

Preparses [0,2,..,n] notation.

INPUT:

- ``code`` - a string

- ``preparse_step`` - a boolean (default: True)

OUTPUT:

- a string

EXAMPLES::

sage: from sage.repl.preparse import parse_ellipsis

sage: parse_ellipsis("[1,2,..,n]")

'(ellipsis_range(1,2,Ellipsis,n))'

sage: parse_ellipsis("for i in (f(x) .. L[10]):")

'for i in (ellipsis_iter(f(x) ,Ellipsis, L[10])):'

sage: [1.0..2.0]

[1.00000000000000, 2.00000000000000]

TESTS:

Check that nested ellipsis is processed correctly (:trac:`17378`)::

sage: preparse('[1,..,2,..,len([1..3])]')

'(ellipsis_range(Integer(1),Ellipsis,Integer(2),Ellipsis,len((ellipsis_range(Integer(1),Ellipsis,Integer(3))))))'

"""

ix = code.find('..')

while ix != -1:

if ix == 0:

raise SyntaxError("Cannot start line with ellipsis.")

elif code[ix-1]=='.':

# '...' be valid Python in index slices

code = code[:ix-1] + "Ellipsis" + code[ix+2:]

elif len(code) >= ix+3 and code[ix+2]=='.':

# '...' be valid Python in index slices

code = code[:ix] + "Ellipsis" + code[ix+3:]

else:

start_list, end_list = containing_block(code, ix, ['()','[]'])

#search the current containing block for other '..' occurrences that may

#be contained in proper subblocks. Those need to be processed before

#we can deal with the present level of ellipses.

ix = code.find('..',ix+2,end_list)

while ix != -1:

if code[ix-1]!='.' and code[ix+2]!='.':

start_list,end_list = containing_block(code,ix,['()','[]'])

ix = code.find('..',ix+2,end_list)

arguments = code[start_list+1:end_list-1].replace('...', ',Ellipsis,').replace('..', ',Ellipsis,')

arguments = re.sub(r',\s*,', ',', arguments)

if preparse_step:

arguments = arguments.replace(';', ', step=')

range_or_iter = 'range' if code[start_list]=='[' else 'iter'

code = "%s(ellipsis_%s(%s))%s" % (code[:start_list],

range_or_iter,

arguments,

code[end_list:])

ix = code.find('..')

return code

def extract_numeric_literals(code):

"""

Pulls out numeric literals and assigns them to global variables.

This eliminates the need to re-parse and create the literals,

e.g., during every iteration of a loop.

INPUT:

- ``code`` - a string; a block of code

OUTPUT:

- a (string, string:string dictionary) 2-tuple; the block with

literals replaced by variable names and a mapping from names to

the new variables

EXAMPLES::

sage: from sage.repl.preparse import extract_numeric_literals

sage: code, nums = extract_numeric_literals("1.2 + 5")

sage: print(code)

_sage_const_1p2 + _sage_const_5

sage: print(nums)

{'_sage_const_1p2': "RealNumber('1.2')", '_sage_const_5': 'Integer(5)'}

sage: extract_numeric_literals("[1, 1.1, 1e1, -1e-1, 1.]")[0]

'[_sage_const_1 , _sage_const_1p1 , _sage_const_1e1 , -_sage_const_1en1 , _sage_const_1p ]'

sage: extract_numeric_literals("[1.sqrt(), 1.2.sqrt(), 1r, 1.2r, R.1, R0.1, (1..5)]")[0]

'[_sage_const_1 .sqrt(), _sage_const_1p2 .sqrt(), 1 , 1.2 , R.1, R0.1, (_sage_const_1 .._sage_const_5 )]'

"""

return preparse_numeric_literals(code, True)

all_num_regex = None

def preparse_numeric_literals(code, extract=False):

"""

This preparses numerical literals into their Sage counterparts,

e.g. Integer, RealNumber, and ComplexNumber.

INPUT:

- ``code`` - a string; a code block to preparse

- ``extract`` - a boolean (default: False); whether to create

names for the literals and return a dictionary of

name-construction pairs

OUTPUT:

- a string or (string, string:string dictionary) 2-tuple; the

preparsed block and, if ``extract`` is True, the

name-construction mapping

EXAMPLES::

sage: from sage.repl.preparse import preparse_numeric_literals

sage: preparse_numeric_literals("5")

'Integer(5)'

sage: preparse_numeric_literals("5j")

"ComplexNumber(0, '5')"

sage: preparse_numeric_literals("5jr")

'5J'

sage: preparse_numeric_literals("5l")

'5l'

sage: preparse_numeric_literals("5L")

'5L'

sage: preparse_numeric_literals("1.5")

"RealNumber('1.5')"

sage: preparse_numeric_literals("1.5j")

"ComplexNumber(0, '1.5')"

sage: preparse_numeric_literals(".5j")

"ComplexNumber(0, '.5')"

sage: preparse_numeric_literals("5e9j")

"ComplexNumber(0, '5e9')"

sage: preparse_numeric_literals("5.")

"RealNumber('5.')"

sage: preparse_numeric_literals("5.j")

"ComplexNumber(0, '5.')"

sage: preparse_numeric_literals("5.foo()")

'Integer(5).foo()'

sage: preparse_numeric_literals("5.5.foo()")

"RealNumber('5.5').foo()"

sage: preparse_numeric_literals("5.5j.foo()")

"ComplexNumber(0, '5.5').foo()"

sage: preparse_numeric_literals("5j.foo()")

"ComplexNumber(0, '5').foo()"

sage: preparse_numeric_literals("1.exp()")

'Integer(1).exp()'

sage: preparse_numeric_literals("1e+10")

"RealNumber('1e+10')"

sage: preparse_numeric_literals("0x0af")

'Integer(0x0af)'

sage: preparse_numeric_literals("0x10.sqrt()")

'Integer(0x10).sqrt()'

sage: preparse_numeric_literals('0o100')

'Integer(0o100)'

sage: preparse_numeric_literals('0b111001')

'Integer(0b111001)'

sage: preparse_numeric_literals('0xe')

'Integer(0xe)'

sage: preparse_numeric_literals('0xEAR')

'0xEA'

sage: preparse_numeric_literals('0x1012Fae')

'Integer(0x1012Fae)'

"""

literals = {}

last = 0

new_code = []

global all_num_regex

if all_num_regex is None:

dec_num = r"\b\d+"

hex_num = r"\b0x[0-9a-f]+"

oct_num = r"\b0o[0-7]+"

bin_num = r"\b0b[01]+"

# This is slightly annoying as floating point numbers may start

# with a decimal point, but if they do the \b will not match.

float_num = r"((\b\d+([.]\d*)?)|([.]\d+))(e[-+]?\d+)?"

all_num = r"((%s)|(%s)|(%s)|(%s)|(%s))(rj|rL|jr|Lr|j|L|r|)\b" % (hex_num, oct_num, bin_num, float_num, dec_num)

all_num_regex = re.compile(all_num, re.I)

for m in all_num_regex.finditer(code):

start, end = m.start(), m.end()

num = m.group(1)

postfix = m.groups()[-1].upper()

if 'R' in postfix:

num_name = num_make = num + postfix.replace('R', '')

elif 'L' in postfix:

continue

else:

# The Sage preparser does extra things with numbers, which we need to handle here.

if '.' in num:

if start > 0 and num[0] == '.':

if code[start-1] == '.':

# handle Ellipsis

start += 1

num = num[1:]

elif re.match(r'[a-zA-Z0-9_\])]', code[start-1]):

# handle R.0

continue

elif end < len(code) and num[-1] == '.':

if re.match('[a-zA-Z_]', code[end]):

# handle 4.sqrt()

end -= 1

num = num[:-1]

elif end < len(code) and code[end] == '.' and not postfix and re.match(r'\d+$', num):

# \b does not match after the . for floating point

# two dots in a row would be an ellipsis

if end+1 == len(code) or code[end+1] != '.':

end += 1

num += '.'

num_name = numeric_literal_prefix + num.replace('.', 'p').replace('-', 'n').replace('+', '')

if 'J' in postfix:

num_make = "ComplexNumber(0, '%s')" % num

num_name += 'j'

elif len(num) < 2 or num[1] in 'oObBxX':

num_make = "Integer(%s)" % num

elif '.' in num or 'e' in num or 'E' in num:

num_make = "RealNumber('%s')" % num

elif num[0] == "0":

num_make = "Integer('%s')" % num

else:

num_make = "Integer(%s)" % num

literals[num_name] = num_make

new_code.append(code[last:start])

if extract:

new_code.append(num_name+' ')

else:

new_code.append(num_make)

last = end

new_code.append(code[last:])

code = ''.join(new_code)

if extract:

return code, literals

else:

return code

def strip_prompts(line):

r"""

Removes leading sage: and >>> prompts so that pasting of examples

from the documentation works.

INPUT:

- ``line`` - a string to process

OUTPUT:

- a string stripped of leading prompts

EXAMPLES::

sage: from sage.repl.preparse import strip_prompts

sage: strip_prompts("sage: 2 + 2")

'2 + 2'

sage: strip_prompts(">>> 3 + 2")

'3 + 2'

sage: strip_prompts(" 2 + 4")

' 2 + 4'

"""

for prompt in ['sage:', '>>>']:

if line.startswith(prompt):

line = line[len(prompt):].lstrip()

break

return line

def preparse_calculus(code):

"""

Supports calculus-like function assignment, e.g., transforms::

f(x,y,z) = sin(x^3 - 4*y) + y^x

into::

__tmp__=var("x,y,z")

f = symbolic_expression(sin(x**3 - 4*y) + y**x).function(x,y,z)

AUTHORS:

- Bobby Moretti

- Initial version - 02/2007

- William Stein

- Make variables become defined if they aren't already defined.

- Robert Bradshaw

- Rewrite using regular expressions (01/2009)

EXAMPLES::

sage: preparse("f(x) = x^3-x")

'__tmp__=var("x"); f = symbolic_expression(x**Integer(3)-x).function(x)'

sage: preparse("f(u,v) = u - v")

'__tmp__=var("u,v"); f = symbolic_expression(u - v).function(u,v)'

sage: preparse("f(x) =-5")

'__tmp__=var("x"); f = symbolic_expression(-Integer(5)).function(x)'

sage: preparse("f(x) -= 5")

'f(x) -= Integer(5)'

sage: preparse("f(x_1, x_2) = x_1^2 - x_2^2")

'__tmp__=var("x_1,x_2"); f = symbolic_expression(x_1**Integer(2) - x_2**Integer(2)).function(x_1,x_2)'

For simplicity, this function assumes all statements begin and end

with a semicolon::

sage: from sage.repl.preparse import preparse_calculus

sage: preparse_calculus(";f(t,s)=t^2;")

';__tmp__=var("t,s"); f = symbolic_expression(t^2).function(t,s);'

sage: preparse_calculus(";f( t , s ) = t^2;")

';__tmp__=var("t,s"); f = symbolic_expression(t^2).function(t,s);'

TESTS:

The arguments in the definition must be symbolic variables (:trac:`10747`)::

sage: preparse_calculus(";f(_sage_const_)=x;")

Traceback (most recent call last):

...

ValueError: Argument names should be valid python identifiers.

Although preparse_calculus returns something for f(1)=x, when

preparsing a file an exception is raised because it is invalid python::

sage: preparse_calculus(";f(1)=x;")

';__tmp__=var("1"); f = symbolic_expression(x).function(1);'

sage: from sage.repl.preparse import preparse_file

sage: preparse_file("f(1)=x")

Traceback (most recent call last):

...

ValueError: Argument names should be valid python identifiers.

sage: from sage.repl.preparse import preparse_file

sage: preparse_file("f(x,1)=2")

Traceback (most recent call last):

...

ValueError: Argument names should be valid python identifiers.

"""

new_code = []

last_end = 0

# f ( vars ) = expr

for m in re.finditer(r";(\s*)([a-zA-Z_]\w*) *$([^()]+)$ *= *([^;#=][^;#]*)", code):

ident, func, vars, expr = m.groups()

stripped_vars = [v.strip() for v in vars.split(',')]

# if the variable name starts with numeric_literal_prefix

# the argument name for the symbolic expression is a numeric literal

# such as f(2)=5

if any(n.startswith(numeric_literal_prefix) for n in stripped_vars):

raise ValueError("Argument names should be valid python identifiers.")

vars = ','.join(stripped_vars)

new_code.append(code[last_end:m.start()])

new_code.append(';%s__tmp__=var("%s"); %s = symbolic_expression(%s).function(%s)' %

(ident, vars, func, expr, vars))

last_end = m.end()

if last_end == 0:

return code

else:

new_code.append(code[m.end():])

return ''.join(new_code)

def preparse_generators(code):

r"""

Parses generator syntax, converting::

obj.<gen0,gen1,...,genN> = objConstructor(...)

into::

obj = objConstructor(..., names=("gen0", "gen1", ..., "genN"))

(gen0, gen1, ..., genN,) = obj.gens()

and::

obj.<gen0,gen1,...,genN> = R[interior]

into::

obj = R[interior]; (gen0, gen1, ..., genN,) = obj.gens()

INPUT:

- ``code`` - a string

OUTPUT:

- a string

LIMITATIONS:

- The entire constructor *must* be on one line.

AUTHORS:

- 2006-04-14: Joe Wetherell (jlwether@alum.mit.edu)

- Initial version.

- 2006-04-17: William Stein

- Improvements to allow multiple statements.

- 2006-05-01: William

- Fix bug that Joe found.

- 2006-10-31: William

- Fix so obj doesn't have to be mutated.

- 2009-01-27: Robert Bradshaw

- Rewrite using regular expressions

TESTS::

sage: from sage.repl.preparse import preparse, preparse_generators

Vanilla::

sage: preparse("R.<x> = ZZ['x']")

"R = ZZ['x']; (x,) = R._first_ngens(1)"

sage: preparse("R.<x,y> = ZZ['x,y']")

"R = ZZ['x,y']; (x, y,) = R._first_ngens(2)"

No square brackets::

sage: preparse("R.<x> = PolynomialRing(ZZ, 'x')")

"R = PolynomialRing(ZZ, 'x', names=('x',)); (x,) = R._first_ngens(1)"

sage: preparse("R.<x,y> = PolynomialRing(ZZ, 'x,y')")

"R = PolynomialRing(ZZ, 'x,y', names=('x', 'y',)); (x, y,) = R._first_ngens(2)"

Names filled in::

sage: preparse("R.<x> = ZZ[]")

"R = ZZ['x']; (x,) = R._first_ngens(1)"

sage: preparse("R.<x,y> = ZZ[]")

"R = ZZ['x, y']; (x, y,) = R._first_ngens(2)"

Names given not the same as generator names::

sage: preparse("R.<x> = ZZ['y']")

"R = ZZ['y']; (x,) = R._first_ngens(1)"

sage: preparse("R.<x,y> = ZZ['u,v']")

"R = ZZ['u,v']; (x, y,) = R._first_ngens(2)"

Number fields::

sage: preparse("K.<a> = QQ[2^(1/3)]")

'K = QQ[Integer(2)**(Integer(1)/Integer(3))]; (a,) = K._first_ngens(1)'

sage: preparse("K.<a, b> = QQ[2^(1/3), 2^(1/2)]")

'K = QQ[Integer(2)**(Integer(1)/Integer(3)), Integer(2)**(Integer(1)/Integer(2))]; (a, b,) = K._first_ngens(2)'

Just the .<> notation::

sage: preparse("R.<x> = ZZx")

'R = ZZx; (x,) = R._first_ngens(1)'

sage: preparse("R.<x, y> = a+b")

'R = a+b; (x, y,) = R._first_ngens(2)'

sage: preparse("A.<x,y,z>=FreeAlgebra(ZZ,3)")

"A = FreeAlgebra(ZZ,Integer(3), names=('x', 'y', 'z',)); (x, y, z,) = A._first_ngens(3)"

Ensure we don't eat too much::

sage: preparse("R.<x, y> = ZZ;2")

'R = ZZ; (x, y,) = R._first_ngens(2);Integer(2)'

sage: preparse("R.<x, y> = ZZ['x,y'];2")

"R = ZZ['x,y']; (x, y,) = R._first_ngens(2);Integer(2)"

sage: preparse("F.<b>, f, g = S.field_extension()")

"F, f, g = S.field_extension(names=('b',)); (b,) = F._first_ngens(1)"

For simplicity, this function assumes all statements begin and end

with a semicolon::

sage: preparse_generators("; R.<x>=ZZ[];")

"; R = ZZ['x']; (x,) = R._first_ngens(1);"

See :trac:`16731` ::

sage: preparse_generators('R.<x> = ')

'R.<x> = '

"""

new_code = []

last_end = 0

# obj .< gens > , other = constructor

for m in re.finditer(r";(\s*)([a-zA-Z_]\w*)\.<([^>]+)> *((?:,[\w, ]+)?)= *([^;#]+)", code):

ident, obj, gens, other_objs, constructor = m.groups()

gens = [v.strip() for v in gens.split(',')]

constructor = constructor.rstrip()

if len(constructor) == 0:

pass # SyntaxError will be raised by Python later

elif constructor[-1] == ')':

if '(' not in constructor:

raise SyntaxError("Mismatched ')'")

opening = constructor.rindex('(')

# Only use comma if there are already arguments to the constructor

comma = ', ' if constructor[opening+1:-1].strip() != '' else ''

names = "('%s',)" % "', '".join(gens)

constructor = constructor[:-1] + comma + "names=%s)" % names

elif constructor[-1] == ']':

# Could be nested.

if '[' not in constructor:

raise SyntaxError("Mismatched ']'")

opening = constructor.rindex('[')

closing = constructor.index(']', opening)

if constructor[opening+1:closing].strip() == '':

names = "'" + ', '.join(gens) + "'"

constructor = constructor[:opening+1] + names + constructor[closing:]

else:

pass

gens_tuple = "(%s,)" % ', '.join(gens)

new_code.append(code[last_end:m.start()])

new_code.append(";%s%s%s = %s; %s = %s._first_ngens(%s)" %

(ident, obj, other_objs, constructor, gens_tuple, obj, len(gens)))

last_end = m.end()

if last_end == 0:

return code

else:

new_code.append(code[m.end():])

return ''.join(new_code)

quote_state = None

def preparse(line, reset=True, do_time=False, ignore_prompts=False,

numeric_literals=True):

r"""

Preparses a line of input.

INPUT:

- ``line`` - a string

- ``reset`` - a boolean (default: True)

- ``do_time`` - a boolean (default: False)

- ``ignore_prompts`` - a boolean (default: False)

- ``numeric_literals`` - a boolean (default: True)

OUTPUT:

- a string

EXAMPLES::

sage: preparse("ZZ.<x> = ZZ['x']")

"ZZ = ZZ['x']; (x,) = ZZ._first_ngens(1)"

sage: preparse("ZZ.<x> = ZZ['y']")

"ZZ = ZZ['y']; (x,) = ZZ._first_ngens(1)"

sage: preparse("ZZ.<x,y> = ZZ[]")

"ZZ = ZZ['x, y']; (x, y,) = ZZ._first_ngens(2)"

sage: preparse("ZZ.<x,y> = ZZ['u,v']")

"ZZ = ZZ['u,v']; (x, y,) = ZZ._first_ngens(2)"

sage: preparse("ZZ.<x> = QQ[2^(1/3)]")

'ZZ = QQ[Integer(2)**(Integer(1)/Integer(3))]; (x,) = ZZ._first_ngens(1)'

sage: QQ[2^(1/3)]

Number Field in a with defining polynomial x^3 - 2

sage: preparse("a^b")

'a**b'

sage: preparse("a^^b")

'a^b'

sage: 8^1

sage: 8^^1

sage: 9^^1

sage: preparse("A \\ B")

'A * BackslashOperator() * B'

sage: preparse("A^2 \\ B + C")

'A**Integer(2) * BackslashOperator() * B + C'

sage: preparse("a \\ b \\") # There is really only one backslash here, it's just being escaped.

'a * BackslashOperator() * b \\'

sage: preparse("time R.<x> = ZZ[]", do_time=True)

'__time__=misc.cputime(); __wall__=misc.walltime(); R = ZZ[\'x\']; print("Time: CPU %.2f s, Wall: %.2f s"%(misc.cputime(__time__), misc.walltime(__wall__))); (x,) = R._first_ngens(1)'

"""

global quote_state

if reset:

quote_state = None

L = line.lstrip()

if len(L) > 0 and L[0] in ['#', '!']:

return line

if L.startswith('...'):

i = line.find('...')

return line[:i+3] + preparse(line[i+3:], reset=reset, do_time=do_time, ignore_prompts=ignore_prompts)

if ignore_prompts:

# Get rid of leading sage: and >>> so that pasting of examples from

# the documentation works.

line = strip_prompts(line)

# This part handles lines with semi-colons all at once

# Then can also handle multiple lines more efficiently, but

# that optimization can be done later.

L, literals, quote_state = strip_string_literals(line, quote_state)

# Ellipsis Range

# [1..n]

try:

L = parse_ellipsis(L, preparse_step=False)

except SyntaxError:

pass

if implicit_mul_level:

# Implicit Multiplication

# 2x -> 2*x

L = implicit_mul(L, level = implicit_mul_level)

if numeric_literals:

# Wrapping

# 1 + 0.5 -> Integer(1) + RealNumber('0.5')

L = preparse_numeric_literals(L)

# Generators

# R.0 -> R.gen(0)

L = re.sub(r'([_a-zA-Z]\w*|[)\]])\.(\d+)', r'\1.gen(\2)', L)

# Use ^ for exponentiation and ^^ for xor

# (A side effect is that **** becomes xor as well.)

L = L.replace('^', '**').replace('****', '^')

# Make it easy to match statement ends

L = ';%s;' % L.replace('\n', ';\n;')

if do_time:

# Separate time statement

L = re.sub(r';(\s*)time +(\w)', r';time;\1\2', L)

# Construction with generators

# R.<...> = obj()

# R.<...> = R[]

L = preparse_generators(L)

# Calculus functions

# f(x,y) = x^3 - sin(y)

L = preparse_calculus(L)

# Backslash

L = re.sub(r'''\\\s*([^\t ;#])''', r' * BackslashOperator() * \1', L)

if do_time:

# Time keyword

L = re.sub(r';time;(\s*)(\S[^;]*)',

r';\1__time__=misc.cputime(); __wall__=misc.walltime(); \2; print(' +

'"Time: CPU %%.2f s, Wall: %%.2f s"%%(misc.cputime(__time__), misc.walltime(__wall__)))',

# Remove extra ;'s

L = L.replace(';\n;', '\n')[1:-1]

line = L % literals

return line

######################################################

## Apply the preparser to an entire file

######################################################

def preparse_file(contents, globals=None, numeric_literals=True):

"""

Preparses input, attending to numeric literals and load/attach

file directives.

.. note:: Temporarily, if @parallel is in the input, then

numeric_literals is always set to False.

INPUT:

- ``contents`` - a string

- ``globals`` - dict or None (default: None); if given, then

arguments to load/attach are evaluated in the namespace of this

dict.

- ``numeric_literals`` - bool (default: True), whether to factor

out wrapping of integers and floats, so they don't get created

repeatedly inside loops

OUTPUT:

- a string

TESTS::

sage: from sage.repl.preparse import preparse_file

sage: lots_of_numbers = "[%s]" % ", ".join(str(i) for i in range(3000))

sage: _ = preparse_file(lots_of_numbers)

sage: print(preparse_file("type(100r), type(100)"))

_sage_const_100 = Integer(100)

type(100 ), type(_sage_const_100 )

"""

if not isinstance(contents, six.string_types):

raise TypeError("contents must be a string")

if globals is None:

globals = {}

# This is a hack, since when we use @parallel to parallelize code,

# the numeric literals that are factored out do not get copied

# to the subprocesses properly. See trac #4545.

if '@parallel' in contents:

numeric_literals = False

if numeric_literals:

contents, literals, state = strip_string_literals(contents)

contents, nums = extract_numeric_literals(contents)

contents = contents % literals

if nums:

# Stick the assignments at the top, trying not to shift

# the lines down.

ix = contents.find('\n')

if ix == -1: ix = len(contents)

if not re.match(r"^ *(#.*)?$", contents[:ix]):

contents = "\n"+contents

assignments = ["%s = %s" % x for x in nums.items()]

# the preparser recurses on semicolons, so we only attempt

# to preserve line numbers if there are a few

if len(assignments) < 500:

contents = "; ".join(assignments) + contents

else:

contents = "\n".join(assignments) + "\n\n" + contents

# The list F contains the preparsed lines so far.

F = []

# A is the input, as a list of lines.

A = contents.splitlines()

# We are currently parsing the i-th input line.

i = 0

while i < len(A):

L = A[i]

do_preparse = True

for cmd in ['load', 'attach']:

if L.lstrip().startswith(cmd+' '):

j = L.find(cmd+' ')

s = L[j+len(cmd)+1:].strip()

if not s.startswith('('):

F.append(' '*j + load_wrap(s, cmd=='attach'))

do_preparse = False

continue

if do_preparse:

F.append(preparse(L, reset=(i==0), do_time=True, ignore_prompts=False,

numeric_literals=not numeric_literals))

i += 1

return '\n'.join(F)

def implicit_mul(code, level=5):

"""

Inserts \*'s to make implicit multiplication explicit.

INPUT:

- ``code`` -- a string; the code with missing \*'s

- ``level`` -- an integer (default: 5); how aggressive to be in

placing \*'s

- 0 - Do nothing

- 1 - Numeric followed by alphanumeric

- 2 - Closing parentheses followed by alphanumeric

- 3 - Spaces between alphanumeric

- 10 - Adjacent parentheses (may mangle call statements)

OUTPUT:

- a string

EXAMPLES::

sage: from sage.repl.preparse import implicit_mul

sage: implicit_mul('(2x^2-4x+3)a0')

'(2*x^2-4*x+3)*a0'

sage: implicit_mul('a b c in L')

'a*b*c in L'

sage: implicit_mul('1r + 1e3 + 5exp(2)')

'1r + 1e3 + 5*exp(2)'

sage: implicit_mul('f(a)(b)', level=10)

'f(a)*(b)'

"""

def re_no_keyword(pattern, code):

for _ in range(2): # do it twice in because matches don't overlap

for m in reversed(list(re.finditer(pattern, code))):

left, right = m.groups()

if left not in keywords and right not in keywords:

code = "%s%s*%s%s" % (code[:m.start()],

left,

right,

code[m.end():])

return code

code, literals, state = strip_string_literals(code)

if level >= 1:

no_mul_token = " '''_no_mult_token_''' "

code = re.sub(r'\b0x', r'0%sx' % no_mul_token, code) # hex digits

code = re.sub(r'( *)time ', r'\1time %s' % no_mul_token, code) # first word may be magic 'time'

code = re.sub(r'\b(\d+(?:\.\d+)?(?:e\d+)?)([rR]\b)', r'\1%s\2' % no_mul_token, code) # exclude such things as 10r

code = re.sub(r'\b(\d+(?:\.\d+)?)e([-\d])', r'\1%se%s\2' % (no_mul_token, no_mul_token), code) # exclude such things as 1e5

code = re_no_keyword(r'\b((?:\d+(?:\.\d+)?)|(?:%s[0-9eEpn]*\b)) *([a-zA-Z_(]\w*)\b' % numeric_literal_prefix, code)

if level >= 2:

code = re.sub(r'(\%$L\d+$)s', r'\1%ss%s' % (no_mul_token, no_mul_token), code) # literal strings

code = re_no_keyword(r'(\)) *(\w+)', code)

if level >= 3:

code = re_no_keyword(r'(\w+) +(\w+)', code)

if level >= 10:

code = re.sub(r'\) *\(', ')*(', code)

code = code.replace(no_mul_token, '')

return code % literals

def _strip_quotes(s):

"""

Strips one set of outer quotes.

INPUT:

- ``s`` - a string

OUTPUT:

- a string with any single and double quotes on either side of

``s`` removed

EXAMPLES:

Both types of quotes work::

sage: import sage.repl.preparse

sage: sage.repl.preparse._strip_quotes('"foo.sage"')

'foo.sage'

sage: sage.repl.preparse._strip_quotes("'foo.sage'")

'foo.sage'

The only thing that is stripped is at most one set of outer quotes::

sage: sage.repl.preparse._strip_quotes('""foo".sage""')

'"foo".sage"'

"""

if len(s) == 0:

return s

if s[0] in ["'", '"']:

s = s[1:]

if s[-1] in ["'", '"']:

s = s[:-1]

return s

def handle_encoding_declaration(contents, out):

r"""

Find a PEP 263-style Python encoding declaration in the first or

second line of ``contents``. If found, output it to ``out`` and return

``contents`` without the encoding line; otherwise output a default

UTF-8 declaration and return ``contents``.

EXAMPLES::

sage: from sage.repl.preparse import handle_encoding_declaration

sage: import sys

sage: c1='# -*- coding: latin-1 -*-\nimport os, sys\n...'

sage: c2='# -*- coding: iso-8859-15 -*-\nimport os, sys\n...'

sage: c3='# -*- coding: ascii -*-\nimport os, sys\n...'

sage: c4='import os, sys\n...'

sage: handle_encoding_declaration(c1, sys.stdout)

# -*- coding: latin-1 -*-

'import os, sys\n...'

sage: handle_encoding_declaration(c2, sys.stdout)

# -*- coding: iso-8859-15 -*-

'import os, sys\n...'

sage: handle_encoding_declaration(c3, sys.stdout)

# -*- coding: ascii -*-

'import os, sys\n...'

sage: handle_encoding_declaration(c4, sys.stdout)

# -*- coding: utf-8 -*-

'import os, sys\n...'

TESTS:

These are some of the tests listed in PEP 263::

sage: contents = '#!/usr/bin/python\n# -*- coding: latin-1 -*-\nimport os, sys'

sage: handle_encoding_declaration(contents, sys.stdout)

# -*- coding: latin-1 -*-

'#!/usr/bin/python\nimport os, sys'

sage: contents = '# This Python file uses the following encoding: utf-8\nimport os, sys'

sage: handle_encoding_declaration(contents, sys.stdout)

# This Python file uses the following encoding: utf-8

'import os, sys'

sage: contents = '#!/usr/local/bin/python\n# coding: latin-1\nimport os, sys'

sage: handle_encoding_declaration(contents, sys.stdout)

# coding: latin-1

'#!/usr/local/bin/python\nimport os, sys'

Two hash marks are okay; this shows up in SageTeX-generated scripts::

sage: contents = '## -*- coding: utf-8 -*-\nimport os, sys\nprint(x)'

sage: handle_encoding_declaration(contents, sys.stdout)

## -*- coding: utf-8 -*-

'import os, sys\nprint(x)'

When the encoding declaration doesn't match the specification, we

spit out a default UTF-8 encoding.

Incorrect coding line::

sage: contents = '#!/usr/local/bin/python\n# latin-1\nimport os, sys'

sage: handle_encoding_declaration(contents, sys.stdout)

# -*- coding: utf-8 -*-

'#!/usr/local/bin/python\n# latin-1\nimport os, sys'

Encoding declaration not on first or second line::

sage: contents ='#!/usr/local/bin/python\n#\n# -*- coding: latin-1 -*-\nimport os, sys'

sage: handle_encoding_declaration(contents, sys.stdout)

# -*- coding: utf-8 -*-

'#!/usr/local/bin/python\n#\n# -*- coding: latin-1 -*-\nimport os, sys'

We don't check for legal encoding names; that's Python's job::

sage: contents ='#!/usr/local/bin/python\n# -*- coding: utf-42 -*-\nimport os, sys'

sage: handle_encoding_declaration(contents, sys.stdout)

# -*- coding: utf-42 -*-

'#!/usr/local/bin/python\nimport os, sys'

.. NOTE::

- :pep:`263` says that Python will interpret a UTF-8

byte order mark as a declaration of UTF-8 encoding, but I don't

think we do that; this function only sees a Python string so it

can't account for a BOM.

- We default to UTF-8 encoding even though PEP 263 says that

Python files should default to ASCII.

- Also see https://docs.python.org/ref/encodings.html.

AUTHORS:

- Lars Fischer

- Dan Drake (2010-12-08, rewrite for :trac:`10440`)

"""

lines = contents.splitlines()

for num, line in enumerate(lines[:2]):

if re.search(r"coding[:=]\s*([-\w.]+)", line):

out.write(line + '\n')

return '\n'.join(lines[:num] + lines[(num+1):])

# If we didn't find any encoding hints, use utf-8. This is not in

# conformance with PEP 263, which says that Python files default to

# ascii encoding.

out.write("# -*- coding: utf-8 -*-\n")

return contents

def preparse_file_named_to_stream(name, out):

r"""

Preparse file named \code{name} (presumably a .sage file), outputting to

stream \code{out}.

"""

name = os.path.abspath(name)

contents = open(name).read()

contents = handle_encoding_declaration(contents, out)

parsed = preparse_file(contents)

out.write('#'*70+'\n')

out.write('# This file was *autogenerated* from the file %s.\n' % name)

out.write('#'*70+'\n')

out.write(parsed)

def preparse_file_named(name):

r"""

Preparse file named \code{name} (presumably a .sage file), outputting to a

temporary file. Returns name of temporary file.

"""

from sage.misc.temporary_file import tmp_filename

tmpfilename = tmp_filename(os.path.basename(name)) + '.py'

out = open(tmpfilename, 'w')

preparse_file_named_to_stream(name, out)

out.close()

return tmpfilename

Coverage for local/lib/python2.7/site-packages/sage/repl/preparse.py : 94%

384 statements 361 run 23 missing 0 excluded