python3.2  3.2.2
tokenize Namespace Reference


class  TokenInfo


def group
def any
def maybe


string __author__ = 'Ka-Ping Yee <>'
tuple __credits__
tuple cookie_re = re.compile("coding[:=]\s*([-\w.]+)")
list __all__
int NL = 1
int ENCODING = 2
string Whitespace = r'[ \f\t]*'
string Comment = r'#[^\r\n]*'
tuple Ignore = Whitespace+any(r'\\\r?\n' + Whitespace)
string Name = r'\w+'
string Hexnumber = r'0[xX][0-9a-fA-F]+'
string Binnumber = r'0[bB][01]+'
string Octnumber = r'0[oO][0-7]+'
string Decnumber = r'(?:0+|[1-9][0-9]*)'
tuple Intnumber = group(Hexnumber, Binnumber, Octnumber, Decnumber)
string Exponent = r'[eE][-+]?[0-9]+'
tuple Pointfloat = group(r'[0-9]+\.[0-9]*', r'\.[0-9]+')
string Expfloat = r'[0-9]+' + Exponent
tuple Floatnumber = group(Pointfloat, Expfloat)
tuple Imagnumber = group(r'[0-9]+[jJ]', Floatnumber + r'[jJ]')
tuple Number = group(Imagnumber, Floatnumber, Intnumber)
string Single = r"[^'\\]*(?:\\.[^'\\]*)*'"
string Double = r'[^"\\]*(?:\\.[^"\\]*)*"'
string Single3 = r"[^'\\]*(?:(?:\\.|'(?!''))[^'\\]*)*'''"
string Double3 = r'[^"\\]*(?:(?:\\.|"(?!""))[^"\\]*)*"""'

Detailed Description

Tokenization help for Python programs.

tokenize(readline) is a generator that breaks a stream of bytes into
Python tokens.  It decodes the bytes according to PEP-0263 for
determining source file encoding.

It accepts a readline-like method which is called repeatedly to get the
next line of input (or b"" for EOF).  It generates 5-tuples with these
members:

the token type (see token.py)
the token (a string)
the starting (row, column) indices of the token (a 2-tuple of ints)
the ending (row, column) indices of the token (a 2-tuple of ints)
the original line (string)

It is designed to match the working of the Python tokenizer exactly, except
that it produces COMMENT tokens for comments and gives type OP for all
operators.  Additionally, all token lists start with an ENCODING token
which tells you which encoding was used to decode the bytes stream.

Function Documentation

def tokenize.any (   choices)

def any(*choices): return group(*choices) + '*'
def tokenize.group (   choices)

def group(*choices): return '(' + '|'.join(choices) + ')'
def tokenize.maybe (   choices)

00058 def maybe(*choices): return group(*choices) + '?'
00060 # Note: we use unicode matching for names ("\w") but ascii matching for
# number literals.

list tokenize.__all__

Initial value:
00001 token.__all__+["COMMENT", "tokenize", "detect_encoding",
00002                            "NL", "untokenize", "ENCODING", "TokenInfo"]

string tokenize.__author__ = 'Ka-Ping Yee <>'

tuple tokenize.__credits__

Initial value:
00001 ('GvR, ESR, Tim Peters, Thomas Wouters, Fred Drake, '
00002                'Skip Montanaro, Raymond Hettinger, Trent Nelson, '
00003                'Michael Foord')

string tokenize.Binnumber = r'0[bB][01]+'

tuple tokenize.cookie_re = re.compile("coding[:=]\s*([-\w.]+)")

string tokenize.Decnumber = r'(?:0+|[1-9][0-9]*)'

string tokenize.Double = r'[^"\\]*(?:\\.[^"\\]*)*"'

string tokenize.Double3 = r'[^"\\]*(?:(?:\\.|"(?!""))[^"\\]*)*"""'

string tokenize.Exponent = r'[eE][-+]?[0-9]+'

string tokenize.Hexnumber = r'0[xX][0-9a-fA-F]+'

tuple tokenize.Ignore = Whitespace+any(r'\\\r?\n' + Whitespace)

tuple tokenize.Imagnumber = group(r'[0-9]+[jJ]', Floatnumber + r'[jJ]')

string tokenize.Octnumber = r'0[oO][0-7]+'

tuple tokenize.Pointfloat = group(r'[0-9]+\.[0-9]*', r'\.[0-9]+')

string tokenize.Single = r"[^'\\]*(?:\\.[^'\\]*)*'"

string tokenize.Single3 = r"[^'\\]*(?:(?:\\.|'(?!''))[^'\\]*)*'''"

string tokenize.Whitespace = r'[ \f\t]*'

