upstream/ipython Commit - r7388:4659fca1

1

# encoding: utf-8

1

# encoding: utf-8

2

"""

2

"""

3

Utilities for working with strings and text.

3

Utilities for working with strings and text.

4

"""

4

"""

5

6

#-----------------------------------------------------------------------------

6

#-----------------------------------------------------------------------------

7

8

#

8

#

9

# Distributed under the terms of the BSD License. The full license is in

9

# Distributed under the terms of the BSD License. The full license is in

10

# the file COPYING, distributed as part of this software.

10

# the file COPYING, distributed as part of this software.

11

#-----------------------------------------------------------------------------

11

#-----------------------------------------------------------------------------

12

13

#-----------------------------------------------------------------------------

13

#-----------------------------------------------------------------------------

14

# Imports

14

# Imports

15

#-----------------------------------------------------------------------------

15

#-----------------------------------------------------------------------------

16

17

import __main__

17

import __main__

18

19

import os

19

import os

20

import re

20

import re

21

import shutil

21

import shutil

22

import sys

22

import sys

23

import textwrap

23

import textwrap

24

from string import Formatter

24

from string import Formatter

25

26

from IPython.external.path import path

26

from IPython.external.path import path

27

from IPython.testing.skipdoctest import skip_doctest_py3

27

from IPython.testing.skipdoctest import skip_doctest_py3, skip_doctest

28

from IPython.utils import py3compat

28

from IPython.utils import py3compat

29

from IPython.utils.io import nlprint

29

from IPython.utils.io import nlprint

30

from IPython.utils.data import flatten

30

from IPython.utils.data import flatten

31

32

#-----------------------------------------------------------------------------

32

#-----------------------------------------------------------------------------

33

# Code

33

# Code

34

#-----------------------------------------------------------------------------

34

#-----------------------------------------------------------------------------

35

36

def unquote_ends(istr):
    """Remove a single pair of matching quotes from the endpoints of a string.

    Parameters
    ----------
    istr : str
        The string to unquote.  Falsy values (``''``, ``None``) are returned
        unchanged.

    Returns
    -------
    The string without its first and last character when both are the same
    quote character (``'`` or ``"``); otherwise the input itself.
    """
    # A *pair* of quotes needs at least two characters: a lone quote
    # character is its own first and last element and must not be stripped.
    if not istr or len(istr) < 2:
        return istr
    first, last = istr[0], istr[-1]
    if first == last and first in ('"', "'"):
        return istr[1:-1]
    return istr

46

47

48

class LSString(str):
    """String subclass exposing shell-friendly views of its value.

    Instances behave like ordinary strings and additionally offer:

        .l (or .list) : value as list (split on newlines).
        .n (or .nlstr): original value (the string itself).
        .s (or .spstr): value as whitespace-separated string.
        .p (or .paths): list of path objects

    Each derived view is computed on first access and then cached on the
    instance.

    This makes it convenient to hand command output back to the shell, which
    typically only understands whitespace-separated options for commands."""

    def get_list(self):
        """Return the lines of the string (split on ``'\\n'``), cached."""
        try:
            lines = self.__list
        except AttributeError:
            lines = self.__list = self.split('\n')
        return lines

    l = list = property(get_list)

    def get_spstr(self):
        """Return the string with every newline replaced by a space, cached."""
        try:
            joined = self.__spstr
        except AttributeError:
            joined = self.__spstr = self.replace('\n',' ')
        return joined

    s = spstr = property(get_spstr)

    def get_nlstr(self):
        """Return the string itself."""
        return self

    n = nlstr = property(get_nlstr)

    def get_paths(self):
        """Return path objects for the lines naming existing files, cached."""
        try:
            found = self.__paths
        except AttributeError:
            # Lines that do not exist on the filesystem are silently dropped.
            found = self.__paths = [path(entry) for entry in self.split('\n')
                                    if os.path.exists(entry)]
        return found

    p = paths = property(get_paths)

95

96

# FIXME: We need to reimplement type specific displayhook and then add this

96

# FIXME: We need to reimplement type specific displayhook and then add this

97

# back as a custom printer. This should also be moved outside utils into the

97

# back as a custom printer. This should also be moved outside utils into the

98

# core.

98

# core.

99

100

# def print_lsstring(arg):

100

# def print_lsstring(arg):

101

# """ Prettier (non-repr-like) and more informative printer for LSString """

101

# """ Prettier (non-repr-like) and more informative printer for LSString """

102

# print "LSString (.p, .n, .l, .s available). Value:"

102

# print "LSString (.p, .n, .l, .s available). Value:"

103

# print arg

103

# print arg

104

#

104

#

105

#

105

#

106

# print_lsstring = result_display.when_type(LSString)(print_lsstring)

106

# print_lsstring = result_display.when_type(LSString)(print_lsstring)

107

108

109

class SList(list):
    """List derivative with special access attributes.

    These are normal lists, but with the special attributes:

        .l (or .list) : value as list (the list itself).
        .n (or .nlstr): value as a string, joined on newlines.
        .s (or .spstr): value as a string, joined on spaces.
        .p (or .paths): list of path objects

    Any values which require transformations are computed only once and
    cached.  Note that the cache is not invalidated when the list is mutated
    afterwards."""

    def get_list(self):
        """Return the list itself."""
        return self

    l = list = property(get_list)

    def get_spstr(self):
        """Return the items joined on single spaces (cached)."""
        try:
            return self.__spstr
        except AttributeError:
            self.__spstr = ' '.join(self)
            return self.__spstr

    s = spstr = property(get_spstr)

    def get_nlstr(self):
        """Return the items joined on newlines (cached)."""
        try:
            return self.__nlstr
        except AttributeError:
            self.__nlstr = '\n'.join(self)
            return self.__nlstr

    n = nlstr = property(get_nlstr)

    def get_paths(self):
        """Return path objects for the items naming existing files (cached)."""
        try:
            return self.__paths
        except AttributeError:
            self.__paths = [path(p) for p in self if os.path.exists(p)]
            return self.__paths

    p = paths = property(get_paths)

    def grep(self, pattern, prune = False, field = None):
        """ Return all strings matching 'pattern' (a regex or callable)

        This is case-insensitive. If prune is true, return all items
        NOT matching the pattern.

        If field is specified, the match must occur in the specified
        whitespace-separated field.

        Examples::

            a.grep( lambda x: x.startswith('C') )
            a.grep('Cha.*log', prune=1)
            a.grep('chm', field=-1)
        """
        # `basestring` only exists on Python 2; fall back to `str` so the
        # method also works on Python 3 without a 2to3 pass.
        try:
            string_types = basestring
        except NameError:
            string_types = str

        def match_target(s):
            # Whole line when no field is requested, otherwise the selected
            # whitespace-separated field ("" when the line is too short).
            if field is None:
                return s
            parts = s.split()
            try:
                return parts[field]
            except IndexError:
                return ""

        if isinstance(pattern, string_types):
            pred = lambda x : re.search(pattern, x, re.IGNORECASE)
        else:
            pred = pattern
        if not prune:
            return SList([el for el in self if pred(match_target(el))])
        else:
            return SList([el for el in self if not pred(match_target(el))])

    def fields(self, *fields):
        """ Collect whitespace-separated fields from string list

        Allows quick awk-like usage of string lists.

        Example data (in var a, created by 'a = !ls -l')::

            -rwxrwxrwx  1 ville None      18 Dec 14  2006 ChangeLog
            drwxrwxrwx+ 6 ville None       0 Oct 24 18:05 IPython

        a.fields(0) is ['-rwxrwxrwx', 'drwxrwxrwx+']
        a.fields(1,0) is ['1 -rwxrwxrwx', '6 drwxrwxrwx+']
        (note the joining by space).
        a.fields(-1) is ['ChangeLog', 'IPython']

        IndexErrors are ignored.

        Without args, fields() just split()'s the strings.
        """
        if len(fields) == 0:
            return [el.split() for el in self]

        res = SList()
        for el in [f.split() for f in self]:
            lineparts = []

            for fd in fields:
                try:
                    lineparts.append(el[fd])
                except IndexError:
                    pass
            # Lines that yielded none of the requested fields are dropped.
            if lineparts:
                res.append(" ".join(lineparts))

        return res

    def sort(self,field= None, nums = False):
        """ sort by specified fields (see fields())

        Returns a new sorted SList; the list itself is not modified.

        Example::

            a.sort(1, nums = True)

        Sorts a by second field, in numerical order (so that 21 > 3)

        """

        #decorate, sort, undecorate
        if field is not None:
            dsu = [[SList([line]).fields(field), line] for line in self]
        else:
            dsu = [[line, line] for line in self]
        if nums:
            for pair in dsu:
                # Keep only the digit items of the key; a key without any
                # digits sorts as 0.
                numstr = "".join([ch for ch in pair[0] if ch.isdigit()])
                try:
                    pair[0] = int(numstr)
                except ValueError:
                    pair[0] = 0

        dsu.sort()
        return SList([t[1] for t in dsu])

251

252

253

# FIXME: We need to reimplement type specific displayhook and then add this

253

# FIXME: We need to reimplement type specific displayhook and then add this

254

# back as a custom printer. This should also be moved outside utils into the

254

# back as a custom printer. This should also be moved outside utils into the

255

# core.

255

# core.

256

257

# def print_slist(arg):

257

# def print_slist(arg):

258

# """ Prettier (non-repr-like) and more informative printer for SList """

258

# """ Prettier (non-repr-like) and more informative printer for SList """

259

# print "SList (.p, .n, .l, .s, .grep(), .fields(), sort() available):"

259

# print "SList (.p, .n, .l, .s, .grep(), .fields(), sort() available):"

260

# if hasattr(arg, 'hideonce') and arg.hideonce:

260

# if hasattr(arg, 'hideonce') and arg.hideonce:

261

# arg.hideonce = False

261

# arg.hideonce = False

262

# return

262

# return

263

#

263

#

264

# nlprint(arg)

264

# nlprint(arg)

265

#

265

#

266

# print_slist = result_display.when_type(SList)(print_slist)

266

# print_slist = result_display.when_type(SList)(print_slist)

267

268

269

def esc_quotes(strng):
    """Return `strng` with every single and double quote backslash-escaped."""
    # Double quotes first, then single quotes; neither pass touches the
    # backslashes inserted by the other.
    doubles_escaped = strng.replace('"','\\"')
    fully_escaped = doubles_escaped.replace("'","\\'")
    return fully_escaped

273

274

275

def qw(words,flat=0,sep=None,maxsplit=-1):
    """Similar to Perl's qw() operator, but with some more options.

    qw(words,flat=0,sep=None,maxsplit=-1) -> words.split(sep,maxsplit)

    words can also be a list itself, and with flat=1, the output will be
    recursively flattened.  `sep` and `maxsplit` are applied to every string
    found, at any nesting depth.

    Each resulting word is stripped of surrounding whitespace, and empty or
    whitespace-only words are dropped.

    Examples:

    >>> qw('1 2')
    ['1', '2']

    >>> qw(['a b','1 2',['m n','p q']])
    [['a', 'b'], ['1', '2'], [['m', 'n'], ['p', 'q']]]

    >>> qw(['a b','1 2',['m n','p q']],flat=1)
    ['a', 'b', '1', '2', 'm', 'n', 'p', 'q']
    """
    # `basestring` only exists on Python 2; fall back to `str` on Python 3.
    try:
        string_types = basestring
    except NameError:
        string_types = str

    if isinstance(words, string_types):
        return [word.strip() for word in words.split(sep,maxsplit)
                if word and not word.isspace() ]

    # Build a real list (map() is lazy on Python 3) and forward the split
    # options so nested strings are split the same way as top-level ones.
    nested = [qw(item, flat, sep, maxsplit) for item in words]
    if flat:
        # Children are already flat, so one level of flattening is enough.
        return flatten(nested)
    return nested

301

302

303

def qwflat(words,sep=None,maxsplit=-1):
    """Shorthand for qw(words) with flat mode switched on."""
    return qw(words, flat=1, sep=sep, maxsplit=maxsplit)

306

307

308

def qw_lol(indata):
    """qw_lol('a b') -> [['a','b']],
    otherwise it's just a call to qw().

    We need this to make sure the modules_some keys *always* end up as a
    list of lists."""
    # `basestring` only exists on Python 2; fall back to `str` on Python 3.
    try:
        string_types = basestring
    except NameError:
        string_types = str

    if isinstance(indata, string_types):
        # A bare string yields a single word list; wrap it so the result is
        # still a list of lists.
        return [qw(indata)]
    else:
        return qw(indata)

319

320

321

def grep(pat,list,case=1):
    """Simple minded grep-like function.

    grep(pat,list) returns the items of list that contain pat as a plain
    substring, or None when nothing matches.

    No regexp support is provided. Pass case=0 to ignore case when
    matching."""

    # The result is a new list referencing the matching items.
    if case:
        hits = [item for item in list if item.find(pat) >= 0]
    else:
        needle = pat.lower()
        hits = [item for item in list if item.lower().find(needle) >= 0]

    # An empty result is reported as None rather than [].
    return hits or None

341

342

343

def dgrep(pat,*opts):
    """Run grep() over the names in __main__ and in its __builtins__.

    Extra positional arguments are passed through to grep().
    A very common use of grep() when working interactively."""

    candidates = dir(__main__) + dir(__main__.__builtins__)
    return grep(pat, candidates, *opts)

349

350

351

def idgrep(pat):
    """dgrep() with case-insensitive matching."""

    case_sensitive = 0
    return dgrep(pat, case_sensitive)

355

356

357

def igrep(pat,list):
    """Case-insensitive variant of grep()."""

    matches = grep(pat, list, case=0)
    return matches

361

362

363

def indent(instr,nspaces=4, ntabs=0, flatten=False):
    """Indent a string a given number of spaces or tabstops.

    indent(str,nspaces=4,ntabs=0) -> indent str by ntabs+nspaces.

    Parameters
    ----------

    instr : basestring
        The string to be indented.
    nspaces : int (default: 4)
        The number of spaces to be indented.
    ntabs : int (default: 0)
        The number of tabs to be indented.
    flatten : bool (default: False)
        Whether to scrub existing indentation.  If True, all lines will be
        aligned to the same indentation.  If False, existing indentation will
        be strictly increased.

    Returns
    -------

    str|unicode : string indented by ntabs and nspaces, or None when `instr`
    is None.

    """
    if instr is None:
        return
    ind = '\t'*ntabs+' '*nspaces
    if flatten:
        # NOTE(review): \s also matches newlines, so leading blank lines of a
        # run are absorbed into the match - confirm this is intended.
        pat = re.compile(r'^\s*', re.MULTILINE)
    else:
        pat = re.compile(r'^', re.MULTILINE)
    outstr = re.sub(pat, ind, instr)
    # '^' also matches after a trailing newline, which leaves a dangling
    # indent at the very end; drop it.  In-memory text uses '\n' regardless
    # of platform, and an empty indent must be skipped because
    # outstr[:-0] would be the empty string.
    if ind and outstr.endswith('\n' + ind):
        return outstr[:-len(ind)]
    return outstr

400

401

def native_line_ends(filename,backup=1):
    """Convert (in-place) a file to line-ends native to the current OS.

    The file is processed as raw bytes: it is split on ``\\n``, ``\\r`` and
    ``\\r\\n`` and rewritten with ``os.linesep``, always ending in a line
    terminator.

    A backup copy (suffix ``~`` on posix, ``.bak`` elsewhere) is made before
    rewriting.  If the optional backup argument is given as false, no backup
    of the original file is left.

    If rewriting fails, the backup is moved back over the file and the error
    is suppressed (best effort); only non-Exception interrupts such as
    KeyboardInterrupt are re-raised after the restore."""

    backup_suffixes = {'posix':'~','dos':'.bak','nt':'.bak','mac':'.bak'}

    # Unknown platforms fall back to '.bak' instead of raising KeyError.
    bak_filename = filename + backup_suffixes.get(os.name, '.bak')

    # Work on bytes so the same code runs on Python 2 and 3 and no decoding
    # of the file content is needed; close the handle deterministically.
    with open(filename, 'rb') as src:
        original = src.read()
    shutil.copy2(filename,bak_filename)

    eol = os.linesep.encode('ascii')
    try:
        with open(filename,'wb') as new:
            new.write(eol.join(original.splitlines()))
            new.write(eol) # ALWAYS put an eol at the end of the file
    except BaseException as err:
        # Put the untouched copy back whatever went wrong.
        os.rename(bak_filename,filename)
        if not isinstance(err, Exception):
            raise
    if not backup:
        try:
            os.remove(bak_filename)
        except OSError:
            # Nothing to remove, e.g. the backup was just renamed back.
            pass

425

426

427

def list_strings(arg):
    """Always return a list of strings, given a string or list of strings
    as input.

    A single string is wrapped in a new one-element list; any other argument
    is returned unchanged.

    :Examples:

        In [7]: list_strings('A single string')
        Out[7]: ['A single string']

        In [8]: list_strings(['A single string in a list'])
        Out[8]: ['A single string in a list']

        In [9]: list_strings(['A','list','of','strings'])
        Out[9]: ['A', 'list', 'of', 'strings']
    """
    # `basestring` only exists on Python 2; fall back to `str` on Python 3.
    try:
        string_types = basestring
    except NameError:
        string_types = str

    if isinstance(arg, string_types):
        return [arg]
    return arg

445

446

447

def marquee(txt='',width=78,mark='*'):
    """Return the input string centered in a 'marquee'.

    With empty `txt` the result is `mark` repeated and cut to exactly `width`
    characters.  Otherwise `txt` is framed by a space and an equal run of
    `mark` on each side; text too long for `width` gets no marks at all.

    :Examples:

        In [16]: marquee('A test',40)
        Out[16]: '**************** A test ****************'

        In [17]: marquee('A test',40,'-')
        Out[17]: '---------------- A test ----------------'

        In [18]: marquee('A test',40,' ')
        Out[18]: '                 A test                 '

    """
    if txt:
        # Room left after the text and its two padding spaces, expressed in
        # whole marks and split evenly over both sides (never negative).
        per_side = max((width-len(txt)-2)//len(mark)//2, 0)
        border = mark*per_side
        return '%s %s %s' % (border,txt,border)
    return (mark*width)[:width]

468

469

470

# Leading run of whitespace at the very start of a string.
ini_spaces_re = re.compile(r'^(\s+)')

def num_ini_spaces(strng):
    """Return the number of leading whitespace characters in a string.

    Any character matched by ``\\s`` counts (spaces, tabs, newlines, ...)."""

    leading = ini_spaces_re.match(strng)
    return leading.end() if leading else 0

480

481

482

def format_screen(strng):
    """Format a string for screen printing.

    Strips the latex-style paragraph-continuation marker: a backslash that
    is the last character of a line."""
    # Paragraph continue
    line_end_backslash = re.compile(r'\\$',re.MULTILINE)
    return line_end_backslash.sub('',strng)

490

491

def dedent(text):
    """Equivalent of textwrap.dedent that ignores unindented first line.

    This means it will still dedent strings like:
    '''foo
        is a bar
    '''

    For use in wrap_paragraphs.
    """
    first, newline, rest = text.partition('\n')

    # Either the text opens with a blank line (so the first line must not be
    # treated specially) or it is a single line: plain dedent handles both.
    if first == '' or not newline:
        return textwrap.dedent(text)

    # Leave the first line alone and dedent only what follows it.
    return first + '\n' + textwrap.dedent(rest)

516

517

def wrap_paragraphs(text, ncols=80):
    """Wrap multiple paragraphs to fit a specified width.

    Works like textwrap.wrap, except that the text may hold several
    paragraphs separated by empty lines.  The text is dedented and stripped
    first.

    Returns
    -------

    list of complete paragraphs, wrapped to fill `ncols` columns.
    """
    separator = re.compile(r'\n(\s*\n)+', re.MULTILINE)
    has_indent = re.compile(r'\n\s+', re.MULTILINE).search

    # The pattern has one capture group, so split() interleaves the captured
    # whitespace with the paragraphs; keep every other entry.
    chunks = separator.split(dedent(text).strip())[::2]

    # Indentation that survives dedent is presumed to be meaningful
    # formatting, so only flush paragraphs are re-filled.
    return [chunk if has_indent(chunk) is not None
            else textwrap.fill(chunk, ncols)
            for chunk in chunks]

541

542

543

class EvalFormatter(Formatter):
    """A String Formatter that allows evaluation of simple expressions.

    Every replacement field is evaluated as a Python expression, with the
    keyword arguments of the format call as its namespace.

    Note that this version interprets a : as specifying a format string (as per
    standard string formatting), so if slicing is required, you must explicitly
    create a slice.

    This is to be used in templating cases, such as the parallel batch
    script templates, where simple arithmetic on arguments is useful.

    Examples
    --------

    In [1]: f = EvalFormatter()
    In [2]: f.format('{n//4}', n=8)
    Out [2]: '2'

    In [3]: f.format("{greeting[slice(2,4)]}", greeting="Hello")
    Out [3]: 'll'
    """
    def get_field(self, name, args, kwargs):
        # NOTE(review): eval() runs arbitrary code from the template, so
        # format strings must come from a trusted source.  Positional `args`
        # are not consulted; only `kwargs` serves as the namespace.
        return eval(name, kwargs), name

566

567

@skip_doctest_py3

567

@skip_doctest_py3

568

class FullEvalFormatter(Formatter):

568

class FullEvalFormatter(Formatter):

569

"""A String Formatter that allows evaluation of simple expressions.

569

"""A String Formatter that allows evaluation of simple expressions.

570

571

Any time a format key is not found in the kwargs,

571

Any time a format key is not found in the kwargs,

572

it will be tried as an expression in the kwargs namespace.

572

it will be tried as an expression in the kwargs namespace.

573

574

Note that this version allows slicing using [1:2], so you cannot specify

574

Note that this version allows slicing using [1:2], so you cannot specify

575

a format string. Use :class:`EvalFormatter` to permit format strings.

575

a format string. Use :class:`EvalFormatter` to permit format strings.

576

577

Examples

577

Examples

578

--------

578

--------

579

580

In [1]: f = FullEvalFormatter()

580

In [1]: f = FullEvalFormatter()

581

In [2]: f.format('{n//4}', n=8)

581

In [2]: f.format('{n//4}', n=8)

582

Out[2]: u'2'

582

Out[2]: u'2'

583

584

In [3]: f.format('{list(range(5))[2:4]}')

584

In [3]: f.format('{list(range(5))[2:4]}')

585

Out[3]: u'[2, 3]'

585

Out[3]: u'[2, 3]'

586

587

In [4]: f.format('{3*2}')

587

In [4]: f.format('{3*2}')

588

Out[4]: u'6'

588

Out[4]: u'6'

589

"""

589

"""

590

# copied from Formatter._vformat with minor changes to allow eval

590

# copied from Formatter._vformat with minor changes to allow eval

591

# and replace the format_spec code with slicing

591

# and replace the format_spec code with slicing

592

def _vformat(self, format_string, args, kwargs, used_args, recursion_depth):

592

def _vformat(self, format_string, args, kwargs, used_args, recursion_depth):

593

if recursion_depth < 0:

593

if recursion_depth < 0:

594

raise ValueError('Max string recursion exceeded')

594

raise ValueError('Max string recursion exceeded')

595

result = []

595

result = []

596

for literal_text, field_name, format_spec, conversion in \

596

for literal_text, field_name, format_spec, conversion in \

597

self.parse(format_string):

597

self.parse(format_string):

598

599

# output the literal text

599

# output the literal text

600

if literal_text:

600

if literal_text:

601

result.append(literal_text)

601

result.append(literal_text)

602

603

# if there's a field, output it

603

# if there's a field, output it

604

if field_name is not None:

604

if field_name is not None:

605

# this is some markup, find the object and do

605

# this is some markup, find the object and do

606

# the formatting

606

# the formatting

607

608

if format_spec:

608

if format_spec:

609

# override format spec, to allow slicing:

609

# override format spec, to allow slicing:

610

field_name = ':'.join([field_name, format_spec])

610

field_name = ':'.join([field_name, format_spec])

611

612

# eval the contents of the field for the object

612

# eval the contents of the field for the object

613

# to be formatted

613

# to be formatted

614

obj = eval(field_name, kwargs)

614

obj = eval(field_name, kwargs)

615

616

# do any conversion on the resulting object

616

# do any conversion on the resulting object

617

obj = self.convert_field(obj, conversion)

617

obj = self.convert_field(obj, conversion)

618

619

# format the object and append to the result

619

# format the object and append to the result

620

result.append(self.format_field(obj, ''))

620

result.append(self.format_field(obj, ''))

621

622

return u''.join(py3compat.cast_unicode(s) for s in result)

622

return u''.join(py3compat.cast_unicode(s) for s in result)

623

624

@skip_doctest_py3

624

@skip_doctest_py3

625

class DollarFormatter(FullEvalFormatter):

625

class DollarFormatter(FullEvalFormatter):

626

"""Formatter allowing Itpl style $foo replacement, for names and attribute

626

"""Formatter allowing Itpl style $foo replacement, for names and attribute

627

access only. Standard {foo} replacement also works, and allows full

627

access only. Standard {foo} replacement also works, and allows full

628

evaluation of its arguments.

628

evaluation of its arguments.

629

630

Examples

630

Examples

631

--------

631

--------

632

In [1]: f = DollarFormatter()

632

In [1]: f = DollarFormatter()

633

In [2]: f.format('{n//4}', n=8)

633

In [2]: f.format('{n//4}', n=8)

634

Out[2]: u'2'

634

Out[2]: u'2'

635

636

In [3]: f.format('23 * 76 is $result', result=23*76)

636

In [3]: f.format('23 * 76 is $result', result=23*76)

637

Out[3]: u'23 * 76 is 1748'

637

Out[3]: u'23 * 76 is 1748'

638

639

In [4]: f.format('$a or {b}', a=1, b=2)

639

In [4]: f.format('$a or {b}', a=1, b=2)

640

Out[4]: u'1 or 2'

640

Out[4]: u'1 or 2'

641

"""

641

"""

642

_dollar_pattern = re.compile("(.*?)\$(\$?[\w\.]+)")

642

_dollar_pattern = re.compile("(.*?)\$(\$?[\w\.]+)")

643

def parse(self, fmt_string):

643

def parse(self, fmt_string):

644

for literal_txt, field_name, format_spec, conversion \

644

for literal_txt, field_name, format_spec, conversion \

645

in Formatter.parse(self, fmt_string):

645

in Formatter.parse(self, fmt_string):

646

647

# Find $foo patterns in the literal text.

647

# Find $foo patterns in the literal text.

648

continue_from = 0

648

continue_from = 0

649

txt = ""

649

txt = ""

650

for m in self._dollar_pattern.finditer(literal_txt):

650

for m in self._dollar_pattern.finditer(literal_txt):

651

new_txt, new_field = m.group(1,2)

651

new_txt, new_field = m.group(1,2)

652

# $$foo --> $foo

652

# $$foo --> $foo

653

if new_field.startswith("$"):

653

if new_field.startswith("$"):

654

txt += new_txt + new_field

654

txt += new_txt + new_field

655

else:

655

else:

656

yield (txt + new_txt, new_field, "", None)

656

yield (txt + new_txt, new_field, "", None)

657

txt = ""

657

txt = ""

658

continue_from = m.end()

658

continue_from = m.end()

659

660

# Re-yield the {foo} style pattern

660

# Re-yield the {foo} style pattern

661

yield (txt + literal_txt[continue_from:], field_name, format_spec, conversion)

661

yield (txt + literal_txt[continue_from:], field_name, format_spec, conversion)

662

663

#-----------------------------------------------------------------------------

663

#-----------------------------------------------------------------------------

664

# Utils to columnize a list of string

664

# Utils to columnize a list of string

665

#-----------------------------------------------------------------------------

665

#-----------------------------------------------------------------------------

666

def _chunks(l, n):

666

def _chunks(l, n):

667

"""Yield successive n-sized chunks from l."""

667

"""Yield successive n-sized chunks from l."""

668

for i in xrange(0, len(l), n):

668

for i in xrange(0, len(l), n):

669

yield l[i:i+n]

669

yield l[i:i+n]

670

671

def _find_optimal(rlist , sepsize=2 , displaywidth=80):

671

def _find_optimal(rlist , separator_size=2 , displaywidth=80):

672

"""Calculate optimal info to columnize a list of string"""

672

"""Calculate optimal info to columnize a list of string"""

673

for nrow in range(1, len(rlist)+1) :

673

for nrow in range(1, len(rlist)+1) :

674

chk = [max(l) for l in _chunks(rlist, nrow) ]

674

chk = map(max,_chunks(rlist, nrow))

675

sumlength = sum(chk)

675

sumlength = sum(chk)

676

ncols = len(chk)

676

ncols = len(chk)

677

if sumlength+sepsize*(ncols-1) <= displaywidth :

677

if sumlength+separator_size*(ncols-1) <= displaywidth :

678

break;

678

break;

679

return {'columns_numbers' : ncols,

679

return {'columns_numbers' : ncols,

680

'optimal_separator_width':(displaywidth - sumlength)/(ncols-1) if (ncols -1) else 0,

680

'optimal_separator_width':(displaywidth - sumlength)/(ncols-1) if (ncols -1) else 0,

681

'rows_numbers' : nrow,

681

'rows_numbers' : nrow,

682

'columns_width' : chk

682

'columns_width' : chk

683

}

683

}

684

685

def _get_or_default(mylist, i, default=None):

685

def _get_or_default(mylist, i, default=None):

686

"""return list item number, or default if don't exist"""

686

"""return list item number, or default if don't exist"""

687

if i >= len(mylist):

687

if i >= len(mylist):

688

return default

688

return default

689

else :

689

else :

690

return mylist[i]

690

return mylist[i]

691

692

@skip_doctest

692

def compute_item_matrix(items, *args, **kwargs) :

693

def compute_item_matrix(items, *args, **kwargs) :

693

""" Transform a list of strings into a nested list to columnize

694

"""Returns a nested list, and info to columnize items

695

696

Parameters :

697

------------

698

699

items :

700

list of strings to columnize

701

separator_size : int (default=2)

702

How many characters will be used as a separation between columns.

703

displaywidth : int (default=80)

704

The width of the area into which the columns should fit

705

706

Returns :

707

---------

694

708

695

Returns a tuple of (strings_matrix, dict_info)

709

Returns a tuple of (strings_matrix, dict_info)

696

710

697

innermost lists are rows, see columnize for options info

711

strings_matrix :

712

713

nested list of strings, the outermost list contains as many lists as

714

rows, the innermost lists have each as many elements as columns. If the

715

total number of elements in `items` does not equal the product of

716

rows*columns, the last elements of some lists are filled with `None`.

717

718

dict_info :

719

some info to make columnize easier:

720

721

columns_numbers : number of columns

722

rows_numbers : number of rows

723

columns_width : list of the width of each column

724

optimal_separator_width : best separator width between columns

725

726

Example :

727

---------

728

729

In [1]: l = ['aaa','b','cc','d','eeeee','f','g','h','i','j','k','l']

730

...: compute_item_matrix(l,displaywidth=12)

731

Out[1]:

732

([['aaa', 'f', 'k'],

733

['b', 'g', 'l'],

734

['cc', 'h', None],

735

['d', 'i', None],

736

['eeeee', 'j', None]],

737

{'columns_numbers': 3,

738

'columns_width': [5, 1, 1],

739

'optimal_separator_width': 2,

740

'rows_numbers': 5})

741

698

"""

742

"""

699

info = _find_optimal(map(len, items), *args, **kwargs)

743

info = _find_optimal(map(len, items), *args, **kwargs)

700

nrow, ncol = info['rows_numbers'], info['columns_numbers']

744

nrow, ncol = info['rows_numbers'], info['columns_numbers']

701

return ([[ _get_or_default(items, c*nrow+i) for c in range(ncol) ] for i in range(nrow) ], info)

745

return ([[ _get_or_default(items, c*nrow+i) for c in range(ncol) ] for i in range(nrow) ], info)

702

746

703

def columnize(items, separator=' ', displaywidth=80):

747

def columnize(items, separator=' ', displaywidth=80):

704

""" Transform a list of strings into a single string with columns.

748

""" Transform a list of strings into a single string with columns.

705

749

706

Parameters

750

Parameters

707

----------

751

----------

708

items : sequence of strings

752

items : sequence of strings

709

The strings to process.

753

The strings to process.

710

754

711

separator : str, optional [default is two spaces]

755

separator : str, optional [default is two spaces]

712

The string that separates columns.

756

The string that separates columns.

713

757

714

displaywidth : int, optional [default is 80]

758

displaywidth : int, optional [default is 80]

715

Width of the display in number of characters.

759

Width of the display in number of characters.

716

760

717

Returns

761

Returns

718

-------

762

-------

719

The formatted string.

763

The formatted string.

720

"""

764

"""

721

if not items :

765

if not items :

722

return '\n'

766

return '\n'

723

matrix, info = compute_item_matrix(items, sepsize=len(separator), displaywidth=displaywidth)

767

matrix, info = compute_item_matrix(items, separator_size=len(separator), displaywidth=displaywidth)

724

#sep = ' '*min(info['optimal_separator_width'], 9)

725

fmatrix = matrix

726

fmatrix = [filter(None, x) for x in matrix]

768

fmatrix = [filter(None, x) for x in matrix]

727

sjoin = lambda x : separator.join([ y.ljust(w, ' ') for y, w in zip(x, info['columns_width'])])

769

sjoin = lambda x : separator.join([ y.ljust(w, ' ') for y, w in zip(x, info['columns_width'])])

728

return '\n'.join(map(sjoin, fmatrix))+'\n'

770

return '\n'.join(map(sjoin, fmatrix))+'\n'

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # encoding: utf-8
             """
             Utilities for working with strings and text.
             """
             #-----------------------------------------------------------------------------
             #  Copyright (C) 2008-2011  The IPython Development Team
             #
             #  Distributed under the terms of the BSD License.  The full license is in
             #  the file COPYING, distributed as part of this software.
             #-----------------------------------------------------------------------------
             #-----------------------------------------------------------------------------
             # Imports
             #-----------------------------------------------------------------------------
             import __main__
             import os
             import re
             import shutil
             import sys
             import textwrap
             from string import Formatter
             from IPython.external.path import path
-            from IPython.testing.skipdoctest import skip_doctest_py3
+            from IPython.testing.skipdoctest import skip_doctest_py3, skip_doctest
             from IPython.utils import py3compat
             from IPython.utils.io import nlprint
             from IPython.utils.data import flatten
             #-----------------------------------------------------------------------------
             # Code
             #-----------------------------------------------------------------------------
             def unquote_ends(istr):
                 """Remove a single pair of matching quotes from the endpoints of a string.
                 Parameters
                 ----------
                 istr : str
                     The string to process.  Falsy values (e.g. ``''``) are returned
                     unchanged.
                 Returns
                 -------
                 ``istr`` without its first and last characters when both are the same
                 quote character (``'`` or ``"``); otherwise ``istr`` itself.
                 """
                 if not istr:
                     return istr
                 # A lone quote character is not a *pair*: require at least two characters
                 # so that "'" is returned untouched instead of collapsing to ''.
                 if len(istr) >= 2 and istr[0] == istr[-1] and istr[0] in ("'", '"'):
                     return istr[1:-1]
                 return istr
             class LSString(str):
                 """A ``str`` subclass exposing a few derived views as attributes.
                 Instances behave like ordinary strings and additionally offer:
                     .l (or .list) : the value split on newlines, as a list.
                     .n (or .nlstr): the original value (the string itself).
                     .s (or .spstr): the value with newlines replaced by spaces.
                     .p (or .paths): list of path objects, one per line that names an
                                     existing filesystem entry.
                 Each derived view is computed on first access and then cached on the
                 instance.
                 Such strings are handy when talking to the shell, which typically only
                 understands whitespace-separated options for commands."""
                 def get_list(self):
                     # Lazily compute and cache the newline-split view.
                     try:
                         lines = self.__list
                     except AttributeError:
                         lines = self.__list = self.split('\n')
                     return lines
                 list = property(get_list)
                 l = list
                 def get_spstr(self):
                     # Lazily compute and cache the space-joined view.
                     try:
                         spaced = self.__spstr
                     except AttributeError:
                         spaced = self.__spstr = self.replace('\n',' ')
                     return spaced
                 spstr = property(get_spstr)
                 s = spstr
                 def get_nlstr(self):
                     # The string already is the newline-separated form.
                     return self
                 nlstr = property(get_nlstr)
                 n = nlstr
                 def get_paths(self):
                     # Only lines for which os.path.exists() is true are kept.
                     try:
                         found = self.__paths
                     except AttributeError:
                         found = [path(p) for p in self.split('\n') if os.path.exists(p)]
                         self.__paths = found
                     return found
                 paths = property(get_paths)
                 p = paths
             # FIXME: We need to reimplement type specific displayhook and then add this
             # back as a custom printer. This should also be moved outside utils into the
             # core.
             # def print_lsstring(arg):
             #     """ Prettier (non-repr-like) and more informative printer for LSString """
             #     print "LSString (.p, .n, .l, .s available). Value:"
             #     print arg
             #
             #
             # print_lsstring = result_display.when_type(LSString)(print_lsstring)
             class SList(list):
                 """A ``list`` subclass exposing a few derived views as attributes.
                 Instances behave like ordinary lists and additionally offer:
                     .l (or .list) : value as list (the list itself).
                     .n (or .nlstr): value as a string, joined on newlines.
                     .s (or .spstr): value as a string, joined on spaces.
                     .p (or .paths): list of path objects
                 Each derived view is computed on first access and then cached on the
                 instance."""
                 def get_list(self):
                     return self
                 list = property(get_list)
                 l = list
                 def get_spstr(self):
                     # Lazily compute and cache the space-joined view.
                     try:
                         joined = self.__spstr
                     except AttributeError:
                         joined = self.__spstr = ' '.join(self)
                     return joined
                 spstr = property(get_spstr)
                 s = spstr
                 def get_nlstr(self):
                     # Lazily compute and cache the newline-joined view.
                     try:
                         joined = self.__nlstr
                     except AttributeError:
                         joined = self.__nlstr = '\n'.join(self)
                     return joined
                 nlstr = property(get_nlstr)
                 n = nlstr
                 def get_paths(self):
                     # Only items for which os.path.exists() is true are kept.
                     try:
                         found = self.__paths
                     except AttributeError:
                         found = [path(p) for p in self if os.path.exists(p)]
                         self.__paths = found
                     return found
                 paths = property(get_paths)
                 p = paths
                 def grep(self, pattern, prune = False, field = None):
                     """ Return all strings matching 'pattern' (a regex or callable)
                     String patterns are searched case-insensitively. If prune is true,
                     return all items NOT matching the pattern.
                     If field is specified, the match must occur in the specified
                     whitespace-separated field.
                     Examples::
                         a.grep( lambda x: x.startswith('C') )
                         a.grep('Cha.*log', prune=1)
                         a.grep('chm', field=-1)
                     """
                     def target_of(line):
                         # Whole line, or the requested field ("" when it is missing).
                         if field is None:
                             return line
                         tokens = line.split()
                         try:
                             return tokens[field]
                         except IndexError:
                             return ""
                     if isinstance(pattern, basestring):
                         def matches(text):
                             return re.search(pattern, text, re.IGNORECASE)
                     else:
                         matches = pattern
                     keep_matching = not prune
                     return SList([el for el in self
                                   if bool(matches(target_of(el))) == keep_matching])
                 def fields(self, *fields):
                     """ Collect whitespace-separated fields from string list
                     Allows quick awk-like usage of string lists.
                     Example data (in var a, created by 'a = !ls -l')::
                         -rwxrwxrwx  1 ville None      18 Dec 14  2006 ChangeLog
                         drwxrwxrwx+ 6 ville None       0 Oct 24 18:05 IPython
                     a.fields(0) is ['-rwxrwxrwx', 'drwxrwxrwx+']
                     a.fields(1,0) is ['1 -rwxrwxrwx', '6 drwxrwxrwx+']
                     (note the joining by space).
                     a.fields(-1) is ['ChangeLog', 'IPython']
                     IndexErrors are ignored; lines yielding no field at all are skipped.
                     Without args, fields() just split()'s the strings.
                     """
                     if not fields:
                         return [el.split() for el in self]
                     split_lines = [f.split() for f in self]
                     collected = SList()
                     for tokens in split_lines:
                         picked = []
                         for idx in fields:
                             try:
                                 picked.append(tokens[idx])
                             except IndexError:
                                 continue
                         if picked:
                             collected.append(" ".join(picked))
                     return collected
                 def sort(self,field= None,  nums = False):
                     """ sort by specified fields (see fields())
                     Returns a new SList; the receiver is left unmodified.
                     Example::
                         a.sort(1, nums = True)
                     Sorts a by second field, in numerical order (so that 21 > 3)
                     """
                     # decorate, sort, undecorate
                     if field is None:
                         decorated = [[line,  line] for line in self]
                     else:
                         decorated = [[SList([line]).fields(field),  line] for line in self]
                     if nums:
                         for pair in decorated:
                             # Keep only the all-digit pieces of the key; 0 when none.
                             digits = "".join([ch for ch in pair[0] if ch.isdigit()])
                             try:
                                 pair[0] = int(digits)
                             except ValueError:
                                 pair[0] = 0
                     decorated.sort()
                     return SList([line for _, line in decorated])
             # FIXME: We need to reimplement type specific displayhook and then add this
             # back as a custom printer. This should also be moved outside utils into the
             # core.
             # def print_slist(arg):
             #     """ Prettier (non-repr-like) and more informative printer for SList """
             #     print "SList (.p, .n, .l, .s, .grep(), .fields(), sort() available):"
             #     if hasattr(arg,  'hideonce') and arg.hideonce:
             #         arg.hideonce = False
             #         return
             #
             #     nlprint(arg)
             #
             # print_slist = result_display.when_type(SList)(print_slist)
             def esc_quotes(strng):
                 """Return ``strng`` with every single and double quote backslash-escaped."""
                 # Double quotes first, then single quotes.
                 double_escaped = strng.replace('"','\\"')
                 return double_escaped.replace("'","\\'")
             def qw(words,flat=0,sep=None,maxsplit=-1):
                 """Similar to Perl's qw() operator, but with some more options.
                 qw(words,flat=0,sep=' ',maxsplit=-1) -> words.split(sep,maxsplit)
                 words can also be a list itself, and with flat=1, the output will be
                 recursively flattened.
                 Parameters
                 ----------
                 words : string or (nested) list of strings
                     The text to split.
                 flat : bool-like, optional [default is 0]
                     When true and `words` is a list, the per-item results are passed
                     through `flatten`.
                 sep, maxsplit : optional
                     Passed to ``str.split`` for every string that is split, including
                     strings found inside nested lists.
                 Returns
                 -------
                 A list of stripped, non-blank words (string input), or a list of such
                 results, one per item (list input).
                 Examples:
                 >>> qw('1 2')
                 ['1', '2']
                 >>> qw(['a b','1 2',['m n','p q']])
                 [['a', 'b'], ['1', '2'], [['m', 'n'], ['p', 'q']]]
                 >>> qw(['a b','1 2',['m n','p q']],flat=1)
                 ['a', 'b', '1', '2', 'm', 'n', 'p', 'q']
                 """
                 if isinstance(words, basestring):
                     return [word.strip() for word in words.split(sep,maxsplit)
                             if word and not word.isspace() ]
                 # Recurse with the caller's sep/maxsplit (they used to be dropped for
                 # nested input) and build a real list rather than relying on map().
                 nested = [qw(item, flat, sep, maxsplit) for item in words]
                 if flat:
                     return flatten(nested)
                 return nested
             def qwflat(words,sep=None,maxsplit=-1):
                 """Convenience shorthand: call qw(words) with flat mode switched on."""
                 return qw(words, flat=1, sep=sep, maxsplit=maxsplit)
             def qw_lol(indata):
                 """qw_lol('a b') -> [['a','b']],
                 otherwise it's just a call to qw().
                 A plain string is wrapped in an extra list so that the modules_some
                 keys *always* end up as a list of lists."""
                 return [qw(indata)] if isinstance(indata, basestring) else qw(indata)
             def grep(pat,list,case=1):
                 """Simple minded grep-like function.
                 grep(pat,list) returns the items of list that contain pat, or None when
                 nothing matches.
                 Only plain substring matching is done, with no support for regexps. Use
                 the option case=0 for case-insensitive matching."""
                 # The matching items are copied into a fresh list for output.
                 if case:
                     hits = [term for term in list if term.find(pat) > -1]
                 else:
                     lowered = pat.lower()
                     hits = [term for term in list if term.lower().find(lowered) > -1]
                 if not hits:
                     return None
                 return hits
             def dgrep(pat,*opts):
                 """Return grep() on dir()+dir(__builtins__).
                 The names searched are those of ``__main__`` and of its ``__builtins__``.
                 A very common use of grep() when working interactively."""
                 candidates = dir(__main__)+dir(__main__.__builtins__)
                 return grep(pat, candidates, *opts)
             def idgrep(pat):
                 """Case-insensitive dgrep()"""
                 # dgrep forwards extra positionals to grep(); 0 lands on its `case` flag.
                 case_flag = 0
                 return dgrep(pat, case_flag)
             def igrep(pat,list):
                 """Synonym for case-insensitive grep."""
                 # Third positional argument of grep() is `case`.
                 return grep(pat, list, 0)
             def indent(instr,nspaces=4, ntabs=0, flatten=False):
                 """Indent a string a given number of spaces or tabstops.
                 indent(str,nspaces=4,ntabs=0) -> indent str by ntabs+nspaces.
                 Parameters
                 ----------
                 instr : basestring
                     The string to be indented.
                 nspaces : int (default: 4)
                     The number of spaces to be indented.
                 ntabs : int (default: 0)
                     The number of tabs to be indented.
                 flatten : bool (default: False)
                     Whether to scrub existing indentation.  If True, all lines will be
                     aligned to the same indentation.  If False, existing indentation will
                     be strictly increased.
                 Returns
                 -------
                 str|unicode : string indented by ntabs and nspaces, or None when
                 `instr` is None.
                 """
                 if instr is None:
                     return
                 ind = '\t'*ntabs+' '*nspaces
                 if flatten:
                     pat = re.compile(r'^\s*', re.MULTILINE)
                 else:
                     pat = re.compile(r'^', re.MULTILINE)
                 outstr = pat.sub(ind, instr)
                 # In MULTILINE mode '^' also matches after a trailing newline, which
                 # leaves a dangling indent at the very end; strip it.  Two guards:
                 #  * `ind` must be non-empty, otherwise outstr[:-0] would be ''.
                 #  * test for '\n' rather than os.linesep: '^' only anchors after
                 #    '\n', and this also covers text ending in '\r\n'.
                 if ind and outstr.endswith('\n'+ind):
                     return outstr[:-len(ind)]
                 return outstr
             def native_line_ends(filename,backup=1):
                 """Convert (in-place) a file to line-ends native to the current OS.
                 The file is rewritten with every line terminated by ``os.linesep``; a
                 final line terminator is always written.
                 Parameters
                 ----------
                 filename : str
                     Path of the file to convert.
                 backup : bool-like, optional [default is 1]
                     If given as false, no backup of the original file is left.
                 Notes
                 -----
                 If rewriting fails, the backup copy is renamed back over `filename`
                 and the error is not propagated (best-effort, as before).
                 """
                 backup_suffixes = {'posix':'~','dos':'.bak','nt':'.bak','mac':'.bak'}
                 # Fall back to '.bak' instead of raising KeyError on other platforms.
                 bak_filename = filename + backup_suffixes.get(os.name, '.bak')
                 # Work on bytes so the 'wb' write below is valid on Python 2 and 3
                 # alike, and so no newline translation happens behind our back.
                 with open(filename, 'rb') as src:
                     original = src.read()
                 shutil.copy2(filename,bak_filename)
                 eol = os.linesep.encode('ascii')
                 try:
                     # The with-block closes the handle before any restore is attempted.
                     with open(filename,'wb') as new:
                         new.write(eol.join(original.splitlines()))
                         new.write(eol) # ALWAYS put an eol at the end of the file
                 except Exception:
                     # Best-effort recovery: put the untouched copy back in place.
                     os.rename(bak_filename,filename)
                 if not backup:
                     try:
                         os.remove(bak_filename)
                     except OSError:
                         # The backup may already be gone (e.g. renamed back above).
                         pass
             def list_strings(arg):
                 """Always return a list of strings, given a string or list of strings
                 as input.
                 A single string is wrapped in a one-element list; anything else is
                 returned as is.
                 :Examples:
                     In [7]: list_strings('A single string')
                     Out[7]: ['A single string']
                     In [8]: list_strings(['A single string in a list'])
                     Out[8]: ['A single string in a list']
                     In [9]: list_strings(['A','list','of','strings'])
                     Out[9]: ['A', 'list', 'of', 'strings']
                 """
                 if not isinstance(arg,basestring):
                     return arg
                 return [arg]
             def marquee(txt='',width=78,mark='*'):
                 """Return the input string centered in a 'marquee'.
                 With empty `txt`, the result is just `mark` repeated and cut to `width`.
                 :Examples:
                     In [16]: marquee('A test',40)
                     Out[16]: '**************** A test ****************'
                     In [17]: marquee('A test',40,'-')
                     Out[17]: '---------------- A test ----------------'
                     In [18]: marquee('A test',40,' ')
                     Out[18]: '                 A test                 '
                 """
                 if not txt:
                     return (mark*width)[:width]
                 # Room left after the text and its two padding spaces, counted in whole
                 # marks and halved between both sides; never negative.
                 per_side = max((width-len(txt)-2)//len(mark)//2, 0)
                 border = mark*per_side
                 return '%s %s %s' % (border,txt,border)
             # Matches a run of leading whitespace at the start of a string.
             ini_spaces_re = re.compile(r'^(\s+)')
             def num_ini_spaces(strng):
                 """Return the number of initial whitespace characters in a string
                 (0 when the string does not start with whitespace)."""
                 leading = ini_spaces_re.match(strng)
                 return leading.end() if leading else 0
             def format_screen(strng):
                 """Format a string for screen printing.
                 This removes some latex-type format codes: currently a backslash that
                 ends a line (paragraph continuation) is dropped."""
                 # Paragraph continue
                 line_end_backslash = re.compile(r'\\$',re.MULTILINE)
                 return line_end_backslash.sub('',strng)
             def dedent(text):
                 """Equivalent of textwrap.dedent that ignores unindented first line.
                 This means it will still dedent strings like:
                 '''foo
                 is a bar
                 '''
                 For use in wrap_paragraphs.
                 """
                 # Text that opens with a blank line, or that has only one line, gets
                 # the plain textwrap treatment.
                 if text.startswith('\n') or '\n' not in text:
                     return textwrap.dedent(text)
                 # Otherwise keep the first line verbatim and dedent only what follows.
                 head, _, tail = text.partition('\n')
                 return head + '\n' + textwrap.dedent(tail)
             def wrap_paragraphs(text, ncols=80):
                 """Wrap multiple paragraphs to fit a specified width.
                 This is equivalent to textwrap.wrap, but with support for multiple
                 paragraphs, as separated by empty lines.
                 Returns
                 -------
                 list of complete paragraphs, wrapped to fill `ncols` columns.
                 """
                 paragraph_re = re.compile(r'\n(\s*\n)+', re.MULTILINE)
                 indent_re = re.compile(r'\n\s+', re.MULTILINE)
                 cleaned = dedent(text).strip()
                 # The pattern has a capturing group, so split() interleaves the
                 # separators with the paragraphs: keep every other entry.
                 paragraphs = paragraph_re.split(cleaned)[::2]
                 # Presume indentation that survives dedent is meaningful formatting,
                 # so only fill paragraphs whose continuation lines are flush.
                 return [p if indent_re.search(p) is not None else textwrap.fill(p, ncols)
                         for p in paragraphs]
             class EvalFormatter(Formatter):
                 """A String Formatter that allows evaluation of simple expressions.
                 Note that this version interprets a : as specifying a format string (as per
                 standard string formatting), so if slicing is required, you must explicitly
                 create a slice.
                 This is to be used in templating cases, such as the parallel batch
                 script templates, where simple arithmetic on arguments is useful.
                 Examples
                 --------
                 In  [1]: f = EvalFormatter()
                 In  [2]: f.format('{n//4}', n=8)
                 Out [2]: '2'
                 In  [3]: f.format("{greeting[slice(2,4)]}", greeting="Hello")
                 Out [3]: 'll'
                 """
                 def get_field(self, name, args, kwargs):
                     # NOTE(review): the field text goes straight to eval() with the
                     # keyword arguments as its namespace; positional `args` are unused.
                     # Only use with trusted templates.
                     return eval(name, kwargs), name
             @skip_doctest_py3
             class FullEvalFormatter(Formatter):
                 """A String Formatter that allows evaluation of simple expressions.
                 Every replacement field is evaluated as an expression in the kwargs
                 namespace.
                 Note that this version allows slicing using [1:2], so you cannot specify
                 a format string. Use :class:`EvalFormatter` to permit format strings.
                 Examples
                 --------
                 In [1]: f = FullEvalFormatter()
                 In [2]: f.format('{n//4}', n=8)
                 Out[2]: u'2'
                 In [3]: f.format('{list(range(5))[2:4]}')
                 Out[3]: u'[2, 3]'
                 In [4]: f.format('{3*2}')
                 Out[4]: u'6'
                 """
                 # copied from Formatter._vformat with minor changes to allow eval
                 # and replace the format_spec code with slicing
                 def _vformat(self, format_string, args, kwargs, used_args, recursion_depth):
                     if recursion_depth < 0:
                         raise ValueError('Max string recursion exceeded')
                     pieces = []
                     for literal_text, field_name, format_spec, conversion in self.parse(format_string):
                         # literal text is emitted as is
                         if literal_text:
                             pieces.append(literal_text)
                         # nothing more to do when this chunk carries no field
                         if field_name is None:
                             continue
                         if format_spec:
                             # glue the would-be format spec back on, so that a ':'
                             # inside the field (slicing) reaches eval() intact
                             field_name = ':'.join([field_name, format_spec])
                         # NOTE(review): eval() of template text; trusted templates only.
                         value = eval(field_name, kwargs)
                         # apply any !r / !s conversion, then format with an empty spec
                         value = self.convert_field(value, conversion)
                         pieces.append(self.format_field(value, ''))
                     return u''.join(py3compat.cast_unicode(s) for s in pieces)
             @skip_doctest_py3
             class DollarFormatter(FullEvalFormatter):
                 """Formatter allowing Itpl style $foo replacement, for names and attribute
                 access only. Standard {foo} replacement also works, and allows full
                 evaluation of its arguments.
                 ``$$foo`` is an escape and produces the literal text ``$foo``.
                 Examples
                 --------
                 In [1]: f = DollarFormatter()
                 In [2]: f.format('{n//4}', n=8)
                 Out[2]: u'2'
                 In [3]: f.format('23 * 76 is $result', result=23*76)
                 Out[3]: u'23 * 76 is 1748'
                 In [4]: f.format('$a or {b}', a=1, b=2)
                 Out[4]: u'1 or 2'
                 """
                 # Raw literal: the pattern is unchanged, but no longer relies on Python
                 # passing unknown escapes such as "\$" through untouched.
                 # DOTALL: group 1 must be able to span newlines.  Otherwise a match can
                 # only start after the last newline preceding a $name, and the literal
                 # text skipped before it is never yielded (i.e. silently dropped).
                 _dollar_pattern = re.compile(r"(.*?)\$(\$?[\w\.]+)", re.DOTALL)
                 def parse(self, fmt_string):
                     """Yield (literal_text, field_name, format_spec, conversion) tuples,
                     like Formatter.parse, with $name occurrences found in the literal
                     text turned into fields of their own."""
                     for literal_txt, field_name, format_spec, conversion \
                                 in Formatter.parse(self, fmt_string):
                         # Find $foo patterns in the literal text.
                         continue_from = 0
                         txt = ""
                         for m in self._dollar_pattern.finditer(literal_txt):
                             new_txt, new_field = m.group(1,2)
                             # $$foo --> $foo
                             if new_field.startswith("$"):
                                 txt += new_txt + new_field
                             else:
                                 yield (txt + new_txt, new_field, "", None)
                                 txt = ""
                             continue_from = m.end()
                         # Re-yield the {foo} style pattern
                         yield (txt + literal_txt[continue_from:], field_name, format_spec, conversion)
             #-----------------------------------------------------------------------------
             # Utils to columnize a list of string
             #-----------------------------------------------------------------------------
             def _chunks(l, n):
                 """Yield successive slices of `l`, each holding at most `n` items."""
                 for start in xrange(0, len(l), n):
                     stop = start + n
                     yield l[start:stop]
-            def _find_optimal(rlist , sepsize=2 , displaywidth=80):
+            def _find_optimal(rlist , separator_size=2 , displaywidth=80):
                 """Calculate optimal info to columnize a list of string"""
                 for nrow in range(1, len(rlist)+1) :
-                    chk = [max(l) for l in _chunks(rlist, nrow) ]
+                    chk = map(max,_chunks(rlist, nrow))
                     sumlength = sum(chk)
                     ncols = len(chk)
-                    if sumlength+sepsize*(ncols-1) <= displaywidth :
+                    if sumlength+separator_size*(ncols-1) <= displaywidth :
                         break;
                 return {'columns_numbers' : ncols,
                         'optimal_separator_width':(displaywidth - sumlength)/(ncols-1) if (ncols -1) else 0,
                         'rows_numbers' : nrow,
                         'columns_width' : chk
                        }
             def _get_or_default(mylist, i, default=None):
                 """Return ``mylist[i]``, or `default` when `i` is past the end of the list."""
                 return mylist[i] if i < len(mylist) else default
+            @skip_doctest
             def compute_item_matrix(items, *args, **kwargs) :
-                """ Transform a list of strings into a nested list to columnize
+                """Returns a nested list, and info to columnize items
+                Parameters :
+                ------------
+                items :
+                    list of strings to columnize
+                separator_size : int (default=2)
+                    How many characters will be used as a separation between columns.
+                displaywidth : int (default=80)
+                    The width of the area into which the columns should fit
+                Returns :
+                ---------
                 Returns a tuple of (strings_matrix, dict_info)
-                innermost lists are rows, see columnize for options info
+                strings_matrix :
+                    nested list of string, the outer most list contains as many list as
+                    rows, the innermost lists have each as many elements as columns. If the
+                    total number of elements in `items` does not equal the product of
+                    rows*columns, the last element of some lists are filled with `None`.
+                dict_info :
+                    some info to make columnize easier:
+                    columns_numbers : number of columns
+                    rows_numbers    : number of rows
+                    columns_width   : list of the width of each column
+                    optimal_separator_width : best separator width between columns
+                Example :
+                ---------
+                In [1]: l = ['aaa','b','cc','d','eeeee','f','g','h','i','j','k','l']
+                   ...: compute_item_matrix(l,displaywidth=12)
+                Out[1]:
+                    ([['aaa', 'f', 'k'],
+                    ['b', 'g', 'l'],
+                    ['cc', 'h', None],
+                    ['d', 'i', None],
+                    ['eeeee', 'j', None]],
+                    {'columns_numbers': 3,
+                    'columns_width': [5, 1, 1],
+                    'optimal_separator_width': 2,
+                    'rows_numbers': 5})
                 """
                 info = _find_optimal(map(len, items), *args, **kwargs)
                 nrow, ncol = info['rows_numbers'], info['columns_numbers']
                 return ([[ _get_or_default(items, c*nrow+i) for c in range(ncol) ] for i in range(nrow) ], info)
             def columnize(items, separator='  ', displaywidth=80):
                 """ Transform a list of strings into a single string with columns.
                 Parameters
                 ----------
                 items : sequence of strings
                     The strings to process.
                 separator : str, optional [default is two spaces]
                     The string that separates columns.
                 displaywidth : int, optional [default is 80]
                     Width of the display in number of characters.
                 Returns
                 -------
                 The formatted string.
                 """
                 if not items :
                     return '\n'
-                matrix, info = compute_item_matrix(items, sepsize=len(separator), displaywidth=displaywidth)
+                matrix, info = compute_item_matrix(items, separator_size=len(separator), displaywidth=displaywidth)
-                #sep = ' '*min(info['optimal_separator_width'], 9)
-                fmatrix = matrix
                 fmatrix = [filter(None, x) for x in matrix]
                 sjoin = lambda x : separator.join([ y.ljust(w, ' ') for y, w in zip(x, info['columns_width'])])
                 return '\n'.join(map(sjoin, fmatrix))+'\n'