Coverage for src/thunderlab/tabledata.py: 88%

1570 statements  

« prev     ^ index     » next       coverage.py v7.7.0, created at 2025-03-18 22:36 +0000

1""" 

2Tables with hierarchical headers and units 

3 

4## Classes 

5 

6- `class TableData`: tables with a rich hierarchical header 

7 including units and column-specific formats. Kind of similar to a 

8 pandas data frame, but with intuitive numpy-style indexing and nicely 

9 formatted output to csv, html, and latex. 

10 

11 

12## Helper functions 

13 

14- `write()`: shortcut for constructing and writing a TableData. 

15- `latex_unit()`: translate unit string into SIunit LaTeX code. 

16- `index2aa()`: convert an integer into an alphabetical representation. 

17- `aa2index()`: convert an alphabetical representation to an index. 

18 

19 

20## Configuration 

21 

22- `add_write_table_config()`: add parameter specifying how to write a table to a file as a new section to a configuration. 

23- `write_table_args()`: translates a configuration to the respective parameter names for writing a table to a file. 

24""" 

25 

26import sys 

27import os 

28import re 

29import math as m 

30import numpy as np 

31from io import StringIO 

32try: 

33 import pandas as pd 

34 has_pandas = True 

35except ImportError: 

36 has_pandas = False 

37 

38 

39__pdoc__ = {} 

40__pdoc__['TableData.__contains__'] = True 

41__pdoc__['TableData.__len__'] = True 

42__pdoc__['TableData.__iter__'] = True 

43__pdoc__['TableData.__next__'] = True 

44__pdoc__['TableData.__setupkey__'] = True 

45__pdoc__['TableData.__call__'] = True 

46__pdoc__['TableData.__getitem__'] = True 

47__pdoc__['TableData.__setitem__'] = True 

48__pdoc__['TableData.__delitem__'] = True 

49__pdoc__['TableData.__str__'] = True 

50 

51 

52default_missing_str = '-' 

53"""Default string indicating nan data elements when outputting data.""" 

54 

55default_missing_inputs = ['na', 'NA', 'nan', 'NAN', '-'] 

56"""Default strings that are translated to nan when loading table data.""" 

57 

58 

59class TableData(object): 

60 """Table with numpy-style indexing and a rich hierarchical header including units and formats. 

61  

62 Parameters 

63 ---------- 

64 data: str, stream, ndarray 

65 - a filename: load table from file with name `data`. 

66 - a stream/file handle: load table from that stream. 

67 - 1-D or 2-D ndarray of data: the data of the table. 

68 Requires als a specified `header`. 

69 header: list of str 

70 Header labels for each column. 

71 units: list of str, optional 

72 Unit strings for each column. 

73 formats: str or list of str, optional 

74 Format strings for each column. If only a single format string is 

75 given, then all columns are initialized with this format string. 

76 missing: list of str 

77 Missing data are indicated by one of these strings. 

78 

79 Manipulate table header 

80 ----------------------- 

81 

82 Each column of the table has a label (the name of the column), a 

83 unit, and a format specifier. Sections group columns into a hierarchy. 

84 

85 - `__init__()`: initialize a TableData from data or a file. 

86 - `append()`: append column to the table. 

87 - `insert()`: insert a table column at a given position. 

88 - `remove()`: remove columns from the table. 

89 - `section()`: the section name of a specified column. 

90 - `set_section()`: set a section name. 

91 - `append_section()`: add sections to the table header. 

92 - `insert_section()`: insert a section at a given position of the table header. 

93 - `label()`: the name of a column. 

94 - `set_label()`: set the name of a column. 

95 - `unit()`: the unit of a column. 

96 - `set_unit()`: set the unit of a column. 

97 - `set_units()`: set the units of all columns. 

98 - `format()`: the format string of the column. 

99 - `set_format()`: set the format string of a column. 

100 - `set_formats()`: set the format strings of all columns. 

101 

102 For example: 

103 ``` 

104 tf = TableData('data.csv') 

105 ``` 

106 loads a table directly from a file. See `load()` for details. 

107 ``` 

108 tf = TableData(np.random.randn(4,3), header=['aaa', 'bbb', 'ccc'], units=['m', 's', 'g'], formats='%.2f')  

109 ``` 

110 results in 

111 ``` plain 

112 aaa bbb ccc 

113 m s g  

114 1.45 0.01 0.16 

115 -0.74 -0.58 -1.34 

116 -2.06 0.08 1.47 

117 -0.43 0.60 1.38 

118 ``` 

119 

120 A more elaborate way to construct a table is: 

121 ``` 

122 df = TableData() 

123 # first column with section names and 3 data values: 

124 df.append(["data", "partial information", "size"], "m", "%6.2f", 

125 [2.34, 56.7, 8.9]) 

126 # next columns with single data values: 

127 df.append("full weight", "kg", "%.0f", 122.8) 

128 df.append_section("complete reaction") 

129 df.append("speed", "m/s", "%.3g", 98.7) 

130 df.append("median jitter", "mm", "%.1f", 23) 

131 df.append("size", "g", "%.2e", 1.234) 

132 # add a missing value to the second column: 

133 df.append_data(np.nan, 1) 

134 # fill up the remaining columns of the row: 

135 df.append_data((0.543, 45, 1.235e2)) 

136 # append data to the next row starting at the second column: 

137 df.append_data((43.21, 6789.1, 3405, 1.235e-4), 1) # next row 

138 ``` 

139 results in 

140 ``` plain 

141 data 

142 partial information complete reaction 

143 size full weight speed median jitter size 

144 m kg m/s mm g  

145 2.34 123 98.7 23.0 1.23e+00 

146 56.70 - 0.543 45.0 1.24e+02 

147 8.90 43 6.79e+03 3405.0 1.23e-04 

148 ``` 

149  

150 Table columns 

151 ------------- 

152 

153 Columns can be specified by an index or by the name of a column. In 

154 table headers with sections the colum can be specified by the 

155 section names and the column name separated by '>'. 

156  

157 - `index()`: the index of a column. 

158 - `__contains__()`: check for existence of a column. 

159 - `find_col()`: find the start and end index of a column specification. 

160 - `column_spec()`: full specification of a column with all its section names. 

161 - `column_head()`: the name, unit, and format of a column. 

162 - `table_header()`: the header of the table without content. 

163 

164 For example: 

165 ``` 

166 df.index('complete reaction>size) # returns 4 

167 'speed' in df # is True 

168 ``` 

169 

170 Iterating over columns 

171 ---------------------- 

172 

173 A table behaves like an ordered dictionary with column names as 

174 keys and the data of each column as values. 

175 Iterating over a table goes over columns. 

176  

177 - `keys()`: list of unique column keys for all available columns. 

178 - `values()`: list of column data corresponding to keys(). 

179 - `items()`: list of tuples with unique column specifications and the corresponding data. 

180 - `__len__()`: the number of columns. 

181 - `__iter__()`: initialize iteration over data columns. 

182 - `__next__()`: return data of next column as a list. 

183 - `data`: the table data as a list over columns each containing a list of data elements. 

184 

185 For example: 

186 ``` 

187 print('column specifications:') 

188 for c in range(df.columns()): 

189 print(df.column_spec(c)) 

190 print('keys():') 

191 for c, k in enumerate(df.keys()): 

192 print('%d: %s' % (c, k)) 

193 print('values():') 

194 for c, v in enumerate(df.values()): 

195 print(v) 

196 print('iterating over the table:') 

197 for v in df: 

198 print(v) 

199 ``` 

200 results in 

201 ``` plain 

202 column specifications: 

203 data>partial information>size 

204 data>partial information>full weight 

205 data>complete reaction>speed 

206 data>complete reaction>median jitter 

207 data>complete reaction>size 

208 keys(): 

209 0: data>partial information>size 

210 1: data>partial information>full weight 

211 2: data>complete reaction>speed 

212 3: data>complete reaction>median jitter 

213 4: data>complete reaction>size 

214 values(): 

215 [2.34, 56.7, 8.9] 

216 [122.8, nan, 43.21] 

217 [98.7, 0.543, 6789.1] 

218 [23, 45, 3405] 

219 [1.234, 123.5, 0.0001235] 

220 iterating over the table: 

221 [2.34, 56.7, 8.9] 

222 [122.8, nan, 43.21] 

223 [98.7, 0.543, 6789.1] 

224 [23, 45, 3405] 

225 [1.234, 123.5, 0.0001235] 

226 ``` 

227 

228 Accessing data 

229 -------------- 

230 

231 In contrast to the iterator functions the [] operator treats the 

232 table as a 2D-array where the first index indicates the row and 

233 the second index the column. 

234 

235 Like a numpy aray the table can be sliced, and logical indexing can 

236 be used to select specific parts of the table. 

237  

238 As for any function, columns can be specified as indices or strings. 

239  

240 - `rows()`: the number of rows. 

241 - `columns()`: the number of columns. 

242 - `shape`: number of rows and columns. 

243 - `row()`: a single row of the table as TableData. 

244 - `row_dict()`: a single row of the table as dictionary. 

245 - `col()`: a single column of the table as TableData. 

246 - `__call__()`: a single column of the table as ndarray. 

247 - `__getitem__()`: data elements specified by slice. 

248 - `__setitem__()`: assign values to data elements specified by slice. 

249 - `__delitem__()`: delete data elements or whole columns or rows. 

250 - `array()`: the table data as a ndarray. 

251 - `data_frame()`: the table data as a pandas DataFrame. 

252 - `dicts()`: the table as a list of dictionaries. 

253 - `dict()`: the table as a dictionary. 

254 - `append_data()`: append data elements to successive columns. 

255 - `append_data_column()`: append data elements to a column. 

256 - `set_column()`: set the column where to add data. 

257 - `fill_data()`: fill up all columns with missing data. 

258 - `clear_data()`: clear content of the table but keep header. 

259 - `key_value()`: a data element returned as a key-value pair. 

260  

261 - `sort()`: sort the table rows in place. 

262 - `statistics()`: descriptive statistics of each column. 

263 

264 For example: 

265 ``` 

266 # single column:  

267 df('size') # data of 'size' column as ndarray 

268 df[:,'size'] # data of 'size' column as ndarray 

269 df.col('size') # table with the single column 'size' 

270 

271 # single row:  

272 df[2,:] # table with data of only the third row 

273 df.row(2) # table with data of only the third row 

274 

275 # slices: 

276 df[2:5,['size','jitter']] # sub-table 

277 df[2:5,['size','jitter']].array() # ndarray with data only 

278 

279 # logical indexing: 

280 df[df('speed') > 100.0, 'size'] = 0.0 # set size to 0 if speed is > 100 

281 

282 # delete: 

283 del df[3:6, 'weight'] # delete rows 3-6 from column 'weight' 

284 del df[3:5,:] # delete rows 3-5 completeley 

285 del df[:,'speed'] # remove column 'speed' from table 

286 df.remove('weight') # remove column 'weigth' from table 

287 

288 # sort and statistics: 

289 df.sort(['weight', 'jitter']) 

290 df.statistics() 

291 ``` 

292 statistics() returns a table with standard descriptive statistics: 

293 ``` plain 

294 statistics data 

295 - partial information complete reaction 

296 - size full weight speed median jitter size 

297 - m kg m/s mm g  

298 mean 22.65 83 2.3e+03 1157.7 4.16e+01 

299 std 24.23 40 3.18e+03 1589.1 5.79e+01 

300 min 2.34 43 0.543 23.0 1.23e-04 

301 quartile1 5.62 83 49.6 34.0 6.17e-01 

302 median 8.90 123 98.7 45.0 1.23e+00 

303 quartile3 32.80 - 3.44e+03 1725.0 6.24e+01 

304 max 56.70 123 6.79e+03 3405.0 1.24e+02 

305 count 3.00 2 3 3.0 3.00e+00 

306 ``` 

307 

308 Write and load tables 

309 --------------------- 

310 

311 Table data can be written to a variety of text-based formats 

312 including comma separated values, latex and html files. Which 

313 columns are written can be controlled by the hide() and show() 

314 functions. TableData can be loaded from all the written file formats 

315 (except html), also directly via the constructor. 

316  

317 - `hide()`: hide a column or a range of columns. 

318 - `hide_all()`: hide all columns. 

319 - `hide_empty_columns()`: hide all columns that do not contain data. 

320 - `show()`: show a column or a range of columns. 

321 - `write()`: write table to a file or stream. 

322 - `write_file_stream()`: write table to file or stream and return appropriate file name. 

323 - `__str__()`: write table to a string. 

324 - `load()`: load table from file or stream. 

325 - `formats`: list of supported file formats for writing. 

326 - `descriptions`: dictionary with descriptions of the supported file formats. 

327 - `extensions`: dictionary with default filename extensions for each of the file formats. 

328 - `ext_formats`: dictionary mapping filename extensions to file formats. 

329 

330 See documentation of the `write()` function for examples of the supported file formats. 

331 

332 """ 

333 

334 formats = ['dat', 'ascii', 'csv', 'rtai', 'md', 'tex', 'html'] 

335 """list of strings: Supported output formats.""" 

336 descriptions = {'dat': 'data text file', 'ascii': 'ascii-art table', 

337 'csv': 'comma separated values', 'rtai': 'rtai-style table', 

338 'md': 'markdown', 'tex': 'latex tabular', 

339 'html': 'html markup'} 

340 """dict: Decription of output formats corresponding to `formats`.""" 

341 extensions = {'dat': 'dat', 'ascii': 'txt', 'csv': 'csv', 'rtai': 'dat', 

342 'md': 'md', 'tex': 'tex', 'html': 'html'} 

343 """dict: Default file extensions for the output `formats`. """ 

344 ext_formats = {'dat': 'dat', 'DAT': 'dat', 'txt': 'dat', 'TXT': 'dat', 

345 'csv': 'csv', 'CSV': 'csv', 'md': 'md', 'MD': 'md', 

346 'tex': 'tex', 'TEX': 'tex', 'html': 'html', 'HTML': 'html'} 

347 """dict: Mapping of file extensions to the output formats.""" 

348 

349 def __init__(self, data=None, header=None, units=None, formats=None, 

350 missing=default_missing_inputs, stop=None): 

351 self.data = [] 

352 self.shape = (0, 0) 

353 self.header = [] 

354 self.nsecs = 0 

355 self.units = [] 

356 self.formats = [] 

357 self.hidden = [] 

358 self.setcol = 0 

359 self.addcol = 0 

360 if header is not None: 

361 if units is None: 

362 units = ['']*len(header) 

363 if formats is None: 

364 formats = ['%g']*len(header) 

365 elif not isinstance(formats, (list, tuple, np.ndarray)): 

366 formats = [formats]*len(header) 

367 for h, u, f in zip(header, units, formats): 

368 self.append(h, u, f) 

369 if data is not None: 

370 if isinstance(data, TableData): 

371 self.shape = data.shape 

372 self.nsecs = data.nsecs 

373 self.setcol = data.setcol 

374 self.addcol = data.addcol 

375 for c in range(data.columns()): 

376 self.header.append([]) 

377 for h in data.header[c]: 

378 self.header[c].append(h) 

379 self.units.append(data.units[c]) 

380 self.formats.append(data.formats[c]) 

381 self.hidden.append(data.hidden[c]) 

382 self.data.append([]) 

383 for d in data.data[c]: 

384 self.data[c].append(d) 

385 elif has_pandas and isinstance(data, pd.DataFrame): 

386 for k in data.keys(): 

387 values = data[k].tolist() 

388 f = '%s' if isinstance(values[0], str) else '%g' 

389 self.append(k, '', f, value=values) 

390 elif isinstance(data, (list, tuple, np.ndarray)): 

391 if isinstance(data[0], (list, tuple, np.ndarray)): 

392 # 2D list, rows first: 

393 for row in data: 

394 for c, val in enumerate(row): 

395 self.data[c].append(val) 

396 else: 

397 # 1D list: 

398 for c, val in enumerate(data): 

399 self.data[c].append(val) 

400 else: 

401 self.load(data, missing, stop) 

402 

403 def append(self, label, unit=None, formats=None, value=None, 

404 fac=None, key=None): 

405 """Append column to the table. 

406 

407 Parameters 

408 ---------- 

409 label: str or list of str 

410 Optional section titles and the name of the column. 

411 unit: str or None 

412 The unit of the column contents. 

413 formats: str or None 

414 The C-style format string used for printing out the column content, e.g. 

415 '%g', '%.2f', '%s', etc. 

416 If None, the format is set to '%g'. 

417 value: None, float, int, str, etc. or list thereof, or list of dict 

418 If not None, data for the column. 

419 If list of dictionaries, extract from each dictionary in the list 

420 the value specified by `key`. If `key` is `None` use `label` as 

421 the key. 

422 fac: float 

423 If not None, multiply the data values by this number. 

424 key: None or key of a dictionary 

425 If not None and `value` is a list of dictionaries, 

426 extract from each dictionary in the list the value specified 

427 by `key` and assign the resulting list as data to the column. 

428 

429 Returns 

430 ------- 

431 index: int 

432 The index of the new column. 

433 """ 

434 if self.addcol >= len(self.data): 

435 if isinstance(label, (list, tuple, np.ndarray)): 

436 self.header.append(list(reversed(label))) 

437 label = label[-1] 

438 else: 

439 self.header.append([label]) 

440 self.formats.append(formats or '%g') 

441 self.units.append(unit or '') 

442 self.hidden.append(False) 

443 self.data.append([]) 

444 if self.nsecs < len(self.header[-1])-1: 

445 self.nsecs = len(self.header[-1])-1 

446 else: 

447 if isinstance(label, (list, tuple, np.ndarray)): 

448 self.header[self.addcol] = list(reversed(label)) + self.header[self.addcol] 

449 label = label[-1] 

450 else: 

451 self.header[self.addcol] = [label] + self.header[self.addcol] 

452 self.units[self.addcol] = unit or '' 

453 self.formats[self.addcol] = formats or '%g' 

454 if self.nsecs < len(self.header[self.addcol])-1: 

455 self.nsecs = len(self.header[self.addcol])-1 

456 if not key: 

457 key = label 

458 if value is not None: 

459 if isinstance(value, (list, tuple, np.ndarray)): 

460 if key and len(value) > 0 and isinstance(value[0], dict): 

461 value = [d[key] if key in d else float('nan') for d in value] 

462 self.data[-1].extend(value) 

463 else: 

464 self.data[-1].append(value) 

465 if fac: 

466 for k in range(len(self.data[-1])): 

467 self.data[-1][k] *= fac 

468 self.addcol = len(self.data) 

469 self.shape = (self.rows(), self.columns()) 

470 return self.addcol-1 

471 

472 def insert(self, column, label, unit=None, formats=None, value=None): 

473 """Insert a table column at a given position. 

474 

475 .. WARNING:: 

476 If no `value` is given, the inserted column is an empty list. 

477 

478 Parameters 

479 ---------- 

480 columns int or str 

481 Column before which to insert the new column. 

482 Column can be specified by index or name, 

483 see `index()` for details. 

484 label: str or list of str 

485 Optional section titles and the name of the column. 

486 unit: str or None 

487 The unit of the column contents. 

488 formats: str or None 

489 The C-style format string used for printing out the column content, e.g. 

490 '%g', '%.2f', '%s', etc. 

491 If None, the format is set to '%g'. 

492 value: None, float, int, str, etc. or list thereof 

493 If not None, data for the column. 

494 

495 Returns 

496 ------- 

497 index: int 

498 The index of the inserted column. 

499  

500 Raises 

501 ------ 

502 IndexError: 

503 If an invalid column was specified. 

504 """ 

505 col = self.index(column) 

506 if col is None: 

507 if isinstance(column, (np.integer, int)): 

508 column = '%d' % column 

509 raise IndexError('Cannot insert before non-existing column ' + column) 

510 if isinstance(label, (list, tuple, np.ndarray)): 

511 self.header.insert(col, list(reversed(label))) 

512 else: 

513 self.header.insert(col, [label]) 

514 self.formats.insert(col, formats or '%g') 

515 self.units.insert(col, unit or '') 

516 self.hidden.insert(col, False) 

517 self.data.insert(col, []) 

518 if self.nsecs < len(self.header[col])-1: 

519 self.nsecs = len(self.header[col])-1 

520 if value is not None: 

521 if isinstance(value, (list, tuple, np.ndarray)): 

522 self.data[col].extend(value) 

523 else: 

524 self.data[col].append(value) 

525 self.addcol = len(self.data) 

526 self.shape = (self.rows(), self.columns()) 

527 return col 

528 

529 def remove(self, columns): 

530 """Remove columns from the table. 

531 

532 Parameters 

533 ----------- 

534 columns: int or str or list of int of str 

535 Columns can be specified by index or name, 

536 see `index()` for details. 

537 

538 Raises 

539 ------ 

540 IndexError: 

541 If an invalid column was specified. 

542 """ 

543 # fix columns: 

544 if not isinstance(columns, (list, tuple, np.ndarray)): 

545 columns = [ columns ] 

546 if not columns: 

547 return 

548 # remove: 

549 for col in columns: 

550 c = self.index(col) 

551 if c is None: 

552 if isinstance(col, (np.integer, int)): 

553 col = '%d' % col 

554 raise IndexError('Cannot remove non-existing column ' + col) 

555 continue 

556 if c+1 < len(self.header): 

557 self.header[c+1].extend(self.header[c][len(self.header[c+1]):]) 

558 del self.header[c] 

559 del self.units[c] 

560 del self.formats[c] 

561 del self.hidden[c] 

562 del self.data[c] 

563 if self.setcol >= len(self.data): 

564 self.setcol = 0 

565 self.shape = (self.rows(), self.columns()) 

566 

567 def section(self, column, level): 

568 """The section name of a specified column. 

569 

570 Parameters 

571 ---------- 

572 column: None, int, or str 

573 A specification of a column. 

574 See self.index() for more information on how to specify a column. 

575 level: int 

576 The level of the section to be returned. The column label itself is level=0. 

577 

578 Returns 

579 ------- 

580 name: str 

581 The name of the section at the specified level containing 

582 the column. 

583 index: int 

584 The column index that contains this section 

585 (equal or smaller thant `column`). 

586 

587 Raises 

588 ------ 

589 IndexError: 

590 If `level` exceeds the maximum possible level. 

591 """ 

592 if level < 0 or level > self.nsecs: 

593 raise IndexError('Invalid section level') 

594 column = self.index(column) 

595 while len(self.header[column]) <= level: 

596 column -= 1 

597 return self.header[column][level], column 

598 

599 def set_section(self, label, column, level): 

600 """Set a section name. 

601 

602 Parameters 

603 ---------- 

604 label: str 

605 The new name to be used for the section. 

606 column: None, int, or str 

607 A specification of a column. 

608 See self.index() for more information on how to specify a column. 

609 level: int 

610 The level of the section to be set. The column label itself is level=0. 

611 """ 

612 column = self.index(column) 

613 self.header[column][level] = label 

614 return column 

615 

616 def append_section(self, label): 

617 """Add sections to the table header. 

618 

619 Each column of the table has a header label. Columns can be 

620 grouped into sections. Sections can be nested arbitrarily. 

621 

622 Parameters 

623 ---------- 

624 label: stri or list of str 

625 The name(s) of the section(s). 

626 

627 Returns 

628 ------- 

629 index: int 

630 The column index where the section was appended. 

631 """ 

632 if self.addcol >= len(self.data): 

633 if isinstance(label, (list, tuple, np.ndarray)): 

634 self.header.append(list(reversed(label))) 

635 else: 

636 self.header.append([label]) 

637 self.units.append('') 

638 self.formats.append('') 

639 self.hidden.append(False) 

640 self.data.append([]) 

641 else: 

642 if isinstance(label, (list, tuple, np.ndarray)): 

643 self.header[self.addcol] = list(reversed(label)) + self.header[self.addcol] 

644 else: 

645 self.header[self.addcol] = [label] + self.header[self.addcol] 

646 if self.nsecs < len(self.header[self.addcol]): 

647 self.nsecs = len(self.header[self.addcol]) 

648 self.addcol = len(self.data)-1 

649 self.shape = (self.rows(), self.columns()) 

650 return self.addcol 

651 

652 def insert_section(self, column, section): 

653 """Insert a section at a given position of the table header. 

654 

655 Parameters 

656 ---------- 

657 columns int or str 

658 Column before which to insert the new section. 

659 Column can be specified by index or name, 

660 see `index()` for details. 

661 section: str 

662 The name of the section. 

663 

664 Returns 

665 ------- 

666 index: int 

667 The index of the column where the section was inserted. 

668  

669 Raises 

670 ------ 

671 IndexError: 

672 If an invalid column was specified. 

673 """ 

674 col = self.index(column) 

675 if col is None: 

676 if isinstance(column, (np.integer, int)): 

677 column = '%d' % column 

678 raise IndexError('Cannot insert at non-existing column ' + column) 

679 self.header[col].append(section) 

680 if self.nsecs < len(self.header[col])-1: 

681 self.nsecs = len(self.header[col])-1 

682 return col 

683 

684 def label(self, column): 

685 """The name of a column. 

686 

687 Parameters 

688 ---------- 

689 column: None, int, or str 

690 A specification of a column. 

691 See self.index() for more information on how to specify a column. 

692 

693 Returns 

694 ------- 

695 name: str 

696 The column label. 

697 """ 

698 column = self.index(column) 

699 return self.header[column][0] 

700 

701 def set_label(self, label, column): 

702 """Set the name of a column. 

703 

704 Parameters 

705 ---------- 

706 label: str 

707 The new name to be used for the column. 

708 column: None, int, or str 

709 A specification of a column. 

710 See self.index() for more information on how to specify a column. 

711 """ 

712 column = self.index(column) 

713 self.header[column][0] = label 

714 return column 

715 

716 def unit(self, column): 

717 """The unit of a column. 

718 

719 Parameters 

720 ---------- 

721 column: None, int, or str 

722 A specification of a column. 

723 See self.index() for more information on how to specify a column. 

724 

725 Returns 

726 ------- 

727 unit: str 

728 The unit. 

729 """ 

730 column = self.index(column) 

731 return self.units[column] 

732 

733 def set_unit(self, unit, column): 

734 """Set the unit of a column. 

735 

736 Parameters 

737 ---------- 

738 unit: str 

739 The new unit to be used for the column. 

740 column: None, int, or str 

741 A specification of a column. 

742 See self.index() for more information on how to specify a column. 

743 """ 

744 column = self.index(column) 

745 self.units[column] = unit 

746 return column 

747 

748 def set_units(self, units): 

749 """Set the units of all columns. 

750 

751 Parameters 

752 ---------- 

753 units: list of str 

754 The new units to be used. 

755 """ 

756 for c, u in enumerate(units): 

757 self.units[c] = u 

758 

759 def format(self, column): 

760 """The format string of the column. 

761 

762 Parameters 

763 ---------- 

764 column: None, int, or str 

765 A specification of a column. 

766 See self.index() for more information on how to specify a column. 

767 

768 Returns 

769 ------- 

770 format: str 

771 The format string. 

772 """ 

773 column = self.index(column) 

774 return self.formats[column] 

775 

776 def set_format(self, format, column): 

777 """Set the format string of a column. 

778 

779 Parameters 

780 ---------- 

781 format: str 

782 The new format string to be used for the column. 

783 column: None, int, or str 

784 A specification of a column. 

785 See self.index() for more information on how to specify a column. 

786 """ 

787 column = self.index(column) 

788 self.formats[column] = format 

789 return column 

790 

791 def set_formats(self, formats): 

792 """Set the format strings of all columns. 

793 

794 Parameters 

795 ---------- 

796 formats: str or list of str 

797 The new format strings to be used. 

798 If only a single format is specified, 

799 then all columns get the same format. 

800 """ 

801 if isinstance(formats, (list, tuple, np.ndarray)): 

802 for c, f in enumerate(formats): 

803 self.formats[c] = f or '%g' 

804 else: 

805 for c in range(len(self.formats)): 

806 self.formats[c] = formats or '%g' 

807 

808 def table_header(self): 

809 """The header of the table without content. 

810 

811 Returns 

812 ------- 

813 data: TableData 

814 A TableData object with the same header but empty data. 

815 """ 

816 data = TableData() 

817 sec_indices = [-1] * self.nsecs 

818 for c in range(self.columns()): 

819 data.append(*self.column_head(c)) 

820 for l in range(self.nsecs): 

821 s, i = self.section(c, l+1) 

822 if i != sec_indices[l]: 

823 data.header[-1].append(s) 

824 sec_indices[l] = i 

825 data.nsecs = self.nsecs 

826 return data 

827 

828 def column_head(self, column): 

829 """The name, unit, and format of a column. 

830 

831 Parameters 

832 ---------- 

833 column: None, int, or str 

834 A specification of a column. 

835 See self.index() for more information on how to specify a column. 

836 

837 Returns 

838 ------- 

839 name: str 

840 The column label. 

841 unit: str 

842 The unit. 

843 format: str 

844 The format string. 

845 """ 

846 column = self.index(column) 

847 return self.header[column][0], self.units[column], self.formats[column] 

848 

849 def column_spec(self, column): 

850 """Full specification of a column with all its section names. 

851 

852 Parameters 

853 ---------- 

854 column: int or str 

855 Specifies the column. 

856 See self.index() for more information on how to specify a column. 

857 

858 Returns 

859 ------- 

860 s: str 

861 Full specification of the column by all its section names and its header name. 

862 """ 

863 c = self.index(column) 

864 fh = [self.header[c][0]] 

865 for l in range(self.nsecs): 

866 fh.append(self.section(c, l+1)[0]) 

867 return '>'.join(reversed(fh)) 

868 

869 def find_col(self, column): 

870 """Find the start and end index of a column specification. 

871  

872 Parameters 

873 ---------- 

874 column: None, int, or str 

875 A specification of a column. 

876 See self.index() for more information on how to specify a column. 

877 

878 Returns 

879 ------- 

880 c0: int or None 

881 A valid column index or None that is specified by `column`. 

882 c1: int or None 

883 A valid column index or None of the column following the range specified 

884 by `column`. 

885 """ 

886 

887 def find_column_indices(ss, si, minns, maxns, c0, strict=True): 

888 if si >= len(ss): 

889 return None, None, None, None 

890 ns0 = 0 

891 for ns in range(minns, maxns+1): 

892 nsec = maxns-ns 

893 if ss[si] == '': 

894 si += 1 

895 continue 

896 for c in range(c0, len(self.header)): 

897 if nsec < len(self.header[c]) and \ 

898 ( ( strict and self.header[c][nsec] == ss[si] ) or 

899 ( not strict and ss[si] in self.header[c][nsec] ) ): 

900 ns0 = ns 

901 c0 = c 

902 si += 1 

903 if si >= len(ss): 

904 c1 = len(self.header) 

905 for c in range(c0+1, len(self.header)): 

906 if nsec < len(self.header[c]): 

907 c1 = c 

908 break 

909 return c0, c1, ns0, None 

910 elif nsec > 0: 

911 break 

912 return None, c0, ns0, si 

913 

914 if column is None: 

915 return None, None 

916 if not isinstance(column, (np.integer, int)) and column.isdigit(): 

917 column = int(column) 

918 if isinstance(column, (np.integer, int)): 

919 if column >= 0 and column < len(self.header): 

920 return column, column+1 

921 else: 

922 return None, None 

923 # find column by header: 

924 ss = column.rstrip('>').split('>') 

925 maxns = self.nsecs 

926 si0 = 0 

927 while si0 < len(ss) and ss[si0] == '': 

928 maxns -= 1 

929 si0 += 1 

930 if maxns < 0: 

931 maxns = 0 

932 c0, c1, ns, si = find_column_indices(ss, si0, 0, maxns, 0, True) 

933 if c0 is None and c1 is not None: 

934 c0, c1, ns, si = find_column_indices(ss, si, ns, maxns, c1, False) 

935 return c0, c1 

936 

937 def index(self, column): 

938 """The index of a column. 

939  

940 Parameters 

941 ---------- 

942 column: None, int, or str 

943 A specification of a column. 

944 - None: no column is specified 

945 - int: the index of the column (first column is zero), e.g. `index(2)`. 

946 - a string representing an integer is converted into the column index, 

947 e.g. `index('2')` 

948 - a string specifying a column by its header. 

949 Header names of descending hierarchy are separated by '>'. 

950 

951 Returns 

952 ------- 

953 index: int or None 

954 A valid column index or None. 

955 """ 

956 c0, c1 = self.find_col(column) 

957 return c0 

958 

959 def __contains__(self, column): 

960 """Check for existence of a column. 

961 

962 Parameters 

963 ---------- 

964 column: None, int, or str 

965 The column to be checked. 

966 See self.index() for more information on how to specify a column. 

967 

968 Returns 

969 ------- 

970 contains: bool 

971 True if `column` specifies an existing column key. 

972 """ 

973 return self.index(column) is not None 

974 

975 def keys(self): 

976 """List of unique column keys for all available columns. 

977 

978 Returns 

979 ------- 

980 keys: list of str 

981 List of unique column specifications. 

982 """ 

983 return [self.column_spec(c) for c in range(self.columns())] 

984 

985 def values(self): 

986 """List of column data corresponding to keys(). 

987 

988 Returns 

989 ------- 

990 data: list of list of values 

991 The data of the table. First index is columns! 

992 """ 

993 return self.data 

994 

995 def items(self): 

996 """Column names and corresponding data. 

997 

998 Returns 

999 ------- 

1000 items: list of tuples 

1001 Unique column specifications and the corresponding data. 

1002 """ 

1003 return [(self.column_spec(c), self.data[c]) for c in range(self.columns())] 

1004 

1005 def __len__(self): 

1006 """The number of columns. 

1007  

1008 Returns 

1009 ------- 

1010 columns: int 

1011 The number of columns contained in the table. 

1012 """ 

1013 return self.columns() 

1014 

1015 def __iter__(self): 

1016 """Initialize iteration over data columns. 

1017 """ 

1018 self.iter_counter = -1 

1019 return self 

1020 

1021 def __next__(self): 

1022 """Next column of data. 

1023 

1024 Returns 

1025 ------- 

1026 data: list of values 

1027 Table data of next column. 

1028 """ 

1029 self.iter_counter += 1 

1030 if self.iter_counter >= self.columns(): 

1031 raise StopIteration 

1032 else: 

1033 return self.data[self.iter_counter] 

1034 

1035 def next(self): 

1036 """Return next data columns. (python2 syntax) 

1037 

1038 See also: 

1039 --------- 

1040 `__next__()` 

1041 """ 

1042 return self.__next__() 

1043 

1044 def rows(self): 

1045 """The number of rows. 

1046  

1047 Returns 

1048 ------- 

1049 rows: int 

1050 The number of rows contained in the table. 

1051 """ 

1052 return max(map(len, self.data)) if self.data else 0 

1053 

1054 def columns(self): 

1055 """The number of columns. 

1056  

1057 Returns 

1058 ------- 

1059 columns: int 

1060 The number of columns contained in the table. 

1061 """ 

1062 return len(self.header) 

1063 

1064 def row(self, index): 

1065 """A single row of the table. 

1066 

1067 Parameters 

1068 ---------- 

1069 index: int 

1070 The index of the row to be returned. 

1071 

1072 Returns 

1073 ------- 

1074 data: TableData 

1075 A TableData object with a single row. 

1076 """ 

1077 data = TableData() 

1078 sec_indices = [-1] * self.nsecs 

1079 for c in range(self.columns()): 

1080 data.append(*self.column_head(c)) 

1081 for l in range(self.nsecs): 

1082 s, i = self.section(c, l+1) 

1083 if i != sec_indices[l]: 

1084 data.header[-1].append(s) 

1085 sec_indices[l] = i 

1086 data.data[-1] = [self.data[c][index]] 

1087 data.nsecs = self.nsecs 

1088 return data 

1089 

1090 def row_dict(self, index): 

1091 """A single row of the table. 

1092 

1093 Parameters 

1094 ---------- 

1095 index: int 

1096 The index of the row to be returned. 

1097 

1098 Returns 

1099 ------- 

1100 data: dict 

1101 A dictionary with column header as key and corresponding data value of row `index` 

1102 as value. 

1103 """ 

1104 data = {} 

1105 for c in range(self.columns()): 

1106 data[self.label(c)] = self.data[c][index] 

1107 return data 

1108 

1109 def col(self, column): 

1110 """A single column of the table. 

1111 

1112 Parameters 

1113 ---------- 

1114 column: None, int, or str 

1115 The column to be returned. 

1116 See self.index() for more information on how to specify a column. 

1117 

1118 Returns 

1119 ------- 

1120 table: TableData 

1121 A TableData object with a single column. 

1122 """ 

1123 data = TableData() 

1124 c = self.index(column) 

1125 data.append(*self.column_head(c)) 

1126 data.data = [self.data[c]] 

1127 data.nsecs = 0 

1128 return data 

1129 

1130 def __call__(self, column): 

1131 """A single column of the table as a ndarray. 

1132 

1133 Parameters 

1134 ---------- 

1135 column: None, int, or str 

1136 The column to be returned. 

1137 See self.index() for more information on how to specify a column. 

1138 

1139 Returns 

1140 ------- 

1141 data: 1-D ndarray 

1142 Content of the specified column as a ndarray. 

1143 """ 

1144 c = self.index(column) 

1145 return np.asarray(self.data[c]) 

1146 

1147 def __setupkey(self, key): 

1148 """Helper function that turns a key into row and column indices. 

1149 

1150 Returns 

1151 ------- 

1152 rows: list of int, slice, None 

1153 Indices of selected rows. 

1154 cols: list of int 

1155 Indices of selected columns. 

1156 

1157 Raises 

1158 ------ 

1159 IndexError: 

1160 If an invalid column was specified. 

1161 """ 

1162 if type(key) is not tuple: 

1163 rows = key 

1164 cols = range(self.columns()) 

1165 else: 

1166 rows = key[0] 

1167 cols = key[1] 

1168 if isinstance(cols, slice): 

1169 start = cols.start 

1170 if start is not None: 

1171 start = self.index(start) 

1172 if start is None: 

1173 raise IndexError('"%s" is not a valid column index' % cols.start) 

1174 stop = cols.stop 

1175 if stop is not None: 

1176 stop = self.index(stop) 

1177 if stop is None: 

1178 raise IndexError('"%s" is not a valid column index' % cols.stop) 

1179 cols = slice(start, stop, cols.step) 

1180 cols = range(self.columns())[cols] 

1181 else: 

1182 if not isinstance(cols, (list, tuple, np.ndarray)): 

1183 cols = [cols] 

1184 c = [self.index(inx) for inx in cols] 

1185 if None in c: 

1186 raise IndexError('"%s" is not a valid column index' % cols[c.index(None)]) 

1187 cols = c 

1188 if isinstance(rows, np.ndarray) and rows.dtype == np.dtype(bool): 

1189 rows = np.where(rows)[0] 

1190 if len(rows) == 0: 

1191 rows = None 

1192 return rows, cols 

1193 

1194 def __getitem__(self, key): 

1195 """Data elements specified by slice. 

1196 

1197 Parameters 

1198 ----------- 

1199 key: 

1200 First key specifies row, (optional) second one the column. 

1201 Columns can be specified by index or name, 

1202 see `index()` for details. 

1203 

1204 Returns 

1205 ------- 

1206 data: 

1207 - A single data value if a single row and a single column is specified. 

1208 - A ndarray of data elements if a single single column is specified. 

1209 - A TableData object for multiple columns. 

1210 - None if no row is selected (e.g. by a logical index that nowhere is True) 

1211 

1212 Raises 

1213 ------ 

1214 IndexError: 

1215 If an invalid column was specified. 

1216 """ 

1217 rows, cols = self.__setupkey(key) 

1218 if len(cols) == 1: 

1219 if rows is None: 

1220 return None 

1221 elif isinstance(rows, slice): 

1222 return np.asarray(self.data[cols[0]][rows]) 

1223 elif isinstance(rows, (list, tuple, np.ndarray)): 

1224 return np.asarray([self.data[cols[0]][r] for r in rows]) 

1225 else: 

1226 return self.data[cols[0]][rows] 

1227 else: 

1228 data = TableData() 

1229 sec_indices = [-1] * self.nsecs 

1230 for c in cols: 

1231 data.append(*self.column_head(c)) 

1232 for l in range(self.nsecs): 

1233 s, i = self.section(c, l+1) 

1234 if i != sec_indices[l]: 

1235 data.header[-1].append(s) 

1236 sec_indices[l] = i 

1237 if rows is None: 

1238 continue 

1239 if isinstance(rows, (list, tuple, np.ndarray)): 

1240 for r in rows: 

1241 data.data[-1].append(self.data[c][r]) 

1242 else: 

1243 if isinstance(self.data[c][rows], (list, tuple, np.ndarray)): 

1244 data.data[-1].extend(self.data[c][rows]) 

1245 else: 

1246 data.data[-1].append(self.data[c][rows]) 

1247 data.nsecs = self.nsecs 

1248 return data 

1249 

1250 def __setitem__(self, key, value): 

1251 """Assign values to data elements specified by slice. 

1252 

1253 Parameters 

1254 ----------- 

1255 key: 

1256 First key specifies row, (optional) second one the column. 

1257 Columns can be specified by index or name, 

1258 see `index()` for details. 

1259 value: TableData, list, ndarray, float, ... 

1260 Value(s) used to assing to the table elements as specified by `key`. 

1261 

1262 Raises 

1263 ------ 

1264 IndexError: 

1265 If an invalid column was specified. 

1266 """ 

1267 rows, cols = self.__setupkey(key) 

1268 if rows is None: 

1269 return 

1270 if isinstance(value, TableData): 

1271 if isinstance(self.data[cols[0]][rows], (list, tuple, np.ndarray)): 

1272 for k, c in enumerate(cols): 

1273 self.data[c][rows] = value.data[k] 

1274 else: 

1275 for k, c in enumerate(cols): 

1276 self.data[c][rows] = value.data[k][0] 

1277 else: 

1278 if len(cols) == 1: 

1279 if isinstance(rows, (list, tuple, np.ndarray)): 

1280 if len(rows) == 1: 

1281 self.data[cols[0]][rows[0]] = value 

1282 elif isinstance(value, (list, tuple, np.ndarray)): 

1283 for k, r in enumerate(rows): 

1284 self.data[cols[0]][r] = value[k] 

1285 else: 

1286 for r in rows: 

1287 self.data[cols[0]][r] = value 

1288 elif isinstance(value, (list, tuple, np.ndarray)): 

1289 self.data[cols[0]][rows] = value 

1290 elif isinstance(rows, (np.integer, int)): 

1291 self.data[cols[0]][rows] = value 

1292 else: 

1293 n = len(self.data[cols[0]][rows]) 

1294 if n > 1: 

1295 self.data[cols[0]][rows] = [value]*n 

1296 else: 

1297 self.data[cols[0]][rows] = value 

1298 else: 

1299 if isinstance(self.data[0][rows], (list, tuple, np.ndarray)): 

1300 for k, c in enumerate(cols): 

1301 self.data[c][rows] = value[:,k] 

1302 elif isinstance(value, (list, tuple, np.ndarray)): 

1303 for k, c in enumerate(cols): 

1304 self.data[c][rows] = value[k] 

1305 else: 

1306 for k, c in enumerate(cols): 

1307 self.data[c][rows] = value 

1308 

1309 def __delitem__(self, key): 

1310 """Delete data elements or whole columns or rows. 

1311 

1312 Parameters 

1313 ----------- 

1314 key: 

1315 First key specifies row, (optional) second one the column. 

1316 Columns can be specified by index or name, 

1317 see `index()` for details. 

1318 If all rows are selected, then the specified columns are removed from the table. 

1319 Otherwise only data values are removed. 

1320 If all columns are selected than entire rows of data values are removed. 

1321 Otherwise only data values in the specified rows are removed. 

1322 

1323 Raises 

1324 ------ 

1325 IndexError: 

1326 If an invalid column was specified. 

1327 """ 

1328 rows, cols = self.__setupkey(key) 

1329 if rows is None: 

1330 return 

1331 row_indices = np.arange(self.rows(), dtype=int)[rows] 

1332 if isinstance(row_indices, np.ndarray): 

1333 if len(row_indices) == self.rows(): 

1334 # delete whole columns: 

1335 self.remove(cols) 

1336 elif len(row_indices) > 0: 

1337 for r in reversed(sorted(row_indices)): 

1338 for c in cols: 

1339 del self.data[c][r] 

1340 self.shape = (self.rows(), self.columns()) 

1341 else: 

1342 for c in cols: 

1343 del self.data[c][row_indices] 

1344 self.shape = (self.rows(), self.columns()) 

1345 

1346 def array(self, row=None): 

1347 """The table data as a ndarray. 

1348 

1349 Parameters 

1350 ---------- 

1351 row: int or None 

1352 If specified, a 1D ndarray of that row will be returned. 

1353 

1354 Returns 

1355 ------- 

1356 data: 2D or 1D ndarray 

1357 If no row is specified, the data content of the entire table 

1358 as a 2D ndarray (rows first). 

1359 If a row is specified, a 1D ndarray of that row. 

1360 """ 

1361 if row is None: 

1362 return np.array(self.data).T 

1363 else: 

1364 return np.array([d[row] for d in self.data]) 

1365 

1366 def data_frame(self): 

1367 """The table data as a pandas DataFrame. 

1368 

1369 Returns 

1370 ------- 

1371 data: pandas.DataFrame 

1372 A pandas DataFrame of the whole table. 

1373 """ 

1374 return pd.DataFrame(self.dict()) 

1375 

1376 def dicts(self, raw_values=True, missing=default_missing_str): 

1377 """The table as a list of dictionaries. 

1378 

1379 Parameters 

1380 ---------- 

1381 raw_values: bool 

1382 If True, use raw table values as values, 

1383 else format the values and add unit string. 

1384 missing: str 

1385 String indicating non-existing data elements. 

1386 

1387 Returns 

1388 ------- 

1389 table: list of dict 

1390 For each row of the table a dictionary with header as key. 

1391 """ 

1392 table = [] 

1393 for row in range(self.rows()): 

1394 data = {} 

1395 for col in range(len(self.header)): 

1396 if raw_values: 

1397 v = self.data[col][row]; 

1398 else: 

1399 if isinstance(self.data[col][row], (float, np.floating)) and m.isnan(self.data[col][row]): 

1400 v = missing 

1401 else: 

1402 u = '' 

1403 if not self.units[col] in '1-' and self.units[col] != 'a.u.': 

1404 u = self.units[col] 

1405 v = (self.formats[col] % self.data[col][row]) + u 

1406 data[self.header[col][0]] = v 

1407 table.append(data) 

1408 return table 

1409 

1410 def dict(self): 

1411 """The table as a dictionary. 

1412 

1413 Returns 

1414 ------- 

1415 table: dict 

1416 A dictionary with keys being the column headers and 

1417 values the list of data elements of the corresponding column. 

1418 """ 

1419 table = {k: v for k, v in self.items()} 

1420 return table 

1421 

1422 def append_data(self, data, column=None): 

1423 """Append data elements to successive columns. 

1424 

1425 The current column is set behid the added columns. 

1426 

1427 Parameters 

1428 ---------- 

1429 data: float, int, str, etc. or list thereof or list of list thereof or dict or list of dict 

1430 Data values to be appended to successive columns: 

1431 - A single value is simply appened to the specified column of the table. 

1432 - A 1D-list of values is appended to successive columns of the table 

1433 starting with the specified column. 

1434 - The columns of a 2D-list of values (second index) are appended 

1435 to successive columns of the table starting with the specified column. 

1436 - Values or list of values of a dictionary are added to the 

1437 columns specified by the keys. Does not affect the current column. 

1438 - The values of dictionaries in a list are appended to the 

1439 columns specified by the keys. Does not affect the current column. 

1440 column: None, int, or str 

1441 The first column to which the data should be appended, 

1442 if `data` does not specify columns. 

1443 If None, append to the current column. 

1444 See self.index() for more information on how to specify a column. 

1445 """ 

1446 column = self.index(column) 

1447 if column is None: 

1448 column = self.setcol 

1449 if isinstance(data, (list, tuple, np.ndarray)): 

1450 if isinstance(data[0], (list, tuple, np.ndarray)): 

1451 # 2D list, rows first: 

1452 for row in data: 

1453 for i, val in enumerate(row): 

1454 self.data[column+i].append(val) 

1455 self.setcol = column + len(data[0]) 

1456 elif isinstance(data[0], dict): 

1457 # list of dictionaries: 

1458 for row in data: 

1459 for key in row: 

1460 column = self.index(k) 

1461 self.data[column].append(data[k]) 

1462 else: 

1463 # 1D list: 

1464 for val in data: 

1465 self.data[column].append(val) 

1466 column += 1 

1467 self.setcol = column 

1468 elif isinstance(data, dict): 

1469 # dictionary with values: 

1470 for key in data: 

1471 column = self.index(key) 

1472 if isinstance(data[key], (list, tuple, np.ndarray)): 

1473 self.data[column].extend(data[key]) 

1474 else: 

1475 self.data[column].append(data[key]) 

1476 else: 

1477 # single value: 

1478 self.data[column].append(data) 

1479 self.setcol = column + 1 

1480 if self.setcol >= len(self.data): 

1481 self.setcol = 0 

1482 self.shape = (self.rows(), self.columns()) 

1483 

1484 def append_data_column(self, data, column=None): 

1485 """Append data elements to a column. 

1486 

1487 The current column is incremented by one. 

1488 

1489 Parameters 

1490 ---------- 

1491 data: float, int, str, etc. or list thereof 

1492 Data values to be appended to a column. 

1493 column: None, int, or str 

1494 The column to which the data should be appended. 

1495 If None, append to the current column. 

1496 See self.index() for more information on how to specify a column. 

1497 """ 

1498 column = self.index(column) 

1499 if column is None: 

1500 column = self.setcol 

1501 if isinstance(data, (list, tuple, np.ndarray)): 

1502 self.data[column].extend(data) 

1503 column += 1 

1504 self.setcol = column 

1505 else: 

1506 self.data[column].append(data) 

1507 self.setcol = column+1 

1508 if self.setcol >= len(self.data): 

1509 self.setcol = 0 

1510 self.shape = (self.rows(), self.columns()) 

1511 

1512 def set_column(self, column): 

1513 """Set the column where to add data. 

1514 

1515 Parameters 

1516 ---------- 

1517 column: int or str 

1518 The column to which data elements should be appended. 

1519 See self.index() for more information on how to specify a column. 

1520 

1521 Raises 

1522 ------ 

1523 IndexError: 

1524 If an invalid column was specified. 

1525 """ 

1526 col = self.index(column) 

1527 if col is None: 

1528 if isinstance(column, (np.integer, int)): 

1529 column = '%d' % column 

1530 raise IndexError('column ' + column + ' not found or invalid') 

1531 self.setcol = col 

1532 return col 

1533 

1534 def fill_data(self): 

1535 """Fill up all columns with missing data to have the same number of 

1536 data elements. 

1537 """ 

1538 # maximum rows: 

1539 maxr = self.rows() 

1540 # fill up: 

1541 for c in range(len(self.data)): 

1542 while len(self.data[c]) < maxr: 

1543 self.data[c].append(np.nan) 

1544 self.setcol = 0 

1545 self.shape = (self.rows(), self.columns()) 

1546 

1547 def clear_data(self): 

1548 """Clear content of the table but keep header. 

1549 """ 

1550 for c in range(len(self.data)): 

1551 self.data[c] = [] 

1552 self.setcol = 0 

1553 self.shape = (self.rows(), self.columns()) 

1554 

1555 def sort(self, columns, reverse=False): 

1556 """Sort the table rows in place. 

1557 

1558 Parameters 

1559 ---------- 

1560 columns: int or str or list of int or str 

1561 A column specifier or a list of column specifiers of the columns 

1562 to be sorted. 

1563 reverse: boolean 

1564 If `True` sort in descending order. 

1565 

1566 Raises 

1567 ------ 

1568 IndexError: 

1569 If an invalid column was specified. 

1570 """ 

1571 # fix columns: 

1572 if not isinstance(columns, (list, tuple, np.ndarray)): 

1573 columns = [ columns ] 

1574 if not columns: 

1575 return 

1576 cols = [] 

1577 for col in columns: 

1578 c = self.index(col) 

1579 if c is None: 

1580 if isinstance(col, (np.integer, int)): 

1581 col = '%d' % col 

1582 raise IndexError('sort column ' + col + ' not found') 

1583 continue 

1584 cols.append(c) 

1585 # get sorted row indices: 

1586 row_inx = range(self.rows()) 

1587 row_inx = sorted(row_inx, key=lambda x : [float('-inf') if self.data[c][x] is np.nan \ 

1588 or self.data[c][x] != self.data[c][x] \ 

1589 else self.data[c][x] for c in cols], reverse=reverse) 

1590 # sort table according to indices: 

1591 for c in range(self.columns()): 

1592 self.data[c] = [self.data[c][r] for r in row_inx] 

1593 

1594 def statistics(self): 

1595 """Descriptive statistics of each column. 

1596 """ 

1597 ds = TableData() 

1598 if self.nsecs > 0: 

1599 ds.append_section('statistics') 

1600 for l in range(1,self.nsecs): 

1601 ds.append_section('-') 

1602 ds.append('-', '-', '%-10s') 

1603 else: 

1604 ds.append('statistics', '-', '%-10s') 

1605 ds.append_data('mean', 0) 

1606 ds.append_data('std', 0) 

1607 ds.append_data('min', 0) 

1608 ds.append_data('quartile1', 0) 

1609 ds.append_data('median', 0) 

1610 ds.append_data('quartile3', 0) 

1611 ds.append_data('max', 0) 

1612 ds.append_data('count', 0) 

1613 dc = 1 

1614 for c in range(self.columns()): 

1615 if len(self.data[c]) > 0 and isinstance(self.data[c][0], (float, int, np.floating, np.integer)): 

1616 ds.hidden.append(False) 

1617 ds.header.append(self.header[c]) 

1618 ds.units.append(self.units[c]) 

1619 # integer data still make floating point statistics: 

1620 if isinstance(self.data[c][0], (float, np.floating)): 

1621 f = self.formats[c] 

1622 i0 = f.find('.') 

1623 if i0 > 0: 

1624 p = int(f[i0+1:-1]) 

1625 if p <= 0: 

1626 f = '%.1f' 

1627 ds.formats.append(f) 

1628 else: 

1629 ds.formats.append('%.1f') 

1630 # remove nans: 

1631 data = np.asarray(self.data[c], float) 

1632 data = data[np.isfinite(data)] 

1633 # compute statistics: 

1634 ds.data.append([]) 

1635 ds.append_data(np.mean(data), dc) 

1636 ds.append_data(np.std(data), dc) 

1637 ds.append_data(np.min(data), dc) 

1638 q1, m, q3 = np.percentile(data, [25., 50., 75.]) 

1639 ds.append_data(q1, dc) 

1640 ds.append_data(m, dc) 

1641 ds.append_data(q3, dc) 

1642 ds.append_data(np.max(data), dc) 

1643 ds.append_data(len(data), dc) 

1644 dc += 1 

1645 ds.nsecs = self.nsecs 

1646 ds.shape = (ds.rows(), ds.columns()) 

1647 return ds 

1648 

1649 def key_value(self, row, col, missing=default_missing_str): 

1650 """A data element returned as a key-value pair. 

1651 

1652 Parameters 

1653 ---------- 

1654 row: int 

1655 Specifies the row from which the data element should be retrieved. 

1656 col: None, int, or str 

1657 A specification of a column. 

1658 See self.index() for more information on how to specify a column. 

1659 missing: str 

1660 String indicating non-existing data elements. 

1661 

1662 Returns 

1663 ------- 

1664 key: str 

1665 Header label of the column 

1666 value: str 

1667 A textual representation of the data element according to the format 

1668 of the column, followed by the unit of the column. 

1669 """ 

1670 col = self.index(col) 

1671 if col is None: 

1672 return '' 

1673 if isinstance(self.data[col][row], (float, np.floating)) and m.isnan(self.data[col][row]): 

1674 v = missing 

1675 else: 

1676 u = '' 

1677 if not self.units[col] in '1-' and self.units[col] != 'a.u.': 

1678 u = self.units[col] 

1679 v = (self.formats[col] % self.data[col][row]) + u 

1680 return self.header[col][0], v 

1681 

1682 def hide(self, column): 

1683 """Hide a column or a range of columns. 

1684 

1685 Hidden columns will not be printed out by the write() function. 

1686 

1687 Parameters 

1688 ---------- 

1689 column: int or str 

1690 The column to be hidden. 

1691 See self.index() for more information on how to specify a column. 

1692 """ 

1693 c0, c1 = self.find_col(column) 

1694 if c0 is not None: 

1695 for c in range(c0, c1): 

1696 self.hidden[c] = True 

1697 

1698 def hide_all(self): 

1699 """Hide all columns. 

1700 

1701 Hidden columns will not be printed out by the write() function. 

1702 """ 

1703 for c in range(len(self.hidden)): 

1704 self.hidden[c] = True 

1705 

1706 def hide_empty_columns(self, missing=default_missing_inputs): 

1707 """Hide all columns that do not contain data. 

1708 

1709 Hidden columns will not be printed out by the write() function. 

1710 

1711 Parameters 

1712 ---------- 

1713 missing: list of str 

1714 Strings indicating missing data. 

1715 """ 

1716 for c in range(len(self.data)): 

1717 # check for empty column: 

1718 isempty = True 

1719 for v in self.data[c]: 

1720 if isinstance(v, (float, np.floating)): 

1721 if not m.isnan(v): 

1722 isempty = False 

1723 break 

1724 else: 

1725 if not v in missing: 

1726 isempty = False 

1727 break 

1728 if isempty: 

1729 self.hidden[c] = True 

1730 

1731 def show(self, column): 

1732 """Show a column or a range of columns. 

1733 

1734 Undoes hiding of a column. 

1735 

1736 Parameters 

1737 ---------- 

1738 column: int or str 

1739 The column to be shown. 

1740 See self.index() for more information on how to specify a column. 

1741 """ 

1742 c0, c1 = self.find_col(column) 

1743 if c0 is not None: 

1744 for c in range(c0, c1): 

1745 self.hidden[c] = False 

1746 

1747 def write(self, fh=sys.stdout, table_format=None, delimiter=None, 

1748 unit_style=None, column_numbers=None, sections=None, 

1749 align_columns=None, shrink_width=True, 

1750 missing=default_missing_str, center_columns=False, 

1751 latex_label_command='', latex_merge_std=False): 

1752 """Write the table to a file or stream. 

1753 

1754 Parameters 

1755 ---------- 

1756 fh: filename or stream 

1757 If not a stream, the file with name `fh` is opened. 

1758 If `fh` does not have an extension, 

1759 the `table_format` is appended as an extension. 

1760 Otherwise `fh` is used as a stream for writing. 

1761 table_format: None or str 

1762 The format to be used for output. 

1763 One of 'out', 'dat', 'ascii', 'csv', 'rtai', 'md', 'tex', 'html'. 

1764 If None or 'auto' then the format is set to the extension of the filename given by `fh`. 

1765 If `fh` is a stream the format is set to 'dat'. 

1766 delimiter: str 

1767 String or character separating columns, if supported by the `table_format`. 

1768 If None or 'auto' use the default for the specified `table_format`. 

1769 unit_style: None or str 

1770 - None or 'auto': use default of the specified `table_format`. 

1771 - 'row': write an extra row to the table header specifying the units of the columns. 

1772 - 'header': add the units to the column headers. 

1773 - 'none': do not specify the units. 

1774 column_numbers: str or None 

1775 Add a row specifying the column index: 

1776 - 'index': indices are integers, first column is 0. 

1777 - 'num': indices are integers, first column is 1. 

1778 - 'aa': use 'a', 'b', 'c', ..., 'z', 'aa', 'ab', ... for indexing 

1779 - 'aa': use 'A', 'B', 'C', ..., 'Z', 'AA', 'AB', ... for indexing 

1780 - None or 'none': do not add a row with column indices 

1781 TableData.column_numbering is a list with the supported styles. 

1782 sections: None or int 

1783 Number of section levels to be printed. 

1784 If `None` or 'auto' use default of selected `table_format`. 

1785 align_columns: boolean 

1786 - `True`: set width of column formats to make them align. 

1787 - `False`: set width of column formats to 0 - no unnecessary spaces. 

1788 - None or 'auto': Use default of the selected `table_format`. 

1789 shrink_width: boolean 

1790 If `True` disregard width specified by the format strings, 

1791 such that columns can become narrower. 

1792 missing: str 

1793 Indicate missing data by this string. 

1794 center_columns: boolean 

1795 If True center all columns (markdown, html, and latex). 

1796 latex_label_command: str 

1797 LaTeX command for formatting header labels. 

1798 E.g. 'textbf' for making the header labels bold. 

1799 latex_merge_std: str 

1800 Merge header of columns with standard deviations with previous column 

1801 (LaTeX tables only). 

1802 

1803 Returns 

1804 ------- 

1805 file_name: str or None 

1806 The full name of the file into which the data were written. 

1807 

1808 Supported file formats 

1809 ---------------------- 

1810  

1811 ## `dat`: data text file 

1812 ``` plain 

1813 # info reaction  

1814 # size weight delay jitter 

1815 # m kg ms mm  

1816 2.34 123 98.7 23 

1817 56.70 3457 54.3 45 

1818 8.90 43 67.9 345 

1819 ``` 

1820 

1821 ## `ascii`: ascii-art table 

1822 ``` plain 

1823 |---------------------------------| 

1824 | info | reaction | 

1825 | size | weight | delay | jitter | 

1826 | m | kg | ms | mm | 

1827 |-------|--------|-------|--------| 

1828 | 2.34 | 123 | 98.7 | 23 | 

1829 | 56.70 | 3457 | 54.3 | 45 | 

1830 | 8.90 | 43 | 67.9 | 345 | 

1831 |---------------------------------| 

1832 ``` 

1833 

1834 ## `csv`: comma separated values 

1835 ``` plain 

1836 size/m,weight/kg,delay/ms,jitter/mm 

1837 2.34,123,98.7,23 

1838 56.70,3457,54.3,45 

1839 8.90,43,67.9,345 

1840 ``` 

1841 

1842 ## `rtai`: rtai-style table 

1843 ``` plain 

1844 RTH| info | reaction  

1845 RTH| size | weight| delay| jitter 

1846 RTH| m | kg | ms | mm  

1847 RTD| 2.34| 123| 98.7| 23 

1848 RTD| 56.70| 3457| 54.3| 45 

1849 RTD| 8.90| 43| 67.9| 345 

1850 ``` 

1851 

1852 ## `md`: markdown 

1853 ``` plain 

1854 | size/m | weight/kg | delay/ms | jitter/mm | 

1855 |------:|-------:|------:|-------:| 

1856 | 2.34 | 123 | 98.7 | 23 | 

1857 | 56.70 | 3457 | 54.3 | 45 | 

1858 | 8.90 | 43 | 67.9 | 345 | 

1859 ``` 

1860 

1861 ## `tex`: latex tabular 

1862 ``` tex 

1863 \\begin{tabular}{rrrr} 

1864 \\hline 

1865 \\multicolumn{2}{l}{info} & \\multicolumn{2}{l}{reaction} \\ 

1866 \\multicolumn{1}{l}{size} & \\multicolumn{1}{l}{weight} & \\multicolumn{1}{l}{delay} & \\multicolumn{1}{l}{jitter} \\ 

1867 \\multicolumn{1}{l}{m} & \\multicolumn{1}{l}{kg} & \\multicolumn{1}{l}{ms} & \\multicolumn{1}{l}{mm} \\ 

1868 \\hline 

1869 2.34 & 123 & 98.7 & 23 \\ 

1870 56.70 & 3457 & 54.3 & 45 \\ 

1871 8.90 & 43 & 67.9 & 345 \\ 

1872 \\hline 

1873 \\end{tabular} 

1874 ``` 

1875 

1876 ## `html`: html 

1877 ``` html 

1878 <table> 

1879 <thead> 

1880 <tr class="header"> 

1881 <th align="left" colspan="2">info</th> 

1882 <th align="left" colspan="2">reaction</th> 

1883 </tr> 

1884 <tr class="header"> 

1885 <th align="left">size</th> 

1886 <th align="left">weight</th> 

1887 <th align="left">delay</th> 

1888 <th align="left">jitter</th> 

1889 </tr> 

1890 <tr class="header"> 

1891 <th align="left">m</th> 

1892 <th align="left">kg</th> 

1893 <th align="left">ms</th> 

1894 <th align="left">mm</th> 

1895 </tr> 

1896 </thead> 

1897 <tbody> 

1898 <tr class"odd"> 

1899 <td align="right">2.34</td> 

1900 <td align="right">123</td> 

1901 <td align="right">98.7</td> 

1902 <td align="right">23</td> 

1903 </tr> 

1904 <tr class"even"> 

1905 <td align="right">56.70</td> 

1906 <td align="right">3457</td> 

1907 <td align="right">54.3</td> 

1908 <td align="right">45</td> 

1909 </tr> 

1910 <tr class"odd"> 

1911 <td align="right">8.90</td> 

1912 <td align="right">43</td> 

1913 <td align="right">67.9</td> 

1914 <td align="right">345</td> 

1915 </tr> 

1916 </tbody> 

1917 </table> 

1918 ``` 

1919 """ 

1920 # fix parameter: 

1921 if table_format == 'auto': 

1922 table_format = None 

1923 if delimiter == 'auto': 

1924 delimiter = None 

1925 if unit_style == 'auto': 

1926 unit_style = None 

1927 if column_numbers == 'none': 

1928 column_numbers = None 

1929 if sections == 'auto': 

1930 sections = None 

1931 if align_columns == 'auto': 

1932 align_columns = None 

1933 # open file: 

1934 own_file = False 

1935 file_name = None 

1936 if not hasattr(fh, 'write'): 

1937 _, ext = os.path.splitext(fh) 

1938 if table_format is None: 

1939 if len(ext) > 1 and ext[1:] in self.ext_formats: 

1940 table_format = self.ext_formats[ext[1:]] 

1941 elif not ext or not ext[1:].lower() in self.ext_formats: 

1942 fh += '.' + self.extensions[table_format] 

1943 file_name = fh 

1944 fh = open(fh, 'w') 

1945 own_file = True 

1946 if table_format is None: 

1947 table_format = 'dat' 

1948 # set style:  

1949 if table_format[0] == 'd': 

1950 align_columns = True 

1951 begin_str = '' 

1952 end_str = '' 

1953 header_start = '# ' 

1954 header_sep = ' ' 

1955 header_close = '' 

1956 header_end = '\n' 

1957 data_start = ' ' 

1958 data_sep = ' ' 

1959 data_close = '' 

1960 data_end = '\n' 

1961 top_line = False 

1962 header_line = False 

1963 bottom_line = False 

1964 if delimiter is not None: 

1965 header_sep = delimiter 

1966 data_sep = delimiter 

1967 if sections is None: 

1968 sections = 1000 

1969 elif table_format[0] == 'a': 

1970 align_columns = True 

1971 begin_str = '' 

1972 end_str = '' 

1973 header_start = '| ' 

1974 header_sep = ' | ' 

1975 header_close = '' 

1976 header_end = ' |\n' 

1977 data_start = '| ' 

1978 data_sep = ' | ' 

1979 data_close = '' 

1980 data_end = ' |\n' 

1981 top_line = True 

1982 header_line = True 

1983 bottom_line = True 

1984 if delimiter is not None: 

1985 header_sep = delimiter 

1986 data_sep = delimiter 

1987 if sections is None: 

1988 sections = 1000 

1989 elif table_format[0] == 'c': 

1990 # csv according to http://www.ietf.org/rfc/rfc4180.txt : 

1991 column_numbers=None 

1992 if unit_style is None: 

1993 unit_style = 'header' 

1994 if align_columns is None: 

1995 align_columns = False 

1996 begin_str = '' 

1997 end_str = '' 

1998 header_start='' 

1999 header_sep = ',' 

2000 header_close = '' 

2001 header_end='\n' 

2002 data_start='' 

2003 data_sep = ',' 

2004 data_close = '' 

2005 data_end='\n' 

2006 top_line = False 

2007 header_line = False 

2008 bottom_line = False 

2009 if delimiter is not None: 

2010 header_sep = delimiter 

2011 data_sep = delimiter 

2012 if sections is None: 

2013 sections = 0 

2014 elif table_format[0] == 'r': 

2015 align_columns = True 

2016 begin_str = '' 

2017 end_str = '' 

2018 header_start = 'RTH| ' 

2019 header_sep = '| ' 

2020 header_close = '' 

2021 header_end = '\n' 

2022 data_start = 'RTD| ' 

2023 data_sep = '| ' 

2024 data_close = '' 

2025 data_end = '\n' 

2026 top_line = False 

2027 header_line = False 

2028 bottom_line = False 

2029 if sections is None: 

2030 sections = 1000 

2031 elif table_format[0] == 'm': 

2032 if unit_style is None or unit_style == 'row': 

2033 unit_style = 'header' 

2034 align_columns = True 

2035 begin_str = '' 

2036 end_str = '' 

2037 header_start='| ' 

2038 header_sep = ' | ' 

2039 header_close = '' 

2040 header_end=' |\n' 

2041 data_start='| ' 

2042 data_sep = ' | ' 

2043 data_close = '' 

2044 data_end=' |\n' 

2045 top_line = False 

2046 header_line = True 

2047 bottom_line = False 

2048 if sections is None: 

2049 sections = 0 

2050 elif table_format[0] == 'h': 

2051 align_columns = False 

2052 begin_str = '<table>\n<thead>\n' 

2053 end_str = '</tbody>\n</table>\n' 

2054 if center_columns: 

2055 header_start=' <tr>\n <th align="center"' 

2056 header_sep = '</th>\n <th align="center"' 

2057 else: 

2058 header_start=' <tr>\n <th align="left"' 

2059 header_sep = '</th>\n <th align="left"' 

2060 header_close = '>' 

2061 header_end='</th>\n </tr>\n' 

2062 data_start=' <tr>\n <td' 

2063 data_sep = '</td>\n <td' 

2064 data_close = '>' 

2065 data_end='</td>\n </tr>\n' 

2066 top_line = False 

2067 header_line = False 

2068 bottom_line = False 

2069 if sections is None: 

2070 sections = 1000 

2071 elif table_format[0] == 't': 

2072 if align_columns is None: 

2073 align_columns = False 

2074 begin_str = '\\begin{tabular}' 

2075 end_str = '\\end{tabular}\n' 

2076 header_start=' ' 

2077 header_sep = ' & ' 

2078 header_close = '' 

2079 header_end=' \\\\\n' 

2080 data_start=' ' 

2081 data_sep = ' & ' 

2082 data_close = '' 

2083 data_end=' \\\\\n' 

2084 top_line = True 

2085 header_line = True 

2086 bottom_line = True 

2087 if sections is None: 

2088 sections = 1000 

2089 else: 

2090 if align_columns is None: 

2091 align_columns = True 

2092 begin_str = '' 

2093 end_str = '' 

2094 header_start = '' 

2095 header_sep = ' ' 

2096 header_close = '' 

2097 header_end = '\n' 

2098 data_start = '' 

2099 data_sep = ' ' 

2100 data_close = '' 

2101 data_end = '\n' 

2102 top_line = False 

2103 header_line = False 

2104 bottom_line = False 

2105 if sections is None: 

2106 sections = 1000 

2107 # check units: 

2108 if unit_style is None: 

2109 unit_style = 'row' 

2110 have_units = False 

2111 for u in self.units: 

2112 if u and u != '1' and u != '-': 

2113 have_units = True 

2114 break 

2115 if not have_units: 

2116 unit_style = 'none' 

2117 # find std columns: 

2118 stdev_col = np.zeros(len(self.header), dtype=bool) 

2119 for c in range(len(self.header)-1): 

2120 if self.header[c+1][0].lower() in ['sd', 'std', 's.d.', 'stdev'] and \ 

2121 not self.hidden[c+1]: 

2122 stdev_col[c] = True 

2123 # begin table: 

2124 fh.write(begin_str) 

2125 if table_format[0] == 't': 

2126 fh.write('{') 

2127 merged = False 

2128 for h, f, s in zip(self.hidden, self.formats, stdev_col): 

2129 if merged: 

2130 fh.write('l') 

2131 merged = False 

2132 continue 

2133 if h: 

2134 continue 

2135 if latex_merge_std and s: 

2136 fh.write('r@{$\\,\\pm\\,$}') 

2137 merged = True 

2138 elif center_columns: 

2139 fh.write('c') 

2140 elif f[1] == '-': 

2141 fh.write('l') 

2142 else: 

2143 fh.write('r') 

2144 fh.write('}\n') 

2145 # retrieve column formats and widths: 

2146 widths = [] 

2147 widths_pos = [] 

2148 for c, f in enumerate(self.formats): 

2149 w = 0 

2150 # position of width specification: 

2151 i0 = 1 

2152 if len(f) > 1 and f[1] == '-' : 

2153 i0 = 2 

2154 i1 = f.find('.') 

2155 if not shrink_width: 

2156 if f[i0:i1]: 

2157 w = int(f[i0:i1]) 

2158 widths_pos.append((i0, i1)) 

2159 # adapt width to header label: 

2160 hw = len(self.header[c][0]) 

2161 if unit_style == 'header' and self.units[c] and\ 

2162 self.units[c] != '1' and self.units[c] != '-': 

2163 hw += 1 + len(self.units[c]) 

2164 if w < hw: 

2165 w = hw 

2166 # adapt width to data: 

2167 if f[-1] == 's': 

2168 for v in self.data[c]: 

2169 if not isinstance(v, (float, np.floating)) and w < len(v): 

2170 w = len(v) 

2171 else: 

2172 fs = f[:i0] + str(0) + f[i1:] 

2173 for v in self.data[c]: 

2174 if isinstance(v, (float, np.floating)) and m.isnan(v): 

2175 s = missing 

2176 else: 

2177 try: 

2178 s = fs % v 

2179 except ValueError: 

2180 s = missing 

2181 except TypeError: 

2182 s = str(v) 

2183 if w < len(s): 

2184 w = len(s) 

2185 widths.append(w) 

2186 # adapt width to sections: 

2187 sec_indices = [0] * self.nsecs 

2188 sec_widths = [0] * self.nsecs 

2189 sec_columns = [0] * self.nsecs 

2190 for c in range(len(self.header)): 

2191 w = widths[c] 

2192 for l in range(min(self.nsecs, sections)): 

2193 if 1+l < len(self.header[c]): 

2194 if c > 0 and sec_columns[l] > 0 and \ 

2195 1+l < len(self.header[sec_indices[l]]) and \ 

2196 len(self.header[sec_indices[l]][1+l]) > sec_widths[l]: 

2197 dw = len(self.header[sec_indices[l]][1+l]) - sec_widths[l] 

2198 nc = sec_columns[l] 

2199 ddw = np.zeros(nc, dtype=int) + dw // nc 

2200 ddw[:dw % nc] += 1 

2201 wk = 0 

2202 for ck in range(sec_indices[l], c): 

2203 if not self.hidden[ck]: 

2204 widths[ck] += ddw[wk] 

2205 wk += 1 

2206 sec_widths[l] = 0 

2207 sec_indices[l] = c 

2208 if not self.hidden[c]: 

2209 if sec_widths[l] > 0: 

2210 sec_widths[l] += len(header_sep) 

2211 sec_widths[l] += w 

2212 sec_columns[l] += 1 

2213 # set width of format string: 

2214 formats = [] 

2215 for c, (f, w) in enumerate(zip(self.formats, widths)): 

2216 formats.append(f[:widths_pos[c][0]] + str(w) + f[widths_pos[c][1]:]) 

2217 # top line: 

2218 if top_line: 

2219 if table_format[0] == 't': 

2220 fh.write(' \\hline \\\\[-2ex]\n') 

2221 else: 

2222 first = True 

2223 fh.write(header_start.replace(' ', '-')) 

2224 for c in range(len(self.header)): 

2225 if self.hidden[c]: 

2226 continue 

2227 if not first: 

2228 fh.write('-'*len(header_sep)) 

2229 first = False 

2230 fh.write(header_close) 

2231 w = widths[c] 

2232 fh.write(w*'-') 

2233 fh.write(header_end.replace(' ', '-')) 

2234 # section and column headers: 

2235 nsec0 = self.nsecs-sections 

2236 if nsec0 < 0: 

2237 nsec0 = 0 

2238 for ns in range(nsec0, self.nsecs+1): 

2239 nsec = self.nsecs-ns 

2240 first = True 

2241 last = False 

2242 merged = False 

2243 fh.write(header_start) 

2244 for c in range(len(self.header)): 

2245 if nsec < len(self.header[c]): 

2246 # section width and column count: 

2247 sw = -len(header_sep) 

2248 columns = 0 

2249 if not self.hidden[c]: 

2250 sw = widths[c] 

2251 columns = 1 

2252 for k in range(c+1, len(self.header)): 

2253 if nsec < len(self.header[k]): 

2254 break 

2255 if self.hidden[k]: 

2256 continue 

2257 sw += len(header_sep) + widths[k] 

2258 columns += 1 

2259 else: 

2260 last = True 

2261 if len(header_end.strip()) == 0: 

2262 sw = 0 # last entry needs no width 

2263 if columns == 0: 

2264 continue 

2265 if not first and not merged: 

2266 fh.write(header_sep) 

2267 first = False 

2268 if table_format[0] == 'c': 

2269 sw -= len(header_sep)*(columns-1) 

2270 elif table_format[0] == 'h': 

2271 if columns>1: 

2272 fh.write(' colspan="%d"' % columns) 

2273 elif table_format[0] == 't': 

2274 if merged: 

2275 merged = False 

2276 continue 

2277 if latex_merge_std and nsec == 0 and stdev_col[c]: 

2278 merged = True 

2279 fh.write('\\multicolumn{%d}{c}{' % (columns+1)) 

2280 elif center_columns: 

2281 fh.write('\\multicolumn{%d}{c}{' % columns) 

2282 else: 

2283 fh.write('\\multicolumn{%d}{l}{' % columns) 

2284 if latex_label_command: 

2285 fh.write('\\%s{' % latex_label_command) 

2286 fh.write(header_close) 

2287 hs = self.header[c][nsec] 

2288 if nsec == 0 and unit_style == 'header': 

2289 if self.units[c] and self.units[c] != '1' and self.units[c] != '-': 

2290 hs += '/' + self.units[c] 

2291 if align_columns and not table_format[0] in 'th': 

2292 f = '%%-%ds' % sw 

2293 fh.write(f % hs) 

2294 else: 

2295 fh.write(hs) 

2296 if table_format[0] == 'c': 

2297 if not last: 

2298 fh.write(header_sep*(columns-1)) 

2299 elif table_format[0] == 't': 

2300 if latex_label_command: 

2301 fh.write('}') 

2302 fh.write('}') 

2303 fh.write(header_end) 

2304 # units: 

2305 if unit_style == 'row': 

2306 first = True 

2307 merged = False 

2308 fh.write(header_start) 

2309 for c in range(len(self.header)): 

2310 if self.hidden[c] or merged: 

2311 merged = False 

2312 continue 

2313 if not first: 

2314 fh.write(header_sep) 

2315 first = False 

2316 fh.write(header_close) 

2317 unit = self.units[c] 

2318 if not unit: 

2319 unit = '-' 

2320 if table_format[0] == 't': 

2321 if latex_merge_std and stdev_col[c]: 

2322 merged = True 

2323 fh.write('\\multicolumn{2}{c}{%s}' % latex_unit(unit)) 

2324 elif center_columns: 

2325 fh.write('\\multicolumn{1}{c}{%s}' % latex_unit(unit)) 

2326 else: 

2327 fh.write('\\multicolumn{1}{l}{%s}' % latex_unit(unit)) 

2328 else: 

2329 if align_columns and not table_format[0] in 'h': 

2330 f = '%%-%ds' % widths[c] 

2331 fh.write(f % unit) 

2332 else: 

2333 fh.write(unit) 

2334 fh.write(header_end) 

2335 # column numbers: 

2336 if column_numbers is not None: 

2337 first = True 

2338 fh.write(header_start) 

2339 for c in range(len(self.header)): 

2340 if self.hidden[c]: 

2341 continue 

2342 if not first: 

2343 fh.write(header_sep) 

2344 first = False 

2345 fh.write(header_close) 

2346 i = c 

2347 if column_numbers == 'num': 

2348 i = c+1 

2349 aa = index2aa(c, 'a') 

2350 if column_numbers == 'AA': 

2351 aa = index2aa(c, 'A') 

2352 if table_format[0] == 't': 

2353 if column_numbers == 'num' or column_numbers == 'index': 

2354 fh.write('\\multicolumn{1}{l}{%d}' % i) 

2355 else: 

2356 fh.write('\\multicolumn{1}{l}{%s}' % aa) 

2357 else: 

2358 if column_numbers == 'num' or column_numbers == 'index': 

2359 if align_columns: 

2360 f = '%%%dd' % widths[c] 

2361 fh.write(f % i) 

2362 else: 

2363 fh.write('%d' % i) 

2364 else: 

2365 if align_columns: 

2366 f = '%%-%ds' % widths[c] 

2367 fh.write(f % aa) 

2368 else: 

2369 fh.write(aa) 

2370 fh.write(header_end) 

2371 # header line: 

2372 if header_line: 

2373 if table_format[0] == 'm': 

2374 fh.write('|') 

2375 for c in range(len(self.header)): 

2376 if self.hidden[c]: 

2377 continue 

2378 w = widths[c]+2 

2379 if center_columns: 

2380 fh.write(':' + (w-2)*'-' + ':|') 

2381 elif formats[c][1] == '-': 

2382 fh.write(w*'-' + '|') 

2383 else: 

2384 fh.write((w-1)*'-' + ':|') 

2385 fh.write('\n') 

2386 elif table_format[0] == 't': 

2387 fh.write(' \\hline \\\\[-2ex]\n') 

2388 else: 

2389 first = True 

2390 fh.write(header_start.replace(' ', '-')) 

2391 for c in range(len(self.header)): 

2392 if self.hidden[c]: 

2393 continue 

2394 if not first: 

2395 fh.write(header_sep.replace(' ', '-')) 

2396 first = False 

2397 fh.write(header_close) 

2398 w = widths[c] 

2399 fh.write(w*'-') 

2400 fh.write(header_end.replace(' ', '-')) 

2401 # start table data: 

2402 if table_format[0] == 'h': 

2403 fh.write('</thead>\n<tbody>\n') 

2404 # data: 

2405 for k in range(self.rows()): 

2406 first = True 

2407 merged = False 

2408 fh.write(data_start) 

2409 for c, f in enumerate(formats): 

2410 if self.hidden[c] or merged: 

2411 merged = False 

2412 continue 

2413 if not first: 

2414 fh.write(data_sep) 

2415 first = False 

2416 if table_format[0] == 'h': 

2417 if center_columns: 

2418 fh.write(' align="center"') 

2419 elif f[1] == '-': 

2420 fh.write(' align="left"') 

2421 else: 

2422 fh.write(' align="right"') 

2423 fh.write(data_close) 

2424 if k >= len(self.data[c]) or \ 

2425 (isinstance(self.data[c][k], (float, np.floating)) and m.isnan(self.data[c][k])): 

2426 # missing data: 

2427 if table_format[0] == 't' and latex_merge_std and stdev_col[c]: 

2428 merged = True 

2429 fh.write('\\multicolumn{2}{c}{%s}' % missing) 

2430 elif align_columns: 

2431 if f[1] == '-': 

2432 fn = '%%-%ds' % widths[c] 

2433 else: 

2434 fn = '%%%ds' % widths[c] 

2435 fh.write(fn % missing) 

2436 else: 

2437 fh.write(missing) 

2438 else: 

2439 # data value: 

2440 try: 

2441 ds = f % self.data[c][k] 

2442 except ValueError: 

2443 ds = missing 

2444 except TypeError: 

2445 ds = str(self.data[c][k]) 

2446 if not align_columns: 

2447 ds = ds.strip() 

2448 fh.write(ds) 

2449 fh.write(data_end) 

2450 # bottom line: 

2451 if bottom_line: 

2452 if table_format[0] == 't': 

2453 fh.write(' \\hline\n') 

2454 else: 

2455 first = True 

2456 fh.write(header_start.replace(' ', '-')) 

2457 for c in range(len(self.header)): 

2458 if self.hidden[c]: 

2459 continue 

2460 if not first: 

2461 fh.write('-'*len(header_sep)) 

2462 first = False 

2463 fh.write(header_close) 

2464 w = widths[c] 

2465 fh.write(w*'-') 

2466 fh.write(header_end.replace(' ', '-')) 

2467 # end table: 

2468 fh.write(end_str) 

2469 # close file: 

2470 if own_file: 

2471 fh.close() 

2472 # return file name: 

2473 return file_name 

2474 

2475 

2476 def write_file_stream(self, basename, file_name, **kwargs): 

2477 """Write table to file or stream and return appropriate file name. 

2478 

2479 Parameters 

2480 ---------- 

2481 basename: str or stream 

2482 If str, path and basename of file. 

2483 `file_name` and an extension are appended. 

2484 If stream, write table data into this stream. 

2485 file_name: str 

2486 Name of file that is appended to a base path or `basename`. 

2487 kwargs: 

2488 Arguments passed on to `TableData.write()`. 

2489 In particular, 'table_format' is used to the set the file extension 

2490 that is appended to the returned `file_name`. 

2491 

2492 Returns 

2493 ------- 

2494 file_name: str 

2495 Path and full name of the written file in case of `basename` 

2496 being a string. Otherwise, the file name and extension that 

2497 should be appended to a base path. 

2498 """ 

2499 if hasattr(basename, 'write'): 

2500 table_format = kwargs.get('table_format', None) 

2501 if table_format is None or table_format == 'auto': 

2502 table_format = 'csv' 

2503 file_name += '.' + TableData.extensions[table_format] 

2504 self.write(basename, **kwargs) 

2505 return file_name 

2506 else: 

2507 file_name = self.write(basename + file_name, **kwargs) 

2508 return file_name 

2509 

2510 

2511 def __str__(self): 

2512 """Write table to a string. 

2513 """ 

2514 stream = StringIO() 

2515 self.write(stream, table_format='out') 

2516 return stream.getvalue() 

2517 

2518 

2519 def load(self, fh, missing=default_missing_inputs, stop=None): 

2520 """Load table from file or stream. 

2521 

2522 File type and properties are automatically inferred. 

2523 

2524 Parameters 

2525 ---------- 

2526 fh: str or stream 

2527 If not a stream, the file with name `fh` is opened for reading. 

2528 missing: str or list of str 

2529 Missing data are indicated by this string and 

2530 are translated to np.nan. 

2531 stop: str or None 

2532 If the beginning of a line matches `stop`, then stop reading the file. 

2533 

2534 Raises 

2535 ------ 

2536 FileNotFoundError: 

2537 If `fh` is a path that does not exist. 

2538 """ 

2539 

2540 def read_key_line(line, sep, table_format): 

2541 if sep is None: 

2542 cols, indices = zip(*[(m.group(0), m.start()) for m in re.finditer(r'( ?[\S]+)+(?=[ ][ ]+|\Z)', line.strip())]) 

2543 elif table_format == 'csv': 

2544 cols, indices = zip(*[(c.strip(), i) for i, c in enumerate(line.strip().split(sep)) if c.strip()]) 

2545 return cols, indices 

2546 else: 

2547 seps = r'[^'+re.escape(sep)+']+' 

2548 cols, indices = zip(*[(m.group(0), m.start()) for m in re.finditer(seps, line.strip())]) 

2549 colss = [] 

2550 indicess = [] 

2551 if table_format == 'tex': 

2552 i = 0 

2553 for c in cols: 

2554 if 'multicolumn' in c: 

2555 fields = c.split('{') 

2556 n = int(fields[1].strip().rstrip('}').rstrip()) 

2557 colss.append(fields[3].strip().rstrip('}').rstrip()) 

2558 indicess.append(i) 

2559 i += n 

2560 else: 

2561 colss.append(c.strip()) 

2562 indicess.append(i) 

2563 i += 1 

2564 else: 

2565 for k, (c, i) in enumerate(zip(cols, indices)): 

2566 if k == 0: 

2567 c = c.lstrip('|') 

2568 if k == len(cols)-1: 

2569 c = c.rstrip('|') 

2570 cs = c.strip() 

2571 colss.append(cs) 

2572 indicess.append(i) 

2573 return colss, indicess 

2574 

2575 def read_data_line(line, sep, post, precd, alld, numc, exped, 

2576 fixed, strf, missing, nans): 

2577 # read line: 

2578 cols = [] 

2579 if sep is None: 

2580 cols = [m.group(0) for m in re.finditer(r'\S+', line.strip())] 

2581 else: 

2582 if sep.isspace(): 

2583 seps = r'[^'+re.escape(sep)+']+' 

2584 cols = [m.group(0) for m in re.finditer(seps, line.strip())] 

2585 else: 

2586 cols = line.split(sep) 

2587 if len(cols) > 0 and len(cols[0]) == 0: 

2588 cols = cols[1:] 

2589 if len(cols) > 0 and len(cols[-1]) == 0: 

2590 cols = cols[:-1] 

2591 if len(cols) > 0: 

2592 cols[0] = cols[0].lstrip('|').lstrip() 

2593 cols[-1] = cols[-1].rstrip('|').rstrip() 

2594 cols = [c.strip() for c in cols if c != '|'] 

2595 # read columns: 

2596 for k, c in enumerate(cols): 

2597 try: 

2598 v = float(c) 

2599 ad = 0 

2600 ve = c.split('e') 

2601 if len(ve) <= 1: 

2602 exped[k] = False 

2603 else: 

2604 ad = len(ve[1])+1 

2605 vc = ve[0].split('.') 

2606 ad += len(vc[0]) 

2607 prec = len(vc[0].lstrip('-').lstrip('+').lstrip('0')) 

2608 if len(vc) == 2: 

2609 if numc[k] and post[k] != len(vc[1]): 

2610 fixed[k] = False 

2611 if post[k] < len(vc[1]): 

2612 post[k] = len(vc[1]) 

2613 ad += len(vc[1])+1 

2614 prec += len(vc[1].rstrip('0')) 

2615 if precd[k] < prec: 

2616 precd[k] = prec 

2617 if alld[k] < ad: 

2618 alld[k] = ad 

2619 numc[k] = True 

2620 except ValueError: 

2621 if c in missing: 

2622 v = np.nan 

2623 nans[k] = c 

2624 else: 

2625 strf[k] = True 

2626 if alld[k] < len(c): 

2627 alld[k] = len(c) 

2628 v = c 

2629 self.append_data(v, k) 

2630 

2631 # initialize: 

2632 if isinstance(missing, str): 

2633 missing = [missing] 

2634 self.data = [] 

2635 self.shape = (0, 0) 

2636 self.header = [] 

2637 self.nsecs = 0 

2638 self.units = [] 

2639 self.formats = [] 

2640 self.hidden = [] 

2641 self.setcol = 0 

2642 self.addcol = 0 

2643 # open file: 

2644 own_file = False 

2645 if not hasattr(fh, 'readline'): 

2646 fh = open(fh, 'r') 

2647 own_file = True 

2648 # read inital lines of file: 

2649 key = [] 

2650 data = [] 

2651 target = data 

2652 comment = False 

2653 table_format='dat' 

2654 for line in fh: 

2655 line = line.rstrip() 

2656 if line == stop: 

2657 break; 

2658 if line: 

2659 if r'\begin{tabular' in line: 

2660 table_format='tex' 

2661 target = key 

2662 continue 

2663 if table_format == 'tex': 

2664 if r'\end{tabular' in line: 

2665 break 

2666 if r'\hline' in line: 

2667 if key: 

2668 target = data 

2669 continue 

2670 line = line.rstrip(r'\\') 

2671 if line[0] == '#': 

2672 comment = True 

2673 table_format='dat' 

2674 target = key 

2675 line = line.lstrip('#') 

2676 elif comment: 

2677 target = data 

2678 if line[0:3] == 'RTH': 

2679 target = key 

2680 line = line[3:] 

2681 table_format='rtai' 

2682 elif line[0:3] == 'RTD': 

2683 target = data 

2684 line = line[3:] 

2685 table_format='rtai' 

2686 if (line[0:3] == '|--' or line[0:3] == '|:-') and \ 

2687 (line[-3:] == '--|' or line[-3:] == '-:|'): 

2688 if not data and not key: 

2689 table_format='ascii' 

2690 target = key 

2691 continue 

2692 elif not key: 

2693 table_format='md' 

2694 key = data 

2695 data = [] 

2696 target = data 

2697 continue 

2698 elif not data: 

2699 target = data 

2700 continue 

2701 else: 

2702 break 

2703 target.append(line) 

2704 else: 

2705 break 

2706 if len(data) > 5: 

2707 break 

2708 # find column separator of data and number of columns: 

2709 col_seps = ['|', ',', ';', ':', '\t', '&', None] 

2710 colstd = np.zeros(len(col_seps)) 

2711 colnum = np.zeros(len(col_seps), dtype=int) 

2712 for k, sep in enumerate(col_seps): 

2713 cols = [] 

2714 s = 5 if len(data) >= 8 else len(data) - 3 

2715 if s < 0 or key: 

2716 s = 0 

2717 for line in data[s:]: 

2718 cs = line.strip().split(sep) 

2719 if not cs[0]: 

2720 cs = cs[1:] 

2721 if cs and not cs[-1]: 

2722 cs = cs[:-1] 

2723 cols.append(len(cs)) 

2724 colstd[k] = np.std(cols) 

2725 colnum[k] = np.median(cols) 

2726 if np.max(colnum) < 2: 

2727 sep = None 

2728 colnum = 1 

2729 else: 

2730 ci = np.where(np.array(colnum)>1.5)[0] 

2731 ci = ci[np.argmin(colstd[ci])] 

2732 sep = col_seps[ci] 

2733 colnum = int(colnum[ci]) 

2734 # fix key: 

2735 if not key and sep is not None and sep in ',;:\t|': 

2736 table_format = 'csv' 

2737 # read key: 

2738 key_cols = [] 

2739 key_indices = [] 

2740 for line in key: 

2741 cols, indices = read_key_line(line, sep, table_format) 

2742 key_cols.append(cols) 

2743 key_indices.append(indices) 

2744 if not key_cols: 

2745 # no obviously marked table key: 

2746 key_num = 0 

2747 for line in data: 

2748 cols, indices = read_key_line(line, sep, table_format) 

2749 numbers = 0 

2750 for c in cols: 

2751 try: 

2752 v = float(c) 

2753 numbers += 1 

2754 except ValueError: 

2755 pass 

2756 if numbers == 0: 

2757 key_cols.append(cols) 

2758 key_indices.append(indices) 

2759 key_num += 1 

2760 else: 

2761 break 

2762 data = data[key_num:] 

2763 kr = len(key_cols)-1 

2764 # check for key with column indices: 

2765 if kr >= 0: 

2766 cols = key_cols[kr] 

2767 numrow = True 

2768 try: 

2769 pv = int(cols[0]) 

2770 for c in cols[1:]: 

2771 v = int(c) 

2772 if v != pv+1: 

2773 numrow = False 

2774 break 

2775 pv = v 

2776 except ValueError: 

2777 try: 

2778 pv = aa2index(cols[0]) 

2779 for c in cols[1:]: 

2780 v = aa2index(c) 

2781 if v != pv+1: 

2782 numrow = False 

2783 break 

2784 pv = v 

2785 except ValueError: 

2786 numrow = False 

2787 if numrow: 

2788 kr -= 1 

2789 # check for unit line: 

2790 units = None 

2791 if kr > 0 and len(key_cols[kr]) == len(key_cols[kr-1]): 

2792 units = key_cols[kr] 

2793 kr -= 1 

2794 # column labels: 

2795 if kr >= 0: 

2796 if units is None: 

2797 # units may be part of the label: 

2798 labels = [] 

2799 units = [] 

2800 for c in key_cols[kr]: 

2801 if c[-1] == ')': 

2802 lu = c[:-1].split('(') 

2803 if len(lu) >= 2: 

2804 labels.append(lu[0].strip()) 

2805 units.append('('.join(lu[1:]).strip()) 

2806 continue 

2807 lu = c.split('/') 

2808 if len(lu) >= 2: 

2809 labels.append(lu[0].strip()) 

2810 units.append('/'.join(lu[1:]).strip()) 

2811 else: 

2812 labels.append(c) 

2813 units.append('') 

2814 else: 

2815 labels = key_cols[kr] 

2816 indices = key_indices[kr] 

2817 # init table columns: 

2818 for k in range(colnum): 

2819 self.append(labels[k], units[k], '%g') 

2820 # read in sections: 

2821 while kr > 0: 

2822 kr -= 1 

2823 for sec_label, sec_inx in zip(key_cols[kr], key_indices[kr]): 

2824 col_inx = indices.index(sec_inx) 

2825 self.header[col_inx].append(sec_label) 

2826 if self.nsecs < len(self.header[col_inx])-1: 

2827 self.nsecs = len(self.header[col_inx])-1 

2828 # read data: 

2829 post = np.zeros(colnum) 

2830 precd = np.zeros(colnum) 

2831 alld = np.zeros(colnum) 

2832 numc = [False] * colnum 

2833 exped = [True] * colnum 

2834 fixed = [True] * colnum 

2835 strf = [False] * colnum 

2836 nans = [None] * colnum 

2837 for line in data: 

2838 read_data_line(line, sep, post, precd, alld, numc, exped, fixed, 

2839 strf, missing, nans) 

2840 # read remaining data: 

2841 for line in fh: 

2842 line = line.rstrip() 

2843 if line == stop: 

2844 break; 

2845 if table_format == 'tex': 

2846 if r'\end{tabular' in line or r'\hline' in line: 

2847 break 

2848 line = line.rstrip(r'\\') 

2849 if (line[0:3] == '|--' or line[0:3] == '|:-') and \ 

2850 (line[-3:] == '--|' or line[-3:] == '-:|'): 

2851 break 

2852 if line[0:3] == 'RTD': 

2853 line = line[3:] 

2854 read_data_line(line, sep, post, precd, alld, numc, exped, fixed, 

2855 strf, missing, nans) 

2856 # set formats: 

2857 for k in range(len(alld)): 

2858 if strf[k]: 

2859 self.set_format('%%-%ds' % alld[k], k) 

2860 # make sure all elements are strings: 

2861 for i in range(len(self.data[k])): 

2862 if self.data[k][i] is np.nan: 

2863 self.data[k][i] = nans[k] 

2864 else: 

2865 self.data[k][i] = str(self.data[k][i]) 

2866 elif exped[k]: 

2867 self.set_format('%%%d.%de' % (alld[k], post[k]), k) 

2868 elif fixed[k]: 

2869 self.set_format('%%%d.%df' % (alld[k], post[k]), k) 

2870 else: 

2871 self.set_format('%%%d.%dg' % (alld[k], precd[k]), k) 

2872 # close file: 

2873 if own_file: 

2874 fh.close() 

2875 

2876 

2877def write(fh, data, header, units=None, formats=None, 

2878 table_format=None, delimiter=None, unit_style=None, 

2879 column_numbers=None, sections=None, align_columns=None, 

2880 shrink_width=True, missing=default_missing_str, 

2881 center_columns=False, latex_label_command='', 

2882 latex_merge_std=False): 

2883 """Construct table and write to file. 

2884 

2885 Parameters 

2886 ---------- 

2887 fh: filename or stream 

2888 If not a stream, the file with name `fh` is opened. 

2889 If `fh` does not have an extension, 

2890 the `table_format` is appended as an extension. 

2891 Otherwise `fh` is used as a stream for writing. 

2892 data: 1-D or 2-D ndarray of data 

2893 The data of the table. 

2894 header: list of str 

2895 Header labels for each column. 

2896 units: list of str, optional 

2897 Unit strings for each column. 

2898 formats: str or list of str, optional 

2899 Format strings for each column. If only a single format string is 

2900 given, then all columns are initialized with this format string. 

2901 

2902 See `TableData.write()` for a description of all other parameters. 

2903 

2904 Example 

2905 ------- 

2906 ``` 

2907 write(sys.stdout, np.random.randn(4,3), ['aaa', 'bbb', 'ccc'], units=['m', 's', 'g'], formats='%.2f') 

2908 ``` 

2909 """ 

2910 td = TableData(data, header, units, formats) 

2911 td.write(fh, table_format=table_format, unit_style=unit_style, 

2912 column_numbers=column_numbers, missing=missing, 

2913 shrink_width=shrink_width, delimiter=delimiter, 

2914 align_columns=align_columns, sections=sections, 

2915 latex_label_command=latex_label_command, 

2916 latex_merge_std=latex_merge_std) 

2917 

2918 

2919def add_write_table_config(cfg, table_format=None, delimiter=None, 

2920 unit_style=None, column_numbers=None, 

2921 sections=None, align_columns=None, 

2922 shrink_width=True, missing='-', 

2923 center_columns=False, 

2924 latex_label_command='', 

2925 latex_merge_std=False): 

2926 """Add parameter specifying how to write a table to a file as a new 

2927section to a configuration. 

2928 

2929 Parameters 

2930 ---------- 

2931 cfg: ConfigFile 

2932 The configuration. 

2933 """ 

2934 

2935 cfg.add_section('File format for storing analysis results:') 

2936 cfg.add('fileFormat', table_format or 'auto', '', 'Default file format used to store analysis results.\nOne of %s.' % ', '.join(TableData.formats)) 

2937 cfg.add('fileDelimiter', delimiter or 'auto', '', 'String used to separate columns or "auto".') 

2938 cfg.add('fileUnitStyle', unit_style or 'auto', '', 'Add units as extra row ("row"), add units to header label separated by "/" ("header"), do not print out units ("none"), or "auto".') 

2939 cfg.add('fileColumnNumbers', column_numbers or 'none', '', 'Add line with column indices ("index", "num", "aa", "AA", or "none")') 

2940 cfg.add('fileSections', sections or 'auto', '', 'Maximum number of section levels or "auto"') 

2941 cfg.add('fileAlignColumns', align_columns or 'auto', '', 'If True, write all data of a column using the same width, if False write the data without any white space, or "auto".') 

2942 cfg.add('fileShrinkColumnWidth', shrink_width, '', 'Allow to make columns narrower than specified by the corresponding format strings.') 

2943 cfg.add('fileMissing', missing, '', 'String used to indicate missing data values.') 

2944 cfg.add('fileCenterColumns', center_columns, '', 'Center content of all columns instead of left align columns of strings and right align numbers (markdown, html, and latex).') 

2945 cfg.add('fileLaTeXLabelCommand', latex_label_command, '', 'LaTeX command name for formatting column labels of the table header.') 

2946 cfg.add('fileLaTeXMergeStd', latex_merge_std, '', 'Merge header of columns with standard deviations with previous column (LaTeX tables only).') 

2947 

2948 

2949def write_table_args(cfg): 

2950 """Translates a configuration to the respective parameter names for 

2951writing a table to a file. 

2952  

2953 The return value can then be passed as key-word arguments to TableData.write(). 

2954 

2955 Parameters 

2956 ---------- 

2957 cfg: ConfigFile 

2958 The configuration. 

2959 

2960 Returns 

2961 ------- 

2962 a: dict 

2963 Dictionary with names of arguments of the `TableData.write` function 

2964 and their values as supplied by `cfg`. 

2965 """ 

2966 d = cfg.map({'table_format': 'fileFormat', 

2967 'delimiter': 'fileDelimiter', 

2968 'unit_style': 'fileUnitStyle', 

2969 'column_numbers': 'fileColumnNumbers', 

2970 'sections': 'fileSections', 

2971 'align_columns': 'fileAlignColumns', 

2972 'shrink_width': 'fileShrinkColumnWidth', 

2973 'missing': 'fileMissing', 

2974 'center_columns': 'fileCenterColumns', 

2975 'latex_label_command': 'fileLaTeXLabelCommand', 

2976 'latex_merge_std': 'fileLaTeXMergeStd'}) 

2977 if 'sections' in d: 

2978 if d['sections'] != 'auto': 

2979 d['sections'] = int(d['sections']) 

2980 return d 

2981 

2982 

2983def latex_unit(unit): 

2984 """Translate unit string into SIunit LaTeX code. 

2985  

2986 Parameters 

2987 ---------- 

2988 unit: str 

2989 String enoting a unit. 

2990  

2991 Returns 

2992 ------- 

2993 unit: str 

2994 Unit string as valid LaTeX code. 

2995 """ 

2996 si_prefixes = {'y': '\\yocto', 

2997 'z': '\\zepto', 

2998 'a': '\\atto', 

2999 'f': '\\femto', 

3000 'p': '\\pico', 

3001 'n': '\\nano', 

3002 'u': '\\micro', 

3003 'm': '\\milli', 

3004 'c': '\\centi', 

3005 'd': '\\deci', 

3006 'h': '\\hecto', 

3007 'k': '\\kilo', 

3008 'M': '\\mega', 

3009 'G': '\\giga', 

3010 'T': '\\tera', 

3011 'P': '\\peta', 

3012 'E': '\\exa', 

3013 'Z': '\\zetta', 

3014 'Y': '\\yotta' } 

3015 si_units = {'m': '\\metre', 

3016 'g': '\\gram', 

3017 's': '\\second', 

3018 'A': '\\ampere', 

3019 'K': '\\kelvin', 

3020 'mol': '\\mole', 

3021 'cd': '\\candela', 

3022 'Hz': '\\hertz', 

3023 'N': '\\newton', 

3024 'Pa': '\\pascal', 

3025 'J': '\\joule', 

3026 'W': '\\watt', 

3027 'C': '\\coulomb', 

3028 'V': '\\volt', 

3029 'F': '\\farad', 

3030 'O': '\\ohm', 

3031 'S': '\\siemens', 

3032 'Wb': '\\weber', 

3033 'T': '\\tesla', 

3034 'H': '\\henry', 

3035 'C': '\\celsius', 

3036 'lm': '\\lumen', 

3037 'lx': '\\lux', 

3038 'Bq': '\\becquerel', 

3039 'Gv': '\\gray', 

3040 'Sv': '\\sievert'} 

3041 other_units = {"'": '\\arcminute', 

3042 "''": '\\arcsecond', 

3043 'a': '\\are', 

3044 'd': '\\dday', 

3045 'eV': '\\electronvolt', 

3046 'ha': '\\hectare', 

3047 'h': '\\hour', 

3048 'L': '\\liter', 

3049 'l': '\\litre', 

3050 'min': '\\minute', 

3051 'Np': '\\neper', 

3052 'rad': '\\rad', 

3053 't': '\\ton', 

3054 '%': '\\%'} 

3055 unit_powers = {'^2': '\\squared', 

3056 '^3': '\\cubed', 

3057 '/': '\\per', 

3058 '^-1': '\\power{}{-1}', 

3059 '^-2': '\\rpsquared', 

3060 '^-3': '\\rpcubed'} 

3061 if '\\' in unit: # this string is already translated! 

3062 return unit 

3063 units = '' 

3064 j = len(unit) 

3065 while j >= 0: 

3066 for k in range(-3, 0): 

3067 if j+k < 0: 

3068 continue 

3069 uss = unit[j+k:j] 

3070 if uss in unit_powers: 

3071 units = unit_powers[uss] + units 

3072 break 

3073 elif uss in other_units: 

3074 units = other_units[uss] + units 

3075 break 

3076 elif uss in si_units: 

3077 units = si_units[uss] + units 

3078 j = j+k 

3079 k = 0 

3080 if j-1 >= 0: 

3081 uss = unit[j-1:j] 

3082 if uss in si_prefixes: 

3083 units = si_prefixes[uss] + units 

3084 k = -1 

3085 break 

3086 else: 

3087 k = -1 

3088 units = unit[j+k:j] + units 

3089 j = j + k 

3090 return units 

3091 

3092 

3093def index2aa(n, a='a'): 

3094 """Convert an integer into an alphabetical representation. 

3095 

3096 The integer number is converted into 'a', 'b', 'c', ..., 'z', 

3097 'aa', 'ab', 'ac', ..., 'az', 'ba', 'bb', ... 

3098 

3099 Inspired by https://stackoverflow.com/a/37604105 

3100 

3101 Parameters 

3102 ---------- 

3103 n: int 

3104 An integer to be converted into alphabetical representation. 

3105 a: str ('a' or 'A') 

3106 Use upper or lower case characters. 

3107 

3108 Returns 

3109 ------- 

3110 ns: str 

3111 Alphabetical represtnation of an integer. 

3112 """ 

3113 d, m = divmod(n, 26) 

3114 bm = chr(ord(a)+m) 

3115 return index2aa(d-1, a) + bm if d else bm 

3116 

3117 

3118def aa2index(s): 

3119 """Convert an alphabetical representation to an index. 

3120 

3121 The alphabetical representation 'a', 'b', 'c', ..., 'z', 

3122 'aa', 'ab', 'ac', ..., 'az', 'ba', 'bb', ... 

3123 is converted to an index starting with 0. 

3124 

3125 Parameters 

3126 ---------- 

3127 s: str 

3128 Alphabetical representation of an index. 

3129 

3130 Returns 

3131 ------- 

3132 index: int 

3133 The corresponding index. 

3134 

3135 Raises 

3136 ------ 

3137 ValueError: 

3138 Invalid character in input string. 

3139 """ 

3140 index = 0 

3141 maxc = ord('z') - ord('a') + 1 

3142 for c in s.lower(): 

3143 index *= maxc 

3144 if ord(c) < ord('a') or ord(c) > ord('z'): 

3145 raise ValueError('invalid character "%s" in string.' % c) 

3146 index += ord(c) - ord('a') + 1 

3147 return index-1 

3148 

3149 

3150class IndentStream(object): 

3151 """Filter an output stream and start each newline with a number of 

3152 spaces. 

3153 """ 

3154 def __init__(self, stream, indent=4): 

3155 self.stream = stream 

3156 self.indent = indent 

3157 self.pending = True 

3158 

3159 def __getattr__(self, attr_name): 

3160 return getattr(self.stream, attr_name) 

3161 

3162 def write(self, data): 

3163 if not data: 

3164 return 

3165 if self.pending: 

3166 self.stream.write(' '*self.indent) 

3167 self.pending = False 

3168 substr = data.rstrip('\n') 

3169 rn = len(data) - len(substr) 

3170 if len(substr) > 0: 

3171 self.stream.write(substr.replace('\n', '\n'+' '*self.indent)) 

3172 if rn > 0: 

3173 self.stream.write('\n'*rn) 

3174 self.pending = True 

3175 

3176 def flush(self): 

3177 self.stream.flush() 

3178 

3179 

3180def main(): 

3181 # setup a table: 

3182 df = TableData() 

3183 df.append(["data", "partial information", "ID"], "", "%-s", list('ABCDEFGH')) 

3184 df.append("size", "m", "%6.2f", [2.34, 56.7, 8.9]) 

3185 df.append("full weight", "kg", "%.0f", 122.8) 

3186 df.append_section("complete reaction") 

3187 df.append("speed", "m/s", "%.3g", 98.7) 

3188 df.append("median jitter", "mm", "%.1f", 23) 

3189 df.append("size", "g", "%.2e", 1.234) 

3190 df.append_data(np.nan, 2) # single value 

3191 df.append_data((0.543, 45, 1.235e2)) # remaining row 

3192 df.append_data((43.21, 6789.1, 3405, 1.235e-4), 2) # next row 

3193 a = 0.5*np.arange(1, 6)*np.random.randn(5, 5) + 10.0 + np.arange(5) 

3194 df.append_data(a.T, 1) # rest of table 

3195 df[3:6,'weight'] = [11.0]*3 

3196 

3197 # write out in all formats: 

3198 for tf in TableData.formats: 

3199 print(' - `%s`: %s' % (tf, TableData.descriptions[tf])) 

3200 print(' ```') 

3201 iout = IndentStream(sys.stdout, 4+2) 

3202 df.write(iout, table_format=tf) 

3203 print(' ```') 

3204 print('') 

3205 

3206 

3207if __name__ == "__main__": 

3208 main()