|
|
|
#! /usr/bin/python
|
|
|
|
########################################################################
|
|
|
|
#
|
|
|
|
# reorder and reformat a file in columns
|
|
|
|
#
|
|
|
|
# this utility takes lines from its standard input and reproduces them,
|
|
|
|
# partially reordered and reformatted, on its standard output.
|
|
|
|
#
|
|
|
|
# It has the same effect as a 'sort | column -t', with the exception
|
|
|
|
# that empty lines, as well as lines which start with a '#' sign, are
|
|
|
|
# not affected, i.e. they keep their position and formatting, and act
|
|
|
|
# as separators, i.e. the parts before and after them are each sorted
|
|
|
|
# separately (but overall field widths are computed across the whole
|
|
|
|
# input).
|
|
|
|
#
|
|
|
|
# Options:
|
|
|
|
# -i:
|
|
|
|
# --ignore-case:
|
|
|
|
# Do not consider case when sorting.
|
|
|
|
# -d:
|
|
|
|
# --default:
|
|
|
|
# What to chage empty fields to.
|
|
|
|
# -s <N>:
|
|
|
|
# --split=<N>:
|
|
|
|
# Treat only the first N whitespace sequences as separators.
|
|
|
|
# line content after the Nth separator will count as only one
|
|
|
|
# field even if it contains whitespace.
|
|
|
|
# Example : '-s 2' causes input 'a b c d e' to be split into
|
|
|
|
# three fields, 'a', 'b', and 'c d e'.
|
|
|
|
#
|
|
|
|
# boards.cfg requires -ids 6.
|
|
|
|
#
|
|
|
|
########################################################################
|
|
|
|
|
|
|
|
import sys, getopt, locale
|
|
|
|
|
|
|
|
# ensure we sort using the C locale.
|
|
|
|
|
|
|
|
locale.setlocale(locale.LC_ALL, 'C')
|
|
|
|
|
|
|
|
# check options
|
|
|
|
|
|
|
|
maxsplit = 0
|
|
|
|
ignore_case = 0
|
|
|
|
default_field =''
|
|
|
|
|
|
|
|
try:
|
|
|
|
opts, args = getopt.getopt(sys.argv[1:], "id:s:",
|
|
|
|
["ignore-case","default","split="])
|
|
|
|
except getopt.GetoptError as err:
|
|
|
|
print str(err) # will print something like "option -a not recognized"
|
|
|
|
sys.exit(2)
|
|
|
|
|
|
|
|
for o, a in opts:
|
|
|
|
if o in ("-s", "--split"):
|
|
|
|
maxsplit = eval(a)
|
|
|
|
elif o in ("-i", "--ignore-case"):
|
|
|
|
ignore_case = 1
|
|
|
|
elif o in ("-d", "--default"):
|
|
|
|
default_field = a
|
|
|
|
else:
|
|
|
|
assert False, "unhandled option"
|
|
|
|
|
|
|
|
# collect all lines from standard input and, for the ones which must be
|
|
|
|
# reformatted and sorted, count their fields and compute each field's
|
|
|
|
# maximum size
|
|
|
|
|
|
|
|
input_lines = []
|
|
|
|
field_width = []
|
|
|
|
|
|
|
|
for line in sys.stdin:
|
|
|
|
# remove final end of line
|
|
|
|
input_line = line.strip('\n')
|
|
|
|
if (len(input_line)>0) and (input_line[0] != '#'):
|
|
|
|
# sortable line: split into fields
|
|
|
|
fields = input_line.split(None,maxsplit)
|
|
|
|
# if there are new fields, top up field_widths
|
|
|
|
for f in range(len(field_width), len(fields)):
|
|
|
|
field_width.append(0)
|
|
|
|
# compute the maximum witdh of each field
|
|
|
|
for f in range(len(fields)):
|
|
|
|
field_width[f] = max(field_width[f],len(fields[f]))
|
|
|
|
# collect the line for next stage
|
|
|
|
input_lines.append(input_line)
|
|
|
|
|
|
|
|
# run through collected input lines, collect the ones which must be
|
|
|
|
# reformatted and sorted, and whenever a non-reformattable, non-sortable
|
|
|
|
# line is met, sort the collected lines before it and append them to the
|
|
|
|
# output lines, then add the non-sortable line too.
|
|
|
|
|
|
|
|
output_lines = []
|
|
|
|
sortable_lines = []
|
|
|
|
for input_line in input_lines:
|
|
|
|
if (len(input_line)>0) and (input_line[0] != '#'):
|
|
|
|
# this line should be reformatted and sorted
|
|
|
|
input_fields = input_line.split(None,maxsplit)
|
|
|
|
output_fields = [];
|
|
|
|
# reformat each field to this field's column width
|
|
|
|
for f in range(len(input_fields)):
|
|
|
|
output_field = input_fields[f];
|
|
|
|
output_fields.append(output_field.ljust(field_width[f]))
|
|
|
|
# any missing field is set to default if it exists
|
|
|
|
if default_field != '':
|
|
|
|
for f in range(len(input_fields),len(field_width)):
|
|
|
|
output_fields.append(default_field.ljust(field_width[f]))
|
|
|
|
# join fields using two spaces, like column -t would
|
|
|
|
output_line = ' '.join(output_fields);
|
|
|
|
# collect line for later
|
|
|
|
sortable_lines.append(output_line)
|
|
|
|
else:
|
|
|
|
# this line is non-sortable
|
|
|
|
# sort collected sortable lines
|
|
|
|
if ignore_case!=0:
|
|
|
|
sortable_lines.sort(key=lambda x: str.lower(locale.strxfrm(x)))
|
|
|
|
else:
|
|
|
|
sortable_lines.sort(key=lambda x: locale.strxfrm(x))
|
|
|
|
# append sortable lines to the final output
|
|
|
|
output_lines.extend(sortable_lines)
|
|
|
|
sortable_lines = []
|
|
|
|
# append non-sortable line to the final output
|
|
|
|
output_lines.append(input_line)
|
|
|
|
# maybe we had sortable lines pending, so append them to the final output
|
|
|
|
if ignore_case!=0:
|
|
|
|
sortable_lines.sort(key=lambda x: str.lower(locale.strxfrm(x)))
|
|
|
|
else:
|
|
|
|
sortable_lines.sort(key=lambda x: locale.strxfrm(x))
|
|
|
|
output_lines.extend(sortable_lines)
|
|
|
|
|
|
|
|
# run through output lines and print them, except rightmost whitespace
|
|
|
|
|
|
|
|
for output_line in output_lines:
|
|
|
|
print output_line.rstrip()
|