// Copyright 2009 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.

// Package tabwriter implements a write filter (tabwriter.Writer) that // translates tabbed columns in input into properly aligned text. // // The package is using the Elastic Tabstops algorithm described at // http://nickgravgaard.com/elastictabstops/index.html. // // The text/tabwriter package is frozen and is not accepting new features.
package tabwriter import ( ) // ---------------------------------------------------------------------------- // Filter implementation // A cell represents a segment of text terminated by tabs or line breaks. // The text itself is stored in a separate buffer; cell only describes the // segment's size in bytes, its width in runes, and whether it's an htab // ('\t') terminated cell. type cell struct { size int // cell size in bytes width int // cell width in runes htab bool // true if the cell is terminated by an htab ('\t') } // A Writer is a filter that inserts padding around tab-delimited // columns in its input to align them in the output. // // The Writer treats incoming bytes as UTF-8-encoded text consisting // of cells terminated by horizontal ('\t') or vertical ('\v') tabs, // and newline ('\n') or formfeed ('\f') characters; both newline and // formfeed act as line breaks. // // Tab-terminated cells in contiguous lines constitute a column. The // Writer inserts padding as needed to make all cells in a column have // the same width, effectively aligning the columns. It assumes that // all characters have the same width, except for tabs for which a // tabwidth must be specified. Column cells must be tab-terminated, not // tab-separated: non-tab terminated trailing text at the end of a line // forms a cell but that cell is not part of an aligned column. // For instance, in this example (where | stands for a horizontal tab): // // aaaa|bbb|d // aa |b |dd // a | // aa |cccc|eee // // the b and c are in distinct columns (the b column is not contiguous // all the way). The d and e are not in a column at all (there's no // terminating tab, nor would the column be contiguous). // // The Writer assumes that all Unicode code points have the same width; // this may not be true in some fonts or if the string contains combining // characters. // // If DiscardEmptyColumns is set, empty columns that are terminated // entirely by vertical (or "soft") tabs are discarded. Columns // terminated by horizontal (or "hard") tabs are not affected by // this flag. // // If a Writer is configured to filter HTML, HTML tags and entities // are passed through. The widths of tags and entities are // assumed to be zero (tags) and one (entities) for formatting purposes. // // A segment of text may be escaped by bracketing it with Escape // characters. The tabwriter passes escaped text segments through // unchanged. In particular, it does not interpret any tabs or line // breaks within the segment. If the StripEscape flag is set, the // Escape characters are stripped from the output; otherwise they // are passed through as well. For the purpose of formatting, the // width of the escaped text is always computed excluding the Escape // characters. // // The formfeed character acts like a newline but it also terminates // all columns in the current line (effectively calling Flush). Tab- // terminated cells in the next line start new columns. Unless found // inside an HTML tag or inside an escaped text segment, formfeed // characters appear as newlines in the output. // // The Writer must buffer input internally, because proper spacing // of one line may depend on the cells in future lines. Clients must // call Flush when done calling Write. type Writer struct { // configuration output io.Writer minwidth int tabwidth int padding int padbytes [8]byte flags uint // current state buf []byte // collected text excluding tabs or line breaks pos int // buffer position up to which cell.width of incomplete cell has been computed cell cell // current incomplete cell; cell.width is up to buf[pos] excluding ignored sections endChar byte // terminating char of escaped sequence (Escape for escapes, '>', ';' for HTML tags/entities, or 0) lines [][]cell // list of lines; each line is a list of cells widths []int // list of column widths in runes - re-used during formatting } // addLine adds a new line. // flushed is a hint indicating whether the underlying writer was just flushed. // If so, the previous line is not likely to be a good indicator of the new line's cells. func ( *Writer) ( bool) { // Grow slice instead of appending, // as that gives us an opportunity // to re-use an existing []cell. if := len(.lines) + 1; <= cap(.lines) { .lines = .lines[:] .lines[-1] = .lines[-1][:0] } else { .lines = append(.lines, nil) } if ! { // The previous line is probably a good indicator // of how many cells the current line will have. // If the current line's capacity is smaller than that, // abandon it and make a new one. if := len(.lines); >= 2 { if := len(.lines[-2]); > cap(.lines[-1]) { .lines[-1] = make([]cell, 0, ) } } } } // Reset the current state. func ( *Writer) () { .buf = .buf[:0] .pos = 0 .cell = cell{} .endChar = 0 .lines = .lines[0:0] .widths = .widths[0:0] .addLine(true) } // Internal representation (current state): // // - all text written is appended to buf; tabs and line breaks are stripped away // - at any given time there is a (possibly empty) incomplete cell at the end // (the cell starts after a tab or line break) // - cell.size is the number of bytes belonging to the cell so far // - cell.width is text width in runes of that cell from the start of the cell to // position pos; html tags and entities are excluded from this width if html // filtering is enabled // - the sizes and widths of processed text are kept in the lines list // which contains a list of cells for each line // - the widths list is a temporary list with current widths used during // formatting; it is kept in Writer because it's re-used // // |<---------- size ---------->| // | | // |<- width ->|<- ignored ->| | // | | | | // [---processed---tab------------<tag>...</tag>...] // ^ ^ ^ // | | | // buf start of incomplete cell pos // Formatting can be controlled with these flags. const ( // Ignore html tags and treat entities (starting with '&' // and ending in ';') as single characters (width = 1). FilterHTML uint = 1 << iota // Strip Escape characters bracketing escaped text segments // instead of passing them through unchanged with the text. StripEscape // Force right-alignment of cell content. // Default is left-alignment. AlignRight // Handle empty columns as if they were not present in // the input in the first place. DiscardEmptyColumns // Always use tabs for indentation columns (i.e., padding of // leading empty cells on the left) independent of padchar. TabIndent // Print a vertical bar ('|') between columns (after formatting). // Discarded columns appear as zero-width columns ("||"). Debug ) // A Writer must be initialized with a call to Init. The first parameter (output) // specifies the filter output. The remaining parameters control the formatting: // // minwidth minimal cell width including any padding // tabwidth width of tab characters (equivalent number of spaces) // padding padding added to a cell before computing its width // padchar ASCII char used for padding // if padchar == '\t', the Writer will assume that the // width of a '\t' in the formatted output is tabwidth, // and cells are left-aligned independent of align_left // (for correct-looking results, tabwidth must correspond // to the tab width in the viewer displaying the result) // flags formatting control func ( *Writer) ( io.Writer, , , int, byte, uint) *Writer { if < 0 || < 0 || < 0 { panic("negative minwidth, tabwidth, or padding") } .output = .minwidth = .tabwidth = .padding = for := range .padbytes { .padbytes[] = } if == '\t' { // tab padding enforces left-alignment &^= AlignRight } .flags = .reset() return } // debugging support (keep code around) func ( *Writer) () { := 0 for , := range .lines { print("(", , ") ") for , := range { print("[", string(.buf[:+.size]), "]") += .size } print("\n") } print("\n") } // local error wrapper so we can distinguish errors we want to return // as errors from genuine panics (which we don't want to return as errors) type osError struct { err error } func ( *Writer) ( []byte) { , := .output.Write() if != len() && == nil { = io.ErrShortWrite } if != nil { panic(osError{}) } } func ( *Writer) ( []byte, int) { for > len() { .write0() -= len() } .write0([0:]) } var ( newline = []byte{'\n'} tabs = []byte("\t\t\t\t\t\t\t\t") ) func ( *Writer) (, int, bool) { if .padbytes[0] == '\t' || { // padding is done with tabs if .tabwidth == 0 { return // tabs have no width - can't do any padding } // make cellw the smallest multiple of b.tabwidth = ( + .tabwidth - 1) / .tabwidth * .tabwidth := - // amount of padding if < 0 { panic("internal error") } .writeN(tabs, (+.tabwidth-1)/.tabwidth) return } // padding is done with non-tab characters .writeN(.padbytes[0:], -) } var vbar = []byte{'|'} func ( *Writer) ( int, , int) ( int) { = for := ; < ; ++ { := .lines[] // if TabIndent is set, use tabs to pad leading empty cells := .flags&TabIndent != 0 for , := range { if > 0 && .flags&Debug != 0 { // indicate column break .write0(vbar) } if .size == 0 { // empty cell if < len(.widths) { .writePadding(.width, .widths[], ) } } else { // non-empty cell = false if .flags&AlignRight == 0 { // align left .write0(.buf[ : +.size]) += .size if < len(.widths) { .writePadding(.width, .widths[], false) } } else { // align right if < len(.widths) { .writePadding(.width, .widths[], false) } .write0(.buf[ : +.size]) += .size } } } if +1 == len(.lines) { // last buffered line - we don't have a newline, so just write // any outstanding buffered data .write0(.buf[ : +.cell.size]) += .cell.size } else { // not the last line - write newline .write0(newline) } } return } // Format the text between line0 and line1 (excluding line1); pos // is the buffer position corresponding to the beginning of line0. // Returns the buffer position corresponding to the beginning of // line1 and an error, if any. func ( *Writer) ( int, , int) ( int) { = := len(.widths) for := ; < ; ++ { := .lines[] if >= len()-1 { continue } // cell exists in this column => this line // has more cells than the previous line // (the last cell per line is ignored because cells are // tab-terminated; the last cell per line describes the // text before the newline/formfeed and does not belong // to a column) // print unprinted lines until beginning of block = .writeLines(, , ) = // column block begin := .minwidth // minimal column width := true // true if all cells in this column are empty and "soft" for ; < ; ++ { = .lines[] if >= len()-1 { break } // cell exists in this column := [] // update width if := .width + .padding; > { = } // update discardable if .width > 0 || .htab { = false } } // column block end // discard empty columns if necessary if && .flags&DiscardEmptyColumns != 0 { = 0 } // format and print all columns to the right of this column // (we know the widths of this column and all columns to the left) .widths = append(.widths, ) // push width = .(, , ) .widths = .widths[0 : len(.widths)-1] // pop width = } // print unprinted lines until end return .writeLines(, , ) } // Append text to current cell. func ( *Writer) ( []byte) { .buf = append(.buf, ...) .cell.size += len() } // Update the cell width. func ( *Writer) () { .cell.width += utf8.RuneCount(.buf[.pos:]) .pos = len(.buf) } // To escape a text segment, bracket it with Escape characters. // For instance, the tab in this string "Ignore this tab: \xff\t\xff" // does not terminate a cell and constitutes a single character of // width one for formatting purposes. // // The value 0xff was chosen because it cannot appear in a valid UTF-8 sequence. const Escape = '\xff' // Start escaped mode. func ( *Writer) ( byte) { switch { case Escape: .endChar = Escape case '<': .endChar = '>' case '&': .endChar = ';' } } // Terminate escaped mode. If the escaped text was an HTML tag, its width // is assumed to be zero for formatting purposes; if it was an HTML entity, // its width is assumed to be one. In all other cases, the width is the // unicode width of the text. func ( *Writer) () { switch .endChar { case Escape: .updateWidth() if .flags&StripEscape == 0 { .cell.width -= 2 // don't count the Escape chars } case '>': // tag of zero width case ';': .cell.width++ // entity, count as one rune } .pos = len(.buf) .endChar = 0 } // Terminate the current cell by adding it to the list of cells of the // current line. Returns the number of cells in that line. func ( *Writer) ( bool) int { .cell.htab = := &.lines[len(.lines)-1] * = append(*, .cell) .cell = cell{} return len(*) } func ( *Writer) ( *error, string) { if := recover(); != nil { if == "Flush" { // If Flush ran into a panic, we still need to reset. .reset() } if , := .(osError); { * = .err return } panic("tabwriter: panic during " + ) } } // Flush should be called after the last call to Write to ensure // that any data buffered in the Writer is written to output. Any // incomplete escape sequence at the end is considered // complete for formatting purposes. func ( *Writer) () error { return .flush() } // flush is the internal version of Flush, with a named return value which we // don't want to expose. func ( *Writer) () ( error) { defer .handlePanic(&, "Flush") .flushNoDefers() return nil } // flushNoDefers is like flush, but without a deferred handlePanic call. This // can be called from other methods which already have their own deferred // handlePanic calls, such as Write, and avoid the extra defer work. func ( *Writer) () { // add current cell if not empty if .cell.size > 0 { if .endChar != 0 { // inside escape - terminate it even if incomplete .endEscape() } .terminateCell(false) } // format contents of buffer .format(0, 0, len(.lines)) .reset() } var hbar = []byte("---\n") // Write writes buf to the writer b. // The only errors returned are ones encountered // while writing to the underlying output stream. func ( *Writer) ( []byte) ( int, error) { defer .handlePanic(&, "Write") // split text into cells = 0 for , := range { if .endChar == 0 { // outside escape switch { case '\t', '\v', '\n', '\f': // end of cell .append([:]) .updateWidth() = + 1 // ch consumed := .terminateCell( == '\t') if == '\n' || == '\f' { // terminate line .addLine( == '\f') if == '\f' || == 1 { // A '\f' always forces a flush. Otherwise, if the previous // line has only one cell which does not have an impact on // the formatting of the following lines (the last cell per // line is ignored by format()), thus we can flush the // Writer contents. .flushNoDefers() if == '\f' && .flags&Debug != 0 { // indicate section break .write0(hbar) } } } case Escape: // start of escaped sequence .append([:]) .updateWidth() = if .flags&StripEscape != 0 { ++ // strip Escape } .startEscape(Escape) case '<', '&': // possibly an html tag/entity if .flags&FilterHTML != 0 { // begin of tag/entity .append([:]) .updateWidth() = .startEscape() } } } else { // inside escape if == .endChar { // end of tag/entity := + 1 if == Escape && .flags&StripEscape != 0 { = // strip Escape } .append([:]) = + 1 // ch consumed .endEscape() } } } // append leftover text .append([:]) = len() return } // NewWriter allocates and initializes a new tabwriter.Writer. // The parameters are the same as for the Init function. func ( io.Writer, , , int, byte, uint) *Writer { return new(Writer).Init(, , , , , ) }