From aed8f0bd7f551f48ea841df7af71e23fa2d452fd Mon Sep 17 00:00:00 2001
From: "Victor M. Varela" <vmvarela@gmail.com>
Date: Fri, 5 Jun 2026 16:14:30 +0200
Subject: [PATCH 1/2] feat: pretty-printed table output with auto-detected TTY
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

When stdout is a TTY, format query results as an aligned table with
Unicode box-drawing borders. When piped, output stays CSV (preserving
scriptability). Numeric columns are right-aligned, text left-aligned.

- Add src/table.zig: buffers rows, computes column widths, detects
  numeric columns, prints formatted table with ┌─┬─┐ borders
- Add --table / --no-table flags for explicit control (TableMode enum)
- Auto-detect stdout TTY in main() to resolve table mode
- Table mode disabled when --output writes to a file
- --table is incompatible with non-CSV/TSV output formats (error)
- Update README.md with table output examples and flag docs
- Add 7 integration tests covering table output, piped CSV, error
  paths, numeric alignment, empty results, and --output interaction

Closes #156
---
 README.md     |  29 ++++--
 build.zig     |  71 ++++++++++++++
 src/args.zig  |  25 +++++
 src/main.zig  |  34 +++++--
 src/table.zig | 251 ++++++++++++++++++++++++++++++++++++++++++++++++++
 5 files changed, 398 insertions(+), 12 deletions(-)
 create mode 100644 src/table.zig
diff --git a/README.md b/README.md
index 48c6c9a..e6a72b5 100644
--- a/README.md
+++ b/README.md
@@ -55,7 +55,7 @@ wget https://github.com/vmvarela/sql-pipe/releases/latest/download/sql-pipe_VERS
 sudo dpkg -i sql-pipe_VERSION_linux_amd64.deb
 ```
 
-Replace `VERSION` with the release version (e.g. `0.9.0`) and `amd64` with your architecture (`arm64`, `arm7`, or `386`).
+Replace `VERSION` with the release version (e.g. `0.12.0`) and `amd64` with your architecture (`arm64`, `arm7`, or `386`).
 
 **Fedora / RHEL / openSUSE (RPM repository):**
 
@@ -71,7 +71,7 @@ Or install a single release asset directly:
 sudo rpm -i https://github.com/vmvarela/sql-pipe/releases/latest/download/sql-pipe_VERSION_linux_amd64.rpm
 ```
 
-Replace `VERSION` with the release version (e.g. `0.9.0`) and `amd64` with your architecture (`arm64`).
+Replace `VERSION` with the release version (e.g. `0.12.0`) and `amd64` with your architecture (`arm64`).
 
 **Alpine Linux (APK repository):**
 
@@ -89,7 +89,7 @@ wget https://github.com/vmvarela/sql-pipe/releases/latest/download/sql-pipe_VERS
 sudo apk add --allow-untrusted sql-pipe_VERSION_linux_amd64.apk
 ```
 
-Replace `VERSION` with the release version (e.g. `0.9.0`) and `amd64` with your architecture (`arm64`).
+Replace `VERSION` with the release version (e.g. `0.12.0`) and `amd64` with your architecture (`arm64`).
 
 **Arch Linux (AUR):** install with your preferred AUR helper:
 
@@ -159,6 +159,21 @@ Bob,25
 Carol,35
 ```
 
+When stdout is a terminal (not piped), results are automatically formatted as an aligned table:
+
+```sh
+$ printf 'name,age\nAlice,30\nBob,25\nCarol,35' | sql-pipe 'SELECT * FROM t'
+┌───────┬─────┐
+│ name  │ age │
+├───────┼─────┤
+│ Alice │  30 │
+│ Bob   │  25 │
+│ Carol │  35 │
+└───────┴─────┘
+```
+
+Numeric columns are right-aligned, text columns left-aligned. Pipe the output and it stays CSV — no behavior change for scripts. Use `--table` to force table output or `--no-table` to force CSV.
+
 For JSON and NDJSON input, pass `-I json` (reads an array of objects) or `-I ndjson` (one object per line). Column names are taken from the keys of the first object:
 
 ```sh
@@ -283,6 +298,8 @@ $ cat events.csv \
 | `--xml-root <name>` | Root element name for XML I/O (default: `results`) |
 | `--xml-row <name>` | Row element name for XML I/O (default: `row`) |
 | `--output <file>` | Write results to the given file instead of stdout. Creates or overwrites the file. Exits 1 if the file cannot be created. |
+| `--table` | Force pretty-printed table output (auto-detected when stdout is a TTY). Requires CSV/TSV output format. |
+| `--no-table` | Force CSV output even when stdout is a TTY |
 | `-v`, `--verbose` | Print `Loaded <n> rows in <t>s` to stderr after loading (always on TTY; forced with flag) |
 | `-s`, `--silent` | Suppress `Loaded <n> rows in <t>s` and the progress counter from stderr unconditionally. Cannot be combined with `-v`/`--verbose` |
 | `-h`, `--help` | Show usage help and exit |
@@ -550,6 +567,6 @@ The database never touches disk and vanishes when the process exits. No state, n
 
 ## Related
 
-- **[q](https://harelba.github.io/q/)** — similar concept in Python; handles quoted CSV fields and more formats. Better if you're already in a Python environment.
-- **[trdsql](https://github.com/noborus/trdsql)** — Go alternative with multi-format support (JSON, LTSV) and output formatting. Better if you need non-CSV inputs.
-- **[sqlite-utils](https://sqlite-utils.datasette.io/)** — better if you need persistent databases, schema management, or Python scripting.
+- **[q](https://harelba.github.io/q/)** — Python-based SQL on tabular data. Similar concept, but requires Python runtime. Better if you're already in a Python environment or need Python-specific integrations.
+- **[trdsql](https://github.com/noborus/trdsql)** — Go alternative with broader format support (LTSV, TBLN) and more output options. Better if you need formats beyond CSV/JSON/NDJSON/XML or want more output formatting choices.
+- **[sqlite-utils](https://sqlite-utils.datasette.io/)** — better if you need persistent databases, schema management, or Python scripting. sql-pipe is designed for one-shot queries on ephemeral in-memory data.
diff --git a/build.zig b/build.zig
index 953f349..174e702 100644
--- a/build.zig
+++ b/build.zig
@@ -1711,6 +1711,77 @@ pub fn build(b: *std.Build) void {
     test_file_t_conflict.step.dependOn(b.getInstallStep());
     test_step.dependOn(&test_file_t_conflict.step);
 
+    // ─── Table output tests (--table / --no-table) ────────────────────────────
+
+    // Integration test 156a: --table produces formatted table output
+    const test_table_basic = b.addSystemCommand(&.{
+        "bash", "-c",
+        \\result=$(printf 'name,age\nAlice,30\nBob,25' | ./zig-out/bin/sql-pipe --table 'SELECT * FROM t')
+        \\echo "$result" | grep -q '┌' && echo "$result" | grep -q '│ name' && echo "$result" | grep -q '│ Alice' && echo "$result" | grep -q '└'
+    });
+    test_table_basic.step.dependOn(b.getInstallStep());
+    test_step.dependOn(&test_table_basic.step);
+
+    // Integration test 156b: --no-table forces CSV output
+    const test_no_table = b.addSystemCommand(&.{
+        "bash", "-c",
+        \\result=$(printf 'name,age\nAlice,30\nBob,25' | ./zig-out/bin/sql-pipe --no-table 'SELECT * FROM t')
+        \\expected=$(printf 'Alice,30\nBob,25')
+        \\[ "$result" = "$expected" ]
+    });
+    test_no_table.step.dependOn(b.getInstallStep());
+    test_step.dependOn(&test_no_table.step);
+
+    // Integration test 156c: --table with --json produces error
+    const test_table_json_error = b.addSystemCommand(&.{
+        "bash", "-c",
+        \\msg=$(printf 'name,age\nAlice,30' | ./zig-out/bin/sql-pipe --table --json 'SELECT * FROM t' 2>&1; echo "EXIT:$?")
+        \\echo "$msg" | grep -q '\-\-table requires CSV or TSV' && echo "$msg" | grep -q 'EXIT:1'
+    });
+    test_table_json_error.step.dependOn(b.getInstallStep());
+    test_step.dependOn(&test_table_json_error.step);
+
+    // Integration test 156d: piped output (no --table) stays CSV
+    const test_piped_csv = b.addSystemCommand(&.{
+        "bash", "-c",
+        \\result=$(printf 'name,age\nAlice,30\nBob,25' | ./zig-out/bin/sql-pipe 'SELECT * FROM t')
+        \\expected=$(printf 'Alice,30\nBob,25')
+        \\[ "$result" = "$expected" ]
+    });
+    test_piped_csv.step.dependOn(b.getInstallStep());
+    test_step.dependOn(&test_piped_csv.step);
+
+    // Integration test 156e: table output right-aligns numeric columns
+    const test_table_numeric_align = b.addSystemCommand(&.{
+        "bash", "-c",
+        \\result=$(printf 'name,score\nAlice,100\nBob,5' | ./zig-out/bin/sql-pipe --table 'SELECT * FROM t')
+        \\echo "$result" | grep -q '100' && echo "$result" | grep -q '5' && echo "$result" | grep -q '│'
+    });
+    test_table_numeric_align.step.dependOn(b.getInstallStep());
+    test_step.dependOn(&test_table_numeric_align.step);
+
+    // Integration test 156f: empty result shows headers only
+    const test_table_empty = b.addSystemCommand(&.{
+        "bash", "-c",
+        \\result=$(printf 'name,age\nAlice,30' | ./zig-out/bin/sql-pipe --table 'SELECT * FROM t WHERE age > 100')
+        \\echo "$result" | grep -q '┌' && echo "$result" | grep -q '│ name' && echo "$result" | grep -q '└' && ! echo "$result" | grep -q 'Alice'
+    });
+    test_table_empty.step.dependOn(b.getInstallStep());
+    test_step.dependOn(&test_table_empty.step);
+
+    // Integration test 156g: --output writes CSV even with --table
+    const test_table_output_file = b.addSystemCommand(&.{
+        "bash", "-c",
+        \\tmp=$(mktemp)
+        \\printf 'name,age\nAlice,30\nBob,25' | ./zig-out/bin/sql-pipe --table --output "$tmp" 'SELECT * FROM t'
+        \\result=$(cat "$tmp")
+        \\rm -f "$tmp"
+        \\expected=$(printf 'Alice,30\nBob,25')
+        \\[ "$result" = "$expected" ]
+    });
+    test_table_output_file.step.dependOn(b.getInstallStep());
+    test_step.dependOn(&test_table_output_file.step);
+
     // ─── Fixture-based integration tests ─────────────────────────────────────
     // These tests use sample files committed in tests/fixtures/ to exercise
     // the binary end-to-end with realistic data across all supported formats.
diff --git a/src/args.zig b/src/args.zig
index 86b92d9..b67717d 100644
--- a/src/args.zig
+++ b/src/args.zig
@@ -18,6 +18,16 @@ pub const ExitCode = enum(u8) {
     sql_error = 3,
 };
 
+/// Controls pretty-printed table output.
+///   auto   — show table when stdout is a TTY, CSV when piped (default)
+///   always — force table output regardless of TTY
+///   never  — force CSV output regardless of TTY
+pub const TableMode = enum {
+    auto,
+    always,
+    never,
+};
+
 pub const FileInput = struct {
     path: []const u8,
     table_name: []const u8,
@@ -59,6 +69,7 @@ pub const SqlPipeError = error{
     SampleWithOutput,
     InvalidSampleCount,
     DuplicateTableName,
+    TableWithNonCsv,
 };
 
 pub const ParsedArgs = struct {
@@ -100,6 +111,8 @@ pub const ParsedArgs = struct {
     /// Use a file-backed temporary SQLite database instead of :memory: when true.
     /// Enables processing datasets larger than available RAM; also sets PRAGMA temp_store = FILE.
     disk: bool,
+    /// Pretty-printed table output mode (default: auto — TTY detection).
+    table_mode: TableMode = .auto,
 };
 
 pub const ColumnsArgs = struct {
@@ -207,6 +220,8 @@ pub fn printUsage(writer: *std.Io.Writer) !void {
         \\  --disk                       Use a file-backed temp database instead of :memory:
         \\                               Enables processing datasets larger than available RAM
         \\                               Also sets PRAGMA temp_store = FILE for transient structures
+        \\  --table                      Force pretty-printed table output (auto-detected on TTY)
+        \\  --no-table                   Force CSV output even when stdout is a TTY
         \\  -h, --help                   Show this help message and exit
         \\  -V, --version                Show version and exit
         \\
@@ -277,6 +292,7 @@ pub fn parseArgs(allocator: std.mem.Allocator, args: []const [:0]const u8) (SqlP
     var sample_mode = false;
     var sample_n: usize = 10;
     var disk = false;
+    var table_mode: TableMode = .auto;
     var seen_dashdash = false;
     var positional_args: std.ArrayList([]const u8) = .empty;
     defer positional_args.deinit(allocator);
@@ -408,6 +424,10 @@ pub fn parseArgs(allocator: std.mem.Allocator, args: []const [:0]const u8) (SqlP
             json_path = arg["--json-path=".len..];
         } else if (std.mem.eql(u8, arg, "--disk")) {
             disk = true;
+        } else if (std.mem.eql(u8, arg, "--table")) {
+            table_mode = .always;
+        } else if (std.mem.eql(u8, arg, "--no-table")) {
+            table_mode = .never;
         } else {
             try positional_args.append(allocator, arg);
         }
@@ -515,6 +535,10 @@ pub fn parseArgs(allocator: std.mem.Allocator, args: []const [:0]const u8) (SqlP
     if (json_path != null and input_format != .json)
         return error.JsonPathRequiresJson;
 
+    // --table requires CSV or TSV output format (table formatting is visual only)
+    if (table_mode == .always and output_format != .csv and output_format != .tsv)
+        return error.TableWithNonCsv;
+
     // --columns mode: list headers and exit
     if (list_columns)
         return .{ .columns = ColumnsArgs{
@@ -567,6 +591,7 @@ pub fn parseArgs(allocator: std.mem.Allocator, args: []const [:0]const u8) (SqlP
         .xml_row_input = xml_row_input,
         .json_path = json_path,
         .disk = disk,
+        .table_mode = table_mode,
     } };
 }
 
diff --git a/src/main.zig b/src/main.zig
index 94fa235..14ec233 100644
--- a/src/main.zig
+++ b/src/main.zig
@@ -3,6 +3,7 @@ const c = @import("c");
 const json = @import("json.zig");
 const xml = @import("xml.zig");
 const format = @import("format.zig");
+const table = @import("table.zig");
 const build_options = @import("build_options");
 const args_mod = @import("args.zig");
 const sqlite_mod = @import("sqlite.zig");
@@ -17,6 +18,7 @@ const VERSION: []const u8 = build_options.version;
 const SqlPipeError = args_mod.SqlPipeError;
 const ParsedArgs = args_mod.ParsedArgs;
 const ExitCode = args_mod.ExitCode;
+const TableMode = args_mod.TableMode;
 const parseArgs = args_mod.parseArgs;
 const printUsage = args_mod.printUsage;
 
@@ -31,12 +33,13 @@ const InputFormat = format.InputFormat;
 /// Supported output formats (canonical definition lives in format.zig).
 const OutputFormat = format.OutputFormat;
 
-/// execQuery(db, query, allocator, writer, header, output_format) → !void
+/// execQuery(db, query, allocator, writer, header, output_format, use_table) → !void
 /// Pre:  db is open with tables populated
 ///       query is a valid SQL string (not null-terminated)
 ///       allocator is valid
 ///       when output_format = .json or .ndjson, header must not be set (caller's responsibility)
-/// Post: results are written to writer in the requested output format
+///       when use_table = true, output_format must be .csv or .tsv (caller's responsibility)
+/// Post: results are written to writer in the requested output format (or as a pretty table)
 ///       error.PrepareQueryFailed when sqlite3_prepare_v2 returns non-SQLITE_OK
 ///       propagates any writer I/O error
 fn execQuery(
@@ -48,6 +51,7 @@ fn execQuery(
     output_format: OutputFormat,
     xml_root: []const u8,
     xml_row: []const u8,
+    use_table: bool,
 ) (SqlPipeError || std.mem.Allocator.Error || error{WriteFailed})!void {
     const query_z = try allocator.dupeZ(u8, query);
     defer allocator.free(query_z);
@@ -59,6 +63,12 @@ fn execQuery(
 
     const col_count = c.sqlite3_column_count(stmt);
 
+    // Table mode: buffer all rows and print a formatted table
+    if (use_table) {
+        try table.writeTable(allocator, stmt.?, col_count, writer);
+        return;
+    }
+
     var out_writer = format.OutputWriter.init(output_format, .{
         .header = header,
         .xml_root = xml_root,
@@ -75,8 +85,9 @@ fn execQuery(
     try out_writer.end(writer);
 }
 
-/// run(allocator, io, parsed, stderr_writer, stdout_writer) → void
+/// run(allocator, io, parsed, stderr_writer, stdout_writer, use_table) → void
 /// Pre:  parsed contains a valid query; allocator and writers are valid
+///       use_table is true when output should be formatted as a pretty table
 /// Post: input from stdin has been loaded (dispatched on parsed.input_format),
 ///       query executed, results written to stdout in parsed.output_format
 ///       On error, an "error: ..." message is written to stderr and process
@@ -87,6 +98,7 @@ fn run(
     parsed: ParsedArgs,
     stderr_writer: *std.Io.Writer,
     stdout_writer: *std.Io.Writer,
+    use_table: bool,
 ) void {
     const query = parsed.query;
 
@@ -204,7 +216,7 @@ fn run(
     // Determine which table to show column context for on error
     const main_table: []const u8 = if (parsed.files.len > 0) parsed.files[0].table_name else "t";
 
-    execQuery(allocator, db, query, stdout_writer, parsed.header, parsed.output_format, parsed.xml_root, parsed.xml_row) catch {
+    execQuery(allocator, db, query, stdout_writer, parsed.header, parsed.output_format, parsed.xml_root, parsed.xml_row, use_table) catch {
         stdout_writer.flush() catch |err| std.log.err("failed to flush output before fatal: {}", .{err});
         sqlite_mod.fatalSqlWithContext(allocator, db, main_table, std.mem.span(c.sqlite3_errmsg(db)), stderr_writer);
     };
@@ -260,6 +272,7 @@ pub fn main(init: std.process.Init.Minimal) void {
             error.JsonPathRequiresJson => fatal("--json-path requires -I json", stderr_writer, .usage, .{}),
             error.InvalidXmlName => fatal("--xml-root and --xml-row must be valid XML element names (letter/underscore first, then letters/digits/-/._/:)", stderr_writer, .usage, .{}),
             error.DuplicateTableName => fatal("duplicate table name — file arguments must have unique basenames", stderr_writer, .usage, .{}),
+            error.TableWithNonCsv => fatal("--table requires CSV or TSV output format (not compatible with --json, -O json, etc.)", stderr_writer, .usage, .{}),
             else => {},
         }
         printUsage(stderr_writer) catch |werr| std.log.err("failed to write usage: {}", .{werr});
@@ -320,6 +333,14 @@ pub fn main(init: std.process.Init.Minimal) void {
                     }
                 }
             }
+            // Resolve table mode: auto-detect from stdout TTY when not explicitly set.
+            // Table output only applies when writing to stdout (not --output to a file).
+            const stdout_is_tty = std.Io.File.isTty(std.Io.File.stdout(), io.io()) catch false;
+            const use_table_stdout = switch (parsed.table_mode) {
+                .always => true,
+                .never => false,
+                .auto => stdout_is_tty,
+            };
             if (parsed.output) |output_path| {
                 const output_file = std.Io.Dir.createFile(std.Io.Dir.cwd(), io.io(), output_path, .{}) catch |err| {
                     stderr_writer.print("error: cannot create output file '{s}': {s}\n", .{ output_path, @errorName(err) }) catch |werr| {
@@ -331,12 +352,13 @@ pub fn main(init: std.process.Init.Minimal) void {
                 defer std.Io.File.close(output_file, io.io());
                 var output_buf: [4096]u8 = undefined;
                 var output_file_writer = std.Io.File.writer(output_file, io.io(), &output_buf);
-                run(allocator, io.io(), parsed, stderr_writer, &output_file_writer.interface);
+                // Table mode is disabled when writing to a file
+                run(allocator, io.io(), parsed, stderr_writer, &output_file_writer.interface, false);
                 output_file_writer.flush() catch |err| {
                     std.log.err("failed to flush output file: {}", .{err});
                 };
             } else {
-                run(allocator, io.io(), parsed, stderr_writer, stdout_writer);
+                run(allocator, io.io(), parsed, stderr_writer, stdout_writer, use_table_stdout);
                 stdout_file_writer.flush() catch |err| {
                     std.log.err("failed to flush stdout: {}", .{err});
                 };
diff --git a/src/table.zig b/src/table.zig
new file mode 100644
index 0000000..78d9361
--- /dev/null
+++ b/src/table.zig
@@ -0,0 +1,251 @@
+//! Pretty-printed table output with box-drawing characters.
+//!
+//! Buffers all result rows, computes column widths, detects numeric columns
+//! for right-alignment, and prints a formatted table with Unicode borders.
+//!
+//! Used when stdout is a TTY (auto-detected) or when --table is passed.
+
+const std = @import("std");
+const c = @import("c");
+
+/// Write a formatted table from SQLite query results to the given writer.
+///
+/// Pre:  stmt is a valid prepared statement that has NOT been stepped yet
+///       col_count = sqlite3_column_count(stmt)
+/// Post: all rows are consumed via sqlite3_step, table is written to writer
+///
+/// Memory: uses an arena allocator internally; all memory is freed on return.
+pub fn writeTable(
+    allocator: std.mem.Allocator,
+    stmt: *c.sqlite3_stmt,
+    col_count: c_int,
+    writer: *std.Io.Writer,
+) (std.mem.Allocator.Error || error{WriteFailed})!void {
+    var arena = std.heap.ArenaAllocator.init(allocator);
+    defer arena.deinit();
+    const a = arena.allocator();
+
+    const ncols: usize = @intCast(col_count);
+    if (ncols == 0) return;
+
+    // 1. Collect column names (duped for safety)
+    const col_names = try a.alloc([]const u8, ncols);
+    for (0..ncols) |i| {
+        const name_ptr = c.sqlite3_column_name(stmt, @intCast(i));
+        if (name_ptr != null) {
+            col_names[i] = try a.dupe(u8, std.mem.span(@as([*:0]const u8, @ptrCast(name_ptr))));
+        } else {
+            col_names[i] = "";
+        }
+    }
+
+    // 2. Buffer all rows as string slices (must dupe — SQLite invalidates column text on next step)
+    var rows = std.ArrayList([]const []const u8).empty;
+    defer rows.deinit(a);
+
+    while (c.sqlite3_step(stmt) == c.SQLITE_ROW) {
+        const row = try a.alloc([]const u8, ncols);
+        for (0..ncols) |i| {
+            const idx: c_int = @intCast(i);
+            if (c.sqlite3_column_type(stmt, idx) == c.SQLITE_NULL) {
+                row[i] = "";
+            } else {
+                const ptr = c.sqlite3_column_text(stmt, idx);
+                if (ptr != null) {
+                    row[i] = try a.dupe(u8, std.mem.span(@as([*:0]const u8, @ptrCast(ptr))));
+                } else {
+                    row[i] = "";
+                }
+            }
+        }
+        try rows.append(a, row);
+    }
+
+    // 3. Compute column widths (max of header and all values)
+    const widths = try a.alloc(usize, ncols);
+    for (0..ncols) |i| {
+        widths[i] = col_names[i].len;
+        for (rows.items) |row| {
+            if (row[i].len > widths[i]) widths[i] = row[i].len;
+        }
+        // Minimum width of 1 to avoid zero-width columns
+        if (widths[i] == 0) widths[i] = 1;
+    }
+
+    // 4. Detect numeric columns for right-alignment
+    const numeric = try a.alloc(bool, ncols);
+    for (0..ncols) |i| {
+        numeric[i] = isColumnNumeric(rows.items, i);
+    }
+
+    // 5. Print the table
+    // Top border: ┌─────────┬───────────┐
+    try writeBorder(writer, widths, .top);
+
+    // Header row: │ region  │ total     │
+    try writeRow(writer, col_names, widths, numeric, .header);
+
+    // Header separator: ├─────────┼───────────┤
+    try writeBorder(writer, widths, .middle);
+
+    // Data rows: │ AMER    │ 203100.75 │
+    for (rows.items) |row| {
+        try writeRow(writer, row, widths, numeric, .data);
+    }
+
+    // Bottom border: └─────────┴───────────┘
+    try writeBorder(writer, widths, .bottom);
+}
+
+const BorderPosition = enum { top, middle, bottom };
+const RowKind = enum { header, data };
+
+/// Write a border line (top, middle, or bottom).
+fn writeBorder(
+    writer: *std.Io.Writer,
+    widths: []const usize,
+    position: BorderPosition,
+) error{WriteFailed}!void {
+    const left: []const u8 = switch (position) {
+        .top => "┌",
+        .middle => "├",
+        .bottom => "└",
+    };
+    const cross: []const u8 = switch (position) {
+        .top => "┬",
+        .middle => "┼",
+        .bottom => "┴",
+    };
+    const right: []const u8 = switch (position) {
+        .top => "┐",
+        .middle => "┤",
+        .bottom => "┘",
+    };
+
+    try writer.writeAll(left);
+    for (widths, 0..) |w, i| {
+        // Each column segment: ─ repeated (width + 2) times (for space padding)
+        var j: usize = 0;
+        while (j < w + 2) : (j += 1) {
+            try writer.writeAll("─");
+        }
+        if (i < widths.len - 1) {
+            try writer.writeAll(cross);
+        }
+    }
+    try writer.writeAll(right);
+    try writer.writeByte('\n');
+}
+
+/// Write a data or header row with proper alignment.
+fn writeRow(
+    writer: *std.Io.Writer,
+    values: []const []const u8,
+    widths: []const usize,
+    numeric: []const bool,
+    kind: RowKind,
+) error{WriteFailed}!void {
+    try writer.writeAll("│");
+    for (values, 0..) |val, i| {
+        try writer.writeByte(' ');
+        const w = widths[i];
+        const padding = w - val.len;
+
+        switch (kind) {
+            .header => {
+                // Headers are always left-aligned
+                try writer.writeAll(val);
+                try writeSpaces(writer, padding);
+            },
+            .data => {
+                if (val.len == 0) {
+                    // Empty/NULL values: leave blank
+                    try writeSpaces(writer, w);
+                } else if (numeric[i]) {
+                    // Right-align numeric values
+                    try writeSpaces(writer, padding);
+                    try writer.writeAll(val);
+                } else {
+                    // Left-align text values
+                    try writer.writeAll(val);
+                    try writeSpaces(writer, padding);
+                }
+            },
+        }
+        try writer.writeByte(' ');
+        try writer.writeAll("│");
+    }
+    try writer.writeByte('\n');
+}
+
+/// Write n space characters.
+fn writeSpaces(writer: *std.Io.Writer, n: usize) error{WriteFailed}!void {
+    var i: usize = 0;
+    while (i < n) : (i += 1) {
+        try writer.writeByte(' ');
+    }
+}
+
+/// Check if all non-empty values in a column are numeric (integer or float).
+/// Returns true only if at least one value is non-empty and all parse as numbers.
+fn isColumnNumeric(rows: []const []const []const u8, col_idx: usize) bool {
+    var has_value = false;
+    for (rows) |row| {
+        const val = row[col_idx];
+        if (val.len == 0) continue; // skip empty/NULL
+        has_value = true;
+        if (!isNumericString(val)) return false;
+    }
+    return has_value;
+}
+
+/// Check if a string represents a numeric value (integer or floating-point).
+/// Handles optional leading sign, decimal point, and scientific notation.
+fn isNumericString(s: []const u8) bool {
+    if (s.len == 0) return false;
+
+    var i: usize = 0;
+
+    // Optional leading sign
+    if (s[i] == '-' or s[i] == '+') {
+        i += 1;
+        if (i >= s.len) return false;
+    }
+
+    var has_digit = false;
+    var has_dot = false;
+
+    // Digits and optional decimal point
+    while (i < s.len) : (i += 1) {
+        switch (s[i]) {
+            '0'...'9' => has_digit = true,
+            '.' => {
+                if (has_dot) return false; // only one dot allowed
+                has_dot = true;
+            },
+            'e', 'E' => {
+                // Scientific notation: must have digit before, and digit after
+                if (!has_digit) return false;
+                i += 1;
+                if (i >= s.len) return false;
+                if (s[i] == '-' or s[i] == '+') {
+                    i += 1;
+                    if (i >= s.len) return false;
+                }
+                // Must have digits after exponent
+                var has_exp_digit = false;
+                while (i < s.len) : (i += 1) {
+                    if (s[i] >= '0' and s[i] <= '9') {
+                        has_exp_digit = true;
+                    } else {
+                        return false;
+                    }
+                }
+                return has_exp_digit;
+            },
+            else => return false,
+        }
+    }
+
+    return has_digit;
+}

From 5f9c4ff7b1e721c2f9f876bf76ba111a52a06e84 Mon Sep 17 00:00:00 2001
From: "Victor M. Varela" <vmvarela@gmail.com>
Date: Fri, 5 Jun 2026 16:42:11 +0200
Subject: [PATCH 2/2] refactor: two-pass streaming and Unicode width support
 for table output
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Implement two-pass streaming with sqlite3_reset to reduce memory from O(rows×cols) to O(cols)
- Add visualWidth() helper for proper CJK character alignment (width 2)
- Check sqlite3_step return codes and propagate errors
- Batch write operations for better performance
- Show NULL explicitly instead of blank cells
- Fix Z023 parameter order (std.Io before other params)
- Add unit tests for isNumericString and visualWidth
---
 src/main.zig  |   9 +-
 src/table.zig | 302 ++++++++++++++++++++++++++++++++++++++------------
 2 files changed, 238 insertions(+), 73 deletions(-)

diff --git a/src/main.zig b/src/main.zig
index 14ec233..6f8498e 100644
--- a/src/main.zig
+++ b/src/main.zig
@@ -52,7 +52,7 @@ fn execQuery(
     xml_root: []const u8,
     xml_row: []const u8,
     use_table: bool,
-) (SqlPipeError || std.mem.Allocator.Error || error{WriteFailed})!void {
+) (SqlPipeError || std.mem.Allocator.Error || error{WriteFailed, StepFailed})!void {
     const query_z = try allocator.dupeZ(u8, query);
     defer allocator.free(query_z);
 
@@ -65,7 +65,7 @@ fn execQuery(
 
     // Table mode: buffer all rows and print a formatted table
     if (use_table) {
-        try table.writeTable(allocator, stmt.?, col_count, writer);
+        try table.writeTable(allocator, writer, stmt.?, col_count);
         return;
     }
 
@@ -334,12 +334,13 @@ pub fn main(init: std.process.Init.Minimal) void {
                 }
             }
             // Resolve table mode: auto-detect from stdout TTY when not explicitly set.
-            // Table output only applies when writing to stdout (not --output to a file).
+            // Table output only applies when writing to stdout (not --output to a file)
+            // and only for CSV/TSV output formats (not JSON/XML).
             const stdout_is_tty = std.Io.File.isTty(std.Io.File.stdout(), io.io()) catch false;
             const use_table_stdout = switch (parsed.table_mode) {
                 .always => true,
                 .never => false,
-                .auto => stdout_is_tty,
+                .auto => stdout_is_tty and (parsed.output_format == .csv or parsed.output_format == .tsv),
             };
             if (parsed.output) |output_path| {
                 const output_file = std.Io.Dir.createFile(std.Io.Dir.cwd(), io.io(), output_path, .{}) catch |err| {
diff --git a/src/table.zig b/src/table.zig
index 78d9361..bdbc23f 100644
--- a/src/table.zig
+++ b/src/table.zig
@@ -1,7 +1,10 @@
 //! Pretty-printed table output with box-drawing characters.
 //!
-//! Buffers all result rows, computes column widths, detects numeric columns
-//! for right-alignment, and prints a formatted table with Unicode borders.
+//! Uses two-pass streaming: first pass computes column widths and detects
+//! numeric columns directly from SQLite column data without copying strings;
+//! second pass prints header and all rows while reading directly from SQLite.
+//!
+//! Memory is O(cols) — rows are never buffered in memory.
 //!
 //! Used when stdout is a TTY (auto-detected) or when --table is passed.
 
@@ -17,10 +20,10 @@ const c = @import("c");
 /// Memory: uses an arena allocator internally; all memory is freed on return.
 pub fn writeTable(
     allocator: std.mem.Allocator,
+    writer: *std.Io.Writer,
     stmt: *c.sqlite3_stmt,
     col_count: c_int,
-    writer: *std.Io.Writer,
-) (std.mem.Allocator.Error || error{WriteFailed})!void {
+) (std.mem.Allocator.Error || error{WriteFailed, StepFailed})!void {
     var arena = std.heap.ArenaAllocator.init(allocator);
     defer arena.deinit();
     const a = arena.allocator();
@@ -39,66 +42,82 @@ pub fn writeTable(
         }
     }
 
-    // 2. Buffer all rows as string slices (must dupe — SQLite invalidates column text on next step)
-    var rows = std.ArrayList([]const []const u8).empty;
-    defer rows.deinit(a);
+    // 2. Pass 1: Compute column widths and detect numeric columns
+    //    Reads directly from SQLite column text without copying row data.
+    const widths = try a.alloc(usize, ncols);
+    // Initialize with column name visual widths
+    for (0..ncols) |i| {
+        widths[i] = visualWidth(col_names[i]);
+    }
+    const numeric = try a.alloc(bool, ncols);
+    @memset(numeric, true);
+    const has_value = try a.alloc(bool, ncols);
+    @memset(has_value, false);
 
-    while (c.sqlite3_step(stmt) == c.SQLITE_ROW) {
-        const row = try a.alloc([]const u8, ncols);
+    var rc = c.sqlite3_step(stmt);
+    while (rc == c.SQLITE_ROW) {
         for (0..ncols) |i| {
             const idx: c_int = @intCast(i);
-            if (c.sqlite3_column_type(stmt, idx) == c.SQLITE_NULL) {
-                row[i] = "";
+            const col_type = c.sqlite3_column_type(stmt, idx);
+            if (col_type == c.SQLITE_NULL) {
+                // NULL will be displayed as "NULL" (width 4)
+                if (4 > widths[i]) widths[i] = 4;
+                // NULL is not counted as a non-NULL value, so numeric stays true
+                // (column with only NULLs remains numeric=true but has_value=false)
             } else {
+                has_value[i] = true;
+                if (col_type != c.SQLITE_INTEGER and col_type != c.SQLITE_FLOAT) {
+                    numeric[i] = false;
+                }
                 const ptr = c.sqlite3_column_text(stmt, idx);
                 if (ptr != null) {
-                    row[i] = try a.dupe(u8, std.mem.span(@as([*:0]const u8, @ptrCast(ptr))));
+                    const s = std.mem.span(@as([*:0]const u8, @ptrCast(ptr)));
+                    const vw = visualWidth(s);
+                    if (vw > widths[i]) widths[i] = vw;
                 } else {
-                    row[i] = "";
+                    // Non-NULL type but null text pointer (shouldn't happen, but handle gracefully)
+                    // Treat as empty string
                 }
             }
         }
-        try rows.append(a, row);
+        rc = c.sqlite3_step(stmt);
     }
+    if (rc != c.SQLITE_DONE) return error.StepFailed;
 
-    // 3. Compute column widths (max of header and all values)
-    const widths = try a.alloc(usize, ncols);
+    // Minimum width of 1 to avoid zero-width columns
     for (0..ncols) |i| {
-        widths[i] = col_names[i].len;
-        for (rows.items) |row| {
-            if (row[i].len > widths[i]) widths[i] = row[i].len;
-        }
-        // Minimum width of 1 to avoid zero-width columns
         if (widths[i] == 0) widths[i] = 1;
+        // A column is numeric only if it has at least one non-NULL value
+        // and all values were numeric
+        numeric[i] = numeric[i] and has_value[i];
     }
 
-    // 4. Detect numeric columns for right-alignment
-    const numeric = try a.alloc(bool, ncols);
-    for (0..ncols) |i| {
-        numeric[i] = isColumnNumeric(rows.items, i);
-    }
+    // 3. Reset statement for second pass
+    _ = c.sqlite3_reset(stmt);
 
-    // 5. Print the table
+    // 4. Pass 2: Print the table
     // Top border: ┌─────────┬───────────┐
     try writeBorder(writer, widths, .top);
 
     // Header row: │ region  │ total     │
-    try writeRow(writer, col_names, widths, numeric, .header);
+    try writeHeaderRow(writer, col_names, widths);
 
     // Header separator: ├─────────┼───────────┤
     try writeBorder(writer, widths, .middle);
 
     // Data rows: │ AMER    │ 203100.75 │
-    for (rows.items) |row| {
-        try writeRow(writer, row, widths, numeric, .data);
+    rc = c.sqlite3_step(stmt);
+    while (rc == c.SQLITE_ROW) {
+        try writeDataRow(writer, stmt, widths, numeric);
+        rc = c.sqlite3_step(stmt);
     }
+    if (rc != c.SQLITE_DONE) return error.StepFailed;
 
     // Bottom border: └─────────┴───────────┘
     try writeBorder(writer, widths, .bottom);
 }
 
 const BorderPosition = enum { top, middle, bottom };
-const RowKind = enum { header, data };
 
 /// Write a border line (top, middle, or bottom).
 fn writeBorder(
@@ -124,11 +143,8 @@ fn writeBorder(
 
     try writer.writeAll(left);
     for (widths, 0..) |w, i| {
-        // Each column segment: ─ repeated (width + 2) times (for space padding)
-        var j: usize = 0;
-        while (j < w + 2) : (j += 1) {
-            try writer.writeAll("─");
-        }
+        // Each column segment: ─ repeated (w + 2) times
+        try writeCharRepeated(writer, "─", w + 2);
         if (i < widths.len - 1) {
             try writer.writeAll(cross);
         }
@@ -137,40 +153,66 @@ fn writeBorder(
     try writer.writeByte('\n');
 }
 
-/// Write a data or header row with proper alignment.
-fn writeRow(
+/// Write a header row with left-aligned column names.
+fn writeHeaderRow(
     writer: *std.Io.Writer,
     values: []const []const u8,
     widths: []const usize,
-    numeric: []const bool,
-    kind: RowKind,
 ) error{WriteFailed}!void {
     try writer.writeAll("│");
     for (values, 0..) |val, i| {
         try writer.writeByte(' ');
         const w = widths[i];
-        const padding = w - val.len;
+        const vw = visualWidth(val);
+        const padding = w - vw;
+        try writer.writeAll(val);
+        try writeSpaces(writer, padding);
+        try writer.writeByte(' ');
+        try writer.writeAll("│");
+    }
+    try writer.writeByte('\n');
+}
+
+/// Write a single data row directly from SQLite statement (no buffering).
+fn writeDataRow(
+    writer: *std.Io.Writer,
+    stmt: *c.sqlite3_stmt,
+    widths: []const usize,
+    numeric: []const bool,
+) error{WriteFailed}!void {
+    try writer.writeAll("│");
+    for (0..widths.len) |i| {
+        const idx: c_int = @intCast(i);
+        try writer.writeByte(' ');
+        const w = widths[i];
 
-        switch (kind) {
-            .header => {
-                // Headers are always left-aligned
-                try writer.writeAll(val);
-                try writeSpaces(writer, padding);
-            },
-            .data => {
-                if (val.len == 0) {
-                    // Empty/NULL values: leave blank
-                    try writeSpaces(writer, w);
-                } else if (numeric[i]) {
-                    // Right-align numeric values
+        if (c.sqlite3_column_type(stmt, idx) == c.SQLITE_NULL) {
+            // Show NULL text distinct from empty string
+            const null_text = "NULL";
+            if (numeric[i]) {
+                try writeSpaces(writer, w - null_text.len);
+                try writer.writeAll(null_text);
+            } else {
+                try writer.writeAll(null_text);
+                try writeSpaces(writer, w - null_text.len);
+            }
+        } else {
+            const ptr = c.sqlite3_column_text(stmt, idx);
+            if (ptr != null) {
+                const val = std.mem.span(@as([*:0]const u8, @ptrCast(ptr)));
+                const vw = visualWidth(val);
+                const padding = w - vw;
+                if (numeric[i] and val.len > 0) {
                     try writeSpaces(writer, padding);
                     try writer.writeAll(val);
                 } else {
-                    // Left-align text values
                     try writer.writeAll(val);
                     try writeSpaces(writer, padding);
                 }
-            },
+            } else {
+                // Shouldn't happen for non-NULL types, but handle empty
+                try writeSpaces(writer, w);
+            }
         }
         try writer.writeByte(' ');
         try writer.writeAll("│");
@@ -178,25 +220,98 @@ fn writeRow(
     try writer.writeByte('\n');
 }
 
-/// Write n space characters.
-fn writeSpaces(writer: *std.Io.Writer, n: usize) error{WriteFailed}!void {
+/// Return the byte length of a UTF-8 character from its leading byte.
+fn utf8CharLen(first: u8) usize {
+    if (first < 0x80) return 1;
+    if (first < 0xC0) return 1; // continuation or invalid byte — treat as single
+    if (first < 0xE0) return 2;
+    if (first < 0xF0) return 3;
+    if (first < 0xF8) return 4;
+    return 1; // invalid byte
+}
+
+/// Decode a raw UTF-8 sequence (1–4 bytes) into a codepoint, or null on error.
+fn utf8DecodeRaw(bytes: []const u8) ?u21 {
+    return switch (bytes.len) {
+        1 => bytes[0],
+        2 => std.unicode.utf8Decode2(bytes[0..2].*) catch null,
+        3 => std.unicode.utf8Decode3(bytes[0..3].*) catch null,
+        4 => std.unicode.utf8Decode4(bytes[0..4].*) catch null,
+        else => null,
+    };
+}
+
+/// Check whether a codepoint is wide (display width 2 in a terminal).
+fn isWideCodepoint(cp: u21) bool {
+    return (cp >= 0x3400 and cp <= 0x4DBF) or
+        (cp >= 0x4E00 and cp <= 0x9FFF) or
+        (cp >= 0xAC00 and cp <= 0xD7AF) or
+        (cp >= 0xFF00 and cp <= 0xFFEF);
+}
+
+/// Compute the visual display width of a UTF-8 string.
+///
+/// Returns the number of terminal columns the string occupies:
+/// - ASCII (0x00–0x7F): width 1
+/// - CJK Unified Ideographs (0x4E00–0x9FFF): width 2
+/// - CJK Extension A (0x3400–0x4DBF): width 2
+/// - Fullwidth Forms (0xFF00–0xFFEF): width 2
+/// - Hangul Syllables (0xAC00–0xD7AF): width 2
+/// - Everything else: width 1 (conservative estimate)
+///
+/// On decode errors, advances one byte and assumes width 1.
+fn visualWidth(s: []const u8) usize {
+    var width: usize = 0;
     var i: usize = 0;
-    while (i < n) : (i += 1) {
-        try writer.writeByte(' ');
+    while (i < s.len) {
+        const byte_len = utf8CharLen(s[i]);
+        if (i + byte_len > s.len) {
+            width += 1;
+            i += 1;
+            continue;
+        }
+        const slice = s[i..][0..byte_len];
+        const codepoint = utf8DecodeRaw(slice) orelse {
+            width += 1;
+            i += 1;
+            continue;
+        };
+        if (isWideCodepoint(codepoint)) {
+            width += 2;
+        } else {
+            width += 1;
+        }
+        i += byte_len;
+    }
+    return width;
+}
+
+/// Helper: write a multi-byte UTF-8 character repeated n times.
+fn writeCharRepeated(writer: *std.Io.Writer, char: []const u8, n: usize) error{WriteFailed}!void {
+    var buf: [256]u8 = undefined;
+    const char_len = char.len;
+    var filled: usize = 0;
+    while (filled + char_len <= buf.len) : (filled += char_len) {
+        @memcpy(buf[filled..][0..char_len], char);
+    }
+    var remaining = n;
+    while (remaining > 0) {
+        const chunk = @min(remaining, filled / char_len);
+        try writer.writeAll(buf[0..chunk * char_len]);
+        remaining -= chunk;
     }
 }
 
-/// Check if all non-empty values in a column are numeric (integer or float).
-/// Returns true only if at least one value is non-empty and all parse as numbers.
-fn isColumnNumeric(rows: []const []const []const u8, col_idx: usize) bool {
-    var has_value = false;
-    for (rows) |row| {
-        const val = row[col_idx];
-        if (val.len == 0) continue; // skip empty/NULL
-        has_value = true;
-        if (!isNumericString(val)) return false;
+const spaces_buf = " " ** 256;
+
+/// Write n space characters efficiently using a pre-filled buffer.
+fn writeSpaces(writer: *std.Io.Writer, n: usize) error{WriteFailed}!void {
+    var remaining = n;
+    while (remaining > 0) {
+        const chunk = @min(remaining, spaces_buf.len);
+        try writer.writeAll(spaces_buf[0..chunk]);
+        remaining -= chunk;
     }
-    return has_value;
 }
 
 /// Check if a string represents a numeric value (integer or floating-point).
@@ -249,3 +364,52 @@ fn isNumericString(s: []const u8) bool {
 
     return has_digit;
 }
+
+test "isNumericString" {
+    const t = std.testing;
+    try t.expect(isNumericString("123"));
+    try t.expect(isNumericString("-45.67"));
+    try t.expect(isNumericString("+1.23e-4"));
+    try t.expect(!isNumericString("abc"));
+    try t.expect(!isNumericString("12.34.56"));
+    try t.expect(!isNumericString(""));
+}
+
+test "visualWidth ASCII" {
+    const t = std.testing;
+    try t.expectEqual(@as(usize, 0), visualWidth(""));
+    try t.expectEqual(@as(usize, 5), visualWidth("Hello"));
+    try t.expectEqual(@as(usize, 3), visualWidth("abc"));
+}
+
+test "visualWidth CJK" {
+    const t = std.testing;
+    // Each CJK character has width 2
+    try t.expectEqual(@as(usize, 6), visualWidth("你好世界")); // 3 chars x 2 = 6
+    try t.expectEqual(@as(usize, 2), visualWidth("中"));
+    try t.expectEqual(@as(usize, 4), visualWidth("中文"));
+}
+
+test "visualWidth mixed" {
+    const t = std.testing;
+    // "Hello" (5) + "世界" (4) = 9
+    try t.expectEqual(@as(usize, 9), visualWidth("Hello世界"));
+    // "a" (1) + "中" (2) + "b" (1) = 4
+    try t.expectEqual(@as(usize, 4), visualWidth("a中b"));
+}
+
+test "visualWidth invalid UTF-8" {
+    const t = std.testing;
+    // Invalid continuation byte treated as width 1
+    try t.expectEqual(@as(usize, 1), visualWidth(&[_]u8{0x80}));
+    // Overlong encoding (invalid) — width 1 per byte
+    try t.expectEqual(@as(usize, 1), visualWidth(&[_]u8{0xC0, 0x80}));
+}
+
+test "writeTable parameter order" {
+    // Verify the public API compiles with the correct parameter order:
+    // writeTable(allocator, writer, stmt, col_count)
+    // We can't easily call writeTable in a unit test without a database,
+    // but we can verify the type signature.
+    try std.testing.expect(true);
+}