π File detail
utils/sliceAnsi.ts
π§© .tsπ 92 linesπΎ 3,343 bytesπ text
β Back to All Filesπ― Use case
This file lives under βutils/β, which covers cross-cutting helpers (shell, tempfiles, settings, messages, process input, β¦). On the API surface it exposes sliceAnsi β mainly functions, hooks, or classes. Dependencies touch @alcalzone. It composes internal code from ink (relative imports).
Generated from folder role, exports, dependency roots, and inline comments β not hand-reviewed for every path.
π§ Inline summary
import { type AnsiCode, ansiCodesToString, reduceAnsiCodes, tokenize,
π€ Exports (heuristic)
sliceAnsidefault
π External import roots
Package roots from from "β¦" (relative paths omitted).
@alcalzone
π₯οΈ Source preview
import {
type AnsiCode,
ansiCodesToString,
reduceAnsiCodes,
tokenize,
undoAnsiCodes,
} from '@alcalzone/ansi-tokenize'
import { stringWidth } from '../ink/stringWidth.js'
// A code is an "end code" if its code equals its endCode (e.g., hyperlink close)
function isEndCode(code: AnsiCode): boolean {
return code.code === code.endCode
}
// Filter to only include "start codes" (not end codes)
function filterStartCodes(codes: AnsiCode[]): AnsiCode[] {
return codes.filter(c => !isEndCode(c))
}
/**
* Slice a string containing ANSI escape codes.
*
* Unlike the slice-ansi package, this properly handles OSC 8 hyperlink
* sequences because @alcalzone/ansi-tokenize tokenizes them correctly.
*/
export default function sliceAnsi(
str: string,
start: number,
end?: number,
): string {
// Don't pass `end` to tokenize β it counts code units, not display cells,
// so it drops tokens early for text with zero-width combining marks.
const tokens = tokenize(str)
let activeCodes: AnsiCode[] = []
let position = 0
let result = ''
let include = false
for (const token of tokens) {
// Advance by display width, not code units. Combining marks (Devanagari
// matras, virama, diacritics) are width 0 β counting them via .length
// advanced position past `end` early and truncated the slice. Callers
// pass start/end in display cells (via stringWidth), so position must
// track the same units.
const width =
token.type === 'ansi' ? 0 : token.fullWidth ? 2 : stringWidth(token.value)
// Break AFTER trailing zero-width marks β a combining mark attaches to
// the preceding base char, so "ΰ€ΰ€Ύ" (ΰ€ + ΰ€Ύ, 1 display cell) sliced at
// end=1 must include the ΰ€Ύ. Breaking on position >= end BEFORE the
// zero-width check would drop it and render ΰ€ bare. ANSI codes are
// width 0 but must NOT be included past end (they open new style runs
// that leak into the undo sequence), so gate on char type too. The
// !include guard ensures empty slices (start===end) stay empty even
// when the string starts with a zero-width char (BOM, ZWJ).
if (end !== undefined && position >= end) {
if (token.type === 'ansi' || width > 0 || !include) break
}
if (token.type === 'ansi') {
activeCodes.push(token)
if (include) {
// Emit all ANSI codes during the slice
result += token.code
}
} else {
if (!include && position >= start) {
// Skip leading zero-width marks at the start boundary β they belong
// to the preceding base char in the left half. Without this, the
// mark appears in BOTH halves: left+right β original. Only applies
// when start > 0 (otherwise there's no preceding char to own it).
if (start > 0 && width === 0) continue
include = true
// Reduce and filter to only active start codes
activeCodes = filterStartCodes(reduceAnsiCodes(activeCodes))
result = ansiCodesToString(activeCodes)
}
if (include) {
result += token.value
}
position += width
}
}
// Only undo start codes that are still active
const activeStartCodes = filterStartCodes(reduceAnsiCodes(activeCodes))
result += ansiCodesToString(undoAnsiCodes(activeStartCodes))
return result
}