π File detail
utils/readEditContext.ts
π§© .tsπ 228 linesπΎ 7,224 bytesπ text
β Back to All Filesπ― Use case
This file lives under βutils/β, which covers cross-cutting helpers (shell, tempfiles, settings, messages, process input, β¦). On the API surface it exposes CHUNK_SIZE, MAX_SCAN_BYTES, EditContext, readEditContext, and openForScan (and more) β mainly functions, hooks, or classes. Dependencies touch Node filesystem. It composes internal code from errors (relative imports).
Generated from folder role, exports, dependency roots, and inline comments β not hand-reviewed for every path.
π§ Inline summary
import { type FileHandle, open } from 'fs/promises' import { isENOENT } from './errors.js' export const CHUNK_SIZE = 8 * 1024 export const MAX_SCAN_BYTES = 10 * 1024 * 1024
π€ Exports (heuristic)
CHUNK_SIZEMAX_SCAN_BYTESEditContextreadEditContextopenForScanscanForContextreadCapped
π External import roots
Package roots from from "β¦" (relative paths omitted).
fs
π₯οΈ Source preview
import { type FileHandle, open } from 'fs/promises'
import { isENOENT } from './errors.js'
export const CHUNK_SIZE = 8 * 1024
export const MAX_SCAN_BYTES = 10 * 1024 * 1024
const NL = 0x0a
export type EditContext = {
/** Slice of the file: contextLines before/after the match, on line boundaries. */
content: string
/** 1-based line number of content's first line in the original file. */
lineOffset: number
/** True if MAX_SCAN_BYTES was hit without finding the needle. */
truncated: boolean
}
/**
* Finds `needle` in the file at `path` and returns a context-window slice
* containing the match plus `contextLines` of surrounding context on each side.
*
* Scans in 8KB chunks with a straddle overlap so matches crossing a chunk
* boundary are found. Capped at MAX_SCAN_BYTES. No stat β EOF detected via
* bytesRead.
*
* React callers: wrap in useState lazy-init then use() + Suspense. useMemo
* re-runs when callers pass fresh array literals.
*
* Returns null on ENOENT. Returns { truncated: true, content: '' } if the
* needle isn't found within MAX_SCAN_BYTES.
*/
export async function readEditContext(
path: string,
needle: string,
contextLines = 3,
): Promise<EditContext | null> {
const handle = await openForScan(path)
if (handle === null) return null
try {
return await scanForContext(handle, needle, contextLines)
} finally {
await handle.close()
}
}
/**
* Opens `path` for reading. Returns null on ENOENT. Caller owns close().
*/
export async function openForScan(path: string): Promise<FileHandle | null> {
try {
return await open(path, 'r')
} catch (e) {
if (isENOENT(e)) return null
throw e
}
}
/**
* Handle-accepting core of readEditContext. Caller owns open/close.
*/
export async function scanForContext(
handle: FileHandle,
needle: string,
contextLines: number,
): Promise<EditContext> {
if (needle === '') return { content: '', lineOffset: 1, truncated: false }
const needleLF = Buffer.from(needle, 'utf8')
// Model sends LF; files may be CRLF. Count newlines to size the overlap for
// the longer CRLF form; defer encoding the CRLF buffer until LF scan misses.
let nlCount = 0
for (let i = 0; i < needleLF.length; i++) if (needleLF[i] === NL) nlCount++
let needleCRLF: Buffer | undefined
const overlap = needleLF.length + nlCount - 1
const buf = Buffer.allocUnsafe(CHUNK_SIZE + overlap)
let pos = 0
let linesBeforePos = 0
let prevTail = 0
while (pos < MAX_SCAN_BYTES) {
const { bytesRead } = await handle.read(buf, prevTail, CHUNK_SIZE, pos)
if (bytesRead === 0) break
const viewLen = prevTail + bytesRead
let matchAt = indexOfWithin(buf, needleLF, viewLen)
let matchLen = needleLF.length
if (matchAt === -1 && nlCount > 0) {
needleCRLF ??= Buffer.from(needle.replaceAll('\n', '\r\n'), 'utf8')
matchAt = indexOfWithin(buf, needleCRLF, viewLen)
matchLen = needleCRLF.length
}
if (matchAt !== -1) {
const absMatch = pos - prevTail + matchAt
return await sliceContext(
handle,
buf,
absMatch,
matchLen,
contextLines,
linesBeforePos + countNewlines(buf, 0, matchAt),
)
}
pos += bytesRead
// Shift the tail to the front for straddle. linesBeforePos tracks
// newlines in bytes we've DISCARDED (not in buf) β count only the
// non-overlap portion we're about to copyWithin over.
const nextTail = Math.min(overlap, viewLen)
linesBeforePos += countNewlines(buf, 0, viewLen - nextTail)
prevTail = nextTail
buf.copyWithin(0, viewLen - prevTail, viewLen)
}
return { content: '', lineOffset: 1, truncated: pos >= MAX_SCAN_BYTES }
}
/**
* Reads the entire file via `handle` up to MAX_SCAN_BYTES. Returns null if the
* file exceeds the cap. For the multi-edit path in FileEditToolDiff where
* sequential replacements need the full string.
*
* Single buffer, doubles on fill β ~log2(size/8KB) allocs instead of O(n)
* chunks + concat. Reads directly into the right offset; no intermediate copies.
*/
export async function readCapped(handle: FileHandle): Promise<string | null> {
let buf = Buffer.allocUnsafe(CHUNK_SIZE)
let total = 0
for (;;) {
if (total === buf.length) {
const grown = Buffer.allocUnsafe(
Math.min(buf.length * 2, MAX_SCAN_BYTES + CHUNK_SIZE),
)
buf.copy(grown, 0, 0, total)
buf = grown
}
const { bytesRead } = await handle.read(
buf,
total,
buf.length - total,
total,
)
if (bytesRead === 0) break
total += bytesRead
if (total > MAX_SCAN_BYTES) return null
}
return normalizeCRLF(buf, total)
}
/** buf.indexOf bounded to [0, end) without allocating a view. */
function indexOfWithin(buf: Buffer, needle: Buffer, end: number): number {
const at = buf.indexOf(needle)
return at === -1 || at + needle.length > end ? -1 : at
}
function countNewlines(buf: Buffer, start: number, end: number): number {
let n = 0
for (let i = start; i < end; i++) if (buf[i] === NL) n++
return n
}
/** Decode buf[0..len) to utf8, normalizing CRLF only if CR is present. */
function normalizeCRLF(buf: Buffer, len: number): string {
const s = buf.toString('utf8', 0, len)
return s.includes('\r') ? s.replaceAll('\r\n', '\n') : s
}
/**
* Given an absolute match offset, read Β±contextLines around it and return
* the decoded slice with its starting line number. Reuses `scratch` (the
* caller's scan buffer) for back/forward/output reads β zero new allocs
* when the context fits, one alloc otherwise.
*/
async function sliceContext(
handle: FileHandle,
scratch: Buffer,
matchStart: number,
matchLen: number,
contextLines: number,
linesBeforeMatch: number,
): Promise<EditContext> {
// Scan backward from matchStart to find contextLines prior newlines.
const backChunk = Math.min(matchStart, CHUNK_SIZE)
const { bytesRead: backRead } = await handle.read(
scratch,
0,
backChunk,
matchStart - backChunk,
)
let ctxStart = matchStart
let nlSeen = 0
for (let i = backRead - 1; i >= 0 && nlSeen <= contextLines; i--) {
if (scratch[i] === NL) {
nlSeen++
if (nlSeen > contextLines) break
}
ctxStart--
}
// Compute lineOffset now, before scratch is overwritten by the forward read.
const walkedBack = matchStart - ctxStart
const lineOffset =
linesBeforeMatch -
countNewlines(scratch, backRead - walkedBack, backRead) +
1
// Scan forward from matchEnd to find contextLines trailing newlines.
const matchEnd = matchStart + matchLen
const { bytesRead: fwdRead } = await handle.read(
scratch,
0,
CHUNK_SIZE,
matchEnd,
)
let ctxEnd = matchEnd
nlSeen = 0
for (let i = 0; i < fwdRead; i++) {
ctxEnd++
if (scratch[i] === NL) {
nlSeen++
if (nlSeen >= contextLines + 1) break
}
}
// Read the exact context range. Reuse scratch if it fits.
const len = ctxEnd - ctxStart
const out = len <= scratch.length ? scratch : Buffer.allocUnsafe(len)
const { bytesRead: outRead } = await handle.read(out, 0, len, ctxStart)
return { content: normalizeCRLF(out, outRead), lineOffset, truncated: false }
}