Add chunk command, add limit param to split command

This commit is contained in:
2026-04-06 09:22:13 -05:00
parent 055babc9f3
commit 32aa8dc3d1
4 changed files with 121 additions and 4 deletions

101
src/vm/commands/chunk.ts Normal file
View File

@@ -0,0 +1,101 @@
import {Command, ParseContext, StrTerm, TypeError, wrapDestructured, wrapString} from "./command.js";
import {LexInput} from "../lexer.js";
import {StrVM} from "../vm.js";
import {log} from "../../log.js";
type ChunkData = {
every: StrTerm,
type: 'line'|'word'|'char',
}
export class Chunk extends Command<ChunkData> {
private logger = log.getStreamLogger('cmd-chunk')
async attemptParse(context: ParseContext): Promise<ChunkData> {
return {
every: await context.popTerm(),
type: context.popKeywordInSet(['line', 'word', 'char']).value,
}
}
getDisplayName(): string {
return 'chunk'
}
isParseCandidate(token: LexInput): boolean {
return this.isKeyword(token, 'chunk')
}
async execute(vm: StrVM, data: ChunkData): Promise<StrVM> {
return vm.replaceContextMatchingTerm(ctx => ({
destructure: sub => {
const every = ctx.resolveInt(data.every)
let delimiter: RegExp|string|undefined = undefined
if ( data.type === 'line' ) {
delimiter = '\n'
} else if ( data.type === 'char' ) {
delimiter = ''
} else if ( data.type === 'word' ) {
delimiter = /\s+/sg
}
if ( typeof delimiter === 'undefined' ) {
// This would only happen if we add a case to `type` and don't handle it above.
throw new TypeError('Could not resolve delimiter.')
}
this.logger.debug({ every, delimiter })
const chunks = this.chunkByDelimiter(sub, delimiter, every)
this.logger.verbose({ chunks })
return chunks.map(part => ({
prefix: part[0],
value: wrapString(part[1]),
}))
},
}))
}
private chunkByDelimiter(sub: string, delimiter: string|RegExp, nth: number): [string|undefined, string][] {
if ( typeof delimiter === 'string' && delimiter ) {
delimiter = new RegExp(delimiter.replace(/[/\-\\^$*+?.()|[\]{}]/g, '\\$&'), 'sg')
}
const separators = delimiter instanceof RegExp ? [...sub.matchAll(delimiter)] : []
const parts = sub.split(delimiter)
this.logger.verbose({ parts, separators })
const chunkSeparators: string[] = []
const chunks = []
let chunk = 0
let acc = ''
for ( let i = 0; i < parts.length; i += 1 ) {
if ( !(i % nth) && chunk ) {
chunks.push(acc)
chunk = 0
acc = ''
}
if ( chunk ) {
acc += separators[i - 1]?.[0] || ''
} else {
const chunkSeparator = separators[i - 1]?.[0] || ''
this.logger.verbose({ i, chunkSeparator })
chunkSeparators.push(chunkSeparator)
}
acc += parts[i]
chunk += 1
}
chunks.push(acc)
return chunks.map((chunk, idx) => [
idx ? chunkSeparators[idx] : undefined,
chunk,
])
}
}

View File

@@ -49,11 +49,13 @@ import {Assign} from "./assign.js";
import {Zip} from "./zip.js";
import {Concat} from "./concat.js";
import {Call} from "./call.js";
import {Chunk} from "./chunk.js";
export type Commands = Command<CommandData>[]
export const commands: Commands = [
new Assign,
new Call,
new Chunk,
new Clear,
new Concat,
new Contains,

View File

@@ -1,4 +1,4 @@
import {Command, CommandData, ParseContext, StrLVal} from "./command.js";
import {Command, CommandData, ParseContext, StrLVal, wrapString} from "./command.js";
import {Executable} from "../parse.js";
import {LexInput} from "../lexer.js";
import {StrVM} from "../vm.js";
@@ -26,7 +26,7 @@ export class Over extends Command<OverData> {
async execute(vm: StrVM, data: OverData): Promise<StrVM> {
return vm.tapInPlace(async parentCtx => {
const oldValue = parentCtx.resolveRequired(data.subject)
const oldValue = parentCtx.resolve(data.subject) || wrapString('')
const newValue = await vm.runInChild(async (child, childCtx) => {
await childCtx.replaceSubject(() => oldValue)
await data.exec.command.execute(child, data.exec.data)

View File

@@ -5,13 +5,14 @@ import {Awaitable} from "../../util/types.js";
export type SplitData = {
on: StrTerm,
with?: StrTerm,
limit?: StrTerm,
}
export class Split extends Command<SplitData> {
async attemptParse(context: ParseContext): Promise<SplitData> {
return {
on: await context.popTerm(),
limit: await context.popOptionalTerm(),
}
}
@@ -27,7 +28,20 @@ export class Split extends Command<SplitData> {
return vm.replaceContextMatchingTerm(ctx => ({
destructure: sub => {
const prefix = ctx.resolveString(data.on)
return sub.split(prefix)
let parts = sub.split(prefix)
if ( data.limit ) {
// If there was a limit, only split the specified number of times:
const limit = ctx.resolveInt(data.limit)
const head = parts.slice(0, limit)
const tail = parts.slice(limit)
parts = head
if ( tail.length ) {
parts.push(tail.join(prefix))
}
}
return parts
.map((segment, idx) => ({
prefix: idx ? prefix : undefined,
value: wrapString(segment),