39 lines
1.0 KiB
TypeScript
39 lines
1.0 KiB
TypeScript
import { CommandModule } from "yargs";
|
|
import { BuildGpu, LlamaNuma } from "../../bindings/types.js";
|
|
/**
 * Shape of the parsed arguments for the `CompleteCommand` yargs command module
 * (used as the second type argument of `CommandModule` in the declaration of
 * that constant).
 *
 * Members marked with `?` may be absent; all other members are required by
 * this type.
 *
 * NOTE(review): the meaning and defaults of the individual options are defined
 * by the command implementation, which is not part of this declaration —
 * confirm there before relying on any specific semantics.
 */
type CompleteCommand = {
    modelPath?: string;
    header?: string[];
    // Either a `BuildGpu` value or the literal "auto".
    gpu?: BuildGpu | "auto";
    systemInfo: boolean;
    text?: string;
    textFile?: string;
    contextSize?: number;
    batchSize?: number;
    flashAttention?: boolean;
    swaFullCache?: boolean;
    threads?: number;
    temperature: number;
    minP: number;
    topK: number;
    topP: number;
    seed?: number;
    gpuLayers?: number;
    repeatPenalty: number;
    lastTokensRepeatPenalty: number;
    penalizeRepeatingNewLine: boolean;
    repeatFrequencyPenalty?: number;
    repeatPresencePenalty?: number;
    maxTokens: number;
    tokenPredictionDraftModel?: string;
    tokenPredictionModelContextSize?: number;
    debug: boolean;
    numa?: LlamaNuma;
    meter: boolean;
    timing: boolean;
    noMmap: boolean;
    noDirectIo: boolean;
    printTimings: boolean;
};
|
|
/**
 * yargs command module whose command-specific arguments are typed by the
 * `CompleteCommand` type alias (the constant and the type share a name; they
 * live in separate value/type namespaces).
 *
 * This is an ambient declaration only — the implementation is not in this file.
 */
export declare const CompleteCommand: CommandModule<object, CompleteCommand>;
|
|
// Empty export: makes TypeScript treat this file as a module rather than a global script.
export {};
|