import { LLM } from "llama-node"; import { LLamaCpp, type LoadConfig } from "llama-node/dist/llm/llama-cpp.js"; import path from "path"; const model = path.resolve(process.cwd(), "../ggml-vic7b-q5_1.bin"); const llama = new LLM(LLamaCpp); const config: LoadConfig = { modelPath: model, enableLogging: true, nCtx: 1024, seed: 0, f16Kv: false, logitsAll: false, vocabOnly: false, useMlock: false, embedding: true, useMmap: true, nGpuLayers: 0 }; const prompt = `Who is the president of the United States?`; const params = { nThreads: 4, nTokPredict: 2048, topK: 40, topP: 0.1, temp: 0.2, repeatPenalty: 1, prompt, }; const run = async () => { await llama.load(config); await llama.getEmbedding(params).then(console.log); }; run();