
Commit 755e6ea (release: v0.1.0)

Parent: e82222d

File tree: 27 files changed (+191, -136 lines)

example/js/langchain/langchain.js

Lines changed: 1 addition & 1 deletion
@@ -18,8 +18,8 @@ const config = {
     embedding: true,
     useMmap: true,
 };
-llama.load(config);
 const run = async () => {
+    await llama.load(config);
     // Load the docs into the vector store
     const vectorStore = await MemoryVectorStore.fromTexts(["Hello world", "Bye bye", "hello nice world"], [{ id: 2 }, { id: 1 }, { id: 3 }], new LLamaEmbeddings({ maxConcurrency: 1 }, llama));
     // Search for the most similar document
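A sketch of the whole file after this change. The hunk elides the imports and the head of `config`, so the import paths, the model path, and the final similarity search below are assumptions reconstructed from the visible code, not part of the diff:

import { LLM } from "llama-node";
import { LLamaCpp } from "llama-node/dist/llm/llama-cpp.js";
import { LLamaEmbeddings } from "llama-node/dist/extensions/langchain.js";
import { MemoryVectorStore } from "langchain/vectorstores/memory";
import path from "path";

const llama = new LLM(LLamaCpp);
const config = {
    modelPath: path.resolve(process.cwd(), "../ggml-model.bin"), // hypothetical path
    // ...remaining config fields elided by the hunk...
    embedding: true,
    useMmap: true,
};

const run = async () => {
    // The fix: loading now completes before any embedding request is issued.
    await llama.load(config);
    // Load the docs into the vector store
    const vectorStore = await MemoryVectorStore.fromTexts(
        ["Hello world", "Bye bye", "hello nice world"],
        [{ id: 2 }, { id: 1 }, { id: 3 }],
        new LLamaEmbeddings({ maxConcurrency: 1 }, llama)
    );
    // Search for the most similar document (assumed call; the hunk ends here)
    console.log(await vectorStore.similaritySearch("hello world", 1));
};
run();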

example/js/llama-cpp/embedding.js

Lines changed: 5 additions & 2 deletions
@@ -16,7 +16,6 @@ const config = {
     embedding: true,
     useMmap: true,
 };
-llama.load(config);
 const prompt = `Who is the president of the United States?`;
 const params = {
     nThreads: 4,
@@ -27,4 +26,8 @@ const params = {
     repeatPenalty: 1,
     prompt,
 };
-llama.getEmbedding(params).then(console.log);
+const run = async () => {
+    await llama.load(config);
+    await llama.getEmbedding(params).then(console.log);
+};
+run();
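For reference, a sketch of the resulting file. The imports, the model path, and the middle of `params` sit in elided context and are assumptions here:

import { LLM } from "llama-node";
import { LLamaCpp } from "llama-node/dist/llm/llama-cpp.js";
import path from "path";

const llama = new LLM(LLamaCpp);
const config = {
    modelPath: path.resolve(process.cwd(), "../ggml-model.bin"), // hypothetical path
    // ...remaining config fields elided by the hunk...
    embedding: true,
    useMmap: true,
};

const prompt = `Who is the president of the United States?`;
const params = {
    nThreads: 4,
    // ...sampling fields elided by the hunk...
    repeatPenalty: 1,
    prompt,
};

const run = async () => {
    await llama.load(config); // previously fire-and-forget
    await llama.getEmbedding(params).then(console.log);
};
run();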

example/js/llama-cpp/inference.js

Lines changed: 9 additions & 5 deletions
@@ -16,19 +16,23 @@ const config = {
     embedding: false,
     useMmap: true,
 };
-llama.load(config);
 const template = `How are you?`;
 const prompt = `A chat between a user and an assistant.
 USER: ${template}
 ASSISTANT:`;
-llama.createCompletion({
+const params = {
     nThreads: 4,
     nTokPredict: 2048,
     topK: 40,
     topP: 0.1,
     temp: 0.2,
     repeatPenalty: 1,
     prompt,
-}, (response) => {
-    process.stdout.write(response.token);
-});
+};
+const run = async () => {
+    await llama.load(config);
+    await llama.createCompletion(params, (response) => {
+        process.stdout.write(response.token);
+    });
+};
+run();
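This hunk shows the motivation most clearly: `llama.load(config)` used to run fire-and-forget, so `createCompletion` could hit a model that had not finished loading. A sketch of the resulting file, with the elided imports and config head filled in as assumptions:

import { LLM } from "llama-node";
import { LLamaCpp } from "llama-node/dist/llm/llama-cpp.js";
import path from "path";

const llama = new LLM(LLamaCpp);
const config = {
    modelPath: path.resolve(process.cwd(), "../ggml-model.bin"), // hypothetical path
    // ...remaining config fields elided by the hunk...
    embedding: false,
    useMmap: true,
};

const template = `How are you?`;
const prompt = `A chat between a user and an assistant.
USER: ${template}
ASSISTANT:`;
const params = {
    nThreads: 4,
    nTokPredict: 2048,
    topK: 40,
    topP: 0.1,
    temp: 0.2,
    repeatPenalty: 1,
    prompt,
};

const run = async () => {
    await llama.load(config); // completes before the completion request
    await llama.createCompletion(params, (response) => {
        process.stdout.write(response.token); // stream tokens as they arrive
    });
};
run();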

example/js/llama-cpp/tokenize.js

Lines changed: 5 additions & 2 deletions
@@ -16,6 +16,9 @@ const config = {
     embedding: false,
     useMmap: true,
 };
-llama.load(config);
 const content = "how are you?";
-llama.tokenize({ content, nCtx: 2048 }).then(console.log);
+const run = async () => {
+    await llama.load(config);
+    await llama.tokenize({ content, nCtx: 2048 }).then(console.log);
+};
+run();
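The committed call mixes `await` with `.then`, which resolves correctly but is redundant; an equivalent form, assuming the same `llama` and `config` as the other llama-cpp examples:

const run = async () => {
    await llama.load(config);
    // Same behavior as `await llama.tokenize({...}).then(console.log)`:
    const tokens = await llama.tokenize({ content: "how are you?", nCtx: 2048 });
    console.log(tokens);
};
run();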

example/js/llama-rs/embedding.js

Lines changed: 1 addition & 1 deletion
@@ -4,7 +4,6 @@ import path from "path";
 import fs from "fs";
 const model = path.resolve(process.cwd(), "../ggml-alpaca-7b-q4.bin");
 const llama = new LLM(LLamaRS);
-llama.load({ path: model });
 const getWordEmbeddings = async (prompt, file) => {
     const data = await llama.getEmbedding({
         prompt,
@@ -20,6 +19,7 @@ const getWordEmbeddings = async (prompt, file) => {
     await fs.promises.writeFile(path.resolve(process.cwd(), file), JSON.stringify(data));
 };
 const run = async () => {
+    await llama.load({ path: model });
     const dog1 = `My favourite animal is the dog`;
     await getWordEmbeddings(dog1, "./example/semantic-compare/dog1.json");
     const dog2 = `I have just adopted a cute dog`;
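The dog1/dog2 files feed a semantic-comparison step elsewhere in the example tree. A hypothetical follow-up, not part of this commit, comparing the two saved vectors with cosine similarity (top-level await works because example/package.json sets "type": "module"):

import fs from "fs";
import path from "path";

// Illustrative helper: cosine similarity between two embedding vectors.
const cosine = (a, b) => {
    let dot = 0, na = 0, nb = 0;
    for (let i = 0; i < a.length; i++) {
        dot += a[i] * b[i];
        na += a[i] * a[i];
        nb += b[i] * b[i];
    }
    return dot / (Math.sqrt(na) * Math.sqrt(nb));
};

const read = async (file) =>
    JSON.parse(await fs.promises.readFile(path.resolve(process.cwd(), file), "utf8"));

const dog1 = await read("./example/semantic-compare/dog1.json");
const dog2 = await read("./example/semantic-compare/dog2.json");
console.log(cosine(dog1, dog2)); // similar sentences should score close to 1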

example/js/llama-rs/inference.js

Lines changed: 9 additions & 5 deletions
@@ -3,7 +3,6 @@ import { LLamaRS } from "llama-node/dist/llm/llama-rs.js";
 import path from "path";
 const model = path.resolve(process.cwd(), "../ggml-alpaca-7b-q4.bin");
 const llama = new LLM(LLamaRS);
-llama.load({ path: model });
 const template = `how are you`;
 const prompt = `Below is an instruction that describes a task. Write a response that appropriately completes the request.
 
@@ -12,7 +11,7 @@ const prompt = `Below is an instruction that describes a task. Write a response
 ${template}
 
 ### Response:`;
-llama.createCompletion({
+const params = {
     prompt,
     numPredict: 128,
     temp: 0.2,
@@ -22,6 +21,11 @@ llama.createCompletion({
     repeatLastN: 64,
     seed: 0,
     feedPrompt: true,
-}, (response) => {
-    process.stdout.write(response.token);
-});
+};
+const run = async () => {
+    await llama.load({ path: model });
+    await llama.createCompletion(params, (response) => {
+        process.stdout.write(response.token);
+    });
+};
+run();
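The resulting file, for reference; the `### Instruction:` heading and a few sampling fields fall in elided context, so those lines are assumptions based on the surrounding Alpaca-style prompt:

import { LLM } from "llama-node";
import { LLamaRS } from "llama-node/dist/llm/llama-rs.js";
import path from "path";

const model = path.resolve(process.cwd(), "../ggml-alpaca-7b-q4.bin");
const llama = new LLM(LLamaRS);
const template = `how are you`;
const prompt = `Below is an instruction that describes a task. Write a response that appropriately completes the request.

### Instruction:

${template}

### Response:`;
const params = {
    prompt,
    numPredict: 128,
    temp: 0.2,
    // ...sampling fields elided by the hunk...
    repeatLastN: 64,
    seed: 0,
    feedPrompt: true,
};

const run = async () => {
    await llama.load({ path: model }); // moved inside run() by this commit
    await llama.createCompletion(params, (response) => {
        process.stdout.write(response.token);
    });
};
run();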

example/js/llama-rs/tokenize.js

Lines changed: 5 additions & 2 deletions
@@ -3,6 +3,9 @@ import { LLamaRS } from "llama-node/dist/llm/llama-rs.js";
 import path from "path";
 const model = path.resolve(process.cwd(), "../ggml-alpaca-7b-q4.bin");
 const llama = new LLM(LLamaRS);
-llama.load({ path: model });
 const content = "how are you?";
-llama.tokenize(content).then(console.log);
+const run = async () => {
+    await llama.load({ path: model });
+    await llama.tokenize(content).then(console.log);
+};
+run();
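Worth noting with the two tokenize examples side by side: the backends take different argument shapes, and both diffs in this commit preserve that difference:

// llama-rs: tokenize takes a plain string (this file)
await llama.tokenize("how are you?").then(console.log);
// llama-cpp: tokenize takes an options object (example/js/llama-cpp/tokenize.js)
await llama.tokenize({ content: "how are you?", nCtx: 2048 }).then(console.log);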

example/js/rwkv-cpp/inference.js

Lines changed: 9 additions & 5 deletions
@@ -10,18 +10,22 @@ const config = {
     nThreads: 4,
     enableLogging: true,
 };
-rwkv.load(config);
 const template = `Who is the president of the United States?`;
 const prompt = `Below is an instruction that describes a task. Write a response that appropriately completes the request.
 
 ### Instruction: ${template}
 
 ### Response:`;
-rwkv.createCompletion({
+const params = {
     maxPredictLength: 2048,
     topP: 0.1,
     temp: 0.1,
     prompt,
-}, (response) => {
-    process.stdout.write(response.token);
-});
+};
+const run = async () => {
+    await rwkv.load(config);
+    await rwkv.createCompletion(params, (response) => {
+        process.stdout.write(response.token);
+    });
+};
+run();
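A sketch of the resulting RWKV example. The import lines and the head of `config` (model and tokenizer paths) are not in the hunk, so those names and paths are assumptions:

import { LLM } from "llama-node";
import { RwkvCpp } from "llama-node/dist/llm/rwkv-cpp.js"; // assumed import path
import path from "path";

const rwkv = new LLM(RwkvCpp);
const config = {
    modelPath: path.resolve(process.cwd(), "../rwkv-model.bin"),     // hypothetical
    tokenizerPath: path.resolve(process.cwd(), "../tokenizer.json"), // hypothetical
    nThreads: 4,
    enableLogging: true,
};

const template = `Who is the president of the United States?`;
const prompt = `Below is an instruction that describes a task. Write a response that appropriately completes the request.

### Instruction: ${template}

### Response:`;
const params = {
    maxPredictLength: 2048,
    topP: 0.1,
    temp: 0.1,
    prompt,
};

const run = async () => {
    await rwkv.load(config);
    await rwkv.createCompletion(params, (response) => {
        process.stdout.write(response.token);
    });
};
run();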

example/js/rwkv-cpp/tokenize.js

Lines changed: 5 additions & 2 deletions
@@ -10,5 +10,8 @@ const config = {
     nThreads: 4,
     enableLogging: true,
 };
-rwkv.load(config);
-rwkv.tokenize({ content: "hello world" }).then(console.log);
+const run = async () => {
+    await rwkv.load(config);
+    await rwkv.tokenize({ content: "hello world" }).then(console.log);
+};
+run();
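Because example/package.json declares "type": "module", every one of these scripts could also use top-level await; the run() wrapper is a stylistic choice that keeps all nine examples uniform:

// Equivalent under ESM top-level await, shown for comparison only:
await rwkv.load(config);
console.log(await rwkv.tokenize({ content: "hello world" }));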

example/package.json

Lines changed: 5 additions & 5 deletions
@@ -1,6 +1,6 @@
 {
     "name": "@llama-node/examples",
-    "version": "0.0.37",
+    "version": "0.1.0",
     "description": "",
     "main": "index.js",
     "type": "module",
@@ -18,9 +18,9 @@
         "langchain": "^0.0.56"
     },
     "dependencies": {
-        "@llama-node/core": "0.0.37",
-        "@llama-node/llama-cpp": "0.0.37",
-        "@llama-node/rwkv-cpp": "0.0.37",
-        "llama-node": "0.0.37"
+        "@llama-node/core": "0.1.0",
+        "@llama-node/llama-cpp": "0.1.0",
+        "@llama-node/rwkv-cpp": "0.1.0",
+        "llama-node": "0.1.0"
     }
 }
