This repository was archived by the owner on Sep 12, 2024. It is now read-only.

Commit e82222d

feature: implemented parallel inference for llama-rs, implemented naive sequential async inference for llama-cpp and rwkv-cpp (#52)
* feat: support parallel inference for llama-rs, support sequential async for llama-cpp and rwkv-cpp
1 parent a311873 · commit e82222d

Showing 32 changed files with 558 additions and 1,415 deletions.
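
Across the examples below, the user-facing change is that LLama.create now resolves asynchronously, and one-shot calls such as tokenize and getWordEmbeddings return promises instead of taking callbacks, while inference keeps its streaming callback. A minimal sketch of the migrated call pattern, assuming the relative import path and the ggml-alpaca model path used by the repo's own examples:

// Sketch only: mirrors the updated examples in packages/core/example.
// The import path and model path are the ones the examples use and may
// need adjusting for your setup.
import { LLama, InferenceResultType } from "../index";
import path from "path";

const run = async () => {
  // create() is now awaited before the instance is used.
  const llama = await LLama.create({
    path: path.resolve(process.cwd(), "../../ggml-alpaca-7b-q4.bin"),
    numCtxTokens: 128,
  });

  // tokenize() resolves with the tokens instead of invoking a callback.
  const tokens = await llama.tokenize("My favourite animal is the cat");
  console.log(tokens);

  // inference() still streams results through a callback.
  llama.inference(
    {
      prompt: "how are you",
      numPredict: 128,
      temp: 0.2,
      topP: 1,
      topK: 40,
      repeatPenalty: 1,
      repeatLastN: 64,
      seed: 0,
      feedPrompt: true,
    },
    (response) => {
      if (response.type === InferenceResultType.Data) {
        process.stdout.write(response.data?.token ?? "");
      } else {
        console.log(response);
      }
    }
  );
};

run();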

packages/cli/src/index.ts

Lines changed: 2 additions & 2 deletions
@@ -12,7 +12,7 @@ import { existsSync } from "fs";
 
 const convertType = ["q4_0", "q4_1", "f16", "f32"] as const;
 
-type ConvertType = typeof convertType[number];
+type ConvertType = (typeof convertType)[number];
 
 interface CLIInferenceArguments extends LLamaInferenceArguments, LLamaConfig {
   logger?: boolean;
@@ -75,7 +75,7 @@ class InferenceCommand implements yargs.CommandModule {
     if (logger) {
      LLama.enableLogger();
    }
-    const llama = LLama.create({ path: absolutePath, numCtxTokens });
+    const llama = await LLama.create({ path: absolutePath, numCtxTokens });
    llama.inference(rest, (result) => {
      switch (result.type) {
        case InferenceResultType.Data:

packages/core/__test__/index.spec.ts

Lines changed: 1 addition & 1 deletion
@@ -6,7 +6,7 @@ test(
   async () => {
     LLama.enableLogger();
 
-    const llama = LLama.create({
+    const llama = await LLama.create({
      path: process.env.model?.toString()!,
      numCtxTokens: 128,
    });

packages/core/example/cachesession.ts

Lines changed: 36 additions & 32 deletions
@@ -6,46 +6,50 @@ const saveSession = path.resolve(process.cwd(), "./tmp/session.bin");
 
 LLama.enableLogger();
 
-const llama = LLama.create({
-  path: model,
-  numCtxTokens: 128,
-});
+const run = async () => {
+  const llama = await LLama.create({
+    path: model,
+    numCtxTokens: 128,
+  });
 
-const template = `how are you`;
+  const template = `how are you`;
 
-const prompt = `Below is an instruction that describes a task. Write a response that appropriately completes the request.
+  const prompt = `Below is an instruction that describes a task. Write a response that appropriately completes the request.
 
 ### Instruction:
 
 ${template}
 
 ### Response:`;
 
-llama.inference(
-  {
-    prompt,
-    numPredict: 128,
-    temp: 0.2,
-    topP: 1,
-    topK: 40,
-    repeatPenalty: 1,
-    repeatLastN: 64,
-    seed: 0,
-    feedPrompt: true,
-    feedPromptOnly: true,
-    saveSession,
-  },
-  (response) => {
-    switch (response.type) {
-      case InferenceResultType.Data: {
-        process.stdout.write(response.data?.token ?? "");
-        break;
-      }
-      case InferenceResultType.End:
-      case InferenceResultType.Error: {
-        console.log(response);
-        break;
+  llama.inference(
+    {
+      prompt,
+      numPredict: 128,
+      temp: 0.2,
+      topP: 1,
+      topK: 40,
+      repeatPenalty: 1,
+      repeatLastN: 64,
+      seed: 0,
+      feedPrompt: true,
+      feedPromptOnly: true,
+      saveSession,
+    },
+    (response) => {
+      switch (response.type) {
+        case InferenceResultType.Data: {
+          process.stdout.write(response.data?.token ?? "");
+          break;
+        }
+        case InferenceResultType.End:
+        case InferenceResultType.Error: {
+          console.log(response);
+          break;
+        }
       }
     }
-  }
-);
+  );
+};
+
+run();

packages/core/example/embedding.ts

Lines changed: 35 additions & 39 deletions
@@ -1,51 +1,47 @@
-import { EmbeddingResultType, LLama } from "../index";
+import { LLama } from "../index";
 import path from "path";
 import fs from "fs";
 
 const model = path.resolve(process.cwd(), "../../ggml-alpaca-7b-q4.bin");
 
 LLama.enableLogger();
 
-const llama = LLama.create({
-  path: model,
-  numCtxTokens: 128,
-});
-
-const getWordEmbeddings = (prompt: string, file: string) => {
-  llama.getWordEmbeddings(
-    {
-      prompt,
-      numPredict: 128,
-      temp: 0.2,
-      topP: 1,
-      topK: 40,
-      repeatPenalty: 1,
-      repeatLastN: 64,
-      seed: 0,
-    },
-    (response) => {
-      switch (response.type) {
-        case EmbeddingResultType.Data: {
-          fs.writeFileSync(
-            path.resolve(process.cwd(), file),
-            JSON.stringify(response.data)
-          );
-          break;
-        }
-        case EmbeddingResultType.Error: {
-          console.log(response);
-          break;
-        }
-      }
-    }
+const getWordEmbeddings = async (
+  llama: LLama,
+  prompt: string,
+  file: string
+) => {
+  const response = await llama.getWordEmbeddings({
+    prompt,
+    numPredict: 128,
+    temp: 0.2,
+    topP: 1,
+    topK: 40,
+    repeatPenalty: 1,
+    repeatLastN: 64,
+    seed: 0,
+  });
+
+  fs.writeFileSync(
+    path.resolve(process.cwd(), file),
+    JSON.stringify(response)
   );
 };
 
-const dog1 = `My favourite animal is the dog`;
-getWordEmbeddings(dog1, "./example/semantic-compare/dog1.json");
+const run = async () => {
+  const llama = await LLama.create({
+    path: model,
+    numCtxTokens: 128,
+  });
+
+  const dog1 = `My favourite animal is the dog`;
+  getWordEmbeddings(llama, dog1, "./example/semantic-compare/dog1.json");
 
-const dog2 = `I have just adopted a cute dog`;
-getWordEmbeddings(dog2, "./example/semantic-compare/dog2.json");
+  const dog2 = `I have just adopted a cute dog`;
+  getWordEmbeddings(llama, dog2, "./example/semantic-compare/dog2.json");
+
+  const cat1 = `My favourite animal is the cat`;
+  getWordEmbeddings(llama, cat1, "./example/semantic-compare/cat1.json");
+};
 
-const cat1 = `My favourite animal is the cat`;
-getWordEmbeddings(cat1, "./example/semantic-compare/cat1.json");
+run();
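
Because getWordEmbeddings now resolves with the embedding result, several prompts could in principle be requested concurrently and awaited together. A hedged sketch reusing the prompts from the example above; the Promise.all fan-out assumes the llama-rs backend tolerates concurrent requests (as the commit title's "parallel inference" suggests) and is not something the example itself does:

// Hypothetical fan-out over the promise-based embeddings API.
// Assumes concurrent calls are safe on the llama-rs backend.
const embedAll = async (llama: LLama) => {
  const prompts = [
    `My favourite animal is the dog`,
    `I have just adopted a cute dog`,
    `My favourite animal is the cat`,
  ];

  // Issue all embedding requests at once and wait for every result.
  const embeddings = await Promise.all(
    prompts.map((prompt) =>
      llama.getWordEmbeddings({
        prompt,
        numPredict: 128,
        temp: 0.2,
        topP: 1,
        topK: 40,
        repeatPenalty: 1,
        repeatLastN: 64,
        seed: 0,
      })
    )
  );

  return embeddings;
};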

packages/core/example/inference.ts

Lines changed: 33 additions & 31 deletions
@@ -6,45 +6,47 @@ const model = path.resolve(process.cwd(), "../../ggml-alpaca-7b-q4.bin");
 
 LLama.enableLogger();
 
-const llama = LLama.create({
-  path: model,
-  numCtxTokens: 128,
-});
+const run = async () => {
+  const llama = await LLama.create({
+    path: model,
+    numCtxTokens: 128,
+  });
 
-const template = `how are you`;
+  const template = `how are you`;
 
-const prompt = `Below is an instruction that describes a task. Write a response that appropriately completes the request.
+  const prompt = `Below is an instruction that describes a task. Write a response that appropriately completes the request.
 
 ### Instruction:
 
 ${template}
 
 ### Response:`;
 
-llama.inference(
-  {
-    prompt,
-    numPredict: 128,
-    temp: 0.2,
-    topP: 1,
-    topK: 40,
-    repeatPenalty: 1,
-    repeatLastN: 64,
-    seed: 0,
-    feedPrompt: true,
-    // persistSession,
-  },
-  (response) => {
-    switch (response.type) {
-      case InferenceResultType.Data: {
-        process.stdout.write(response.data?.token ?? "");
-        break;
-      }
-      case InferenceResultType.End:
-      case InferenceResultType.Error: {
-        console.log(response);
-        break;
+  llama.inference(
+    {
+      prompt,
+      numPredict: 128,
+      temp: 0.2,
+      topP: 1,
+      topK: 40,
+      repeatPenalty: 1,
+      repeatLastN: 64,
+      seed: 0,
+      feedPrompt: true,
+    },
+    (response) => {
+      switch (response.type) {
+        case InferenceResultType.Data: {
+          process.stdout.write(response.data?.token ?? "");
+          break;
+        }
+        case InferenceResultType.End:
+        case InferenceResultType.Error: {
+          console.log(response);
+          break;
+        }
      }
    }
-  }
-);
+  );
+};
+run();

packages/core/example/loadsession.ts

Lines changed: 32 additions & 28 deletions
@@ -6,34 +6,38 @@ const loadSession = path.resolve(process.cwd(), "./tmp/session.bin");
 
 LLama.enableLogger();
 
-const llama = LLama.create({
-  path: model,
-  numCtxTokens: 128,
-});
+const run = async () => {
+  const llama = await LLama.create({
+    path: model,
+    numCtxTokens: 128,
+  });
 
-llama.inference(
-  {
-    prompt: "",
-    numPredict: 128,
-    temp: 0.2,
-    topP: 1,
-    topK: 40,
-    repeatPenalty: 1,
-    repeatLastN: 64,
-    seed: 0,
-    loadSession,
-  },
-  (response) => {
-    switch (response.type) {
-      case InferenceResultType.Data: {
-        process.stdout.write(response.data?.token ?? "");
-        break;
-      }
-      case InferenceResultType.End:
-      case InferenceResultType.Error: {
-        console.log(response);
-        break;
+  llama.inference(
+    {
+      prompt: "",
+      numPredict: 128,
+      temp: 0.2,
+      topP: 1,
+      topK: 40,
+      repeatPenalty: 1,
+      repeatLastN: 64,
+      seed: 0,
+      loadSession,
+    },
+    (response) => {
+      switch (response.type) {
+        case InferenceResultType.Data: {
+          process.stdout.write(response.data?.token ?? "");
+          break;
+        }
+        case InferenceResultType.End:
+        case InferenceResultType.Error: {
+          console.log(response);
+          break;
+        }
      }
    }
-  }
-);
+  );
+};
+
+run();

packages/core/example/tokenize.ts

Lines changed: 12 additions & 9 deletions
@@ -5,14 +5,17 @@ const model = path.resolve(process.cwd(), "../../ggml-alpaca-7b-q4.bin");
 
 LLama.enableLogger();
 
-const llama = LLama.create({
-  path: model,
-  numCtxTokens: 128,
-});
+const run = async () => {
+  const llama = await LLama.create({
+    path: model,
+    numCtxTokens: 128,
+  });
 
-const prompt = "My favourite animal is the cat";
+  const prompt = "My favourite animal is the cat";
 
-llama.tokenize(prompt, (response) => {
-  console.log(response);
-  console.log(response.data.length); // 7
-});
+  const tokens = await llama.tokenize(prompt);
+
+  console.log(tokens);
+};
+
+run();
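
With tokenize returning a promise, a caller can await the token count inline, for example to check a prompt against the context window before running inference. A small sketch; it assumes tokenize resolves with the token array (as the old callback's response.data.length check suggests), and the 128 limit simply mirrors numCtxTokens in the example:

// Illustrative guard built on the promise-based tokenize().
// The limit is an assumption taken from the example's numCtxTokens.
const fitsContext = async (llama: LLama, prompt: string, limit = 128) => {
  const tokens = await llama.tokenize(prompt);
  return tokens.length <= limit;
};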
