Skip to content

Commit 221993b

Browse files
committed
fix: open router cache token metering
1 parent bb90595 commit 221993b

File tree

6 files changed

+308
-338
lines changed

6 files changed

+308
-338
lines changed

src/backend/src/modules/puterai/ClaudeService.js

Lines changed: 20 additions & 74 deletions
Original file line numberDiff line numberDiff line change
@@ -25,6 +25,7 @@ const Messages = require('./lib/Messages');
2525
const FSNodeParam = require('../../api/filesystem/FSNodeParam');
2626
const { LLRead } = require('../../filesystem/ll_operations/ll_read');
2727
const { Context } = require('../../util/context');
28+
const mime = require('mime-types');
2829

2930
/**
3031
* ClaudeService class extends BaseService to provide integration with Anthropic's Claude AI models.
@@ -34,10 +35,6 @@ const { Context } = require('../../util/context');
3435
* @extends BaseService
3536
*/
3637
class ClaudeService extends BaseService {
37-
static MODULES = {
38-
Anthropic: require('@anthropic-ai/sdk'),
39-
};
40-
4138
/**
4239
* @type {import('@anthropic-ai/sdk').Anthropic}
4340
*/
@@ -53,7 +50,7 @@ class ClaudeService extends BaseService {
5350
/** @type {import('../../services/MeteringService/MeteringService').MeteringService} */
5451
#meteringService;
5552

56-
async _init() {
53+
async _init () {
5754
this.anthropic = new Anthropic({
5855
apiKey: this.config.apiKey,
5956
// 10 minutes is the default; we need to override the timeout to
@@ -75,7 +72,7 @@ class ClaudeService extends BaseService {
7572
* Returns the default model identifier for Claude API interactions
7673
* @returns {string} The default model ID 'claude-3-5-sonnet-latest'
7774
*/
78-
get_default_model() {
75+
get_default_model () {
7976
return 'claude-3-5-sonnet-latest';
8077
}
8178

@@ -87,7 +84,7 @@ class ClaudeService extends BaseService {
8784
*
8885
* @returns Promise<Array<Object>> Array of model details
8986
*/
90-
async models() {
87+
async models () {
9188
return this.models_();
9289
},
9390

@@ -97,7 +94,7 @@ class ClaudeService extends BaseService {
9794
* @description Retrieves all available model IDs and their aliases,
9895
* flattening them into a single array of strings that can be used for model selection
9996
*/
100-
async list() {
97+
async list () {
10198
const models = this.models_();
10299
const model_names = [];
103100
for ( const model of models ) {
@@ -118,10 +115,10 @@ class ClaudeService extends BaseService {
118115
* @returns {Object} Returns either a TypedValue with streaming response or a completion object
119116
* @this {ClaudeService}
120117
*/
121-
async complete({ messages, stream, model, tools, max_tokens, temperature }) {
118+
async complete ({ messages, stream, model, tools, max_tokens, temperature }) {
122119
tools = FunctionCalling.make_claude_tools(tools);
123120
// console.log("here are the messages: ", messages)
124-
121+
125122
let system_prompts;
126123
// unsure why system_prompts is an array but it always seems to only have exactly one element,
127124
// and the real array of system_prompts seems to be the [0].content -- NS
@@ -140,32 +137,32 @@ class ClaudeService extends BaseService {
140137
}
141138

142139
messages = messages.map(message => {
143-
if (message.cache_control) {
140+
if ( message.cache_control ) {
144141
message.content[0].cache_control = message.cache_control;
145142
}
146143
delete message.cache_control;
147-
return message
148-
})
144+
return message;
145+
});
149146

150147
const sdk_params = {
151148
model: model ?? this.get_default_model(),
152149
max_tokens: Math.floor(max_tokens) ||
153150
((
154151
model === 'claude-3-5-sonnet-20241022'
155152
|| model === 'claude-3-5-sonnet-20240620'
156-
) ? 8192 : this.models_().filter(e=>e.name === model)[0].max_tokens || 4096), //required
153+
) ? 8192 : this.models_().filter(e => e.name === model)[0].max_tokens || 4096), //required
157154
temperature: temperature || 0, // required
158155
...( (system_prompts && system_prompts[0]?.content) ? {
159-
system: system_prompts[0]?.content
156+
system: system_prompts[0]?.content,
160157
} : {}),
161158
tool_choice: {
162-
type: "auto",
163-
disable_parallel_tool_use: true
159+
type: 'auto',
160+
disable_parallel_tool_use: true,
164161
},
165162
messages,
166163
...(tools ? { tools } : {}),
167164
};
168-
console.log(sdk_params.max_tokens)
165+
console.log(sdk_params.max_tokens);
169166

170167
// console.log('\x1B[26;1m ===== SDK PARAMETERS', require('util').inspect(sdk_params, undefined, Infinity));
171168

@@ -201,8 +198,6 @@ class ClaudeService extends BaseService {
201198
fsNode: task.node,
202199
});
203200

204-
const require = this.require;
205-
const mime = require('mime-types');
206201
const mimeType = mime.contentType(await task.node.get('name'));
207202

208203
beta_mode = true;
@@ -228,12 +223,6 @@ class ClaudeService extends BaseService {
228223
return 'container_upload';
229224
})();
230225

231-
// {
232-
// 'application/pdf': 'document',
233-
// 'text/plain': 'document',
234-
// 'image/': 'image'
235-
// }[mimeType];
236-
237226
delete task.contentPart.puter_path,
238227
task.contentPart.type = contentBlockTypeForFileBasedOnMime;
239228
task.contentPart.source = {
@@ -251,7 +240,7 @@ class ClaudeService extends BaseService {
251240
try {
252241
await this.anthropic.beta.files.delete(task.file_id,
253242
{ betas: ['files-api-2025-04-14'] });
254-
} catch (e) {
243+
} catch (e) {
255244
this.errors.report('claude:file-delete-task', {
256245
source: e,
257246
trace: true,
@@ -328,26 +317,7 @@ class ClaudeService extends BaseService {
328317
}
329318
chatStream.end();
330319

331-
this.billForUsage(actor, model || this.get_default_model(), usageSum);
332-
333-
// Log token usage statistics
334-
const totalTokens = usageSum.input_tokens + usageSum.output_tokens;
335-
const cachedTokens = usageSum.ephemeral_5m_input_tokens + usageSum.ephemeral_1h_input_tokens;
336-
const cacheHits = usageSum.cache_read_input_tokens;
337-
const uncachedTokens = usageSum.input_tokens - cacheHits - cachedTokens;
338-
339-
// console.log(`
340-
// ╔══════════════════════════════════════════════════════════════╗
341-
// ║ 🎯 Token Usage Statistics 🎯 ║
342-
// ╠══════════════════════════════════════════════════════════════╣
343-
// ║ 📊 Total Tokens Used: ${String(totalTokens).padStart(10)} 📊 ║
344-
// ║ 💾 Cached Tokens: ${String(cachedTokens).padStart(10)} 💾 ║
345-
// ║ ✅ Cache Hits: ${String(cacheHits).padStart(10)} ✅ ║
346-
// ║ 🔄 Uncached Tokens: ${String(uncachedTokens).padStart(10)} 🔄 ║
347-
// ║ 📥 Input Tokens: ${String(usageSum.input_tokens).padStart(10)} 📥 ║
348-
// ║ 📤 Output Tokens: ${String(usageSum.output_tokens).padStart(10)} 📤 ║
349-
// ╚══════════════════════════════════════════════════════════════╝
350-
// `);
320+
this.#meteringService.utilRecordUsageObject(usageSum, actor, `claude:${this.models_().find(m => [m.id, ...(m.aliases || [])].includes(model || this.get_default_model())).id}`);
351321
};
352322

353323
return {
@@ -361,26 +331,7 @@ class ClaudeService extends BaseService {
361331
await cleanup_files();
362332

363333
const usage = this.usageFormatterUtil(msg.usage);
364-
this.billForUsage(actor, model || this.get_default_model(), usage);
365-
366-
// Log token usage statistics
367-
const totalTokens = usage.input_tokens + usage.output_tokens;
368-
const cachedTokens = usage.ephemeral_5m_input_tokens + usage.ephemeral_1h_input_tokens;
369-
const cacheHits = usage.cache_read_input_tokens;
370-
const uncachedTokens = usage.input_tokens - cacheHits - cachedTokens;
371-
372-
// console.log(`
373-
// ╔══════════════════════════════════════════════════════════════╗
374-
// ║ 🎯 Token Usage Statistics 🎯 ║
375-
// ╠══════════════════════════════════════════════════════════════╣
376-
// ║ 📊 Total Tokens Used: ${String(totalTokens).padStart(10)} 📊 ║
377-
// ║ 💾 Cached Tokens: ${String(cachedTokens).padStart(10)} 💾 ║
378-
// ║ ✅ Cache Hits: ${String(cacheHits).padStart(10)} ✅ ║
379-
// ║ 🔄 Uncached Tokens: ${String(uncachedTokens).padStart(10)} 🔄 ║
380-
// ║ 📥 Input Tokens: ${String(usage.input_tokens).padStart(10)} 📥 ║
381-
// ║ 📤 Output Tokens: ${String(usage.output_tokens).padStart(10)} 📤 ║
382-
// ╚══════════════════════════════════════════════════════════════╝
383-
// `);
334+
this.#meteringService.utilRecordUsageObject(usage, actor, `claude:${this.models_().find(m => [m.id, ...(m.aliases || [])].includes(model || this.get_default_model())).id}`);
384335

385336
// TODO DS: cleanup old usage tracking
386337
return {
@@ -394,7 +345,7 @@ class ClaudeService extends BaseService {
394345

395346
// TODO DS: get this inside the class as a private method once the methods aren't exported directly
396347
/** @type {(usage: import("@anthropic-ai/sdk/resources/messages.js").Usage | import("@anthropic-ai/sdk/resources/beta/messages/messages.js").BetaUsage) => {}}) */
397-
usageFormatterUtil(usage) {
348+
usageFormatterUtil (usage) {
398349
return {
399350
input_tokens: usage?.input_tokens || 0,
400351
ephemeral_5m_input_tokens: usage?.cache_creation?.ephemeral_5m_input_tokens || usage.cache_creation_input_tokens || 0, // this is because their API is a bit inconsistent
@@ -404,11 +355,6 @@ class ClaudeService extends BaseService {
404355
};
405356
};
406357

407-
// TODO DS: get this inside the class as a private method once the methods aren't exported directly
408-
billForUsage(actor, model, usage) {
409-
this.#meteringService.utilRecordUsageObject(usage, actor, `claude:${this.models_().find(m => [m.id, ...(m.aliases || [])].includes(model)).id}`);
410-
};
411-
412358
/**
413359
* Retrieves available Claude AI models and their specifications
414360
* @returns Array of model objects containing:
@@ -421,7 +367,7 @@ class ClaudeService extends BaseService {
421367
* - max_output: Maximum output tokens
422368
* - training_cutoff: Training data cutoff date
423369
*/
424-
models_() {
370+
models_ () {
425371
return [
426372
{
427373
id: 'claude-haiku-4-5-20251001',

src/backend/src/modules/puterai/OllamaService.js

Lines changed: 27 additions & 24 deletions
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,6 @@
1818
*/
1919

2020
// METADATA // {"ai-commented":{"service":"claude"}}
21-
const APIError = require('../../api/APIError');
2221
const BaseService = require('../../services/BaseService');
2322
const OpenAIUtil = require('./lib/OpenAIUtil');
2423
const { Context } = require('../../util/context');
@@ -42,7 +41,7 @@ class OllamaService extends BaseService {
4241
* Gets the system prompt used for AI interactions
4342
* @returns {string} The base system prompt that identifies the AI as running on Puter
4443
*/
45-
adapt_model(model) {
44+
adapt_model (model) {
4645
return model;
4746
}
4847

@@ -51,14 +50,14 @@ class OllamaService extends BaseService {
5150
* @private
5251
* @returns {Promise<void>} Resolves when initialization is complete
5352
*/
54-
async _init() {
53+
async _init () {
5554
// Ollama typically runs on HTTP, not HTTPS
5655
this.api_base_url = this.config?.api_base_url || 'http://localhost:11434';
5756

5857
// OpenAI SDK is used to interact with the Ollama API
5958
this.openai = new this.modules.openai.OpenAI({
60-
apiKey: "ollama", // Ollama doesn't use an API key, it uses the "ollama" string
61-
baseURL: this.api_base_url + '/v1',
59+
apiKey: 'ollama', // Ollama doesn't use an API key, it uses the "ollama" string
60+
baseURL: `${this.api_base_url }/v1`,
6261
});
6362
this.kvkey = this.modules.uuidv4();
6463

@@ -74,7 +73,7 @@ class OllamaService extends BaseService {
7473
* Returns the default model identifier for the Ollama service
7574
* @returns {string} The default model ID 'gpt-oss:20b'
7675
*/
77-
get_default_model() {
76+
get_default_model () {
7877
return 'gpt-oss:20b';
7978
}
8079

@@ -86,7 +85,7 @@ class OllamaService extends BaseService {
8685
*
8786
* @returns Promise<Array<Object>> Array of model details
8887
*/
89-
async models() {
88+
async models () {
9089
return await this.models_();
9190
},
9291
/**
@@ -95,7 +94,7 @@ class OllamaService extends BaseService {
9594
* @description Retrieves all available model IDs and their aliases,
9695
* flattening them into a single array of strings that can be used for model selection
9796
*/
98-
async list() {
97+
async list () {
9998
const models = await this.models_();
10099
const model_names = [];
101100
for ( const model of models ) {
@@ -108,7 +107,7 @@ class OllamaService extends BaseService {
108107
* AI Chat completion method.
109108
* See AIChatService for more details.
110109
*/
111-
async complete({ messages, stream, model, tools, max_tokens, temperature }) {
110+
async complete ({ messages, stream, model, tools, max_tokens, temperature }) {
112111
model = this.adapt_model(model);
113112

114113
if ( model.startsWith('ollama:') ) {
@@ -128,19 +127,23 @@ class OllamaService extends BaseService {
128127
...(stream ? {
129128
stream_options: { include_usage: true },
130129
} : {}),
131-
}
130+
};
132131

133132
const completion = await this.openai.chat.completions.create(sdk_params);
134133

135-
const modelDetails = (await this.models_()).find(m => m.id === 'ollama:' + model);
134+
const modelDetails = (await this.models_()).find(m => m.id === `ollama:${model}`);
136135
return OpenAIUtil.handle_completion_output({
137136
usage_calculator: ({ usage }) => {
138-
// custom open router logic because its free
137+
139138
const trackedUsage = {
140-
prompt: 0,
141-
completion: 0,
142-
input_cache_read: 0,
139+
prompt: (usage.prompt_tokens ?? 0 ) - (usage.prompt_tokens_details?.cached_tokens ?? 0),
140+
completion: usage.completion_tokens ?? 0,
141+
input_cache_read: usage.prompt_tokens_details?.cached_tokens ?? 0,
143142
};
143+
const costOverwrites = Object.fromEntries(Object.keys(trackedUsage).map((k) => {
144+
return [k, 0]; // override to 0 since local is free
145+
}));
146+
this.meteringService.utilRecordUsageObject(trackedUsage, actor, modelDetails.id, { costOverwrites });
144147
const legacyCostCalculator = OpenAIUtil.create_usage_calculator({
145148
model_details: modelDetails,
146149
});
@@ -162,31 +165,31 @@ class OllamaService extends BaseService {
162165
* - cost: Pricing information object with currency and rates
163166
* @private
164167
*/
165-
async models_(rawPriceKeys = false) {
168+
async models_ (_rawPriceKeys = false) {
166169
const axios = this.require('axios');
167170

168171
let models = this.modules.kv.get(`${this.kvkey}:models`);
169-
if ( !models ) {
172+
if ( ! models ) {
170173
try {
171174
const resp = await axios.request({
172175
method: 'GET',
173-
url: this.api_base_url + '/api/tags',
176+
url: `${this.api_base_url }/api/tags`,
174177
});
175178
models = resp.data.models || [];
176179
if ( models.length > 0 ) {
177180
this.modules.kv.set(`${this.kvkey}:models`, models);
178181
}
179-
} catch (error) {
182+
} catch ( error ) {
180183
this.log.error('Failed to fetch models from Ollama:', error.message);
181184
// Return empty array if Ollama is not available
182185
return [];
183186
}
184187
}
185-
188+
186189
if ( !models || models.length === 0 ) {
187190
return [];
188191
}
189-
192+
190193
const coerced_models = [];
191194
for ( const model of models ) {
192195
// Ollama API returns models with 'name' property, not 'model'
@@ -196,8 +199,8 @@ class OllamaService extends BaseService {
196199
output: 0,
197200
};
198201
coerced_models.push({
199-
id: 'ollama:' + modelName,
200-
name: modelName + ' (Ollama)',
202+
id: `ollama:${ modelName}`,
203+
name: `${modelName } (Ollama)`,
201204
max_tokens: model.size || model.max_context || 8192,
202205
cost: {
203206
currency: 'usd-cents',
@@ -206,7 +209,7 @@ class OllamaService extends BaseService {
206209
},
207210
});
208211
}
209-
console.log("coerced_models", coerced_models);
212+
console.log('coerced_models', coerced_models);
210213
return coerced_models;
211214
}
212215
}

0 commit comments

Comments (0)