Skip to content

Commit 846322f

Browse files
kolaente and alejandrodnm
authored and committed
feat: add OpenAI's async batch API support for vectorizer
Adds support for OpenAI's async batch API to process large amounts of embeddings at a lower cost, and higher rate limits.

Key features:
- New AsyncBatchEmbedder interface for handling async batch operations
- Support for OpenAI's batch API implementation
- New database tables for tracking batch status and chunks
- Configurable polling interval for batch status checks
- Automatic retry mechanism for failed batches

Database changes:
- New async_batch_queue_table for tracking batch status
- New async_batch_chunks_table for storing chunks pending processing
- Added async_batch_polling_interval column to vectorizer table
- New SQL functions for managing async batch operations

API changes:
- New async_batch_enabled parameter in ai.embedding_openai()
- New ai.vectorizer_enable_async_batches() and ai.vectorizer_disable_async_batches() functions
- Extended vectorizer configuration to support async batch operations

The async batch workflow:
1. Chunks are collected and submitted as a batch to OpenAI
2. Batch status is monitored through polling
3. When ready, embeddings are retrieved and stored
4. Batch resources are cleaned up after successful processing
1 parent 3427bcc commit 846322f

21 files changed

+5027
-1456
lines changed

projects/extension/sql/idempotent/008-embedding.sql

+2
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,7 @@ create or replace function ai.embedding_openai
77
, chat_user pg_catalog.text default null
88
, api_key_name pg_catalog.text default 'OPENAI_API_KEY'
99
, base_url text default null
10+
, async_batch_enabled pg_catalog.bool default false
1011
) returns pg_catalog.jsonb
1112
as $func$
1213
select json_object
@@ -17,6 +18,7 @@ as $func$
1718
, 'user': chat_user
1819
, 'api_key_name': api_key_name
1920
, 'base_url': base_url
21+
, 'async_batch_enabled': async_batch_enabled
2022
absent on null
2123
)
2224
$func$ language sql immutable security invoker

projects/extension/sql/idempotent/013-vectorizer-api.sql

+47-2
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,3 @@
1-
2-
31
-------------------------------------------------------------------------------
42
-- execute_vectorizer
53
create or replace function ai.execute_vectorizer(vectorizer_id pg_catalog.int4) returns void
@@ -31,6 +29,9 @@ create or replace function ai.create_vectorizer
3129
, queue_table pg_catalog.name default null
3230
, grant_to pg_catalog.name[] default ai.grant_to()
3331
, enqueue_existing pg_catalog.bool default true
32+
, async_batch_queue_table pg_catalog.name default null
33+
, async_batch_chunks_table pg_catalog.name default null
34+
, async_batch_polling_interval pg_catalog.interval default '5 minutes'::pg_catalog.interval
3435
) returns pg_catalog.int4
3536
as $func$
3637
declare
@@ -44,6 +45,7 @@ declare
4445
_vectorizer_id pg_catalog.int4;
4546
_sql pg_catalog.text;
4647
_job_id pg_catalog.int8;
48+
_async_batch_supported pg_catalog.bool;
4749
begin
4850
-- make sure all the roles listed in grant_to exist
4951
if grant_to is not null then
@@ -117,6 +119,14 @@ begin
117119
_trigger_name = pg_catalog.concat('_vectorizer_src_trg_', _vectorizer_id);
118120
queue_schema = coalesce(queue_schema, 'ai');
119121
queue_table = coalesce(queue_table, pg_catalog.concat('_vectorizer_q_', _vectorizer_id));
122+
async_batch_queue_table = coalesce(
123+
async_batch_queue_table,
124+
pg_catalog.concat('_vectorizer_async_batch_q_', _vectorizer_id)
125+
);
126+
async_batch_chunks_table = coalesce(
127+
async_batch_chunks_table,
128+
pg_catalog.concat('_vectorizer_async_batch_chunks_', _vectorizer_id)
129+
);
120130

121131
-- make sure view name is available
122132
if pg_catalog.to_regclass(pg_catalog.format('%I.%I', view_schema, view_name)) is not null then
@@ -133,6 +143,16 @@ begin
133143
raise exception 'an object named %.% already exists. specify an alternate queue_table explicitly', queue_schema, queue_table;
134144
end if;
135145

146+
-- make sure embedding batch table name is available
147+
if pg_catalog.to_regclass(pg_catalog.format('%I.%I', queue_schema, async_batch_queue_table)) is not null then
148+
raise exception 'an object named %.% already exists. specify an alternate async_batch_queue_table explicitly', queue_schema, async_batch_queue_table;
149+
end if;
150+
151+
-- make sure embedding batch chunks table name is available
152+
if pg_catalog.to_regclass(pg_catalog.format('%I.%I', queue_schema, async_batch_chunks_table)) is not null then
153+
raise exception 'an object named %.% already exists. specify an alternate async_batch_chunks_table explicitly', queue_schema, async_batch_chunks_table;
154+
end if;
155+
136156
-- validate the embedding config
137157
perform ai._validate_embedding(embedding);
138158

@@ -225,6 +245,25 @@ begin
225245
scheduling = pg_catalog.jsonb_insert(scheduling, array['job_id'], pg_catalog.to_jsonb(_job_id));
226246
end if;
227247

248+
-- TODO: I wanted this to be created only when enabling the async batch
249+
-- support, so that we don't create 2 extra tables that probably won't be
250+
-- used. The issue is that we don't store the value of grant_to.
251+
-- Two new tables might not be enough to warrant any changes, but if you're
252+
-- multi-tenant with 100s of customers, it'll be like 200 extra empty
253+
-- tables.
254+
--
255+
-- create async batch tables.
256+
select (embedding operator(pg_catalog.?) 'async_batch_enabled')::bool into _async_batch_supported;
257+
if _async_batch_supported is true then
258+
perform ai._vectorizer_create_async_batch_tables
259+
( queue_schema
260+
, async_batch_queue_table
261+
, async_batch_chunks_table
262+
, _source_pk
263+
, grant_to
264+
);
265+
end if;
266+
228267
insert into ai.vectorizer
229268
( id
230269
, source_schema
@@ -238,6 +277,9 @@ begin
238277
, queue_schema
239278
, queue_table
240279
, config
280+
, async_batch_queue_table
281+
, async_batch_chunks_table
282+
, async_batch_polling_interval
241283
)
242284
values
243285
( _vectorizer_id
@@ -260,6 +302,9 @@ begin
260302
, 'scheduling', scheduling
261303
, 'processing', processing
262304
)
305+
, async_batch_queue_table
306+
, async_batch_chunks_table
307+
, async_batch_polling_interval
263308
);
264309

265310
-- record dependencies in pg_depend
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,164 @@
1+
-------------------------------------------------------------------------------
-- _vectorizer_create_async_batch_tables
-- Creates the two tables backing a vectorizer's async batch workflow:
--   * <schema_name>.<async_batch_queue_table>: one row per batch submitted to
--     the provider, tracking status, errors, and retry bookkeeping.
--   * <schema_name>.<async_batch_chunks_table>: the chunk text pending in each
--     batch, keyed by the source table's primary key plus chunk_seq, so the
--     returned embeddings can be mapped back to their chunks.
-- source_pk is the jsonb primary-key description of the source table
-- (records carrying pknum/attnum, attname, typname).
-- When grant_to is not null, select/insert/update/delete are granted on both
-- tables to every listed role.
create or replace function ai._vectorizer_create_async_batch_tables(
    schema_name name,
    async_batch_queue_table name,
    async_batch_chunks_table name,
    source_pk pg_catalog.jsonb,
    grant_to name[]
) returns void as
$func$
declare
    _sql pg_catalog.text;
    _pk_cols pg_catalog.text;
begin
    -- create the batches table.
    -- id is the provider-assigned batch id: free-form text, no arbitrary
    -- VARCHAR(255) cap, and the same type as the async_batch_id column that
    -- references it below. created_at is a timestamptz for consistency with
    -- the chunks table.
    select pg_catalog.format
    ( $sql$create table %I.%I(
      id text primary key,
      created_at timestamptz not null default now(),
      status text not null,
      errors jsonb,
      metadata jsonb,
      next_attempt_after timestamptz not null,
      total_attempts int not null default 0
    )$sql$
    , schema_name
    , async_batch_queue_table
    ) into strict _sql
    ;
    execute _sql;

    -- batches are looked up by status when polling, so index it
    select pg_catalog.format
    ( $sql$create index on %I.%I (status)$sql$
    , schema_name
    , async_batch_queue_table
    ) into strict _sql
    ;
    execute _sql;

    -- comma-separated, identifier-quoted list of the source table's pk
    -- columns, in pk ordinal order; used in the unique constraint below
    select pg_catalog.string_agg(pg_catalog.format('%I', x.attname), ', ' order by x.pknum)
    into strict _pk_cols
    from pg_catalog.jsonb_to_recordset(source_pk) x(pknum int, attname name)
    ;

    -- create the batch chunks table. The chunk content needs to be stored
    -- because when retrieving the batches, we need to map each embedding to
    -- the chunk so that we can save them in the embeddings store table.
    select pg_catalog.format(
        $sql$
        create table %I.%I(
            %s,
            chunk_seq int not null,
            created_at timestamptz not null default now(),
            async_batch_id text not null references %I.%I (id) on delete cascade,
            chunk text not null,
            unique (%s, chunk_seq)
        )$sql$,
        schema_name,
        async_batch_chunks_table,
        (
            -- pk column definitions mirroring the source table's pk columns
            select pg_catalog.string_agg(
                pg_catalog.format('%I %s not null', x.attname, x.typname),
                ', '
                order by x.attnum
            )
            from pg_catalog.jsonb_to_recordset(source_pk) x(attnum int, attname name, typname name)
        ),
        schema_name,
        async_batch_queue_table,
        _pk_cols
    ) into strict _sql
    ;
    execute _sql;

    if grant_to is not null then
        -- grant select, insert, update, delete on batches table to grant_to roles
        select pg_catalog.format(
            $sql$grant select, insert, update, delete on %I.%I to %s$sql$,
            schema_name,
            async_batch_queue_table,
            (
                select pg_catalog.string_agg(pg_catalog.quote_ident(x), ', ')
                from pg_catalog.unnest(grant_to) x
            )
        ) into strict _sql;
        execute _sql;

        -- grant select, insert, update, delete on batch chunks table to grant_to roles
        select pg_catalog.format(
            $sql$grant select, insert, update, delete on %I.%I to %s$sql$,
            schema_name,
            async_batch_chunks_table,
            (
                select pg_catalog.string_agg(pg_catalog.quote_ident(x), ', ')
                from pg_catalog.unnest(grant_to) x
            )
        ) into strict _sql;
        execute _sql;
    end if;
end;
$func$
language plpgsql volatile security invoker
set search_path to pg_catalog, pg_temp;
105+
106+
-------------------------------------------------------------------------------
-- vectorizer_enable_async_batches
-- Enables async batch processing for a vectorizer by setting the
-- async_batch_enabled flag to true in its config. Raises if the vectorizer
-- does not exist or its configuration does not support the async batch api.
create or replace function ai.vectorizer_enable_async_batches(
    vectorizer_id pg_catalog.int4
) returns void
as $func$
declare
    _config pg_catalog.jsonb;
begin
    -- the catalog table is ai.vectorizer (singular), matching the insert in
    -- ai.create_vectorizer and the migration that alters it
    select config into _config
    from ai.vectorizer
    where id = vectorizer_id;

    -- "found" distinguishes a missing row from a row whose config is null
    if not found then
        raise exception 'vectorizer with id % not found', vectorizer_id;
    end if;

    -- NOTE(review): the rest of the schema gates async support on the
    -- embedding config's 'async_batch_enabled' key; confirm that a top-level
    -- 'use_async_batch_api' key is actually written into config somewhere.
    if not _config ? 'use_async_batch_api' then
        raise exception 'vectorizer configuration does not support async batch api';
    end if;

    update ai.vectorizer
    set config = jsonb_set(config, '{async_batch_enabled}', 'true'::jsonb)
    where id = vectorizer_id;
end
$func$ language plpgsql security definer
set search_path to pg_catalog, pg_temp;
135+
136+
-------------------------------------------------------------------------------
-- vectorizer_disable_async_batches
-- Disables async batch processing for a vectorizer by setting the
-- async_batch_enabled flag to false in its config. Raises if the vectorizer
-- does not exist or its configuration does not support the async batch api.
create or replace function ai.vectorizer_disable_async_batches(
    vectorizer_id pg_catalog.int4
) returns void
as $func$
declare
    _config pg_catalog.jsonb;
begin
    -- the catalog table is ai.vectorizer (singular), matching the insert in
    -- ai.create_vectorizer and the migration that alters it
    select config into _config
    from ai.vectorizer
    where id = vectorizer_id;

    -- "found" distinguishes a missing row from a row whose config is null
    if not found then
        raise exception 'vectorizer with id % not found', vectorizer_id;
    end if;

    -- NOTE(review): the rest of the schema gates async support on the
    -- embedding config's 'async_batch_enabled' key; confirm that a top-level
    -- 'use_async_batch_api' key is actually written into config somewhere.
    if not _config ? 'use_async_batch_api' then
        raise exception 'vectorizer configuration does not support async batch api';
    end if;

    update ai.vectorizer
    set config = jsonb_set(config, '{async_batch_enabled}', 'false'::jsonb)
    where id = vectorizer_id;
end
$func$ language plpgsql security definer
set search_path to pg_catalog, pg_temp;

projects/extension/sql/idempotent/900-semantic-catalog-init.sql

+3-8
Original file line numberDiff line numberDiff line change
@@ -1,20 +1,17 @@
11
--FEATURE-FLAG: text_to_sql
22

33
-------------------------------------------------------------------------------
4-
-- create_semantic_catalog
5-
create or replace function ai.create_semantic_catalog
4+
-- initialize_semantic_catalog
5+
create or replace function ai.initialize_semantic_catalog
66
( embedding pg_catalog.jsonb default null
77
, indexing pg_catalog.jsonb default ai.indexing_default()
88
, scheduling pg_catalog.jsonb default ai.scheduling_default()
99
, processing pg_catalog.jsonb default ai.processing_default()
1010
, grant_to pg_catalog.name[] default ai.grant_to()
11-
, text_to_sql pg_catalog.jsonb default null
1211
, catalog_name pg_catalog.name default 'default'
1312
) returns pg_catalog.int4
1413
as $func$
1514
declare
16-
_catalog_name pg_catalog.name = catalog_name;
17-
_text_to_sql pg_catalog.jsonb = text_to_sql;
1815
_catalog_id pg_catalog.int4;
1916
_obj_vec_id pg_catalog.int4;
2017
_sql_vec_id pg_catalog.int4;
@@ -60,14 +57,12 @@ begin
6057
, catalog_name
6158
, obj_vectorizer_id
6259
, sql_vectorizer_id
63-
, text_to_sql
6460
)
6561
values
6662
( _catalog_id
67-
, _catalog_name
63+
, initialize_semantic_catalog.catalog_name
6864
, _obj_vec_id
6965
, _sql_vec_id
70-
, _text_to_sql
7166
)
7267
returning id
7368
into strict _catalog_id
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,4 @@
1+
ALTER TABLE ai.vectorizer
2+
ADD COLUMN IF NOT EXISTS async_batch_queue_table pg_catalog.name DEFAULT NULL,
3+
ADD COLUMN IF NOT EXISTS async_batch_chunks_table pg_catalog.name DEFAULT NULL,
4+
ADD COLUMN IF NOT EXISTS async_batch_polling_interval interval DEFAULT interval '5 minutes';

0 commit comments

Comments
 (0)