Skip to content

Commit 47a7a06

Browse files
Reading from a Spark table mapped to an explicit BigQuery table works
1 parent 726196d commit 47a7a06

File tree

9 files changed

+685
-45
lines changed

9 files changed

+685
-45
lines changed

spark-bigquery-connector-common/src/main/java/com/google/cloud/spark/bigquery/SparkBigQueryConfig.java

Lines changed: 74 additions & 25 deletions
Original file line numberDiff line numberDiff line change
@@ -268,6 +268,24 @@ public static SparkBigQueryConfig from(
268268
SparkSession spark,
269269
Optional<StructType> schema,
270270
boolean tableIsMandatory) {
271+
return from(
272+
options,
273+
customDefaults,
274+
dataSourceVersion,
275+
spark,
276+
schema,
277+
tableIsMandatory,
278+
Optional.empty());
279+
}
280+
281+
public static SparkBigQueryConfig from(
282+
Map<String, String> options,
283+
ImmutableMap<String, String> customDefaults,
284+
DataSourceVersion dataSourceVersion,
285+
SparkSession spark,
286+
Optional<StructType> schema,
287+
boolean tableIsMandatory,
288+
Optional<TableId> overrideTableId) {
271289
Map<String, String> optionsMap = new HashMap<>(options);
272290
dataSourceVersion.updateOptionsMap(optionsMap);
273291
return SparkBigQueryConfig.from(
@@ -279,7 +297,8 @@ public static SparkBigQueryConfig from(
279297
spark.sqlContext().conf(),
280298
spark.version(),
281299
schema,
282-
tableIsMandatory);
300+
tableIsMandatory,
301+
overrideTableId);
283302
}
284303

285304
@VisibleForTesting
@@ -293,6 +312,31 @@ public static SparkBigQueryConfig from(
293312
String sparkVersion,
294313
Optional<StructType> schema,
295314
boolean tableIsMandatory) {
315+
return from(
316+
optionsInput,
317+
originalGlobalOptions,
318+
hadoopConfiguration,
319+
customDefaults,
320+
defaultParallelism,
321+
sqlConf,
322+
sparkVersion,
323+
schema,
324+
tableIsMandatory,
325+
Optional.empty());
326+
}
327+
328+
@VisibleForTesting
329+
public static SparkBigQueryConfig from(
330+
Map<String, String> optionsInput,
331+
ImmutableMap<String, String> originalGlobalOptions,
332+
Configuration hadoopConfiguration,
333+
ImmutableMap<String, String> customDefaults,
334+
int defaultParallelism,
335+
SQLConf sqlConf,
336+
String sparkVersion,
337+
Optional<StructType> schema,
338+
boolean tableIsMandatory,
339+
Optional<TableId> overrideTableId) {
296340
SparkBigQueryConfig config = new SparkBigQueryConfig();
297341

298342
ImmutableMap<String, String> options = toLowerCaseKeysMap(optionsInput);
@@ -314,9 +358,6 @@ public static SparkBigQueryConfig from(
314358
com.google.common.base.Optional.fromNullable(
315359
hadoopConfiguration.get(GCS_CONFIG_PROJECT_ID_PROPERTY))
316360
.toJavaUtil();
317-
Optional<String> tableParam =
318-
getOptionFromMultipleParams(options, ImmutableList.of("table", "path"), DEFAULT_FALLBACK)
319-
.toJavaUtil();
320361
Optional<String> datasetParam = getOption(options, "dataset").or(fallbackDataset).toJavaUtil();
321362
Optional<String> projectParam =
322363
firstPresent(getOption(options, "project").toJavaUtil(), fallbackProject);
@@ -327,28 +368,36 @@ public static SparkBigQueryConfig from(
327368
config.partitionRangeEnd = getOption(options, "partitionRangeEnd").transform(Long::parseLong);
328369
config.partitionRangeInterval =
329370
getOption(options, "partitionRangeInterval").transform(Long::parseLong);
330-
Optional<String> datePartitionParam = getOption(options, DATE_PARTITION_PARAM).toJavaUtil();
331-
datePartitionParam.ifPresent(
332-
date -> validateDateFormat(date, config.getPartitionTypeOrDefault(), DATE_PARTITION_PARAM));
333-
// checking for query
334-
if (tableParam.isPresent()) {
335-
String tableParamStr = tableParam.get().trim();
336-
if (isQuery(tableParamStr)) {
337-
// it is a query in practice
338-
config.query = com.google.common.base.Optional.of(tableParamStr);
339-
config.tableId = parseTableId("QUERY", datasetParam, projectParam, datePartitionParam);
340-
} else {
341-
config.tableId =
342-
parseTableId(tableParamStr, datasetParam, projectParam, datePartitionParam);
343-
}
371+
if (overrideTableId.isPresent()) {
372+
config.tableId = overrideTableId.get();
344373
} else {
345-
// no table has been provided, it is either a query or an error
346-
config.query = getOption(options, "query").transform(String::trim);
347-
if (config.query.isPresent()) {
348-
config.tableId = parseTableId("QUERY", datasetParam, projectParam, datePartitionParam);
349-
} else if (tableIsMandatory) {
350-
// No table nor query were set. We cannot go further.
351-
throw new IllegalArgumentException("No table has been specified");
374+
// checking for query
375+
Optional<String> tableParam =
376+
getOptionFromMultipleParams(options, ImmutableList.of("table", "path"), DEFAULT_FALLBACK)
377+
.toJavaUtil();
378+
Optional<String> datePartitionParam = getOption(options, DATE_PARTITION_PARAM).toJavaUtil();
379+
datePartitionParam.ifPresent(
380+
date ->
381+
validateDateFormat(date, config.getPartitionTypeOrDefault(), DATE_PARTITION_PARAM));
382+
if (tableParam.isPresent()) {
383+
String tableParamStr = tableParam.get().trim();
384+
if (isQuery(tableParamStr)) {
385+
// it is a query in practice
386+
config.query = com.google.common.base.Optional.of(tableParamStr);
387+
config.tableId = parseTableId("QUERY", datasetParam, projectParam, datePartitionParam);
388+
} else {
389+
config.tableId =
390+
parseTableId(tableParamStr, datasetParam, projectParam, datePartitionParam);
391+
}
392+
} else {
393+
// no table has been provided, it is either a query or an error
394+
config.query = getOption(options, "query").transform(String::trim);
395+
if (config.query.isPresent()) {
396+
config.tableId = parseTableId("QUERY", datasetParam, projectParam, datePartitionParam);
397+
} else if (tableIsMandatory) {
398+
// No table nor query were set. We cannot go further.
399+
throw new IllegalArgumentException("No table has been specified");
400+
}
352401
}
353402
}
354403

spark-bigquery-dsv2/spark-3.1-bigquery-lib/src/main/java/com/google/cloud/spark/bigquery/v2/Spark31BigQueryTable.java

Lines changed: 6 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -15,6 +15,7 @@
1515
*/
1616
package com.google.cloud.spark.bigquery.v2;
1717

18+
import com.google.cloud.bigquery.TableId;
1819
import com.google.cloud.bigquery.connector.common.BigQueryUtil;
1920
import com.google.cloud.spark.bigquery.DataSourceVersion;
2021
import com.google.cloud.spark.bigquery.SparkBigQueryConfig;
@@ -47,10 +48,12 @@ public class Spark31BigQueryTable implements Table, SupportsRead, SupportsWrite
4748

4849
protected Injector injector;
4950
protected Supplier<StructType> schemaSupplier;
51+
protected TableId tableId;
5052

5153
public Spark31BigQueryTable(Injector injector, Supplier<StructType> schemaSupplier) {
5254
this.injector = injector;
5355
this.schemaSupplier = schemaSupplier;
56+
this.tableId = injector.getInstance(SparkBigQueryConfig.class).getTableId();
5457
}
5558

5659
@Override
@@ -67,8 +70,9 @@ protected BigQueryDataSourceReaderContext createBigQueryDataSourceReaderContext(
6770
ImmutableMap.of(),
6871
injector.getInstance(DataSourceVersion.class),
6972
injector.getInstance(SparkSession.class),
70-
Optional.ofNullable(schemaSupplier.get()), /*tableIsMandatory*/
71-
true);
73+
Optional.ofNullable(schemaSupplier.get()),
74+
true /* tableIsMandatory */,
75+
Optional.of(tableId));
7276
Injector readerInjector =
7377
injector.createChildInjector(
7478
new BigQueryDataSourceReaderModule(Optional.of(tableScanConfig)));

spark-bigquery-dsv2/spark-3.5-bigquery-lib/src/main/java/com/google/cloud/spark/bigquery/v2/BigQueryTableCatalog.java

Lines changed: 47 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -28,6 +28,7 @@
2828
import com.google.common.collect.ImmutableMap;
2929
import com.google.inject.Injector;
3030
import java.util.Arrays;
31+
import java.util.HashMap;
3132
import java.util.Map;
3233
import java.util.Optional;
3334
import java.util.ServiceLoader;
@@ -48,9 +49,11 @@ public class BigQueryTableCatalog implements TableCatalog {
4849
private static final Logger logger = LoggerFactory.getLogger(BigQueryTableCatalog.class);
4950
private static final String[] DEFAULT_NAMESPACE = {"default"};
5051

51-
TableProvider tableProvider;
52-
BigQueryClient bigQueryClient;
53-
SchemaConverters schemaConverters;
52+
private static Map<String, Table> identifierToTableMapping = new HashMap<>();
53+
54+
private TableProvider tableProvider;
55+
private BigQueryClient bigQueryClient;
56+
private SchemaConverters schemaConverters;
5457

5558
@Override
5659
public void initialize(String name, CaseInsensitiveStringMap caseInsensitiveStringMap) {
@@ -99,10 +102,14 @@ public Identifier[] listTables(String[] namespace) throws NoSuchNamespaceExcepti
99102
@Override
100103
public Table loadTable(Identifier identifier) throws NoSuchTableException {
101104
logger.debug("loading table [{}])", format(identifier));
102-
ImmutableMap<String, String> properties =
103-
ImmutableMap.of("dataset", identifier.namespace()[0], "table", identifier.name());
104-
// TODO: reuse injector
105-
return Spark3Util.createBigQueryTableInstance(Spark35BigQueryTable::new, null, properties);
105+
return identifierToTableMapping.computeIfAbsent(
106+
identifier.toString(),
107+
ignored ->
108+
// TODO: reuse injector
109+
Spark3Util.createBigQueryTableInstance(
110+
Spark35BigQueryTable::new,
111+
null,
112+
ImmutableMap.of("dataset", identifier.namespace()[0], "table", identifier.name())));
106113
}
107114

108115
@Override
@@ -125,20 +132,40 @@ public Table createTable(
125132
Map<String, String> properties)
126133
throws TableAlreadyExistsException, NoSuchNamespaceException {
127134
logger.debug("creating table [{}])", format(identifier));
135+
if (tableExplicitlySet(properties)) {
136+
logger.debug("Mapping Spark table to BigQuery table)");
137+
// As the table is mapped to an actual table in BigQuery, we are relying on the BigQuery
138+
// schema
139+
return identifierToTableMapping.computeIfAbsent(
140+
identifier.toString(),
141+
ignored ->
142+
Spark3Util.createBigQueryTableInstance(
143+
Spark35BigQueryTable::new, /* schema */ null, properties));
144+
}
128145
Schema schema = schemaConverters.toBigQuerySchema(structType);
129146
bigQueryClient.createTable(
130147
toTableId(identifier),
131148
schema,
132149
BigQueryClient.CreateTableOptions.of(
133150
Optional.empty(), ImmutableMap.of(), Optional.empty()));
134-
ImmutableMap<String, String> getTableProperties =
135-
ImmutableMap.<String, String>builder()
136-
.put("dataset", identifier.namespace()[0])
137-
.put("table", identifier.name())
138-
.putAll(properties)
139-
.build();
151+
ImmutableMap.Builder<String, String> getTableProperties =
152+
ImmutableMap.<String, String>builder().putAll(properties);
153+
// if the user provided an alternative table we do not want to ignore it
154+
if (!tableExplicitlySet(properties)) {
155+
getTableProperties.put("dataset", identifier.namespace()[0]).put("table", identifier.name());
156+
}
140157
// TODO: Use the table constructor directly using the catalog's injector
141-
return tableProvider.getTable(structType, transforms, getTableProperties);
158+
return tableProvider.getTable(structType, transforms, getTableProperties.buildKeepingLast());
159+
}
160+
161+
private static boolean tableExplicitlySet(Map<String, String> properties) {
162+
if (properties.containsKey("table")) {
163+
return true;
164+
}
165+
if (properties.containsKey("path")) {
166+
return true;
167+
}
168+
return false;
142169
}
143170

144171
@Override
@@ -151,8 +178,12 @@ public Table alterTable(Identifier identifier, TableChange... tableChanges)
151178
public boolean dropTable(Identifier identifier) {
152179
logger.debug("dropping table [{}])", format(identifier));
153180
TableId tableId = toTableId(identifier);
154-
if (bigQueryClient.tableExists(tableId)) {
155-
return bigQueryClient.deleteTable(tableId);
181+
if (!bigQueryClient.tableExists(tableId)) {
182+
return false;
183+
}
184+
if (bigQueryClient.deleteTable(tableId)) {
185+
identifierToTableMapping.remove(identifier.toString());
186+
return true;
156187
}
157188
return false;
158189
}

0 commit comments

Comments
 (0)