Snowflake Connector - Reduce computing resources used for metadata queries #43452

Status: Open
Wants to merge 76 commits into base: master
Showing changes from 62 of 76 commits
397fa5c
Added initial caching for metadata queries
Vee7574 Aug 2, 2024
78e4b62
Added initial caching for metadata queries
Vee7574 Aug 3, 2024
f32b489
Added initial caching for metadata queries
Vee7574 Aug 6, 2024
9e53d82
Added initial caching for metadata queries
Vee7574 Aug 6, 2024
5a706ac
Added initial caching for metadata queries
Vee7574 Aug 6, 2024
7fb31fa
Added initial caching for metadata queries
Vee7574 Aug 7, 2024
48af04c
Added initial caching for metadata queries
Vee7574 Aug 7, 2024
12dc83a
Added initial caching for metadata queries
Vee7574 Aug 7, 2024
69ce596
Added initial caching for metadata queries
Vee7574 Aug 7, 2024
2c57f15
Added initial caching for metadata queries
Vee7574 Aug 7, 2024
575598d
Added initial caching for metadata queries
Vee7574 Aug 7, 2024
bd91e6f
Added initial caching for metadata queries
Vee7574 Aug 8, 2024
edb487e
Added initial version of SHOW queries
Vee7574 Aug 8, 2024
88814e9
Added initial version of SHOW queries
Vee7574 Aug 8, 2024
cf3cc98
Added initial version of SHOW queries
Vee7574 Aug 8, 2024
89ab6e5
Added initial version of SHOW queries
Vee7574 Aug 8, 2024
45cd7d0
Cleaned up the testing code to prepare for creating the initial PR
Vee7574 Aug 9, 2024
95725e2
Cleaned up the testing code to prepare for creating the initial PR
Vee7574 Aug 9, 2024
6167403
Cleaned up the testing code to prepare for creating the initial PR
Vee7574 Aug 9, 2024
cc68c4f
Cleaned up the testing code to prepare for creating the initial PR
Vee7574 Aug 9, 2024
29c6785
Cleaned up the testing code to prepare for creating the initial PR
Vee7574 Aug 10, 2024
5deb78f
Added logging for verifying the results from show queries
Vee7574 Aug 19, 2024
640049c
Added logging for verifying the results from show queries
Vee7574 Aug 19, 2024
e0bcf2d
Added logging for verifying the results from show queries
Vee7574 Aug 19, 2024
37302ee
Added logging for verifying the results from show queries
Vee7574 Aug 19, 2024
a688e17
Added logging for verifying the results from show queries
Vee7574 Aug 19, 2024
40acab0
Added logging for verifying the results from show queries
Vee7574 Aug 19, 2024
7372bd2
Added logging for verifying the results from show queries
Vee7574 Aug 19, 2024
29b4260
Added logging for verifying the results from show queries
Vee7574 Aug 20, 2024
7bed233
Cleaning up the test code to prepare an initial PR
Vee7574 Aug 20, 2024
c6a37de
Cleaning up the test code to prepare an initial PR
Vee7574 Aug 20, 2024
4b33e38
Cleaning up the test code to prepare an initial PR
Vee7574 Aug 20, 2024
08c30a2
Cleaning up the test code to prepare an initial PR
Vee7574 Aug 20, 2024
9946cfb
Merge branch 'master' into snowflake-reduce-metadata-queries
Vee7574 Aug 20, 2024
0bec496
Cleaning up the test code to prepare an initial PR
Vee7574 Aug 20, 2024
9cbcc60
Updated connector version
Vee7574 Aug 21, 2024
54f7721
Updated connector version
Vee7574 Aug 21, 2024
5cd96c5
Updated connector version
Vee7574 Aug 21, 2024
b332563
Merged conflicts from master
Vee7574 Aug 21, 2024
2adc898
Merge branch 'master' into snowflake-reduce-metadata-queries
Vee7574 Aug 21, 2024
976612e
Merged conflicts from master
Vee7574 Aug 21, 2024
e61387b
Replaced the DatabaseMetaData query with a SHOW TABLES query
Vee7574 Aug 21, 2024
b4b7f7b
Improved exception handling
Vee7574 Aug 21, 2024
8a5ed25
Improved exception handling
Vee7574 Aug 21, 2024
0a3f801
Changing the use of DatabaseMetadata to use Show tables query
Vee7574 Aug 22, 2024
82e3eb3
Changing the use of DatabaseMetadata to use Show tables query
Vee7574 Aug 22, 2024
cf82e90
Merge branch 'master' into snowflake-reduce-metadata-queries
Vee7574 Aug 22, 2024
a096193
Updated version number in metadata.yaml
Vee7574 Aug 22, 2024
1d4a713
Added exception handling to handle closing of connections
Vee7574 Aug 23, 2024
6462915
Added exception handling to handle closing of connections
Vee7574 Aug 23, 2024
b732c83
Added exception handling to handle closing of connections
Vee7574 Aug 23, 2024
c9096a2
Added exception handling to handle closing of connections
Vee7574 Aug 26, 2024
51efa7c
Added exception handling to handle closing of connections
Vee7574 Aug 26, 2024
5c729c1
Added exception handling to handle closing of connections
Vee7574 Aug 26, 2024
3a0b8a9
Added exception handling to handle closing of connections
Vee7574 Aug 26, 2024
0cd8c53
Added exception handling to handle closing of connections
Vee7574 Aug 27, 2024
418bb6e
Removing temporary code that was added for troubleshooting
Vee7574 Aug 27, 2024
3121009
Removing temporary code that was added for troubleshooting
Vee7574 Aug 27, 2024
e82b761
Removing temporary code that was added for troubleshooting
Vee7574 Aug 27, 2024
7d66e12
Removing temporary code that was added for troubleshooting
Vee7574 Aug 27, 2024
671e9a8
Removing temporary code that was added for troubleshooting
Vee7574 Aug 27, 2024
ed3dbdc
Cleaning up extra whitespace
Vee7574 Aug 27, 2024
ff65462
Testing the addition of .use for managing the dataSource.connection
Vee7574 Aug 28, 2024
38b76d4
Testing the addition of .use for managing the dataSource.connection
Vee7574 Aug 28, 2024
679e259
Testing the addition of .use for managing the dataSource.connection
Vee7574 Aug 28, 2024
b1f5b81
Updated the exception handling code
Vee7574 Aug 28, 2024
701bc55
Changed string.format to use Kotlin templates
Vee7574 Aug 28, 2024
ede80bb
Changed string.format to use Kotlin templates
Vee7574 Aug 28, 2024
e37c092
Changing exception handling to handle sql exceptions
Vee7574 Aug 28, 2024
468fbe2
Updating docker image tag
Vee7574 Aug 28, 2024
f1bd975
Updating docker image tag
Vee7574 Aug 28, 2024
3a8fe08
Updating docker image tag
Vee7574 Aug 28, 2024
f3635bb
Removed commented code
Vee7574 Aug 28, 2024
3c96f94
Removed commented code
Vee7574 Aug 28, 2024
77832a4
Removed commented code
Vee7574 Aug 28, 2024
b62b6ef
Incorporated code review comments
Vee7574 Sep 6, 2024
@@ -115,20 +115,29 @@ constructor(
statementCreator: CheckedFunction<Connection, PreparedStatement, SQLException>,
recordTransform: CheckedFunction<ResultSet, T, SQLException>
): Stream<T> {
val connection = dataSource.connection
return JdbcDatabase.Companion.toUnsafeStream<T>(
var connection = dataSource.connection

try {
Review comment (Contributor): connection.use. Also, keep connection a val instead of a var.

Reply (Contributor, author): Sure, I have changed the connection to a val. The code won't be changed to connection.use as we discussed, since the connection needs to be open when the result set is returned.

return JdbcDatabase.Companion.toUnsafeStream<T>(
statementCreator.apply(connection).executeQuery(),
recordTransform
)
.onClose(
Runnable {
try {
LOGGER.info { "closing connection" }
connection.close()
} catch (e: SQLException) {
throw RuntimeException(e)
.onClose(
Runnable {
try {
LOGGER.info { "closing connection" }
connection.close()
} catch (e: SQLException) {
throw RuntimeException(e)
}
}
}
)
)
} catch (e: Throwable) {
//Close the connection and rethrow the exception
if (connection != null) {
connection.close()
}
throw e
}
}
}
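The lifecycle under discussion in this hunk — the connection must outlive the method so the caller can consume the returned stream, yet must be closed both when the stream closes and when setup fails — can be sketched in isolation. `FakeConnection` and `streamWithConnection` below are hypothetical stand-ins for illustration, not the PR's actual code:

```kotlin
import java.util.stream.Stream

// Hypothetical stand-in for a JDBC Connection; only close() matters here.
class FakeConnection : AutoCloseable {
    var closed = false
        private set
    override fun close() { closed = true }
}

// Mirrors the hunk's shape: open a connection, hand back a Stream whose
// onClose handler closes it, and close eagerly if anything throws during setup.
fun <T> streamWithConnection(
    openConnection: () -> FakeConnection,
    rows: (FakeConnection) -> List<T>,
): Pair<Stream<T>, FakeConnection> {
    val connection = openConnection()
    try {
        val stream = rows(connection).stream().onClose { connection.close() }
        return stream to connection
    } catch (e: Throwable) {
        connection.close() // don't leak the connection when setup fails
        throw e
    }
}

fun main() {
    val (stream, conn) = streamWithConnection({ FakeConnection() }) { listOf("a", "b") }
    val count = stream.use { it.count() } // Stream is AutoCloseable; use() triggers onClose
    println(count)        // 2
    println(conn.closed)  // true
}
```

This is why the reviewer's `connection.use` suggestion was declined in the thread above: `use` would close the connection before the caller ever reads from the stream, so the close has to be deferred to `onClose` instead.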
@@ -5,7 +5,8 @@ plugins {
airbyteJavaConnector {
cdkVersionRequired = '0.44.14'
features = ['db-destinations', 's3-destinations', 'typing-deduping']
useLocalCdk = false
//TODO: Change to false before merging to master
useLocalCdk = true
}

java {
@@ -44,4 +45,5 @@ integrationTestJava {
dependencies {
implementation 'net.snowflake:snowflake-jdbc:3.14.1'
implementation 'org.apache.commons:commons-text:1.10.0'
implementation 'org.json:json:20210307'
Review comment (Contributor): We don't need this. We already have a Jackson dependency in our dependency chain.

}
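The reviewer's point is that the `data_type` blob returned by SHOW COLUMNS can be parsed with Jackson, which is already on the connector's classpath, making `org.json` redundant. A minimal sketch, assuming `jackson-databind` is available as the reviewer states:

```kotlin
import com.fasterxml.jackson.databind.ObjectMapper

// SHOW COLUMNS returns data_type as a small JSON document, e.g.
// {"type":"FIXED","precision":38,"scale":0,"nullable":true}.
// Jackson's ObjectMapper can read it directly; no org.json needed.
private val mapper = ObjectMapper()

fun extractColumnType(dataTypeJson: String): String =
    mapper.readTree(dataTypeJson).get("type").asText()

fun main() {
    println(extractColumnType("""{"type":"FIXED","precision":38,"scale":0,"nullable":true}""")) // FIXED
}
```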
@@ -5,7 +5,7 @@ data:
connectorSubtype: database
connectorType: destination
definitionId: 424892c4-daac-4491-b35d-c6688ba547ba
dockerImageTag: 3.11.9
Review comment (Contributor): why the change? If unneeded, I'd rather keep this outside of the current PR.

dockerImageTag: 3.11.11
dockerRepository: airbyte/destination-snowflake
documentationUrl: https://docs.airbyte.com/integrations/destinations/snowflake
githubIssueLabel: destination-snowflake
@@ -148,4 +148,4 @@ data:
secretStore:
type: GSM
alias: airbyte-connector-testing-secret-store
metadataSpecVersion: "1.0"
metadataSpecVersion: "1.0"
@@ -293,4 +293,8 @@ object SnowflakeDatabaseUtils {
AirbyteProtocolType.UNKNOWN -> "VARIANT"
}
}

fun fromIsNullableSnowflakeString(isNullable: String?): Boolean {
return "true".equals(isNullable, ignoreCase = true)
Review comment (Contributor): remove and use String.toBoolean()

Reply (Contributor, author): Removed the function and used String.toBoolean.

}
}
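The helper under review compares its argument against "true" case-insensitively, which is exactly what Kotlin's String.toBoolean() does; for a nullable input, a safe call with an elvis default reproduces the helper's null handling. A small sketch of the equivalence:

```kotlin
// The helper as written in the diff, kept here for comparison.
fun fromIsNullableSnowflakeString(isNullable: String?): Boolean =
    "true".equals(isNullable, ignoreCase = true)

fun main() {
    println(fromIsNullableSnowflakeString("TRUE"))  // true
    println("TRUE".toBoolean())                     // true
    val missing: String? = null
    println(fromIsNullableSnowflakeString(missing)) // false
    println(missing?.toBoolean() ?: false)          // false
}
```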
@@ -26,17 +26,18 @@ import io.airbyte.integrations.base.destination.typing_deduping.Struct
import io.airbyte.integrations.base.destination.typing_deduping.Union
import io.airbyte.integrations.base.destination.typing_deduping.UnsupportedOneOf
import io.airbyte.integrations.destination.snowflake.SnowflakeDatabaseUtils
import io.airbyte.integrations.destination.snowflake.SnowflakeDatabaseUtils.fromIsNullableSnowflakeString
import io.airbyte.integrations.destination.snowflake.migrations.SnowflakeState
import io.airbyte.integrations.destination.snowflake.typing_deduping.SnowflakeSqlGenerator.Companion.QUOTE
import java.sql.Connection
import java.sql.DatabaseMetaData
import java.sql.ResultSet
import java.sql.SQLException
import java.time.Instant
import java.util.*
import java.util.stream.Collectors
import net.snowflake.client.jdbc.SnowflakeSQLException
import org.apache.commons.text.StringSubstitutor
import org.json.JSONObject
import org.jooq.SQLDialect
import org.slf4j.Logger
import org.slf4j.LoggerFactory
@@ -70,75 +71,83 @@ class SnowflakeDestinationHandler(
private fun getFinalTableRowCount(
streamIds: List<StreamId>
): LinkedHashMap<String, LinkedHashMap<String, Int>> {
val tableRowCounts = LinkedHashMap<String, LinkedHashMap<String, Int>>()
// convert list stream to array
val namespaces = streamIds.map { it.finalNamespace }.toTypedArray()
val names = streamIds.map { it.finalName }.toTypedArray()
val query =
"""
|SELECT table_schema, table_name, row_count
|FROM information_schema.tables
|WHERE table_catalog = ?
|AND table_schema IN (${IntRange(1, streamIds.size).joinToString { "?" }})
|AND table_name IN (${IntRange(1, streamIds.size).joinToString { "?" }})
|""".trimMargin()
val bindValues = arrayOf(databaseName) + namespaces + names
val results: List<JsonNode> = database.queryJsons(query, *bindValues)
for (result in results) {
val tableSchema = result["TABLE_SCHEMA"].asText()
val tableName = result["TABLE_NAME"].asText()
val rowCount = result["ROW_COUNT"].asInt()
tableRowCounts
.computeIfAbsent(tableSchema) { _: String? -> LinkedHashMap() }[tableName] =
rowCount

val tableRowCountsFromShowQuery = LinkedHashMap<String, LinkedHashMap<String, Int>>()
var showColumnsResult: List<JsonNode> = listOf()
Review comment (Contributor): remove this and set the val inside your try block


try {
for (stream in streamIds) {
val showColumnsQuery =
String.format(
"""
Review comment (Contributor): use Kotlin templates instead of String.format

SHOW TABLES LIKE '%s' IN "%s"."%s";
""".trimIndent(),
stream.finalName,
databaseName,
stream.finalNamespace,
)
showColumnsResult = database.queryJsons(
showColumnsQuery,
)
for (result in showColumnsResult) {
val tableSchema = result["schema_name"].asText()
val tableName = result["name"].asText()
val rowCount = result["rows"].asText()

tableRowCountsFromShowQuery
Review comment (Contributor): The indentation is super confusing here (probably enforced by our format command). Any way to change that, or is our formatter going to bark at you? Also, you can simplify with map.computeIfAbsent(tableSchema) { LinkedHashMap() }.

Review comment (Contributor, stephane-airbyte, Aug 28, 2024): I think we can also use a linkedlist.withDefault, which would simplify this further.

.computeIfAbsent(tableSchema) { _: String? -> LinkedHashMap() }[tableName] =
rowCount.toInt()
}
}
} catch (e: SQLException) {
showColumnsResult.stream().close()
Review comment (Contributor): not sure why we need to close the stream here

//Not re-throwing the exception since the SQLException occurs when the table does not exist
//throw e
Review comment (Contributor): remove the commented throw e?

}
return tableRowCounts
return tableRowCountsFromShowQuery
}
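The review thread on this hunk suggests simplifying the nested-map accumulation. In Kotlin, `getOrPut` expresses `computeIfAbsent` without the unused-parameter lambda. A sketch with hypothetical (schema, table, row count) rows, not the PR's exact code:

```kotlin
// Accumulates per-schema, per-table row counts into nested LinkedHashMaps,
// preserving insertion order as the original code does.
fun accumulateRowCounts(
    rows: List<Triple<String, String, Int>>
): LinkedHashMap<String, LinkedHashMap<String, Int>> {
    val counts = LinkedHashMap<String, LinkedHashMap<String, Int>>()
    for ((schema, table, rowCount) in rows) {
        // getOrPut creates the inner map on first use of each schema.
        counts.getOrPut(schema) { LinkedHashMap() }[table] = rowCount
    }
    return counts
}

fun main() {
    val counts = accumulateRowCounts(
        listOf(Triple("PUBLIC", "USERS", 42), Triple("PUBLIC", "ORDERS", 7))
    )
    println(counts) // {PUBLIC={USERS=42, ORDERS=7}}
}
```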


@Throws(Exception::class)
private fun getInitialRawTableState(
id: StreamId,
suffix: String,
): InitialRawTableStatus {

val rawTableName = id.rawName + suffix
val tableExists =
database.executeMetadataQuery { databaseMetaData: DatabaseMetaData ->
LOGGER.info(
"Retrieving table from Db metadata: {} {}",
var tableExists = false
var showTablesResult: List<JsonNode> = listOf()

try {
val showTablesQuery =
String.format(
"""
SHOW TABLES LIKE '%s' IN "%s"."%s";
Review comment (Contributor): use Kotlin templates instead of String.format

Review comment (Contributor): does that work when the QUOTED_IDENTIFIERS_IGNORE_CASE is set to true? We have a test class that sets that for the testDatabase

""".trimIndent(),
rawTableName,
databaseName,
id.rawNamespace,
rawTableName
)
try {
val rs =
databaseMetaData.getTables(
databaseName,
id.rawNamespace,
rawTableName,
null
)
// When QUOTED_IDENTIFIERS_IGNORE_CASE is set to true, the raw table is
// interpreted as uppercase
// in db metadata calls. check for both
val rsUppercase =
databaseMetaData.getTables(
databaseName,
id.rawNamespace.uppercase(),
rawTableName.uppercase(),
null
)
rs.next() || rsUppercase.next()
} catch (e: SQLException) {
LOGGER.error("Failed to retrieve table metadata", e)
throw RuntimeException(e)
}
)
showTablesResult = database.queryJsons(
showTablesQuery,
)
if(showTablesResult.size > 0) {
tableExists = true
}
} catch (e: SQLException) {
showTablesResult.stream().close()
//Not re-throwing the exception since the SQLException occurs when the table does not exist
//throw e
}

if (!tableExists) {
return InitialRawTableStatus(
rawTableExists = false,
hasUnprocessedRecords = false,
maxProcessedTimestamp = Optional.empty()
)
}

// Snowflake timestamps have nanosecond precision, so decrement by 1ns
// And use two explicit queries because COALESCE doesn't short-circuit.
// This first query tries to find the oldest raw record with loaded_at = NULL
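The reviewers repeatedly ask for Kotlin string templates in place of String.format; the SHOW TABLES construction could be sketched as follows (function name and sample identifiers are illustrative, not the PR's code):

```kotlin
// Builds the SHOW TABLES existence check with a string template instead of
// String.format; the quoting of database and schema identifiers matches the diff.
fun showTablesQuery(tableName: String, databaseName: String, schemaName: String): String =
    """SHOW TABLES LIKE '$tableName' IN "$databaseName"."$schemaName";"""

fun main() {
    println(showTablesQuery("airbyte_raw_users", "MY_DB", "AIRBYTE_INTERNAL"))
}
```

Templates also sidestep the positional-argument mismatch risk that String.format carries when the argument list is reordered.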
@@ -560,6 +569,7 @@ class SnowflakeDestinationHandler(
}

companion object {

private val LOGGER: Logger =
LoggerFactory.getLogger(SnowflakeDestinationHandler::class.java)
const val EXCEPTION_COMMON_PREFIX: String =
@@ -573,39 +583,63 @@
databaseName: String,
streamIds: List<StreamId>
): LinkedHashMap<String, LinkedHashMap<String, TableDefinition>> {
val existingTables = LinkedHashMap<String, LinkedHashMap<String, TableDefinition>>()
// convert list stream to array
val namespaces = streamIds.map { it.finalNamespace }.toTypedArray()
val names = streamIds.map { it.finalName }.toTypedArray()
val query =
"""
|SELECT table_schema, table_name, column_name, data_type, is_nullable
|FROM information_schema.columns
|WHERE table_catalog = ?
|AND table_schema IN (${IntRange(1, streamIds.size).joinToString { "?" }})
|AND table_name IN (${IntRange(1, streamIds.size).joinToString { "?" }})
|ORDER BY table_schema, table_name, ordinal_position;
|""".trimMargin()

val bindValues =
arrayOf(databaseName.uppercase(Locale.getDefault())) + namespaces + names
val results: List<JsonNode> = database.queryJsons(query, *bindValues)
for (result in results) {
val tableSchema = result["TABLE_SCHEMA"].asText()
val tableName = result["TABLE_NAME"].asText()
val columnName = result["COLUMN_NAME"].asText()
val dataType = result["DATA_TYPE"].asText()
val isNullable = result["IS_NULLABLE"].asText()
val tableDefinition =
existingTables
.computeIfAbsent(tableSchema) { _: String? -> LinkedHashMap() }
.computeIfAbsent(tableName) { _: String? ->
TableDefinition(LinkedHashMap())

val existingTablesFromShowQuery =
LinkedHashMap<String, LinkedHashMap<String, TableDefinition>>()
var showColumnsResult: List<JsonNode> = listOf()

try {
for (stream in streamIds) {
val showColumnsQuery =
String.format(
"""
SHOW COLUMNS IN TABLE "%s"."%s"."%s";
""".trimIndent(),
databaseName,
stream.finalNamespace,
stream.finalName,
)
showColumnsResult = database.queryJsons(
showColumnsQuery,
)

for (result in showColumnsResult) {
val tableSchema = result["schema_name"].asText()
val tableName = result["table_name"].asText()
val columnName = result["column_name"].asText()
var dataType = JSONObject(result["data_type"].asText()).getString("type")

//TODO: Need to check if there are other datatype differences
// between the original approach and the new approach with SHOW queries

Review comment (Contributor): that should probably be checked before merging this PR. Do we have any automated test that checks this?

Review comment (Contributor): per the doc, it seems those are the only differences. I'd rather have a comment that points to https://docs.snowflake.com/en/sql-reference/sql/show-columns#output rather than a TODO.
if(dataType.equals("FIXED")) {
dataType = "NUMBER"
} else if(dataType.equals("REAL")) {
dataType = "FLOAT"
}
tableDefinition.columns[columnName] =
ColumnDefinition(columnName, dataType, 0, fromIsNullableIsoString(isNullable))

val isNullable = result["null?"].asText()
val tableDefinition =
Review comment (Contributor): let's create the table definition outside of the loop on showColumnsResult

existingTablesFromShowQuery
.computeIfAbsent(tableSchema) { _: String? -> LinkedHashMap() }
.computeIfAbsent(tableName) { _: String? ->
TableDefinition(LinkedHashMap())
}
tableDefinition.columns[columnName] =
ColumnDefinition(
columnName,
dataType,
0,
fromIsNullableSnowflakeString(isNullable),
)
}
}
} catch (e: SQLException) {
showColumnsResult.stream().close()
//Not re-throwing the exception since the SQLException occurs when the table does not exist
//throw e
}
return existingTables
return existingTablesFromShowQuery
}
}
}
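Per the review discussion on the TODO, SHOW COLUMNS reports NUMBER columns as FIXED and FLOAT columns as REAL (the Snowflake SHOW COLUMNS output documentation linked above lists these as the only type-name differences). The mapping buried in the hunk can be isolated as a single when-expression; this is a sketch, not the PR's exact code:

```kotlin
// Normalizes SHOW COLUMNS type names to the information_schema.columns
// spellings the rest of the handler expects: FIXED -> NUMBER, REAL -> FLOAT,
// everything else passes through unchanged.
fun normalizeShowColumnsType(raw: String): String = when (raw) {
    "FIXED" -> "NUMBER"
    "REAL" -> "FLOAT"
    else -> raw
}

fun main() {
    println(normalizeShowColumnsType("FIXED")) // NUMBER
    println(normalizeShowColumnsType("REAL"))  // FLOAT
    println(normalizeShowColumnsType("TEXT"))  // TEXT
}
```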
