Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

SNOW-1628247: Fix Jackson Scala module Compatibility Issue #145

Merged
merged 13 commits into from
Aug 22, 2024
6 changes: 0 additions & 6 deletions fips-pom.xml
Original file line number Diff line number Diff line change
Expand Up @@ -44,7 +44,6 @@
<scalaPluginVersion>4.3.0</scalaPluginVersion>
<jackson.version>2.13.2</jackson.version>
<jackson.databind.version>2.13.4.2</jackson.databind.version>
<jackson.module.scala.version>2.13.5</jackson.module.scala.version>
</properties>

<dependencyManagement>
Expand Down Expand Up @@ -145,11 +144,6 @@
<artifactId>jackson-annotations</artifactId>
<version>${jackson.version}</version>
</dependency>
<dependency>
<groupId>com.fasterxml.jackson.module</groupId>
<artifactId>jackson-module-scala_2.12</artifactId>
<version>${jackson.module.scala.version}</version>
</dependency>

<!-- Test -->
<dependency>
Expand Down
6 changes: 0 additions & 6 deletions pom.xml
Original file line number Diff line number Diff line change
Expand Up @@ -46,7 +46,6 @@
<scalaPluginVersion>4.3.0</scalaPluginVersion>
<jackson.version>2.13.2</jackson.version>
<jackson.databind.version>2.13.4.2</jackson.databind.version>
<jackson.module.scala.version>2.13.5</jackson.module.scala.version>

</properties>
<dependencyManagement>
Expand Down Expand Up @@ -133,11 +132,6 @@
<artifactId>jackson-annotations</artifactId>
<version>${jackson.version}</version>
</dependency>
<dependency>
<groupId>com.fasterxml.jackson.module</groupId>
<artifactId>jackson-module-scala_2.12</artifactId>
<version>${jackson.module.scala.version}</version>
</dependency>

<!-- Test -->
<dependency>
Expand Down
13 changes: 2 additions & 11 deletions src/main/scala/com/snowflake/snowpark/Session.scala
Original file line number Diff line number Diff line change
@@ -1,8 +1,5 @@
package com.snowflake.snowpark

import com.fasterxml.jackson.databind.json.JsonMapper
import com.fasterxml.jackson.module.scala.{ClassTagExtensions, DefaultScalaModule}

import java.io.{File, FileInputStream, FileNotFoundException}
import java.net.URI
import java.sql.{Connection, Date, Time, Timestamp}
Expand All @@ -29,7 +26,6 @@ import net.snowflake.client.jdbc.{SnowflakeConnectionV1, SnowflakeDriver, Snowfl
import scala.concurrent.{ExecutionContext, Future}
import scala.collection.JavaConverters._
import scala.reflect.runtime.universe.TypeTag
import scala.util.Try

/**
*
Expand Down Expand Up @@ -65,11 +61,6 @@ import scala.util.Try
* @since 0.1.0
*/
class Session private (private[snowpark] val conn: ServerConnection) extends Logging {
private val jsonMapper = JsonMapper
.builder()
.addModule(DefaultScalaModule)
.build() :: ClassTagExtensions

private val STAGE_PREFIX = "@"
// URI and file name with md5
private val classpathURIs = new ConcurrentHashMap[URI, Option[String]]().asScala
Expand Down Expand Up @@ -397,7 +388,7 @@ class Session private (private[snowpark] val conn: ServerConnection) extends Log
* successful, or `None` otherwise.
*/
private def parseJsonString(jsonString: String): Option[Map[String, Any]] = {
Try(jsonMapper.readValue[Map[String, Any]](jsonString)).toOption
Utils.jsonToMap(jsonString)
}

/**
Expand All @@ -408,7 +399,7 @@ class Session private (private[snowpark] val conn: ServerConnection) extends Log
* or `None` otherwise.
*/
private def toJsonString(map: Map[String, Any]): Option[String] = {
Try(jsonMapper.writeValueAsString(map)).toOption
Utils.mapToJson(map)
}

/*
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,6 @@ package com.snowflake.snowpark.internal
import com.fasterxml.jackson.annotation.JsonView
import com.fasterxml.jackson.core.TreeNode
import com.fasterxml.jackson.databind.JsonNode
import com.fasterxml.jackson.module.scala.DefaultScalaModule

import java.io.File
import java.net.{URI, URLClassLoader}
Expand All @@ -25,8 +24,6 @@ object UDFClassPath extends Logging {
val jacksonDatabindClass: Class[JsonNode] = classOf[com.fasterxml.jackson.databind.JsonNode]
val jacksonCoreClass: Class[TreeNode] = classOf[com.fasterxml.jackson.core.TreeNode]
val jacksonAnnotationClass: Class[JsonView] = classOf[com.fasterxml.jackson.annotation.JsonView]
val jacksonModuleScalaClass: Class[DefaultScalaModule] =
classOf[com.fasterxml.jackson.module.scala.DefaultScalaModule]
val jacksonJarSeq = Seq(
RequiredLibrary(
getPathForClass(jacksonDatabindClass),
Expand All @@ -36,11 +33,7 @@ object UDFClassPath extends Logging {
RequiredLibrary(
getPathForClass(jacksonAnnotationClass),
"jackson-annotation",
jacksonAnnotationClass),
RequiredLibrary(
getPathForClass(jacksonModuleScalaClass),
"jackson-module-scala",
jacksonModuleScalaClass))
jacksonAnnotationClass))

/*
* Libraries required to compile java code generated by snowpark for user's lambda.
Expand Down
80 changes: 80 additions & 0 deletions src/main/scala/com/snowflake/snowpark/internal/Utils.scala
Original file line number Diff line number Diff line change
@@ -1,5 +1,7 @@
package com.snowflake.snowpark.internal

import com.fasterxml.jackson.databind.{JsonNode, ObjectMapper}
import com.fasterxml.jackson.databind.node.JsonNodeType
import com.snowflake.snowpark.Column
import com.snowflake.snowpark.internal.analyzer.{
Attribute,
Expand All @@ -15,6 +17,7 @@ import java.util.Locale
import com.snowflake.snowpark.udtf.UDTF
import net.snowflake.client.jdbc.SnowflakeSQLException

import scala.collection.JavaConverters.asScalaIteratorConverter
import scala.collection.mutable
import scala.collection.mutable.ArrayBuffer
import scala.util.Random
Expand Down Expand Up @@ -447,4 +450,81 @@ object Utils extends Logging {
case _ => throw ErrorMessage.DF_JOIN_WITH_WRONG_ARGUMENT()
}
}

private val objectMapper = new ObjectMapper()

private[snowpark] def jsonToMap(jsonString: String): Option[Map[String, Any]] = {
try {
val node = objectMapper.readTree(jsonString)
assert(node.getNodeType == JsonNodeType.OBJECT)
Some(jsonToScala(node).asInstanceOf[Map[String, Any]])
} catch {
case ex: Exception =>
logError(ex.getMessage)
None
}
}

private def jsonToScala(node: JsonNode): Any = {
node.getNodeType match {
case JsonNodeType.STRING => node.asText()
case JsonNodeType.NULL => null
case JsonNodeType.OBJECT =>
node
.fields()
.asScala
.map(entry => {
entry.getKey -> jsonToScala(entry.getValue)
})
.toMap
case JsonNodeType.ARRAY =>
node.elements().asScala.map(entry => jsonToScala(entry)).toList
case JsonNodeType.BOOLEAN => node.asBoolean()
case JsonNodeType.NUMBER => node.numberValue()
case other =>
throw new UnsupportedOperationException(s"Unsupported Type: ${other.name()}")
}
}

private[snowpark] def mapToJson(map: Map[String, Any]): Option[String] = {
try {
Some(scalaToJson(map))
} catch {
case ex: Exception =>
logError(ex.getMessage)
None
}
}

private def scalaToJson(node: Any): String = {
Copy link
Collaborator

@sfc-gh-bli sfc-gh-bli Aug 21, 2024

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

let's simplify this function

 private def scalaToJson(input: Any): String =
    input match {
      // Scala's None and Python's None are different.
      case null => "null"
      case str: String => s""""$str""""
      case _: Int | _: Short | _: Long | _: Byte | _: Double | _: Float |
        _: Boolean => input.toString
      // only supports String keys
      case map: Map[String, _] => map.map {
        case (key, value) => s"${scalaToJson(key)}:${scalaToJson(value)}"
      }.mkString("{", ",", "}")
      // Seq is the most popular collection type in Scala,
      // It is parent type of all List types.
      case seq: Seq[_] => seq.map(scalaToJson).mkString("[", ",", "]")
      // I am not sure If seq can match Array too, so explicitly match Array here.
      // You can test if it is necessary.
      case arr: Array[_] => scalaToJson(arr.toSeq)
      case _ =>
        throw new UnsupportedOperationException(s"Unsupported Type: ${input.getClass.getName}")
    }

node match {
case n: Map[String, Any] =>
val mapRes = n.map {
case (key, value: Map[String, Any]) =>
s""""${key}":${scalaToJson(value)}"""
case (key, value: List[Any]) =>
s""""${key}":${scalaToJson(value)}"""
case (key, value: Number) =>
s""""${key}":${value}"""
case (key, value: String) =>
s""""${key}":"${value}""""
case (key, value: Boolean) =>
s""""${key}":${value}"""
case (key, None) =>
s""""${key}":null"""
case other =>
throw new UnsupportedOperationException(s"Unsupported Type: ${other.getClass}")
}
s"{${mapRes.mkString(",")}}"
case n: List[Any] =>
val listRes = n.map {
case v: List[Any] => scalaToJson(v)
case v: Map[String, Any] => scalaToJson(v)
case v => v.toString
}
s"[${listRes.mkString(",")}]"
case other =>
throw new UnsupportedOperationException(s"Unsupported Type: ${other.getClass}")
}
}
}
12 changes: 12 additions & 0 deletions src/test/scala/com/snowflake/snowpark/UtilsSuite.scala
Original file line number Diff line number Diff line change
Expand Up @@ -672,6 +672,18 @@ class UtilsSuite extends SNTestBase {
assert(Utils.quoteForOption("FALSE").equals("FALSE"))
assert(Utils.quoteForOption("abc").equals("'abc'"))
}

test("Scala and Json format transformation") {
val map = Map(
"integerKey" -> 1.1,
"stringKey" -> "stringValue",
"nestedMap" -> Map("insideKey" -> "stringValue", "insideList" -> Seq(1, 2, 3)),
"nestedList" -> Seq(1, Map("nestedKey" -> "nestedValue"), List(1, 2, 3)))
val jsonString = Utils.mapToJson(map)
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Please add a hard code string comparison here.

assert(jsonString == "<the expected output>"

Otherwise, we don't know if the output of mapToJson is correct.

val readMap = Utils.jsonToMap(jsonString.getOrElse(""))
val transformedString = Utils.mapToJson(readMap.getOrElse(Map()))
assert(jsonString.equals(transformedString))
}
}

object LoggingTester extends Logging {
Expand Down
Loading