From afa0271e33c24c83208cd63e34c80d9398cd4164 Mon Sep 17 00:00:00 2001 From: Andriy Plokhotnyuk Date: Thu, 9 Jan 2025 18:45:48 +0100 Subject: [PATCH 1/4] Fix remaining inconsistency in JSON codecs for `Schema.CaseClass*` and `Schema.GenericRecord` types --- .../scala/zio/schema/codec/JsonCodec.scala | 59 ++++++++++--------- .../zio/schema/codec/JsonCodecSpec.scala | 39 +++++++----- 2 files changed, 55 insertions(+), 43 deletions(-) diff --git a/zio-schema-json/shared/src/main/scala/zio/schema/codec/JsonCodec.scala b/zio-schema-json/shared/src/main/scala/zio/schema/codec/JsonCodec.scala index 0f337e6d5..192f69587 100644 --- a/zio-schema-json/shared/src/main/scala/zio/schema/codec/JsonCodec.scala +++ b/zio-schema-json/shared/src/main/scala/zio/schema/codec/JsonCodec.scala @@ -805,6 +805,9 @@ object JsonCodec { case Json.Null => DynamicValue.NoneValue } + private def error(msg: String, trace: List[JsonError]): Nothing = + throw UnsafeJson(JsonError.Message(msg) :: trace) + private def enumDecoder[Z](parentSchema: Schema.Enum[Z]): ZJsonDecoder[Z] = { val caseNameAliases = new mutable.HashMap[String, Schema.Case[Z, Any]] parentSchema.cases.foreach { case_ => @@ -813,9 +816,6 @@ object JsonCodec { case_.caseNameAliases.foreach(a => caseNameAliases.put(a, schema)) } - def error(msg: String, trace: List[JsonError]): Nothing = - throw UnsafeJson(JsonError.Message(msg) :: trace) - if (parentSchema.cases.forall(_.schema.isInstanceOf[Schema.CaseClass0[_]])) { // if all cases are CaseClass0, decode as String if (caseNameAliases.size <= 64) { new ZJsonDecoder[Z] { @@ -970,18 +970,12 @@ object JsonCodec { schema: GenericRecord, discriminator: Option[String] ): ZJsonDecoder[ListMap[String, Any]] = { - val capacity = schema.fields.size * 2 val spansWithDecoders = - new util.HashMap[String, (JsonError.ObjectAccess, ZJsonDecoder[Any])](capacity) - val defaults = new util.HashMap[String, Any](capacity) + new util.HashMap[String, (JsonError.ObjectAccess, ZJsonDecoder[Any])](schema.fields.size * 2) schema.fields.foreach { field => - val fieldName = field.fieldName val spanWithDecoder = - (JsonError.ObjectAccess(fieldName), schemaDecoder(field.schema).asInstanceOf[ZJsonDecoder[Any]]) - field.nameAndAliases.foreach(x => spansWithDecoders.put(x, spanWithDecoder)) - if ((field.optional || field.transient) && field.defaultValue.isDefined) { - defaults.put(fieldName, field.defaultValue.get) - } + (JsonError.ObjectAccess(field.fieldName), schemaDecoder(field.schema).asInstanceOf[ZJsonDecoder[Any]]) + field.nameAndAliases.foreach(spansWithDecoders.put(_, spanWithDecoder)) } val skipExtraFields = !schema.annotations.exists(_.isInstanceOf[rejectExtraFields]) (trace: List[JsonError], in: RetractReader) => { @@ -1000,23 +994,37 @@ object JsonCodec { val dec = spanWithDecoder._2 val trace_ = span :: trace lexer.char(trace_, in, ':') - val fieldName = span.field + val fieldName = span.field // reuse strings with calculated hashCode val prev = map.put(fieldName, dec.unsafeDecode(trace_, in)) - if (prev != null) { - throw UnsafeJson(JsonError.Message("duplicate") :: trace_) - } + if (prev != null) error("duplicate", trace_) } else if (skipExtraFields || discriminator.contains(fieldNameOrAlias)) { lexer.char(trace, in, ':') lexer.skipValue(trace, in) - } else { - throw UnsafeJson(JsonError.Message(s"unexpected field: $fieldNameOrAlias") :: trace) - } + } else error("extra field", trace) continue = lexer.nextField(trace, in) } - val it = defaults.entrySet().iterator() - while (it.hasNext) { - val entry = it.next() - map.putIfAbsent(entry.getKey, entry.getValue) + schema.fields.foreach { field => + val fieldName = field.fieldName // reuse strings with calculated hashCode + if (map.get(fieldName) == null) { + map.put( // mitigation of a linking error for `map.computeIfAbsent` in Scala.js + fieldName, { + if ((field.optional || field.transient) && field.defaultValue.isDefined) { + field.defaultValue.get + } else { + var schema = field.schema + schema match { + case l: Schema.Lazy[_] => schema = l.schema + case _ => + } + schema match { + case _: Schema.Optional[_] => None + case collection: Schema.Collection[_, _] => collection.empty + case _ => error("missing", spansWithDecoders.get(fieldName)._1 :: trace) + } + } + } + ) + } } (ListMap.newBuilder[String, Any] ++= ({ // to avoid O(n) insert operations import scala.collection.JavaConverters.mapAsScalaMapConverter // use deprecated class for Scala 2.12 compatibility @@ -1095,10 +1103,7 @@ object JsonCodec { case (Some(a), Some(b)) => Fallback.Both(a, b) case (Some(a), _) => Fallback.Left(a) case (_, Some(b)) => Fallback.Right(b) - case _ => - throw UnsafeJson( - JsonError.Message("Fallback decoder was unable to decode both left and right sides") :: trace - ) + case _ => error("Fallback decoder was unable to decode both left and right sides", trace) } } } diff --git a/zio-schema-json/shared/src/test/scala/zio/schema/codec/JsonCodecSpec.scala b/zio-schema-json/shared/src/test/scala/zio/schema/codec/JsonCodecSpec.scala index ee7eb244c..35ce3e4db 100644 --- a/zio-schema-json/shared/src/test/scala/zio/schema/codec/JsonCodecSpec.scala +++ b/zio-schema-json/shared/src/test/scala/zio/schema/codec/JsonCodecSpec.scala @@ -477,9 +477,9 @@ object JsonCodecSpec extends ZIOSpecDefault { test("Do not encode transient field") { assertEncodes( RecordExample.schema, - RecordExample(f1 = Some("test"), f3 = Some("transient")), + RecordExample(f1 = "test", f3 = Some("transient"), f20 = None, f21 = Vector.empty, f22 = Nil), charSequenceToByteChunk( - """{"$f1":"test"}""".stripMargin + """{"$f1":"test","f20":null,"f21":[],"f22":[]}""".stripMargin ) ) } @@ -732,26 +732,33 @@ object JsonCodecSpec extends ZIOSpecDefault { charSequenceToByteChunk("""{"foo":"s","bar":1,"baz":2}""") ) }, - test("with missing fields") { + test("with empty optional and collection fields without default values") { assertDecodes( RecordExample.schema, - RecordExample(f1 = Some("test"), f2 = None), + RecordExample(f1 = "test", f2 = None, f20 = None, f21 = Vector.empty, f22 = Nil), charSequenceToByteChunk("""{"$f1":"test"}""") ) }, + test("missing required fields") { + assertDecodesToError( + RecordExample.schema, + """{}""", + JsonError.Message("missing") :: JsonError.ObjectAccess("$f1") :: Nil + ) + }, test("aliased field") { assertDecodes( RecordExample.schema, - RecordExample(f1 = Some("test"), f2 = Some("alias")), + RecordExample(f1 = "test", f2 = Some("alias"), f20 = None, f21 = Vector.empty, f22 = Nil), charSequenceToByteChunk("""{"$f1":"test", "field2":"alias"}""") ) }, test("reject extra fields") { assertDecodes( RecordExample.schema.annotate(rejectExtraFields()), - RecordExample(f1 = Some("test")), + RecordExample(f1 = "test", f20 = None, f21 = Vector.empty, f22 = Nil), charSequenceToByteChunk("""{"$f1":"test", "extraField":"extra"}""") - ).flip.map(err => assertTrue(err.getMessage() == "(unexpected field: extraField)")) + ).flip.map(err => assertTrue(err.getMessage() == "(extra field)")) }, test("reject duplicated fields") { assertDecodesToError( @@ -1697,7 +1704,7 @@ object JsonCodecSpec extends ZIOSpecDefault { assertDecodes(Schema[Command], Command.Cash, charSequenceToByteChunk("""{"type":"Cash","extraField":1}""")) &> assertDecodes(Schema[Command], Command.Cash, charSequenceToByteChunk("""{"extraField":1,"type":"Cash"}""")) ), - suite("of case objects with less than 64 cases")( + suite("of case objects with up to 64 cases")( test("without annotation")( assertEncodesThenDecodes(Schema[Color], Color.Red) ), @@ -1718,7 +1725,7 @@ object JsonCodecSpec extends ZIOSpecDefault { assertDecodesToError(Schema[Color], "\"not a color\"", JsonError.Message("unrecognized string") :: Nil) ) ), - suite("of case objects with 64 cases or more")( + suite("of case objects with more than 64 cases")( test("without annotation")( assertEncodesThenDecodes(Schema[BigEnum], BigEnum.Case69) ), @@ -2477,7 +2484,7 @@ object JsonCodecSpec extends ZIOSpecDefault { ) extends OneOf4 case class RecordExample( - @fieldName("$f1") f1: Option[String], // the only field that does not have a default value + @fieldName("$f1") f1: String, @fieldNameAliases("field2") f2: Option[String] = None, @transientField f3: Option[String] = None, f4: Option[String] = None, @@ -2493,12 +2500,12 @@ object JsonCodecSpec extends ZIOSpecDefault { f14: Option[String] = None, f15: Option[String] = None, f16: Option[String] = None, - f17: Option[String] = None, - f18: Option[String] = None, - f19: Option[String] = None, - f20: Option[String] = None, - f21: Option[String] = None, - f22: Option[String] = None, + f17: List[String] = Nil, + f18: Vector[String] = Vector.empty, + f19: Option[RecordExample] = None, + f20: Option[String], + f21: Vector[String], + f22: List[String], @fieldName("$f23") f23: Option[String] = None ) From b95d2001280a6868317f97e0774e99cc629edb9f Mon Sep 17 00:00:00 2001 From: Andriy Plokhotnyuk Date: Fri, 10 Jan 2025 11:43:27 +0100 Subject: [PATCH 2/4] Reduce redundant allocations and CPU overhead when decoding and encoding --- .../scala/zio/schema/codec/JsonCodec.scala | 152 +++++++++--------- 1 file changed, 79 insertions(+), 73 deletions(-) diff --git a/zio-schema-json/shared/src/main/scala/zio/schema/codec/JsonCodec.scala b/zio-schema-json/shared/src/main/scala/zio/schema/codec/JsonCodec.scala index 192f69587..1cc980a29 100644 --- a/zio-schema-json/shared/src/main/scala/zio/schema/codec/JsonCodec.scala +++ b/zio-schema-json/shared/src/main/scala/zio/schema/codec/JsonCodec.scala @@ -10,7 +10,6 @@ import scala.collection.immutable.ListMap import scala.collection.mutable import scala.util.control.NonFatal -import zio.json.JsonCodec._ import zio.json.JsonDecoder.{ JsonError, UnsafeJson } import zio.json.ast.Json import zio.json.internal.{ Lexer, RecordingReader, RetractReader, StringMatrix, WithRecordingReader, Write } @@ -24,7 +23,7 @@ import zio.json.{ import zio.prelude.NonEmptyMap import zio.schema.Schema.GenericRecord import zio.schema._ -import zio.schema.annotation.{ rejectExtraFields, _ } +import zio.schema.annotation.{ discriminatorName, rejectExtraFields, _ } import zio.schema.codec.DecodeError.ReadError import zio.schema.codec.JsonCodec.JsonDecoder.schemaDecoder import zio.stream.{ ZChannel, ZPipeline } @@ -420,7 +419,7 @@ object JsonCodec { out.write(',') if (indent.isDefined) pad(indent_, out) } - string.encoder.unsafeEncode(key, indent_, out) + ZJsonEncoder.string.unsafeEncode(key, indent_, out) if (indent.isEmpty) out.write(':') else out.write(" : ") directEncoder.unsafeEncode(value, indent_, out) @@ -505,38 +504,44 @@ object JsonCodec { ) .toMap ZJsonEncoder.string.contramap(caseMap(_)) - } else { (value: Z, indent: Option[Int], out: Write) => - { - schema.nonTransientCases.find(_.isCase(value)) match { - case Some(case_) => - val caseName = case_.caseName - val noDiscriminators = schema.noDiscriminator - val discriminatorTuple = - if (noDiscriminators) None - else schema.annotations.collectFirst { case d: discriminatorName => (d.tag, caseName) } - val doJsonObjectWrapping = discriminatorTuple.isEmpty && !noDiscriminators - var indent_ = indent - if (doJsonObjectWrapping) { - out.write('{') - indent_ = bump(indent) - pad(indent_, out) - string.encoder.unsafeEncode(caseName, indent_, out) - if (indent.isEmpty) out.write(':') - else out.write(" : ") - } - schemaEncoder(case_.schema.asInstanceOf[Schema[Any]], cfg, discriminatorTuple) - .unsafeEncode({ - try case_.deconstruct(value) - catch { - case ex if NonFatal(ex) => throw new RuntimeException(s"Failed to encode enum type $schema", ex) - } - }, indent_, out) - if (doJsonObjectWrapping) { - pad(indent, out) - out.write('}') + } else { + new ZJsonEncoder[Z] { + private[this] val discriminatorName = + if (schema.noDiscriminator) None + else schema.annotations.collectFirst { case d: discriminatorName => d.tag } + private[this] val cases = schema.nonTransientCases.toArray + private[this] val decoders = cases.map { case_ => + val discriminatorTuple = + if (discriminatorName eq None) None + else Some((discriminatorName.get, case_.caseName)) + schemaEncoder(case_.schema.asInstanceOf[Schema[Any]], cfg, discriminatorTuple) + } + private[this] val doJsonObjectWrapping = discriminatorName.isEmpty && !schema.noDiscriminator + + override def unsafeEncode(a: Z, indent: Option[Int], out: Write): Unit = { + var idx = 0 + while (idx < cases.length) { + val case_ = cases(idx) + if (case_.isCase(a)) { + var indent_ = indent + if (doJsonObjectWrapping) { + out.write('{') + indent_ = bump(indent) + pad(indent_, out) + ZJsonEncoder.string.unsafeEncode(case_.caseName, indent_, out) + if (indent.isEmpty) out.write(':') + else out.write(" : ") + } + decoders(idx).unsafeEncode(case_.deconstruct(a), indent_, out) + if (doJsonObjectWrapping) { + pad(indent, out) + out.write('}') + } + return } - case _ => - out.write("{}") // for transient cases + idx += 1 + } + out.write("{}") // for transient cases } } } @@ -550,12 +555,17 @@ object JsonCodec { case Fallback.Right(b) => right.unsafeEncode(b, indent, out) case Fallback.Both(a, b) => out.write('[') - if (indent.isDefined) pad(bump(indent), out) + val doPrettyPrint = indent ne None + var indent_ = indent + if (doPrettyPrint) { + indent_ = bump(indent) + pad(indent_, out) + } left.unsafeEncode(a, indent, out) out.write(',') - if (indent.isDefined) pad(bump(indent), out) + if (doPrettyPrint) pad(indent_, out) right.unsafeEncode(b, indent, out) - if (indent.isDefined) pad(indent, out) + if (doPrettyPrint) pad(indent, out) out.write(']') } } @@ -578,7 +588,7 @@ object JsonCodec { indent_ = bump(indent) pad(indent_, out) } - val strEnc = string.encoder + val strEnc = ZJsonEncoder.string var first = true if (discriminatorTuple ne None) { val tuple = discriminatorTuple.get @@ -759,11 +769,9 @@ object JsonCodec { val valueDecoder = JsonDecoder.schemaDecoder(vs) jsonFieldDecoder(ks) match { case Some(jsonFieldDecoder) => - ZJsonDecoder.keyValueChunk(jsonFieldDecoder, valueDecoder).map(a => Chunk.fromIterable(a).toMap) + ZJsonDecoder.keyValueChunk(jsonFieldDecoder, valueDecoder).map(_.toMap) case None => - ZJsonDecoder - .chunk(schemaDecoder(ks).zip(schemaDecoder(vs))) - .map(_.toList.toMap) + ZJsonDecoder.chunk(schemaDecoder(ks).zip(schemaDecoder(vs))).map(_.toMap) } } @@ -778,18 +786,12 @@ object JsonCodec { case _ => None } - private def dynamicDecoder(schema: Schema.Dynamic): ZJsonDecoder[DynamicValue] = { - val directMapping = schema.annotations.exists { - case directDynamicMapping() => true - case _ => false - } - - if (directMapping) { + private def dynamicDecoder(schema: Schema.Dynamic): ZJsonDecoder[DynamicValue] = + if (schema.annotations.exists(_.isInstanceOf[directDynamicMapping])) { Json.decoder.map(jsonToDynamicValue) } else { schemaDecoder(DynamicValue.schema) } - } private def jsonToDynamicValue(json: Json): DynamicValue = json match { @@ -832,7 +834,7 @@ object JsonCodec { } } else { new ZJsonDecoder[Z] { - private[this] val cases = new util.HashMap[String, Z](caseNameAliases.size * 2) + private[this] val cases = new util.HashMap[String, Z](caseNameAliases.size << 1) caseNameAliases.foreach { case (name, case_) => @@ -888,7 +890,7 @@ object JsonCodec { } } else { val cases = - new util.HashMap[String, (JsonError.ObjectAccess, ZJsonDecoder[Any])](caseNameAliases.size * 2) + new util.HashMap[String, (JsonError.ObjectAccess, ZJsonDecoder[Any])](caseNameAliases.size << 1) caseNameAliases.foreach { case (name, case_) => cases.put(name, (JsonError.ObjectAccess(case_.caseName), schemaDecoder(case_.schema))) @@ -936,7 +938,7 @@ object JsonCodec { } else { val discriminatorSpan = JsonError.ObjectAccess(discriminatorName) val cases = - new util.HashMap[String, (JsonError.ObjectAccess, ZJsonDecoder[Any])](caseNameAliases.size * 2) + new util.HashMap[String, (JsonError.ObjectAccess, ZJsonDecoder[Any])](caseNameAliases.size << 1) caseNameAliases.foreach { case (name, case_) => cases.put(name, (JsonError.ObjectAccess(case_.caseName), schemaDecoder(case_.schema, discriminator))) @@ -969,23 +971,26 @@ object JsonCodec { private def recordDecoder( schema: GenericRecord, discriminator: Option[String] - ): ZJsonDecoder[ListMap[String, Any]] = { - val spansWithDecoders = - new util.HashMap[String, (JsonError.ObjectAccess, ZJsonDecoder[Any])](schema.fields.size * 2) - schema.fields.foreach { field => - val spanWithDecoder = - (JsonError.ObjectAccess(field.fieldName), schemaDecoder(field.schema).asInstanceOf[ZJsonDecoder[Any]]) - field.nameAndAliases.foreach(spansWithDecoders.put(_, spanWithDecoder)) - } - val skipExtraFields = !schema.annotations.exists(_.isInstanceOf[rejectExtraFields]) - (trace: List[JsonError], in: RetractReader) => { + ): ZJsonDecoder[ListMap[String, Any]] = new ZJsonDecoder[ListMap[String, Any]] { + private[this] val fields = schema.fields.toArray + private[this] val spansWithDecoders = + new util.HashMap[String, (JsonError.ObjectAccess, ZJsonDecoder[Any])](fields.length << 1) { + fields.foreach { field => + val spanWithDecoder = + (JsonError.ObjectAccess(field.fieldName), schemaDecoder(field.schema).asInstanceOf[ZJsonDecoder[Any]]) + field.nameAndAliases.foreach(put(_, spanWithDecoder)) + } + } + private[this] val skipExtraFields = !schema.annotations.exists(_.isInstanceOf[rejectExtraFields]) + + override def unsafeDecode(trace: List[JsonError], in: RetractReader): ListMap[String, Any] = { val lexer = Lexer var continue = true if (discriminator eq None) { lexer.char(trace, in, '{') continue = lexer.firstField(trace, in) } - val map = new util.HashMap[String, Any] + val map = new util.HashMap[String, Any](fields.length << 1) while (continue) { val fieldNameOrAlias = lexer.string(trace, in).toString val spanWithDecoder = spansWithDecoders.get(fieldNameOrAlias) @@ -1003,7 +1008,10 @@ object JsonCodec { } else error("extra field", trace) continue = lexer.nextField(trace, in) } - schema.fields.foreach { field => + var idx = 0 + while (idx < fields.length) { + val field = fields(idx) + idx += 1 val fieldName = field.fieldName // reuse strings with calculated hashCode if (map.get(fieldName) == null) { map.put( // mitigation of a linking error for `map.computeIfAbsent` in Scala.js @@ -1039,12 +1047,11 @@ object JsonCodec { private[this] val leftDecoder = schemaDecoder(schema.left) private[this] val rightDecoder = schemaDecoder(schema.right) + case class BadEnd() extends Throwable + def unsafeDecode(trace: List[JsonError], in: RetractReader): Fallback[A, B] = { var left: Option[A] = None var right: Option[B] = None - - case class BadEnd() extends Throwable - try { // If this doesn't throw exception, it is an array, so it encodes a `Fallback.Both` val lexer = Lexer @@ -1086,17 +1093,16 @@ object JsonCodec { } catch { // It's not an array, so it is of type A or B case BadEnd() => () - case _: UnsafeJson => { + case _: UnsafeJson => in.retract() val in2 = new zio.json.internal.WithRecordingReader(in, 64) try { - left = Some(schemaDecoder(schema.left).unsafeDecode(trace, in2)) + left = Some(leftDecoder.unsafeDecode(trace, in2)) } catch { case UnsafeJson(_) => in2.rewind() - right = Some(schemaDecoder(schema.right).unsafeDecode(trace, in2)) + right = Some(rightDecoder.unsafeDecode(trace, in2)) } - } } (left, right) match { @@ -1131,7 +1137,7 @@ object JsonCodec { indent_ = bump(indent) pad(indent_, out) } - val strEnc = string.encoder + val strEnc = ZJsonEncoder.string var first = true if (discriminatorTuple ne None) { val tuple = discriminatorTuple.get From 4b6228a8050b5123379355ce8072407fff18993f Mon Sep 17 00:00:00 2001 From: Andriy Plokhotnyuk Date: Fri, 10 Jan 2025 15:40:09 +0100 Subject: [PATCH 3/4] Reuse `CaseClassJsonDecoder` for faster decoding of small generic records --- .../scala/zio/schema/codec/JsonCodec.scala | 165 +++++++++++------- 1 file changed, 100 insertions(+), 65 deletions(-) diff --git a/zio-schema-json/shared/src/main/scala/zio/schema/codec/JsonCodec.scala b/zio-schema-json/shared/src/main/scala/zio/schema/codec/JsonCodec.scala index 1cc980a29..be2fa8e09 100644 --- a/zio-schema-json/shared/src/main/scala/zio/schema/codec/JsonCodec.scala +++ b/zio-schema-json/shared/src/main/scala/zio/schema/codec/JsonCodec.scala @@ -971,76 +971,82 @@ object JsonCodec { private def recordDecoder( schema: GenericRecord, discriminator: Option[String] - ): ZJsonDecoder[ListMap[String, Any]] = new ZJsonDecoder[ListMap[String, Any]] { - private[this] val fields = schema.fields.toArray - private[this] val spansWithDecoders = - new util.HashMap[String, (JsonError.ObjectAccess, ZJsonDecoder[Any])](fields.length << 1) { - fields.foreach { field => - val spanWithDecoder = - (JsonError.ObjectAccess(field.fieldName), schemaDecoder(field.schema).asInstanceOf[ZJsonDecoder[Any]]) - field.nameAndAliases.foreach(put(_, spanWithDecoder)) - } - } - private[this] val skipExtraFields = !schema.annotations.exists(_.isInstanceOf[rejectExtraFields]) - - override def unsafeDecode(trace: List[JsonError], in: RetractReader): ListMap[String, Any] = { - val lexer = Lexer - var continue = true - if (discriminator eq None) { - lexer.char(trace, in, '{') - continue = lexer.firstField(trace, in) - } - val map = new util.HashMap[String, Any](fields.length << 1) - while (continue) { - val fieldNameOrAlias = lexer.string(trace, in).toString - val spanWithDecoder = spansWithDecoders.get(fieldNameOrAlias) - if (spanWithDecoder ne null) { - val span = spanWithDecoder._1 - val dec = spanWithDecoder._2 - val trace_ = span :: trace - lexer.char(trace_, in, ':') - val fieldName = span.field // reuse strings with calculated hashCode - val prev = map.put(fieldName, dec.unsafeDecode(trace_, in)) - if (prev != null) error("duplicate", trace_) - } else if (skipExtraFields || discriminator.contains(fieldNameOrAlias)) { - lexer.char(trace, in, ':') - lexer.skipValue(trace, in) - } else error("extra field", trace) - continue = lexer.nextField(trace, in) - } - var idx = 0 - while (idx < fields.length) { - val field = fields(idx) - idx += 1 - val fieldName = field.fieldName // reuse strings with calculated hashCode - if (map.get(fieldName) == null) { - map.put( // mitigation of a linking error for `map.computeIfAbsent` in Scala.js - fieldName, { - if ((field.optional || field.transient) && field.defaultValue.isDefined) { - field.defaultValue.get - } else { - var schema = field.schema - schema match { - case l: Schema.Lazy[_] => schema = l.schema - case _ => - } - schema match { - case _: Schema.Optional[_] => None - case collection: Schema.Collection[_, _] => collection.empty - case _ => error("missing", spansWithDecoders.get(fieldName)._1 :: trace) + ): ZJsonDecoder[ListMap[String, Any]] = + if (schema.fields.foldLeft(0)(_ + _.nameAndAliases.size) <= 64) { + val ccjd = CaseClassJsonDecoder(schema, discriminator) + (trace: List[JsonError], in: RetractReader) => ccjd.unsafeDecodeListMap(trace, in) + } else { + new ZJsonDecoder[ListMap[String, Any]] { + private[this] val fields = schema.fields.toArray + private[this] val spansWithDecoders = + new util.HashMap[String, (JsonError.ObjectAccess, ZJsonDecoder[Any])](fields.length << 1) { + fields.foreach { field => + val spanWithDecoder = + (JsonError.ObjectAccess(field.fieldName), schemaDecoder(field.schema).asInstanceOf[ZJsonDecoder[Any]]) + field.nameAndAliases.foreach(put(_, spanWithDecoder)) + } + } + private[this] val skipExtraFields = !schema.annotations.exists(_.isInstanceOf[rejectExtraFields]) + + override def unsafeDecode(trace: List[JsonError], in: RetractReader): ListMap[String, Any] = { + val lexer = Lexer + var continue = true + if (discriminator eq None) { + lexer.char(trace, in, '{') + continue = lexer.firstField(trace, in) + } + val map = new util.HashMap[String, Any](fields.length << 1) + while (continue) { + val fieldNameOrAlias = lexer.string(trace, in).toString + val spanWithDecoder = spansWithDecoders.get(fieldNameOrAlias) + if (spanWithDecoder ne null) { + val span = spanWithDecoder._1 + val dec = spanWithDecoder._2 + val trace_ = span :: trace + lexer.char(trace_, in, ':') + val fieldName = span.field // reuse strings with calculated hashCode + val prev = map.put(fieldName, dec.unsafeDecode(trace_, in)) + if (prev != null) error("duplicate", trace_) + } else if (skipExtraFields || discriminator.contains(fieldNameOrAlias)) { + lexer.char(trace, in, ':') + lexer.skipValue(trace, in) + } else error("extra field", trace) + continue = lexer.nextField(trace, in) + } + var idx = 0 + while (idx < fields.length) { + val field = fields(idx) + idx += 1 + val fieldName = field.fieldName // reuse strings with calculated hashCode + if (map.get(fieldName) == null) { + map.put( // mitigation of a linking error for `map.computeIfAbsent` in Scala.js + fieldName, { + if ((field.optional || field.transient) && field.defaultValue.isDefined) { + field.defaultValue.get + } else { + var schema = field.schema + schema match { + case l: Schema.Lazy[_] => schema = l.schema + case _ => + } + schema match { + case _: Schema.Optional[_] => None + case collection: Schema.Collection[_, _] => collection.empty + case _ => error("missing", spansWithDecoders.get(fieldName)._1 :: trace) + } + } } - } + ) } - ) + } + (ListMap.newBuilder[String, Any] ++= ({ // to avoid O(n) insert operations + import scala.collection.JavaConverters.mapAsScalaMapConverter // use deprecated class for Scala 2.12 compatibility + + map.asScala + }: @scala.annotation.nowarn)).result() } } - (ListMap.newBuilder[String, Any] ++= ({ // to avoid O(n) insert operations - import scala.collection.JavaConverters.mapAsScalaMapConverter // use deprecated class for Scala 2.12 compatibility - - map.asScala - }: @scala.annotation.nowarn)).result() } - } private def fallbackDecoder[A, B](schema: Schema.Fallback[A, B]): ZJsonDecoder[Fallback[A, B]] = new ZJsonDecoder[Fallback[A, B]] { @@ -1553,6 +1559,35 @@ object JsonCodec { skipExtraFields: Boolean ) { + def unsafeDecodeListMap(trace: List[JsonError], in: RetractReader): ListMap[String, Any] = { + val buffer = unsafeDecodeFields(trace, in) + (ListMap.newBuilder[String, Any] ++= new collection.Map[String, Any] { // only `.iterator` method will be called + override def +[Any](kv: (String, Any)): collection.Map[String, Any] = ??? + + override def -(key: String): collection.Map[String, Any] = ??? + + @scala.annotation.nowarn + override def -(key1: String, key2: String, keys: String*): collection.Map[String, Any] = ??? + + override def get(key: String): Option[Any] = ??? + + override def iterator: Iterator[(String, Any)] = new Iterator[(String, Any)] { + private[this] val names = stringMatrix.xs // can contain a discriminator field name at the last position + private[this] val values = buffer + private[this] var nextIdx = 0 + + def hasNext: Boolean = nextIdx < values.length + + @inline + def next(): (String, Any) = { + val idx = nextIdx + nextIdx += 1 + (names(idx), values(idx)) + } + } + }).result() + } + def unsafeDecodeFields(trace: List[JsonError], in: RetractReader): Array[Any] = { val lexer = Lexer var continue = true From 483658b52cabdc368089f142cea05fb69d432873 Mon Sep 17 00:00:00 2001 From: Andriy Plokhotnyuk Date: Fri, 10 Jan 2025 18:13:52 +0100 Subject: [PATCH 4/4] Rollback incorrect and unsecure "Accept empty object for optional json values" --- .../scala/zio/schema/codec/JsonCodec.scala | 30 ++++--------------- .../zio/schema/codec/JsonCodecSpec.scala | 14 --------- 2 files changed, 6 insertions(+), 38 deletions(-) diff --git a/zio-schema-json/shared/src/main/scala/zio/schema/codec/JsonCodec.scala b/zio-schema-json/shared/src/main/scala/zio/schema/codec/JsonCodec.scala index be2fa8e09..514cb80aa 100644 --- a/zio-schema-json/shared/src/main/scala/zio/schema/codec/JsonCodec.scala +++ b/zio-schema-json/shared/src/main/scala/zio/schema/codec/JsonCodec.scala @@ -12,7 +12,7 @@ import scala.util.control.NonFatal import zio.json.JsonDecoder.{ JsonError, UnsafeJson } import zio.json.ast.Json -import zio.json.internal.{ Lexer, RecordingReader, RetractReader, StringMatrix, WithRecordingReader, Write } +import zio.json.internal.{ Lexer, RecordingReader, RetractReader, StringMatrix, Write } import zio.json.{ JsonCodec => ZJsonCodec, JsonDecoder => ZJsonDecoder, @@ -649,16 +649,8 @@ object JsonCodec { case _: ZJsonDecoder[_] => } - private val emptyObjectDecoder: ZJsonDecoder[Boolean] = - (_: List[JsonError], in: RetractReader) => { - val c1 = in.nextNonWhitespace() - val c2 = in.nextNonWhitespace() - c1 == '{' && c2 == '}' - } - private[schema] def option[A](A: ZJsonDecoder[A]): ZJsonDecoder[Option[A]] = - new ZJsonDecoder[Option[A]] { self => - + new ZJsonDecoder[Option[A]] { private[this] val ull: Array[Char] = "ull".toCharArray def unsafeDecode(trace: List[JsonError], in: RetractReader): Option[A] = @@ -666,16 +658,6 @@ object JsonCodec { case 'n' => Lexer.readChars(trace, in, ull, "null") None - case '{' => - // If we encounter a `{` it could either be a legitimate object or an empty object marker - in.retract() - val rr = new WithRecordingReader(in, 2) - if (emptyObjectDecoder.unsafeDecode(trace, rr)) { - None - } else { - rr.rewind() - Some(A.unsafeDecode(trace, rr)) - } case _ => in.retract() Some(A.unsafeDecode(trace, in)) @@ -1101,13 +1083,13 @@ object JsonCodec { case BadEnd() => () case _: UnsafeJson => in.retract() - val in2 = new zio.json.internal.WithRecordingReader(in, 64) + val rr = RecordingReader(in) try { - left = Some(leftDecoder.unsafeDecode(trace, in2)) + left = Some(leftDecoder.unsafeDecode(trace, rr)) } catch { case UnsafeJson(_) => - in2.rewind() - right = Some(rightDecoder.unsafeDecode(trace, in2)) + rr.rewind() + right = Some(rightDecoder.unsafeDecode(trace, rr)) } } diff --git a/zio-schema-json/shared/src/test/scala/zio/schema/codec/JsonCodecSpec.scala b/zio-schema-json/shared/src/test/scala/zio/schema/codec/JsonCodecSpec.scala index 35ce3e4db..572ee55cf 100644 --- a/zio-schema-json/shared/src/test/scala/zio/schema/codec/JsonCodecSpec.scala +++ b/zio-schema-json/shared/src/test/scala/zio/schema/codec/JsonCodecSpec.scala @@ -997,20 +997,6 @@ object JsonCodecSpec extends ZIOSpecDefault { charSequenceToByteChunk("""{"a":"s"}""") ) }, - test("case class with option fields accept empty json object as value") { - assertDecodes( - WithOptionFields.schema, - WithOptionFields(Some("s"), None), - charSequenceToByteChunk("""{"a":"s", "b":{}}""") - ) - }, - test("case class with complex option field accept empty json object as value") { - assertDecodes( - WithComplexOptionField.schema, - WithComplexOptionField(None), - charSequenceToByteChunk("""{"order":{}}""") - ) - }, test("case class with complex option field correctly decodes") { assertDecodes( WithComplexOptionField.schema,