From 4c6ad91d0b7c0f56aa51f95c8389384d83cd217a Mon Sep 17 00:00:00 2001 From: Joannis Orlandos Date: Sun, 5 Mar 2023 21:06:55 +0100 Subject: [PATCH 1/2] Add some codable performance improvements --- .../BSON/Codable/Decoding/BSONDecoder.swift | 8 + .../Decoding/BSONDecoderSettings.swift | 2 +- .../Decoding/Fast/FastBSONDecoder.swift | 831 ++++++++++++++++++ Sources/BSON/Document/Document+Array.swift | 32 +- .../BSON/Document/Document+Validation.swift | 6 +- Sources/BSON/Helpers/ByteBuffer+Helpers.swift | 24 + Sources/BSON/Types/Primitives.swift | 120 +-- Tests/BSONTests/BSONPublicTests.swift | 32 +- 8 files changed, 976 insertions(+), 79 deletions(-) create mode 100644 Sources/BSON/Codable/Decoding/Fast/FastBSONDecoder.swift diff --git a/Sources/BSON/Codable/Decoding/BSONDecoder.swift b/Sources/BSON/Codable/Decoding/BSONDecoder.swift index 9c19df5..8e88ef7 100644 --- a/Sources/BSON/Codable/Decoding/BSONDecoder.swift +++ b/Sources/BSON/Codable/Decoding/BSONDecoder.swift @@ -102,6 +102,14 @@ extension BSONDecoderSettings.IntegerDecodingStrategy { } /// Decodes the `value` without key to an integer of type `I` using the current strategy + @_specialize(where I == UInt8) + @_specialize(where I == Int8) + @_specialize(where I == UInt16) + @_specialize(where I == Int16) + @_specialize(where I == UInt32) + @_specialize(where I == Int32) + @_specialize(where I == UInt) + @_specialize(where I == Int) internal func decode( from decoder: _BSONDecoder, path: @autoclosure () -> [String] diff --git a/Sources/BSON/Codable/Decoding/BSONDecoderSettings.swift b/Sources/BSON/Codable/Decoding/BSONDecoderSettings.swift index ada20b1..bf6885c 100644 --- a/Sources/BSON/Codable/Decoding/BSONDecoderSettings.swift +++ b/Sources/BSON/Codable/Decoding/BSONDecoderSettings.swift @@ -159,7 +159,7 @@ public struct BSONDecoderSettings { public var decodeObjectIdFromString: Bool = false /// If `true`, allows decoding ObjectIds from Strings if they're formatted as a 24-character hexString - public var decodeDateFromTimestamp: Bool = false + public var decodeDateFromTimestamp: Bool = true /// A strategy that is applied when encountering a request to decode a `Float` public var floatDecodingStrategy: FloatDecodingStrategy diff --git a/Sources/BSON/Codable/Decoding/Fast/FastBSONDecoder.swift b/Sources/BSON/Codable/Decoding/Fast/FastBSONDecoder.swift new file mode 100644 index 0000000..9315d23 --- /dev/null +++ b/Sources/BSON/Codable/Decoding/Fast/FastBSONDecoder.swift @@ -0,0 +1,831 @@ +import Foundation + +public struct FastBSONDecoder { + public init() {} + + public func decode(_ type: D.Type = D.self, from primitive: P) throws -> D { + let decoder = _FastBSONDecoder(value: primitive) + return try D.init(from: decoder) + } +} + +struct _FastBSONDecoder: Decoder { + let value: P + var userInfo = [CodingUserInfoKey : Any]() + var codingPath: [CodingKey] { [] } + + func container(keyedBy type: Key.Type) throws -> KeyedDecodingContainer where Key : CodingKey, P == Document { + KeyedDecodingContainer(_FastKeyedContainer(document: value)) + } + + func container(keyedBy type: Key.Type) throws -> KeyedDecodingContainer where Key : CodingKey { + guard let value = value as? Document else { + throw BSONTypeConversionError(from: value, to: Document.self) + } + + return KeyedDecodingContainer(_FastKeyedContainer(document: value)) + } + + func singleValueContainer() throws -> SingleValueDecodingContainer { + _FastSingleValueContainer(value: value) + } + + func unkeyedContainer() throws -> UnkeyedDecodingContainer { + guard let value = value as? Document else { + throw BSONTypeConversionError(from: value, to: Document.self) + } + + return _FastUnkeyedContainer(document: value, endIndex: value.count) + } +} + +struct _FastKeyedContainer: KeyedDecodingContainerProtocol { + let document: Document + var codingPath: [CodingKey] { [] } + + var allKeys: [Key] { document.keys.compactMap(Key.init) } + + func contains(_ key: Key) -> Bool { + document.containsKey(key.stringValue) + } + + func decode(_ type: Int.Type, forKey key: Key) throws -> Int { + #if (arch(i386) || arch(arm)) && BSONInt64Primitive + let expectedType: TypeIdentifier = .int32 + #else + let expectedType: TypeIdentifier = .int64 + #endif + + guard + let (foundType, offset) = document.typeAndValueOffset(forKey: key.stringValue), + foundType == expectedType, + let int: Int = document.storage.getInteger(at: offset, endianness: .little) + else { + throw BSONValueNotFound(type: Int.self, path: codingPath.map(\.stringValue)) + } + + return int + } + + func decode(_ type: Int8.Type, forKey key: Key) throws -> Int8 { + try decodeFixedWidthInteger(forKey: key) + } + + func decode(_ type: Int16.Type, forKey key: Key) throws -> Int16 { + try decodeFixedWidthInteger(forKey: key) + } + + func decode(_ type: Int32.Type, forKey key: Key) throws -> Int32 { + guard + let (type, offset) = document.typeAndValueOffset(forKey: key.stringValue), + type == .int32, + let int: Int32 = document.storage.getInteger(at: offset, endianness: .little) + else { + throw BSONValueNotFound(type: Int32.self, path: codingPath.map(\.stringValue)) + } + + return int + } + + func decode(_ type: Int64.Type, forKey key: Key) throws -> Int64 { + guard + let (type, offset) = document.typeAndValueOffset(forKey: key.stringValue), + type == .int64, + let int: Int64 = document.storage.getInteger(at: offset, endianness: .little) + else { + throw BSONValueNotFound(type: Int64.self, path: codingPath.map(\.stringValue)) + } + + return int + } + + func decode(_ type: UInt.Type, forKey key: Key) throws -> UInt { + try decodeFixedWidthInteger(forKey: key) + } + + func decode(_ type: UInt8.Type, forKey key: Key) throws -> UInt8 { + try decodeFixedWidthInteger(forKey: key) + } + + func decode(_ type: UInt16.Type, forKey key: Key) throws -> UInt16 { + try decodeFixedWidthInteger(forKey: key) + } + + func decode(_ type: UInt32.Type, forKey key: Key) throws -> UInt32 { + try decodeFixedWidthInteger(forKey: key) + } + + func decode(_ type: UInt64.Type, forKey key: Key) throws -> UInt64 { + try decodeFixedWidthInteger(forKey: key) + } + + @inline(__always) + func decodeFixedWidthInteger(_ type: F.Type = F.self, forKey key: Key) throws -> F { + guard let (type, offset) = document.typeAndValueOffset(forKey: key.stringValue) else { + throw BSONValueNotFound(type: F.self, path: codingPath.map(\.stringValue)) + } + + switch type { + case .int32: + guard + let int: Int32 = document.storage.getInteger(at: offset, endianness: .little), + int >= F.min, + int <= F.max + else { + throw BSONTypeConversionError(from: type, to: F.self) + } + + return F(int) + case .int64: + guard + let int: _BSON64BitInteger = document.storage.getInteger(at: offset, endianness: .little), + int >= F.min, + int <= F.max + else { + throw BSONTypeConversionError(from: type, to: F.self) + } + + return F(int) + default: + throw BSONValueNotFound(type: F.self, path: codingPath.map(\.stringValue)) + } + } + + func decode(_ type: Bool.Type, forKey key: Key) throws -> Bool { + guard + let (type, offset) = document.typeAndValueOffset(forKey: key.stringValue), + type == .boolean, + let int: UInt8 = document.storage.getInteger(at: offset, endianness: .little) + else { + throw BSONValueNotFound(type: Bool.self, path: codingPath.map(\.stringValue)) + } + + return int == 0x01 + } + + func decode(_ type: String.Type, forKey key: Key) throws -> String { + guard + let (type, offset) = document.typeAndValueOffset(forKey: key.stringValue), + type == .string, + let string = document.storage.getBSONString(at: offset) + else { + throw BSONValueNotFound(type: String.self, path: codingPath.map(\.stringValue)) + } + + return string + } + + func decode(_ type: Double.Type, forKey key: Key) throws -> Double { + guard + let (type, offset) = document.typeAndValueOffset(forKey: key.stringValue), + type == .double, + let double = document.storage.getDouble(at: offset) + else { + throw BSONValueNotFound(type: Double.self, path: codingPath.map(\.stringValue)) + } + + return double + } + + func decode(_ type: T.Type, forKey key: Key) throws -> T where T : Decodable { + switch document[key.stringValue] { + case let value as Double: // 0x01 + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as String: // 0x0 + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as Document: // 0x03 (embedded document) or 0x04 (array) + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as Binary: // 0x05 + if T.self == Data.self { + return value.data as! T + } + + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + // 0x06 is deprecated + case let value as ObjectId: // 0x07 + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as Bool: // 0x08 + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as Date: // 0x09 + if T.self == Date.self { + return value as! T + } + + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case is Null: // 0x0A + let decoder = _FastBSONDecoder(value: Null()) + return try T.init(from: decoder) + case let value as RegularExpression: // 0x0B + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + // 0x0C is deprecated (DBPointer) + // 0x0E is deprecated (Symbol) + case let value as Int32: // 0x10 + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as Timestamp: + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as _BSON64BitInteger: // 0x12 + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as Decimal128: + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case is MaxKey: // 0x7F + let decoder = _FastBSONDecoder(value: MaxKey()) + return try T.init(from: decoder) + case is MinKey: // 0xFF + let decoder = _FastBSONDecoder(value: MinKey()) + return try T.init(from: decoder) + case let value as JavaScriptCode: + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as JavaScriptCodeWithScope: + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + default: + throw BSONValueNotFound(type: Void.self, path: codingPath.map(\.stringValue)) + } + } + + func decodeNil(forKey key: Key) throws -> Bool { + guard let type = document.typeIdentifier(of: key.stringValue) else { + return true + } + + return type == .null + } + + func decode(_ type: Float.Type, forKey key: Key) throws -> Float { + guard + let (type, offset) = document.typeAndValueOffset(forKey: key.stringValue), + type == .double, + let double = document.storage.getDouble(at: offset) + else { + throw BSONValueNotFound(type: Float.self, path: codingPath.map(\.stringValue)) + } + + return Float(double) + } + + func nestedContainer(keyedBy type: NestedKey.Type, forKey key: Key) throws -> KeyedDecodingContainer where NestedKey : CodingKey { + guard + let (type, offset) = document.typeAndValueOffset(forKey: key.stringValue), + type == .document, + let length = document.storage.getInteger(at: offset, endianness: .little, as: Int32.self), + let slice = document.storage.getSlice(at: offset, length: numericCast(length)) + else { + throw BSONValueNotFound(type: Document.self, path: codingPath.map(\.stringValue)) + } + + let nestedDocument = Document(buffer: slice, isArray: type == .array) + return KeyedDecodingContainer(_FastKeyedContainer(document: nestedDocument)) + } + + func nestedUnkeyedContainer(forKey key: Key) throws -> UnkeyedDecodingContainer { + guard + let (type, offset) = document.typeAndValueOffset(forKey: key.stringValue), + type == .array, + let length = document.storage.getInteger(at: offset, endianness: .little, as: Int32.self), + let slice = document.storage.getSlice(at: offset, length: numericCast(length)) + else { + throw BSONValueNotFound(type: Document.self, path: codingPath.map(\.stringValue)) + } + + let nestedDocument = Document(buffer: slice, isArray: type == .array) + return _FastUnkeyedContainer(document: nestedDocument, endIndex: nestedDocument.count) + } + + func superDecoder() throws -> Decoder { + fatalError() + } + + func superDecoder(forKey key: Key) throws -> Decoder { + fatalError() + } +} + +struct _FastSingleValueContainer: SingleValueDecodingContainer, AnySingleValueBSONDecodingContainer { + let value: P + var codingPath: [CodingKey] { [] } + + func decodeNil() -> Bool { + value is Null + } + + func decodeObjectId() throws -> ObjectId where P == ObjectId { + value + } + + func decodeObjectId() throws -> ObjectId { + guard let value = value as? ObjectId else { + throw BSONValueNotFound(type: ObjectId.self, path: codingPath.map(\.stringValue)) + } + + return value + } + + func decodeDocument() throws -> Document where P == Document { + value + } + + func decodeDocument() throws -> Document { + guard let value = value as? Document else { + throw BSONValueNotFound(type: Document.self, path: codingPath.map(\.stringValue)) + } + + return value + } + + func decodeDecimal128() throws -> Decimal128 where P == Decimal128 { + value + } + + func decodeDecimal128() throws -> Decimal128 { + guard let value = value as? Decimal128 else { + throw BSONValueNotFound(type: Decimal128.self, path: codingPath.map(\.stringValue)) + } + + return value + } + + func decodeBinary() throws -> Binary where P == Binary { + value + } + + func decodeBinary() throws -> Binary { + guard let value = value as? Binary else { + throw BSONValueNotFound(type: Binary.self, path: codingPath.map(\.stringValue)) + } + + return value + } + + func decodeRegularExpression() throws -> RegularExpression where P == RegularExpression { + value + } + + func decodeRegularExpression() throws -> RegularExpression { + guard let value = value as? RegularExpression else { + throw BSONValueNotFound(type: RegularExpression.self, path: codingPath.map(\.stringValue)) + } + + return value + } + + func decodeNull() throws -> Null where P == Null { + value + } + + func decodeNull() throws -> Null { + guard value is Null else { + throw BSONValueNotFound(type: Null.self, path: codingPath.map(\.stringValue)) + } + + return Null() + } + + func decode(_ type: P.Type) throws -> P where P : Decodable { + return value + } + + func decode(_ type: Int.Type) throws -> Int { + if let value = value as? Int { + return value + } + + throw BSONValueNotFound(type: Int.self, path: codingPath.map(\.stringValue)) + } + + func decode(_ type: Int8.Type) throws -> Int8 { + try decodeFixedWidthInteger() + } + + func decode(_ type: Int16.Type) throws -> Int16 { + try decodeFixedWidthInteger() + } + + func decode(_ type: Int32.Type) throws -> Int32 { + if let value = value as? Int32 { + return value + } + + throw BSONValueNotFound(type: Int32.self, path: codingPath.map(\.stringValue)) + } + + func decode(_ type: Int64.Type) throws -> Int64 { + if let value = value as? Int64 { + return value + } + + throw BSONValueNotFound(type: Int64.self, path: codingPath.map(\.stringValue)) + } + + func decode(_ type: UInt.Type) throws -> UInt { + try decodeFixedWidthInteger() + } + + func decode(_ type: UInt8.Type) throws -> UInt8 { + try decodeFixedWidthInteger() + } + + func decode(_ type: UInt16.Type) throws -> UInt16 { + try decodeFixedWidthInteger() + } + + func decode(_ type: UInt32.Type) throws -> UInt32 { + try decodeFixedWidthInteger() + } + + func decode(_ type: UInt64.Type) throws -> UInt64 { + try decodeFixedWidthInteger() + } + + func decode(_ type: T.Type) throws -> T where T : Decodable { + if T.self == Date.self, let value = value as? Date { + return value as! T + } else if T.self == Data.self, let value = value as? Binary { + return value.data as! T + } + + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + } + + func decode(_ type: Float.Type) throws -> Float where P == Double { + return Float(value) + } + + func decode(_ type: Float.Type) throws -> Float { + guard let double = value as? Double else { + throw BSONValueNotFound(type: Float.self, path: codingPath.map(\.stringValue)) + } + + return Float(double) + } + + func decode(_ type: Bool.Type) throws -> Bool where P == Bool { + return value + } + + func decode(_ type: Bool.Type) throws -> Bool { + guard let value = value as? Bool else { + throw BSONValueNotFound(type: Bool.self, path: codingPath.map(\.stringValue)) + } + + return value + } + + func decode(_ type: String.Type) throws -> String where P == String { + return value + } + + func decode(_ type: String.Type) throws -> String { + guard let value = value as? String else { + throw BSONValueNotFound(type: String.self, path: codingPath.map(\.stringValue)) + } + + return value + } + + func decode(_ type: Double.Type) throws -> Double where P == Double { + return value + } + + func decode(_ type: Double.Type) throws -> Double { + guard let value = value as? Double else { + throw BSONValueNotFound(type: Double.self, path: codingPath.map(\.stringValue)) + } + + return value + } + + @inline(__always) + func decodeFixedWidthInteger(_ type: F.Type = F.self) throws -> F { + switch value { + case let int as F: + return int + case let int as Int32: + guard int >= F.min, int <= F.max else { + throw BSONTypeConversionError(from: int, to: F.self) + } + + return F(int) + case let int as _BSON64BitInteger: + guard int >= F.min, int <= F.max else { + throw BSONTypeConversionError(from: int, to: F.self) + } + + return F(int) + default: + throw BSONValueNotFound(type: F.self, path: codingPath.map(\.stringValue)) + } + } +} + +struct _FastUnkeyedContainer: UnkeyedDecodingContainer { + let document: Document + var endIndex: Int + var currentIndex: Int = 0 + var count: Int? { endIndex } + var codingPath: [CodingKey] { [] } + var isAtEnd: Bool { currentIndex >= endIndex } + + mutating func decodeNil() -> Bool { + guard + let (type, _) = document.typeAndValueOffset(at: currentIndex), + type == .null + else { + return false + } + + currentIndex += 1 + return true + } + + mutating func decodeObjectId() throws -> ObjectId { + guard + let (type, offset) = document.typeAndValueOffset(at: currentIndex), + type == .objectId, + let objectId = document.storage.getObjectId(at: offset) + else { + throw BSONValueNotFound(type: ObjectId.self, path: codingPath.map(\.stringValue)) + } + + currentIndex += 1 + return objectId + } + + mutating func decode(_ type: Bool.Type) throws -> Bool { + guard + let (type, offset) = document.typeAndValueOffset(at: currentIndex), + type == .boolean, + let bool: UInt8 = document.storage.getInteger(at: offset) + else { + throw BSONValueNotFound(type: Bool.self, path: codingPath.map(\.stringValue)) + } + + currentIndex += 1 + return bool == 0x01 + } + + mutating func decode(_ type: String.Type) throws -> String { + guard + let (type, offset) = document.typeAndValueOffset(at: currentIndex), + type == .string, + let string = document.storage.getBSONString(at: offset) + else { + throw BSONValueNotFound(type: String.self, path: codingPath.map(\.stringValue)) + } + + currentIndex += 1 + return string + } + + mutating func decode(_ type: Double.Type) throws -> Double { + guard + let (type, offset) = document.typeAndValueOffset(at: currentIndex), + type == .double, + let double = document.storage.getDouble(at: offset) + else { + throw BSONValueNotFound(type: Double.self, path: codingPath.map(\.stringValue)) + } + + currentIndex += 1 + return double + } + + mutating func decode(_ type: Float.Type) throws -> Float { + guard + let (type, offset) = document.typeAndValueOffset(at: currentIndex), + type == .double, + let double = document.storage.getDouble(at: offset) + else { + throw BSONValueNotFound(type: Double.self, path: codingPath.map(\.stringValue)) + } + + currentIndex += 1 + return Float(double) + } + + mutating func decode(_ type: Int.Type) throws -> Int { + #if (arch(i386) || arch(arm)) && BSONInt64Primitive + let expectedType: TypeIdentifier = .int32 + #else + let expectedType: TypeIdentifier = .int64 + #endif + + guard + let (foundType, offset) = document.typeAndValueOffset(at: currentIndex), + foundType == expectedType, + let int: Int = document.storage.getInteger(at: offset, endianness: .little) + else { + throw BSONValueNotFound(type: Int.self, path: codingPath.map(\.stringValue)) + } + + currentIndex += 1 + return int + } + + mutating func decode(_ type: Int32.Type) throws -> Int32 { + guard + let (type, offset) = document.typeAndValueOffset(at: currentIndex), + type == .int32, + let int: Int32 = document.storage.getInteger(at: offset, endianness: .little) + else { + throw BSONValueNotFound(type: Int32.self, path: codingPath.map(\.stringValue)) + } + + currentIndex += 1 + return int + } + + mutating func decode(_ type: Int64.Type) throws -> Int64 { + guard + let (type, offset) = document.typeAndValueOffset(at: currentIndex), + type == .int64, + let int: Int64 = document.storage.getInteger(at: offset, endianness: .little) + else { + throw BSONValueNotFound(type: Int64.self, path: codingPath.map(\.stringValue)) + } + + currentIndex += 1 + return int + } + + mutating func decode(_ type: Int8.Type) throws -> Int8 { + try decodeFixedWidthInteger() + } + + mutating func decode(_ type: Int16.Type) throws -> Int16 { + try decodeFixedWidthInteger() + } + + mutating func decode(_ type: UInt.Type) throws -> UInt { + try decodeFixedWidthInteger() + } + + mutating func decode(_ type: UInt8.Type) throws -> UInt8 { + try decodeFixedWidthInteger() + } + + mutating func decode(_ type: UInt16.Type) throws -> UInt16 { + try decodeFixedWidthInteger() + } + + mutating func decode(_ type: UInt32.Type) throws -> UInt32 { + try decodeFixedWidthInteger() + } + + mutating func decode(_ type: UInt64.Type) throws -> UInt64 { + try decodeFixedWidthInteger() + } + + @inline(__always) + mutating func decodeFixedWidthInteger(_ type: F.Type = F.self) throws -> F { + guard + let (type, offset) = document.typeAndValueOffset(at: currentIndex) + else { + throw BSONValueNotFound(type: Int64.self, path: codingPath.map(\.stringValue)) + } + + switch type { + case .int32: + guard + let int: Int32 = document.storage.getInteger(at: offset, endianness: .little), + int >= F.min, + int <= F.max + else { + throw BSONValueNotFound(type: F.self, path: codingPath.map(\.stringValue)) + } + + currentIndex += 1 + return F(int) + case .int64: + guard + let int: _BSON64BitInteger = document.storage.getInteger(at: offset, endianness: .little), + int >= F.min, + int <= F.max + else { + throw BSONValueNotFound(type: F.self, path: codingPath.map(\.stringValue)) + } + + currentIndex += 1 + return F(int) + default: + throw BSONValueNotFound(type: F.self, path: codingPath.map(\.stringValue)) + } + } + + mutating func decode(_ type: T.Type) throws -> T where T : Decodable { + defer { currentIndex += 1 } + switch document[currentIndex] { + case let value as Double: // 0x01 + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as String: // 0x0 + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as Document: // 0x03 (embedded document) or 0x04 (array) + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as Binary: // 0x05 + if T.self == Data.self { + return value.data as! T + } + + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + // 0x06 is deprecated + case let value as ObjectId: // 0x07 + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as Bool: // 0x08 + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as Date: // 0x09 + if T.self == Date.self { + return value as! T + } + + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case is Null: // 0x0A + let decoder = _FastBSONDecoder(value: Null()) + return try T.init(from: decoder) + case let value as RegularExpression: // 0x0B + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + // 0x0C is deprecated (DBPointer) + // 0x0E is deprecated (Symbol) + case let value as Int32: // 0x10 + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as Timestamp: + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as _BSON64BitInteger: // 0x12 + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as Decimal128: + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case is MaxKey: // 0x7F + let decoder = _FastBSONDecoder(value: MaxKey()) + return try T.init(from: decoder) + case is MinKey: // 0xFF + let decoder = _FastBSONDecoder(value: MinKey()) + return try T.init(from: decoder) + case let value as JavaScriptCode: + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + case let value as JavaScriptCodeWithScope: + let decoder = _FastBSONDecoder(value: value) + return try T.init(from: decoder) + default: + throw BSONValueNotFound(type: Void.self, path: codingPath.map(\.stringValue)) + } + } + + mutating func nestedContainer(keyedBy type: NestedKey.Type) throws -> KeyedDecodingContainer where NestedKey : CodingKey { + guard + let (type, offset) = document.typeAndValueOffset(at: currentIndex), + type == .document, + let length = document.storage.getInteger(at: offset, endianness: .little, as: Int32.self), + let slice = document.storage.getSlice(at: offset, length: numericCast(length)) + else { + throw BSONValueNotFound(type: Document.self, path: codingPath.map(\.stringValue)) + } + + let nestedDocument = Document(buffer: slice, isArray: type == .array) + currentIndex += 1 + return KeyedDecodingContainer(_FastKeyedContainer(document: nestedDocument)) + } + + mutating func nestedUnkeyedContainer() throws -> UnkeyedDecodingContainer { + guard + let (type, offset) = document.typeAndValueOffset(at: currentIndex), + type == .array, + let length = document.storage.getInteger(at: offset, endianness: .little, as: Int32.self), + let slice = document.storage.getSlice(at: offset, length: numericCast(length)) + else { + throw BSONValueNotFound(type: Document.self, path: codingPath.map(\.stringValue)) + } + + let nestedDocument = Document(buffer: slice, isArray: type == .array) + currentIndex += 1 + return _FastUnkeyedContainer(document: nestedDocument, endIndex: nestedDocument.count) + } + + mutating func superDecoder() throws -> Decoder { + fatalError() + } +} diff --git a/Sources/BSON/Document/Document+Array.swift b/Sources/BSON/Document/Document+Array.swift index a6e96fc..784a971 100644 --- a/Sources/BSON/Document/Document+Array.swift +++ b/Sources/BSON/Document/Document+Array.swift @@ -35,22 +35,32 @@ extension Document: ExpressibleByArrayLiteral { return values } + @inline(__always) + internal func typeAndValueOffset(at index: Int) -> (TypeIdentifier, Int)? { + var offset = 4 + for _ in 0.. Primitive { get { - var offset = 4 - for _ in 0.. ValidationResult { + static func validate(buffer: ByteBuffer) -> ValidationResult { var currentIndex = 0 func errorFound(reason: String, key: String? = nil) -> ValidationResult { @@ -91,7 +91,7 @@ extension Document { return errorFound(reason: .notEnoughBytesForValue) } - var recursiveValidation = Document.validate(buffer: subBuffer, asArray: array) + var recursiveValidation = Document.validate(buffer: subBuffer) currentIndex += Int(documentLength) guard recursiveValidation.isValid else { @@ -253,6 +253,6 @@ extension Document { /// /// If `validatingRecursively` is `true` the subdocuments will be traversed, too public func validate() -> ValidationResult { - return Document.validate(buffer: storage, asArray: self.isArray) + return Document.validate(buffer: storage) } } diff --git a/Sources/BSON/Helpers/ByteBuffer+Helpers.swift b/Sources/BSON/Helpers/ByteBuffer+Helpers.swift index 808df75..95833c6 100644 --- a/Sources/BSON/Helpers/ByteBuffer+Helpers.swift +++ b/Sources/BSON/Helpers/ByteBuffer+Helpers.swift @@ -20,6 +20,30 @@ extension ByteBuffer { return ObjectId(timestamp: timestamp, random: random) } + func getBSONString(at offset: Int) -> String? { + guard let length = getInteger(at: offset, endianness: .little, as: Int32.self) else { + return nil + } + + // Omit the null terminator as we don't use/need that in Swift + return getString(at: offset &+ 4, length: numericCast(length) - 1) + } + + func getBSONBinary(at offset: Int) -> Binary? { + guard let length = getInteger(at: offset, endianness: .little, as: Int32.self) else { + return nil + } + + guard + let subType = getByte(at: offset &+ 4), + let slice = getSlice(at: offset &+ 5, length: numericCast(length)) + else { + return nil + } + + return Binary(subType: Binary.SubType(subType), buffer: slice) + } + func getByte(at offset: Int) -> UInt8? { return self.getInteger(at: offset, endianness: .little, as: UInt8.self) } diff --git a/Sources/BSON/Types/Primitives.swift b/Sources/BSON/Types/Primitives.swift index 48972c5..4616b93 100644 --- a/Sources/BSON/Types/Primitives.swift +++ b/Sources/BSON/Types/Primitives.swift @@ -79,61 +79,70 @@ extension Document { } public init(from decoder: Decoder) throws { - if let decoder = try decoder.singleValueContainer() as? AnySingleValueBSONDecodingContainer { - self = try decoder.decodeDocument() + switch decoder { + case let decoder as _FastBSONDecoder: + self = decoder.value return - } - - struct Key: CodingKey { - var stringValue: String - var intValue: Int? { nil } - - init?(intValue: Int) { nil } - - init(stringValue: String) { - self.stringValue = stringValue - } - } - - let container = try decoder.container(keyedBy: Key.self) - var document = Document() - - nextKey: for key in container.allKeys { - if try container.decodeNil(forKey: key) { - continue nextKey - } - - if let string = try? container.decode(String.self, forKey: key) { - document[key.stringValue] = string - continue nextKey - } - - if let int = try? container.decode(Int.self, forKey: key) { - document[key.stringValue] = int - continue nextKey + case let decoder as _BSONDecoder: + let primitive = decoder.primitive + guard let document = primitive as? Document else { + throw BSONTypeConversionError(from: primitive, to: Document.self) } - if let int = try? container.decode(Int32.self, forKey: key) { - document[key.stringValue] = int - continue nextKey + self = document + return + default: + struct Key: CodingKey { + var stringValue: String + var intValue: Int? { nil } + + init?(intValue: Int) { nil } + + init(stringValue: String) { + self.stringValue = stringValue + } } - if let double = try? container.decode(Double.self, forKey: key) { - document[key.stringValue] = double - continue nextKey - } + let container = try decoder.container(keyedBy: Key.self) + var document = Document() - if let bool = try? container.decode(Bool.self, forKey: key) { - document[key.stringValue] = bool - continue nextKey + nextKey: for key in container.allKeys { + if try container.decodeNil(forKey: key) { + continue nextKey + } + + if let string = try? container.decode(String.self, forKey: key) { + document[key.stringValue] = string + continue nextKey + } + + if let int = try? container.decode(Int.self, forKey: key) { + document[key.stringValue] = int + continue nextKey + } + + if let int = try? container.decode(Int32.self, forKey: key) { + document[key.stringValue] = int + continue nextKey + } + + if let double = try? container.decode(Double.self, forKey: key) { + document[key.stringValue] = double + continue nextKey + } + + if let bool = try? container.decode(Bool.self, forKey: key) { + document[key.stringValue] = bool + continue nextKey + } + + // TODO: Niche Int cases + + throw UnsupportedDocumentDecoding() } - // TODO: Niche Int cases - - throw UnsupportedDocumentDecoding() + self = document } - - self = document } } @@ -164,11 +173,20 @@ extension ObjectId: Primitive { } public init(from decoder: Decoder) throws { - let container = try decoder.singleValueContainer() - - if let container = container as? AnySingleValueBSONDecodingContainer { - self = try container.decodeObjectId() - } else { + switch decoder { + case let decoder as _FastBSONDecoder: + self = decoder.value + return + case let decoder as _BSONDecoder: + let primitive = decoder.primitive + guard let value = primitive as? ObjectId else { + throw BSONTypeConversionError(from: primitive, to: ObjectId.self) + } + + self = value + return + default: + let container = try decoder.singleValueContainer() let string = try container.decode(String.self) self = try ObjectId.make(from: string) } diff --git a/Tests/BSONTests/BSONPublicTests.swift b/Tests/BSONTests/BSONPublicTests.swift index 54e5478..1156c35 100644 --- a/Tests/BSONTests/BSONPublicTests.swift +++ b/Tests/BSONTests/BSONPublicTests.swift @@ -289,6 +289,8 @@ final class BSONPublicTests: XCTestCase { } func testWrappedDateCodables() throws { + struct Oopsie: Error {} + @propertyWrapper struct Field: Codable { public let key: String? @@ -301,7 +303,8 @@ final class BSONPublicTests: XCTestCase { public init(from decoder: Decoder) throws { guard let key = decoder.codingPath.last?.stringValue else { - fatalError() + XCTFail() + throw Oopsie() } self.key = key @@ -426,18 +429,21 @@ final class BSONPublicTests: XCTestCase { "morePi": 3.14 ] - let decoder = BSONDecoder() - - let huge = try decoder.decode(HugeDocument.self, from: doc) - XCTAssertEqual(huge._id, id) - XCTAssertEqual(huge.age, 244) - XCTAssertEqual(huge.year, 1774) - XCTAssertEqual(huge.epoch, 1522809334) - XCTAssertEqual(huge.bigNum, .max) - XCTAssertEqual(huge.biggerNum, 1) - XCTAssertEqual(huge.awesome, true) - XCTAssertEqual(huge.pi, 3.14) - XCTAssertEqual(huge.morePi, 3.14) + for _ in 0..<100_000 { + let decoder = BSONDecoder() +// let decoder = BSONDecoder() + + _ = try decoder.decode(HugeDocument.self, from: doc) +// XCTAssertEqual(huge._id, id) +// XCTAssertEqual(huge.age, 244) +// XCTAssertEqual(huge.year, 1774) +// XCTAssertEqual(huge.epoch, 1522809334) +// XCTAssertEqual(huge.bigNum, .max) +// XCTAssertEqual(huge.biggerNum, 1) +// XCTAssertEqual(huge.awesome, true) +// XCTAssertEqual(huge.pi, 3.14) +// XCTAssertEqual(huge.morePi, 3.14) + } } func testEquality() { From 8b54dd06db57ba3936252df0891877d95451d6fb Mon Sep 17 00:00:00 2001 From: Joannis Orlandos Date: Sun, 5 Mar 2023 21:10:02 +0100 Subject: [PATCH 2/2] Default to incorrect behaviour in previous releases, decoding date from double --- Sources/BSON/Codable/Decoding/BSONDecoderSettings.swift | 2 +- Tests/BSONTests/BSONEncoderTests.swift | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/Sources/BSON/Codable/Decoding/BSONDecoderSettings.swift b/Sources/BSON/Codable/Decoding/BSONDecoderSettings.swift index bf6885c..626a384 100644 --- a/Sources/BSON/Codable/Decoding/BSONDecoderSettings.swift +++ b/Sources/BSON/Codable/Decoding/BSONDecoderSettings.swift @@ -158,7 +158,7 @@ public struct BSONDecoderSettings { /// If `true`, allows decoding ObjectIds from Strings if they're formatted as a 24-character hexString public var decodeObjectIdFromString: Bool = false - /// If `true`, allows decoding ObjectIds from Strings if they're formatted as a 24-character hexString + /// If `true`, allows decoding Date from a Double (TimeInterval) public var decodeDateFromTimestamp: Bool = true /// A strategy that is applied when encountering a request to decode a `Float` diff --git a/Tests/BSONTests/BSONEncoderTests.swift b/Tests/BSONTests/BSONEncoderTests.swift index 2f75589..3530121 100644 --- a/Tests/BSONTests/BSONEncoderTests.swift +++ b/Tests/BSONTests/BSONEncoderTests.swift @@ -97,7 +97,7 @@ class BSONEncoderTests: XCTestCase { } let container = try BSONDecoder().decode(DateContainer.self, from: document) - XCTAssertEqual(date, container.date) + XCTAssertEqual(date.timeIntervalSince1970, container.date.timeIntervalSince1970) } @available(OSX 10.12, *)