forked from synopse/mORMot2
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmormot.db.nosql.bson.pas
4730 lines (4405 loc) · 157 KB
/
mormot.db.nosql.bson.pas
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
/// Database Framework BSON Encoding for MongoDB
// - this unit is a part of the Open Source Synopse mORMot framework 2,
// licensed under a MPL/GPL/LGPL three license - see LICENSE.md
unit mormot.db.nosql.bson;
{
*****************************************************************************
Efficient BSON Support for MongoDB Clients
- BSON Decimal128 Value
- BSON ObjectID Value
- TBsonVariantData / TBsonVariant Custom Variant Storage
- TBsonElement / TBsonIterator for BSON Decoding
- TBsonWriter for BSON Encoding
- High-Level BSON/JSON Function Helpers
*****************************************************************************
}
interface
{$I ..\mormot.defines.inc}
uses
sysutils,
classes,
variants,
mormot.core.base,
mormot.core.os,
mormot.core.unicode,
mormot.core.text,
mormot.core.buffers,
mormot.core.variants,
mormot.core.json,
mormot.core.rtti,
mormot.core.datetime,
mormot.core.data,
mormot.core.perf,
mormot.core.log,
mormot.db.core;
{ ************ BSON Decimal128 Value }
type
/// binary representation of a 128-bit decimal, stored as 16 bytes
// - i.e. IEEE 754-2008 128-bit decimal floating point as used in the
// BSON Decimal128 format, and processed by the TDecimal128 object
TDecimal128Bits = record
case integer of
0:
(lo, hi: QWord);
1:
(l, h: Int64);
2:
(b: array[0..15] of byte);
3:
(c: array[0..3] of cardinal);
end;
/// points to a 128-bit decimal binary
PDecimal128Bits = ^TDecimal128Bits;
/// enough characters to contain any TDecimal128 text representation
TDecimal128Str = array[0..42] of AnsiChar;
/// some special 128-bit decimal values
// - see TDecimal128.SetSpecial to set the corresponding value
// - dsvError is returned by TDecimal128.FromText() on parsing error
// - dsvValue indicates that this is not a known "special" value, but some
// valid decimal number
TDecimal128SpecialValue = (
dsvError,
dsvValue,
dsvNan,
dsvZero,
dsvPosInf,
dsvNegInf,
dsvMin,
dsvMax);
/// handles a 128-bit decimal value
// - i.e. IEEE 754-2008 128-bit decimal floating point as used in the
// BSON Decimal128 format, i.e. betDecimal128 TBsonElementType
// - the betFloat BSON format stores a 64-bit floating point value, which
// doesn't have exact decimals, so may suffer from rounding or approximation
// - for instance, if you work with some currency values, you may store
// betDecimal128 values in MongoDB - the easiest way is to include it as a
// TBsonVariant instance, via the NumberDecimal() function
// - there is no mathematical operator/methods for Decimal128 Value Objects,
// as required by MongoDB specifications: any computation must be done
// explicitly on native language value representation (e.g. currency, TBCD or
// any BigNumber library) - use ToCurr/FromCurr or ToText/FromText to make
// the appropriate safe conversions
{$ifdef USERECORDWITHMETHODS}
TDecimal128 = record
{$else}
TDecimal128 = object
{$endif USERECORDWITHMETHODS}
public
/// the raw binary storage
Bits: TDecimal128Bits;
/// fills with the Zero value
// - note: under IEEE 754, Zero can have sign and exponents, so is not Hi=Lo=0
// - is the same as Fill(dsvZero)
procedure SetZero;
/// fills with a special value
// - dsvError or dsvValue will set dsvNan binary content
procedure SetSpecial(special: TDecimal128SpecialValue);
/// checks if the value matches one of the known special values
// - will search for dsvNan, dsvZero, dsvPosInf, dsvNegInf, dsvMin, dsvMax
function IsSpecial: TDecimal128SpecialValue;
/// fills with a 32-bit signed value
procedure FromInt32(value: integer);
/// fills with a 32-bit unsigned value
procedure FromUInt32(value: cardinal);
{$ifdef HASINLINE}inline;{$endif}
/// fills with a 64-bit signed value
procedure FromInt64(value: Int64);
/// fills with a 64-bit unsigned value
procedure FromQWord(value: QWord);
{$ifdef HASINLINE}inline;{$endif}
/// fills with a fixed decimal value, as stored in currency
// - will store the content with explictly four decimals, as in currency
// - by design, this method is very fast and accurate
procedure FromCurr(const value: currency);
/// fills from the text representation of a decimal value
// - returns dsvValue or one of the dsvNan, dsvZero, dsvPosInf, dsvNegInf
// special value indicator otherwise on succes
// - returns dsvError on parsing failure
function FromText(text: PUtf8Char; textlen: integer): TDecimal128SpecialValue; overload;
/// fills from the text representation of a decimal value
// - returns dsvValue or one of the dsvNan, dsvZero, dsvPosInf, dsvNegInf
// special value indicator otherwise on succes
// - returns dsvError on parsing failure
function FromText(const text: RawUtf8): TDecimal128SpecialValue; overload;
/// convert a variant into one Decimal128 value
// - will first check for a TBsonVariant containing a betDecimal128 (e.g.
// as retrieved via the ToVariant method)
// - will recognize currency and VariantToInt64() stored values
// - then will try to convert the variant from its string value, expecting
// a floating-point text content
// - returns TRUE if conversion was made, FALSE on any error
function FromVariant(const value: variant): boolean;
/// fills with a native floating-point value
// - note that it doesn't make much sense to use this method: you should
// rather use the native betFloat BSON format, with native double precision
// - this method is just a wrapper around ExtendedToShort and ToText,
// so you should provide the expected precision, from the actual storage
// variable (you may specify e.g. SINGLE_PRECISION or EXTENDED_PRECISION if
// you don't use a double kind of value)
function FromFloat(const value: TSynExtended; precision: integer = 0): boolean;
/// fast bit-per-bit value comparison
function Equals(const other: TDecimal128): boolean;
{$ifdef HASINLINE}inline;{$endif}
/// converts the value to its string representation
// - returns the number of AnsiChar written to Buffer
function ToText(out Buffer: TDecimal128Str): integer; overload;
/// converts this Decimal128 value to its string representation
function ToText: RawUtf8; overload;
/// converts this Decimal128 value to its string representation
procedure ToText(var result: RawUtf8); overload;
/// convert this Decimal128 value to its TBsonVariant custom variant value
function ToVariant: variant; overload;
/// convert this Decimal128 value to its TBsonVariant custom variant value
procedure ToVariant(out Result: variant); overload;
/// converts this Decimal128 value to a floating-point value
// - by design, some information may be lost during conversion
// - note that it doesn't make much sense to use this method: you should
// rather use the native betFloat BSON format, with native double precision
function ToFloat: TSynExtended;
/// converts this Decimal128 value to a fixed decimal value
// - by design, some information may be lost during conversion, unless the
// value has been stored previously via the FromCurr() method - in this
// case, conversion is immediate and accurate
function ToCurr: currency; overload;
{$ifdef HASINLINE}inline;{$endif}
/// converts this Decimal128 value to a fixed decimal value
// - by design, some information may be lost during conversion, unless the
// value has been stored previously via the FromCurr() method - in this
// case, conversion is immediate and accurate
procedure ToCurr(out result: currency); overload;
/// converts this Decimal128 value to its string representation
procedure AddText(W: TJsonWriter);
end;
/// points to a 128-bit decimal value
PDecimal128 = ^TDecimal128;
const
/// the textual representation of the TDecimal128 special values
DECIMAL128_SPECIAL_TEXT: array[TDecimal128SpecialValue] of RawUtf8 = (
'', // dsvError
'', // dsvValue
'NaN', // dsvNan
'0', // dsvZero
'Infinity', // dsvPosInf
'-Infinity', // dsvNegInf
'-9.999999999999999999999999999999999E+6144', // dsvMin
'9.999999999999999999999999999999999E+6144'); // dsvMax
BSON_DECIMAL128_HI_NAN = $7c00000000000000;
BSON_DECIMAL128_HI_INT64POS = $3040000000000000; // 0 fixed decimals
BSON_DECIMAL128_HI_INT64NEG = $b040000000000000;
BSON_DECIMAL128_HI_CURRPOS = $3038000000000000; // 4 fixed decimals
BSON_DECIMAL128_HI_CURRNEG = $b038000000000000;
BSON_DECIMAL128_EXPONENT_MAX = 6111;
BSON_DECIMAL128_EXPONENT_MIN = -6176;
BSON_DECIMAL128_EXPONENT_BIAS = 6176;
BSON_DECIMAL128_MAX_DIGITS = 34;
/// ready-to-be displayed text of a TDecimal128SpecialValue
function ToText(spec: TDecimal128SpecialValue): PShortString; overload;
{ ************ BSON ObjectID Value }
type
/// 24-bit storage, mapped as a 3 bytes buffer
// - as used fo TBsonObjectID.MachineID and TBsonObjectID.Counter
TBson24 = record
b1, b2, b3: byte;
end;
/// points to 24-bit storage, mapped as a 3 bytes buffer
PBson24 = ^TBson24;
{$A-}
/// BSON ObjectID 12-byte internal binary representation
// - in MongoDB, documents stored in a collection require a unique _id field
// that acts as a primary key: by default, it uses such a 12-byte ObjectID
// - by design, sorting by _id: ObjectID is roughly equivalent to sorting by
// creation time, so ease sharding and BTREE storage
// - in our ODM, we rather use 64-bit genuine integer identifiers (TID),
// as computed by an internal sequence or TSynUniqueIdentifierGenerator
// - match betObjectID TBsonElementType
{$ifdef USERECORDWITHMETHODS}
TBsonObjectID = record
{$else}
TBsonObjectID = object
{$endif USERECORDWITHMETHODS}
public
/// big-endian 4-byte value representing the seconds since the Unix epoch
// - time is expressed in Coordinated Universal Time (UTC), not local time
UnixCreateTime: cardinal;
/// 3-byte machine identifier
// - ComputeNew will use a hash of Executable.Host and Executable.User
MachineID: TBson24;
/// 2-byte process id
// - ComputeNew will derivate it from MainThreadID
ProcessID: word;
/// 3-byte counter, starting with a random value
// - used to avoid collision
Counter: TBson24;
/// set all internal fields to zero
procedure Init;
{$ifdef HASSAFEINLINE}inline;{$endif}
/// ObjectID content be filled with some unique values
// - this implementation is thread-safe
procedure ComputeNew;
/// convert an hexadecimal string value into one ObjectID
// - returns TRUE if conversion was made, FALSE on any error
function FromText(const Text: RawUtf8): boolean; overload;
/// convert an hexadecimal string value into one ObjectID
// - returns TRUE if conversion was made, FALSE on any error
function FromText(Text: PUtf8Char): boolean; overload;
/// convert a variant into one ObjectID
// - will first check for a TBsonVariant containing a betObjectID
// - then will try to convert the variant from its string value, expecting
// an hexadecimal text content
// - returns TRUE if conversion was made, FALSE on any error
function FromVariant(const value: variant): boolean;
/// convert this ObjectID to its hexadecimal string value
function ToText: RawUtf8; overload;
/// convert this ObjectID to its hexadecimal string value
procedure ToText(var result: RawUtf8); overload;
/// convert this ObjectID to its TBsonVariant custom variant value
function ToVariant: variant; overload;
/// convert this ObjectID to its TBsonVariant custom variant value
procedure ToVariant(var result: variant); overload;
/// returns the timestamp portion of the ObjectId() object as a TDateTime
// - time is expressed in Coordinated Universal Time (UTC), not local time
// so you can compare it to NowUtc returned time
function CreateDateTime: TDateTime;
/// compare two Object IDs
function Equal(const Another: TBsonObjectID): boolean; overload;
{$ifdef HASINLINE}inline;{$endif}
/// compare two Object IDs, the second being stored in a TBsonVariant
function Equal(const Another: variant): boolean; overload;
{$ifdef HASINLINE}inline;{$endif}
end;
/// points to a BSON ObjectID internal binary representation
PBsonObjectID = ^TBsonObjectID;
{$A+}
{ ************ TBsonVariantData / TBsonVariant Custom Variant Storage }
type
/// exception type used for BSON process
EBsonException = class(ESynException);
/// storage of a BSON binary document
// - a specific type is defined for consistency with this unit classes
// - binary content should follow the "int32 e_list #0" standard layout
TBsonDocument = RawByteString;
/// dynamic array of BSON binary document storage
TBsonDocumentDynArray = array of TBsonDocument;
/// element types for BSON internal representation
TBsonElementType = (
betEOF,
betFloat,
betString,
betDoc,
betArray,
betBinary,
betDeprecatedUndefined,
betObjectID,
betBoolean,
betDateTime,
betNull,
betRegEx,
betDeprecatedDbptr,
betJS,
betDeprecatedSymbol,
betJSScope,
betInt32,
betTimestamp,
betInt64,
betDecimal128);
/// points to an element type for BSON internal representation
PBsonElementType = ^TBsonElementType;
/// sub-types for betBinary element BSON internal representation
TBsonElementBinaryType = (
bbtGeneric,
bbtFunction,
bbtOldBinary,
bbtOldUUID,
bbtUUID,
bbtMD5,
bbtEncryptedBsonValue, { MongoDB 4.2 introduced client side encryption }
bbtCompressedBsonColumn,
bbtUser = $80);
{$A-}
/// memory structure used for some special BSON storage as variant
// - betObjectID kind will store a TBsonObjectID
// - betBinary kind will store a BLOB content as RawByteString
// - betDoc and betArray kind will store a BSON document, in its original
// binary format as RawByteString (TBsonDocument)
// - betDeprecatedDbptr, betJSScope, betTimestamp and betRegEx will store the
// raw original BSON content as RawByteString
// - betJS and betDeprecatedSymbol will store the UTF-8 encoded string
// as a RawUtf8
// - betDeprecatedUndefined or betMinKey/betMaxKey do not contain any data
// - betDecimal128 will store the TDecimal128 16 bytes binary buffer
// - warning: VBlob/VText use should match BSON_ELEMENTVARIANTMANAGED constant
TBsonVariantData = packed record
/// the variant type
VType: TVarType;
/// the kind of element stored
case VKind: TBsonElementType of
betObjectID:
(
VObjectID: TBsonObjectID;
VPaddingToVarData: array[1..SizeOf(TVarData) - SizeOf(TVarType)
- SizeOf(TBsonElementType) - SizeOf(TBsonObjectID)] of byte;);
betBinary,
betDoc,
betArray,
betRegEx,
betDeprecatedDbptr,
betTimestamp,
betJSScope,
betDecimal128:
(
/// store the raw binary content as a RawByteString (or TBsonDocument for
// betDoc/betArray, i.e. the "int32 e_list #0" standard layout)
// - you have to use RawByteString(VBlob) when accessing this field
// - e.g. for betRegEx, it will contain raw [cstring cstring] content
VBlob: pointer;);
betJS,
betDeprecatedSymbol:
(
/// store here a RawUtf8 with the associated text
// - you have to use RawUF8(VText) when accessing this field
VText: pointer;);
end;
{$A+}
/// points to memory structure used for some special BSON storage as variant
PBsonVariantData = ^TBsonVariantData;
/// define how betDoc/betArray BSON elements will be converted as variants
// - by default a TBsonVariant custom type will be returned, containing the
// raw BSON binary content of the embedded document or array
// - asDocVariantPerValue or asDocVariantPerReference could be used to
// create a tree of TDocVariant custom kind of variant, able to access
// to its nested properties via late-binding (asDocVariantPerReference being
// also much faster in some cases - but less safe - than asDocVariantPerValue)
// - asDocVariantPerValue will set JSON_[mDefault] settings:
// ! [dvoReturnNullForUnknownProperty]
// - asDocVariantPerReference will set JSON_[mFast]/JSON_FAST
// settings:
// ! [dvoValueCopiedByReference,dvoReturnNullForUnknownProperty]
// - asDocVariantInternNamesPerValue and asDocVariantInternNamesPerReference
// will include dvoInternalNames to the TDocVariant.Options
TBsonDocArrayConversion = (
asBsonVariant,
asDocVariantPerValue,
asDocVariantPerReference,
asDocVariantInternNamesPerValue,
asDocVariantInternNamesPerReference);
/// custom variant type used to store some special BSON elements
// - internal layout will follow TBsonVariantData
// - handled kind of item are complex BSON types, like betObjectID, betBinary
// or betDoc/betArray
// - it will allow conversion to/from string (and to date for ObjectID)
TBsonVariant = class(TSynInvokeableVariantType)
protected
function GetNewDoc(const BsonDoc: TBsonDocument): variant;
public
/// notify the TryJsonToVariant/ToJson abilities
constructor Create; override;
/// customization of JSON conversion into TBsonVariant kind of variants
function TryJsonToVariant(var Json: PUtf8Char; var Value: variant;
EndOfObject: PUtf8Char): boolean; override;
/// variant serialization will use modMongoStrict JSON-compatible mode
procedure ToJson(W: TJsonWriter; Value: PVarData); override;
/// variant serialization will use modMongoStrict JSON-compatible mode
/// handle type conversion
// - only types processed by now are string/OleStr/UnicodeString/date
procedure Cast(var Dest: TVarData; const Source: TVarData); override;
/// handle type conversion
// - only types processed by now are string/OleStr/UnicodeString/date
procedure CastTo(var Dest: TVarData; const Source: TVarData;
const AVarType: TVarType); override;
/// clear the instance
procedure Clear(var V: TVarData); override;
/// copy one instance
procedure Copy(var Dest: TVarData; const Source: TVarData;
const Indirect: boolean); override;
/// convert a TBsonDocument binary content into a TBsonVariant of kind
// betDoc or betArray
// - see also all BsonVariant() overloaded functions, which also create
// a TBsonVariant betDoc instance
procedure FromBsonDocument(const BsonDoc: TBsonDocument; var result: variant;
Kind: TBsonElementType = betDoc);
/// convert a BLOB binary content into a TBsonVariant of kind betBinary
// - if Bin is '', will store a NULL variant
procedure FromBinary(const Bin: RawByteString;
BinType: TBsonElementBinaryType; var result: variant);
/// convert a JSON content into a TBsonVariant of kind betDoc or betArray
// - warning: the supplied JSON buffer will be modified in-place
// - will create a plain variant value if the JSON doesn't start with [ or {
procedure FromJson(json: PUtf8Char; var result: variant);
/// returns TRUE if the supplied variant stores the supplied BSON kind of value
function IsOfKind(const V: variant; Kind: TBsonElementType): boolean;
/// returns true if holds a betArray/betDoc with no items within
function IsVoid(const V: TVarData): boolean; override;
/// retrieve a betBinary content stored in a TBsonVariant instance
// - returns TRUE if the supplied variant is a betBinary, and set the
// binary value into the supplied Blob variable
// - returns FALSE otherwise
function ToBlob(const V: Variant; var Blob: RawByteString): boolean;
/// in-place append field(s) to a TBsonVariant document instance
// - if the supplied variant is a TBsonVariant betDoc, it will add the fields
// - if the supplied variant is a TDocVariant object, V will be replaced
// by a new TBsonVariant instance including the new fields
// - otherwise a new TBsonVariant betDoc is created with the fields
procedure AddItem(var V: variant; const NameValuePairs: array of const);
/// search and extract a field name from a TBsonVariant document instance
// - if the supplied variant is a TBsonVariant betDoc, it will search for
// the supplied name, and return true and the found item as variant
// - otherwise, return false
function GetItem(const V: variant; const Name: RawUtf8;
out Value: variant; ValueAs: TBsonDocArrayConversion = asBsonVariant): boolean;
/// convert a TBsonDocument binary content into a TBsonVariant of kind betDoc
// - is the default property, so that you can write:
// ! BsonVariantType[Bson(['BSON',_Arr(['awesome',5.05, 1986])])]
// - see also all BsonVariant() overloaded functions, which also create
// a TBsonVariant betDoc instance
property NewDoc[const BsonDoc: TBsonDocument]: variant
read GetNewDoc; default;
end;
{ ************ TBsonElement / TBsonIterator for BSON Decoding }
type
/// how TBsonElement.AddMongoJson() method and AddMongoJson() and
// VariantSaveMongoJson() functions will render their JSON content
// - modNoMongo will serialize dates as ISO-8601 strings, ObjectID as
// hexadecimal string and other MongoDB special objects in WrBase64() format,
// so won't supply any additional information about its BSON content
// - modMongoStrict will follow the MongoDB Extended JSON syntax - as
// {"$oid":"...} - for valid but verbose JSON with additional BSON information
// - modMongoShell will use a syntax incompatible with JSON RFC, but more
// common to MongoDB daily use - as 'ObjectId()' or '{ field: /acme.*corp/i }'
// - modMongoStrict and modNoMongo will follow the JSON RFC specifications
// - see http://docs.mongodb.org/manual/reference/mongodb-extended-json
TMongoJsonMode = (
modNoMongo,
modMongoStrict,
modMongoShell);
{$A-}
/// data structure used during BSON binary decoding of one BSON element
// - will be retrieved by FromVariant() or FromNext()
// - see http://bsonspec.org/#/specification
// - this structure has been optimized to map the BSON binary content,
// without any temporary memory allocation (the SAX way)
{$ifdef USERECORDWITHMETHODS}
TBsonElement = record
{$else}
TBsonElement = object
{$endif USERECORDWITHMETHODS}
private
/// used internally to set the TBsonElement content, once Kind has been set
procedure FromBson(bson: PByte);
public
/// the UTF-8 encoded name of this element
Name: PUtf8Char;
/// the name length (in chars) of this element - 16-bit encoded
NameLen: word;
/// index of this element in the original sequence list
// - is correct only when the element has been reset before the parsing
// loop, e.g.:
// ! item.Index := -1; // so item.Index will count starting at 0
// ! while item.FromNext(elem.Document) do
// ! writeln(item.Index,' ',Item.Name,' ',Item.ValueBytes);
Index: integer;
/// the element type
Kind: TBsonElementType;
/// number of bytes in the BSON element
// - will include the trailing #0 for string element
ElementBytes: integer;
/// pointer to the BSON element value
// - is the raw value, without any parsing, e.g. points to a double value or
// a document: "int32 e_list #0" standard layout (same as TBsonDocument)
// - you may cast it for simple types:
// ! PDouble(Element)^ PBoolean(Element)^ PInteger(Element)^
// ! PInt64(Element)^ PBsonObjectID(Element)^ PDecimal128(Element)^
// - or use the nested Data variant record to access more complex content
// - warning: equals nil for betString/betJS after FromVariant()
Element: pointer;
/// depending on the Kind, will point to parsed complex sub-data
// - since variable records can't have properties, we nest this information
// within this main Data variable record
// - not all Kind are handled here, only any complex data
Data: record
case TBsonElementType of
betFloat,
betBoolean,
betInt32,
betDateTime,
betInt64:
(
/// this variable is not to be used directly, but for some internal
// temporary storage, e.g. with FromVariant()
// - use P*(Element)^ typecast instead
InternalStorage: Int64;);
betString,
betJS:
(
/// points to the #0 ending string
Text: PUtf8Char;
/// number of bytes in Text (excluding trailing #0)
TextLen: integer;);
betDoc,
betArray:
(
/// points to a "e_list #0" standard layout
DocList: PByte;);
betBinary:
(
/// points to the binary content
Blob: pointer;
/// number of bytes in Blob
BlobLen: integer;
/// corresponding sub-type of this Blob
BlobSubType: TBsonElementBinaryType;);
betRegEx:
(RegEx: PUtf8Char;
RegExLen: integer;
RegExOptions: PUtf8Char;
RegExOptionsLen: integer;);
betJSScope:
(JavaScript: PUtf8Char;
JavaScriptLen: integer;
ScopeDocument: PByte;);
betTimestamp:
({ map InternalStorage: Int64 }
time_t: cardinal;
ordinal: cardinal;);
end;
/// fill a BSON Element structure from a variant content and associated name
// - perform the reverse conversion as made with ToVariant()
// - since the result won't store any data but points to the original binary
// content, the supplied Name/Value instances should remain available as long as
// you will access to the result content
// - aName here is just for convenience, and could be left void
// - supplied aTemp variable will be used for temporary storage, private to
// this initialized TBsonElement
procedure FromVariant(const aName: RawUtf8; const aValue: Variant;
var aTemp: RawByteString);
/// fill a BSON Element structure from a TBsonVariantData value
procedure FromBsonVariant(aValue: PVarData);
{$ifdef HASINLINE} inline; {$endif}
/// fill a BSON Element structure from a BSON document
// - will check the document length then set Kind := betDoc and Data.DocList
// - will return TRUE if the supplied doc has a valid length, FALSE otherwise
// - you can later on use DocItemToVariant, DocItemToRawUtf8 or
// DocItemToInteger methods
// - the supplied "doc" variable should remain available until you are done
// with this TBsonElement wrapper
function FromDocument(const doc: TBsonDocument): boolean;
/// fill a BSON Element structure from a BSON encoded binary buffer list
// - parse the next BSON element: BSON parameter should point to the
// "e_list" of the "int32 e_list #0" BSON document
// - will decode the supplied binary buffer into the BSON element structure,
// then it will let BSON point to the next element, and return TRUE
// - returns FALSE when you reached betEOF, so that you can use it in a loop,
// and retrieve all the content as consecutive events, without any memory
// allocation (the SAX way):
// ! var bson: PByte;
// ! item: TBsonElement;
// ! ...
// ! BsonParseLength(bson);
// ! while item.FromNext(bson) do
// ! writeln(item.Name);
// - will raise an EBsonException if BSON content is not correct
// - as an alternative, consider using TBsonIterator, which wrap both a
// PByte and a TBsonElement into one convenient item
function FromNext(var BSON: PByte): boolean;
/// search for a given name in a BSON encoded binary buffer list
// - BSON parameter should point to the first "e_list" item of the
// "int32 e_list #0" BSON document
// - returns false if the item was not found (with case-insensitive search)
// - otherwise returns TRUE and the matching element content has been
// decoded within this TBsonElement structure
function FromSearch(BSON: PByte; const aName: RawUtf8): boolean;
/// convert a BSON element, as retrieved by TBsonElement.FromNext(),
// into a variant
// - it will return either standard variant values, or TBsonVariant custom type
// for most complex kind of elements (see TBsonVariantData type definition)
// - note that betString types will be stored as RawUtf8 varString
// - by default, it will return TBsonVariant custom variants for documents or
// arrays - but if storeDocArrayAsDocVariant is set, it will return a
// TDocVariant custom kind of variant, able to access to its nested
// properties via late-binding
function ToVariant(
DocArrayConversion: TBsonDocArrayConversion = asBsonVariant): variant; overload;
/// convert a BSON element, as retrieved by TBsonElement.FromNext(),
// into a variant
// - same as the other ToVariant() overloaded function, but avoiding a copy
// of the resulting variant
procedure ToVariant(var result: variant;
DocArrayConversion: TBsonDocArrayConversion = asBsonVariant); overload;
/// convert a BSON element into an UTF-8 string
// - any complex types (e.g. nested documents) will be converted via a
// variant
function ToRawUtf8: RawUtf8;
/// convert a BSON element into an integer value
// - will work only for betBoolean/betInt32/betInt64 types
// - any other kind of values will return the supplied default value
function ToInteger(const default: Int64 = 0): Int64;
/// search a variant property value within the BSON element as document
// - returns true if aName has been found as property in the BSON element,
// and fills aValue with the corresponding value
// - returns false if aName was not found, or if Kind is not betDoc or betArray
function DocItemToVariant(const aName: RawUtf8; var aValue: variant;
DocArrayConversion: TBsonDocArrayConversion = asBsonVariant): boolean;
/// search an UTF-8 property value within the BSON element as document
// - returns the value if aName has been found as property in the BSON element
// - returns '' if aName was not found, or if Kind is not betDoc or betArray
function DocItemToRawUtf8(const aName: RawUtf8): RawUtf8;
/// search an integer property value within the BSON element as document
// - returns the value if aName has been found as property in the BSON element
// - returns default if aName was not found, or if Kind is not betDoc or betArray
function DocItemToInteger(const aName: RawUtf8; const default: Int64 = 0): Int64;
/// convert a BSON element, as retrieved by TBsonElement.FromNext(), into
// its JSON representation
// - this method will use by default the MongoDB Extended JSON syntax for
// specific MongoDB objects but you may use modMongoShell if needed
// - will raise an EBsonException if element is not correct
// - returns false on success, true if MaxSize has been reached
function AddMongoJson(W: TJsonWriter; Mode: TMongoJsonMode = modMongoStrict;
MaxSize: PtrUInt = 0): boolean; overload;
end;
PBsonElement = ^TBsonElement;
/// data structure used for iterating over a BSON binary buffer
// - is just a wrapper around a PByte value, to be used with a TBsonDocument
{$ifdef USERECORDWITHMETHODS}
TBsonIterator = record
{$else}
TBsonIterator = object
{$endif USERECORDWITHMETHODS}
private
fBson: PByte;
public
/// map the current item, after the Next method did return TRUE
// - map the global document, after Init() but before the first Next call
Item: TBsonElement;
/// initialize the iteration on the supplied BSON document
// - will check the document length and returns TRUE if it is correct
// - only accepted kind are betDoc and betArray (but not used later)
// - you can then use the Next method to iterate over the Item elements
// - after this call, the Item property map to the global BSON document
// (note that after any call to the Next method, Item will map the current
// iterated value, and not the global BSON document any more)
function Init(const doc: TBsonDocument; kind: TBsonElementType = betArray): boolean;
/// will iterate on the BSON document
// - returns TRUE if the item has been retrieved into the Item property
// - returns FALSE if we reached the end of the supplied BSON buffer
function Next: boolean;
{$ifdef HASINLINE}inline;{$endif}
end;
{$A+}
{ ************ TBsonWriter for BSON Encoding }
type
/// used to write the BSON context
TBsonWriter = class(TBufferWriter)
{ note: inlining methods generates 70% SLOWER code due to inefficient compiler :( }
protected
fDocumentCount: integer;
fDocument: array of record
Offset: cardinal;
Length: cardinal;
end;
fDocumentStack: integer;
fDocumentStackOffset: TCardinalDynArray;
fDocumentArray: integer;
procedure WriteCollectionName(Flags: integer; const CollectionName: RawUtf8);
public
/// rewind the Stream to the position when Create() was called
// - this will also reset the internal document offset table
procedure CancelAll; override;
/// write an element with no value
// - elemType can be either betNull, betMinKey or betMaxKey
procedure BsonWrite(const name: RawUtf8; elemtype: TBsonElementType); overload;
/// write a boolean value
procedure BsonWrite(const name: RawUtf8; const value: boolean); overload;
/// write a floating point value
procedure BsonWrite(const name: RawUtf8; const value: Double); overload;
/// write a 32 bit integer value
procedure BsonWrite(const name: RawUtf8; const value: integer); overload;
/// write a 64 bit integer value
procedure BsonWrite(const name: RawUtf8; const value: Int64); overload;
/// write a string (UTF-8) value
procedure BsonWriteUtf8(const name, value: RawUtf8);
/// write a string, detecting TJsonWriter.AddDateTime/WrBase64 patterns
procedure BsonWriteUtf8OrDecode(const name: RawUtf8; value: PUtf8Char;
valueLen: PtrInt);
/// write a string (UTF-8) value from a memory buffer
// - if valueLen is left to its -1 default, will use StrLen(value)
procedure BsonWriteText(const name: RawUtf8; value: PUtf8Char;
valueLen: PtrInt = -1);
/// write a binary (BLOB) value
procedure BsonWrite(const name: RawUtf8; Data: pointer; DataLen: integer); overload;
/// write an ObjectID value
procedure BsonWrite(const name: RawUtf8; const value: TBsonObjectID); overload;
/// write a RegEx value
procedure BsonWriteRegEx(const name: RawUtf8; const RegEx, Options: RawByteString);
/// write a data/time value
procedure BsonWriteDateTime(const name: RawUtf8; const value: TDateTime);
/// write an element with no value
procedure BsonWrite(const name: RawUtf8; const elem: TBsonElement); overload;
/// write a BsonVariant instance value
procedure BsonWrite(const name: RawUtf8; const bson: TBsonVariantData); overload;
/// write a DocVariant instance value
procedure BsonWrite(const name: RawUtf8; const doc: TDocVariantData); overload;
/// write a TDecimal128 value
procedure BsonWrite(const name: RawUtf8; const value: TDecimal128); overload;
/// write a variant value
// - handle simple types (numbers, strings...) and custom types (TDocVariant
// and TBsonVariant, trying a translation to JSON for other custom types)
procedure BsonWriteVariant(const name: RawUtf8; const value: variant); overload;
/// write an open array (const Args: array of const) argument
// - handle simple types (numbers, strings...) and custom types (TDocVariant)
procedure BsonWrite(const name: RawUtf8; const value: TVarRec); overload;
/// write a value from the supplied JSON content
// - is able to handle any kind of values, including nested documents or
// BSON extended syntax (if DoNotTryExtendedMongoSyntax=false)
// - this method is used recursively by BsonWriteDocFromJson(), and should
// not be called directly
// - will return JSON=nil in case of unexpected error in the supplied JSON
procedure BsonWriteFromJson(const name: RawUtf8; var Json: PUtf8Char;
EndOfObject: PUtf8Char; DoNotTryExtendedMongoSyntax: boolean = false);
/// recursive writing of a BSON document or value from a TDocVariant
// object or array, used e.g. by Bson(const doc: TDocVariantData) function
// - caller should execute BsonAdjustDocumentsSize() on the resulting buffer
// - this method will call BsonDocumentBegin/BsonDocumentEnd internally
// - will raise an EBsonException if doc is not a valid TDocVariant or null
// or if the resulting binary content is bigger than BSON_MAXDOCUMENTSIZE
procedure BsonWriteDoc(const doc: TDocVariantData); overload;
/// write a BSON document stored in a TDocVariant or a TBsonVariant
procedure BsonWriteDoc(const doc: variant); overload;
/// write an object specified as name/value pairs as a BSON document
// - data must be supplied two by two, as Name,Value pairs, e.g.
// ! aBsonWriter.BsonWriteObject(['name','John','year',1972]);
// - this method wil be faster than using a BsonWriteDoc(_ObjFast(...))
procedure BsonWriteObject(const NameValuePairs: array of const);
/// write a projection specified as fieldname:1 pairs as a BSON document
procedure BsonWriteProjection(const FieldNamesCsv: RawUtf8);
/// write an object as query parameter
// - will handle all SQL operators, including IN (), IS NULL or LIKE
// - see @http://docs.mongodb.org/manual/reference/operator/query
// - inverted should be TRUE e.g. for a NOT ... expression
// - returns TRUE on success, FALSE if the operator is not implemented yet
function BsonWriteQueryOperator(name: RawUtf8; inverted: boolean;
op: TSelectStatementOperator; const Value: variant): boolean;
/// write one array item, i.e. the ASCII index name as text
// - only one level of array should be used per TBsonWriter class
procedure BsonWriteArray(const kind: TBsonElementType); overload;
/// write an array specified as a list of items as a BSON document
// - data must be supplied as a list of values e.g.
// ! aBsonWriter.BsonWriteArray(['John',1972]);
// - this method wil be faster than using a BsonWriteDoc(_ArrFast(...))
procedure BsonWriteArray(const Items: array of const); overload;
/// write an array of integers as a BSON Document
procedure BsonWriteArrayOfInteger(const Integers: array of integer);
/// write an array of integers as a BSON Document
procedure BsonWriteArrayOfInt64(const Integers: array of Int64);
/// write some BSON document from a supplied (extended) JSON array or object
// - warning: the incoming JSON buffer will be modified in-place: so you
// should make a private copy before running this method (see e.g. TSynTempBuffer)
// - will handle only '{ ... }', '[ ... ]' or 'null' input, with the standard
// strict JSON format, or BSON-like extensions, e.g. unquoted field names:
// $ {id:10,doc:{name:"John",birthyear:1972}}
// - if DoNotTryExtendedMongoSyntax is default FALSE, then the MongoDB Shell
// syntax will also be recognized to create BSON custom types, like
// $ new Date() ObjectId() MinKey MaxKey /<jRegex>/<jOptions>
// see @http://docs.mongodb.org/manual/reference/mongodb-extended-json
// $ {id:new ObjectId(),doc:{name:"John",date:ISODate()}}
// $ {name:"John",field:/acme.*corp/i}
// - if DoNotTryExtendedMongoSyntax is TRUE, process may be slightly faster
// - will create the BSON binary without any temporary TDocVariant storage
function BsonWriteDocFromJson(Json: PUtf8Char; aEndOfObject: PUtf8Char;
out Kind: TBsonElementType; DoNotTryExtendedMongoSyntax: boolean = false): PUtf8Char;
/// to be called before a BSON document will be written
// - each BsonDocumentBegin should be followed by its nested BsonDocumentEnd
procedure BsonDocumentBegin; overload; virtual;
/// to be called before a BSON document will be written
// - each BsonDocumentBegin should be followed by its nested BsonDocumentEnd
// - you could create a new BSON object by specifying a name and its
// type, i.e. either betDoc or betArray
procedure BsonDocumentBegin(const name: RawUtf8;
kind: TBsonElementType = betDoc); overload;
/// to be called before a BSON document will be written in an array
// - only one level of array should be used per TBsonWriter class
procedure BsonDocumentBeginInArray(const name: RawUtf8;
kind: TBsonElementType = betDoc);
/// to be called when a BSON document has been written
// - it will store the current stream position into an internal array,
// which will be written when you call AdjustDocumentsSize()
// - you can optional specify how many nested documents should be closed,
// and/or if it should not write an ending betEof item
procedure BsonDocumentEnd(CloseNumber: integer = 1;
WriteEndingZero: boolean = true); virtual;
/// after all content has been written, call this method on the resulting
// memory buffer to store all document size as expected by the standard
procedure BsonAdjustDocumentsSize(BSON: PByteArray); virtual;
/// flush the content and return the whole binary encoded stream
// - call BsonAdjustDocumentsSize() to adjust all internal document sizes
// - expect the TBsonWriter instance to have been created as such:
// ! TBsonWriter.Create(TRawByteStringStream) or Create(tmp)
procedure ToBsonDocument(var result: TBsonDocument); virtual;
/// flush the content and return the whole document as a TBsonVariant
// - call ToBsonDocument() to adjust all internal document sizes
// - expect the TBsonWriter instance to have been created as such:
// ! TBsonWriter.Create(TRawByteStringStream) or Create(tmp)
procedure ToBsonVariant(var result: variant; Kind: TBsonElementType = betDoc);
end;
{ ************ High-Level BSON/JSON Function Helpers }
const
/// fake BSON element type which compares lower than all other possible values
// - element type sounds to be stored as shortint, so here $ff=-1<0=betEOF
// - defined as an integer to circumvent a compilation issue with FPC trunk
betMinKey = $ff;
/// fake BSON element type which compares higher than all other possible values
// - element type sounds to be stored as shortint, so here betInt64=$12<$7f
// - defined as an integer to circumvent a compilation issue with FPC trunk
betMaxKey = $7f;
/// kind of elements which will store a RawByteString/RawUtf8 content
// within its TBsonVariant kind
// - i.e. TBsonVariantData.VBlob/VText field is to be managed
BSON_ELEMENTVARIANTMANAGED =
[betBinary, betDoc, betArray, betRegEx, betDeprecatedDbptr, betTimestamp,
betJSScope, betJS, betDeprecatedSymbol, betDecimal128];
/// by definition, maximum MongoDB document size is 16 MB
BSON_MAXDOCUMENTSIZE = 16 * 1024 * 1024;
/// special JSON string content which will be used to store a betDeprecatedUndefined item
// - *[false] is for strict JSON, *[true] for MongoDB Extended JSON
BSON_JSON_UNDEFINED: array[boolean] of string[23] = (
'{"$undefined":true}',
'undefined');
/// special JSON string content which will be used to store a betMinKey item
// - *[false] is for strict JSON, *[true] for MongoDB Extended JSON
BSON_JSON_MINKEY: array[boolean] of string[15] = (
'{"$minKey":1}',
'MinKey');
/// special JSON string content which will be used to store a betMaxKey item
// - *[false] is for strict JSON, *[true] for MongoDB Extended JSON
BSON_JSON_MAXKEY: array[boolean] of string[15] = (
'{"$maxKey":1}',
'MaxKey');
/// special JSON patterns which will be used to format a betObjectID item
// - *[false,*] is to be written before the hexadecimal ID, *[true,*] after
BSON_JSON_OBJECTID: array[boolean, TMongoJsonMode] of string[15] = (
('"', '{"$oid":"', 'ObjectId("'),
('"', '"}', '")'));
/// special JSON patterns which will be used to format a betBinary item
// - *[false,*] is for strict JSON, *[true,*] for MongoDB Extended JSON
BSON_JSON_BINARY: array[boolean, boolean] of string[15] = (
('{"$binary":"', '","$type":"'),
('BinData(', ',"'));
/// special JSON string content which will be used to store a betDeprecatedDbptr
// - *[false,*] is for strict JSON, *[true,*] for MongoDB Extended JSON
// - (not used by now for this deprecated content)
BSON_JSON_DBREF: array[boolean, 0..2] of string[15] = (
('{"$ref":"', '","$id":"', '"}'),
('DBRef("', '","', '")'));
/// special JSON string content which will be used to store a betRegEx
BSON_JSON_REGEX: array[0..2] of string[15] = (
'{"$regex":"', '","$options":"', '"}');
/// special JSON patterns which will be used to format a betDateTime item
// - *[*,false] is to be written before the date value, *[*,true] after
BSON_JSON_DATE: array[TMongoJsonMode, boolean] of string[15] = (
('"', '"'),
('{"$date":"', '"}'),
('ISODate("', '")'));
/// special JSON patterns which will be used to format a betDecimal128 item
// - *[false,*] is to be written before the decimal value, *[true,*] after
BSON_JSON_DECIMAL: array[boolean, TMongoJsonMode] of string[23] = (
('"', '{"$numberDecimal":"', 'NumberDecimal("'), ('"', '"}', '")'));
var
/// global TCustomVariantType used to register BSON variant types
// - if you use this unit, both TDocVariant and TBsonVariant custom types
// will be registered, since they are needed for any MongoDB / BSON process
BsonVariantType: TBsonVariant;
/// ready-to-be displayed text of a TBsonElementType value
function ToText(kind: TBsonElementType): PShortString; overload;
/// create a TBsonVariant custom variant type containing a BSON Object ID
// - will be filled with some unique values, ready to create a new document key
// - will store a BSON element of betObjectID kind
function ObjectID: variant; overload;
/// create a TBsonVariant Object ID custom variant type from a supplied text
// - will raise an EBsonException if the supplied text is not valid hexadecimal
// - will set a BSON element of betObjectID kind
function ObjectID(const Hexa: RawUtf8): variant; overload;
/// convert a TBsonVariant Object ID custom variant into a TBsonObjectID
// - raise an exception if the supplied variant is not a TBsonVariant Object ID
function BsonObjectID(const aObjectID: variant): TBsonObjectID;
/// create a TBsonVariant JavaScript custom variant type from a supplied code