Skip to content

Commit

Permalink
MongoDB: Fixed BSON decoding of {"$date": 1180690093000} timestamps
Browse files: browse the repository at this point in the history
  • Loading branch information
amotl committed Oct 9, 2024
1 parent 502619b commit 865b733
Show file tree
Hide file tree
Showing 3 changed files with 19 additions and 10 deletions.
1 change: 1 addition & 0 deletions CHANGES.md
Original file line number Diff line number Diff line change
@@ -1,6 +1,7 @@
# Changelog

## Unreleased
- MongoDB: Fixed BSON decoding of `{"$date": 1180690093000}` timestamps

## 2024/09/30 v0.0.20
- DynamoDB: Change CrateDB data model to use (`pk`, `data`, `aux`) columns
Expand Down
18 changes: 10 additions & 8 deletions src/commons_codec/transform/mongodb.py
Original file line number Diff line number Diff line change
Expand Up @@ -121,15 +121,17 @@ def decode_extended_json(self, value: t.Dict[str, t.Any]) -> t.Any:

# Special handling for datetime representation in NUMBERLONG format (emulated depth-first).
type_ = next(iter(value)) # Get key of first item in dictionary.
is_date_numberlong = type_ == "$date" and "$numberLong" in value["$date"]
if is_date_numberlong:
try:
out = dt.datetime.fromtimestamp(int(value["$date"]["$numberLong"]) / 1000, tz=dt.timezone.utc)
except ValueError as ex:
logger.error(f"Decoding legacy timestamp failed: {ex}. value={value}")
out = 0
else:
if type_ == "$date" and isinstance(value["$date"], dict):
value = {"$date": int(value["$date"]["$numberLong"])}

# Invoke BSON decoder.
try:
out = object_hook(value)
except bson.errors.InvalidBSON as ex:
logger.error(f"Decoding BSON value failed: {ex}. value={value}")
out = None
if "Python int too large to convert to C int" in str(ex):
out = 0

is_bson = isinstance(out, all_bson_types())

Expand Down
10 changes: 8 additions & 2 deletions tests/transform/mongodb/test_mongodb_convert.py
Original file line number Diff line number Diff line change
Expand Up @@ -104,7 +104,7 @@ class DateConversionCase:
DateConversionCase(
converter=MongoDBCrateDBConverter(),
data_in={"$date": {"$numberLong": "1655210544987"}},
data_out=dt.datetime(2022, 6, 14, 12, 42, 24, 987000, tzinfo=dt.timezone.utc),
data_out=dt.datetime(2022, 6, 14, 12, 42, 24, 987000),
),
DateConversionCase(
converter=MongoDBCrateDBConverter(timestamp_to_epoch=True, timestamp_use_milliseconds=True),
Expand All @@ -124,7 +124,12 @@ class DateConversionCase:
DateConversionCase(
converter=MongoDBCrateDBConverter(timestamp_to_iso8601=True),
data_in={"$date": {"$numberLong": "1655210544987"}},
data_out="2022-06-14T12:42:24.987000+00:00",
data_out="2022-06-14T12:42:24.987000",
),
DateConversionCase(
converter=MongoDBCrateDBConverter(timestamp_to_iso8601=True),
data_in={"$date": 1180690093000},
data_out="2007-06-01T09:28:13",
),
]

Expand All @@ -136,6 +141,7 @@ class DateConversionCase:
"epochms-$date-legacy",
"iso8601-$date-canonical",
"iso8601-$date-legacy",
"iso8601-$date-ultra-legacy",
]


Expand Down

0 comments on commit 865b733

Please sign in to comment.