
# (file-viewer residue: 283 lines, 9.0 KiB)

# Copyright 2009-2015 MongoDB, Inc.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Tools for working with MongoDB ObjectIds."""
import binascii
import calendar
import datetime
import os
import struct
import threading
import time
from random import SystemRandom
from typing import Any, NoReturn, Optional, Type, Union
from bson.errors import InvalidId
from bson.tz_util import utc
def _raise_invalid_id(oid: str) -> NoReturn:
    """Raise :class:`~bson.errors.InvalidId` describing the rejected `oid`.

    :Parameters:
      - `oid`: the value that could not be interpreted as an ObjectId; its
        ``repr()`` is embedded in the error message.

    Always raises; never returns.
    """
    # ``!r`` renders exactly what ``"%r" % oid`` would, without the
    # %-formatting pitfall of a tuple argument being unpacked.
    raise InvalidId(
        f"{oid!r} is not a valid ObjectId, it must be a 12-byte input"
        " or a 24-character hex string"
    )
def _random_bytes() -> bytes:
"""Get the 5-byte random field of an ObjectId."""
return os.urandom(5)
# Largest value of the 3-byte counter field (the counter wraps to 0 after it).
# Defined here because the class below needs it at definition time.
_MAX_COUNTER_VALUE = 0xFFFFFF


class ObjectId:
    """A MongoDB ObjectId."""

    # PID seen when the random field was last generated; `_random` compares
    # it with the current PID to notice that we are running in a new process.
    _pid = os.getpid()

    # Process-wide counter, seeded randomly and guarded by `_inc_lock`.
    _inc = SystemRandom().randint(0, _MAX_COUNTER_VALUE)
    _inc_lock = threading.Lock()

    # 5-byte random field shared by every ObjectId generated in this process.
    __random = _random_bytes()

    # Only the 12-byte value is stored per instance.
    __slots__ = ("__id",)

    # NOTE(review): presumably the BSON element type code for ObjectId
    # (0x07) consumed by the encoder -- confirm against the bson package.
    _type_marker = 7

    def __init__(self, oid: Optional[Union[str, "ObjectId", bytes]] = None) -> None:
        """Initialize a new ObjectId.

        An ObjectId is a 12-byte unique identifier consisting of:

          - a 4-byte value representing the seconds since the Unix epoch,
          - a 5-byte random value,
          - a 3-byte counter, starting with a random value.

        By default, ``ObjectId()`` creates a new unique identifier. The
        optional parameter `oid` can be an :class:`ObjectId`, or any 12
        :class:`bytes`.

        For example, the 12 bytes b'foo-bar-quux' do not follow the ObjectId
        specification but they are acceptable input::

          >>> ObjectId(b'foo-bar-quux')
          ObjectId('666f6f2d6261722d71757578')

        `oid` can also be a :class:`str` of 24 hex digits::

          >>> ObjectId('0123456789ab0123456789ab')
          ObjectId('0123456789ab0123456789ab')

        Raises :class:`~bson.errors.InvalidId` if `oid` is not 12 bytes nor
        24 hex digits, or :class:`TypeError` if `oid` is not an accepted type.

        :Parameters:
          - `oid` (optional): a valid ObjectId.

        .. seealso:: The MongoDB documentation on ObjectIds.

        .. versionchanged:: 3.8
           :class:`~bson.objectid.ObjectId` now implements the ObjectID
           specification version 0.2.
        """
        if oid is None:
            self.__generate()
        elif isinstance(oid, bytes) and len(oid) == 12:
            # Any 12 bytes are accepted verbatim, without further checks.
            self.__id = oid
        else:
            self.__validate(oid)

    @classmethod
    def from_datetime(cls: Type["ObjectId"], generation_time: datetime.datetime) -> "ObjectId":
        """Create a dummy ObjectId instance with a specific generation time.

        This method is useful for doing range queries on a field
        containing :class:`ObjectId` instances.

        .. warning::
           It is not safe to insert a document containing an ObjectId
           generated using this method. This method deliberately
           eliminates the uniqueness guarantee that ObjectIds
           generally provide. ObjectIds generated with this method
           should be used exclusively in queries.

        `generation_time` will be converted to UTC. Naive datetime
        instances will be treated as though they already contain UTC.

        An example using this helper to get documents where ``"_id"``
        was generated before January 1, 2010 would be:

        >>> gen_time = datetime.datetime(2010, 1, 1)
        >>> dummy_id = ObjectId.from_datetime(gen_time)
        >>> result = collection.find({"_id": {"$lt": dummy_id}})

        :Parameters:
          - `generation_time`: :class:`~datetime.datetime` to be used
            as the generation time for the resulting ObjectId.
        """
        # Shift aware datetimes to UTC; naive ones are taken as UTC already.
        offset = generation_time.utcoffset()
        if offset is not None:
            generation_time = generation_time - offset
        timestamp = calendar.timegm(generation_time.timetuple())
        # 4-byte big-endian timestamp followed by 8 zero bytes in place of
        # the random and counter fields.
        oid = struct.pack(">I", int(timestamp)) + b"\x00\x00\x00\x00\x00\x00\x00\x00"
        return cls(oid)

    @classmethod
    def is_valid(cls: Type["ObjectId"], oid: Any) -> bool:
        """Checks if a `oid` string is valid or not.

        Returns ``False`` for any falsy `oid` and for any value the
        constructor rejects; ``True`` otherwise.

        :Parameters:
          - `oid`: the object id to validate

        .. versionadded:: 2.3
        """
        if not oid:
            return False

        try:
            ObjectId(oid)
            return True
        except (InvalidId, TypeError):
            return False

    @classmethod
    def _random(cls) -> bytes:
        """Generate a 5-byte random number once per process."""
        pid = os.getpid()
        if pid != cls._pid:
            # Running under a different PID than the one that produced the
            # cached value: draw a fresh random field for this process.
            cls._pid = pid
            cls.__random = _random_bytes()
        return cls.__random

    def __generate(self) -> None:
        """Generate a new value for this ObjectId."""
        # 4 bytes current time
        oid = struct.pack(">I", int(time.time()))

        # 5 bytes random
        oid += ObjectId._random()

        # 3 bytes inc
        with ObjectId._inc_lock:
            # Pack as 4 bytes big-endian and drop the most significant byte.
            oid += struct.pack(">I", ObjectId._inc)[1:4]
            ObjectId._inc = (ObjectId._inc + 1) % (_MAX_COUNTER_VALUE + 1)

        self.__id = oid

    def __validate(self, oid: Any) -> None:
        """Validate and use the given id for this ObjectId.

        Raises :class:`~bson.errors.InvalidId` if `oid` is a :class:`str`
        that is not exactly 24 hex digits, and :class:`TypeError` for any
        value that is neither a :class:`str` nor an :class:`ObjectId`
        (12-byte :class:`bytes` are accepted by ``__init__`` before this
        method is reached).

        :Parameters:
          - `oid`: a valid ObjectId
        """
        if isinstance(oid, ObjectId):
            self.__id = oid.binary
        elif isinstance(oid, str):
            if len(oid) == 24:
                try:
                    self.__id = bytes.fromhex(oid)
                except (TypeError, ValueError):
                    _raise_invalid_id(oid)
            else:
                _raise_invalid_id(oid)
        else:
            raise TypeError(f"id must be an instance of (bytes, str, ObjectId), not {type(oid)}")

    @property
    def binary(self) -> bytes:
        """12-byte binary representation of this ObjectId."""
        return self.__id

    @property
    def generation_time(self) -> datetime.datetime:
        """A :class:`datetime.datetime` instance representing the time of
        generation for this :class:`ObjectId`.

        The :class:`datetime.datetime` is timezone aware, and
        represents the generation time in UTC. It is precise to the
        second.
        """
        timestamp = struct.unpack(">I", self.__id[0:4])[0]
        return datetime.datetime.fromtimestamp(timestamp, utc)

    def __getstate__(self) -> bytes:
        """Return value of object for pickling.

        needed explicitly because __slots__() defined.
        """
        return self.__id

    def __setstate__(self, value: Any) -> None:
        """Explicit state set from pickling"""
        # Provide backwards compatibility with OIDs
        # pickled with pymongo-1.9 or older.
        if isinstance(value, dict):
            oid = value["_ObjectId__id"]
        else:
            oid = value
        # ObjectIds pickled in python 2.x used `str` for __id.
        # In python 3.x this has to be converted to `bytes`
        # by encoding latin-1.
        if isinstance(oid, str):
            self.__id = oid.encode("latin-1")
        else:
            self.__id = oid

    def __str__(self) -> str:
        """Return the 24-character lowercase hex form of the 12-byte value."""
        return binascii.hexlify(self.__id).decode()

    def __repr__(self) -> str:
        return f"ObjectId('{str(self)}')"

    # Comparisons are defined only against other ObjectIds and compare the
    # raw 12-byte values; anything else defers to the other operand.

    def __eq__(self, other: Any) -> bool:
        if isinstance(other, ObjectId):
            return self.__id == other.binary
        return NotImplemented

    def __ne__(self, other: Any) -> bool:
        if isinstance(other, ObjectId):
            return self.__id != other.binary
        return NotImplemented

    def __lt__(self, other: Any) -> bool:
        if isinstance(other, ObjectId):
            return self.__id < other.binary
        return NotImplemented

    def __le__(self, other: Any) -> bool:
        if isinstance(other, ObjectId):
            return self.__id <= other.binary
        return NotImplemented

    def __gt__(self, other: Any) -> bool:
        if isinstance(other, ObjectId):
            return self.__id > other.binary
        return NotImplemented

    def __ge__(self, other: Any) -> bool:
        if isinstance(other, ObjectId):
            return self.__id >= other.binary
        return NotImplemented

    def __hash__(self) -> int:
        """Get a hash value for this :class:`ObjectId`."""
        return hash(self.__id)