* Examples work * setup.py kinda updasted * Fork of txmongo but with new pymongo embedded
244 lines
8.2 KiB
Python
244 lines
8.2 KiB
Python
# Copyright 2009-2012 10gen, Inc.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
|
|
"""Tools for creating and manipulating SON, the Serialized Ocument Notation.
|
|
|
|
Regular dictionaries can be used instead of SON objects, but not when the order
|
|
of keys is important. A SON object can be used just like a normal Python
|
|
dictionary."""
|
|
|
|
import copy
|
|
import re
|
|
|
|
# This sort of sucks, but seems to be as good as it gets...
|
|
# This is essentially the same as re._pattern_type
|
|
RE_TYPE = type(re.compile(""))
|
|
|
|
|
|
class SON(dict):
|
|
"""SON data.
|
|
|
|
A subclass of dict that maintains ordering of keys and provides a
|
|
few extra niceties for dealing with SON. SON objects can be
|
|
converted to and from asyncio_mongo._bson.
|
|
|
|
The mapping from Python types to BSON types is as follows:
|
|
|
|
=================================== ============= ===================
|
|
Python Type BSON Type Supported Direction
|
|
=================================== ============= ===================
|
|
None null both
|
|
bool boolean both
|
|
int [#int]_ int32 / int64 py -> bson
|
|
long int64 both
|
|
float number (real) both
|
|
string string py -> bson
|
|
unicode string both
|
|
list array both
|
|
dict / `SON` object both
|
|
datetime.datetime [#dt]_ [#dt2]_ date both
|
|
compiled re regex both
|
|
`bson.binary.Binary` binary both
|
|
`bson.objectid.ObjectId` oid both
|
|
`bson.dbref.DBRef` dbref both
|
|
None undefined bson -> py
|
|
unicode code bson -> py
|
|
`bson.code.Code` code py -> bson
|
|
unicode symbol bson -> py
|
|
bytes (Python 3) [#bytes]_ binary both
|
|
=================================== ============= ===================
|
|
|
|
Note that to save binary data it must be wrapped as an instance of
|
|
`bson.binary.Binary`. Otherwise it will be saved as a BSON string
|
|
and retrieved as unicode.
|
|
|
|
.. [#int] A Python int will be saved as a BSON int32 or BSON int64 depending
|
|
on its size. A BSON int32 will always decode to a Python int. In Python 2.x
|
|
a BSON int64 will always decode to a Python long. In Python 3.x a BSON
|
|
int64 will decode to a Python int since there is no longer a long type.
|
|
.. [#dt] datetime.datetime instances will be rounded to the nearest
|
|
millisecond when saved
|
|
.. [#dt2] all datetime.datetime instances are treated as *naive*. clients
|
|
should always use UTC.
|
|
.. [#bytes] The bytes type from Python 3.x is encoded as BSON binary with
|
|
subtype 0. In Python 3.x it will be decoded back to bytes. In Python 2.x
|
|
it will be decoded to an instance of :class:`~bson.binary.Binary` with
|
|
subtype 0.
|
|
"""
|
|
|
|
def __init__(self, data=None, **kwargs):
|
|
self.__keys = []
|
|
dict.__init__(self)
|
|
self.update(data)
|
|
self.update(kwargs)
|
|
|
|
def __new__(cls, *args, **kwargs):
|
|
instance = super(SON, cls).__new__(cls, *args, **kwargs)
|
|
instance.__keys = []
|
|
return instance
|
|
|
|
def __repr__(self):
|
|
result = []
|
|
for key in self.__keys:
|
|
result.append("(%r, %r)" % (key, self[key]))
|
|
return "SON([%s])" % ", ".join(result)
|
|
|
|
def __setitem__(self, key, value):
|
|
if key not in self:
|
|
self.__keys.append(key)
|
|
dict.__setitem__(self, key, value)
|
|
|
|
def __delitem__(self, key):
|
|
self.__keys.remove(key)
|
|
dict.__delitem__(self, key)
|
|
|
|
def keys(self):
|
|
return list(self.__keys)
|
|
|
|
def copy(self):
|
|
other = SON()
|
|
other.update(self)
|
|
return other
|
|
|
|
# TODO this is all from UserDict.DictMixin. it could probably be made more
|
|
# efficient.
|
|
# second level definitions support higher levels
|
|
def __iter__(self):
|
|
for k in list(self.keys()):
|
|
yield k
|
|
|
|
def has_key(self, key):
|
|
return key in list(self.keys())
|
|
|
|
def __contains__(self, key):
|
|
return key in list(self.keys())
|
|
|
|
# third level takes advantage of second level definitions
|
|
def iteritems(self):
|
|
for k in self:
|
|
yield (k, self[k])
|
|
|
|
def iterkeys(self):
|
|
return self.__iter__()
|
|
|
|
# fourth level uses definitions from lower levels
|
|
def itervalues(self):
|
|
for _, v in self.items():
|
|
yield v
|
|
|
|
def values(self):
|
|
return [v for _, v in self.items()]
|
|
|
|
def items(self):
|
|
return [(key, self[key]) for key in self]
|
|
|
|
def clear(self):
|
|
for key in list(self.keys()):
|
|
del self[key]
|
|
|
|
def setdefault(self, key, default=None):
|
|
try:
|
|
return self[key]
|
|
except KeyError:
|
|
self[key] = default
|
|
return default
|
|
|
|
def pop(self, key, *args):
|
|
if len(args) > 1:
|
|
raise TypeError("pop expected at most 2 arguments, got "\
|
|
+ repr(1 + len(args)))
|
|
try:
|
|
value = self[key]
|
|
except KeyError:
|
|
if args:
|
|
return args[0]
|
|
raise
|
|
del self[key]
|
|
return value
|
|
|
|
def popitem(self):
|
|
try:
|
|
k, v = next(iter(self.items()))
|
|
except StopIteration:
|
|
raise KeyError('container is empty')
|
|
del self[k]
|
|
return (k, v)
|
|
|
|
def update(self, other=None, **kwargs):
|
|
# Make progressively weaker assumptions about "other"
|
|
if other is None:
|
|
pass
|
|
elif hasattr(other, 'iteritems'): # iteritems saves memory and lookups
|
|
for k, v in other.items():
|
|
self[k] = v
|
|
elif hasattr(other, 'keys'):
|
|
for k in list(other.keys()):
|
|
self[k] = other[k]
|
|
else:
|
|
for k, v in other:
|
|
self[k] = v
|
|
if kwargs:
|
|
self.update(kwargs)
|
|
|
|
def get(self, key, default=None):
|
|
try:
|
|
return self[key]
|
|
except KeyError:
|
|
return default
|
|
|
|
def __eq__(self, other):
|
|
"""Comparison to another SON is order-sensitive while comparison to a
|
|
regular dictionary is order-insensitive.
|
|
"""
|
|
if isinstance(other, SON):
|
|
return len(self) == len(other) and list(self.items()) == list(other.items())
|
|
return self.to_dict() == other
|
|
|
|
def __ne__(self, other):
|
|
return not self == other
|
|
|
|
def __len__(self):
|
|
return len(list(self.keys()))
|
|
|
|
def to_dict(self):
|
|
"""Convert a SON document to a normal Python dictionary instance.
|
|
|
|
This is trickier than just *dict(...)* because it needs to be
|
|
recursive.
|
|
"""
|
|
|
|
def transform_value(value):
|
|
if isinstance(value, list):
|
|
return [transform_value(v) for v in value]
|
|
if isinstance(value, SON):
|
|
value = dict(value)
|
|
if isinstance(value, dict):
|
|
for k, v in value.items():
|
|
value[k] = transform_value(v)
|
|
return value
|
|
|
|
return transform_value(dict(self))
|
|
|
|
def __deepcopy__(self, memo):
|
|
out = SON()
|
|
val_id = id(self)
|
|
if val_id in memo:
|
|
return memo.get(val_id)
|
|
memo[val_id] = out
|
|
for k, v in self.items():
|
|
if not isinstance(v, RE_TYPE):
|
|
v = copy.deepcopy(v, memo)
|
|
out[k] = v
|
|
return out
|