Source code for redpipe.structs

# -*- coding: utf-8 -*-
"""
The Struct is a convenient way to access data in a hash.
Makes it possible to load data from redis as an object and access the fields.
Then store changes back into redis.
"""
from six import add_metaclass
from json.encoder import JSONEncoder
from functools import wraps
from .pipelines import autoexec
from .keyspaces import Hash
from .fields import TextField
from .exceptions import InvalidOperation
from .futures import Future, IS

__all__ = ['Struct']


class StructMeta(type):
    """
    Data binding of a redpipe.Hash to the core of the Struct object.
    Creates it dynamically on class construction.
    uses the keyspace and connection fields
    Meta Classes are strange beasts.
    """

    def __new__(mcs, name, bases, d):
        if name in ['Struct'] and d.get('__module__', '') == 'redpipe.structs':
            return type.__new__(mcs, name, bases, d)

        class StructHash(Hash):
            keyspace = d.get('keyspace', name)
            connection = d.get('connection', None)
            fields = d.get('fields', {})
            keyparse = d.get('keyparse', TextField)
            valueparse = d.get('valueparse', TextField)
            memberparse = d.get('memberparse', TextField)
            keyspace_template = d.get('keyspace_template', '%s{%s}')

        d['core'] = StructHash

        return type.__new__(mcs, name, bases, d)


[docs]@add_metaclass(StructMeta)
class Struct(object):
    """
    load and store structured data in redis using OOP patterns.

    If you pass in a dictionary-like object, redpipe will write all the
    values you pass in to redis to the key you specify.

    By default, the primary key name is `_key`.
    But you should override this in your Struct with the `key_name`
    property.

    .. code-block:: python

        class Beer(redpipe.Struct):
            fields = {'name': redpipe.TextField}
            key_name = 'beer_id'

        beer = Beer({'beer_id': '1', 'name': 'Schlitz'})

    This will store the data you pass into redis.
    It will also load any additional fields to hydrate the object.
    **RedPipe** does this in the same pipelined call.

    If you need a stub record that neither loads or saves data, do:

    .. code-block:: python

        beer = Beer({'beer_id': '1'}, no_op=True)

    You can later load the fields you want using, load.

    If you pass in a string we assume it is the key of the record.
    redpipe loads the data from redis:

    .. code-block:: python

        beer = Beer('1')
        assert(beer['beer_id'] == '1')
        assert(beer['name'] == 'Schlitz')

    If you need to load a record but only specific fields, you can say so.

    .. code-block:: python

        beer = Beer('1', fields=['name'])

    This will exclude all other fields.

    **RedPipe** cares about pipelining and efficiency, so if you need to
    bundle a bunch of reads or writes together, by all means do so!

    .. code-block:: python

        beer_ids = ['1', '2', '3']
        with redpipe.pipeline() as pipe:
            beers = [Beer(i, pipe=pipe) for i in beer_ids]
        print(beers)

    This will pipeline all 3 together and load them in a single pass
    from redis.

    The following methods all accept a pipe:

    * __init__
    * update
    * incr
    * decr
    * pop
    * remove
    * clear
    * delete

    You can pass a pipeline into them to make sure that the network i/o is
    combined with another pipeline operation.
    The other methods on the object are about accessing the data
    already loaded.
    So you shouldn't need to pipeline them.


    One more thing ... suppose you are storing temporary data and you want it
    to expire after a few days. You can easily make that happen just by
    changing the object definition:

    .. code-block:: python

        class Beer(redpipe.Struct):
            fields = {'name': redpipe.TextField}
            key_name = 'beer_id'
            ttl = 24 * 60 * 60 * 3

    This makes sure that any set operations on the Struct will set the expiry
    at the same time. If the object isn't modified for more than the seconds
    specified in the ttl (stands for time-to-live), then the object will be
    expired from redis. This is useful for temporary objects.
    """
    __slots__ = ['key', '_data']
    keyspace = None
    connection = None
    key_name = '_key'
    fields = {}
    required = set()
    default_fields = 'all'  # set as 'defined', 'all', or ['a', b', 'c']
    field_attr_on = False
    ttl = None

    def __init__(self, _key_or_data, pipe=None, fields=None, no_op=False,
                 nx=False):
        """
        class constructor

        :param _key_or_data:
        :param pipe:
        :param fields:
        :param no_op: bool
        :param nx: bool
        """

        self._data = {}
        with self._pipe(pipe=pipe) as pipe:
            # first we try treat the first arg as a dictionary.
            # this is if we are passing in data to be set into the redis hash.
            # if that doesn't work, we assume it must be the name of the key.
            try:
                # force type to dict.
                # this blows up if it's a string.
                coerced = dict(_key_or_data)

                # look for the primary key in the data
                # won't work if we don't have this.
                keyname = self.key_name

                # track the primary key
                # it's the name of the key only.
                # the keyspace we defined will transform it into the full
                # name of the key.
                self.key = coerced[keyname]

                # remove it from our data set.
                # we don't write this value into redis.
                del coerced[keyname]

                # no op flag means don't write or read from the db.
                # if so, we just set the dictionary.
                # this is useful if we are cloning the object
                # or rehydrating it somehow.
                if no_op:
                    self._data = coerced
                    return

                required_found = self.required.intersection(coerced.keys())
                if len(required_found) != len(self.required):
                    raise InvalidOperation('missing required field(s): %s' %
                                           list(self.required - required_found)
                                           )

                self.update(coerced, pipe=pipe, nx=nx)

            # we wind up here if a dictionary was passed in, but it
            # didn't contain the primary key
            except KeyError:
                # can't go any further, blow up.
                raise InvalidOperation(
                    'must specify primary key when cloning a struct')

            # this is a normal case, not really exceptional.
            # If you pass in the name of the key, you wind up here.
            except (ValueError, TypeError):
                self.key = _key_or_data

            # normally we ask redis for the data from redis.
            # if the no_op flag was passed we skip it.
            if not no_op:
                self.load(fields=fields, pipe=pipe)

[docs]    def load(self, fields=None, pipe=None):
        """
        Load data from redis.
        Allows you to specify what fields to load.
        This method is also called implicitly from the constructor.

        :param fields: 'all', 'defined', or array of field names
        :param pipe: Pipeline(), NestedPipeline() or None
        :return: None
        """
        if fields is None:
            fields = self.default_fields

        if fields == 'all':
            return self._load_all(pipe=pipe)

        if fields == 'defined':
            fields = [k for k in self.fields.keys()]

        if not fields:
            return

        with self._pipe(pipe) as pipe:
            # get the list of fields.
            # it returns a numerically keyed array.
            # when that happens we match up the results
            # to the keys we requested.
            ref = self.core(pipe=pipe).hmget(self.key, fields)

            def cb():
                """
                This callback fires when the root pipeline executes.
                At that point, we hydrate the response into this object.

                :return: None
                """
                for i, v in enumerate(ref.result):
                    k = fields[i]

                    # redis will return all of the fields we requested
                    # regardless of whether or not they are set.
                    # if the value is None, it's not set in redis.
                    # Use that as a signal to remove that value from local.
                    if v is None:
                        self._data.pop(k, None)

                    # as long as the field is not the primary key,
                    # map it into the local data strucure
                    elif k != self.key_name:
                        self._data[k] = v

            # attach the callback to the pipeline.
            pipe.on_execute(cb)

    def _load_all(self, pipe=None):
        """
        Load all data from the redis hash key into this local object.

        :param pipe: optional pipeline
        :return: None
        """
        with self._pipe(pipe) as pipe:
            ref = self.core(pipe=pipe).hgetall(self.key)

            def cb():
                if not ref.result:
                    return

                for k, v in ref.result.items():
                    if k != self.key_name:
                        self._data[k] = v

            pipe.on_execute(cb)

[docs]    def incr(self, field, amount=1, pipe=None):
        """
        Increment a field by a given amount.
        Return the future

        Also update the field.

        :param field:
        :param amount:
        :param pipe:
        :return:
        """
        with self._pipe(pipe) as pipe:
            core = self.core(pipe=pipe)
            # increment the key
            new_amount = core.hincrby(self.key, field, amount)
            self._expire(pipe=pipe)

            # we also read the value of the field.
            # this is a little redundant, but otherwise we don't know exactly
            # how to format the field.
            # I suppose we could pass the new_amount through the formatter?
            ref = core.hget(self.key, field)

            def cb():
                """
                Once we hear back from redis, set the value locally
                in the object.

                :return:
                """
                self._data[field] = ref.result

            pipe.on_execute(cb)

            return new_amount

[docs]    def decr(self, field, amount=1, pipe=None):
        """
        Inverse of incr function.

        :param field:
        :param amount:
        :param pipe:
        :return: Pipeline, NestedPipeline, or None
        """
        return self.incr(field, amount * -1, pipe=pipe)

[docs]    def update(self, changes, pipe=None, nx=False):
        """
        update the data in the Struct.

        This will update the values in the underlying redis hash.
        After the pipeline executes, the changes will be reflected here
        in the local struct.
        If any values in the changes dict are None, those fields will be
        removed from redis and the instance.
        The changes should be a dictionary representing the fields to change
        and the values to change them to.
        If you pass the nx flag, only sets the fields if they don't exist yet.

        :param changes: dict
        :param pipe: Pipeline, NestedPipeline, or None
        :param nx: bool
        :return: None
        """
        if not changes:
            return

        # can't remove the primary key.
        # maybe you meant to delete the object?
        # look at delete method.
        if self.key_name in changes:
            raise InvalidOperation('cannot update the redis key')

        # sort the change set into updates and deletes.
        # the deletes are entries with None as the value.
        # updates are everything else.
        deletes = [k for k, v in changes.items() if IS(v, None)]
        updates = {k: v for k, v in changes.items() if k not in deletes}

        with self._pipe(pipe) as pipe:

            core = self.core(pipe=pipe)
            set_method = core.hsetnx if nx else core.hset

            def build(k, v):
                """
                Internal closure so we can set the field in redis and
                set up a callback to write the data into the local instance
                data once we hear back from redis.

                :param k: the member of the hash key
                :param v: the value we want to set
                :return: None
                """

                res = set_method(self.key, k, v)

                def cb():
                    """
                    Here's the callback.
                    Now that the data has been written to redis, we can
                    update the local state.

                    :return: None
                    """
                    if not nx or res == 1:
                        self._data[k] = v

                # attach the callback.
                pipe.on_execute(cb)

            # all the other stuff so far was just setup for this part
            # iterate through the updates and set up the calls to redis
            # along with the callbacks to update local state once the
            # changes come back from redis.
            for k, v in updates.items():
                build(k, v)

            # pass off all the delete operations to the remove call.
            # happens in the same pipeline.
            self.remove(deletes, pipe=pipe)
            self._expire(pipe=pipe)

[docs]    def remove(self, fields, pipe=None):
        """
        remove some fields from the struct.
        This will remove data from the underlying redis hash object.
        After the pipe executes successfully, it will also remove it from
        the current instance of Struct.

        :param fields: list or iterable, names of the fields to remove.
        :param pipe: Pipeline, NestedPipeline, or None
        :return: None
        """
        # no fields specified? It's a no op.
        if not fields:
            return

        # can't remove the primary key.
        # maybe you meant to call the delete method?
        if self.key_name in fields:
            raise InvalidOperation('cannot remove the redis key')

        removed_required_fields = self.required.intersection(fields)
        if len(removed_required_fields):
            raise InvalidOperation('cannot remove required field(s): %s'
                                   % list(removed_required_fields))

        with self._pipe(pipe) as pipe:
            # remove all the fields specified from redis.
            core = self.core(pipe=pipe)
            core.hdel(self.key, *fields)
            self._expire(pipe=pipe)

            # set up a callback to remove the fields from this local object.
            def cb():
                """
                once the data has been removed from redis,
                Remove the data here.

                :return:
                """
                for k in fields:
                    self._data.pop(k, None)

            # attach the callback.
            pipe.on_execute(cb)

[docs]    def copy(self):
        """
        like the dictionary copy method.

        :return:
        """
        return self.__class__(dict(self))

    @property
    def persisted(self):
        """
        Not certain I want to keep this around.
        Is it useful?

        :return:
        """
        return True if self._data else False

[docs]    def clear(self, pipe=None):
        """
        delete the current redis key.

        :param pipe:
        :return:
        """
        with self._pipe(pipe) as pipe:
            self.core(pipe=pipe).delete(self.key)

            def cb():
                self._data = {}

            pipe.on_execute(cb)

[docs]    def get(self, item, default=None):
        """
        works like the dict get method.

        :param item:
        :param default:
        :return:
        """
        return self._data.get(item, default)

[docs]    def pop(self, name, default=None, pipe=None):
        """
        works like the dictionary pop method.

        IMPORTANT!

        This method removes the key from redis.
        If this is not the behavior you want, first convert your
        Struct data to a dict.

        :param name:
        :param default:
        :param pipe:
        :return:
        """
        f = Future()
        with self._pipe(pipe) as pipe:
            c = self.core(pipe)
            ref = c.hget(self.key, name)
            c.hdel(self.key, name)
            self._expire(pipe=pipe)

            def cb():
                f.set(default if ref.result is None else ref.result)
                self._data.pop(name)

            pipe.on_execute(cb)

        return f

[docs]    @classmethod
    def delete(cls, keys, pipe=None):
        """
        Delete one or more keys from the Struct namespace.

        This is a class method and unlike the `clear` method,
        can be invoked without instantiating a Struct.

        :param keys: the names of the keys to remove from the keyspace
        :param pipe: Pipeline, NestedPipeline, or None
        :return: None
        """
        with cls._pipe(pipe) as pipe:
            core = cls.core(pipe)
            core.delete(*keys)

    def _expire(self, pipe=None):
        """
        delete the current redis key.

        :param pipe:
        :return:
        """
        if self.ttl:
            self.core(pipe=pipe).expire(self.key, self.ttl)

    @classmethod
    def _pipe(cls, pipe=None):
        """
        Internal method for automatically wrapping a pipeline and
        turning it into a nested pipeline with the correct connection
        and one that automatically executes as it exits the context.

        :param pipe: Pipeline, NestedPipeline or None
        :return: Pipeline or NestedPipeline
        """
        return autoexec(pipe, name=cls.connection)

    def __getitem__(self, item):
        """
        magic python method to make the object behave like a dictionary.
        You can access data like so:

        .. code-block:: python

            user = User('1')
            assert(user['name'] == 'bill')
            assert(user['_key'] == '1')

        The primary key is also included in this.
        If you have defined the name of the primary key, you use that name.
        Otherwise it defaults to `_key`.

        If the data doesn't exist in redis, it will raise a KeyError.
        I thought about making it return None, but if you want that
        behavior, use the `get` method.

        :param item: the name of the element in the dictionary
        :return: the value of the element.
        """
        if item == self.key_name:
            return self.key

        return self._data[item]

    def __delitem__(self, key):
        """
        Explicitly prevent deleting data from the object via the `del`
        command.

        .. code-block:: python

            del user['name']  # raises InvalidOperation exception!

        The reason is because I want you to use the `remove` method instead.
        That way you can pipeline the removal of the redis field with
        something else.

        Also, you probably want to avoid a scenario where you accidentally
        delete data from redis without meaning to.

        :param key: the name of the element to remove from the dict.
        :raise: InvalidOperation
        """
        tpl = 'cannot delete %s from %s indirectly. Use the delete method.'
        raise InvalidOperation(tpl % (key, self))

    def __setitem__(self, key, value):
        """
        Explicitly prevent setting data into this dictionary-like object.

        Example:

        .. code-block:: python

            user = User('1')
            user['name'] = 'Bob' # raises InvalidOperation exception

        RedPipe does not support this because you should be using the
        `update` method to change properties on the object where you can
        pipeline the operation with other calls to redis.

        It also avoids the problem where you accidentally change data
        if you were confused and thought you were just manipulating a
        regular dictionary.

        :param key: the name of the element in this pseudo dict.
        :param value: the value to set it to
        :raise: InvalidOperation
        """
        tpl = 'cannot set %s key on %s indirectly. Use the update method.'
        raise InvalidOperation(tpl % (key, self))

    def __getattr__(self, item):
        """
        magic python method -- returns fields as an attribute of the object.
        This is off by default.
        You can enable it by setting `field_attr_on = True` on
        your struct.

        Then you can access data like so:

        .. code-block:: python

            user = User('1')
            assert(user.name == 'bill')

        :param item: str
        :return: mixed
        """
        try:
            if self.field_attr_on:
                if item == self.key_name:
                    return self.key

                return self._data[item]
        except KeyError:
            if item in self.fields:
                return None

        raise AttributeError(
            "'%s' object has no attribute '%s'" % (
                self.__class__.__name__, item))

    def __setattr__(self, key, value):
        """
        magic python method to control setting attributes on the object.

        :param key:
        :param value:
        :return:
        """
        if self.field_attr_on and key in self.fields:
            tpl = 'cannot set %s.%s directly. Use the update method.'
            raise InvalidOperation(tpl % (self, key))

        if key in self.__slots__ or key in self.__dict__:
            return super(Struct, self).__setattr__(key, value)

        raise AttributeError("'%s' object has no attribute '%s'" %
                             (self.__class__.__name__, key))

    def __iter__(self):
        """
        Make the `Struct` iterable, like a dictionary.
        When you iterate on a dict, it yields the keys of the dictionary.
        Emulating the same behavior here.

        :return: generator, a list of key names in the Struct
        """
        for k in self.keys():
            yield k

    def __len__(self):
        """
        How many elements in the Struct?
        This includes all the fields returned from redis + the key.

        :return: int
        """
        return len(dict(self))

    def __contains__(self, item):
        if item == self.key_name:
            return True
        return item in self._data

[docs]    def iteritems(self):
        """
        Support for the python 2 iterator of key/value pairs.
        This includes the primary key name and value.

        Example:

        .. code-block:: python

            u = User('1')
            data = {k: v for k, v in u.iteritems()}

        Or:

        .. code-block:: python

            u = User('1')
            for k, v in u.iteritems():
                print("%s: %s" % (k, v)


        :return: generator, a list of key/value pair tuples
        """
        yield self.key_name, self.key
        for k, v in self._data.items():
            yield k, v

[docs]    def items(self):
        """
        We return the list of key/value pair tuples.
        Similar to iteritems but in list form instead of as
        a generator.
        The reason we do this is because python2 code probably expects this to
        be a list. Not sure if I could care, but just covering my bases.

        Example:

        .. code-block:: python

            u = User('1')
            data = {k: v for k, v in u.items()}

        Or:

        .. code-block:: python

            u = User('1')
            for k, v in u.items():
                print("%s: %s" % (k, v)


        :return: list, containing key/value pair tuples.
        """
        return [row for row in self.iteritems()]

    def __eq__(self, other):
        """
        Test for equality with another python object.

        Example:

        ..code-block:: python

            u = User('1')
            assert(u == {'_key': '1', 'name': 'Bob'})
            assert(u == User('1'))

        The object you pass in should be a dict or an object that can
        be coerced into a dict, like another Struct.
        Returns True if all the keys and values match up.

        :param other: can be another dictionary, or a Struct.
        :return: bool
        """
        if self is other:
            return True
        try:
            if dict(self) == dict(other):
                return True
        except (TypeError, ValueError):
            pass

        return False

[docs]    def keys(self):
        """
        Get a list of all the keys in the Struct.
        This includes the primary key name, and all the elements
        that are set into redis.

        Note: even if you define fields on the Struct, those keys won't
        be returned unless the fields are actually written into the redis
        hash.

        .. code-block:: python

            u = User('1')
            assert(u.keys() == ['_key', 'name'])


        :return: list
        """
        return [row[0] for row in self.items()]

    def __str__(self):
        """
        A simple string representation of the object.
        Contins the class name, and the primary key.
        Doesn't print out all the data.
        The reason is because there could be some really
        complex data types in there or some really big values.
        Printing that out, especially in the context of an exception
        seems like a bad idea.

        :return: str
        """
        return "<%s:%s>" % (self.__class__.__name__, self.key)

    def __repr__(self):
        """
        Emulate the behavior of a dict when it is passed to repr.

        :return: str
        """
        return repr(dict(self))

    def __getstate__(self):
        """
        Used for pickling the Struct.

        :return: tuple of key, and internal `_data`
        """
        return self.key, self._data,

    def __setstate__(self, state):
        """
        used for unplickling the Struct.

        :param state:
        :return:
        """
        self.key = state[0]
        self._data = state[1]

    @property
    def _redpipe_struct_as_dict(self):
        """
        A special namespaced property used for json encoding.
        We use duck-typing and look for this property (which no other
        type of object should have) so that we can try to json
        serialize it by coercing it into a dict.

        :return: dict
        """
        return dict(self)


def _json_default_encoder(func):
    """
    Monkey-Patch the core json encoder library.
    This isn't as bad as it sounds.
    We override the default method so that if an object
    falls through and can't be encoded normally, we see if it is
    a Future object and return the result to be encoded.

    I set a special attribute on the Struct object so I can tell
    that's what it is.

    If that doesn't work, I fall back to the earlier behavior.
    The nice thing about patching the library this way is that it
    won't inerfere with existing code and it can itself be wrapped
    by other methods.

    So it's very extensible.

    :param func: the JSONEncoder.default method.
    :return: an object that can be json serialized.
    """

    @wraps(func)
    def inner(self, o):
        try:
            return o._redpipe_struct_as_dict  # noqa
        except AttributeError:
            pass
        return func(self, o)

    return inner


JSONEncoder.default = _json_default_encoder(JSONEncoder.default)
Source code for redpipe.structs

Navigation

Related Topics