/usr/lib/python2.7/dist-packages/happybase/batch.py is in python-happybase 0.7-1build1.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 | """
HappyBase Batch module.
"""
from collections import defaultdict
import logging
from numbers import Integral
from .hbase.ttypes import BatchMutation, Mutation
logger = logging.getLogger(__name__)
class Batch(object):
"""Batch mutation class.
This class cannot be instantiated directly; use :py:meth:`Table.batch`
instead.
"""
def __init__(self, table, timestamp=None, batch_size=None,
transaction=False, wal=True):
"""Initialise a new Batch instance."""
if not (timestamp is None or isinstance(timestamp, Integral)):
raise TypeError("'timestamp' must be an integer or None")
if batch_size is not None:
if transaction:
raise TypeError("'transaction' cannot be used when "
"'batch_size' is specified")
if not batch_size > 0:
raise ValueError("'batch_size' must be > 0")
self._table = table
self._batch_size = batch_size
self._timestamp = timestamp
self._transaction = transaction
self._wal = wal
self._families = None
self._reset_mutations()
def _reset_mutations(self):
"""Reset the internal mutation buffer."""
self._mutations = defaultdict(list)
self._mutation_count = 0
def send(self):
"""Send the batch to the server."""
bms = [BatchMutation(row, m) for row, m in self._mutations.iteritems()]
if not bms:
return
logger.debug("Sending batch for '%s' (%d mutations on %d rows)",
self._table.name, self._mutation_count, len(bms))
if self._timestamp is None:
self._table.connection.client.mutateRows(self._table.name, bms, {})
else:
self._table.connection.client.mutateRowsTs(
self._table.name, bms, self._timestamp, {})
self._reset_mutations()
#
# Mutation methods
#
def put(self, row, data, wal=None):
"""Store data in the table.
See :py:meth:`Table.put` for a description of the `row`, `data`,
and `wal` arguments. The `wal` argument should normally not be
used; its only use is to override the batch-wide value passed to
:py:meth:`Table.batch`.
"""
if wal is None:
wal = self._wal
self._mutations[row].extend(
Mutation(
isDelete=False,
column=column,
value=value,
writeToWAL=wal)
for column, value in data.iteritems())
self._mutation_count += len(data)
if self._batch_size and self._mutation_count >= self._batch_size:
self.send()
def delete(self, row, columns=None, wal=None):
"""Delete data from the table.
See :py:meth:`Table.put` for a description of the `row`, `data`,
and `wal` arguments. The `wal` argument should normally not be
used; its only use is to override the batch-wide value passed to
:py:meth:`Table.batch`.
"""
# Work-around Thrift API limitation: the mutation API can only
# delete specified columns, not complete rows, so just list the
# column families once and cache them for later use by the same
# batch instance.
if columns is None:
if self._families is None:
self._families = self._table._column_family_names()
columns = self._families
if wal is None:
wal = self._wal
self._mutations[row].extend(
Mutation(isDelete=True, column=column, writeToWAL=wal)
for column in columns)
self._mutation_count += len(columns)
if self._batch_size and self._mutation_count >= self._batch_size:
self.send()
#
# Context manager methods
#
def __enter__(self):
"""Called upon entering a ``with`` block"""
return self
def __exit__(self, exc_type, exc_value, traceback):
"""Called upon exiting a ``with`` block"""
# If the 'with' block raises an exception, the batch will not be
# sent to the server.
if self._transaction and exc_type is not None:
return
self.send()
|