#!/usr/bin/env python
"""
Implementation of class Table, representing tables in the database.
"""

import logging
import locking
import subprocess
import tables
import numpy as np
import os, os.path
import sys
import json
import utils
import cPickle
import copy
import glob
import shutil
import errno
from table_catalog import TableCatalog
from utils import is_scalar_of_type
from pixelization import Pixelization
from collections import OrderedDict
from contextlib import contextmanager
from colgroup import ColGroup

logger = logging.getLogger("lsd.table")

class BLOBAtom(tables.ObjectAtom):
    """ A PyTables atom representing BLOBs

        Same as tables.ObjectAtom, except that it uses the highest
        available pickle protocol to serialize the value into a BLOB.
    """
    def _tobuffer(self, object_):
        return cPickle.dumps(object_, -1)

class ColumnType(object):
    """ Description of a column in a Table

        A simple record representing columns of a table. Built at
        runtime from _cgroups entries, and stored in Table.columns.
    """
    name    = None   #: The name of the column
    cgroup  = None   #: The name of the column's column group
    dtype   = None   #: Dtype (a numpy.dtype instance) of the column
    is_blob = False  #: True if the column is a BLOB

class Table:
    """ A spatially and temporally partitioned table.

        Instances of this object typically shouldn't be used directly, but
        queried via DB.query calls.

        This object should never be instantiated directly; always obtain
        instances through a call to DB.table(). If always instantiated via
        db.table() calls, a Table instance is unique to a given table:

        >>> a = db.table('sometable')
        >>> b = db.table('sometable')
        >>> a is b
        True
    """
    path = '.'   #: Full path to the table directory (set by controlling DB instance)
    pix  = None  #: Pixelization object for the table (initialized in __init__)

    # t0: default starting epoch (== 2pm HST, Aug 22 2007 (night of GPC1 first light))
    # td: default temporal resolution (in days)

    _nrows = 0            #: The number of rows in the table (use nrows() to access)
    _cgroups = None       #: Column groups in the table (OrderedDict of table definitions (dicts), keyed by tablename; the first table is the primary one)
    _fgroups = None       #: Map of file group name -> file group definition. File groups define where and how external blobs are stored.
    _filters = None       #: Default PyTables filters to be applied to every Leaf in the file (can be overridden on a per-tablet and per-blob basis)
    _commit_hooks = None  #: List of hooks to be called upon COMMIT

    columns = None          #: OrderedDict of ColumnType objects describing the columns in the table
    primary_cgroup = None   #: The primary cgroup of this table (IDs and spatial/temporal keys are always in the primary group)
    primary_key = None      #: A ColumnType instance for the primary_key (the unique "ID" of each row)
    spatial_keys = None     #: A tuple of two ColumnType instances, for (lon, lat). None if no spatial key exists.
    temporal_key = None     #: A ColumnType instance for the temporal key. None if no temporal key exists.

    snapid = 0            #: Snapshot ID of the opened table
    _snapshots = [ 0 ]    #: Sorted (newest to oldest) list of available, committed snapshots
    transaction = False   #: True if we're in a transaction (the current snapshot is writable)

    _default_commit_hooks = [('Updating neighbors', 0, 'lsd.tasks', 'build_neighbor_cache')]  #: Default commit hook rebuilds the neighbor cache

    remote = None
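    # On-disk layout sketch, inferred from the path helpers below (hedged; the
    # table name 'sometable' is only an illustration):
    #
    #   sometable/
    #     schema.cfg                    -- JSON schema of snapshot 0
    #     catalog.pkl                   -- tablet catalog of snapshot 0
    #     snapshots/
    #       .listing                    -- list of snapshot IDs
    #       <snapid>/
    #         .committed                -- marker: this snapshot was committed
    #         schema.cfg, catalog.pkl   -- per-snapshot metadata
    #         tablets/...               -- HDF5 tablets, one directory per cell
    #         files/<fgroup>/...        -- external files (BLOBs), per file group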
    ### Transaction/Snapshotting support
    def set_snapshot(self, snapid):
        """ Load the list of committed snapshots <= snapid

            NOTE: This may get called even before the schema is loaded
        """
        # Snapshot ID
        self.snapid = snapid

        # Check if we have a .remote set; if yes, pull all the metadata from
        # the remote
        dot_remote = '%s/.remote' % self.path
        if os.path.exists(dot_remote):
            self.remote = open(dot_remote).read().strip()

            # Fetch/update the list of snapshots
            snapshot_cat_fn = '%s/snapshots/.listing' % self.path
            self.fetch_from_remote(snapshot_cat_fn)

            # Fetch the catalogs+schemas for all snapshots
            # NOTE: we can change this to fetch the catalog only for the requested snapshot
            #       once the code below that enumerates snapshots is changed to read from
            #       the .listing file
            snapids = [ s.strip() for s in open(snapshot_cat_fn).xreadlines() if s.strip() != '' ]
            for snapid in snapids:
                local = self._snapshot_path(snapid) + '/'
                utils.mkdir_p(local)
                for fn in ['catalog.pkl', 'schema.cfg', '.committed']:
                    if str(snapid) == "0" and fn == '.committed':
                        # Backwards compatibility
                        continue
                    local_fn = local + fn
                    if not os.path.exists(local_fn):
                        self.fetch_from_remote(local_fn)

        self._snapshots = self.list_snapshots(self.snapid)

        # Sorted list of snapshots, newest first
        self._snapshots.sort(reverse=True)

    def list_snapshots(self, snapid=None):
        # Load the list of committed snapshots that are older than snapid
        snaps = [ 0 ] if os.path.exists('%s/schema.cfg' % self.path) else []
        for path in glob.iglob('%s/snapshots/*/.committed' % (self.path)):
            s = path.split('/')[-2]
            if snapid is None or s <= snapid:
                snaps.append(s)
        return snaps

    def _load_catalog(self):
        # Load the tablet cache.
        tabtreepkl = self._find_metadata_path('catalog.pkl')
        if os.path.isfile(tabtreepkl):
            self.catalog = TableCatalog(fn=tabtreepkl)
        elif os.path.isdir(os.path.join(self.path, 'tablets')) and not os.path.isdir(os.path.join(self.path, 'tablets', 'snapshots')):
            # Backwards compatibility: auto-create it for old-style (pre v0.4) tables
            assert self._snapshots[0] == 0
            print >> sys.stderr, "[%s] Updating tablet catalog:" % (self.name),
            self.rebuild_catalog(rebuild_pre_v050_snap=True)
        else:
            # A new table, opened on an uncommitted snapshot, has no saved catalog.
            # Create an empty one.
            assert len(self._snapshots) == 0
            self.catalog = TableCatalog(pix=self.pix)

    def get_cells_in_snapshot(self, snapid, include_cached=True):
        return self.catalog.get_cells_in_snapshot(snapid, include_cached=include_cached)

    def rebuild_catalog(self, rebuild_pre_v050_snap=False):
        self._check_transaction()

        # A bit of backwards compatibility for older tables
        if not rebuild_pre_v050_snap:
            snapid = self.snapid
        else:
            # Initialize an empty catalog
            snapid = 0

        # Update to the requested snapshot
        pattern = self._tablet_filename(self.primary_cgroup)
        self.catalog.update(self.path, pattern, snapid)

        # Save
        fn = os.path.join(self._snapshot_path(snapid), 'catalog.pkl')
        self.catalog.save(fn)

    def _check_transaction(self):
        if not self.transaction:
            raise Exception("Trying to modify a table without starting a transaction. This can also happen if you have multiple directories on LSD_DB path, and the table you're trying to modify is not in the first directory.")
    def begin_transaction(self, snapid, load_state=True):
        assert not self.transaction

        if os.path.exists(os.path.join(self.path, '.remote')):
            raise Exception("Tables that mirror remote tables cannot be written to (remove the .remote file first)")

        # Begin a new transaction
        path = self._snapshot_path(snapid)
        if os.path.isfile('%s/.committed' % path):
            raise Exception("Trying to reopen an already committed transaction")

        self.transaction = True

        if load_state:
            # Reload state
            self.set_snapshot(snapid)
            self._load_schema()
            self._load_catalog()

    def commit0(self, db, pri):
        """ Do post-transaction housekeeping """
        if pri == -1:
            # Build the tablet cache (hardwired)
            print >> sys.stderr, "[%s] Updating tablet catalog:" % (self.name),
            self.rebuild_catalog()
            self._snapshots.insert(0, self.snapid)

        # Call post-commit hooks of the given priority. By default, these
        # rebuild the neighbor cache.
        import importlib
        for hookdef in self._commit_hooks:
            (msg, priority, module, func) = hookdef[:4]
            if priority == pri:
                print >>sys.stderr, "[%s] %s:" % (self.name, msg),

                try:
                    args = hookdef[4]
                except IndexError:
                    args = []
                try:
                    kwargs = hookdef[5]
                except IndexError:
                    kwargs = {}

                m = importlib.import_module(module)
                func = "commit_hook__" + func
                getattr(m, func)(db, self, *args, **kwargs)

        if pri == 10:
            print >>sys.stderr, "[%s] Updating stats:" % self.name,

            # Compute summary stats (hardwired)
            from tasks import compute_counts
            self._nrows = compute_counts(db, self.name)
            self._store_schema()

            # Set all files read only
            print >>sys.stderr, "[%s] Marking tablets read-only..." % self.name
            path = os.path.abspath(self._snapshot_path(self.snapid))
            for root, dirs, files in os.walk(path):
                root = os.path.abspath(root)
                if root != path:
                    os.chmod(root, 0555)  # r-x
                for f in files:
                    os.chmod(os.path.join(root, f), 0444)  # r--

    def commit1(self):
        """ Do the actual commit """
        self._check_transaction()

        # Set the commit marker
        path = self._snapshot_path(self.snapid)
        commit_marker = '%s/.committed' % path
        open(commit_marker, 'w').close()
        os.chmod(commit_marker, 0444)
        os.chmod(path, 0555)

        self.transaction = False

        # Reload state
        self.set_snapshot(self.snapid)
        self._load_schema()
        self._load_catalog()

    def rollback(self):
        """ Abort the transaction """
        self._check_transaction()

        self.transaction = False

        # Reload state
        self.set_snapshot(self.snapid)
        self._load_schema()
        self._load_catalog()
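    # Typical lifecycle of a transaction (hedged sketch; in practice the
    # controlling DB instance drives these calls rather than user code):
    #
    #   table.begin_transaction(snapid)     # open a writable snapshot
    #   table.append(rows)                  # ... modify the table ...
    #   table.commit0(db, pri)              # run commit hooks, per priority
    #   table.commit1()                     # write the .committed marker, reload state
    #
    # or, on error:
    #
    #   table.rollback()                    # discard the uncommitted snapshot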
    ### File name/path related methods
    def _resolve_uri(self, uri, mode, return_parts=False):
        """ Resolve an lsd: URI referring to this table.

            Used _only_ from open_uri().

            If mode == 'w', resolve into the path of the last snapshot.
            If mode == 'r', find the latest snapshot that has the file.
        """
        assert uri[:4] == 'lsd:'

        _, tabname, fgroup, fn = uri.split(':', 3)
        (file, args, suffix) = self._get_fgroup_filter(fgroup)
        subpath = 'files/%s/%s%s' % (fgroup, fn, suffix)

        if mode == 'r':
            # Go through the list of snapshots until one is found that
            # has our file.
            for snapid in self._snapshots:
                path = '%s/%s' % (self._snapshot_path(snapid), subpath)
                if os.path.exists(path):
                    break
                if self.remote is not None:
                    try:
                        self.fetch_from_remote(path)
                        break
                    except IOError:
                        pass
            else:
                raise IOError((errno.ENOENT, "No file for URI", uri))
        elif mode == 'w':
            self._check_transaction()
            path = '%s/%s' % (self._snapshot_path(self.snapid), subpath)
        else:
            raise Exception("Invalid file access mode '%s'" % mode)

        if not return_parts:
            return path
        else:
            return path, (tabname, fgroup, fn), (file, args, suffix)

    @contextmanager
    def open_uri(self, uri, mode='r'):
        """ Open the resource (a file) identified by the URI and return a
            file-like object. The resource is closed automatically when
            the context is exited.

            Parameters
            ----------
            uri : string
                The URI of the file to be opened. It is assumed that the
                URI is an lsd: URI, referring to this table (i.e., it must
                begin with lsd:tablename:).
            mode : string
                The mode keyword is passed to the call that opens the URI,
                but in general it is the same or similar to the mode
                keyword of file(). If mode != 'r', the resource is assumed
                to be opened for writing.
        """
        (fn, (_, _, _), (file, kwargs, _)) = self._resolve_uri(uri, mode, return_parts=True)

        if mode != 'r':
            # Create the directory for the file, if it doesn't exist
            path = fn[:fn.rfind('/')]
            if not os.path.exists(path):
                utils.mkdir_p(path)

        f = file(fn, mode, **kwargs)

        yield f

        f.close()

    def _snapshot_path(self, snapid, create=False):
        """ Return the full path to the given snapshot """
        if str(snapid) != "0":
            path = "%s/snapshots/%s" % (self.path, snapid)
        else:
            path = self.path

        if create:
            utils.mkdir_p(path)

        return path

    def _cell_path(self, cell_id, mode='r'):
        """ Return the full path to a particular cell """
        if mode == 'r':
            snapid = self.catalog.snapshot_of_cell(cell_id)
        elif mode in ['w', 'r+']:
            self._check_transaction()
            snapid = self.snapid
        else:
            raise Exception("Invalid mode '%s'" % mode)

        return '%s/tablets/%s' % (self._snapshot_path(snapid), self.pix.path_to_cell(cell_id))

    def _tablet_filename(self, cgroup):
        """ Return the filename of a tablet of the given cgroup """
        return '%s.%s.h5' % (self.name, cgroup)

    def _tablet_file(self, cell_id, cgroup, mode='r'):
        """ Return the full path to the tablet of the given cgroup """
        path = self._cell_path(cell_id, mode)
        return '%s/%s' % (path, self._tablet_filename(cgroup))

    def cell_exists(self, cell_id):
        try:
            self.catalog.snapshot_of_cell(cell_id)
            return True
        except LookupError:
            return False

    def fetch_from_remote(self, local):
        # Fetch the given local file from a remote repository.
        # Raise IOError if anything goes wrong.
        remote = local[len(self.path)+1:]
        # print "FETCHING:", remote

        utils.mkdir_p(os.path.dirname(local))

        try:
            g = self._fetcher
        except AttributeError:
            from fetcher import Fetcher
            g = self._fetcher = Fetcher(self.remote)

        g.fetch_to_file(remote, local)
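    # Example (hedged sketch): reading an external file attached to this table.
    # The fgroup name 'images' and file name 'exp001.fits' are illustrative only.
    #
    #   with table.open_uri('lsd:mytable:images:exp001.fits') as f:
    #       data = f.read()
    #
    # With mode='w' (inside a transaction) the file is created under the current
    # snapshot's files/ subdirectory, transparently applying any I/O filter
    # (e.g., gzip) defined for the file group.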
""" if cgroup is None or self._is_pseudotablet(cgroup): cgroup = self.primary_cgroup assert cgroup in self._cgroups try: fn = self._tablet_file(cell_id, cgroup) except LookupError: return False if os.access(fn, os.R_OK): return True if self.remote is None: return False # If the tablet does not exist, try fetching it from a # remote database try: self.fetch_from_remote(fn) return True except IOError: return False ############# def get_cells(self, bounds=None, return_bounds=False, include_cached=True): """ Returns a list of cells (cell_id-s) overlapping the bounds. Used by the query engine to retrieve the list of cells to visit when evaluating a query. Uses TableCatalog to accelerate the lookup (and autocreates it if it doesn't exist). Parameters ---------- bounds : list of (Polygon, intervalset) tuples or None The bounds to be checked return_bounds : boolean If true, for return a list of (cell_id, bounds) tuples, where the returned bounds in each tuple are the intersection of input bounds and the bounds of that cell (i.e., for an object known to be in that cell, you only need to check the associated bounds to verify whether it's within the input bounds). If the bounds cover the entire cell, (cell_id, (None, None)) will be returned. include_cached : boolean If true, return the cells that have cached data only, and no "true" data belonging to that cell. """ return self.catalog.get_cells(bounds, return_bounds, include_cached) def static_if_no_temporal(self, cell_id): """ Return the associated static cell, if no data exist in temporal. See if we have data in cell_id. If not, return a corresponding static sky cell_id. Useful when evaluating static-temporal JOINs If the cell_id already refers to a static cell, this function is a NOOP. """ if not self.pix.is_temporal_cell(cell_id): return cell_id if self.cell_exists(cell_id): ##print "Temporal cell found!", self._cell_prefix(cell_id) return cell_id # return corresponding static-sky cell cell_id = self.pix.static_cell_for_cell(cell_id) #print "Reverting to static sky", self._cell_prefix(cell_id) return cell_id def _get_fgroup_filter(self, fgroup): """ Fetch the I/O filter associated with the file group. Each file group can have an "I/O filter" associated with it. The typical use for filters is to enable transparent compression of external BLOBs. Available I/O filters are: gzip : gzip compression bzip2 : bzip2 compression Returns ------- file : callable A callable with an interface equal to that of file(). For example, gzip.GzipFile is returned for gzip I/O filter. kwargs : dict A dictionary of keyword arguments the caller should pass in a call to file callable (the one above). For example, kwargs would be { 'compresslevel': 5 } to set the compression level in a call to GzipFile. suffix : string Any suffix that the caller should append to the file name to get to the actual file as stored on the disk (example: .gz for gzip compressed files). 
""" # Check for any filters associated with this fgroup if fgroup in self._fgroups and 'filter' in self._fgroups[fgroup]: (filter, kwargs) = self._fgroups[fgroup]['filter'] if filter == 'gzip': # Gzipped file import gzip file = gzip.GzipFile suffix = '.gz' elif filter == 'bzip2': # Bzipped file import bz2 file = bz2.BZ2File suffix = '.bz2' else: raise Exception('Unknown filter "%s" on file group %f' % fgroup) else: # Plain file import __builtin__ file = __builtin__.file kwargs = {} suffix = '' return file, kwargs, suffix def set_default_filters(self, **filters): """ Set default PyTables filters (compression, checksums) Immediately commits the change to disk. """ self._filters = filters self._store_schema() def define_commit_hooks(self, hooks): self._commit_hooks = hooks self._store_schema() def define_fgroup(self, fgroup, fgroupdef): """ Define a new (or redefine an existing) file group Immediately commits the change to disk. """ self._fgroups[fgroup] = fgroupdef self._store_schema() def _unicode_to_str(self, arr): """ HACK: Recursively in-place convert unicode objects to str objects """ if isinstance(arr, list): it = enumerate(arr) elif isinstance(arr, dict): it = arr.iteritems() else: return for k, v in it: if isinstance(v, unicode): arr[k] = v.encode('utf-8') else: self._unicode_to_str(v) def _find_metadata_path(self, fn): if self.transaction: path = os.path.join(self._snapshot_path(self.snapid), fn) if os.path.isfile(path): return path if self._snapshots: return os.path.join(self._snapshot_path(self._snapshots[0]), fn) else: # Completely empty table -- return dummy metadata path return os.path.join(self._snapshot_path(0), fn) def _load_schema(self): """ Load the table schema. Load the table schema from schema.cfg file, and rebuild the internal representation of the table (the self.columns dict). """ schemacfg = self._find_metadata_path('schema.cfg') data = json.loads(file(schemacfg).read(), object_pairs_hook=OrderedDict) self._unicode_to_str(data) self.name = data["name"] self._nrows = data.get("nrows", None) ###################### # Backwards compatibility level, t0, dt = data["level"], data["t0"], data["dt"] self.pix = Pixelization(level, t0, dt) # Load cgroup definitions if isinstance(data['cgroups'], dict): # Backwards compatibility, keeps ordering because of objecct_pairs_hook=OrderedDict above self._cgroups = data["cgroups"] else: self._cgroups = OrderedDict(data['cgroups']) # Postprocessing: fix cases where JSON restores arrays instead # of tuples, and tuples are required for _, schema in self._cgroups.iteritems(): schema['columns'] = [ tuple(val) for val in schema['columns'] ] self._fgroups = data.get('fgroups', {}) self._filters = data.get('filters', {}) self._aliases = data.get('aliases', {}) self._commit_hooks = data.get('commit_hooks', self._default_commit_hooks) # Add pseudocolumns cgroup self._cgroups['_PSEUDOCOLS'] = \ { 'columns': [ ('_CACHED', 'bool'), ('_ROWIDX', 'u8'), ('_ROWID', 'u8') ] } self._rebuild_internal_schema() def _store_schema(self): """ Store the table schema. Store the table schema to schema.cfg, in JSON format. 
""" self._check_transaction() data = dict() data["level"], data["t0"], data["dt"] = self.pix.level, self.pix.t0, self.pix.dt data["nrows"] = self._nrows data["cgroups"] = [ (name, schema) for (name, schema) in self._cgroups.iteritems() if name[0] != '_' ] data["name"] = self.name data["fgroups"] = self._fgroups data["filters"] = self._filters data["aliases"] = self._aliases data["commit_hooks"] = self._commit_hooks fn = self._snapshot_path(self.snapid, create=True) + '/schema.cfg' f = open(fn, 'w') f.write(json.dumps(data, indent=4, sort_keys=True)) f.close() def _rebuild_internal_schema(self): """ (Re)Build the internal representation of the schema. Rebuild the internal representation of the schema from self._cgroups OrderedDict. This means populating the self.columns dict, as well as primary_cgroup, primary_key and other similar data members. """ self.columns = OrderedDict() self.primary_cgroup = None for cgroup, schema in self._cgroups.iteritems(): for colname, dtype in schema['columns']: assert colname not in self.columns self.columns[colname] = ColumnType() self.columns[colname].name = colname self.columns[colname].dtype = np.dtype(dtype) self.columns[colname].cgroup = cgroup if self.primary_cgroup is None and not self._is_pseudotablet(cgroup): self.primary_cgroup = cgroup if 'primary_key' in schema: self.primary_key = self.columns[schema['primary_key']] if 'temporal_key' in schema: self.temporal_key = self.columns[schema['temporal_key']] if 'spatial_keys' in schema: (lon, lat) = schema['spatial_keys'] self.spatial_keys = (self.columns[lon], self.columns[lat]) else: # If any of these are defined, they must be defined in the # primary cgroup assert 'primary_key' not in schema assert 'spatial_keys' not in schema assert 'temporak_key' not in schema if 'blobs' in schema: for colname in schema['blobs']: assert self.columns[colname].dtype.base == np.int64, "Data structure error: blob reference columns must be of int64 type" self.columns[colname].is_blob = True ################# @property def dtype(self): """ Return the dtype of a row in this table. Returns ------- dtype : numpy.dtype """ return np.dtype([ (name, coltype.dtype) for (name, coltype) in self.columns.iteritems() ]) def dtype_for(self, cols): """ Return the dtype of a row of a subset of columns. Parameters ---------- cols : iterable of strings The subset of columns for which to return the dtype. Column aliases are allowed. Returns ------- dtype : numpy.dtype """ return np.dtype([ (name, self.columns[self.resolve_alias(name)].dtype) for name in cols ]) ################# def create_cgroup(self, cgroup, schema, ignore_if_exists=False): """ Create a new column group. Immediately commits the change to the disk. Parameters ---------- cgroup : string The name of the new column group. schema : dict-like The schema of the new column group. ignore_if_exists: boolean If False, and the cgroup already exists, an Exception will be raised. 
""" # Create a new table and set it as primary if it # has a primary_key if cgroup in self._cgroups and not ignore_if_exists: raise Exception('Trying to create a cgroup that already exists!') if self._is_pseudotablet(cgroup): raise Exception("cgroups beginning with '_' are reserved for system use.") schema = copy.deepcopy(schema) # convert all dtypes with type='O8' to blobrefs (type='i8') for (pos, (name, dtype)) in enumerate(schema['columns']): s0 = dtype s1 = s0.replace('O8', 'i8') if s0 != s1: schema['columns'][pos] = (name, s1) # Add it to blobs array, if not already there if 'blobs' not in schema: schema['blobs'] = {} if name not in schema['blobs']: schema['blobs'][name] = {} if 'spatial_keys' in schema and 'primary_key' not in schema: raise Exception('Trying to create spatial keys in a non-primary cgroup!') if 'primary_key' in schema: if self.primary_cgroup is not None: raise Exception('Trying to create a primary cgroup ("%s") while one ("%s") already exists!' % (cgroup, self.primary_cgroup)) self.primary_cgroup = cgroup if 'blobs' in schema: cols = dict(schema['columns']) for blobcol in schema['blobs']: assert is_scalar_of_type(cols[blobcol], np.int64) self._cgroups[cgroup] = schema self._rebuild_internal_schema() self._store_schema() ### Cell locking routines def _lock_cell(self, cell_id, timeout=None): """ Low-level: Lock a given cell for writing. You should prefer the lock_cell() context manager to this function. If timeout != None, and the cell is locked, we will retry for timeout seconds to lock the cell. If all attempts fail, locking.LockTimeout exception will be thrown. Returns ------- lock : opaque object The lock handle. """ self._check_transaction() # create directory if needed path = self._cell_path(cell_id, 'w') if not os.path.exists(path): utils.mkdir_p(path) fn = '%s/.__%s.lock' % (path, self.name) lock = locking.acquire(fn, timeout) logger.debug("Acquired lock %s" % (fn)) return lock def _unlock_cell(self, lock): """ Unlock a previously locked cell. """ locking.release(lock) logger.debug("Released lock %s" % (lock)) #### Low level tablet creation/access routines. These employ no locking def _get_row_group(self, fp, group, cgroup): """ Get a handle to the given HDF5 node. Obtain a handle to the given HDF5 node, autocreating it if necessary. If auto-creating, use the information from the table schema to create the HDF5 objects (tables, arrays) corresponding to the cgroup. The parameter 'group' specifies whether we're retreiving/creating the group with data belonging to the cell ('main'), or the neighbor cache ('cached'). TODO: I feel this whole 'group' business hasn't been well though out and should be reconsidered/redesigned... 
""" assert group in ['main', 'cached'] g = getattr(fp.root, group, None) if g is None: schema = self._get_schema(cgroup) # cgroup filters = schema.get('filters', self._filters) expectedrows = schema.get('expectedrows', 20*1000*1000) fp.create_table('/' + group, 'table', np.dtype(schema["columns"]), createparents=True, expectedrows=expectedrows, filters=tables.Filters(**filters)) g = getattr(fp.root, group) # Primary key sequence if group == 'main' and 'primary_key' in schema: seqname = '_seq_' + schema['primary_key'] fp.create_array(g, seqname, np.array([1], dtype=np.uint64)) # BLOB storage arrays if 'blobs' in schema: for blobcol, blobdef in schema['blobs'].iteritems(): filters = blobdef.get('filters', filters) expectedsizeinMB = blobdef.get('expectedsizeinMB', 1.0) # Decide what type of VLArray to create type = blobdef.get('type', 'object') if type == 'object': atom = BLOBAtom() else: atom = tables.Atom.from_dtype(np.dtype(type)) fp.createVLArray('/' + group +'/blobs', blobcol, atom, "BLOBs", createparents=True, filters=tables.Filters(**filters), expectedsizeinMB=expectedsizeinMB) b = getattr(g.blobs, blobcol) if isinstance(atom, BLOBAtom): b.append(None) # ref=0 always points to None (for BLOBs) else: b.append([]) # ref=0 points to an empty array for other BLOB types return g def drop_row_group(self, cell_id, group): """ Delete the given HDF5 group and all its children from all tablets of cell cell_id TODO: I feel this whole 'group' business hasn't been well though out and should be reconsidered/redesigned... """ with self.lock_cell(cell_id, mode='r+') as cell: for cgroup in self._cgroups: if self._is_pseudotablet(cgroup): continue with cell.open(cgroup) as fp: if group in fp.root: fp.removeNode('/', group, recursive=True); def _create_tablet(self, fn, cgroup): """ Create a new tablet. Create a tablet in file , for column group . """ self._check_transaction() # Create a tablet at a given path, for cgroup 'cgroup' assert os.access(fn, os.R_OK) == False # Create the cell directory if it doesn't exist path = fn[:fn.rfind('/')]; if not os.path.exists(path): utils.mkdir_p(path) # Create the tablet logger.debug("Creating tablet %s" % (fn)) fp = tables.open_file(fn, mode='w') # Force creation of the main subgroup self._get_row_group(fp, 'main', cgroup) return fp def _open_tablet(self, cell_id, cgroup, mode='r'): """ Open (or create) a tablet. mode='r' : Open an existing tablet, read-obly mode='w' : Open or create a tablet, truncating its contents mode='r+': Open an existing tablet, for reading/writing Modes that imply writablility require a transaction to be open. Employs no locking of any kind. """ if mode == 'r': fn_r = self._tablet_file(cell_id, cgroup) # --- hack: preload the entire file to have it appear in filesystem cache # this will speed up subsequent random reads within the file with open(fn_r) as f: f.read() # --- fp = tables.open_file(fn_r) elif mode == 'r+': self._check_transaction() fn_w = self._tablet_file(cell_id, cgroup, mode='w') if os.path.isfile(fn_w): fp = tables.open_file(fn_w, mode='a') elif self.tablet_exists(cell_id, cgroup): # Note: this will download the tablet from remote, if needed # A file exists in an older snapshot. Copy it over here. 
    def _open_tablet(self, cell_id, cgroup, mode='r'):
        """ Open (or create) a tablet.

            mode='r' : Open an existing tablet, read-only
            mode='w' : Open or create a tablet, truncating its contents
            mode='r+': Open an existing tablet, for reading/writing

            Modes that imply writability require a transaction to be open.

            Employs no locking of any kind.
        """
        if mode == 'r':
            fn_r = self._tablet_file(cell_id, cgroup)
            # --- hack: preload the entire file to have it appear in the filesystem cache;
            #     this will speed up subsequent random reads within the file
            with open(fn_r) as f:
                f.read()
            # ---
            fp = tables.open_file(fn_r)
        elif mode == 'r+':
            self._check_transaction()
            fn_w = self._tablet_file(cell_id, cgroup, mode='w')
            if os.path.isfile(fn_w):
                fp = tables.open_file(fn_w, mode='a')
            elif self.tablet_exists(cell_id, cgroup):
                # Note: this will download the tablet from remote, if needed.
                # A file exists in an older snapshot. Copy it over here.
                fn_r = self._tablet_file(cell_id, cgroup)
                assert fn_r != fn_w, (fn_r, fn_w)
                shutil.copy(fn_r, fn_w)
                os.chmod(fn_w, 0664)  # Ensure it's writable
                fp = tables.open_file(fn_w, mode='a')
            else:
                # No file exists
                fp = self._create_tablet(fn_w, cgroup)
        elif mode == 'w':
            self._check_transaction()
            fn_w = self._tablet_file(cell_id, cgroup, mode='w')
            fp = self._create_tablet(fn_w, cgroup)
        else:
            raise Exception("Mode must be one of 'r', 'r+', or 'w'")

        return fp

    ### Public methods
    def __init__(self, path, snapid, open_transaction, mode='r', name=None):
        """ Constructor.

            Never use directly. Use DB.table() to obtain an instance of
            this class.
        """
        if mode == 'r' and not os.path.isdir(path):
            raise IOError('Cannot access table: "%s" is nonexistent or unreadable.' % (path))

        self.path = path

        self.set_snapshot(snapid)
        if open_transaction:
            self.begin_transaction(snapid, load_state=False)

        if mode == 'c':
            self._create(snapid, name, path)

        # Load the state
        self._load_schema()
        self._load_catalog()

    def _create(self, snapid, name, path):
        """ Create an empty table and store its schema. """
        assert name is not None
        self._check_transaction()

        for path in glob.iglob('%s/snapshots/*/.committed' % (self.path)):
            raise Exception("Creating a new table in '%s' would overwrite an existing one." % self.path)

        utils.mkdir_p(self.path)

        self._cgroups = OrderedDict()
        self._fgroups = dict()
        self._filters = dict()
        self._aliases = dict()
        self._commit_hooks = []
        self.columns = OrderedDict()
        self.name = name

        # Pixelization
        self.pix = Pixelization(level=int(os.getenv("PIXLEVEL", 6)), t0=54335, dt=1)

        # Empty table catalog
        self.catalog = TableCatalog(pix=self.pix)

        # Save the newly constructed schema
        self._store_schema()

    def define_alias(self, alias, colname):
        """ Define an alias to a column

            Immediately commits the change to disk.

            Parameters
            ----------
            alias : string
                The new alias of the column
            colname : string
                The column being aliased
        """
        assert colname in self.columns

        self._aliases[alias] = colname

        self._store_schema()

    def resolve_alias(self, colname):
        """ Return the name of an aliased column.

            Given an alias, return the column name it aliases. This
            function is a no-op if the alias is a column name itself.

            Besides the aliases defined by the user using .define_alias(),
            there are five built-in special aliases:

                _ID   : Alias to the primary_key
                _LON  : Alias to the longitude spatial key (if any)
                _LAT  : Alias to the latitude spatial key (if any)
                _TIME : Alias to the temporal key (if any)
                _EXP  : Alias to the exposure key (if any)
        """
        schema = self._get_schema(self.primary_cgroup)

        # built-in aliases
        if   colname == '_ID'   and 'primary_key'  in schema: return schema['primary_key']
        elif colname == '_LON'  and 'spatial_keys' in schema: return schema['spatial_keys'][0]
        elif colname == '_LAT'  and 'spatial_keys' in schema: return schema['spatial_keys'][1]
        elif colname == '_TIME' and 'temporal_key' in schema: return schema['temporal_key']
        # TODO: Consider moving these to user aliases at some point
        elif colname == '_EXP'  and 'exposure_key' in schema: return schema['exposure_key']

        # User aliases
        return self._aliases.get(colname, colname)
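    # Example (hedged sketch): aliasing a survey-specific column name and
    # resolving built-in aliases. Column names are illustrative.
    #
    #   table.define_alias('mag_r', 'r_psf_mag')
    #   table.resolve_alias('mag_r')   # -> 'r_psf_mag'
    #   table.resolve_alias('_LON')    # -> name of the longitude spatial key, e.g. 'ra'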
    def append(self, cols_, group='main', cell_id=None, _update=False):
        """ Append or update a set of rows in this table.

            Appends or updates a set of rows into this table. Protects
            against multiple writers simultaneously inserting into the same
            table.

            Returns
            -------
            ids : ndarray
                The primary keys of appended/updated rows

            TODO: Document (and simplify!!!) the algorithm deciding how the
                  append/update happens. For now, see the comments in the
                  source or e-mail me (mjuric@youknowtherest).

            TODO: Refactor and rework this monstrosity. It brings shame to
                  my family ;-).
        """
        assert group in ['main', 'cached']
        assert _update == False or group != 'cached'

        # Must be in a transaction to modify things
        self._check_transaction()

        # Resolve aliases in the input, and prepare a ColGroup()
        cols = ColGroup()
        if getattr(cols_, 'items', None):
            # Permit cols_ to be a dict()-like object
            cols_ = cols_.items()
        if getattr(cols_, 'dtype', None):
            # Allow cols_ to be an ndarray or ColGroup
            cols_ = [ (name, cols_[name]) for name in cols_.dtype.names ]
        for name, col in cols_:
            cols.add_column(self.resolve_alias(name), col)
        assert cols.ncols()

        # if the primary key column has not been supplied by the user, add it
        key = self.get_primary_key()
        if key not in cols:
            cols[key] = np.zeros(len(cols), dtype=self.columns[key].dtype)
        else:
            # If the primary key column has been supplied by the user, it either
            # has to refer to cells only, or this append() must be allowed to
            # update/insert rows.
            # Alternatively, cell_id may be != None (e.g., for filling in neighbor caches)
            cid = self.pix.is_cell_id(cols[key])
            assert cid.all() or _update or cell_id is not None, "If keys are given, they must refer to the cell only."

            # Setup the 'base' keys (with the obj_id part equal to zero)
            cols[key][cid] &= np.uint64(0xFFFFFFFF00000000)

        # Locate the cells into which we're going to store the rows
        #   - if cell_id is not None: override everything else and insert into the requested cell(s).
        #   - elif the primary key column exists and is not all zeros: compute destination cells from it
        #   - elif the spatial key columns exist: use them to determine destination cells
        #
        # Rules for (auto)generation of keys:
        #   - if the key is all zeros, the cell part (higher 32 bits) will be set to the cell part of cell_id
        #   - if the object part of the key is all zeros, it will be generated from the cell's sequence
        #
        # Note that a key with a cell part of 0x0 points to a valid cell (the south pole)!
        if cell_id is not None:
            # An explicit vector (or scalar) of destination cell(s) has been provided.
            # Overrides anything that would've been computed from primary_key or spatial_keys.
            # Shouldn't be used EVER (unless you really, really, really know what you're doing.)
            assert group != 'main'  # Allowed only for neighbor cache builds, really...

            cells = np.array(cell_id, copy=False, ndmin=1)
            if len(cells) == 1:
                cells = np.resize(cells, len(cols))
        else:
            # Deduce any unset keys from spatial_keys
            if not cols[key].all():
                assert group == 'main'

                need_key = cols[key] == 0

                # Deduce remaining cells from spatial and temporal keys
                lonKey, latKey = self.get_spatial_keys()
                assert lonKey and latKey, "The table must have at least the spatial keys!"
                assert lonKey in cols and latKey in cols, "The input must contain at least the spatial keys!"
                tKey = self.get_temporal_key()

                lon = cols[lonKey][need_key]
                lat = cols[latKey][need_key]
                t   = cols[tKey][need_key] if tKey is not None else None

                cols[key][need_key] = self.pix.obj_id_from_pos(lon, lat, t)

            # Deduce destination cells from keys
            cells = self.pix.cell_for_id(cols[key])

        #
        # Do the storing, cell by cell
        #
        ntot = 0
        unique_cells = list(set(cells))
        while unique_cells:
            # Find a cell that is ready to be written to (that isn't locked
            # by another writer) and lock it
            for k in xrange(3600):
                try:
                    i = k % len(unique_cells)
                    cur_cell_id = unique_cells[i]

                    # Try to acquire a lock for the entire cell
                    lock = self._lock_cell(cur_cell_id, timeout=1)

                    unique_cells.pop(i)
                    break
                except locking.LockTimeout as _:
                    # print "LOCK:", _
                    pass
            else:
                raise Exception('Appear to be stuck on a lock file!')

            # Mask for rows belonging to this cell
            incell = cells == cur_cell_id

            # Store cell groups into their tablets
            for cgroup, schema in self._cgroups.iteritems():
                if self._is_pseudotablet(cgroup):
                    continue

                # Get the tablet file handles
                fp = self._open_tablet(cur_cell_id, mode='r+', cgroup=cgroup)
                g  = self._get_row_group(fp, group, cgroup)
                t  = g.table
                blobs = schema['blobs'] if 'blobs' in schema else dict()

                # select out only the columns belonging to this tablet and cell
                colsT = ColGroup([ (colname, cols[colname][incell]) for colname, _ in schema['columns'] if colname in cols ])
                colsB = dict([ (colname, colsT[colname]) for colname in colsT.keys() if colname in blobs ])

                if cgroup == self.primary_cgroup:
                    # Logical number of rows in this cell
                    nrows = len(t)

                    # Find keys needing an autogenerated ID and generate it
                    _, _, _, i = self.pix._xyti_from_id(colsT[key])

                    # Ensure that autogenerated keys are greater than any that
                    # will be inserted in this operation
                    id_seq = getattr(g, '_seq_' + key, None)
                    if id_seq:
                        id0 = id_seq[0] = max(id_seq[0], np.max(i)+1)
                    else:
                        assert group == 'cached'

                    if not i.all():
                        assert group != 'cached'
                        #assert not _update, "Shouldn't pass here"
                        assert cell_id is None

                        need_keys = i == 0
                        nnk = need_keys.sum()

                        # Generate nnk keys
                        genIds = np.arange(id0, id0 + nnk, dtype=np.uint64)
                        id_seq[0] = id0 + nnk

                        # Store the keys where they're needed
                        colsT[key][need_keys] += genIds
                        cols[key][incell] = colsT[key]

                    # If this is an update, find where the new rows map
                    if _update:
                        id1 = t.col(self.primary_key.name)  # Load the primary keys of existing rows
                        id2 = colsT[key]                    # Primary keys of new rows

                        # The "find-insertion-points" idiom (if only np.in1d returned indices...)
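                        # Worked micro-example of the idiom (illustrative values only):
                        #   existing ids  id1 = [40, 10, 30]  -> sorted: [10, 30, 40], ii = [1, 2, 0]
                        #   incoming ids  id2 = [30, 50]
                        #   searchsorted([10, 30, 40], [30, 50]) = [1, 3]
                        #   -> 30 matches an existing row (updated in place, remapped via ii),
                        #      50 falls past the end (appended as a new row).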
                        ii = id1.argsort()
                        id1 = id1[ii]

                        idx = np.searchsorted(id1, id2)

                        # If this is a pure append, unset idx
                        if np.min(idx) == len(id1):
                            idx = slice(None)
                        else:
                            # Find rows which will be added, and those which will be updated
                            in_ = idx < len(id1)                  # Rows with IDs less than the maximum existing one
                            app = np.ones(len(id2), dtype=np.bool)
                            app[in_] = id1[idx[in_]] != id2[in_]  # These rows will be appended
                            nnew = app.sum()

                            # Reindex new rows past the end
                            idx[app] = np.arange(len(id1), len(id1)+nnew)

                            # Reindex existing rows to the unsorted id1 ordering
                            napp = ~app
                            idx[napp] = ii[idx[napp]]

                            # print id1, id2, idx, app, nnew; exit()

                if _update and not isinstance(idx, slice):
                    # Load existing rows (and immediately delete them)
                    rows = t.read()
                    t.truncate(0)

                    # Resolve blobs, merge them with ours (and immediately delete)
                    for colname in colsB:
                        bb = self._fetch_blobs_fp(fp, colname, rows[colname])
                        len0 = len(bb)
                        bb = np.resize(bb, (nrows + nnew,) + bb.shape[1:])
                        # Since np.resize fills the newly allocated part with zeros, change it to None
                        bb[len0:] = None
                        bb[idx] = colsB[colname]
                        colsB[colname] = bb

                        getattr(g.blobs, colname).truncate(1)  # Leave the 'None' BLOB

                    # Close and reopen (otherwise truncate appears to have no effect)
                    # -- bug in PyTables ??
                    logger.debug("Closing tablet (%s)" % (fp.filename))
                    fp.close()
                    fp = self._open_tablet(cur_cell_id, mode='r+', cgroup=cgroup)
                    g  = self._get_row_group(fp, group, cgroup)
                    t  = g.table

                    # Enlarge the array to accommodate new rows (this will also set them to zero)
                    rows.resize(nrows + nnew)

                    # print len(colsB['hdr']), len(rows), nnew
                    # print colsB['hdr']
                    # exit()
                else:
                    # Construct a compatible numpy array, that will leave
                    # unspecified columns set to zero
                    nnew = np.sum(incell)
                    rows = np.zeros(nnew, dtype=np.dtype(schema['columns']))
                    idx = slice(None)

                # Update/add regular columns
                for colname in colsT.keys():
                    if colname in blobs:
                        continue
                    rows[colname][idx] = colsT[colname]

                # Update/add blobs. They're different as they'll touch all
                # the rows, every time (even when updating).
                for colname in colsB:
                    # BLOB column - find unique objects, insert them
                    # into the BLOB VLArray, and put the indices to those
                    # into the actual cgroup
                    assert colsB[colname].dtype == object
                    flatB = colsB[colname].reshape(colsB[colname].size)
                    idents = np.fromiter(( id(v) for v in flatB ), dtype=np.uint64, count=flatB.size)
                    _, idx, ito = np.unique(idents, return_index=True, return_inverse=True)  # Note: implicitly flattens multi-D input arrays
                    uobjs = flatB[idx]
                    ito = ito.reshape(rows[colname].shape)  # De-flatten the output indices

                    # Offset indices
                    barray = getattr(g.blobs, colname)
                    bsize = len(barray)
                    ito = ito + bsize

                    # Remap any None values to index 0 (where None is stored by convention).
                    # We use the fact that None will be sorted to the front of the unique sequence, if it exists
                    if len(uobjs) and uobjs[0] is None:
                        ##print "Remapping None", len((ito == bsize).nonzero()[0])
                        uobjs = uobjs[1:]
                        ito -= 1
                        ito[ito == bsize-1] = 0

                    rows[colname] = ito

                    # Check we've correctly mapped everything
                    uobjs2 = np.append(uobjs, [None])
                    assert (uobjs2[np.where(rows[colname] != 0, rows[colname]-bsize, len(uobjs))] == colsB[colname]).all()

                    # Do the storing
                    for obj in uobjs:
                        if obj is None and not isinstance(barray.atom, tables.ObjectAtom):
                            obj = []
                        barray.append(obj)

                    # print 'LEN:', colname, bsize, len(barray), ito

                t.append(rows)
                logger.debug("Closing tablet (%s)" % (fp.filename))
                fp.close()

            # exit()

            self._unlock_cell(lock)

            #print '[', nrows, ']'
            self._nrows = self._nrows + nnew
            ntot = ntot + nnew

        assert _update or ntot == len(cols), 'ntot != len(cols), ntot=%d, len(cols)=%d, cur_cell_id=%d' % (ntot, len(cols), cur_cell_id)
        assert len(np.unique(cols[key])) == len(cols), 'len(np.unique(cols[key])) != len(cols) (%s != %s) in cell %s' % (len(np.unique(cols[key])), len(cols), cur_cell_id)

        return cols[key]

    def nrows(self):
        """ Returns the (cached) number of rows in the table """
        return self._nrows

    def close(self):
        pass

    def __str__(self):
        """ Return some basic (human readable) information about the table. """
        i =  'Path: %s\n' % self.path
        i += 'Partitioning: level=%d\n' % (self.pix.level)
        i += '(t0, dt): %f, %f \n' % (self.pix.t0, self.pix.dt)
        i += 'Rows: %d\n' % (self.nrows())
        i += 'Columns: %d\n' % (len(self.columns) - len(self._cgroups['_PSEUDOCOLS']['columns']))
        i += 'Primary key: %s\n' % self.get_primary_key()
        if self.spatial_keys:
            i += 'Spatial keys: (%s, %s)\n' % tuple([ self.spatial_keys[i].name for i in xrange(2) ])
        if self.temporal_key:
            i += 'Temporal key: %s\n' % self.get_temporal_key()
        ek = self.resolve_alias('_EXP')
        if ek != '_EXP':
            i += 'Exposure key: %s\n' % ek
        i += 'Aliases: %s\n' % str(self._aliases.items())
        i += 'Column groups: %s\n' % str([key for key in self._cgroups.iterkeys() if key[0] != '_'])

        s = ''
        for cgroup, schema in self._cgroups.iteritems():
            if cgroup[0] == '_':
                # Skip pseudo-tablets
                continue
            s += '-'*31 + '\n'
            s += 'Column group \'' + cgroup + '\':\n'
            s += "%20s %10s\n" % ('Column', 'Type')
            s += '-'*31 + '\n'
            for col in schema["columns"]:
                s = s + "%20s %10s\n" % (col[0], col[1])
            s = s + '-'*31 + '\n'

        return i + s

    def _get_schema(self, cgroup):
        """ Return the schema of the given column group. """
        return self._cgroups[cgroup]
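    # Example (hedged sketch): appending rows from within an open transaction.
    # Column names are illustrative and must match the table's schema; the
    # primary key is autogenerated when not supplied.
    #
    #   ids = table.append({
    #       'ra':  np.array([10.68, 56.75]),
    #       'dec': np.array([41.27, 24.12]),
    #   })
    #   # 'ids' holds the autogenerated primary keys of the new rows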
    def _smart_load_blobs(self, barray, refs):
        """ Intelligently load an array of BLOBs

            Load an ndarray of BLOBs from a set of refs, taking care not to
            instantiate duplicate objects for the same BLOBs.

            Parameters
            ----------
            barray : tables.VLArray
                The PyTables VLArray from which to read the BLOBs
            refs : ndarray of int64
                The 1-dimensional list of BLOB references to be
                instantiated.

            Returns
            -------
            blobs : numpy array of objects
                A 1D array of blobs, corresponding to the refs.
        """
        ##return np.ones(len(refs), dtype=object);
        assert len(refs.shape) == 1

        ui, _, idx = np.unique(refs, return_index=True, return_inverse=True)
        assert (ui >= 0).all()  # Negative refs are illegal. Index 0 means None

        objlist = barray[ui]
        if len(ui) == 1 and tables.__version__ == '2.2':
            # bug workaround -- PyTables 2.2 returns a scalar for length-1 arrays
            objlist = [ objlist ]

        # Note: using np.empty followed by a loop (as opposed to
        #       np.array) ensures a 1D array will be created, even
        #       if objlist[0] is an array (in which case np.array
        #       misinterprets it as a request to create a 2D numpy
        #       array)
        blobs = np.empty(len(objlist), dtype=object)
        for i, obj in enumerate(objlist):
            blobs[i] = obj
        blobs = blobs[idx]

        #print >> sys.stderr, 'Loaded %d unique objects for %d refs' % (len(objlist), len(idx))

        return blobs

    def _fetch_blobs_fp(self, fp, column, refs, include_cached=False):
        """ Fetch the BLOBs referenced by refs from the PyTables file object fp.

            The BLOB references are indices into a VLArray (variable length
            array) in the HDF5 file. By convention, the indices to BLOBs in
            the 'main' subgroup of the file (the one that contains the rows
            belonging to the cell, as opposed to those in the neighbor
            cache) are positive. Conversely, the refs to cached BLOBs are
            negative (and should be loaded from the 'cached' subgroup of
            the file). This function transparently takes care of all of
            that.

            Parameters
            ----------
            fp : tables.File
                PyTables file object from which to load the BLOBs
            column : string
                The column name of the BLOB column
            refs : ndarray of int64
                The BLOB references to BLOBs to instantiate
            include_cached : boolean
                Whether to load the cached BLOBs or not.

            Returns
            -------
            blobs : numpy array of objects
                A 1D array of blobs, corresponding to the refs.

            TODO: Why do we need the include_cached param here, when it
                  could be inferred from whether there are any negative
                  refs?
        """
        # Flatten refs; we'll deflatten the blobs in the end
        shape = refs.shape
        refs = refs.reshape(refs.size)

        # Load the blobs
        b1 = getattr(fp.root.main.blobs, column)
        if include_cached and 'cached' in fp.root:
            # We have cached objects in the 'cached' group -- read the blobs
            # from there as well. Blob refs of cached objects are negative.
            b2 = getattr(fp.root.cached.blobs, column)

            blobs = np.empty(len(refs), dtype=object)
            blobs[refs >= 0] = self._smart_load_blobs(b1,  refs[refs >= 0]),
            blobs[ refs < 0] = self._smart_load_blobs(b2, -refs[ refs < 0]),
        else:
            blobs = self._smart_load_blobs(b1, refs)

        # Bring back to the original shape
        blobs = blobs.reshape(shape)

        return blobs
""" # short-circuit if there's nothing to be loaded if len(refs) == 0: return np.empty(refs.shape, dtype=np.object_) # Get the table for this column cgroup = self.columns[column].cgroup # revert to static sky cell if cell_id is temporal but # unpopulated (happens in static-temporal JOINs) cell_id = self.static_if_no_temporal(cell_id) # load the blobs arrays with self.lock_cell(cell_id) as cell: with cell.open(cgroup) as fp: blobs = self._fetch_blobs_fp(fp, column, refs, include_cached) return blobs def fetch_tablet(self, cell_id, cgroup=None, include_cached=False): """ Load and return the contents of a tablet. Parameters ---------- cell_id : number The cell ID from which to load cgroup : string or None The column group whose tablet to load. If set to None, the primary column group's tablet will be loaded. include_cached : boolean If True, data from the neighbor cache will be returned as well. Returns ------- rows : structured ndarray The rows from the tablet. Notes ----- If the tablet contains BLOB columns, only the references will be returned by this function. Call fetch_blobs to instantiate the actual objects. If include_cached=True, and the tablet contains BLOB columns, the references to blobs in the neighbor cache will be negative. fetch_blobs() understands and automatically takes care of this. If the cell_id has a temporal component, and there's no tablet in that cell, a static sky cell corresponding to it is tried next. """ if cgroup is None: cgroup = self.primary_cgroup # revert to static sky cell if cell_id is temporal but # unpopulated (happens in static-temporal JOINs) cell_id = self.static_if_no_temporal(cell_id) if self._is_pseudotablet(cgroup): return self._fetch_pseudotablet(cell_id, cgroup, include_cached) if self.tablet_exists(cell_id, cgroup): # Note: this will download the tablet from remote, if needed with self.lock_cell(cell_id) as cell: with cell.open(cgroup) as fp: rows = fp.root.main.table.read() if include_cached and 'cached' in fp.root: rows2 = fp.root.cached.table.read() # Make any neighbor cache BLOBs negative (so that fetch_blobs() know to # look for them in the cache, instead of 'main') schema = self._get_schema(cgroup) if 'blobs' in schema: for blobcol in schema['blobs']: rows2[blobcol] *= -1 # Append the data from cache to the main tablet rows = np.append(rows, rows2) else: schema = self._get_schema(cgroup) rows = np.empty(0, dtype=np.dtype(schema['columns'])) return rows def _fetch_pseudotablet(self, cell_id, cgroup, include_cached=False): """ Internal: Fetch a "pseudotablet". A pseudotablet is a tablet that contains pseudocolumns, columns that are computed on the fly: _CACHED, _ROWID and _ROWIDX DO NOT CALL THIS FUNCTION DIRECTLY. It will be called by fetch_tablet, when a pseudotablet name is encountered (a name beginning with '_'). """ assert cgroup == '_PSEUDOCOLS' # Find out how many rows are there in this cell nrows1 = nrows2 = 0 if self.cell_exists(cell_id): with self.lock_cell(cell_id) as cell: with cell.open(self.primary_cgroup) as fp: nrows1 = len(fp.root.main.table) nrows2 = len(fp.root.cached.table) if (include_cached and 'cached' in fp.root) else 0 nrows = nrows1 + nrows2 cached = np.zeros(nrows, dtype=np.bool) # _CACHED cached[nrows1:] = True rowidx = np.arange(0, nrows, dtype=np.uint64) # _ROWIDX rowid = self.pix.id_for_cell_i(cell_id, rowidx) # _ROWID pcols = ColGroup([('_CACHED', cached), ('_ROWIDX', rowidx), ('_ROWID', rowid)]) return pcols def _is_pseudotablet(self, cgroup): """ Test whether a given cgroup is a pseudotablet. 
    def _is_pseudotablet(self, cgroup):
        """ Test whether a given cgroup is a pseudotablet.

            The current implementation checks if the name begins with an
            underscore.
        """
        return cgroup[0] == '_'

    class CellProxy:
        """ Helper for Table.lock_cell() """
        table   = None
        cell_id = None
        mode    = None

        def __init__(self, table, cell_id, mode):
            self.table   = table
            self.cell_id = cell_id
            self.mode    = mode

        @contextmanager
        def open(self, cgroup=None):
            """ Open the requested tablet within a locked cell. """
            if cgroup is None:
                cgroup = self.table.primary_cgroup

            fp = self.table._open_tablet(self.cell_id, mode=self.mode, cgroup=cgroup)

            yield fp

            logger.debug("Closing tablet (%s)" % (fp.filename))
            fp.close()

    @contextmanager
    def lock_cell(self, cell_id, mode='r', timeout=None):
        """ Open and return a proxy object for the given cell, that allows
            one to safely open individual tablets stored there.

            If mode is not 'r', the entire cell will be locked for the
            duration of this context manager, and automatically unlocked
            upon exit.
        """
        lock = None if mode == 'r' else self._lock_cell(cell_id, timeout=timeout)

        try:
            yield Table.CellProxy(self, cell_id, mode=mode)
        finally:
            if lock is not None:
                self._unlock_cell(lock)

    def get_spatial_keys(self):
        """ Names of the spatial keys, or (None, None) if they don't exist. """
        # Find out which columns are our spatial keys
        return (self.spatial_keys[0].name, self.spatial_keys[1].name) if self.spatial_keys is not None else (None, None)

    def get_primary_key(self):
        """ Returns the name of the primary key. """
        return self.primary_key.name

    def get_temporal_key(self):
        """ Returns the name of the temporal key, or None if it's not defined. """
        return self.temporal_key.name if self.temporal_key is not None else None
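    # Example (hedged sketch): reading a tablet through the locking proxy,
    # mirroring the pattern used by drop_row_group() above. The cgroup name
    # 'astrometry' is illustrative.
    #
    #   with table.lock_cell(cell_id, mode='r+') as cell:
    #       with cell.open('astrometry') as fp:
    #           nrows = len(fp.root.main.table)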