Package org.kiji.schema.impl.cassandra

Source Code of org.kiji.schema.impl.cassandra.CassandraTableKeyValueDatabase

/**
* (c) Copyright 2014 WibiData, Inc.
*
* See the NOTICE file distributed with this work for additional
* information regarding copyright ownership.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
*     http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

package org.kiji.schema.impl.cassandra;

import java.io.IOException;
import java.nio.ByteBuffer;
import java.util.Date;
import java.util.HashSet;
import java.util.List;
import java.util.NavigableMap;
import java.util.Set;

import com.datastax.driver.core.PreparedStatement;
import com.datastax.driver.core.ResultSet;
import com.datastax.driver.core.Row;
import com.google.common.base.Preconditions;
import com.google.common.collect.Lists;
import com.google.common.collect.Maps;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import org.kiji.annotations.ApiAudience;
import org.kiji.commons.ByteUtils;
import org.kiji.schema.KijiTableKeyValueDatabase;
import org.kiji.schema.KijiURI;
import org.kiji.schema.avro.KeyValueBackup;
import org.kiji.schema.avro.KeyValueBackupEntry;
import org.kiji.schema.cassandra.CassandraTableName;

/**
* Manages key-value pairs on a per table basis. Storage of these key-value pairs is provided by
* a column family of an HTable.
*/
@ApiAudience.Private
public class CassandraTableKeyValueDatabase
    implements KijiTableKeyValueDatabase<CassandraTableKeyValueDatabase> {

  public static final Logger LOG = LoggerFactory.getLogger(CassandraTableKeyValueDatabase.class);

  // Hard-code the names of the various columns in the underlying Cassandra table.
  public static final String KV_COLUMN_TABLE = "table_name";
  public static final String KV_COLUMN_KEY = "key";
  // Avoid conflicts with any Cassandra CQL reserved words.
  // We should be okay because we are using quotes around column names, but let's be extra-safe!
  public static final String KV_COLUMN_VALUE = "myval";
  public static final String KV_COLUMN_TIME = "mytime";

  /**  The HBase table that stores Kiji metadata. */
  private final CassandraTableName mTable;

  /** Cassandra cluster connection. */
  private final CassandraAdmin mAdmin;

  private final PreparedStatement mPutValueStatement;
  private final PreparedStatement mKeySetStatement;
  private final PreparedStatement mRestoreKeyValuesFromBackupStatement;
  private final PreparedStatement mGetRowsStatement;
  private final PreparedStatement mRemoveValuesStatement;

  /**
   * Prepare statement to reuse many times.
   *
   * TODO (SCHEMA-748): Don't need statement preparation after adding statement cache.
   *
   * @return the prepared statement.
   */
  private PreparedStatement getPutValueStatement() {
    final String queryText = String.format(
        "INSERT INTO %s (%s, %s, %s, %s) VALUES (?, ?, ?, ?)",
        mTable,
        KV_COLUMN_TABLE,
        KV_COLUMN_KEY,
        KV_COLUMN_TIME,
        KV_COLUMN_VALUE);
    return mAdmin.getPreparedStatement(queryText);
  }

  /**
   * Prepare statement to reuse many times.
   *
   * TODO (SCHEMA-748): Don't need statement preparation after adding statement cache.
   *
   * @return the prepared statement.
   */
  private PreparedStatement getKeySetStatement() {
    final String queryText =
        String.format("SELECT %s FROM %s WHERE %s=?", KV_COLUMN_KEY, mTable, KV_COLUMN_TABLE);
    return mAdmin.getPreparedStatement(queryText);
  }

  /**
   * Prepare statement to reuse many times.
   *
   * TODO (SCHEMA-748): Don't need statement preparation after adding statement cache.
   *
   * @return the prepared statement.
   */
  private PreparedStatement getRestoreKeyValuesFromBackupStatement() {
    // TODO: Make this query a member of the class and prepare in the constructor
    final String queryText = String.format(
        "INSERT INTO %s (%s, %s, %s, %s) VALUES (?, ?, ?, ?)",
        mTable,
        KV_COLUMN_TABLE,
        KV_COLUMN_KEY,
        KV_COLUMN_TIME,
        KV_COLUMN_VALUE);
    return mAdmin.getPreparedStatement(queryText);
  }

  /**
   * Prepare statement to reuse many times.
   *
   * TODO (SCHEMA-748): Don't need statement preparation after adding statement cache.
   *
   * @return the prepared statement.
   */
  private PreparedStatement getGetRowsStatement() {
    final String queryText = String.format(
        "SELECT * FROM %s WHERE %s=? AND %s=? LIMIT ?",
        mTable,
        KV_COLUMN_TABLE,
        KV_COLUMN_KEY);
    return mAdmin.getPreparedStatement(queryText);
  }

  /**
   * Prepare statement to reuse many times.
   *
   * TODO (SCHEMA-748): Don't need statement preparation after adding statement cache.
   *
   * @return the prepared statement.
   */
  private PreparedStatement getRemoveValuesStatement() {
    String queryText = String.format(
        "DELETE FROM %s WHERE %s=? AND %s=?",
        mTable,
        KV_COLUMN_TABLE,
        KV_COLUMN_KEY);
    return mAdmin.getPreparedStatement(queryText);
  }

  /**
  * This class manages the storage and retrieval of key-value pairs on a per table basis. It is
  * backed by a C* table.
  *
  * @param admin Cassandra cluster connection.
  * @param instanceURI of Kiji instance.
  */
  public CassandraTableKeyValueDatabase(KijiURI instanceURI, CassandraAdmin admin) {
    mAdmin = Preconditions.checkNotNull(admin);
    mTable = CassandraTableName.getMetaKeyValueTableName(instanceURI);

    mPutValueStatement = getPutValueStatement();
    mKeySetStatement = getKeySetStatement();
    mRestoreKeyValuesFromBackupStatement = getRestoreKeyValuesFromBackupStatement();
    mGetRowsStatement = getGetRowsStatement();
    mRemoveValuesStatement = getRemoveValuesStatement();
  }

  /**
   * Install a table for user-defined key-value pairs.
   * @param admin A wrapper around an open C* session.
   * @param uri The KijiURI of the instance for this table.
   */
  public static void install(CassandraAdmin admin, KijiURI uri) {
    CassandraTableName tableName = CassandraTableName.getMetaKeyValueTableName(uri);

    // Standard C* table layout.  Use text key + timestamp as composite primary key to allow
    // selection by timestamp.
    String tableDescription = String.format(
        "CREATE TABLE %s (%s text, %s text, %s timestamp, %s blob, PRIMARY KEY (%s, %s, %s)) "
            + "WITH CLUSTERING ORDER BY (%s ASC, %s DESC);",
        tableName,
        KV_COLUMN_TABLE,
        KV_COLUMN_KEY,
        KV_COLUMN_TIME,
        KV_COLUMN_VALUE,
        KV_COLUMN_TABLE,
        KV_COLUMN_KEY,
        KV_COLUMN_TIME,
        KV_COLUMN_KEY,
        KV_COLUMN_TIME);
    admin.createTable(tableName, tableDescription);

    // Create secondary index for time.  Should be acceptable given that these key-value databases
    // should not get that large.
    //String queryText = String.format("CREATE INDEX ON %s (%s);", tableName, KV_COLUMN_TIME);
    //admin.getSession().execute(queryText);

  }

  /** {@inheritDoc} */
  @Override
  public byte[] getValue(String table, String key) throws IOException {
   final List<byte[]> values = getValues(table, key, 1);
   return values.get(0);
  }


  /**
   * Internal helper method containing common code for ready values for a given key from the table.
   * @param table Name of the table for which to fetch the values
   *              (part of the key-value database key).
   * @param key Name of the key for the KV store for the given table
   *            (part of the key-value database key).
   * @param numVersions Number of versions to fetch for the given table, key combination.
   * @return A list of C* rows for the query.
   */
  private List<Row> getRows(String table, String key, int numVersions) {
    Preconditions.checkArgument(numVersions >= 1"numVersions must be positive");
    ResultSet resultSet = mAdmin.execute(mGetRowsStatement.bind(table, key, numVersions));
    return resultSet.all();
  }

  /** {@inheritDoc} */
  @Override
  public List<byte[]> getValues(String table, String key, int numVersions) throws IOException {
    final List<Row> rows = getRows(table, key, numVersions);
    if (rows.isEmpty()) {
      throw new IOException(String.format(
          "Could not find any values associated with table %s and key %s", table, key));
    }

    // Convert result into a list of bytes
    final List<byte[]> values = Lists.newArrayList();
    for (Row row: rows) {
      final ByteBuffer blob = row.getBytes(KV_COLUMN_VALUE);
      values.add(ByteUtils.toBytes(blob));
    }
    return values;
  }

  /** {@inheritDoc} */
  @Override
  public NavigableMap<Long, byte[]> getTimedValues(String table, String key, int numVersions)
      throws IOException {
    List<Row> rows = getRows(table, key, numVersions);
    if (0 == rows.size()) {
      throw new IOException(String.format(
          "Could not find any values associated with table %s and key %s", table, key));
    }

    // Convert result into a map from timestamps to values
    final NavigableMap<Long, byte[]> timedValues = Maps.newTreeMap();
    for (Row row: rows) {
      ByteBuffer blob = row.getBytes(KV_COLUMN_VALUE);
      final byte[] bytes = ByteUtils.toBytes(blob);
      Long timestamp = row.getDate(KV_COLUMN_TIME).getTime();
      Preconditions.checkState(timedValues.put(timestamp, bytes) == null);
    }
    return timedValues;
  }

  /** {@inheritDoc} */
  @Override
  public CassandraTableKeyValueDatabase putValue(String table, String key, byte[] value)
      throws IOException {
    Preconditions.checkNotNull(mPutValueStatement);
    ByteBuffer valAsByteBuffer = ByteBuffer.wrap(value);
    // TODO: Check for success?
    mAdmin.execute(mPutValueStatement.bind(table, key, new Date(), valAsByteBuffer));
    return this;
  }

  /** {@inheritDoc} */
  @Override
  public void removeValues(String table, String key) throws IOException {
    // TODO: Check for success?
    mAdmin.execute(mRemoveValuesStatement.bind(table, key));
  }

  /** {@inheritDoc} */
  @Override
  public Set<String> keySet(String table) throws IOException {
    // Just return a set of in-use keys
    final ResultSet resultSet = mAdmin.execute(mKeySetStatement.bind(table));

    final Set<String> keys = new HashSet<String>();
    for (Row row: resultSet.all()) {
      keys.add(row.getString(KV_COLUMN_KEY));
    }
    return keys;
}

  /** {@inheritDoc} */
  @Override
  public Set<String> tableSet() throws IOException {
    // Just return a set of in-use tables
    final String queryText = String.format("SELECT %s FROM %s", KV_COLUMN_TABLE, mTable);
    final ResultSet resultSet = mAdmin.execute(queryText);

    final Set<String> keys = new HashSet<String>();
    for (Row row: resultSet.all()) {
      final String tableName = row.getString(KV_COLUMN_TABLE);
      keys.add(tableName);
    }
    return keys;
  }

/** {@inheritDoc} */
@Override
public void removeAllValues(String table) throws IOException {
   final Set<String> keysToRemove = keySet(table);
   LOG.info("Removing all values for table {}, keys = {}.", table, keysToRemove);
   for (String key : keysToRemove) {
     removeValues(table, key);
   }
}

/** {@inheritDoc} */
@Override
public KeyValueBackup keyValuesToBackup(String table) throws IOException {
   final List<KeyValueBackupEntry> kvBackupEntries = Lists.newArrayList();
   final Set<String> keys = keySet(table);
   for (String key : keys) {
     NavigableMap<Long, byte[]> versionedValues = getTimedValues(table, key, Integer.MAX_VALUE);
     for (Long timestamp : versionedValues.descendingKeySet()) {
       kvBackupEntries.add(KeyValueBackupEntry.newBuilder()
           .setKey(key)
           .setValue(ByteBuffer.wrap(versionedValues.get(timestamp)))
           .setTimestamp(timestamp)
           .build());
     }
   }
   return KeyValueBackup.newBuilder().setKeyValues(kvBackupEntries).build();
}

/** {@inheritDoc} */
@Override
public void restoreKeyValuesFromBackup(final String tableName, KeyValueBackup keyValueBackup)
     throws IOException {
   LOG.debug("Restoring '{}' key-value(s) from backup for table '{}'.",
       keyValueBackup.getKeyValues().size(), tableName);

   for (KeyValueBackupEntry kvRecord : keyValueBackup.getKeyValues()) {
     final String key = kvRecord.getKey();
     final ByteBuffer valAsByteBuffer = kvRecord.getValue(); // Read in ByteBuffer of values
     final long timestamp = kvRecord.getTimestamp();

     LOG.debug("For the table '{}' we are writing key '{}', timestamp '{}', "
             + "and value '{}' to the metatable named '{}'.",
         tableName,
         key,
         timestamp,
         valAsByteBuffer.toString(),
         mTable);

     mAdmin.execute(
         mRestoreKeyValuesFromBackupStatement
             .bind(tableName, key, new Date(timestamp), valAsByteBuffer));
   }
   LOG.debug("Flushing commits to restore key-values from backup.");
   // TODO: Any flush needed?
   //mTable.flushCommits();
}
}
TOP

Related Classes of org.kiji.schema.impl.cassandra.CassandraTableKeyValueDatabase

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.