Package com.cloudera.cdk.data.hbase.impl

Source Code of com.cloudera.cdk.data.hbase.impl.EntitySchema

/**
* Copyright 2013 Cloudera Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.cloudera.cdk.data.hbase.impl;

import com.cloudera.cdk.data.SchemaValidationException;
import java.io.UnsupportedEncodingException;
import java.util.Arrays;
import java.util.Collection;
import java.util.HashMap;
import java.util.HashSet;
import java.util.Map;
import java.util.Set;

/**
* An EntitySchema is the parsed schema that contains the properties of an HBase
* Common entity schema.
*/
public class EntitySchema {

  private final Collection<String> tables;
  private final Map<String, FieldMapping> fieldMappings = new HashMap<String, FieldMapping>();
  private final String rawSchema;
  private final String name;

  /**
   * Constructs the EntitySchema
   *
   * @param tables
   *          The tables this EntitySchema can be persisted to
   * @param name
   *          The name of the entity schema
   * @param rawSchema
   *          The raw schema type that underlies the EntitySchema implementation
   * @param fieldMappings
   *          The list of FieldMappings that specify how each field maps to an
   *          HBase row
   */
  public EntitySchema(Collection<String> tables, String name, String rawSchema,
      Collection<FieldMapping> fieldMappings) {
    this.tables = tables;
    this.name = name;
    this.rawSchema = rawSchema;
    validateFieldMappings(fieldMappings);
    for (FieldMapping fieldMapping : fieldMappings) {
      this.fieldMappings.put(fieldMapping.getFieldName(), fieldMapping);
    }
  }

  /**
   * Get the tables this EntitySchema can be persisted to.
   *
   * @return The list of tables.
   */
  public Collection<String> getTables() {
    return tables;
  }

  /**
   * Get the name of this EntitySchema
   *
   * @return The name
   */
  public String getName() {
    return name;
  }

  /**
   * Get the FieldMapping for the specified fieldName. Returns null if one
   * doesn't exist.
   *
   * @param fieldName
   *          The field name to get the FieldMapping for
   * @return The FieldMapping, or null if one doesn't exist fo rthe fieldName.
   */
  public FieldMapping getFieldMapping(String fieldName) {
    return fieldMappings.get(fieldName);
  }

  /**
   * Get the FieldMappings for this schema.
   *
   * @return The collection of FieldMappings
   */
  public Collection<FieldMapping> getFieldMappings() {
    return fieldMappings.values();
  }

  /**
   * Get the raw schema that was parsed to create this schema.
   *
   * @return The raw scheam.
   */
  public String getRawSchema() {
    return rawSchema;
  }

  /**
   * Get the HBase columns required by this schema.
   *
   * @return The set of columns
   */
  public Set<String> getRequiredColumns() {
    Set<String> set = new HashSet<String>();
    for (FieldMapping fieldMapping : fieldMappings.values()) {
      if (MappingType.COLUMN == fieldMapping.getMappingType()
          || MappingType.COUNTER == fieldMapping.getMappingType()) {
        set.add(fieldMapping.getMappingValue());
      } else if (MappingType.KEY_AS_COLUMN == fieldMapping.getMappingType()) {
        String family = fieldMapping.getMappingValue().split(":", 1)[0];
        family = family + ":";
        set.add(family);
      } else if (MappingType.OCC_VERSION == fieldMapping.getMappingType()) {
        set.add(new String(Constants.SYS_COL_FAMILY) + ":"
            + new String(Constants.VERSION_CHECK_COL_QUALIFIER));
      }
    }
    return set;
  }

  /**
   * Get the HBase column families required by this schema.
   *
   * @return The set of column families.
   */
  public Set<String> getRequiredColumnFamilies() {
    Set<String> set = new HashSet<String>();
    Set<String> columnSet = getRequiredColumns();
    for (String column : columnSet) {
      set.add(column.split(":")[0]);
    }
    return set;
  }

  /**
   * Method meant to determine if two EntitySchemas are compatible with each
   * other for schema migration purposes. Classes that inherit EntitySchema
   * should override this implementation, since this implemetnation isn't able
   * to make that determination.
   *
   * TODO: Figure out a base set of properties that all entity schema
   * implementations should share in their implementation of determining
   * compatibility and execute that here.
   *
   * @param entitySchema
   *          The other EntitySchema to determine compatible with
   * @return
   */
  public boolean compatible(EntitySchema entitySchema) {
    // throw an exception if anyone calls this directly, as this should be
    // overridden in derived classes.
    throw new UnsupportedOperationException(
        "EntityScheam class can't determine if two entity schemas are compatible.");
  }

  /**
   * Validate that the field mappings provided for this schema are compatible
   * with a valid schema. The rules are:
   *
   * <pre>
   * 1. An entity schema can't contain multiple occVersion mapping fields
   * 2. An entity schema can't contain both an occVersion field and a counter
   *    field.
   * </pre>
   *
   * This method will throw a SchemaValidationException if any of these
   * rules are violated. Otherwise, no exception is thrown.
   *
   * @param fieldMappings The collection of FieldMappings to validate
   */
  private void validateFieldMappings(Collection<FieldMapping> fieldMappings) {
    boolean hasOCCVersion = false;
    boolean hasCounter = false;

    for (FieldMapping fieldMapping : fieldMappings) {
      if (fieldMapping.getMappingType() == MappingType.OCC_VERSION) {
        if (hasOCCVersion) {
          throw new SchemaValidationException(
              "Schema can't contain multiple occVersion fields.");
        }
        if (hasCounter) {
          throw new SchemaValidationException(
              "Schema can't contain both an occVersion field and a counter field.");
        }
        hasOCCVersion = true;
      } else if (fieldMapping.getMappingType() == MappingType.COUNTER) {
        if (hasOCCVersion) {
          throw new SchemaValidationException(
              "Schema can't contain both an occVersion field and a counter field.");
        }
        hasCounter = true;
      }
    }
  }

  /**
   * A field mapping represents a type that specifies how a schema field maps to
   * a column in HBase.
   */
  public static class FieldMapping {

    private final String fieldName;
    private final MappingType mappingType;
    private final String mappingValue;
    private final Object defaultValue;
    private final String prefix;
    private final byte[] family;
    private final byte[] qualifier;

    public FieldMapping(String fieldName, MappingType mappingType,
        String mappingValue, Object defaultValue, String prefix) {
      this.fieldName = fieldName;
      this.mappingType = mappingType;
      this.mappingValue = mappingValue;
      this.defaultValue = defaultValue;
      this.prefix = prefix;
      this.family = getFamilyFromMappingValue(mappingValue);
      this.qualifier = getQualifierFromMappingValue(mappingValue);
    }

    public String getFieldName() {
      return fieldName;
    }

    public MappingType getMappingType() {
      return mappingType;
    }

    public String getMappingValue() {
      return mappingValue;
    }

    public Object getDefaultValue() {
      return defaultValue;
    }

    public String getPrefix() {
      return prefix;
    }

    public byte[] getFamily() {
      return family;
    }

    public byte[] getQualifier() {
      return qualifier;
    }

    private byte[] getFamilyFromMappingValue(String mappingValue) {
      if (mappingType == MappingType.KEY) {
        return null;
      } else if (mappingType == MappingType.OCC_VERSION) {
        return Constants.SYS_COL_FAMILY;
      } else {
        String[] familyQualifier = mappingValue.split(":", 2);
        byte[] family;
        try {
          family = familyQualifier[0].getBytes("UTF-8");
        } catch (UnsupportedEncodingException exc) {
          throw new SchemaValidationException(
              "fieldType Must support UTF-8 encoding", exc);
        }
        return family;
      }
    }

    private byte[] getQualifierFromMappingValue(String mappingValue) {
      if (mappingType == MappingType.KEY) {
        return null;
      } else if (mappingType == MappingType.OCC_VERSION) {
        return Constants.VERSION_CHECK_COL_QUALIFIER;
      } else {
        String[] familyQualifier = mappingValue.split(":", 2);
        byte[] qualifier;
        try {
          qualifier = familyQualifier.length == 1 ? new byte[0]
              : familyQualifier[1].getBytes("UTF-8");
        } catch (UnsupportedEncodingException exc) {
          throw new SchemaValidationException(
              "fieldType Must support UTF-8 encoding", exc);
        }
        return qualifier;
      }
    }

    @Override
    public int hashCode() {
      final int prime = 31;
      int result = 1;
      result = prime * result
          + ((defaultValue == null) ? 0 : defaultValue.hashCode());
      result = prime * result + Arrays.hashCode(family);
      result = prime * result
          + ((fieldName == null) ? 0 : fieldName.hashCode());
      result = prime * result
          + ((mappingType == null) ? 0 : mappingType.hashCode());
      result = prime * result
          + ((mappingValue == null) ? 0 : mappingValue.hashCode());
      result = prime * result + ((prefix == null) ? 0 : prefix.hashCode());
      result = prime * result + Arrays.hashCode(qualifier);
      return result;
    }

    @Override
    public boolean equals(Object obj) {
      if (this == obj)
        return true;
      if (obj == null)
        return false;
      if (getClass() != obj.getClass())
        return false;
      FieldMapping other = (FieldMapping) obj;
      if (defaultValue == null) {
        if (other.defaultValue != null)
          return false;
      } else if (!defaultValue.equals(other.defaultValue))
        return false;
      if (!Arrays.equals(family, other.family))
        return false;
      if (fieldName == null) {
        if (other.fieldName != null)
          return false;
      } else if (!fieldName.equals(other.fieldName))
        return false;
      if (mappingType != other.mappingType)
        return false;
      if (mappingValue == null) {
        if (other.mappingValue != null)
          return false;
      } else if (!mappingValue.equals(other.mappingValue))
        return false;
      if (prefix == null) {
        if (other.prefix != null)
          return false;
      } else if (!prefix.equals(other.prefix))
        return false;
      if (!Arrays.equals(qualifier, other.qualifier))
        return false;
      return true;
    }
  }
}
TOP

Related Classes of com.cloudera.cdk.data.hbase.impl.EntitySchema

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.