Package org.apache.giraph.partition

Source Code of org.apache.giraph.partition.ByteArrayPartition$RepresentativeVertexIterator

/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements.  See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership.  The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License.  You may obtain a copy of the License at
*
*     http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.giraph.partition;

import org.apache.giraph.graph.Vertex;
import org.apache.giraph.utils.UnsafeByteArrayInputStream;
import org.apache.giraph.utils.WritableUtils;
import org.apache.hadoop.io.Writable;
import org.apache.hadoop.io.WritableComparable;
import org.apache.hadoop.util.Progressable;

import com.google.common.collect.MapMaker;
import com.google.common.primitives.Ints;

import java.io.DataInput;
import java.io.DataOutput;
import java.io.IOException;
import java.util.Iterator;
import java.util.Map;
import java.util.concurrent.ConcurrentMap;

/**
* Byte array based partition.  Should reduce the amount of memory used since
* the entire graph is compressed into byte arrays.  Must guarantee, however,
* that only one thread at a time will call getVertex since it is a singleton.
*
* @param <I> Vertex index value
* @param <V> Vertex value
* @param <E> Edge value
* @param <M> Message data
*/
public class ByteArrayPartition<I extends WritableComparable,
    V extends Writable, E extends Writable, M extends Writable>
    extends BasicPartition<I, V, E, M>
    implements ReusesObjectsPartition<I, V, E, M> {
  /**
   * Vertex map for this range (keyed by index).  Note that the byte[] is a
   * serialized vertex with the first four bytes as the length of the vertex
   * to read.
   */
  private ConcurrentMap<I, byte[]> vertexMap;
  /** Representative vertex */
  private Vertex<I, V, E, M> representativeVertex;
  /** Use unsafe serialization */
  private boolean useUnsafeSerialization;

  /**
   * Constructor for reflection.
   */
  public ByteArrayPartition() { }

  @Override
  public void initialize(int partitionId, Progressable progressable) {
    super.initialize(partitionId, progressable);
    vertexMap = new MapMaker().concurrencyLevel(
        getConf().getNettyServerExecutionConcurrency()).makeMap();
    representativeVertex = getConf().createVertex();
    representativeVertex.initialize(
        getConf().createVertexId(),
        getConf().createVertexValue(),
        getConf().createOutEdges());
    useUnsafeSerialization = getConf().useUnsafeSerialization();
  }

  @Override
  public Vertex<I, V, E, M> getVertex(I vertexIndex) {
    byte[] vertexData = vertexMap.get(vertexIndex);
    if (vertexData == null) {
      return null;
    }
    WritableUtils.reinitializeVertexFromByteArray(
        vertexData, representativeVertex, useUnsafeSerialization, getConf());
    return representativeVertex;
  }

  @Override
  public Vertex<I, V, E, M> putVertex(Vertex<I, V, E, M> vertex) {
    byte[] vertexData =
        WritableUtils.writeVertexToByteArray(
            vertex, useUnsafeSerialization, getConf());
    byte[] oldVertexBytes = vertexMap.put(vertex.getId(), vertexData);
    if (oldVertexBytes == null) {
      return null;
    } else {
      WritableUtils.reinitializeVertexFromByteArray(oldVertexBytes,
          representativeVertex, useUnsafeSerialization, getConf());
      return representativeVertex;
    }
  }

  @Override
  public Vertex<I, V, E, M> removeVertex(I vertexIndex) {
    byte[] vertexBytes = vertexMap.remove(vertexIndex);
    if (vertexBytes == null) {
      return null;
    }
    WritableUtils.reinitializeVertexFromByteArray(vertexBytes,
        representativeVertex, useUnsafeSerialization, getConf());
    return representativeVertex;
  }

  @Override
  public void addPartition(Partition<I, V, E, M> partition) {
    // Only work with other ByteArrayPartition instances
    if (!(partition instanceof ByteArrayPartition)) {
      throw new IllegalStateException("addPartition: Cannot add partition " +
          "of type " + partition.getClass());
    }

    ByteArrayPartition<I, V, E, M> byteArrayPartition =
        (ByteArrayPartition<I, V, E, M>) partition;
    for (Map.Entry<I, byte[]> entry :
        byteArrayPartition.vertexMap.entrySet()) {
      vertexMap.put(entry.getKey(), entry.getValue());
    }
  }

  @Override
  public long getVertexCount() {
    return vertexMap.size();
  }

  @Override
  public long getEdgeCount() {
    long edges = 0;
    for (byte[] vertexBytes : vertexMap.values()) {
      WritableUtils.reinitializeVertexFromByteArray(vertexBytes,
          representativeVertex, useUnsafeSerialization, getConf());
      edges += representativeVertex.getNumEdges();
    }
    return edges;
  }

  @Override
  public void saveVertex(Vertex<I, V, E, M> vertex) {
    // Reuse the old buffer whenever possible
    byte[] oldVertexData = vertexMap.get(vertex.getId());
    if (oldVertexData != null) {
      vertexMap.put(vertex.getId(),
          WritableUtils.writeVertexToByteArray(
              vertex, oldVertexData, useUnsafeSerialization, getConf()));
    } else {
      vertexMap.put(vertex.getId(),
          WritableUtils.writeVertexToByteArray(
              vertex, useUnsafeSerialization, getConf()));
    }
  }

  @Override
  public void write(DataOutput output) throws IOException {
    super.write(output);
    output.writeInt(vertexMap.size());
    for (Map.Entry<I, byte[]> entry : vertexMap.entrySet()) {
      progress();
      entry.getKey().write(output);
      // Note here that we are writing the size of the vertex data first
      // as it is encoded in the first four bytes of the byte[]
      int vertexDataSize;
      if (useUnsafeSerialization) {
        vertexDataSize = UnsafeByteArrayInputStream.getInt(entry.getValue(),
            0);
      } else {
        vertexDataSize = Ints.fromByteArray(entry.getValue());
      }

      output.writeInt(vertexDataSize);
      output.write(entry.getValue(), 0, vertexDataSize);
    }
  }

  @Override
  public void readFields(DataInput input) throws IOException {
    super.readFields(input);
    int size = input.readInt();
    vertexMap = new MapMaker().concurrencyLevel(
        getConf().getNettyServerExecutionConcurrency()).initialCapacity(
        size).makeMap();
    representativeVertex = getConf().createVertex();
    representativeVertex.initialize(
        getConf().createVertexId(),
        getConf().createVertexValue(),
        getConf().createOutEdges());
    useUnsafeSerialization = getConf().useUnsafeSerialization();
    for (int i = 0; i < size; ++i) {
      progress();
      I vertexId = getConf().createVertexId();
      vertexId.readFields(input);
      int vertexDataSize = input.readInt();
      byte[] vertexData = new byte[vertexDataSize];
      input.readFully(vertexData);
      if (vertexMap.put(vertexId, vertexData) != null) {
        throw new IllegalStateException("readFields: Already saw vertex " +
            vertexId);
      }
    }
  }

  @Override
  public Iterator<Vertex<I, V, E, M>> iterator() {
    return new RepresentativeVertexIterator();
  }

  /**
   * Iterator that deserializes a vertex from a byte array on the fly, using
   * the same representative vertex object.
   */
  private class RepresentativeVertexIterator implements
      Iterator<Vertex<I, V, E, M>> {
    /** Iterator to the vertex values */
    private Iterator<byte[]> vertexDataIterator =
        vertexMap.values().iterator();

    @Override
    public boolean hasNext() {
      return vertexDataIterator.hasNext();
    }

    @Override
    public Vertex<I, V, E, M> next() {
      WritableUtils.reinitializeVertexFromByteArray(
          vertexDataIterator.next(), representativeVertex,
          useUnsafeSerialization, getConf());
      return representativeVertex;
    }

    @Override
    public void remove() {
      throw new IllegalAccessError("remove: This method is not supported.");
    }
  }
}
TOP

Related Classes of org.apache.giraph.partition.ByteArrayPartition$RepresentativeVertexIterator

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.