Package com.cloudera.flume.handlers.batch

Source Code of com.cloudera.flume.handlers.batch.GunzipDecorator

/**
* Licensed to Cloudera, Inc. under one
* or more contributor license agreements.  See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership.  Cloudera, Inc. licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License.  You may obtain a copy of the License at
*
*     http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.cloudera.flume.handlers.batch;

import java.io.ByteArrayInputStream;
import java.io.DataInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.util.concurrent.atomic.AtomicLong;
import java.util.zip.GZIPInputStream;

import com.cloudera.flume.conf.Context;
import com.cloudera.flume.conf.SinkFactory.SinkDecoBuilder;
import com.cloudera.flume.core.Event;
import com.cloudera.flume.core.EventSink;
import com.cloudera.flume.core.EventSinkDecorator;
import com.cloudera.flume.handlers.hdfs.WriteableEvent;
import com.cloudera.flume.reporter.ReportEvent;
import com.google.common.base.Preconditions;

/**
* This gunzip's any event that is gzip'ed, otherwise events just pass through.
*/
public class GunzipDecorator<S extends EventSink> extends EventSinkDecorator<S> {

  public static final String R_PASSTHROUGH = "passthroughCount";
  public static final String R_GZIPCOUNT = "gzippedCount";
  public static final String R_GZIPSIZE = "gzippedSize";
  public static final String R_GUNZIPSIZE = "gunzippedSize";

  AtomicLong passthrough = new AtomicLong(0);
  AtomicLong gzipCnt = new AtomicLong(0);
  AtomicLong gzipSize = new AtomicLong(0);
  AtomicLong gunzipSize = new AtomicLong(0);

  public GunzipDecorator(S s) {
    super(s);
  }

  public final static String GZDOC = "compressGzip";

  public static boolean isGzEven(Event e) {
    return e.get(GZDOC) != null;
  }

  /**
   * This is a terrible hack to expose the number bytes that the compressed
   * input stream got decompressed to.
   */
  static class GZIPInputStreamExposeSize extends GZIPInputStream {
    GZIPInputStreamExposeSize(InputStream in) throws IOException {
      super(in);
    }

    long getDecompressSize() {
      // inf is protected by GZIPInputStream
      return inf.getBytesWritten();
    }
  }

  @Override
  public void append(Event e) throws IOException, InterruptedException {

    byte[] bs = e.get(GZDOC);
    if (bs == null) {
      super.append(e);
      passthrough.incrementAndGet();
      return;
    }

    gzipCnt.incrementAndGet();
    gzipSize.addAndGet(bs.length);
    ByteArrayInputStream bais = new ByteArrayInputStream(bs);
    GZIPInputStreamExposeSize gzis = new GZIPInputStreamExposeSize(bais);
    DataInputStream dis = new DataInputStream(gzis);

    WriteableEvent out = new WriteableEvent();
    out.readFields(dis);
    long gunSz = gzis.getDecompressSize(); // must be done before closed.
    dis.close();
    super.append(out);
    gunzipSize.addAndGet(gunSz);
  }

  @Override
  public ReportEvent getMetrics() {
    ReportEvent rpt = super.getMetrics();
    rpt.setLongMetric(R_PASSTHROUGH, passthrough.get());
    rpt.setLongMetric(R_GZIPCOUNT, gzipCnt.get());
    rpt.setLongMetric(R_GZIPSIZE, gzipSize.get());
    rpt.setLongMetric(R_GUNZIPSIZE, gunzipSize.get());
    return rpt;
  }

  public static SinkDecoBuilder builder() {
    return new SinkDecoBuilder() {
      @Override
      public EventSinkDecorator<EventSink> build(Context context,
          String... argv) {
        Preconditions.checkArgument(argv.length == 0, "usage: gunzip");
        return new GunzipDecorator<EventSink>(null);
      }
    };
  }
}
TOP

Related Classes of com.cloudera.flume.handlers.batch.GunzipDecorator

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by ORACLE Inc. Contact coftware#gmail.com.