Package org.apache.jena.tdbloader4

Source Code of org.apache.jena.tdbloader4.StatsMapper

/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements.  See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership.  The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License.  You may obtain a copy of the License at
*
*     http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

package org.apache.jena.tdbloader4;

import java.io.IOException;

import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.jena.tdbloader4.io.QuadWritable;
import org.openjena.atlas.event.Event;
import org.openjena.atlas.event.EventManager;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import com.hp.hpl.jena.graph.Node;
import com.hp.hpl.jena.sparql.core.Quad;
import com.hp.hpl.jena.vocabulary.RDF;

public class StatsMapper extends Mapper<LongWritable, QuadWritable, Text, IntWritable> {

    private static final Logger log = LoggerFactory.getLogger(StatsMapper.class);

    private Counters counters;
    private Text outputKey = new Text();
    private static final IntWritable one = new IntWritable(1);

    private static final String LABEL_TRIPLE = "t";
    private static final String LABEL_QUAD = "q";

    private static final String LABEL_PROPERTY = "p";
    private static final String LABEL_CLASS = "c";
    private static final String LABEL_NAMESPACE = "n";
   
    private static final String POSTFIX_TOTAL = "t";
    private static final String POSTFIX_PER_GRAPH = "g";
   
    @Override
    protected void setup(Context context) throws IOException, InterruptedException {
      counters = new Counters(context);
    };
   
    @Override
  public void map (LongWritable key, QuadWritable value, Context context) throws IOException, InterruptedException {
        log.debug("< ({}, {})", key, value);

        Quad quad = value.getQuad();
        if ( quad.isTriple() ) {
        EventManager.send(counters, new Event(Constants.eventTriple, null));
        } else {
        EventManager.send(counters, new Event(Constants.eventQuad, null));
        }
        emit (quad, context);

    Node g = quad.getGraph();
    Node p = quad.getPredicate();
    emit (LABEL_PROPERTY, g, p, context);
   
    if ( RDF.type.asNode().equals(p) ) {
      Node o = quad.getObject();
      if ( o.isURI() ) {
        emit (LABEL_CLASS, g, o, context);
      } else {
        // TODO: WARN!
      }
    }
  }

    private void emit(Quad quad, Context context) throws IOException, InterruptedException {
      StringBuffer sb = new StringBuffer();
      String label = quad.isTriple() ? LABEL_TRIPLE : LABEL_QUAD;

      sb.append(label);
      sb.append(POSTFIX_TOTAL);
      emit(sb, context);

      sb = new StringBuffer();
      sb.append(label);
      sb.append(POSTFIX_PER_GRAPH);
    sb.append("|");
    sb.append(quad.getGraph());
    emit(sb, context);
    }
   
    private void emit(String label, Node graph, Node node, Context context) throws IOException, InterruptedException {
    StringBuffer sb = new StringBuffer(label);
    sb.append(POSTFIX_TOTAL);
    sb.append("|");
    sb.append(node.getURI());
    emit(sb, context);
   
    sb = new StringBuffer(label);
    sb.append(POSTFIX_PER_GRAPH);
    sb.append("|");
    sb.append(graph.getURI());
    sb.append("|");
    sb.append(node.getURI());
    emit(sb, context);
   
    sb = new StringBuffer(LABEL_NAMESPACE);
    sb.append(POSTFIX_TOTAL);
    sb.append("|");
    sb.append(node.getNameSpace());
    emit(sb, context);

    sb = new StringBuffer(LABEL_NAMESPACE);
    sb.append(POSTFIX_PER_GRAPH);
    sb.append("|");
    sb.append(graph.getURI());
    sb.append("|");
    sb.append(node.getNameSpace());
    emit(sb, context);
    }
   
    private void emit (StringBuffer sb, Context context) throws IOException, InterruptedException {
    outputKey.set(sb.toString());
    context.write(outputKey, one);
    log.debug("> ({}, {})", outputKey, one);
    outputKey.clear();
    }
   
    @Override
    protected void cleanup(Context context) throws IOException, InterruptedException {
      counters.close();
    }

}
TOP

Related Classes of org.apache.jena.tdbloader4.StatsMapper

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by Oracle Inc. Contact coftware#gmail.com.