Package org.apache.mahout.utils.vectors.io

Source Code of org.apache.mahout.utils.vectors.io.DelimitedTermInfoWriter

/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements.  See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License.  You may obtain a copy of the License at
*
*     http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

package org.apache.mahout.utils.vectors.io;

import java.io.IOException;
import java.io.Writer;
import java.util.Iterator;

import com.google.common.io.Closeables;
import org.apache.mahout.utils.vectors.TermEntry;
import org.apache.mahout.utils.vectors.TermInfo;

/**
* Write {@link TermInfo} to a {@link Writer} in a textual, delimited format with header.
*/
public class DelimitedTermInfoWriter implements TermInfoWriter {
 
  private final Writer writer;
  private final String delimiter;
  private final String field;
 
  public DelimitedTermInfoWriter(Writer writer, String delimiter, String field) {
    this.writer = writer;
    this.delimiter = delimiter;
    this.field = field;
  }
 
  @Override
  public void write(TermInfo ti) throws IOException {
   
    Iterator<TermEntry> entIter = ti.getAllEntries();
    try {
      writer.write(String.valueOf(ti.totalTerms(field)));
      writer.write('\n');
      writer.write("#term" + delimiter + "doc freq" + delimiter + "idx");
      writer.write('\n');
      while (entIter.hasNext()) {
        TermEntry entry = entIter.next();
        writer.write(entry.getTerm());
        writer.write(delimiter);
        writer.write(String.valueOf(entry.getDocFreq()));
        writer.write(delimiter);
        writer.write(String.valueOf(entry.getTermIdx()));
        writer.write('\n');
      }
    } finally {
      Closeables.close(writer, false);
    }
  }
 
  /**
   * Does NOT close the underlying writer
   */
  @Override
  public void close() {

  }
}
TOP

Related Classes of org.apache.mahout.utils.vectors.io.DelimitedTermInfoWriter

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.