Package proj.zoie.impl.indexing

Source Code of proj.zoie.impl.indexing.FileIndexableInterpreter

package proj.zoie.impl.indexing;

/**
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements.  See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License.  You may obtain a copy of the License at
*
*     http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
import java.io.BufferedReader;
import java.io.File;
import java.io.FileReader;
import java.io.IOException;

import org.apache.log4j.Logger;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field.Store;
import org.apache.lucene.document.StringField;
import org.apache.lucene.document.TextField;

import proj.zoie.api.indexing.AbstractZoieIndexable;
import proj.zoie.api.indexing.ZoieIndexable;
import proj.zoie.api.indexing.ZoieIndexableInterpreter;

public class FileIndexableInterpreter implements ZoieIndexableInterpreter<File> {
  protected static int id = 0;
  private static final Logger log = Logger.getLogger(FileIndexableInterpreter.class);
  static ThreadLocal<StringBuilder> myStringBuilder = new ThreadLocal<StringBuilder>();
  static ThreadLocal<char[]> myCharBuffer = new ThreadLocal<char[]>();

  protected static class FileIndexable extends AbstractZoieIndexable {
    private final File _file;
    private final int _uid;

    private FileIndexable(File file, int uid) {
      _file = file;
      _uid = uid;
    }

    @Override
    public IndexingReq[] buildIndexingReqs() {
      IndexingReq req = new IndexingReq(buildDocument(), null);
      return new IndexingReq[] { req };
    }

    public Document buildDocument() {
      Document doc = new Document();
      doc.add(new StringField("foo", "bar", Store.NO));
      StringBuilder sb = myStringBuilder.get();
      char[] cb = myCharBuffer.get();
      if (sb == null || cb == null) {
        sb = new StringBuilder(15500);
        sb.ensureCapacity(15500);
        myStringBuilder.set(sb);
        cb = new char[15500];
        myCharBuffer.set(cb);
      }
      sb.append(_file.getAbsoluteFile()).append("\n");
      doc.add(new TextField("path", _file.getAbsolutePath(), Store.YES));
      FileReader freader = null;
      try {
        freader = new FileReader(_file);
        BufferedReader br = new BufferedReader(freader);
        int len = br.read(cb, 0, cb.length);
        int start = 0;
        int end = 0;
        while (end < len) {
          if (cb[end] == '\n' || cb[end] == '\r') {
            sb.append(cb, start, end - start).append('\n');
            start = end;
            while (start < len && (cb[start] == '\n' || cb[start] == '\r')) {
              start++;
            }
            end = start;
          }
          end++;
        }
      } catch (Exception e) {
        log.error(e);
      } finally {
        if (freader != null) {
          try {
            freader.close();
          } catch (IOException e) {
            log.error(e);
          }
        }
      }
      doc.add(new TextField("content", sb.toString(), Store.YES));
      sb.setLength(0);
      return doc;
    }

    @Override
    public boolean isSkip() {
      return false;
    }

    @Override
    public boolean isDeleted() {
      return false;
    }

    @Override
    public long getUID() {
      return _uid;
    }
  }

  @Override
  public ZoieIndexable convertAndInterpret(File src) {
    ZoieIndexable idxable = new FileIndexable(src, id);
    id++;
    return idxable;
  }
}
TOP

Related Classes of proj.zoie.impl.indexing.FileIndexableInterpreter

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.