Package cc.mallet.types

Examples of cc.mallet.types.Alphabet


  /**
   * Creates a <code>FeatureSequenceConvolution</code> without arguments.
   * Delegates to the two-argument superclass constructor, passing a newly
   * allocated {@link Alphabet} as the first argument and <code>null</code>
   * as the second.
   */
  public FeatureSequenceConvolution() {
    // NOTE(review): presumably the two arguments are the data and target
    // alphabets (null meaning "no target alphabet") -- confirm against the superclass.
    super(new Alphabet(), null);
  }
View Full Code Here


    // Number of synthetic entries placed in the input alphabet below.
    int inputVocabSize = 4;
    int numStates = 5;
    // Path handles only: constructing a java.io.File does not create anything
    // on disk. NOTE(review): presumably used later to serialize the model -- confirm.
    File f = new File("TestObject.obj");
    File f2 = new File("TestObject2.obj");
    Alphabet inputAlphabet = new Alphabet();
    // Look up "feature0" .. "feature3" in the input alphabet.
    // NOTE(review): presumably lookupIndex adds entries that are missing -- confirm.
    for (int i = 0; i < inputVocabSize; i++)
      inputAlphabet.lookupIndex("feature" + i);
    Alphabet outputAlphabet = new Alphabet();
    // NOTE(review): outputAlphabet was assigned from `new` on the previous line,
    // so it cannot be null here and this branch is unreachable.
    if (outputAlphabet == null) {
      System.err.println("Output dictionary null.");
    }
    // The model is a MEMM (the variable is merely named "crf"), built over the
    // input and output alphabets created above.
    MEMM crf = new MEMM(inputAlphabet, outputAlphabet);
View Full Code Here

  /** Private, empty constructor: prevents code outside this class from creating instances. */
  private PipeUtils () {}; // no instances

  public static Pipe concatenatePipes (Pipe p1, Pipe p2)
  {
    Alphabet dataDict = combinedDataDicts (p1, p2);
    Alphabet targetDict = combinedTargetDicts (p1, p2);
    Pipe ret = new SerialPipes (new Pipe[] { p1, p2 });

    if (dataDict != null) ret.dataAlphabetResolved = true;
    if (targetDict != null) ret.targetAlphabetResolved = true;
   
View Full Code Here

        LinkedHashSet<Integer> stateIndices = new LinkedHashSet<Integer>();
        stateIndices.add(labelIndex);
        labelToState.put(labelIndex, stateIndices);
      }
    } else {
      stateAlphabet = new Alphabet();

      labelIter = labelAlphabet.iterator();
      while (labelIter.hasNext()) {
        String label = (String) labelIter.next();
        labelToState.put(labelAlphabet.lookupIndex(label, false),
View Full Code Here

   
   
   
    if (p.isTargetProcessing())
    {
      Alphabet targets = p.getTargetAlphabet();
      StringBuffer buf = new StringBuffer("Labels:");
      for (int i = 0; i < targets.size(); i++)
        buf.append(" ").append(targets.lookupObject(i).toString());
      logger.info(buf.toString());
    }
    if (trainOption.value) {
      if (crf == null) {
        crf = getCRF(trainingData, ordersOption.value, defaultOption.value, forbiddenOption.value, allowedOption.value, true);
View Full Code Here

    }


   
    if (p.isTargetProcessing()) {
      Alphabet targets = p.getTargetAlphabet();
      StringBuffer buf = new StringBuffer("Labels:");
      for (int i = 0; i < targets.size(); i++)
        buf.append(" ").append(targets.lookupObject(i).toString());
      logger.info(buf.toString());
    }

    if (trainOption.value) {
      crf = train(trainingData, testData, eval,
View Full Code Here

    super (dataDict, null);
  }

  /**
   * Creates a <code>TokenSequence2FeatureSequence</code> without arguments.
   * Delegates to the two-argument superclass constructor, passing a newly
   * allocated {@link Alphabet} as the first argument and <code>null</code>
   * as the second.
   */
  public TokenSequence2FeatureSequence ()
  {
    // NOTE(review): presumably the first argument is the data alphabet and the
    // null second argument means "no target alphabet" -- confirm against the superclass.
    super(new Alphabet(), null);
  }
View Full Code Here

    /**
     * Creates a new
     * <code>SimpleTaggerSentence2FeatureVectorSequence</code> instance.
     * Delegates to the two-argument superclass constructor, passing a newly
     * allocated <code>Alphabet</code> as the first argument and a newly
     * allocated <code>LabelAlphabet</code> as the second.
     */
    public SimpleTaggerSentence2FeatureVectorSequence () {
      // NOTE(review): presumably these become the data and target alphabets
      // of this pipe -- confirm against the superclass.
      super (new Alphabet(), new LabelAlphabet());
    }
View Full Code Here

    }

    public Instance pipe (Instance carrier) {

      Object inputData = carrier.getData();
      Alphabet features = getDataAlphabet();
      LabelAlphabet labels;
      LabelSequence target = null;
      String [][] tokens;

      if (inputData instanceof String) {
        tokens = parseSentence((String)inputData);
      }
      else if (inputData instanceof String[][]) {
        tokens = (String[][])inputData;
      }
      else {
        throw new IllegalArgumentException("Not a String or String[][]; got " + inputData);
      }

      FeatureVector[] fvs = new FeatureVector[tokens.length];
      if (isTargetProcessing()) {
        labels = (LabelAlphabet)getTargetAlphabet();
        target = new LabelSequence (labels, tokens.length);
      }

      for (int l = 0; l < tokens.length; l++) {
        int nFeatures;
        if (isTargetProcessing()) {
          if (tokens[l].length < 1) {
            throw new IllegalStateException ("Missing label at line " + l + " instance "+carrier.getName ());
          }
          nFeatures = tokens[l].length - 1;
          target.add(tokens[l][nFeatures]);
        }
        else nFeatures = tokens[l].length;
        ArrayList<Integer> featureIndices = new ArrayList<Integer>();
        for (int f = 0; f < nFeatures; f++) {
          int featureIndex = features.lookupIndex(tokens[l][f]);
          // gdruck
          // If the data alphabet's growth is stopped, featureIndex
          // will be -1.  Ignore these features.
          if (featureIndex >= 0) {
            featureIndices.add(featureIndex);
View Full Code Here

   */
  private void triangulate(final UndirectedGraph mdl)
  {
    UndirectedGraph mdl2 = dupGraph (mdl);
    ArrayList vars = new ArrayList(mdl.vertexSet());
    Alphabet varMap = makeVertexMap(vars);
    cliques = new ArrayList();

    // debug
    if (logger.isLoggable (Level.FINER)) {
      logger.finer ("Triangulating model: "+mdl);
View Full Code Here

TOP

Related Classes of cc.mallet.types.Alphabet

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by Oracle Inc. Contact coftware#gmail.com.