Package cc.mallet.types

Examples of cc.mallet.types.Alphabet


  }


  private Alphabet makeVertexMap(ArrayList vars)
  {
    Alphabet map = new Alphabet (vars.size (), Variable.class);
    map.lookupIndices(vars.toArray(), true);
    return map;
  }
View Full Code Here


                new String[] {"z"},
                new double[] {11},
                new String[] {"2"});

    seq = new ArrayListSequence ();
    Alphabet dict = transducer.getInputAlphabet ();
    seq.add ("a");
    seq.add ("a");
    seq.add ("b");
    seq.add ("c");
    seq.add ("d");
View Full Code Here

  }
 
 
  public void testEstimating ()
  {
    Alphabet dict = new Alphabet ();
    Multinomial.Estimator e = new Multinomial.LaplaceEstimator (dict);
    FeatureSequence fs = new FeatureSequence (dict);
    fs.add (dict.lookupIndex ("a"));
    fs.add (dict.lookupIndex ("n"));
    fs.add (dict.lookupIndex ("d"));
    fs.add (dict.lookupIndex ("r"));
    fs.add (dict.lookupIndex ("e"));
    fs.add (dict.lookupIndex ("w"));
    fs.add (dict.lookupIndex ("m"));
    fs.add (dict.lookupIndex ("c"));
    fs.add (dict.lookupIndex ("c"));
    fs.add (dict.lookupIndex ("a"));
    fs.add (dict.lookupIndex ("l"));
    fs.add (dict.lookupIndex ("l"));
    fs.add (dict.lookupIndex ("u"));
    fs.add (dict.lookupIndex ("m"));
    //System.out.println (fs.toString());
    e.increment (fs);
    assertTrue (e.size() == 10);

    Multinomial m = e.estimate ();
    assertTrue (m.size() == 10);
    assertTrue (m.probability (dict.lookupIndex ("a")) == (2.0+1)/(14.0+10));
    assertTrue (m.probability ("w") == (1.0+1)/(14.0+10));
    Multinomial.Logged ml = new Multinomial.Logged (m);
    assertTrue (m.logProbability ("w") == ml.logProbability ("w"));
  }
View Full Code Here

public class Csv2FeatureVector extends Pipe {

    private static Logger logger = MalletLogger.getLogger(Csv2FeatureVector.class.getName());

    /**
     * Creates the pipe and sets its {@code dataAlphabet} to a new
     * {@link Alphabet} constructed with the given capacity.
     *
     * @param capacity value passed straight to the {@code Alphabet}
     *                 constructor (presumably its initial capacity -- confirm
     *                 against the Alphabet API)
     */
    public Csv2FeatureVector(int capacity) {
        this.dataAlphabet = new Alphabet(capacity);
    }
View Full Code Here

  /**
   * Creates the pipe around a caller-supplied alphabet.
   *
   * <p>Delegates to the superclass constructor with {@code dataDict} as the
   * first argument and {@code null} as the second.
   * NOTE(review): the second argument is presumably the target alphabet --
   * confirm against the superclass constructor.
   *
   * @param dataDict the alphabet handed to the superclass as its first argument
   */
  public FeatureValueString2FeatureVector (Alphabet dataDict) {
    super (dataDict, null);
  }

  /**
   * Creates the pipe with a freshly constructed {@link Alphabet}.
   *
   * <p>Delegates to the superclass constructor with a new {@code Alphabet} as
   * the first argument and {@code null} as the second.
   */
  public FeatureValueString2FeatureVector () {
    super(new Alphabet(), null);
  }
View Full Code Here

  }


  private static Alphabet dictOfSize (int size)
  {
    Alphabet ret = new Alphabet ();
    for (int i = 0; i < size; i++)
      ret.lookupIndex ("feature"+i);
    return ret;
  }
View Full Code Here

  private double testRandomTrainedOn (InstanceList training)
  {
    ClassifierTrainer trainer = new MaxEntTrainer ();

    Alphabet fd = dictOfSize (3);
    String[] classNames = new String[] {"class0", "class1", "class2"};

    Randoms r = new Randoms (1);
    Iterator<Instance> iter = new RandomTokenSequenceIterator (r,  new Dirichlet(fd, 2.0),
          30, 0, 10, 200, classNames);
View Full Code Here

    return new SerialPipes(pipes.subList(start, end));
  }
 
  private void resolveAlphabets ()
  {
    Alphabet da = null, ta = null;
    for (Pipe p : pipes) {
      p.preceedingPipeDataAlphabetNotification(da);
      da = p.getDataAlphabet();
      p.preceedingPipeTargetAlphabetNotification(ta);
      ta = p.getTargetAlphabet();
View Full Code Here

    t.setFeatureValue ("length", 3);
    t.setFeatureValue ("containsVowel", 1);
    t.setFeatureValue ("in /usr/dict/words", 0);

    Alphabet dict = new Alphabet();
    FeatureVector fv = t.toFeatureVector (dict, false);
    assertTrue (fv.numLocations() == 2);
    assertTrue (fv.value (dict.lookupIndex("length")) == 3);
  }
View Full Code Here

  public static class TestCRFTokenSequenceRemoveSpaces extends Pipe implements
      Serializable {

    /**
     * Creates the pipe by delegating to the {@code Pipe} constructor with
     * {@code null} as the first argument and a new {@link Alphabet} as the
     * second.
     * NOTE(review): the arguments are presumably (data alphabet, target
     * alphabet), i.e. no data alphabet and a fresh target alphabet -- confirm
     * against the Pipe constructor.
     */
    public TestCRFTokenSequenceRemoveSpaces() {
      super(null, new Alphabet());
    }
View Full Code Here

TOP

Related Classes of cc.mallet.types.Alphabet

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and owned by ORACLE Inc. Contact coftware#gmail.com.