Package ch.akuhn.hapax.index

Examples of ch.akuhn.hapax.index.TermDocumentMatrix.documentCount()


    public TermDocumentMatrix makeTermDocumentMatrix() {
        TermDocumentMatrix tdm = new TermDocumentMatrix();
        for (String[] each: DATA) {
            tdm.putDocument(each[0], new Terms(each[1]));
        }
        assertEquals(9, tdm.documentCount());
        assertEquals(45, tdm.termCount());
        return tdm;
    }
   
    @Test
View Full Code Here


    @Test
    @Given("#makeTermDocumentMatrix")
    public TermDocumentMatrix rejectStopWords(final TermDocumentMatrix matrix) {
        TermDocumentMatrix tdm = matrix;
        tdm = tdm.toLowerCase();
        assertEquals(9, tdm.documentCount());
        assertEquals(42, tdm.termCount());
        tdm = tdm.rejectHapaxes();
        assertEquals(9, tdm.documentCount());
        assertEquals(16, tdm.termCount());
        tdm = tdm.toLowerCase().rejectStopwords();
View Full Code Here

        TermDocumentMatrix tdm = matrix;
        tdm = tdm.toLowerCase();
        assertEquals(9, tdm.documentCount());
        assertEquals(42, tdm.termCount());
        tdm = tdm.rejectHapaxes();
        assertEquals(9, tdm.documentCount());
        assertEquals(16, tdm.termCount());
        tdm = tdm.toLowerCase().rejectStopwords();
        assertEquals(9, tdm.documentCount());
        assertEquals(12, tdm.termCount());
        assertEquals(SORTED, Get.sorted(tdm.terms().elementSet()).toString());
View Full Code Here

        assertEquals(42, tdm.termCount());
        tdm = tdm.rejectHapaxes();
        assertEquals(9, tdm.documentCount());
        assertEquals(16, tdm.termCount());
        tdm = tdm.toLowerCase().rejectStopwords();
        assertEquals(9, tdm.documentCount());
        assertEquals(12, tdm.termCount());
        assertEquals(SORTED, Get.sorted(tdm.terms().elementSet()).toString());
        return tdm;
    }
   
View Full Code Here

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by ORACLE Inc. Contact coftware#gmail.com.