package hapax.test;
import static org.junit.Assert.assertEquals;
import org.junit.Test;
import ch.akuhn.hapax.corpus.Terms;
import ch.akuhn.hapax.index.LatentSemanticIndex;
import ch.akuhn.hapax.index.TermDocumentMatrix;
public class SmallDocumentsTest {
@Test
public void corpusWithSmallDocuments() {
TermDocumentMatrix tdm = new TermDocumentMatrix();
tdm.putDocument("m1", new Terms("Lorem ipsum dolor."));
tdm.putDocument("m2", new Terms("Lorem ipsum dolor."));
tdm.putDocument("m3", new Terms("Lorem ipsum dolor."));
LatentSemanticIndex lsi = tdm.rejectAndWeight().createIndex();
assertEquals(3, lsi.documentCount());
assertEquals(3, lsi.rankDocumentsByQuery("Lorem").size());
}
@Test
public void corpusWithoutDocuments() {
TermDocumentMatrix tdm = new TermDocumentMatrix();
LatentSemanticIndex lsi = tdm.rejectAndWeight().createIndex();
assertEquals(0, lsi.documentCount());
assertEquals(0, lsi.rankDocumentsByQuery("Lorem").size());
}
@Test
public void corpusWithoutOneDocuments() {
TermDocumentMatrix tdm = new TermDocumentMatrix();
tdm.putDocument("m1", new Terms("Lorem ipsum dolor."));
LatentSemanticIndex lsi = tdm.rejectAndWeight().createIndex();
assertEquals(1, lsi.documentCount());
assertEquals(1, lsi.rankDocumentsByQuery("Lorem").size());
}
}