Examples of Tika


Examples of org.apache.tika.Tika

        if (types == null) {
            types = config.getMimeRepository();
        }

        if(tika == null) {
            tika = new Tika(config);
        }
    }
View Full Code Here

Examples of org.apache.tika.Tika

public class ClassParserTest extends TestCase {

    public void testClassParsing() throws Exception {
        String path = "/test-documents/AutoDetectParser.class";
        Metadata metadata = new Metadata();
        String content = new Tika().parseToString(
                ClassParserTest.class.getResourceAsStream(path), metadata);

        assertEquals("AutoDetectParser", metadata.get(Metadata.TITLE));
        assertEquals(
                "AutoDetectParser.class",
View Full Code Here

Examples of org.apache.tika.Tika

    }

    public void XtestParseUTF8() throws IOException, SAXException, TikaException {
        String path = "/test-documents/testXHTML_utf8.html";
        Metadata metadata = new Metadata();
        String content = new Tika().parseToString(
                HtmlParserTest.class.getResourceAsStream(path), metadata);

        assertTrue("Did not contain expected text:"
                + "Title : Tilte with UTF-8 chars öäå", content
                .contains("Title : Tilte with UTF-8 chars öäå"));
View Full Code Here

Examples of org.apache.tika.Tika

    }

    public void testXhtmlParsing() throws Exception {
        String path = "/test-documents/testXHTML.html";
        Metadata metadata = new Metadata();
        String content = new Tika().parseToString(
                HtmlParserTest.class.getResourceAsStream(path), metadata);

        assertEquals("application/xhtml+xml", metadata.get(Metadata.CONTENT_TYPE));
        assertEquals("XHTML test document", metadata.get(Metadata.TITLE));
View Full Code Here

Examples of org.apache.tika.Tika

     * Test case for TIKA-210
     * @see <a href="https://issues.apache.org/jira/browse/TIKA-210">TIKA-210</a>
     */
    public void testCharactersDirectlyUnderBodyElement() throws Exception {
        String test = "<html><body>test</body></html>";
        String content = new Tika().parseToString(
                new ByteArrayInputStream(test.getBytes("UTF-8")));
        assertEquals("test", content);
    }
View Full Code Here

Examples of org.apache.tika.Tika

     * @see <a href="https://issues.apache.org/jira/browse/TIKA-268">TIKA-268</a>
     */
    public void testWhitespaceBetweenTableCells() throws Exception {
        String test =
            "<html><body><table><tr><td>a</td><td>b</td></table></body></html>";
        String content = new Tika().parseToString(
                new ByteArrayInputStream(test.getBytes("UTF-8")));
        assertTrue(content.contains("a"));
        assertTrue(content.contains("b"));
        assertFalse(content.contains("ab"));
    }
View Full Code Here

Examples of org.apache.tika.Tika

public class AudioParserTest extends TestCase {

    public void testWAV() throws Exception {
        String path = "/test-documents/testWAV.wav";
        Metadata metadata = new Metadata();
        String content = new Tika().parseToString(
                AudioParserTest.class.getResourceAsStream(path), metadata);

        assertEquals("audio/x-wav", metadata.get(Metadata.CONTENT_TYPE));
        assertEquals("44100.0", metadata.get("samplerate"));
        assertEquals("2", metadata.get("channels"));
View Full Code Here

Examples of org.apache.tika.Tika

    }

    public void testAIFF() throws Exception {
        String path = "/test-documents/testAIFF.aif";
        Metadata metadata = new Metadata();
        String content = new Tika().parseToString(
                AudioParserTest.class.getResourceAsStream(path), metadata);

        assertEquals("audio/x-aiff", metadata.get(Metadata.CONTENT_TYPE));
        assertEquals("44100.0", metadata.get("samplerate"));
        assertEquals("2", metadata.get("channels"));
View Full Code Here

Examples of org.apache.tika.Tika

    }

    public void testAU() throws Exception {
        String path = "/test-documents/testAU.au";
        Metadata metadata = new Metadata();
        String content = new Tika().parseToString(
                AudioParserTest.class.getResourceAsStream(path), metadata);

        assertEquals("audio/basic", metadata.get(Metadata.CONTENT_TYPE));
        assertEquals("44100.0", metadata.get("samplerate"));
        assertEquals("2", metadata.get("channels"));
View Full Code Here

Examples of org.apache.tika.Tika

public class MidiParserTest extends TestCase {

    public void testMID() throws Exception {
        String path = "/test-documents/testMID.mid";
        Metadata metadata = new Metadata();
        String content = new Tika().parseToString(
                MidiParserTest.class.getResourceAsStream(path), metadata);

        assertEquals("audio/midi", metadata.get(Metadata.CONTENT_TYPE));
        assertEquals("2", metadata.get("tracks"));
        assertEquals("0", metadata.get("patches"));
View Full Code Here
TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc., and is owned by Oracle Inc. Contact coftware#gmail.com.