/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.tika.config;
import java.net.URL;
import java.util.List;
import java.util.Map;
import org.apache.tika.ResourceLoggingClassLoader;
import org.apache.tika.exception.TikaException;
import org.apache.tika.parser.AutoDetectParser;
import org.apache.tika.parser.DefaultParser;
import org.junit.Test;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertNotNull;
import static org.junit.Assert.assertTrue;
import static org.junit.Assert.fail;
public class TikaConfigTest {
/**
* Make sure that a configuration file can't reference the
* {@link AutoDetectParser} class a <parser> configuration element.
*
* @see <a href="https://issues.apache.org/jira/browse/TIKA-866">TIKA-866</a>
*/
@Test
public void testInvalidParser() throws Exception {
URL url = TikaConfigTest.class.getResource("TIKA-866-invalid.xml");
System.setProperty("tika.config", url.toExternalForm());
try {
new TikaConfig();
fail("AutoDetectParser allowed in a <parser> element");
} catch (TikaException expected) {
} finally {
System.clearProperty("tika.config");
}
}
/**
* Make sure that a configuration file can reference also a composite
* parser class like {@link DefaultParser} in a <parser>
* configuration element.
*
* @see <a href="https://issues.apache.org/jira/browse/TIKA-866">TIKA-866</a>
*/
public void testCompositeParser() throws Exception {
URL url = TikaConfigTest.class.getResource("TIKA-866-composite.xml");
System.setProperty("tika.config", url.toExternalForm());
try {
new TikaConfig();
} catch (TikaException e) {
fail("Unexpected TikaException: " + e);
} finally {
System.clearProperty("tika.config");
}
}
/**
* Make sure that a valid configuration file without mimetypes or
* detector entries can be loaded without problems.
*
* @see <a href="https://issues.apache.org/jira/browse/TIKA-866">TIKA-866</a>
*/
public void testValidParser() throws Exception {
URL url = TikaConfigTest.class.getResource("TIKA-866-valid.xml");
System.setProperty("tika.config", url.toExternalForm());
try {
new TikaConfig();
} catch (TikaException e) {
fail("Unexpected TikaException: " + e);
} finally {
System.clearProperty("tika.config");
}
}
/**
* TIKA-1145 If the TikaConfig has a ClassLoader set on it,
* that should be used when loading the mimetypes and when
* discovering services
*/
public void testClassLoaderUsedEverywhere() throws Exception {
ResourceLoggingClassLoader customLoader =
new ResourceLoggingClassLoader(getClass().getClassLoader());
TikaConfig config;
// Without a classloader set, normal one will be used
config = new TikaConfig();
config.getMediaTypeRegistry();
config.getParser();
assertEquals(0, customLoader.getLoadedResources().size());
// With a classloader set, resources will come through it
config = new TikaConfig(customLoader);
config.getMediaTypeRegistry();
config.getParser();
Map<String,List<URL>> resources = customLoader.getLoadedResources();
int resourcesCount = resources.size();
assertTrue(
"Not enough things used the classloader, found only " + resourcesCount,
resourcesCount > 3
);
// Ensure everything that should do, did use it
// - Parsers
assertNotNull(resources.get("META-INF/services/org.apache.tika.parser.Parser"));
// - Detectors
assertNotNull(resources.get("META-INF/services/org.apache.tika.detect.Detector"));
// - Built-In Mimetypes
assertNotNull(resources.get("org/apache/tika/mime/tika-mimetypes.xml"));
// - Custom Mimetypes
assertNotNull(resources.get("org/apache/tika/mime/custom-mimetypes.xml"));
}
}