blob: b28291e42b56b77374ed23cee59ba2f359df0fcc [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.tika.parser.image;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertFalse;
import static org.junit.Assert.assertNull;
import static org.junit.Assert.assertTrue;
import java.util.Arrays;
import java.util.GregorianCalendar;
import java.util.Iterator;
import java.util.List;
import java.util.Locale;
import java.util.TimeZone;
import com.drew.metadata.Directory;
import com.drew.metadata.MetadataException;
import com.drew.metadata.Tag;
import com.drew.metadata.exif.ExifIFD0Directory;
import com.drew.metadata.exif.ExifSubIFDDirectory;
import com.drew.metadata.jpeg.JpegCommentDirectory;
import org.junit.Test;
import org.mockito.Mockito;
import org.apache.tika.metadata.Metadata;
import org.apache.tika.metadata.TikaCoreProperties;
public class ImageMetadataExtractorTest {
@SuppressWarnings({"rawtypes", "unchecked"})
@Test
public void testHandleDirectories() throws MetadataException {
Metadata metadata = Mockito.mock(Metadata.class);
ImageMetadataExtractor.DirectoryHandler handler1 =
Mockito.mock(ImageMetadataExtractor.DirectoryHandler.class);
ImageMetadataExtractor e = new ImageMetadataExtractor(metadata, handler1);
Directory directory = new JpegCommentDirectory();
Iterator directories = Mockito.mock(Iterator.class);
Mockito.when(directories.hasNext()).thenReturn(true, false);
Mockito.when(directories.next()).thenReturn(directory);
Mockito.when(handler1.supports(JpegCommentDirectory.class)).thenReturn(true);
e.handle(directories);
Mockito.verify(handler1).supports(JpegCommentDirectory.class);
Mockito.verify(handler1).handle(directory, metadata);
}
@Test
public void testExifHandlerSupports() {
assertTrue(new ImageMetadataExtractor.ExifHandler().supports(ExifIFD0Directory.class));
assertTrue(new ImageMetadataExtractor.ExifHandler().supports(ExifSubIFDDirectory.class));
assertFalse(new ImageMetadataExtractor.ExifHandler().supports(Directory.class));
assertFalse(new ImageMetadataExtractor.ExifHandler().supports(JpegCommentDirectory.class));
}
@Test
public void testExifHandlerParseDate() throws MetadataException {
ExifSubIFDDirectory exif = Mockito.mock(ExifSubIFDDirectory.class);
Mockito.when(exif.containsTag(ExifSubIFDDirectory.TAG_DATETIME_ORIGINAL)).thenReturn(true);
GregorianCalendar calendar = new GregorianCalendar(TimeZone.getDefault(), Locale.ROOT);
calendar.setTimeInMillis(0);
calendar.set(2000, 0, 1, 0, 0, 0);
Mockito.when(exif.getDate(ExifSubIFDDirectory.TAG_DATETIME_ORIGINAL))
.thenReturn(calendar.getTime()); // jvm default timezone as in Metadata Extractor
Metadata metadata = new Metadata();
new ImageMetadataExtractor.ExifHandler().handle(exif, metadata);
assertEquals("Should be ISO date without time zone", "2000-01-01T00:00:00",
metadata.get(TikaCoreProperties.CREATED));
}
@Test
public void testExifHandlerParseDateFallback() throws MetadataException {
ExifIFD0Directory exif = Mockito.mock(ExifIFD0Directory.class);
Mockito.when(exif.containsTag(ExifIFD0Directory.TAG_DATETIME)).thenReturn(true);
GregorianCalendar calendar = new GregorianCalendar(TimeZone.getDefault(), Locale.ROOT);
calendar.setTimeInMillis(0);
calendar.set(1999, 0, 1, 0, 0, 0);
Mockito.when(exif.getDate(ExifIFD0Directory.TAG_DATETIME))
.thenReturn(calendar.getTime()); // jvm default timezone as in Metadata Extractor
Metadata metadata = new Metadata();
new ImageMetadataExtractor.ExifHandler().handle(exif, metadata);
assertEquals("Should try EXIF Date/Time if Original is not set", "1999-01-01T00:00:00",
metadata.get(TikaCoreProperties.CREATED));
}
@Test
public void testExifHandlerParseDateError() throws MetadataException {
ExifIFD0Directory exif = Mockito.mock(ExifIFD0Directory.class);
Mockito.when(exif.containsTag(ExifSubIFDDirectory.TAG_DATETIME_ORIGINAL)).thenReturn(true);
Mockito.when(exif.getDate(ExifSubIFDDirectory.TAG_DATETIME_ORIGINAL)).thenReturn(null);
Metadata metadata = new Metadata();
new ImageMetadataExtractor.ExifHandler().handle(exif, metadata);
assertEquals("Parsing should proceed without date", null,
metadata.get(TikaCoreProperties.CREATED));
}
@Test
public void testCopyUnknownFieldsHandler() throws MetadataException {
Directory d = Mockito.mock(Directory.class);
Tag t1 = Mockito.mock(Tag.class);
Mockito.when(t1.getTagName()).thenReturn("Image Description");
Mockito.when(t1.getDescription()).thenReturn("t1");
Tag t2 = Mockito.mock(Tag.class);
Mockito.when(t2.getTagName()).thenReturn(TikaCoreProperties.SUBJECT.toString());
Mockito.when(t2.getDescription()).thenReturn("known");
Tag t3 = Mockito.mock(Tag.class);
Mockito.when(t3.getTagName()).thenReturn(TikaCoreProperties.DESCRIPTION.getName());
Mockito.when(t3.getDescription()).thenReturn("known");
List<Tag> tags = Arrays.asList(t1, t2, t3);
Mockito.when(d.getTags()).thenReturn(tags);
Metadata metadata = new Metadata();
new ImageMetadataExtractor.CopyUnknownFieldsHandler().handle(d, metadata);
assertEquals("t1", metadata.get("Image Description"));
assertNull("keywords should be excluded from bulk copy because it is a defined field",
metadata.get(TikaCoreProperties.SUBJECT));
assertNull(metadata.get(TikaCoreProperties.DESCRIPTION));
}
}