/*
* #%L
* Alfresco Repository
* %%
* Copyright (C) 2005 - 2016 Alfresco Software Limited
* %%
* This file is part of the Alfresco software.
* If the software was purchased under a paid Alfresco license, the terms of
* the paid license agreement will prevail. Otherwise, the software is
* provided under the following open source license terms:
*
* Alfresco is free software: you can redistribute it and/or modify
* it under the terms of the GNU Lesser General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Alfresco is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public License
* along with Alfresco. If not, see .
* #L%
*/
/*
* Copyright (C) 2005 Jesper Steen Møller
*
* This file is part of Alfresco
*
* Alfresco is free software: you can redistribute it and/or modify
* it under the terms of the GNU Lesser General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Alfresco is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public License
* along with Alfresco. If not, see .
*/
package org.alfresco.repo.content.metadata;
import java.io.Serializable;
import java.util.Arrays;
import java.util.HashSet;
import java.util.Map;
import org.alfresco.repo.content.MimetypeMap;
import org.alfresco.service.cmr.repository.ContentReader;
import org.alfresco.util.PropertyCheck;
/**
* Extracts values from Star Office documents into the following:
*
* author: -- cm:author
* title: -- cm:title
* description: -- cm:description
*
*
* Note - not converted to Apache Tika, as currently Tika
* lacks support for these older formats
*
* @author Jesper Steen Møller
*/
public class OpenOfficeMetadataExtracter extends AbstractMappingMetadataExtracter implements OpenOfficeMetadataWorker
{
public static String[] SUPPORTED_MIMETYPES = new String[] {
MimetypeMap.MIMETYPE_STAROFFICE5_WRITER,
MimetypeMap.MIMETYPE_STAROFFICE5_IMPRESS,
MimetypeMap.MIMETYPE_OPENOFFICE1_WRITER,
MimetypeMap.MIMETYPE_OPENOFFICE1_IMPRESS
};
private OpenOfficeMetadataWorker worker;
public OpenOfficeMetadataExtracter()
{
super(new HashSet(Arrays.asList(SUPPORTED_MIMETYPES)));
}
public void setWorker(OpenOfficeMetadataWorker worker)
{
this.worker = worker;
}
/**
* Initialises the bean by establishing an UNO connection
*/
@Override
public synchronized void init()
{
PropertyCheck.mandatory("OpenOfficeMetadataExtracter", "worker", worker);
// Base initialization
super.init();
}
/**
* {@inheritDoc}
*/
public boolean isConnected()
{
return worker.isConnected();
}
/**
* Perform the default check, but also check if the OpenOffice connection is good.
*/
@Override
public boolean isSupported(String sourceMimetype)
{
if (!isConnected())
{
return false;
}
return super.isSupported(sourceMimetype);
}
/**
* {@inheritDoc}
*/
@Override
public Map extractRaw(ContentReader reader) throws Throwable
{
Map rawProperties = newRawMap();
Map result = this.worker.extractRaw(reader);
for (Map.Entry entry : result.entrySet())
{
putRawValue(entry.getKey(), entry.getValue(), rawProperties);
}
return rawProperties;
}
}