/*
* Copyright (C) 2005 Jesper Steen Møller
*
* This file is part of Alfresco
*
* Alfresco is free software: you can redistribute it and/or modify
* it under the terms of the GNU Lesser General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Alfresco is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public License
* along with Alfresco. If not, see <http://www.gnu.org/licenses/>.
* author: -- cm:author * title: -- cm:title * subject: -- cm:description * createDateTime: -- cm:created * lastSaveDateTime: -- cm:modified * comments: * editTime: * format: * keywords: * lastAuthor: * lastPrinted: * osVersion: * thumbnail: * pageCount: * wordCount: ** * Uses Apache Tika * * @author Derek Hulley * @author Nick Burch */ public class OfficeMetadataExtracter extends TikaPoweredMetadataExtracter { public static final String KEY_CREATE_DATETIME = "createDateTime"; public static final String KEY_LAST_SAVE_DATETIME = "lastSaveDateTime"; public static final String KEY_EDIT_TIME = "editTime"; public static final String KEY_FORMAT = "format"; public static final String KEY_KEYWORDS = "keywords"; public static final String KEY_LAST_AUTHOR = "lastAuthor"; public static final String KEY_LAST_PRINTED = "lastPrinted"; public static final String KEY_OS_VERSION = "osVersion"; // TODO public static final String KEY_THUMBNAIL = "thumbnail"; // TODO public static final String KEY_PAGE_COUNT = "pageCount"; public static final String KEY_PARAGRAPH_COUNT = "paragraphCount"; public static final String KEY_WORD_COUNT = "wordCount"; public static ArrayList