/*
 * Copyright (C) 2005 Jesper Steen Møller
 *
 * This file is part of Alfresco
 *
 * Alfresco is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Lesser General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * Alfresco is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public License
 * along with Alfresco. If not, see <http://www.gnu.org/licenses/>.
* author: -- cm:author * title: -- cm:title * subject: -- cm:description * createDateTime: -- cm:created * lastSaveDateTime: -- cm:modified * comments: * editTime: * format: * keywords: * lastAuthor: * lastPrinted: * osVersion: * thumbnail: * pageCount: * wordCount: ** * Uses Apache Tika * * @author Derek Hulley * @author Nick Burch */ public class OfficeMetadataExtracter extends TikaPoweredMetadataExtracter { public static final String KEY_CREATE_DATETIME = "createDateTime"; public static final String KEY_LAST_SAVE_DATETIME = "lastSaveDateTime"; public static final String KEY_EDIT_TIME = "editTime"; public static final String KEY_FORMAT = "format"; public static final String KEY_KEYWORDS = "keywords"; public static final String KEY_LAST_AUTHOR = "lastAuthor"; public static final String KEY_LAST_PRINTED = "lastPrinted"; public static final String KEY_OS_VERSION = "osVersion"; // TODO public static final String KEY_THUMBNAIL = "thumbnail"; // TODO public static final String KEY_PAGE_COUNT = "pageCount"; public static final String KEY_PARAGRAPH_COUNT = "paragraphCount"; public static final String KEY_WORD_COUNT = "wordCount"; public static ArrayList