/* * Copyright (C) 2005-2009 Alfresco Software Limited. * * This program is free software; you can redistribute it and/or * modify it under the terms of the GNU General Public License * as published by the Free Software Foundation; either version 2 * of the License, or (at your option) any later version. * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. * As a special exception to the terms and conditions of version 2.0 of * the GPL, you may redistribute this Program in connection with Free/Libre * and Open Source Software ("FLOSS") applications as described in Alfresco's * FLOSS exception. You should have recieved a copy of the text describing * the FLOSS exception, and it is also available here: * http://www.alfresco.com/legal/licensing" */ package org.alfresco.repo.content.metadata; import java.io.IOException; import java.io.InputStream; import java.io.Serializable; import java.io.UnsupportedEncodingException; import java.util.Arrays; import java.util.Enumeration; import java.util.HashSet; import java.util.Map; import java.util.Set; import javax.mail.Header; import javax.mail.internet.InternetAddress; import javax.mail.internet.MimeMessage; import javax.mail.internet.MimeUtility; import javax.mail.internet.MimeMessage.RecipientType; import org.alfresco.repo.content.MimetypeMap; import org.alfresco.service.cmr.repository.ContentReader; /** * Metadata extractor for the PDF documents. *
 *   messageFrom:              --      imap:messageFrom
 *   messageTo:                --      imap:messageTo
 *   messageCc:                --      imap:messageCc
 *   messageSubject:           --      imap:messageSubject, cm:title, cm:description
 *   All {@link Header#getName() header names}:
 *      Thread-Index:          --      imap:threadIndex
 *      Message-ID:            --      imap:messageId
 * 
 * @author Derek Hulley
 * @since 3.2
 */
public class RFC822MetadataExtracter extends AbstractMappingMetadataExtracter
{

    private static final String KEY_MESSAGE_FROM = "messageFrom";
    private static final String KEY_MESSAGE_TO = "messageTo";
    private static final String KEY_MESSAGE_CC = "messageCc";
    private static final String KEY_MESSAGE_SUBJECT = "messageSubject";

    public static String[] SUPPORTED_MIMETYPES = new String[] { MimetypeMap.MIMETYPE_RFC822 };

    public RFC822MetadataExtracter()
    {
        super(new HashSet(Arrays.asList(SUPPORTED_MIMETYPES)));
    }

    @Override
    protected Map extractRaw(ContentReader reader) throws Throwable
    {
        Map rawProperties = newRawMap();

        InputStream is = null;
        try
        {
            is = reader.getContentInputStream();
            MimeMessage mimeMessage = new MimeMessage(null, is);

            if (mimeMessage != null)
            {
                //Extract values that doesn't match to headers and need to be encoded.
                putRawValue(KEY_MESSAGE_FROM, InternetAddress.toString(mimeMessage.getFrom()), rawProperties);
                putRawValue(KEY_MESSAGE_TO, InternetAddress.toString(mimeMessage.getRecipients(RecipientType.TO)), rawProperties);
                putRawValue(KEY_MESSAGE_CC, InternetAddress.toString(mimeMessage.getRecipients(RecipientType.CC)), rawProperties);

                String[] subj = mimeMessage.getHeader("Subject");
                if (subj != null && subj.length > 0)
                {
                    String decodedSubject = subj[0];
                    try
                    {
                        decodedSubject = MimeUtility.decodeText(decodedSubject);
                    }
                    catch (UnsupportedEncodingException e)
                    {
                        logger.warn(e.toString());
                    }
                    putRawValue(KEY_MESSAGE_SUBJECT, decodedSubject, rawProperties);
                }
                
                //Extract values from headers
                Set keys = getMapping().keySet();
                Enumeration
headers = mimeMessage.getAllHeaders(); while (headers.hasMoreElements()) { Header header = (Header) headers.nextElement(); if (keys.contains(header.getName())) { header.getValue(); putRawValue(header.getName(), header.getValue(), rawProperties); } } } } finally { if (is != null) { try { is.close(); } catch (IOException e) { } } } // Done return rawProperties; } }