k-9/k9mail-library/src/main/java/com/fsck/k9/mail/internet/MessageExtractor.java

package com.fsck.k9.mail.internet;

import android.util.Log;

import com.fsck.k9.mail.Body;
import com.fsck.k9.mail.BodyPart;
import com.fsck.k9.mail.Message;
import com.fsck.k9.mail.MessagingException;
import com.fsck.k9.mail.Multipart;
import com.fsck.k9.mail.Part;

import java.io.IOException;
import java.io.InputStream;
import java.util.ArrayList;
import java.util.HashSet;
import java.util.List;
import java.util.Set;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

import static com.fsck.k9.mail.K9MailLib.LOG_TAG;
import static com.fsck.k9.mail.internet.CharsetSupport.fixupCharset;
import static com.fsck.k9.mail.internet.MimeUtility.getHeaderParameter;
import static com.fsck.k9.mail.internet.Viewable.Alternative;
import static com.fsck.k9.mail.internet.Viewable.Html;
import static com.fsck.k9.mail.internet.Viewable.MessageHeader;
import static com.fsck.k9.mail.internet.Viewable.Text;
import static com.fsck.k9.mail.internet.Viewable.Textual;

/**
 * Static helpers that pull displayable text, viewable parts and attachments out of a message's
 * MIME tree.
 */
public class MessageExtractor {
    /** Number of leading body bytes inspected when looking for an HTML {@code <meta>} charset. */
    private static final int CHARSET_SNIFF_LIMIT = 256;

    /** Matches a Content-Type {@code <meta>} tag and captures the declared charset in group 1. */
    private static final Pattern META_CHARSET_PATTERN = Pattern.compile(
            "<meta http-equiv=\"?Content-Type\"? content=\"text/html; charset=(.+?)\">",
            Pattern.CASE_INSENSITIVE);

    private MessageExtractor() {}

    /**
     * Extract the text of a part as a string.
     *
     * <p>A {@link TextBody} is returned as-is. For any other body of a {@code text/*} part the
     * decoded body is read using the charset from the Content-Type header; for
     * {@code text/html} parts without a charset parameter the first
     * {@value #CHARSET_SNIFF_LIMIT} bytes are searched for a {@code <meta>} charset
     * declaration.</p>
     *
     * @param part
     *         The part to read. May be {@code null}.
     *
     * @return The text of the part, an empty string for an empty {@code text/html} body without
     *         a charset parameter, or {@code null} if the part is {@code null}, has no body, is
     *         not a text part, or could not be processed (the failure is logged).
     */
    public static String getTextFromPart(Part part) {
        try {
            if ((part != null) && (part.getBody() != null)) {
                final Body body = part.getBody();
                if (body instanceof TextBody) {
                    return ((TextBody) body).getText();
                }

                final String mimeType = part.getMimeType();
                if ((mimeType != null) && MimeUtility.mimeTypeMatches(mimeType, "text/*")) {
                    /*
                     * We've got a text part, so let's see if it needs to be processed further.
                     */
                    String charset = getHeaderParameter(part.getContentType(), "charset");

                    /*
                     * No charset in the header of an HTML part: try to determine it from the
                     * beginning of the HTML document itself.
                     */
                    if (charset == null && mimeType.equalsIgnoreCase("text/html")) {
                        String head = readLeadingAscii(body, CHARSET_SNIFF_LIMIT);
                        if (head.isEmpty()) {
                            // Nothing could be read, so there is no text to return.
                            return "";
                        }

                        Matcher matcher = META_CHARSET_PATTERN.matcher(head);
                        if (matcher.find()) {
                            charset = matcher.group(1);
                        }
                    }
                    // fixupCharset has the final say on the charset name; it is handed the
                    // enclosing message (or null if none was found) along with our candidate.
                    charset = fixupCharset(charset, getMessageFromPart(part));

                    /*
                     * Now we read the part into a string. decodeBody() wraps the stream, so any
                     * transfer encoding is removed at this point.
                     */
                    InputStream in = MimeUtility.decodeBody(body);
                    try {
                        return CharsetSupport.readToString(in, charset);
                    } finally {
                        closeQuietly(in);
                    }
                }
            }
        } catch (OutOfMemoryError oom) {
            /*
             * If we are not able to process the body there's nothing we can do about it. Return
             * null and let the upper layers handle the missing content.
             */
            Log.e(LOG_TAG, "Unable to getTextFromPart " + oom.toString());
        } catch (Exception e) {
            /*
             * If we are not able to process the body there's nothing we can do about it. Return
             * null and let the upper layers handle the missing content.
             */
            Log.e(LOG_TAG, "Unable to getTextFromPart", e);
        }
        return null;
    }

    /**
     * Read up to {@code limit} bytes from the start of the decoded body and interpret them as
     * US-ASCII.
     *
     * <p>The read is repeated until the buffer is full or the stream ends, because a single
     * {@link InputStream#read(byte[], int, int)} call may deliver fewer bytes than requested.
     * Only the bytes actually read end up in the result.</p>
     *
     * @return The leading bytes as a string; empty if the stream delivered no data.
     */
    private static String readLeadingAscii(Body body, int limit) throws IOException, MessagingException {
        InputStream in = MimeUtility.decodeBody(body);
        try {
            byte[] buffer = new byte[limit];
            int filled = 0;
            while (filled < buffer.length) {
                int count = in.read(buffer, filled, buffer.length - filled);
                if (count <= 0) {
                    // End of stream (or a stream that makes no progress).
                    break;
                }
                filled += count;
            }
            return new String(buffer, 0, filled, "US-ASCII");
        } finally {
            closeQuietly(in);
        }
    }

    /**
     * Close a stream obtained from {@link MimeUtility#decodeBody(Body)}, ignoring any
     * {@link IOException}. A failure to close must not mask the result or exception of the read
     * that preceded it.
     */
    private static void closeQuietly(InputStream in) {
        try {
            MimeUtility.closeInputStreamWithoutDeletingTemporaryFiles(in);
        } catch (IOException ignored) {
            // Deliberately ignored, see method comment.
        }
    }

    /**
     * Traverse the MIME tree of a message and extract viewable parts.
     *
     * @param part
     *         The message part to start from.
     * @param attachments
     *         A list that will receive the parts that are considered attachments.
     *
     * @return A list of {@link Viewable}s.
     *
     * @throws MessagingException
     *          In case of an error.
     */
    public static List<Viewable> getViewables(Part part, List<Part> attachments) throws MessagingException {
        List<Viewable> viewables = new ArrayList<Viewable>();

        Body body = part.getBody();
        if (body instanceof Multipart) {
            Multipart multipart = (Multipart) body;
            if ("multipart/alternative".equalsIgnoreCase(part.getMimeType())) {
                /*
                 * For multipart/alternative parts we try to find a text/plain and a text/html
                 * child. Everything else we find is put into 'attachments'.
                 */
                List<Viewable> text = findTextPart(multipart, true);

                // The text/plain parts found above must not be reported as attachments while
                // looking for the HTML alternative.
                Set<Part> knownTextParts = getParts(text);
                List<Viewable> html = findHtmlPart(multipart, knownTextParts, attachments, true);

                if (!text.isEmpty() || !html.isEmpty()) {
                    viewables.add(new Alternative(text, html));
                }
            } else {
                // For all other multipart parts we recurse to grab all viewable children.
                for (Part bodyPart : multipart.getBodyParts()) {
                    viewables.addAll(getViewables(bodyPart, attachments));
                }
            }
        } else if (body instanceof Message &&
                !("attachment".equalsIgnoreCase(getContentDisposition(part)))) {
            /*
             * We only care about message/rfc822 parts whose Content-Disposition header has a value
             * other than "attachment".
             */
            Message message = (Message) body;

            // We add the Message object so we can extract the filename later.
            viewables.add(new MessageHeader(part, message));

            // Recurse to grab all viewable parts and attachments from that message.
            viewables.addAll(getViewables(message, attachments));
        } else if (isPartTextualBody(part)) {
            /*
             * Save text/plain and text/html. isPartTextualBody() only accepts these two types,
             * so anything that is not text/plain here is text/html.
             */
            if ("text/plain".equalsIgnoreCase(part.getMimeType())) {
                viewables.add(new Text(part));
            } else {
                viewables.add(new Html(part));
            }
        } else if ("application/pgp-signature".equalsIgnoreCase(part.getMimeType())) {
            // ignore this type explicitly
        } else {
            // Everything else is treated as attachment.
            attachments.add(part);
        }

        return viewables;
    }

    /**
     * Collect the parts referenced by the textual viewables found below {@code part}.
     *
     * @param part
     *         The message part to start from.
     *
     * @return The set of parts backing the viewables; attachments found on the way are
     *         discarded.
     *
     * @throws MessagingException
     *          In case of an error.
     */
    public static Set<Part> getTextParts(Part part) throws MessagingException {
        // getViewables() needs somewhere to put attachments; we are not interested in them.
        List<Part> attachments = new ArrayList<Part>();
        return getParts(getViewables(part, attachments));
    }

    /**
     * Collect attachment parts of a message.
     * @return A list of parts regarded as attachments.
     * @throws MessagingException In case of an error.
     */
    public static List<Part> collectAttachments(Message message) throws MessagingException {
        try {
            List<Part> attachments = new ArrayList<Part>();
            getViewables(message, attachments);
            return attachments;
        } catch (Exception e) {
            throw new MessagingException("Couldn't collect attachment parts", e);
        }
    }

    /**
     * Collect the viewable textual parts of a message.
     * @return A set of viewable parts of the message.
     * @throws MessagingException In case of an error.
     */
    public static Set<Part> collectTextParts(Message message) throws MessagingException {
        try {
            return getTextParts(message);
        } catch (Exception e) {
            throw new MessagingException("Couldn't extract viewable parts", e);
        }
    }

    /**
     * Walk up the MIME tree from {@code part} to the closest enclosing {@link Message}.
     *
     * @return The part itself if it is a {@code Message}, otherwise the first {@code Message}
     *         found by following parent links; {@code null} if the chain ends before one is
     *         reached.
     */
    private static Message getMessageFromPart(Part part) {
        while (part != null) {
            if (part instanceof Message) {
                return (Message) part;
            }

            if (!(part instanceof BodyPart)) {
                return null;
            }

            Multipart multipart = ((BodyPart) part).getParent();
            if (multipart == null) {
                return null;
            }

            part = multipart.getParent();
        }
        return null;
    }

    /**
     * Search the children of a {@link Multipart} for {@code text/plain} parts.
     *
     * @param multipart The {@code Multipart} to search through.
     * @param directChild If {@code true}, the search stops at the first child that yields text:
     *         either a {@code text/plain} part or a nested multipart containing at least one.
     *         Nested multiparts are always searched completely.
     *
     * @return A list of {@link Text} viewables.
     *
     * @throws MessagingException
     *          In case of an error.
     */
    private static List<Viewable> findTextPart(Multipart multipart, boolean directChild)
            throws MessagingException {
        List<Viewable> viewables = new ArrayList<Viewable>();

        for (Part part : multipart.getBodyParts()) {
            Body body = part.getBody();
            if (body instanceof Multipart) {
                Multipart innerMultipart = (Multipart) body;

                /*
                 * Recurse to find text parts. Since this is a multipart that is a child of a
                 * multipart/alternative we don't want to stop after the first text/plain part
                 * we find. This will allow to get all text parts for constructions like this:
                 *
                 * 1. multipart/alternative
                 * 1.1. multipart/mixed
                 * 1.1.1. text/plain
                 * 1.1.2. text/plain
                 * 1.2. text/html
                 */
                List<Viewable> textViewables = findTextPart(innerMultipart, false);

                if (!textViewables.isEmpty()) {
                    viewables.addAll(textViewables);
                    if (directChild) {
                        break;
                    }
                }
            } else if (isPartTextualBody(part) && "text/plain".equalsIgnoreCase(part.getMimeType())) {
                viewables.add(new Text(part));
                if (directChild) {
                    break;
                }
            }
        }
        return viewables;
    }

    /**
     * Search the children of a {@link Multipart} for {@code text/html} parts.
     * Every part that is not a {@code text/html} we want to display, we add to 'attachments'.
     *
     * @param multipart The {@code Multipart} to search through.
     * @param knownTextParts A set of {@code text/plain} parts that shouldn't be added to 'attachments'.
     * @param attachments A list that will receive the parts that are considered attachments.
     * @param directChild If {@code true}, only the first child that yields HTML is used (a
     *         {@code text/html} part, or a nested multipart containing at least one). Later
     *         {@code text/html} parts are added to 'attachments' and later multiparts are only
     *         scanned for attachments.
     *
     * @return A list of {@link Html} viewables.
     *
     * @throws MessagingException In case of an error.
     */
    private static List<Viewable> findHtmlPart(Multipart multipart, Set<Part> knownTextParts,
                                               List<Part> attachments, boolean directChild) throws MessagingException {
        List<Viewable> viewables = new ArrayList<Viewable>();

        boolean partFound = false;
        for (Part part : multipart.getBodyParts()) {
            Body body = part.getBody();
            if (body instanceof Multipart) {
                Multipart innerMultipart = (Multipart) body;

                if (directChild && partFound) {
                    // We already found our text/html part. Now we're only looking for attachments.
                    findAttachments(innerMultipart, knownTextParts, attachments);
                } else {
                    /*
                     * Recurse to find HTML parts. Since this is a multipart that is a child of a
                     * multipart/alternative we don't want to stop after the first text/html part
                     * we find. This will allow to get all text parts for constructions like this:
                     *
                     * 1. multipart/alternative
                     * 1.1. text/plain
                     * 1.2. multipart/mixed
                     * 1.2.1. text/html
                     * 1.2.2. text/html
                     * 1.3. image/jpeg
                     */
                    List<Viewable> htmlViewables = findHtmlPart(innerMultipart, knownTextParts,
                            attachments, false);

                    if (!htmlViewables.isEmpty()) {
                        partFound = true;
                        viewables.addAll(htmlViewables);
                    }
                }
            } else if (!(directChild && partFound) && isPartTextualBody(part) &&
                    "text/html".equalsIgnoreCase(part.getMimeType())) {
                viewables.add(new Html(part));
                partFound = true;
            } else if (!knownTextParts.contains(part)) {
                // Only add this part as attachment if it's not a viewable text/plain part found
                // earlier.
                attachments.add(part);
            }
        }

        return viewables;
    }

    /**
     * Traverse the MIME tree and add everything that's not a known text part to 'attachments'.
     *
     * @param multipart
     *         The {@link Multipart} to start from.
     * @param knownTextParts
     *         A set of known text parts we don't want to end up in 'attachments'.
     * @param attachments
     *         A list that will receive the parts that are considered attachments.
     */
    private static void findAttachments(Multipart multipart, Set<Part> knownTextParts,
                                        List<Part> attachments) {
        for (Part part : multipart.getBodyParts()) {
            Body body = part.getBody();
            if (body instanceof Multipart) {
                // Multipart containers themselves are never attachments; only their leaves are.
                findAttachments((Multipart) body, knownTextParts, attachments);
            } else if (!knownTextParts.contains(part)) {
                attachments.add(part);
            }
        }
    }

    /**
     * Build a set of message parts for fast lookups.
     *
     * <p>{@link Textual} viewables contribute their part, {@link Alternative} viewables
     * contribute the parts of both their text and HTML lists. Other viewables contribute
     * nothing.</p>
     *
     * @param viewables
     *         A list of {@link Viewable}s containing references to the message parts to include in
     *         the set.
     *
     * @return The set of viewable {@code Part}s.
     *
     * @see MessageExtractor#findHtmlPart(Multipart, Set, List, boolean)
     * @see MessageExtractor#findAttachments(Multipart, Set, List)
     */
    private static Set<Part> getParts(List<Viewable> viewables) {
        Set<Part> parts = new HashSet<Part>();

        for (Viewable viewable : viewables) {
            if (viewable instanceof Textual) {
                parts.add(((Textual) viewable).getPart());
            } else if (viewable instanceof Alternative) {
                Alternative alternative = (Alternative) viewable;
                parts.addAll(getParts(alternative.getText()));
                parts.addAll(getParts(alternative.getHtml()));
            }
        }

        return parts;
    }

    /**
     * Decide whether a part should be rendered inline as text.
     *
     * @return {@code true} if the part is {@code text/plain} or {@code text/html} and its
     *         Content-Disposition neither has the type "attachment" nor carries a filename
     *         parameter; {@code false} otherwise.
     *
     * @throws MessagingException
     *          If the disposition or MIME type of the part can't be retrieved.
     */
    private static boolean isPartTextualBody(Part part) throws MessagingException {
        String disposition = part.getDisposition();
        String dispositionType = null;
        String dispositionFilename = null;
        if (disposition != null) {
            dispositionType = MimeUtility.getHeaderParameter(disposition, null);
            dispositionFilename = MimeUtility.getHeaderParameter(disposition, "filename");
        }

        /*
         * A best guess that this part is intended to be an attachment and not inline.
         */
        boolean attachment = ("attachment".equalsIgnoreCase(dispositionType) || (dispositionFilename != null));
        if (attachment) {
            return false;
        }

        /*
         * Only text/html and text/plain are rendered inline; everything else will be included
         * as an attachment by the callers. Comparing literal-first means a part that reports no
         * MIME type simply doesn't match.
         */
        String mimeType = part.getMimeType();
        return "text/html".equalsIgnoreCase(mimeType) || "text/plain".equalsIgnoreCase(mimeType);
    }

    /**
     * Get the disposition type of a part, i.e. the value of its Content-Disposition header
     * without parameters.
     *
     * @return The disposition type, or {@code null} if the part has no disposition or it
     *         couldn't be retrieved.
     */
    private static String getContentDisposition(Part part) {
        try {
            String disposition = part.getDisposition();
            if (disposition != null) {
                return MimeUtility.getHeaderParameter(disposition, null);
            }
        } catch (MessagingException e) { /* ignore */ }
        return null;
    }
}
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`package com.fsck.k9.mail.internet;`

			`import android.util.Log;`

			`import com.fsck.k9.mail.Body;`
			`import com.fsck.k9.mail.BodyPart;`
			`import com.fsck.k9.mail.Message;`
			`import com.fsck.k9.mail.MessagingException;`
			`import com.fsck.k9.mail.Multipart;`
			`import com.fsck.k9.mail.Part;`

			`import java.io.IOException;`
			`import java.io.InputStream;`
			`import java.util.ArrayList;`
			`import java.util.HashSet;`
			`import java.util.List;`
			`import java.util.Set;`
			`import java.util.regex.Matcher;`
			`import java.util.regex.Pattern;`

break/centralize dependencies to K9 2014-12-16 06:51:52 -05:00			`import static com.fsck.k9.mail.K9MailLib.LOG_TAG;`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`import static com.fsck.k9.mail.internet.CharsetSupport.fixupCharset;`
			`import static com.fsck.k9.mail.internet.MimeUtility.getHeaderParameter;`
			`import static com.fsck.k9.mail.internet.Viewable.Alternative;`
Cleanup 2014-12-15 07:01:13 -05:00			`import static com.fsck.k9.mail.internet.Viewable.Html;`
			`import static com.fsck.k9.mail.internet.Viewable.MessageHeader;`
			`import static com.fsck.k9.mail.internet.Viewable.Text;`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`import static com.fsck.k9.mail.internet.Viewable.Textual;`

			`public class MessageExtractor {`
Remove unused method 2014-12-15 06:42:05 -05:00			`private MessageExtractor() {}`

MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`public static String getTextFromPart(Part part) {`
			`try {`
			`if ((part != null) && (part.getBody() != null)) {`
			`final Body body = part.getBody();`
			`if (body instanceof TextBody) {`
			`return ((TextBody)body).getText();`
			`}`

			`final String mimeType = part.getMimeType();`
			`if ((mimeType != null) && MimeUtility.mimeTypeMatches(mimeType, "text/*")) {`
			`/*`
			`* We've got a text part, so let's see if it needs to be processed further.`
			`*/`
			`String charset = getHeaderParameter(part.getContentType(), "charset");`
			`/*`
			`* determine the charset from HTML message.`
			`*/`
			`if (mimeType.equalsIgnoreCase("text/html") && charset == null) {`
Work around the BinaryTempFileBodyInputStream mess 2015-01-21 22:56:08 -05:00			`InputStream in = MimeUtility.decodeBody(body);`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`try {`
			`byte[] buf = new byte[256];`
			`in.read(buf, 0, buf.length);`
			`String str = new String(buf, "US-ASCII");`

			`if (str.isEmpty()) {`
			`return "";`
			`}`
			`Pattern p = Pattern.compile("<meta http-equiv=\"?Content-Type\"? content=\"text/html; charset=(.+?)\">", Pattern.CASE_INSENSITIVE);`
			`Matcher m = p.matcher(str);`
			`if (m.find()) {`
			`charset = m.group(1);`
			`}`
			`} finally {`
			`try {`
Work around the BinaryTempFileBodyInputStream mess 2015-01-21 22:56:08 -05:00			`MimeUtility.closeInputStreamWithoutDeletingTemporaryFiles(in);`
			`} catch (IOException e) { /* ignore */ }`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`}`
			`}`
			`charset = fixupCharset(charset, getMessageFromPart(part));`

			`/*`
			`* Now we read the part into a buffer for further processing. Because`
			`* the stream is now wrapped we'll remove any transfer encoding at this point.`
			`*/`
Properly decode the body in MessageExtractor.getTextFromPart() 2015-01-04 18:57:25 -05:00			`InputStream in = MimeUtility.decodeBody(body);`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`try {`
Work around the BinaryTempFileBodyInputStream mess 2015-01-21 22:56:08 -05:00			`return CharsetSupport.readToString(in, charset);`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`} finally {`
			`try {`
Work around the BinaryTempFileBodyInputStream mess 2015-01-21 22:56:08 -05:00			`MimeUtility.closeInputStreamWithoutDeletingTemporaryFiles(in);`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`} catch (IOException e) { /* Ignore */ }`
			`}`
			`}`
			`}`

			`} catch (OutOfMemoryError oom) {`
			`/*`
			`* If we are not able to process the body there's nothing we can do about it. Return`
			`* null and let the upper layers handle the missing content.`
			`*/`
break/centralize dependencies to K9 2014-12-16 06:51:52 -05:00			`Log.e(LOG_TAG, "Unable to getTextFromPart " + oom.toString());`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`} catch (Exception e) {`
			`/*`
			`* If we are not able to process the body there's nothing we can do about it. Return`
			`* null and let the upper layers handle the missing content.`
			`*/`
break/centralize dependencies to K9 2014-12-16 06:51:52 -05:00			`Log.e(LOG_TAG, "Unable to getTextFromPart", e);`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`}`
			`return null;`
			`}`


			`/**`
			`* Traverse the MIME tree of a message an extract viewable parts.`
			`*`
			`* @param part`
			`* The message part to start from.`
			`* @param attachments`
			`* A list that will receive the parts that are considered attachments.`
			`*`
			`* @return A list of {@link Viewable}s.`
			`*`
			`* @throws MessagingException`
			`* In case of an error.`
			`*/`
			`public static List<Viewable> getViewables(Part part, List<Part> attachments) throws MessagingException {`
			`List<Viewable> viewables = new ArrayList<Viewable>();`

			`Body body = part.getBody();`
			`if (body instanceof Multipart) {`
			`Multipart multipart = (Multipart) body;`
			`if (part.getMimeType().equalsIgnoreCase("multipart/alternative")) {`
			`/*`
			`* For multipart/alternative parts we try to find a text/plain and a text/html`
			`* child. Everything else we find is put into 'attachments'.`
			`*/`
			`List<Viewable> text = findTextPart(multipart, true);`

			`Set<Part> knownTextParts = getParts(text);`
			`List<Viewable> html = findHtmlPart(multipart, knownTextParts, attachments, true);`

			`if (!text.isEmpty() \|\| !html.isEmpty()) {`
			`Alternative alternative = new Alternative(text, html);`
			`viewables.add(alternative);`
			`}`
			`} else {`
			`// For all other multipart parts we recurse to grab all viewable children.`
			`for (Part bodyPart : multipart.getBodyParts()) {`
			`viewables.addAll(getViewables(bodyPart, attachments));`
			`}`
			`}`
			`} else if (body instanceof Message &&`
Remove unused method 2014-12-15 06:42:05 -05:00			`!("attachment".equalsIgnoreCase(getContentDisposition(part)))) {`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`/*`
			`* We only care about message/rfc822 parts whose Content-Disposition header has a value`
			`* other than "attachment".`
			`*/`
			`Message message = (Message) body;`

			`// We add the Message object so we can extract the filename later.`
Cleanup 2014-12-15 07:01:13 -05:00			`viewables.add(new MessageHeader(part, message));`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00
			`// Recurse to grab all viewable parts and attachments from that message.`
			`viewables.addAll(getViewables(message, attachments));`
			`} else if (isPartTextualBody(part)) {`
			`/*`
			`* Save text/plain and text/html`
			`*/`
			`String mimeType = part.getMimeType();`
			`if (mimeType.equalsIgnoreCase("text/plain")) {`
Cleanup 2014-12-15 07:01:13 -05:00			`Text text = new Text(part);`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`viewables.add(text);`
			`} else {`
Cleanup 2014-12-15 07:01:13 -05:00			`Html html = new Html(part);`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`viewables.add(html);`
			`}`
ignore application/pgp-signature parts for display 2015-01-30 07:19:53 -05:00			`} else if (part.getMimeType().equalsIgnoreCase("application/pgp-signature")) {`
			`// ignore this type explicitly`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`} else {`
			`// Everything else is treated as attachment.`
			`attachments.add(part);`
			`}`

			`return viewables;`
			`}`

			`public static Set<Part> getTextParts(Part part) throws MessagingException {`
			`List<Part> attachments = new ArrayList<Part>();`
			`return getParts(getViewables(part, attachments));`
			`}`

Revert adding methods to Message and Part 2014-12-15 23:40:44 -05:00			`/**`
			`* Collect attachment parts of a message.`
			`* @return A list of parts regarded as attachments.`
			`* @throws MessagingException In case of an error.`
			`*/`
			`public static List<Part> collectAttachments(Message message) throws MessagingException {`
			`try {`
			`List<Part> attachments = new ArrayList<Part>();`
			`getViewables(message, attachments);`
			`return attachments;`
			`} catch (Exception e) {`
			`throw new MessagingException("Couldn't collect attachment parts", e);`
			`}`
			`}`

			`/**`
			`* Collect the viewable textual parts of a message.`
			`* @return A set of viewable parts of the message.`
			`* @throws MessagingException In case of an error.`
			`*/`
			`public static Set<Part> collectTextParts(Message message) throws MessagingException {`
			`try {`
			`return getTextParts(message);`
			`} catch (Exception e) {`
			`throw new MessagingException("Couldn't extract viewable parts", e);`
			`}`
			`}`

MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`private static Message getMessageFromPart(Part part) {`
			`while (part != null) {`
			`if (part instanceof Message)`
			`return (Message)part;`

			`if (!(part instanceof BodyPart))`
			`return null;`

			`Multipart multipart = ((BodyPart)part).getParent();`
			`if (multipart == null)`
			`return null;`

			`part = multipart.getParent();`
			`}`
			`return null;`
			`}`

			`/**`
			`* Search the children of a {@link Multipart} for {@code text/plain} parts.`
			`*`
			`* @param multipart The {@code Multipart} to search through.`
			`* @param directChild If {@code true}, this method will return after the first {@code text/plain} was`
			`* found.`
			`*`
Cleanup 2014-12-15 07:01:13 -05:00			`* @return A list of {@link Text} viewables.`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`*`
			`* @throws MessagingException`
			`* In case of an error.`
			`*/`
			`private static List<Viewable> findTextPart(Multipart multipart, boolean directChild)`
			`throws MessagingException {`
			`List<Viewable> viewables = new ArrayList<Viewable>();`

			`for (Part part : multipart.getBodyParts()) {`
			`Body body = part.getBody();`
			`if (body instanceof Multipart) {`
			`Multipart innerMultipart = (Multipart) body;`

			`/*`
			`* Recurse to find text parts. Since this is a multipart that is a child of a`
			`* multipart/alternative we don't want to stop after the first text/plain part`
			`* we find. This will allow to get all text parts for constructions like this:`
			`*`
			`* 1. multipart/alternative`
			`* 1.1. multipart/mixed`
			`* 1.1.1. text/plain`
			`* 1.1.2. text/plain`
			`* 1.2. text/html`
			`*/`
			`List<Viewable> textViewables = findTextPart(innerMultipart, false);`

			`if (!textViewables.isEmpty()) {`
			`viewables.addAll(textViewables);`
			`if (directChild) {`
			`break;`
			`}`
			`}`
			`} else if (isPartTextualBody(part) && part.getMimeType().equalsIgnoreCase("text/plain")) {`
Cleanup 2014-12-15 07:01:13 -05:00			`Text text = new Text(part);`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`viewables.add(text);`
			`if (directChild) {`
			`break;`
			`}`
			`}`
			`}`
			`return viewables;`
			`}`

			`/**`
			`* Search the children of a {@link Multipart} for {@code text/html} parts.`
			`* Every part that is not a {@code text/html} we want to display, we add to 'attachments'.`
			`*`
			`* @param multipart The {@code Multipart} to search through.`
			`* @param knownTextParts A set of {@code text/plain} parts that shouldn't be added to 'attachments'.`
			`* @param attachments A list that will receive the parts that are considered attachments.`
			`* @param directChild If {@code true}, this method will add all {@code text/html} parts except the first`
			`* found to 'attachments'.`
			`*`
Cleanup 2014-12-15 07:01:13 -05:00			`* @return A list of {@link Text} viewables.`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`*`
			`* @throws MessagingException In case of an error.`
			`*/`
			`private static List<Viewable> findHtmlPart(Multipart multipart, Set<Part> knownTextParts,`
			`List<Part> attachments, boolean directChild) throws MessagingException {`
			`List<Viewable> viewables = new ArrayList<Viewable>();`

			`boolean partFound = false;`
			`for (Part part : multipart.getBodyParts()) {`
			`Body body = part.getBody();`
			`if (body instanceof Multipart) {`
			`Multipart innerMultipart = (Multipart) body;`

			`if (directChild && partFound) {`
			`// We already found our text/html part. Now we're only looking for attachments.`
			`findAttachments(innerMultipart, knownTextParts, attachments);`
			`} else {`
			`/*`
			`* Recurse to find HTML parts. Since this is a multipart that is a child of a`
			`* multipart/alternative we don't want to stop after the first text/html part`
			`* we find. This will allow to get all text parts for constructions like this:`
			`*`
			`* 1. multipart/alternative`
			`* 1.1. text/plain`
			`* 1.2. multipart/mixed`
			`* 1.2.1. text/html`
			`* 1.2.2. text/html`
			`* 1.3. image/jpeg`
			`*/`
			`List<Viewable> htmlViewables = findHtmlPart(innerMultipart, knownTextParts,`
			`attachments, false);`

			`if (!htmlViewables.isEmpty()) {`
			`partFound = true;`
			`viewables.addAll(htmlViewables);`
			`}`
			`}`
			`} else if (!(directChild && partFound) && isPartTextualBody(part) &&`
			`part.getMimeType().equalsIgnoreCase("text/html")) {`
Cleanup 2014-12-15 07:01:13 -05:00			`Html html = new Html(part);`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`viewables.add(html);`
			`partFound = true;`
			`} else if (!knownTextParts.contains(part)) {`
			`// Only add this part as attachment if it's not a viewable text/plain part found`
			`// earlier.`
			`attachments.add(part);`
			`}`
			`}`

			`return viewables;`
			`}`

			`/**`
			`* Traverse the MIME tree and add everything that's not a known text part to 'attachments'.`
			`*`
			`* @param multipart`
			`* The {@link Multipart} to start from.`
			`* @param knownTextParts`
			`* A set of known text parts we don't want to end up in 'attachments'.`
			`* @param attachments`
			`* A list that will receive the parts that are considered attachments.`
			`*/`
			`private static void findAttachments(Multipart multipart, Set<Part> knownTextParts,`
			`List<Part> attachments) {`
			`for (Part part : multipart.getBodyParts()) {`
			`Body body = part.getBody();`
			`if (body instanceof Multipart) {`
			`Multipart innerMultipart = (Multipart) body;`
			`findAttachments(innerMultipart, knownTextParts, attachments);`
			`} else if (!knownTextParts.contains(part)) {`
			`attachments.add(part);`
			`}`
			`}`
			`}`

			`/**`
			`* Build a set of message parts for fast lookups.`
			`*`
			`* @param viewables`
			`* A list of {@link Viewable}s containing references to the message parts to include in`
			`* the set.`
			`*`
			`* @return The set of viewable {@code Part}s.`
			`*`
Cleanup 2014-12-15 07:01:13 -05:00			`* @see MessageExtractor#findHtmlPart(Multipart, Set, List, boolean)`
			`* @see MessageExtractor#findAttachments(Multipart, Set, List)`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`*/`
			`private static Set<Part> getParts(List<Viewable> viewables) {`
			`Set<Part> parts = new HashSet<Part>();`

			`for (Viewable viewable : viewables) {`
			`if (viewable instanceof Textual) {`
			`parts.add(((Textual) viewable).getPart());`
			`} else if (viewable instanceof Alternative) {`
			`Alternative alternative = (Alternative) viewable;`
			`parts.addAll(getParts(alternative.getText()));`
			`parts.addAll(getParts(alternative.getHtml()));`
			`}`
			`}`

			`return parts;`
			`}`

			`private static Boolean isPartTextualBody(Part part) throws MessagingException {`
			`String disposition = part.getDisposition();`
			`String dispositionType = null;`
			`String dispositionFilename = null;`
			`if (disposition != null) {`
			`dispositionType = MimeUtility.getHeaderParameter(disposition, null);`
			`dispositionFilename = MimeUtility.getHeaderParameter(disposition, "filename");`
			`}`

			`/*`
			`* A best guess that this part is intended to be an attachment and not inline.`
			`*/`
			`boolean attachment = ("attachment".equalsIgnoreCase(dispositionType) \|\| (dispositionFilename != null));`

			`if ((!attachment) && (part.getMimeType().equalsIgnoreCase("text/html"))) {`
			`return true;`
			`}`
			`/*`
			`* If the part is plain text and it got this far it's part of a`
			`* mixed (et al) and should be rendered inline.`
			`*/`
			`else if ((!attachment) && (part.getMimeType().equalsIgnoreCase("text/plain"))) {`
			`return true;`
			`}`
			`/*`
			`* Finally, if it's nothing else we will include it as an attachment.`
			`*/`
			`else {`
			`return false;`
			`}`
			`}`
Remove unused method 2014-12-15 06:42:05 -05:00
WS / visibility 2014-12-15 06:45:04 -05:00			`private static String getContentDisposition(Part part) {`
Remove unused method 2014-12-15 06:42:05 -05:00			`try {`
			`String disposition = part.getDisposition();`
			`if (disposition != null) {`
			`return MimeUtility.getHeaderParameter(disposition, null);`
			`}`
			`} catch (MessagingException e) { /* ignore */ }`
			`return null;`
			`}`
MimeUtility / Message refactor * break MimeUtility class into manageable pieces (MessageExtractor/CharsetSupport) * move HTML related code out of the mail package 2014-12-15 06:05:21 -05:00			`}`