| /**************************************************************** |
| * Licensed to the Apache Software Foundation (ASF) under one * |
| * or more contributor license agreements. See the NOTICE file * |
| * distributed with this work for additional information * |
| * regarding copyright ownership. The ASF licenses this file * |
| * to you under the Apache License, Version 2.0 (the * |
| * "License"); you may not use this file except in compliance * |
| * with the License. You may obtain a copy of the License at * |
| * * |
| * http://www.apache.org/licenses/LICENSE-2.0 * |
| * * |
| * Unless required by applicable law or agreed to in writing, * |
| * software distributed under the License is distributed on an * |
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY * |
| * KIND, either express or implied. See the License for the * |
| * specific language governing permissions and limitations * |
| * under the License. * |
| ****************************************************************/ |
| |
| package org.apache.james.mime4j.parser; |
| |
| import org.apache.james.mime4j.MimeException; |
| import org.apache.james.mime4j.descriptor.BodyDescriptor; |
| |
| import java.io.IOException; |
| import java.io.InputStream; |
| |
| /** |
| * <p> |
| * Parses MIME (or RFC822) message streams of bytes or characters and reports |
| * parsing events to a <code>ContentHandler</code> instance. |
| * </p> |
| * <p> |
| * Typical usage:<br/> |
| * <pre> |
| * ContentHandler handler = new MyHandler(); |
| * MimeStreamParser parser = new MimeStreamParser(); |
| * parser.setContentHandler(handler); |
| * parser.parse(new FileInputStream("mime.msg")); |
| * </pre> |
| */ |
| public class MimeStreamParser { |
| |
| private ContentHandler handler = null; |
| private boolean contentDecoding; |
| |
| private final MimeTokenStream mimeTokenStream; |
| |
| public MimeStreamParser(final MimeEntityConfig config) { |
| super(); |
| MimeEntityConfig localConfig; |
| if (config != null) { |
| localConfig = config.clone(); |
| } else { |
| localConfig = new MimeEntityConfig(); |
| } |
| this.mimeTokenStream = new MimeTokenStream(localConfig); |
| this.contentDecoding = false; |
| } |
| |
| public MimeStreamParser() { |
| this(null); |
| } |
| |
| /** |
| * Determines whether this parser automatically decodes body content |
| * based on the on the MIME fields with the standard defaults. |
| */ |
| public boolean isContentDecoding() { |
| return contentDecoding; |
| } |
| |
| /** |
| * Defines whether parser should automatically decode body content |
| * based on the on the MIME fields with the standard defaults. |
| */ |
| public void setContentDecoding(boolean b) { |
| this.contentDecoding = b; |
| } |
| |
| /** |
| * Parses a stream of bytes containing a MIME message. |
| * |
| * @param is the stream to parse. |
| * @throws MimeException if the message can not be processed |
| * @throws IOException on I/O errors. |
| */ |
| public void parse(InputStream is) throws MimeException, IOException { |
| mimeTokenStream.parse(is); |
| OUTER: for (;;) { |
| int state = mimeTokenStream.getState(); |
| switch (state) { |
| case MimeTokenStream.T_BODY: |
| BodyDescriptor desc = mimeTokenStream.getBodyDescriptor(); |
| InputStream bodyContent; |
| if (contentDecoding) { |
| bodyContent = mimeTokenStream.getDecodedInputStream(); |
| } else { |
| bodyContent = mimeTokenStream.getInputStream(); |
| } |
| handler.body(desc, bodyContent); |
| break; |
| case MimeTokenStream.T_END_BODYPART: |
| handler.endBodyPart(); |
| break; |
| case MimeTokenStream.T_END_HEADER: |
| handler.endHeader(); |
| break; |
| case MimeTokenStream.T_END_MESSAGE: |
| handler.endMessage(); |
| break; |
| case MimeTokenStream.T_END_MULTIPART: |
| handler.endMultipart(); |
| break; |
| case MimeTokenStream.T_END_OF_STREAM: |
| break OUTER; |
| case MimeTokenStream.T_EPILOGUE: |
| handler.epilogue(mimeTokenStream.getInputStream()); |
| break; |
| case MimeTokenStream.T_FIELD: |
| handler.field(mimeTokenStream.getField()); |
| break; |
| case MimeTokenStream.T_PREAMBLE: |
| handler.preamble(mimeTokenStream.getInputStream()); |
| break; |
| case MimeTokenStream.T_RAW_ENTITY: |
| handler.raw(mimeTokenStream.getInputStream()); |
| break; |
| case MimeTokenStream.T_START_BODYPART: |
| handler.startBodyPart(); |
| break; |
| case MimeTokenStream.T_START_HEADER: |
| handler.startHeader(); |
| break; |
| case MimeTokenStream.T_START_MESSAGE: |
| handler.startMessage(); |
| break; |
| case MimeTokenStream.T_START_MULTIPART: |
| handler.startMultipart(mimeTokenStream.getBodyDescriptor()); |
| break; |
| default: |
| throw new IllegalStateException("Invalid state: " + state); |
| } |
| state = mimeTokenStream.next(); |
| } |
| } |
| |
| /** |
| * Determines if this parser is currently in raw mode. |
| * |
| * @return <code>true</code> if in raw mode, <code>false</code> |
| * otherwise. |
| * @see #setRaw(boolean) |
| */ |
| public boolean isRaw() { |
| return mimeTokenStream.isRaw(); |
| } |
| |
| /** |
| * Enables or disables raw mode. In raw mode all future entities |
| * (messages or body parts) in the stream will be reported to the |
| * {@link ContentHandler#raw(InputStream)} handler method only. |
| * The stream will contain the entire unparsed entity contents |
| * including header fields and whatever is in the body. |
| * |
| * @param raw <code>true</code> enables raw mode, <code>false</code> |
| * disables it. |
| */ |
| public void setRaw(boolean raw) { |
| mimeTokenStream.setRecursionMode(MimeTokenStream.M_RAW); |
| } |
| |
| /** |
| * Finishes the parsing and stops reading lines. |
| * NOTE: No more lines will be parsed but the parser |
| * will still call |
| * {@link ContentHandler#endMultipart()}, |
| * {@link ContentHandler#endBodyPart()}, |
| * {@link ContentHandler#endMessage()}, etc to match previous calls |
| * to |
| * {@link ContentHandler#startMultipart(BodyDescriptor)}, |
| * {@link ContentHandler#startBodyPart()}, |
| * {@link ContentHandler#startMessage()}, etc. |
| */ |
| public void stop() { |
| mimeTokenStream.stop(); |
| } |
| |
| /** |
| * Sets the <code>ContentHandler</code> to use when reporting |
| * parsing events. |
| * |
| * @param h the <code>ContentHandler</code>. |
| */ |
| public void setContentHandler(ContentHandler h) { |
| this.handler = h; |
| } |
| |
| } |