SMTP: correct unescaping of posted messages containing lines with single dot.
1.1 --- a/src/org/sonews/daemon/command/PostCommand.java Sun Oct 30 22:15:49 2011 +0100
1.2 +++ b/src/org/sonews/daemon/command/PostCommand.java Sat Nov 05 00:06:09 2011 +0100
1.3 @@ -37,6 +37,7 @@
1.4 import org.sonews.storage.StorageManager;
1.5 import org.sonews.feed.FeedManager;
1.6 import org.sonews.util.Stats;
1.7 +import org.sonews.util.io.SMTPInputStream;
1.8
1.9 /**
1.10 * Implementation of the POST command. This command requires multiple lines
1.11 @@ -103,6 +104,7 @@
1.12 if ("".equals(line) || ".".equals(line)) {
1.13 // we finally met the blank line
1.14 // separating headers from body
1.15 + // WTF: "."
1.16
1.17 try {
1.18 // Parse the header using the InternetHeader class from JavaMail API
1.19 @@ -124,6 +126,7 @@
1.20
1.21 state = PostState.ReadingBody;
1.22
1.23 + // WTF: do we need articles without bodies?
1.24 if (".".equals(line)) {
1.25 // Post an article without body
1.26 postArticle(conn, article);
1.27 @@ -138,7 +141,7 @@
1.28 headers.setHeader(Headers.LINES, Integer.toString(lineCount));
1.29 headers.setHeader(Headers.BYTES, Long.toString(bodySize));
1.30
1.31 - byte[] body = bufBody.toByteArray();
1.32 + byte[] body = unescapeDots(bufBody.toByteArray());
1.33 if (body.length >= 2) {
1.34 // Remove trailing CRLF
1.35 body = Arrays.copyOf(body, body.length - 2);
1.36 @@ -213,7 +216,7 @@
1.37 if (conn.getUser() != null && conn.getUser().isAuthenticated()) {
1.38 article.setAuthenticatedUser(conn.getUser().getUserName());
1.39 }
1.40 -
1.41 +
1.42 if (article.getHeader(Headers.CONTROL)[0].length() > 0) {
1.43 controlMessage(conn, article);
1.44 } else if (article.getHeader(Headers.SUPERSEDES)[0].length() > 0) {
1.45 @@ -273,4 +276,27 @@
1.46 }
1.47 }
1.48 }
1.49 +
1.50 + /**
1.51 + * TODO: rework, integrate into NNTPConnection
1.52 + *
1.53 + * @param body message body with doubled dots
1.54 + * @return message body with unescaped dots (.. → .)
1.55 + */
1.56 + private static byte[] unescapeDots(byte[] body) throws IOException {
1.57 + byte[] result = new byte[body.length];
1.58 + int resultLength = 0;
1.59 +
1.60 + ByteArrayInputStream escapedInput = new ByteArrayInputStream(body);
1.61 + SMTPInputStream unescapedInput = new SMTPInputStream(escapedInput);
1.62 +
1.63 + int ch = unescapedInput.read();
1.64 + while (ch >= 0) {
1.65 + result[resultLength] = (byte) ch;
1.66 + resultLength++;
1.67 + ch = unescapedInput.read();
1.68 + }
1.69 +
1.70 + return Arrays.copyOfRange(result, 0, resultLength);
1.71 + }
1.72 }
2.1 --- /dev/null Thu Jan 01 00:00:00 1970 +0000
2.2 +++ b/src/org/sonews/util/io/SMTPInputStream.java Sat Nov 05 00:06:09 2011 +0100
2.3 @@ -0,0 +1,110 @@
2.4 +/*
2.5 + * SONEWS News Server
2.6 + * see AUTHORS for the list of contributors
2.7 + *
2.8 + * This program is free software: you can redistribute it and/or modify
2.9 + * it under the terms of the GNU General Public License as published by
2.10 + * the Free Software Foundation, either version 3 of the License, or
2.11 + * (at your option) any later version.
2.12 + *
2.13 + * This program is distributed in the hope that it will be useful,
2.14 + * but WITHOUT ANY WARRANTY; without even the implied warranty of
2.15 + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
2.16 + * GNU General Public License for more details.
2.17 + *
2.18 + * You should have received a copy of the GNU General Public License
2.19 + * along with this program. If not, see <http://www.gnu.org/licenses/>.
2.20 + */
2.21 +package org.sonews.util.io;
2.22 +
2.23 +import java.io.FilterInputStream;
2.24 +import java.io.IOException;
2.25 +import java.io.InputStream;
2.26 +
2.27 +/**
2.28 + * Filter input stream for reading from SMTP (or NNTP or similar) socket
2.29 + * where lines containing single dot have special meaning – end of message.
2.30 + *
2.31 + * @author František Kučera (frantovo.cz)
2.32 + */
2.33 +public class SMTPInputStream extends FilterInputStream {
2.34 +
2.35 + public static final int CR = 0x0d;
2.36 + public static final int LF = 0x0a;
2.37 + public static final int DOT = 0x2e;
2.38 + protected int last;
2.39 +
2.40 + public SMTPInputStream(InputStream in) {
2.41 + super(in);
2.42 + }
2.43 +
2.44 + /**
2.45 + * @return one byte as expected
2.46 + * or -2 if there was line with single dot (which means end of message)
2.47 + * @throws IOException
2.48 + */
2.49 + @Override
2.50 + public int read() throws IOException {
2.51 + // read current character
2.52 + int ch = super.read();
2.53 +
2.54 + if (ch == DOT) {
2.55 + if (last == LF) {
2.56 + int next = super.read();
2.57 +
2.58 + if (next == CR || next == LF) { // There should be CRLF, but we may accept also just LF or CR with missing LF. Or should we be more strict?
2.59 + // <CRLF>.<CRLF> → end of current message
2.60 + ch = -2;
2.61 + } else {
2.62 + // <CRLF>.… → eat one dot and return next character
2.63 + ch = next;
2.64 + }
2.65 + }
2.66 + }
2.67 +
2.68 + last = ch;
2.69 + return ch;
2.70 + }
2.71 +
2.72 + /**
2.73 + * @param buffer
2.74 + * @param offset
2.75 + * @param length
2.76 + * @return See {@link FilterInputStream#read(byte[], int, int)} or -2 (then see {@link #read(byte[])})
2.77 + * @throws IOException
2.78 + */
2.79 + @Override
2.80 + public int read(byte[] buffer, int offset, int length) throws IOException {
2.81 + if (buffer == null) {
2.82 + throw new NullPointerException("Byte array should not be null.");
2.83 + } else if ((offset < 0) || (offset > buffer.length) || (length < 0) || ((offset + length) > buffer.length) || ((offset + length) < 0)) {
2.84 + throw new IndexOutOfBoundsException("Invalid offset or length.");
2.85 + } else if (length == 0) {
2.86 + return 0;
2.87 + }
2.88 +
2.89 + int ch = read();
2.90 +
2.91 + if (ch == -1 || ch == -2) {
2.92 + return ch;
2.93 + }
2.94 +
2.95 + buffer[offset] = (byte) ch;
2.96 +
2.97 + int readCounter = 1;
2.98 +
2.99 + for (; readCounter < length; readCounter++) {
2.100 + ch = read();
2.101 +
2.102 + if (ch == -1 || ch == -2) {
2.103 + break;
2.104 + }
2.105 +
2.106 + if (buffer != null) {
2.107 + buffer[offset + readCounter] = (byte) ch;
2.108 + }
2.109 + }
2.110 +
2.111 + return readCounter;
2.112 + }
2.113 +}