hedgewars: comparison project_files/frontlib/base64/base64.c

equal deleted inserted replaced

-:6171f0bad318
+:f7b49b2c5d84
 /* base64.c -- Encode binary data using printable characters.
-Copyright (C) 1999, 2000, 2001, 2004, 2005, 2006 Free Software
+Copyright (C) 1999-2001, 2004-2006, 2009-2012 Free Software Foundation, Inc.
-Foundation, Inc.
 This program is free software; you can redistribute it and/or modify
 it under the terms of the GNU General Public License as published by
 the Free Software Foundation; either version 2, or (at your option)
 any later version.
 but WITHOUT ANY WARRANTY; without even the implied warranty of
 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 GNU General Public License for more details.
 You should have received a copy of the GNU General Public License
-along with this program; if not, write to the Free Software Foundation,
+along with this program; if not, see <http://www.gnu.org/licenses/>.  */
-Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.  */
 /* Written by Simon Josefsson.  Partially adapted from GNU MailUtils
 * (mailbox/filter_trans.c, as of 2004-11-28).  Improved by review
 * from Paul Eggert, Bruno Haible, and Stepan Kasal.
 *
-* See also RFC 3548 <http://www.ietf.org/rfc/rfc3548.txt>.
+* See also RFC 4648 <http://www.ietf.org/rfc/rfc4648.txt>.
 *
 * Be careful with error checking.  Here is how you would typically
 * use these functions:
 *
 * bool ok = base64_decode_alloc (in, inlen, &out, &outlen);
 #include <stdlib.h>
 /* Get UCHAR_MAX. */
 #include <limits.h>
+#include <string.h>
 /* C89 compliant way to cast 'char' to 'unsigned char'. */
 static inline unsigned char
 to_uchar (char ch)
 {
 return ch;
 If OUTLEN is less than BASE64_LENGTH(INLEN), write as many bytes as
 possible.  If OUTLEN is larger than BASE64_LENGTH(INLEN), also zero
 terminate the output buffer. */
 void
 base64_encode (const char *restrict in, size_t inlen,
-	       char *restrict out, size_t outlen)
+char *restrict out, size_t outlen)
 {
 static const char b64str[64] =
 "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/";
 while (inlen && outlen)
 {
 *out++ = b64str[(to_uchar (in[0]) >> 2) & 0x3f];
 if (!--outlen)
-	break;
+break;
 *out++ = b64str[((to_uchar (in[0]) << 4)
-		       + (--inlen ? to_uchar (in[1]) >> 4 : 0))
++ (--inlen ? to_uchar (in[1]) >> 4 : 0))
-		      & 0x3f];
+& 0x3f];
 if (!--outlen)
-	break;
+break;
 *out++ =
-	(inlen
+(inlen
-	 ? b64str[((to_uchar (in[1]) << 2)
+? b64str[((to_uchar (in[1]) << 2)
-		   + (--inlen ? to_uchar (in[2]) >> 6 : 0))
++ (--inlen ? to_uchar (in[2]) >> 6 : 0))
-		  & 0x3f]
+& 0x3f]
-	 : '=');
+: '=');
 if (!--outlen)
-	break;
+break;
 *out++ = inlen ? b64str[to_uchar (in[2]) & 0x3f] : '=';
 if (!--outlen)
-	break;
+break;
 if (inlen)
-	inlen--;
+inlen--;
 if (inlen)
-	in += 3;
+in += 3;
 }
 if (outlen)
 *out = '\0';
 }
 quantities, though, taking care of that problem.  But this may be a
 potential problem on non-POSIX C99 platforms.
 IBM C V6 for AIX mishandles "#define B64(x) ...'x'...", so use "_"
 as the formal parameter rather than "x".  */
-#define B64(_)					\
+#define B64(_)                                  \
-((_) == 'A' ? 0				\
+((_) == 'A' ? 0                               \
-: (_) == 'B' ? 1				\
+: (_) == 'B' ? 1                             \
-: (_) == 'C' ? 2				\
+: (_) == 'C' ? 2                             \
-: (_) == 'D' ? 3				\
+: (_) == 'D' ? 3                             \
-: (_) == 'E' ? 4				\
+: (_) == 'E' ? 4                             \
-: (_) == 'F' ? 5				\
+: (_) == 'F' ? 5                             \
-: (_) == 'G' ? 6				\
+: (_) == 'G' ? 6                             \
-: (_) == 'H' ? 7				\
+: (_) == 'H' ? 7                             \
-: (_) == 'I' ? 8				\
+: (_) == 'I' ? 8                             \
-: (_) == 'J' ? 9				\
+: (_) == 'J' ? 9                             \
-: (_) == 'K' ? 10				\
+: (_) == 'K' ? 10                            \
-: (_) == 'L' ? 11				\
+: (_) == 'L' ? 11                            \
-: (_) == 'M' ? 12				\
+: (_) == 'M' ? 12                            \
-: (_) == 'N' ? 13				\
+: (_) == 'N' ? 13                            \
-: (_) == 'O' ? 14				\
+: (_) == 'O' ? 14                            \
-: (_) == 'P' ? 15				\
+: (_) == 'P' ? 15                            \
-: (_) == 'Q' ? 16				\
+: (_) == 'Q' ? 16                            \
-: (_) == 'R' ? 17				\
+: (_) == 'R' ? 17                            \
-: (_) == 'S' ? 18				\
+: (_) == 'S' ? 18                            \
-: (_) == 'T' ? 19				\
+: (_) == 'T' ? 19                            \
-: (_) == 'U' ? 20				\
+: (_) == 'U' ? 20                            \
-: (_) == 'V' ? 21				\
+: (_) == 'V' ? 21                            \
-: (_) == 'W' ? 22				\
+: (_) == 'W' ? 22                            \
-: (_) == 'X' ? 23				\
+: (_) == 'X' ? 23                            \
-: (_) == 'Y' ? 24				\
+: (_) == 'Y' ? 24                            \
-: (_) == 'Z' ? 25				\
+: (_) == 'Z' ? 25                            \
-: (_) == 'a' ? 26				\
+: (_) == 'a' ? 26                            \
-: (_) == 'b' ? 27				\
+: (_) == 'b' ? 27                            \
-: (_) == 'c' ? 28				\
+: (_) == 'c' ? 28                            \
-: (_) == 'd' ? 29				\
+: (_) == 'd' ? 29                            \
-: (_) == 'e' ? 30				\
+: (_) == 'e' ? 30                            \
-: (_) == 'f' ? 31				\
+: (_) == 'f' ? 31                            \
-: (_) == 'g' ? 32				\
+: (_) == 'g' ? 32                            \
-: (_) == 'h' ? 33				\
+: (_) == 'h' ? 33                            \
-: (_) == 'i' ? 34				\
+: (_) == 'i' ? 34                            \
-: (_) == 'j' ? 35				\
+: (_) == 'j' ? 35                            \
-: (_) == 'k' ? 36				\
+: (_) == 'k' ? 36                            \
-: (_) == 'l' ? 37				\
+: (_) == 'l' ? 37                            \
-: (_) == 'm' ? 38				\
+: (_) == 'm' ? 38                            \
-: (_) == 'n' ? 39				\
+: (_) == 'n' ? 39                            \
-: (_) == 'o' ? 40				\
+: (_) == 'o' ? 40                            \
-: (_) == 'p' ? 41				\
+: (_) == 'p' ? 41                            \
-: (_) == 'q' ? 42				\
+: (_) == 'q' ? 42                            \
-: (_) == 'r' ? 43				\
+: (_) == 'r' ? 43                            \
-: (_) == 's' ? 44				\
+: (_) == 's' ? 44                            \
-: (_) == 't' ? 45				\
+: (_) == 't' ? 45                            \
-: (_) == 'u' ? 46				\
+: (_) == 'u' ? 46                            \
-: (_) == 'v' ? 47				\
+: (_) == 'v' ? 47                            \
-: (_) == 'w' ? 48				\
+: (_) == 'w' ? 48                            \
-: (_) == 'x' ? 49				\
+: (_) == 'x' ? 49                            \
-: (_) == 'y' ? 50				\
+: (_) == 'y' ? 50                            \
-: (_) == 'z' ? 51				\
+: (_) == 'z' ? 51                            \
-: (_) == '0' ? 52				\
+: (_) == '0' ? 52                            \
-: (_) == '1' ? 53				\
+: (_) == '1' ? 53                            \
-: (_) == '2' ? 54				\
+: (_) == '2' ? 54                            \
-: (_) == '3' ? 55				\
+: (_) == '3' ? 55                            \
-: (_) == '4' ? 56				\
+: (_) == '4' ? 56                            \
-: (_) == '5' ? 57				\
+: (_) == '5' ? 57                            \
-: (_) == '6' ? 58				\
+: (_) == '6' ? 58                            \
-: (_) == '7' ? 59				\
+: (_) == '7' ? 59                            \
-: (_) == '8' ? 60				\
+: (_) == '8' ? 60                            \
-: (_) == '9' ? 61				\
+: (_) == '9' ? 61                            \
-: (_) == '+' ? 62				\
+: (_) == '+' ? 62                            \
-: (_) == '/' ? 63				\
+: (_) == '/' ? 63                            \
 : -1)
 static const signed char b64[0x100] = {
 B64 (0), B64 (1), B64 (2), B64 (3),
 B64 (4), B64 (5), B64 (6), B64 (7),
 isbase64 (char ch)
 {
 return uchar_in_range (to_uchar (ch)) && 0 <= b64[to_uchar (ch)];
 }
-/* Decode base64 encoded input array IN of length INLEN to output
+/* Initialize decode-context buffer, CTX.  */
-array OUT that can hold *OUTLEN bytes.  Return true if decoding was
+void
-successful, i.e. if the input was valid base64 data, false
+base64_decode_ctx_init (struct base64_decode_context *ctx)
-otherwise.  If *OUTLEN is too small, as many bytes as possible will
+{
-be written to OUT.  On return, *OUTLEN holds the length of decoded
+ctx->i = 0;
-bytes in OUT.  Note that as soon as any non-alphabet characters are
+}
-encountered, decoding is stopped and false is returned.  This means
-that, when applicable, you must remove any line terminators that is
+/* If CTX->i is 0 or 4, there are four or more bytes in [*IN..IN_END), and
-part of the data stream before calling this function.  */
+none of those four is a newline, then return *IN.  Otherwise, copy up to
+4 - CTX->i non-newline bytes from that range into CTX->buf, starting at
+index CTX->i and setting CTX->i to reflect the number of bytes copied,
+and return CTX->buf.  In either case, advance *IN to point to the byte
+after the last one processed, and set *N_NON_NEWLINE to the number of
+verified non-newline bytes accessible through the returned pointer.  */
+static inline char *  /* Fetch the next group of up to four non-newline input bytes.  */
+get_4 (struct base64_decode_context *ctx,
+char const *restrict *in, char const *restrict in_end,
+size_t *n_non_newline)
+{
+if (ctx->i == 4)  /* A count of 4 is treated like an empty buffer: restart at index 0.  */
+ctx->i = 0;
+if (ctx->i == 0)  /* Nothing is buffered, so the input may be usable in place.  */
+{
+char const *t = *in;
+if (4 <= in_end - *in && memchr (t, '\n', 4) == NULL)
+{
+/* This is the common case: no newline.  */
+*in += 4;
+*n_non_newline = 4;
+return (char *) t;  /* Points into the caller's input; CTX->buf and CTX->i are not modified on this path.  */
+}
+}
+{
+/* Copy non-newline bytes into BUF.  */
+char const *p = *in;
+while (p < in_end)  /* Ends at IN_END, or earlier via the break once CTX->i reaches 4.  */
+{
+char c = *p++;
+if (c != '\n')  /* Newlines are consumed from the input but never stored.  */
+{
+ctx->buf[ctx->i++] = c;
+if (ctx->i == 4)
+break;
+}
+}
+*in = p;  /* Every byte before P, skipped newlines included, counts as processed.  */
+*n_non_newline = ctx->i;  /* Includes any bytes that were already in CTX->buf on entry.  */
+return ctx->buf;
+}
+}
+#define return_false  /* Failure exit that first stores the local OUT back into *OUTP.  */ \
+do  /* do ... while (false) makes the expansion behave as one statement.  */ \
+{                                           \
+*outp = out;  /* Expects locals named out and outp at the point of use.  */ \
+return false;                             \
+}                                           \
+while (false)
+/* Decode up to four bytes of base64-encoded data, IN, of length INLEN
+into the output buffer, *OUTP, which has room for *OUTLEFT bytes.  Return
+true if decoding is successful, false otherwise.  If *OUTLEFT is too
+small, as many bytes as possible are written to *OUTP.  On return,
+advance *OUTP to point to the byte after the last one written, and
+decrement *OUTLEFT to reflect the number of bytes remaining in *OUTP.  */
+static inline bool  /* Decode one group of at most four base64 characters.  */
+decode_4 (char const *restrict in, size_t inlen,
+char *restrict *outp, size_t *outleft)
+{
+char *out = *outp;  /* Local write cursor; stored back through OUTP on the paths below.  */
+if (inlen < 2)
+return false;  /* Nothing has been written yet, so *OUTP needs no update.  */
+if (!isbase64 (in[0]) || !isbase64 (in[1]))
+return false;
+if (*outleft)  /* With no room left the byte is dropped, but validation continues.  */
+{
+*out++ = ((b64[to_uchar (in[0])] << 2)
+| (b64[to_uchar (in[1])] >> 4));  /* Byte 1: value of in[0] shifted up 2, plus the top bits of in[1].  */
+--*outleft;
+}
+if (inlen == 2)  /* Input stops after two characters: report failure, keeping the byte written above.  */
+return_false;
+if (in[2] == '=')  /* Padding in position 3 must be followed by padding in position 4.  */
+{
+if (inlen != 4)  /* A padded group is accepted only when INLEN is exactly 4.  */
+return_false;
+if (in[3] != '=')
+return_false;
+}
+else
+{
+if (!isbase64 (in[2]))
+return_false;
+if (*outleft)
+{
+*out++ = (((b64[to_uchar (in[1])] << 4) & 0xf0)
+| (b64[to_uchar (in[2])] >> 2));  /* Byte 2: low 4 bits of in[1], then in[2] shifted down 2.  */
+--*outleft;
+}
+if (inlen == 3)  /* Input stops after three characters: report failure.  */
+return_false;
+if (in[3] == '=')  /* Single trailing pad: no third byte is produced.  */
+{
+if (inlen != 4)  /* Same rule as above: padding requires INLEN to be exactly 4.  */
+return_false;
+}
+else
+{
+if (!isbase64 (in[3]))
+return_false;
+if (*outleft)
+{
+*out++ = (((b64[to_uchar (in[2])] << 6) & 0xc0)
+| b64[to_uchar (in[3])]);  /* Byte 3: low 2 bits of in[2], then all of in[3].  */
+--*outleft;
+}
+}
+}
+*outp = out;  /* Success: publish the advanced write position.  */
+return true;
+}
+/* Decode base64-encoded input array IN of length INLEN to output array
+OUT that can hold *OUTLEN bytes.  The input data may be interspersed
+with newlines.  Return true if decoding was successful, i.e. if the
+input was valid base64 data, false otherwise.  If *OUTLEN is too
+small, as many bytes as possible will be written to OUT.  On return,
+*OUTLEN holds the length of decoded bytes in OUT.  Note that as soon
+as any non-alphabet, non-newline character is encountered, decoding
+is stopped and false is returned.  If INLEN is zero, then process
+only whatever data is stored in CTX.
+Initially, CTX must have been initialized via base64_decode_ctx_init.
+Subsequent calls to this function must reuse whatever state is recorded
+in CTX.  That state is needed when a quadruple of base64 input
+bytes spans two input buffers.
+If CTX is NULL then newlines are treated as garbage and the input
+buffer is processed as a unit.  */
 bool
-base64_decode (const char *restrict in, size_t inlen,
+base64_decode_ctx (struct base64_decode_context *ctx,
-	       char *restrict out, size_t *outlen)
+const char *restrict in, size_t inlen,
+char *restrict out, size_t *outlen)
 {
 size_t outleft = *outlen;
+bool ignore_newlines = ctx != NULL;
-while (inlen >= 2)
+bool flush_ctx = false;
-{
+unsigned int ctx_i = 0;
-if (!isbase64 (in[0]) || !isbase64 (in[1]))
-	break;
+if (ignore_newlines)
+{
-if (outleft)
+ctx_i = ctx->i;
-	{
+flush_ctx = inlen == 0;
-	  *out++ = ((b64[to_uchar (in[0])] << 2)
+}
-		    | (b64[to_uchar (in[1])] >> 4));
-	  outleft--;
-	}
+while (true)
+{
-if (inlen == 2)
+size_t outleft_save = outleft;
-	break;
+if (ctx_i == 0 && !flush_ctx)
+{
-if (in[2] == '=')
+while (true)
-	{
+{
-	  if (inlen != 4)
+/* Save a copy of outleft, in case we need to re-parse this
-	    break;
+block of four bytes.  */
+outleft_save = outleft;
-	  if (in[3] != '=')
+if (!decode_4 (in, inlen, &out, &outleft))
-	    break;
+break;
-	}
+in += 4;
-else
+inlen -= 4;
-	{
+}
-	  if (!isbase64 (in[2]))
+}
-	    break;
+if (inlen == 0 && !flush_ctx)
-	  if (outleft)
+break;
-	    {
-	      *out++ = (((b64[to_uchar (in[1])] << 4) & 0xf0)
+/* Handle the common case of 72-byte wrapped lines.
-			| (b64[to_uchar (in[2])] >> 2));
+This also handles any other multiple-of-4-byte wrapping.  */
-	      outleft--;
+if (inlen && *in == '\n' && ignore_newlines)
-	    }
+{
+++in;
-	  if (inlen == 3)
+--inlen;
-	    break;
+continue;
+}
-	  if (in[3] == '=')
-	    {
+/* Restore OUT and OUTLEFT.  */
-	      if (inlen != 4)
+out -= outleft_save - outleft;
-		break;
+outleft = outleft_save;
-	    }
-	  else
+{
-	    {
+char const *in_end = in + inlen;
-	      if (!isbase64 (in[3]))
+char const *non_nl;
-		break;
+if (ignore_newlines)
-	      if (outleft)
+non_nl = get_4 (ctx, &in, in_end, &inlen);
-		{
+else
-		  *out++ = (((b64[to_uchar (in[2])] << 6) & 0xc0)
+non_nl = in;  /* Might have nl in this case. */
-			    | b64[to_uchar (in[3])]);
-		  outleft--;
+/* If the input is empty or consists solely of newlines (0 non-newlines),
-		}
+then we're done.  Likewise if there are fewer than 4 bytes when not
-	    }
+flushing context and not treating newlines as garbage.  */
-	}
+if (inlen == 0 || (inlen < 4 && !flush_ctx && ignore_newlines))
+{
-in += 4;
+inlen = 0;
-inlen -= 4;
+break;
+}
+if (!decode_4 (non_nl, inlen, &out, &outleft))
+break;
+inlen = in_end - in;
+}
 }
 *outlen -= outleft;
-if (inlen != 0)
+return inlen == 0;
-return false;
-return true;
 }
 /* Allocate an output buffer in *OUT, and decode the base64 encoded
 data stored in IN of size INLEN to the *OUT buffer.  On return, the
 size of the decoded data is stored in *OUTLEN.  OUTLEN may be NULL,
 *OUT and *OUTLEN parameters to differentiate between successful
 decoding and memory error.)  The function returns false if the
 input was invalid, in which case *OUT is NULL and *OUTLEN is
 undefined. */
 bool
-base64_decode_alloc (const char *in, size_t inlen, char **out,
+base64_decode_alloc_ctx (struct base64_decode_context *ctx,
-		     size_t *outlen)
+const char *in, size_t inlen, char **out,
-{
+size_t *outlen)
-/* This may allocate a few bytes too much, depending on input,
+{
-but it's not worth the extra CPU time to compute the exact amount.
+/* This may allocate a few bytes too many, depending on input,
-The exact amount is 3 * inlen / 4, minus 1 if the input ends
+but it's not worth the extra CPU time to compute the exact size.
-with "=" and minus another 1 if the input ends with "==".
+The exact size is 3 * (inlen + (ctx ? ctx->i : 0)) / 4, minus 1 if the
+input ends with "=" and minus another 1 if the input ends with "==".
 Dividing before multiplying avoids the possibility of overflow.  */
-size_t needlen = 3 * (inlen / 4) + 2;
+size_t needlen = 3 * (inlen / 4) + 3;
 *out = malloc (needlen);
 if (!*out)
 return true;
-if (!base64_decode (in, inlen, *out, &needlen))
+if (!base64_decode_ctx (ctx, in, inlen, *out, &needlen))
 {
 free (*out);
 *out = NULL;
 return false;
 }

changeset 7316	f7b49b2c5d84
parent 7271	5608ac657362