libubox
C utility functions for OpenWrt.
base64.c
Go to the documentation of this file.
1 /*
2  * base64 - libubox base64 functions
3  *
4  * Copyright (C) 2015 Felix Fietkau <nbd@openwrt.org>
5  *
6  * Permission to use, copy, modify, and/or distribute this software for any
7  * purpose with or without fee is hereby granted, provided that the above
8  * copyright notice and this permission notice appear in all copies.
9  *
10  * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
11  * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
12  * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
13  * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
14  * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
15  * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
16  * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
17  */
18 
19 /* $OpenBSD: base64.c,v 1.7 2013/12/31 02:32:56 tedu Exp $ */
20 
21 /*
22  * Copyright (c) 1996 by Internet Software Consortium.
23  *
24  * Permission to use, copy, modify, and distribute this software for any
25  * purpose with or without fee is hereby granted, provided that the above
26  * copyright notice and this permission notice appear in all copies.
27  *
28  * THE SOFTWARE IS PROVIDED "AS IS" AND INTERNET SOFTWARE CONSORTIUM DISCLAIMS
29  * ALL WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES
30  * OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL INTERNET SOFTWARE
31  * CONSORTIUM BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL
32  * DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
33  * PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS
34  * ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS
35  * SOFTWARE.
36  */
37 
38 /*
39  * Portions Copyright (c) 1995 by International Business Machines, Inc.
40  *
41  * International Business Machines, Inc. (hereinafter called IBM) grants
42  * permission under its copyrights to use, copy, modify, and distribute this
43  * Software with or without fee, provided that the above copyright notice and
44  * all paragraphs of this notice appear in all copies, and that the name of IBM
45  * not be used in connection with the marketing of any product incorporating
46  * the Software or modifications thereof, without specific, written prior
47  * permission.
48  *
49  * To the extent it has a right to do so, IBM grants an immunity from suit
50  * under its patents, if any, for the use, sale or manufacture of products to
51  * the extent that such products are used for performing Domain Name System
52  * dynamic updates in TCP/IP networks by means of the Software. No immunity is
53  * granted for any product per se or for any other function of any product.
54  *
55  * THE SOFTWARE IS PROVIDED "AS IS", AND IBM DISCLAIMS ALL WARRANTIES,
56  * INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
57  * PARTICULAR PURPOSE. IN NO EVENT SHALL IBM BE LIABLE FOR ANY SPECIAL,
58  * DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER ARISING
59  * OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE, EVEN
60  * IF IBM IS APPRISED OF THE POSSIBILITY OF SUCH DAMAGES.
61  */
62 
63 #include <sys/types.h>
64 #include <ctype.h>
65 #include <stdio.h>
66 #include <stdlib.h>
67 #include <string.h>
68 
69 #include "assert.h"
70 #include "utils.h"
71 
72 static const char Base64[] =
73  "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/";
74 static const char Pad64 = '=';
75 
76 /* (From RFC1521 and draft-ietf-dnssec-secext-03.txt)
77  The following encoding technique is taken from RFC 1521 by Borenstein
78  and Freed. It is reproduced here in a slightly edited form for
79  convenience.
80 
81  A 65-character subset of US-ASCII is used, enabling 6 bits to be
82  represented per printable character. (The extra 65th character, "=",
83  is used to signify a special processing function.)
84 
85  The encoding process represents 24-bit groups of input bits as output
86  strings of 4 encoded characters. Proceeding from left to right, a
87  24-bit input group is formed by concatenating 3 8-bit input groups.
88  These 24 bits are then treated as 4 concatenated 6-bit groups, each
89  of which is translated into a single digit in the base64 alphabet.
90 
91  Each 6-bit group is used as an index into an array of 64 printable
92  characters. The character referenced by the index is placed in the
93  output string.
94 
95  Table 1: The Base64 Alphabet
96 
97  Value Encoding Value Encoding Value Encoding Value Encoding
98  0 A 17 R 34 i 51 z
99  1 B 18 S 35 j 52 0
100  2 C 19 T 36 k 53 1
101  3 D 20 U 37 l 54 2
102  4 E 21 V 38 m 55 3
103  5 F 22 W 39 n 56 4
104  6 G 23 X 40 o 57 5
105  7 H 24 Y 41 p 58 6
106  8 I 25 Z 42 q 59 7
107  9 J 26 a 43 r 60 8
108  10 K 27 b 44 s 61 9
109  11 L 28 c 45 t 62 +
110  12 M 29 d 46 u 63 /
111  13 N 30 e 47 v
112  14 O 31 f 48 w (pad) =
113  15 P 32 g 49 x
114  16 Q 33 h 50 y
115 
116  Special processing is performed if fewer than 24 bits are available
117  at the end of the data being encoded. A full encoding quantum is
118  always completed at the end of a quantity. When fewer than 24 input
119  bits are available in an input group, zero bits are added (on the
120  right) to form an integral number of 6-bit groups. Padding at the
121  end of the data is performed using the '=' character.
122 
123  Since all base64 input is an integral number of octets, only the
124  -------------------------------------------------
125  following cases can arise:
126 
127  (1) the final quantum of encoding input is an integral
128  multiple of 24 bits; here, the final unit of encoded
129  output will be an integral multiple of 4 characters
130  with no "=" padding,
131  (2) the final quantum of encoding input is exactly 8 bits;
132  here, the final unit of encoded output will be two
133  characters followed by two "=" padding characters, or
134  (3) the final quantum of encoding input is exactly 16 bits;
135  here, the final unit of encoded output will be three
136  characters followed by one "=" padding character.
137  */
138 
139 int b64_encode(const void *_src, size_t srclength,
140  void *dest, size_t targsize)
141 {
142  const unsigned char *src = _src;
143  char *target = dest;
144  size_t datalength = 0;
145  u_char input[3] = {0};
146  u_char output[4];
147  size_t i;
148 
149  assert(dest && targsize > 0);
150 
151  while (2 < srclength) {
152  input[0] = *src++;
153  input[1] = *src++;
154  input[2] = *src++;
155  srclength -= 3;
156 
157  output[0] = input[0] >> 2;
158  output[1] = ((input[0] & 0x03) << 4) + (input[1] >> 4);
159  output[2] = ((input[1] & 0x0f) << 2) + (input[2] >> 6);
160  output[3] = input[2] & 0x3f;
161 
162  if (datalength + 4 > targsize)
163  return (-1);
164  target[datalength++] = Base64[output[0]];
165  target[datalength++] = Base64[output[1]];
166  target[datalength++] = Base64[output[2]];
167  target[datalength++] = Base64[output[3]];
168  }
169 
170  /* Now we worry about padding. */
171  if (0 != srclength) {
172  /* Get what's left. */
173  input[0] = input[1] = input[2] = '\0';
174  for (i = 0; i < srclength; i++)
175  input[i] = *src++;
176 
177  output[0] = input[0] >> 2;
178  output[1] = ((input[0] & 0x03) << 4) + (input[1] >> 4);
179  output[2] = ((input[1] & 0x0f) << 2) + (input[2] >> 6);
180 
181  if (datalength + 4 > targsize)
182  return (-1);
183  target[datalength++] = Base64[output[0]];
184  target[datalength++] = Base64[output[1]];
185  if (srclength == 1)
186  target[datalength++] = Pad64;
187  else
188  target[datalength++] = Base64[output[2]];
189  target[datalength++] = Pad64;
190  }
191  if (datalength >= targsize)
192  return (-1);
193  target[datalength] = '\0'; /* Returned value doesn't count \0. */
194  return (datalength);
195 }
196 
197 /* skips all whitespace anywhere.
198  converts characters, four at a time, starting at (or after)
199  src from base - 64 numbers into three 8 bit bytes in the target area.
200  it returns the number of data bytes stored at the target, or -1 on error.
201  */
202 
203 int b64_decode(const void *_src, void *dest, size_t targsize)
204 {
205  const char *src = _src;
206  unsigned char *target = dest;
207  int state, ch;
208  size_t tarindex;
209  u_char nextbyte;
210  char *pos;
211 
212  state = 0;
213  tarindex = 0;
214 
215  assert(dest && targsize > 0);
216 
217  while ((ch = (unsigned char)*src++) != '\0') {
218  if (isspace(ch)) /* Skip whitespace anywhere. */
219  continue;
220 
221  if (ch == Pad64)
222  break;
223 
224  pos = strchr(Base64, ch);
225  if (pos == 0) /* A non-base64 character. */
226  return (-1);
227 
228  switch (state) {
229  case 0:
230  if (target) {
231  if (tarindex >= targsize)
232  return (-1);
233  target[tarindex] = (pos - Base64) << 2;
234  }
235  state = 1;
236  break;
237  case 1:
238  if (target) {
239  if (tarindex >= targsize)
240  return (-1);
241  target[tarindex] |= (pos - Base64) >> 4;
242  nextbyte = ((pos - Base64) & 0x0f) << 4;
243  if (tarindex + 1 < targsize)
244  target[tarindex+1] = nextbyte;
245  else if (nextbyte)
246  return (-1);
247  }
248  tarindex++;
249  state = 2;
250  break;
251  case 2:
252  if (target) {
253  if (tarindex >= targsize)
254  return (-1);
255  target[tarindex] |= (pos - Base64) >> 2;
256  nextbyte = ((pos - Base64) & 0x03) << 6;
257  if (tarindex + 1 < targsize)
258  target[tarindex+1] = nextbyte;
259  else if (nextbyte)
260  return (-1);
261  }
262  tarindex++;
263  state = 3;
264  break;
265  case 3:
266  if (target) {
267  if (tarindex >= targsize)
268  return (-1);
269  target[tarindex] |= (pos - Base64);
270  }
271  tarindex++;
272  state = 0;
273  break;
274  }
275  }
276 
277  /*
278  * We are done decoding Base-64 chars. Let's see if we ended
279  * on a byte boundary, and/or with erroneous trailing characters.
280  */
281 
282  if (ch == Pad64) { /* We got a pad char. */
283  ch = (unsigned char)*src++; /* Skip it, get next. */
284  switch (state) {
285  case 0: /* Invalid = in first position */
286  case 1: /* Invalid = in second position */
287  return (-1);
288 
289  case 2: /* Valid, means one byte of info */
290  /* Skip any number of spaces. */
291  for (; ch != '\0'; ch = (unsigned char)*src++)
292  if (!isspace(ch))
293  break;
294  /* Make sure there is another trailing = sign. */
295  if (ch != Pad64)
296  return (-1);
297  ch = (unsigned char)*src++; /* Skip the = */
298  /* Fall through to "single trailing =" case. */
299  /* FALLTHROUGH */
300 
301  case 3: /* Valid, means two bytes of info */
302  /*
303  * We know this char is an =. Is there anything but
304  * whitespace after it?
305  */
306  for (; ch != '\0'; ch = (unsigned char)*src++)
307  if (!isspace(ch))
308  return (-1);
309 
310  /*
311  * Now make sure for cases 2 and 3 that the "extra"
312  * bits that slopped past the last full byte were
313  * zeros. If we don't check them, they become a
314  * subliminal channel.
315  */
316  if (target && tarindex < targsize &&
317  target[tarindex] != 0)
318  return (-1);
319  }
320  } else {
321  /*
322  * We ended by seeing the end of the string. Make sure we
323  * have no partial bytes lying around.
324  */
325  if (state != 0)
326  return (-1);
327  }
328 
329  /* Null-terminate if we have room left */
330  if (tarindex < targsize)
331  target[tarindex] = 0;
332 
333  return (tarindex);
334 }
int b64_encode(const void *_src, size_t srclength, void *dest, size_t targsize)
Definition: base64.c:139
static const char Base64[]
Definition: base64.c:72
static const char Pad64
Definition: base64.c:74
int b64_decode(const void *_src, void *dest, size_t targsize)
Definition: base64.c:203
static lua_State * state
Definition: uloop.c:54