##// END OF EJS Templates
Handle odd-sized base85 input and output
Brendan Cully -
r3288:e93c926e default
parent child Browse files
Show More
@@ -1,132 +1,155 b''
1 1 /*
2 2 base85 codec
3 3
4 4 Copyright 2006 Brendan Cully <brendan@kublai.com>
5 5
6 6 This software may be used and distributed according to the terms of
7 7 the GNU General Public License, incorporated herein by reference.
8 8
9 9 Largely based on git's implementation
10 10 */
11 11
12 12 #include <Python.h>
13 13
/* The 85 digits of the alphabet; a character's index is its digit value. */
static const char b85chars[] = "0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ"
	"abcdefghijklmnopqrstuvwxyz!#$%&()*+-;<=>?@^_`{|}~";

/*
 * Reverse lookup table, filled in by b85prep(): b85dec[byte] holds the
 * digit value plus one, or 0 when the byte is not a base85 digit.
 */
static char b85dec[256];

/*
 * Build the b85dec reverse table from b85chars.
 *
 * Every entry is first cleared to 0 ("not a digit"); then each alphabet
 * character is mapped to its index + 1 so that 0 stays reserved for
 * invalid bytes.
 */
static void
b85prep(void)
{
	unsigned int i;

	memset(b85dec, 0, sizeof(b85dec));
	/*
	 * sizeof(b85chars) also counts the string's terminating NUL.  Stop
	 * one short of it, otherwise byte 0 would be registered as a digit
	 * with the out-of-range value 85.
	 */
	for (i = 0; i < sizeof(b85chars) - 1; i++)
		b85dec[(unsigned char)b85chars[i]] = (char)(i + 1);
}
27 27
28 28 static PyObject *
29 29 b85encode(PyObject *self, PyObject *args)
30 30 {
31 31 const unsigned char *text;
32 32 PyObject *out;
33 33 char *dst;
34 34 int len, olen, i;
35 35 unsigned int acc, val, ch;
36 int pad = 0;
36 37
37 if (!PyArg_ParseTuple(args, "s#", &text, &len))
38 if (!PyArg_ParseTuple(args, "s#|i", &text, &len, &pad))
38 39 return NULL;
39 40
40 olen = (len + 3) / 4 * 5;
41 if (!(out = PyString_FromStringAndSize(NULL, olen)))
41 if (pad)
42 olen = ((len + 3) / 4 * 5) - 3;
43 else {
44 olen = len % 4;
45 if (olen)
46 olen++;
47 olen += len / 4 * 5;
48 }
49 if (!(out = PyString_FromStringAndSize(NULL, olen + 3)))
42 50 return NULL;
43 51
44 52 dst = PyString_AS_STRING(out);
45 53
46 while (len)
47 {
54 while (len) {
48 55 acc = 0;
49 56 for (i = 24; i >= 0; i -= 8) {
50 57 ch = *text++;
51 58 acc |= ch << i;
52 59 if (--len == 0)
53 60 break;
54 61 }
55 62 for (i = 4; i >= 0; i--) {
56 63 val = acc % 85;
57 64 acc /= 85;
58 65 dst[i] = b85chars[val];
59 66 }
60 67 dst += 5;
61 68 }
62 69
70 if (!pad)
71 _PyString_Resize(&out, olen);
72
63 73 return out;
64 74 }
65 75
66 76 static PyObject *
67 77 b85decode(PyObject *self, PyObject *args)
68 78 {
69 79 PyObject *out;
70 80 const char *text;
71 81 char *dst;
72 int len, i, j, olen, c;
82 int len, i, j, olen, c, cap;
73 83 unsigned int acc;
74 84
75 85 if (!PyArg_ParseTuple(args, "s#", &text, &len))
76 86 return NULL;
77 87
78 olen = (len + 4) / 5 * 4;
88 olen = len / 5 * 4;
89 i = len % 5;
90 if (i)
91 olen += i - 1;
79 92 if (!(out = PyString_FromStringAndSize(NULL, olen)))
80 93 return NULL;
81 94
82 95 dst = PyString_AS_STRING(out);
83 96
84 for (i = 1; len; i++)
97 i = 0;
98 while (i < len)
85 99 {
86 100 acc = 0;
87 for (j = 0; j < 4 && --len; j++)
101 cap = len - i - 1;
102 if (cap > 4)
103 cap = 4;
104 for (j = 0; j < cap; i++, j++)
88 105 {
89 106 c = b85dec[(int)*text++] - 1;
90 107 if (c < 0)
91 108 return PyErr_Format(PyExc_ValueError, "Bad base85 character at position %d", i);
92 109 acc = acc * 85 + c;
93 110 }
94 if (len--)
111 if (i++ < len)
95 112 {
96 113 c = b85dec[(int)*text++] - 1;
97 114 if (c < 0)
98 115 return PyErr_Format(PyExc_ValueError, "Bad base85 character at position %d", i);
99 }
100 else
101 c = 0;
102 116 /* overflow detection: 0xffffffff == "|NsC0",
103 117 * "|NsC" == 0x03030303 */
104 118 if (acc > 0x03030303 || (acc *= 85) > 0xffffffff - c)
105 119 return PyErr_Format(PyExc_ValueError, "Bad base85 sequence at position %d", i);
120 acc += c;
121 }
106 122
107 acc += c;
108
109 for (j = 0; j < 4; j++)
123 cap = olen < 4 ? olen : 4;
124 olen -= cap;
125 for (j = 0; j < 4 - cap; j++)
126 acc *= 85;
127 if (cap && cap < 4)
128 acc += 0xffffff >> (cap - 1) * 8;
129 for (j = 0; j < cap; j++)
110 130 {
111 131 acc = (acc << 8) | (acc >> 24);
112 *dst++ = (char)acc;
132 *dst++ = acc;
113 133 }
114 134 }
115 135
116 136 return out;
117 137 }
118 138
119 139 static char base85_doc[] = "Base85 Data Encoding";
120 140
121 141 static PyMethodDef methods[] = {
122 {"b85encode", b85encode, METH_VARARGS, "encode text in base85\n"},
123 {"b85decode", b85decode, METH_VARARGS, "decode base85 text\n"},
142 {"b85encode", b85encode, METH_VARARGS,
143 "Encode text in base85.\n\n"
144 "If the second parameter is true, pad the result to a multiple of "
145 "five characters.\n"},
146 {"b85decode", b85decode, METH_VARARGS, "Decode base85 text.\n"},
124 147 {NULL, NULL}
125 148 };
126 149
127 150 PyMODINIT_FUNC initbase85(void)
128 151 {
129 152 Py_InitModule3("base85", methods, base85_doc);
130 153
131 154 b85prep();
132 155 }
General Comments 0
You need to be logged in to leave comments. Login now