-
Notifications
You must be signed in to change notification settings - Fork 9
/
Copy pathBase36.cs
202 lines (180 loc) · 6.98 KB
/
Base36.cs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
using System;
using System.Linq;
using System.Numerics;
using System.Text;
namespace Ipfs
{
/// <summary>
/// A codec for Base-36.
/// </summary>
/// <remarks>
/// <para>
/// Provides encoding and decoding functionality for Base-36, with methods <see cref="EncodeToStringUc"/> and <see cref="EncodeToStringLc"/> for encoding,
/// and <see cref="DecodeString"/> for decoding. The encoding methods offer both uppercase and lowercase options.
/// </para>
/// <para>
/// The implementation is case-insensitive for decoding and allows for efficient conversion between byte arrays and Base-36 strings.
/// </para>
/// <para>
/// Ported from https://github.com/multiformats/go-base36/blob/v0.2.0/base36.go
/// </para>
/// </remarks>
public static class Base36
{
// Constants for the encoding alphabets
private const string UcAlphabet = "0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ";
private const string LcAlphabet = "0123456789abcdefghijklmnopqrstuvwxyz";
private const int MaxDigitOrdinal = 'z';
private const byte MaxDigitValueB36 = 35;
// Reverse lookup table for decoding
private static readonly byte[] RevAlphabet = new byte[MaxDigitOrdinal + 1];
// Static constructor to initialize the reverse lookup table
static Base36()
{
// Initialize the reverse alphabet array with default values
for (int i = 0; i < RevAlphabet.Length; i++)
{
RevAlphabet[i] = MaxDigitValueB36 + 1;
}
// Populate the reverse alphabet array for decoding
for (int i = 0; i < UcAlphabet.Length; i++)
{
char c = UcAlphabet[i];
RevAlphabet[c] = (byte)i;
if (c > '9')
{
RevAlphabet[char.ToLower(c)] = (byte)i;
}
}
}
/// <summary>
/// Encodes a byte array to a Base-36 string using uppercase characters.
/// </summary>
/// <param name="bytes">
/// The byte array to encode.
/// </param>
/// <returns>
/// The encoded Base-36 string in uppercase.
/// </returns>
public static string EncodeToStringUc(byte[] bytes) => Encode(bytes, UcAlphabet);
/// <summary>
/// Encodes a byte array to a Base-36 string using lowercase characters.
/// </summary>
/// <param name="bytes">
/// The byte array to encode.
/// </param>
/// <returns>
/// The encoded Base-36 string in lowercase.
/// </returns>
public static string EncodeToStringLc(byte[] bytes) => Encode(bytes, LcAlphabet);
// Core encoding logic for Base-36 conversion
private static string Encode(byte[] input, string alphabet)
{
int zeroCount = 0;
while (zeroCount < input.Length && input[zeroCount] == 0)
{
zeroCount++;
}
int size = zeroCount + (input.Length - zeroCount) * 277 / 179 + 1;
byte[] buffer = new byte[size];
int index, stopIndex;
uint carry;
stopIndex = size - 1;
for (int i = zeroCount; i < input.Length; i++)
{
index = size - 1;
carry = input[i];
while (index > stopIndex || carry != 0)
{
carry += (uint)(buffer[index]) * 256;
buffer[index] = (byte)(carry % 36);
carry /= 36;
index--;
}
stopIndex = index;
}
// The purpose of this loop is to skip over the portion of the buffer that contains only zeros (after accounting for any leading zeros in the original input).
// This is important for the encoding process, as these leading zeros are not represented in the base-36 encoded string.
for (stopIndex = zeroCount; stopIndex < size && buffer[stopIndex] == 0; stopIndex++)
{
}
// Once the first non-zero byte is found, the actual encoding of the non-zero part of the buffer can begin.
byte[] valueBuffer = new byte[buffer.Length - (stopIndex - zeroCount)];
for (int i = 0; i < valueBuffer.Length; i++)
{
valueBuffer[i] = (byte)alphabet[buffer[stopIndex - zeroCount + i]];
}
return Encoding.ASCII.GetString(valueBuffer);
}
/// <summary>
/// Decodes a Base-36 encoded string to a byte array.
/// </summary>
/// <param name="s">
/// The Base-36 encoded string to decode.
/// </param>
/// <returns>
/// The decoded byte array.
/// </returns>
/// <exception cref="ArgumentException">
/// Thrown if the input string is null or empty.
/// </exception>
/// <exception cref="FormatException">
/// Thrown if the input string contains characters not valid in Base-36.
/// </exception>
public static byte[] DecodeString(string s)
{
if (string.IsNullOrEmpty(s))
{
return Array.Empty<byte>();
}
int zeroCount = 0;
while (zeroCount < s.Length && s[zeroCount] == '0')
{
zeroCount++;
}
byte[] binu = new byte[2 * ((s.Length) * 179 / 277 + 1)];
uint[] outi = new uint[(s.Length + 3) / 4];
foreach (char r in s)
{
if (r > MaxDigitOrdinal || RevAlphabet[r] > MaxDigitValueB36)
{
throw new FormatException($"Invalid base36 character ({r}).");
}
ulong c = RevAlphabet[r];
for (int j = outi.Length - 1; j >= 0; j--)
{
ulong t = (ulong)outi[j] * 36 + c;
c = (t >> 32);
outi[j] = (uint)(t & 0xFFFFFFFF);
}
}
uint mask = (uint)((s.Length % 4) * 8);
if (mask == 0)
{
mask = 32;
}
mask -= 8;
int outIndex = 0;
for (int j = 0; j < outi.Length; j++)
{
for (; mask < 32; mask -= 8)
{
binu[outIndex] = (byte)(outi[j] >> (int)mask);
outIndex++;
}
mask = 24;
}
for (int msb = zeroCount; msb < outIndex; msb++)
{
if (binu[msb] > 0)
{
int lengthToCopy = outIndex - msb;
byte[] result = new byte[lengthToCopy];
Array.Copy(binu, msb, result, 0, lengthToCopy);
return result;
}
}
return new byte[outIndex - zeroCount];
}
}
}