1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
|
using System;
using System.Collections.Generic;
using System.Linq;
using System.Text;
namespace IrcTokens
{
public class StatefulDecoder
{
private byte[] _buffer;
private Encoding _encoding;
private Encoding _fallback;
public Encoding Encoding
{
get => _encoding ?? Encoding.GetEncoding(Encoding.UTF8.CodePage, EncoderFallback.ExceptionFallback,
DecoderFallback.ExceptionFallback);
set
{
if (value != null)
_encoding = Encoding.GetEncoding(value.CodePage, EncoderFallback.ExceptionFallback,
DecoderFallback.ReplacementFallback);
}
}
public Encoding Fallback
{
get => _fallback ?? Encoding.GetEncoding(Encoding.GetEncoding("iso-8859-1").CodePage,
EncoderFallback.ExceptionFallback, DecoderFallback.ExceptionFallback);
set
{
if (value != null)
_encoding = Encoding.GetEncoding(value.CodePage, EncoderFallback.ReplacementFallback,
DecoderFallback.ReplacementFallback);
}
}
public string Pending => Encoding.GetString(_buffer);
public StatefulDecoder()
{
Clear();
}
public void Clear()
{
_buffer = Array.Empty<byte>();
}
public List<Line> Push(string data)
{
return Push(Encoding.GetBytes(data));
}
public List<Line> Push(byte[] data)
{
if (data == null || data.Length == 0)
return null;
_buffer = _buffer.Concat(data).ToArray();
// simulate string.Split('\n') before decoding
var newLineIndices = _buffer.Select((b, i) => b == '\n' ? i : -1).Where(i => i != -1).ToArray();
var lines = new List<byte[]>();
for (int i = 0, currentIndex = 0; i < newLineIndices.Length; ++i)
{
var n = new byte[newLineIndices[i] - currentIndex];
Array.Copy(_buffer, currentIndex, n, 0, newLineIndices[i] - currentIndex);
currentIndex = newLineIndices[i] + 1;
lines.Add(n);
}
var listLines = lines.Select(l => l.ToList()).ToList();
// simulate string.Trim('\r') before decoding
foreach (var line in listLines)
{
var i = 0;
while (line[i] == '\r')
{
line.RemoveAt(i);
i++;
}
i = line.Count - 1;
while (line[i] == '\r')
{
line.RemoveAt(i);
i--;
}
}
var decodeLines = new List<string>();
foreach (var line in listLines.Select(l => l.ToArray()))
{
try
{
decodeLines.Add(Encoding.GetString(line));
}
catch (DecoderFallbackException)
{
decodeLines.Add(Fallback.GetString(line));
}
}
return decodeLines
.Select(l => new Line(l))
.ToList();
}
}
}
|