about summary refs log tree commit diff
path: root/IrcTokens/StatefulDecoder.cs
blob: e094760724f35d288a32fa4642ada63cafd176fa (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
using System;
using System.Collections.Generic;
using System.Linq;
using System.Text;

namespace IrcTokens
{
    public class StatefulDecoder
    {
        private byte[] _buffer;
        private Encoding _encoding;
        private Encoding _fallback;

        public Encoding Encoding
        {
            get => _encoding ?? Encoding.UTF8;
            set => _encoding = value;
        }

        public Encoding Fallback
        {
            get => _fallback ?? Encoding.GetEncoding("iso-8859-1");
            set => _fallback = value;
        }

        public string Pending => Encoding.GetString(_buffer);

        public StatefulDecoder()
        {
            Clear();
        }

        public void Clear()
        {
            _buffer = Array.Empty<byte>();
        }

        public List<Line> Push(string data)
        {
            return Push(Encoding.GetBytes(data));
        }

        public List<Line> Push(byte[] data)
        {
            if (data == null || data.Length == 0)
                return null;

            _buffer = _buffer.Concat(data).ToArray();

            // simulate string.Split('\n') before decoding
            var newLineIndices = _buffer.Select((b, i) => b == '\n' ? i : -1).Where(i => i != -1).ToArray();
            var lines = new List<byte[]>();

            for (int i = 0, currentIndex = 0; i < newLineIndices.Length; ++i)
            {
                var n = new byte[newLineIndices[i] - currentIndex];
                Array.Copy(_buffer, currentIndex, n, 0, newLineIndices[i] - currentIndex);
                currentIndex = newLineIndices[i] + 1;
                lines.Add(n);
            }

            var listLines = lines.Select(l => l.ToList()).ToList();

            // simulate string.Trim('\r') before decoding
            foreach (var line in listLines)
            {
                var i = 0;
                while (line[i] == '\r')
                {
                    line.RemoveAt(i);
                    i++;
                }

                i = line.Count - 1;
                while (line[i] == '\r')
                {
                    line.RemoveAt(i);
                    i--;
                }
            }

            //_buffer = listLines.Last().ToArray();
            //listLines.RemoveAt(listLines.Count - 1);

            var decodeLines = new List<string>();
            foreach (var line in listLines.Select(l => l.ToArray()))
            {
                try
                {
                    decodeLines.Add(Encoding.GetString(line));
                }
                catch (DecoderFallbackException)
                {
                    decodeLines.Add(Fallback.GetString(line));
                }
            }

            return decodeLines
                .Select(l => new Line(l))
                .ToList();
        }
    }
}