-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathFileEncoder.cs
More file actions
83 lines (68 loc) · 2.42 KB
/
FileEncoder.cs
File metadata and controls
83 lines (68 loc) · 2.42 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
using System;
using System.Collections.Generic;
using System.IO;
using System.Linq;
using System.Text;
namespace NN
{
/// <summary>
/// Reads a comma-separated text file and rewrites selected columns using
/// caller-supplied encoders, leaving every other column untouched.
/// </summary>
public class FileEncoder
{
    private readonly string _filename;

    /// <summary>
    /// Creates an encoder bound to the given input file.
    /// </summary>
    /// <param name="filename">Path of the comma-separated file read by <see cref="Encode"/>.</param>
    public FileEncoder(string filename)
    {
        _filename = filename;
    }

    /// <summary>
    /// Encodes the file line by line.
    /// </summary>
    /// <remarks>
    /// For every column named by an entry of <paramref name="encoding"/>, each distinct
    /// field value is numbered (0, 1, 2, ...) in order of first appearance in the file.
    /// A field in such a column is replaced by
    /// <c>Encoding.EncodeData(index, distinctCount)</c> of the matching entry, where
    /// <c>index</c> is the value's number and <c>distinctCount</c> is the number of
    /// distinct values seen in that column. Fields in all other columns are copied verbatim.
    /// Lines are split on ',' only; no quoting or escaping is interpreted.
    /// </remarks>
    /// <param name="encoding">One entry per column to encode; each column may appear at most once.</param>
    /// <returns>One comma-joined output line per input line, in file order.</returns>
    /// <exception cref="ArgumentNullException"><paramref name="encoding"/> is null.</exception>
    /// <exception cref="ArgumentException">Two entries of <paramref name="encoding"/> target the same column.</exception>
    /// <exception cref="IndexOutOfRangeException">
    /// A line has fewer fields than an encoded column index requires (or the index is negative).
    /// </exception>
    public List<string> Encode(List<EncodeMessage> encoding)
    {
        if (encoding == null)
        {
            throw new ArgumentNullException("encoding");
        }

        // File.ReadAllLines opens the file for reading only, so read-only files work;
        // FileStream(path, FileMode.Open) would have requested read/write access.
        // Each line is split exactly once and the fields are reused by both passes below.
        var rows = new List<string[]>();
        foreach (var fileLine in File.ReadAllLines(_filename))
        {
            rows.Add(fileLine.Split(','));
        }

        // Pass 1: per encoded column, remember its encoder and number the distinct values.
        var encoders = new Dictionary<int, EncodeMessage>();
        var categories = new Dictionary<int, Dictionary<string, int>>();
        foreach (var encode in encoding)
        {
            var column = encode.Column;
            if (encoders.ContainsKey(column))
            {
                throw new ArgumentException(
                    "Column " + column + " is targeted by more than one encoder.", "encoding");
            }

            var ids = new Dictionary<string, int>();
            foreach (var tokens in rows)
            {
                var token = tokens[column];
                if (!ids.ContainsKey(token))
                {
                    // The next free id equals the number of values registered so far.
                    ids.Add(token, ids.Count);
                }
            }

            encoders.Add(column, encode);
            categories.Add(column, ids);
        }

        // Pass 2: emit each line, substituting encoded fields.
        var result = new List<string>(rows.Count);
        var builder = new StringBuilder();
        foreach (var tokens in rows)
        {
            for (var i = 0; i < tokens.Length; ++i)
            {
                if (i > 0)
                {
                    builder.Append(",");
                }

                EncodeMessage encoderMatch;
                if (encoders.TryGetValue(i, out encoderMatch))
                {
                    var ids = categories[i];
                    var n = ids.Count;
                    var index = ids[tokens[i]]; // 0, 1, 2, ... in order of first appearance
                    builder.Append(encoderMatch.Encoding.EncodeData(index, n));
                }
                else
                {
                    builder.Append(tokens[i]);
                }
            }

            result.Add(builder.ToString());
            builder.Clear();
        }

        return result;
    }
}
}