55
|
1 using Implab;
|
|
2 using System;
|
|
3 using System.Collections.Generic;
|
|
4 using System.Diagnostics;
|
|
5 using System.Linq;
|
|
6 using System.Text;
|
|
7 using System.Threading.Tasks;
|
|
8
|
|
9 namespace Implab.Parsing {
|
|
/// <summary>
/// Base class for alphabets that translate input symbols of type
/// <typeparamref name="T"/> into integer class ids.
/// </summary>
/// <remarks>
/// The translation is stored in a flat array indexed by <see cref="GetSymbolIndex"/>.
/// Class id <see cref="UNCLASSIFIED"/> (0) marks symbols that do not belong to any
/// class yet; ids of defined classes start at 1 and grow sequentially.
/// </remarks>
public abstract class AlphabetBase<T> : IAlphabet<T> {
    /// <summary>
    /// Class id of every symbol which has not been assigned to a class.
    /// </summary>
    public const int UNCLASSIFIED = 0;

    // The id which will be given to the next defined class. Starts at 1 because
    // 0 is reserved for UNCLASSIFIED.
    int m_nextId = 1;

    // Symbol index -> class id. The array is never replaced after construction,
    // only its elements are modified.
    readonly int[] m_map;

    /// <summary>
    /// Number of class ids in use, including <see cref="UNCLASSIFIED"/>;
    /// valid class ids are in the range <c>0 .. Count - 1</c>.
    /// </summary>
    public int Count {
        get { return m_nextId; }
    }

    /// <summary>
    /// Creates an empty alphabet in which every symbol is unclassified.
    /// </summary>
    /// <remarks>
    /// Reads the abstract <see cref="MapSize"/> property while the base constructor
    /// is still running, therefore implementations of <see cref="MapSize"/> must not
    /// rely on state initialized in the derived class constructor.
    /// </remarks>
    protected AlphabetBase() {
        m_map = new int[MapSize];
    }

    /// <summary>
    /// Creates an alphabet on top of an existing translation map.
    /// </summary>
    /// <param name="map">
    /// Symbol index to class id map. The array is used as is (it is not copied) and
    /// is expected to be non-null with exactly <see cref="MapSize"/> elements; these
    /// expectations are verified with <see cref="Debug.Assert(bool)"/> only, i.e. in
    /// debug builds.
    /// </param>
    protected AlphabetBase(int[] map) {
        Debug.Assert(map != null);
        Debug.Assert(map.Length == MapSize);

        m_map = map;
        // continue numbering after the greatest class id already present in the map
        m_nextId = map.Max() + 1;
    }

    /// <summary>
    /// Ensures that the specified symbol has its own class.
    /// </summary>
    /// <param name="symbol">The symbol to classify.</param>
    /// <returns>
    /// The id of the class of the symbol: a newly allocated id when the symbol was
    /// unclassified, otherwise the id which is already assigned to it.
    /// </returns>
    public int DefineSymbol(T symbol) {
        var index = GetSymbolIndex(symbol);
        if (m_map[index] == UNCLASSIFIED)
            m_map[index] = m_nextId++;
        return m_map[index];
    }

    /// <summary>
    /// Defines a new class which consists of the specified symbols.
    /// </summary>
    /// <param name="symbols">
    /// Symbols of the new class, duplicates are ignored. An empty sequence still
    /// allocates a new (empty) class id.
    /// </param>
    /// <returns>The id of the new class.</returns>
    /// <exception cref="InvalidOperationException">
    /// One of the symbols already belongs to a class. The alphabet is left
    /// unchanged in this case.
    /// </exception>
    public int DefineClass(IEnumerable<T> symbols) {
        Safe.ArgumentNotNull(symbols, "symbols");

        // Validate every symbol before the map is modified: a failure in the middle
        // of the sequence must not leave symbols mapped to an id that was never
        // allocated and will be handed out again by the next definition.
        var indices = new HashSet<int>();
        foreach (var symbol in symbols.Distinct()) {
            var index = GetSymbolIndex(symbol);
            // the second condition reports distinct symbols which share the same
            // map slot, exactly as the sequential assignment would do
            if (m_map[index] != UNCLASSIFIED || !indices.Add(index))
                throw new InvalidOperationException(String.Format("Symbol '{0}' already in use", symbol));
        }

        foreach (var index in indices)
            m_map[index] = m_nextId;

        return m_nextId++;
    }

    /// <summary>
    /// Builds the reverse translation: for each class id the list of input symbols
    /// which are mapped to it.
    /// </summary>
    /// <returns>
    /// An array of <see cref="Count"/> lists indexed by class id. The list for
    /// <see cref="UNCLASSIFIED"/> is always empty; symbols in each list follow the
    /// order of <see cref="InputSymbols"/>.
    /// </returns>
    public List<T>[] CreateReverseMap() {
        var reverseMap = new List<T>[Count];
        for (int i = 0; i < reverseMap.Length; i++)
            reverseMap[i] = new List<T>();

        // a single pass over the input symbols instead of one pass per class
        foreach (var symbol in InputSymbols) {
            var cls = m_map[GetSymbolIndex(symbol)];
            // unclassified symbols and ids outside of the known range are not listed
            if (cls > UNCLASSIFIED && cls < reverseMap.Length)
                reverseMap[cls].Add(symbol);
        }

        return reverseMap;
    }

    /// <summary>
    /// Defines in <paramref name="newAlphabet"/> one class for each group of classes
    /// of this alphabet and returns the translation between the old and the new ids.
    /// </summary>
    /// <param name="newAlphabet">The alphabet which receives the merged classes.</param>
    /// <param name="classes">
    /// Groups of class ids of this alphabet; the symbols of all classes in a group
    /// form a single class in <paramref name="newAlphabet"/>. Groups which contain
    /// <see cref="UNCLASSIFIED"/> are skipped.
    /// </param>
    /// <returns>
    /// An array of <see cref="Count"/> elements indexed by the class id of this
    /// alphabet, containing the id of the corresponding class in
    /// <paramref name="newAlphabet"/>. Classes which are not a part of any processed
    /// group are left as 0.
    /// </returns>
    /// <exception cref="ArgumentOutOfRangeException">
    /// A group contains an id which is not a class of this alphabet.
    /// </exception>
    public int[] Reclassify(IAlphabet<T> newAlphabet, IEnumerable<ICollection<int>> classes) {
        Safe.ArgumentNotNull(newAlphabet, "newAlphabet");
        Safe.ArgumentNotNull(classes, "classes");
        var reverseMap = CreateReverseMap();

        int[] translationMap = new int[Count];

        foreach (var scl in classes) {
            // skip if the super class contains the unclassified element
            if (scl.Contains(UNCLASSIFIED))
                continue;
            var range = new List<T>();
            foreach (var cl in scl) {
                if (cl < 0 || cl >= reverseMap.Length)
                    // the (paramName, message) overload is required, the single
                    // string overload treats its argument as the parameter name
                    throw new ArgumentOutOfRangeException("classes", String.Format("Class {0} is not valid for the current alphabet", cl));
                range.AddRange(reverseMap[cl]);
            }
            var newClass = newAlphabet.DefineClass(range);
            foreach (var cl in scl)
                translationMap[cl] = newClass;
        }

        return translationMap;
    }

    /// <summary>
    /// Translates the symbol to the id of its class.
    /// </summary>
    /// <param name="symbol">The symbol to translate.</param>
    /// <returns>
    /// The class id of the symbol or <see cref="UNCLASSIFIED"/> when the symbol
    /// does not belong to any class.
    /// </returns>
    public int Translate(T symbol) {
        return m_map[GetSymbolIndex(symbol)];
    }

    /// <summary>
    /// Gets the position of the symbol in the translation map.
    /// </summary>
    /// <param name="symbol">The symbol to look up.</param>
    /// <returns>
    /// An index into the translation map; it is used without a range check, so it
    /// has to be in the range <c>0 .. MapSize - 1</c>.
    /// </returns>
    public abstract int GetSymbolIndex(T symbol);

    /// <summary>
    /// Enumerates the input symbols of the alphabet; used to build the reverse map.
    /// </summary>
    public abstract IEnumerable<T> InputSymbols { get; }

    /// <summary>
    /// The number of elements in the translation map.
    /// </summary>
    protected abstract int MapSize { get; }

    /// <summary>
    /// Gets the translation map of the alphabet.
    /// </summary>
    /// <returns>
    /// The internal symbol index to class id array itself, not a copy: changes made
    /// to the returned array affect this alphabet.
    /// </returns>
    public int[] GetTranslationMap() {
        return m_map;
    }
}
|
|
103 }
|