Mercurial > pub > ImplabNet
comparison Implab/Parsing/AlphabetBase.cs @ 55:c0bf853aa04f
Added initial JSON support
+JSONParser
+JSONWriter
| author | cin |
|---|---|
| date | Sun, 15 Jun 2014 19:39:11 +0400 |
| parents | |
| children | 21611344d366 |
comparison
equal
deleted
inserted
replaced
| 51:2c332a9c64c0 | 55:c0bf853aa04f |
|---|---|
| 1 using Implab; | |
| 2 using System; | |
| 3 using System.Collections.Generic; | |
| 4 using System.Diagnostics; | |
| 5 using System.Linq; | |
| 6 using System.Text; | |
| 7 using System.Threading.Tasks; | |
| 8 | |
namespace Implab.Parsing {
    /// <summary>
    /// Base class for alphabets that partition input symbols into numbered classes.
    /// </summary>
    /// <remarks>
    /// Each symbol is converted to a slot of an internal integer table by
    /// <see cref="GetSymbolIndex"/>; the slot holds the id of the class the symbol
    /// belongs to. Id <see cref="UNCLASSIFIED"/> (0) marks symbols without a class,
    /// other ids are handed out sequentially starting from 1.
    /// </remarks>
    /// <typeparam name="T">The type of the input symbols.</typeparam>
    public abstract class AlphabetBase<T> : IAlphabet<T> {
        /// <summary>
        /// The class id stored for symbols which have not been assigned to any class.
        /// </summary>
        public const int UNCLASSIFIED = 0;

        // The id which will be given to the next defined symbol or class.
        int m_nextId = 1;

        // Symbol index -> class id; UNCLASSIFIED for symbols that are not defined yet.
        int[] m_map;

        /// <summary>
        /// The number of class ids in use, including <see cref="UNCLASSIFIED"/>;
        /// valid ids are in the range <c>0 .. Count - 1</c>.
        /// </summary>
        public int Count {
            get { return m_nextId; }
        }

        /// <summary>
        /// Creates an empty alphabet in which every symbol is unclassified.
        /// </summary>
        /// <remarks>
        /// <see cref="MapSize"/> is abstract and is read here, i.e. before the
        /// constructor of the derived class has run, so implementations must not
        /// make it depend on state initialized in their own constructors.
        /// </remarks>
        protected AlphabetBase() {
            m_map = new int[MapSize];
        }

        /// <summary>
        /// Creates an alphabet on top of an existing translation map.
        /// </summary>
        /// <remarks>
        /// The array is used as is (it is not copied), and the next class id
        /// continues after the largest id found in it.
        /// </remarks>
        /// <param name="map">
        /// The translation map; expected to be non-null and to contain exactly
        /// <see cref="MapSize"/> elements (checked in debug builds only).
        /// </param>
        protected AlphabetBase(int[] map) {
            Debug.Assert(map != null);
            Debug.Assert(map.Length == MapSize);

            m_map = map;
            m_nextId = map.Max() + 1;
        }

        /// <summary>
        /// Puts the symbol into a class of its own, unless it is already classified.
        /// </summary>
        /// <param name="symbol">The symbol to define.</param>
        /// <returns>
        /// The id of the class of the symbol: a newly allocated id if the symbol was
        /// unclassified, otherwise the id it already had.
        /// </returns>
        public int DefineSymbol(T symbol) {
            var index = GetSymbolIndex(symbol);
            if (m_map[index] == UNCLASSIFIED)
                m_map[index] = m_nextId++;
            return m_map[index];
        }

        /// <summary>
        /// Defines a new class which consists of the specified symbols.
        /// </summary>
        /// <remarks>
        /// Duplicate symbols are ignored. All symbols are checked before the map is
        /// modified, so a failed call leaves the alphabet unchanged.
        /// </remarks>
        /// <param name="symbols">The symbols of the new class.</param>
        /// <returns>The id of the new class.</returns>
        /// <exception cref="InvalidOperationException">
        /// One of the symbols already belongs to a class, or two different symbols
        /// occupy the same slot of the translation map.
        /// </exception>
        public int DefineClass(IEnumerable<T> symbols) {
            Safe.ArgumentNotNull(symbols, "symbols");

            // Phase 1: validate. Nothing is written until every symbol is known to
            // be free, otherwise a failure in the middle would leave some symbols
            // tagged with an id that is never reserved and gets reused later.
            var indices = new HashSet<int>();
            foreach (var symbol in symbols.Distinct()) {
                var index = GetSymbolIndex(symbol);
                if (m_map[index] != UNCLASSIFIED || !indices.Add(index))
                    throw new InvalidOperationException(String.Format("Symbol '{0}' already in use", symbol));
            }

            // Phase 2: commit.
            foreach (var slot in indices)
                m_map[slot] = m_nextId;

            return m_nextId++;
        }

        /// <summary>
        /// Builds the list of symbols for every class of the alphabet.
        /// </summary>
        /// <returns>
        /// An array of <see cref="Count"/> lists indexed by the class id. The entry
        /// for <see cref="UNCLASSIFIED"/> is always empty; the other entries contain
        /// the symbols of the class in the order of <see cref="InputSymbols"/>.
        /// </returns>
        public List<T>[] CreateReverseMap() {
            var reverseMap = new List<T>[Count];
            for (var i = 0; i < reverseMap.Length; i++)
                reverseMap[i] = new List<T>();

            // A single pass over the input symbols instead of one pass per class.
            foreach (var symbol in InputSymbols) {
                var cls = m_map[GetSymbolIndex(symbol)];
                // Unclassified symbols and ids outside of the known range are skipped.
                if (cls > UNCLASSIFIED && cls < reverseMap.Length)
                    reverseMap[cls].Add(symbol);
            }

            return reverseMap;
        }

        /// <summary>
        /// Merges classes of this alphabet into classes of another alphabet.
        /// </summary>
        /// <remarks>
        /// For every group in <paramref name="classes"/> a class containing all
        /// symbols of the grouped classes is defined in
        /// <paramref name="newAlphabet"/>. Groups which contain
        /// <see cref="UNCLASSIFIED"/> are skipped.
        /// </remarks>
        /// <param name="newAlphabet">The alphabet which receives the merged classes.</param>
        /// <param name="classes">The groups of class ids of this alphabet to merge.</param>
        /// <returns>
        /// An array of <see cref="Count"/> elements which maps ids of this alphabet
        /// to ids of the new alphabet; ids which are not part of any processed
        /// group are mapped to 0.
        /// </returns>
        /// <exception cref="ArgumentOutOfRangeException">
        /// A group contains an id which doesn't exist in this alphabet.
        /// </exception>
        public int[] Reclassify(IAlphabet<T> newAlphabet, IEnumerable<ICollection<int>> classes) {
            Safe.ArgumentNotNull(newAlphabet, "newAlphabet");
            Safe.ArgumentNotNull(classes, "classes");
            var reverseMap = CreateReverseMap();

            int[] translationMap = new int[Count];

            foreach (var scl in classes) {
                // skip if the superclass contains the unclassified element
                if (scl.Contains(UNCLASSIFIED))
                    continue;

                var range = new List<T>();
                foreach (var cl in scl) {
                    if (cl < 0 || cl >= reverseMap.Length)
                        // The single-string constructor treats its argument as the
                        // parameter name, so the message is passed explicitly.
                        throw new ArgumentOutOfRangeException(
                            "classes",
                            String.Format("Class {0} is not valid for the current alphabet", cl)
                        );
                    range.AddRange(reverseMap[cl]);
                }

                var newClass = newAlphabet.DefineClass(range);
                foreach (var cl in scl)
                    translationMap[cl] = newClass;
            }

            return translationMap;
        }

        /// <summary>
        /// Gets the id of the class of the specified symbol.
        /// </summary>
        /// <param name="symbol">The symbol to translate.</param>
        /// <returns>
        /// The class id, or <see cref="UNCLASSIFIED"/> if the symbol has no class.
        /// </returns>
        public int Translate(T symbol) {
            return m_map[GetSymbolIndex(symbol)];
        }

        /// <summary>
        /// Converts the symbol to the index of its slot in the translation map.
        /// </summary>
        /// <param name="symbol">The symbol to convert.</param>
        /// <returns>The index, which is used directly to address the map.</returns>
        public abstract int GetSymbolIndex(T symbol);

        /// <summary>
        /// The symbols which are enumerated when the reverse map is built.
        /// </summary>
        public abstract IEnumerable<T> InputSymbols { get; }

        /// <summary>
        /// The number of slots in the translation map.
        /// </summary>
        /// <remarks>Read from the base constructor, see <see cref="AlphabetBase{T}()"/>.</remarks>
        protected abstract int MapSize { get; }

        /// <summary>
        /// Gets the translation map of the alphabet.
        /// </summary>
        /// <returns>
        /// The internal array itself, not a copy: changes made by the caller affect
        /// the alphabet and vice versa.
        /// </returns>
        public int[] GetTranslationMap() {
            return m_map;
        }
    }
}
