Mercurial > pub > ImplabNet
comparison Implab/Formats/Grammar.cs @ 178:d5c5db0335ee ref20160224
working on JSON parser
author | cin |
---|---|
date | Wed, 23 Mar 2016 19:51:45 +0300 |
parents | a0ff6a0e9c44 |
children | 6fa235c5a760 |
comparison
legend: equal, deleted, inserted, replaced
177:a0ff6a0e9c44 | 178:d5c5db0335ee |
---|---|
7 | 7 |
8 namespace Implab.Formats { | 8 namespace Implab.Formats { |
9 /// <summary> | 9 /// <summary> |
10 /// Базовый абстрактный класс. Грамматика, позволяет формулировать выражения над алфавитом типа <c>char</c>. | 10 /// Базовый абстрактный класс. Грамматика, позволяет формулировать выражения над алфавитом типа <c>char</c>. |
11 /// </summary> | 11 /// </summary> |
12 public abstract class Grammar<TSymbol, TTag> { | 12 public abstract class Grammar<TSymbol> { |
13 | 13 |
14 protected abstract IAlphabetBuilder<TSymbol> AlphabetBuilder { | 14 protected abstract IAlphabetBuilder<TSymbol> AlphabetBuilder { |
15 get; | 15 get; |
16 } | 16 } |
17 | 17 |
18 protected SymbolToken<TTag> UnclassifiedToken() { | 18 protected SymbolToken UnclassifiedToken() { |
19 return new SymbolToken<TTag>(DFAConst.UNCLASSIFIED_INPUT); | 19 return new SymbolToken(AutomatonConst.UNCLASSIFIED_INPUT); |
20 } | 20 } |
21 | 21 |
22 protected void DefineAlphabet(IEnumerable<TSymbol> alphabet) { | 22 protected void DefineAlphabet(IEnumerable<TSymbol> alphabet) { |
23 Safe.ArgumentNotNull(alphabet, "alphabet"); | 23 Safe.ArgumentNotNull(alphabet, "alphabet"); |
24 | 24 |
25 foreach (var ch in alphabet) | 25 foreach (var ch in alphabet) |
26 AlphabetBuilder.DefineSymbol(ch); | 26 AlphabetBuilder.DefineSymbol(ch); |
27 } | 27 } |
28 | 28 |
29 protected Token<TTag> SymbolToken(TSymbol symbol) { | 29 protected Token SymbolToken(TSymbol symbol) { |
30 return Token<TTag>.New(TranslateOrAdd(symbol)); | 30 return Token.New(TranslateOrAdd(symbol)); |
31 } | 31 } |
32 | 32 |
33 protected Token<TTag> SymbolToken(IEnumerable<TSymbol> symbols) { | 33 protected Token SymbolToken(IEnumerable<TSymbol> symbols) { |
34 Safe.ArgumentNotNull(symbols, "symbols"); | 34 Safe.ArgumentNotNull(symbols, "symbols"); |
35 | 35 |
36 return Token<TTag>.New(TranslateOrAdd(symbols).ToArray()); | 36 return Token.New(TranslateOrAdd(symbols).ToArray()); |
37 } | 37 } |
38 | 38 |
39 protected Token<TTag> SymbolSetToken(params TSymbol[] set) { | 39 protected Token SymbolSetToken(params TSymbol[] set) { |
40 return SymbolToken(set); | 40 return SymbolToken(set); |
41 } | 41 } |
42 | 42 |
43 int TranslateOrAdd(TSymbol ch) { | 43 int TranslateOrAdd(TSymbol ch) { |
44 var t = AlphabetBuilder.Translate(ch); | 44 var t = AlphabetBuilder.Translate(ch); |
45 if (t == DFAConst.UNCLASSIFIED_INPUT) | 45 if (t == AutomatonConst.UNCLASSIFIED_INPUT) |
46 t = AlphabetBuilder.DefineSymbol(ch); | 46 t = AlphabetBuilder.DefineSymbol(ch); |
47 return t; | 47 return t; |
48 } | 48 } |
49 | 49 |
50 IEnumerable<int> TranslateOrAdd(IEnumerable<TSymbol> symbols) { | 50 IEnumerable<int> TranslateOrAdd(IEnumerable<TSymbol> symbols) { |
51 return symbols.Distinct().Select(TranslateOrAdd); | 51 return symbols.Distinct().Select(TranslateOrAdd); |
52 } | 52 } |
53 | 53 |
54 int TranslateOrDie(TSymbol ch) { | 54 int TranslateOrDie(TSymbol ch) { |
55 var t = AlphabetBuilder.Translate(ch); | 55 var t = AlphabetBuilder.Translate(ch); |
56 if (t == DFAConst.UNCLASSIFIED_INPUT) | 56 if (t == AutomatonConst.UNCLASSIFIED_INPUT) |
57 throw new ApplicationException(String.Format("Symbol '{0}' is UNCLASSIFIED", ch)); | 57 throw new ApplicationException(String.Format("Symbol '{0}' is UNCLASSIFIED", ch)); |
58 return t; | 58 return t; |
59 } | 59 } |
60 | 60 |
61 IEnumerable<int> TranslateOrDie(IEnumerable<TSymbol> symbols) { | 61 IEnumerable<int> TranslateOrDie(IEnumerable<TSymbol> symbols) { |
62 return symbols.Distinct().Select(TranslateOrDie); | 62 return symbols.Distinct().Select(TranslateOrDie); |
63 } | 63 } |
64 | 64 |
65 protected Token<TTag> SymbolTokenExcept(IEnumerable<TSymbol> symbols) { | 65 protected Token SymbolTokenExcept(IEnumerable<TSymbol> symbols) { |
66 Safe.ArgumentNotNull(symbols, "symbols"); | 66 Safe.ArgumentNotNull(symbols, "symbols"); |
67 | 67 |
68 return Token<TTag>.New( Enumerable.Range(0, AlphabetBuilder.Count).Except(TranslateOrDie(symbols)).ToArray() ); | 68 return Token.New( Enumerable.Range(0, AlphabetBuilder.Count).Except(TranslateOrDie(symbols)).ToArray() ); |
69 } | 69 } |
70 | 70 |
71 protected abstract IndexedAlphabetBase<TSymbol> CreateAlphabet(); | 71 protected abstract IndexedAlphabetBase<TSymbol> CreateAlphabet(); |
72 | 72 |
73 protected ScannerContext<TTag> BuildScannerContext(Token<TTag> regexp) { | 73 protected ScannerContext<TTag> BuildScannerContext<TTag>(Token regexp) { |
74 | 74 |
75 var dfa = new RegularDFA<TSymbol, TTag>(AlphabetBuilder); | 75 var dfa = new RegularDFA<TSymbol, TTag>(AlphabetBuilder); |
76 | 76 |
77 var visitor = new RegularExpressionVisitor<TTag>(); | 77 var visitor = new RegularExpressionVisitor<TTag>(dfa); |
78 regexp.Accept( visitor ); | 78 regexp.Accept(visitor); |
79 | 79 visitor.BuildDFA(); |
80 visitor.BuildDFA(dfa); | |
81 | 80 |
82 if (dfa.IsFinalState(dfa.InitialState)) | 81 if (dfa.IsFinalState(dfa.InitialState)) |
83 throw new ApplicationException("The specified language contains empty token"); | 82 throw new ApplicationException("The specified language contains empty token"); |
84 | 83 |
85 var ab = CreateAlphabet(); | 84 var ab = CreateAlphabet(); |