Mercurial > pub > ImplabNet
comparison Implab/Formats/BufferScanner.cs @ 174:983df35b3ca1 ref20160224
sync
| author | cin |
|---|---|
| date | Fri, 18 Mar 2016 18:10:30 +0300 |
| parents | ecfece82ca11 |
| children |
comparison
equal
deleted
inserted
replaced
| 173:ecfece82ca11 | 174:983df35b3ca1 |
|---|---|
| 1 using System; | 1 using System; |
| 2 using Implab.Automaton.RegularExpressions; | 2 using Implab.Automaton.RegularExpressions; |
| 3 using Implab.Automaton; | 3 using Implab.Automaton; |
| 4 using System.Diagnostics; | |
| 4 | 5 |
| 5 namespace Implab.Formats { | 6 namespace Implab.Formats { |
| 6 public struct BufferScanner<TTag> { | 7 public struct BufferScanner<TTag> { |
| 7 char[] m_buffer; | |
| 8 int m_offset; | |
| 9 int m_position; | |
| 10 int m_hi; | |
| 11 | |
| 12 readonly int m_chunk; | |
| 13 readonly int m_limit; | |
| 14 | |
| 15 readonly DFAStateDescriptor<TTag>[] m_dfa; | 8 readonly DFAStateDescriptor<TTag>[] m_dfa; |
| 16 int m_state; | 9 int m_state; |
| 10 int m_pos; | |
| 17 | 11 |
| 18 public BufferScanner(DFAStateDescriptor<TTag>[] dfa, int initialState, int chunk, int limit) { | 12 public BufferScanner(DFAStateDescriptor<TTag>[] dfa, int initialState) { |
| 19 m_dfa = dfa; | 13 m_dfa = dfa; |
| 20 m_state = initialState; | 14 m_state = initialState; |
| 21 m_chunk = chunk; | |
| 22 m_limit = limit; | |
| 23 m_buffer = null; | |
| 24 m_offset = 0; | |
| 25 m_position = 0; | |
| 26 m_hi = 0; | |
| 27 } | |
| 28 | |
| 29 public char[] Buffer { | |
| 30 get { | |
| 31 return m_buffer; | |
| 32 } | |
| 33 } | |
| 34 | |
| 35 public int HiMark { | |
| 36 get { | |
| 37 return m_hi; | |
| 38 } | |
| 39 } | 15 } |
| 40 | 16 |
| 41 public int Position { | 17 public int Position { |
| 42 get { | 18 get { return m_pos; } |
| 43 return m_position; | |
| 44 } | |
| 45 } | |
| 46 | |
| 47 public int Length { | |
| 48 get { | |
| 49 return m_hi - m_position; | |
| 50 } | |
| 51 } | |
| 52 | |
| 53 public int TokenOffset { | |
| 54 get { | |
| 55 return m_offset; | |
| 56 } | |
| 57 } | |
| 58 | |
| 59 public int TokenLength { | |
| 60 get { | |
| 61 return m_position - m_offset; | |
| 62 } | |
| 63 } | |
| 64 | |
| 65 public void Init(char[] buffer, int position, int length) { | |
| 66 m_buffer = buffer; | |
| 67 m_position = position; | |
| 68 m_offset = position; | |
| 69 m_hi = position + length; | |
| 70 } | |
| 71 | |
| 72 public int Extend() { | |
| 73 // free space | |
| 74 var free = m_buffer.Length - m_hi; | |
| 75 | |
| 76 // if the buffer have enough free space | |
| 77 if (free > 0) | |
| 78 return free; | |
| 79 | |
| 80 // effective size of the buffer | |
| 81 var size = m_buffer.Length - m_offset; | |
| 82 | |
| 83 // calculate the new size | |
| 84 int grow = Math.Min(m_limit - size, m_chunk); | |
| 85 if (grow <= 0) | |
| 86 throw new ParserException(String.Format("Input buffer {0} bytes limit exceeded", m_limit)); | |
| 87 | |
| 88 var temp = new char[size + grow]; | |
| 89 Array.Copy(m_buffer, m_offset, temp, 0, m_hi - m_offset); | |
| 90 m_position -= m_offset; | |
| 91 m_hi -= m_offset; | |
| 92 m_offset = 0; | |
| 93 m_buffer = temp; | |
| 94 | |
| 95 return free + grow; | |
| 96 } | |
| 97 | |
| 98 public void RaiseMark(int size) { | |
| 99 m_hi += size; | |
| 100 } | 19 } |
| 101 | 20 |
| 102 /// <summary> | 21 /// <summary> |
| 103 /// Scan this instance. | 22 /// Scan this instance. |
| 104 /// </summary> | 23 /// </summary> |
| 105 /// <returns><c>true</c> - additional data required</returns> | 24 /// <returns><c>true</c> - additional data required</returns> |
| 106 public bool Scan() { | 25 public bool Scan(int[] buffer, int position, int length) { |
| 107 while (m_position < m_hi) { | 26 var hi = position + length; |
| 108 var ch = m_buffer[m_position]; | 27 m_pos = position; |
| 109 var next = m_dfa[m_state].transitions[(int)ch]; | 28 |
| 29 while (position < hi) { | |
| 30 var next = m_dfa[m_state].transitions[buffer[position]]; | |
| 110 if (next == DFAConst.UNREACHABLE_STATE) { | 31 if (next == DFAConst.UNREACHABLE_STATE) { |
| 111 if (m_dfa[m_state].final) | 32 if (m_dfa[m_state].final) |
| 112 return false; | 33 return false; |
| 113 | 34 |
| 114 throw new ParserException( | 35 throw new ParserException( |
| 115 String.Format( | 36 String.Format( |
| 116 "Unexpected token '{0}'", | 37 "Unexpected symbol" |
| 117 new string(m_buffer, m_offset, m_position - m_offset) | |
| 118 ) | 38 ) |
| 119 ); | 39 ); |
| 120 } | 40 } |
| 41 m_pos++; | |
| 121 m_state = next; | 42 m_state = next; |
| 122 m_position++; | |
| 123 } | 43 } |
| 124 | 44 |
| 125 return true; | 45 return true; |
| 126 } | 46 } |
| 127 | 47 |
| 128 public void Eof() { | 48 public void Eof() { |
| 129 if (!m_dfa[m_state].final) | 49 if (!m_dfa[m_state].final) |
| 130 throw new ParserException( | 50 throw new ParserException( |
| 131 String.Format( | 51 String.Format( |
| 132 "Unexpected token '{0}'", | 52 "Unexpected EOF" |
| 133 new string(m_buffer, m_offset, m_position - m_offset) | |
| 134 ) | 53 ) |
| 135 ); | 54 ); |
| 136 } | 55 } |
| 137 | 56 |
| 138 public TTag[] GetTokenTags() { | 57 public TTag[] GetTokenTags() { |
