RegularDFA.cs
91 lines
| 3.1 KiB
| text/x-csharp
|
CSharpLexer
cin
|
r289 | using System.Collections.Generic; | ||
using System.Linq; | ||||
namespace Implab.Automaton.RegularExpressions { | ||||
public class RegularDFA<TInput, TTag> : DFATable, ITaggedDFABuilder<TTag> { | ||||
readonly Dictionary<int,TTag[]> m_tags = new Dictionary<int, TTag[]>(); | ||||
readonly IAlphabet<TInput> m_alphabet; | ||||
public RegularDFA(IAlphabet<TInput> alphabet) { | ||||
Safe.ArgumentNotNull(alphabet, "aplhabet"); | ||||
m_alphabet = alphabet; | ||||
} | ||||
public IAlphabet<TInput> InputAlphabet { | ||||
get { | ||||
return m_alphabet; | ||||
} | ||||
} | ||||
public void MarkFinalState(int s, TTag[] tags) { | ||||
MarkFinalState(s); | ||||
SetStateTag(s, tags); | ||||
} | ||||
public void SetStateTag(int s, TTag[] tags) { | ||||
Safe.ArgumentNotNull(tags, "tags"); | ||||
m_tags[s] = tags; | ||||
} | ||||
public TTag[] GetStateTag(int s) { | ||||
TTag[] tags; | ||||
return m_tags.TryGetValue(s, out tags) ? tags : new TTag[0]; | ||||
} | ||||
public TTag[][] CreateTagTable() { | ||||
var table = new TTag[StateCount][]; | ||||
foreach (var pair in m_tags) | ||||
table[pair.Key] = pair.Value; | ||||
return table; | ||||
} | ||||
/// <summary> | ||||
/// Optimize the specified alphabet. | ||||
/// </summary> | ||||
/// <param name="alphabet">Пустой алфавит, который будет зполнен в процессе оптимизации.</param> | ||||
public RegularDFA<TInput,TTag> Optimize(IAlphabetBuilder<TInput> alphabet) { | ||||
Safe.ArgumentNotNull(alphabet, "alphabet"); | ||||
var dfa = new RegularDFA<TInput, TTag>(alphabet); | ||||
var alphaMap = new Dictionary<int,int>(); | ||||
var stateMap = new Dictionary<int,int>(); | ||||
Optimize(dfa, alphaMap, stateMap); | ||||
// mark tags in the new DFA | ||||
foreach (var g in m_tags.Where(x => x.Key < StateCount).GroupBy(x => stateMap[x.Key], x => x.Value )) | ||||
dfa.SetStateTag(g.Key, g.SelectMany(x => x).ToArray()); | ||||
// make the alphabet for the new DFA | ||||
// skip all unclassified symbols | ||||
foreach (var pair in alphaMap.Where(x => x.Value != 0)) | ||||
alphabet.DefineClass(m_alphabet.GetSymbols(pair.Key), pair.Value); | ||||
return dfa; | ||||
} | ||||
protected override IEnumerable<HashSet<int>> SplitFinalStates(IEnumerable<int> states) { | ||||
var arrayComparer = new CustomEqualityComparer<TTag[]>( | ||||
(x,y) => x.Length == y.Length && x.All(it => y.Contains(it)), | ||||
x => x.Sum(it => x.GetHashCode()) | ||||
); | ||||
return states.GroupBy(x => m_tags[x] ?? new TTag[0], arrayComparer).Select(g => new HashSet<int>(g)); | ||||
} | ||||
/*public override string ToString() { | ||||
var states = new MapAlphabet<string>(false, null); | ||||
for (int i = 0; i < StateCount; i++) | ||||
states.DefineSymbol(string.Format("s{0}", i), i); | ||||
return string.Format("//[RegularDFA {1} x {2}]\n{0}", PrintDFA(InputAlphabet, states),StateCount, AlphabetSize); | ||||
}*/ | ||||
} | ||||
} | ||||