rj-action-library/Runtime/Text/Lexing/Lexer.cs

126 lines
3.2 KiB
C#

using System.Collections;
using System.Collections.Generic;
using System.Text.RegularExpressions;
namespace Rokojori
{
public class Lexer
{
Dictionary<string,List<LexerMatcher>> _modes = new Dictionary<string, List<LexerMatcher>>();
bool _hasError =false;
public bool hasError => _hasError;
void AddMatcher( LexerMatcher matcher )
{
var list = _modes.ContainsKey( matcher.mode ) ? _modes[ matcher.mode ] : null;
if ( list == null )
{
list = new List<LexerMatcher>();
_modes[ matcher.mode ] = list;
}
list.Add( matcher );
}
public void AddAllMatchers( params LexerMatcher[] matchers )
{
for ( int i = 0; i < matchers.Length; i++ )
{
AddMatcher( matchers[ i ] );
}
}
public void AddMatcher( string type, Regex regex, string mode = "", string nextMode = null )
{
AddMatcher( new LexerMatcher( type, regex, mode, nextMode ) );
}
public void AddMatcher( string type, string regex, string mode = "", string nextMode = null )
{
AddMatcher( type, new Regex( regex ), mode, nextMode );
}
public void Lex( string source, System.Action<LexerEvent> callback, int offset = 0, string mode = "" )
{
var ERROR_FLAG = -1;
var DONE_FLAG = -2;
var lexerEvent = new LexerEvent( "", 0, -2 );
while ( offset < source.Length )
{
if ( ! _modes.ContainsKey( mode ) )
{
var errorMessage = "@Lexer-Error. Mode not found: '" + mode + "'";
RJLog.Log( errorMessage, "@", offset );
lexerEvent.set( errorMessage, offset, ERROR_FLAG );
_hasError = true;
callback( lexerEvent );
return;
}
var matchers = _modes[ mode ];
var foundSomething = false;
for ( var i = 0; i < matchers.Count; i++ )
{
var matcher = matchers[ i ];
var matchLength = matcher.MatchLength( source, offset );
if ( matchLength > 0 )
{
lexerEvent.set( matcher.type, offset, matchLength );
//Logs.Log(matcher.type, ">>", "'"+source.Substring( offset, matchLength )+"'", "@", offset, matchLength );
callback( lexerEvent );
foundSomething = true;
i = matchers.Count;
if ( matcher.nextMode != null )
{
mode = matcher.nextMode;
}
offset += matchLength;
}
}
if ( ! foundSomething )
{
var errorMessage = "@Lexer-Error. No match: '" + mode + "'";
RJLog.Log(errorMessage, "@", offset );
lexerEvent.set( errorMessage, offset, ERROR_FLAG );
_hasError = true;
callback( lexerEvent );
return;
}
}
lexerEvent.set( mode, offset, DONE_FLAG );
callback( lexerEvent );
}
public List<LexerEvent> LexToList( string source, int offset = 0, string mode = "" )
{
var list = new List<LexerEvent>();
Lex(
source,
( LexerEvent token )=>
{
list.Add( token.Copy() );
},
offset, mode
);
return list;
}
}
}