Epsilon transitions in lexer

This commit is contained in:
Suzanne Soy 2020-08-16 02:57:20 +00:00
parent ff459fb1fd
commit c534c2c6ab
11 changed files with 132 additions and 19 deletions

4
Ast.cs
View File

@ -42,6 +42,8 @@ namespace Ast {
public override int GetHashCode() { public override int GetHashCode() {
return HashCode.Combine("Int", this.value); return HashCode.Combine("Int", this.value);
} }
public override string ToString() => "Int";
} }
public partial class Visitor<T> { public Func<string, T> String { get; set; } } public partial class Visitor<T> { public Func<string, T> String { get; set; } }
@ -62,6 +64,8 @@ namespace Ast {
public override int GetHashCode() { public override int GetHashCode() {
return HashCode.Combine("String", this.value); return HashCode.Combine("String", this.value);
} }
public override string ToString() => "String";
} }
} }

View File

@ -78,10 +78,9 @@ public static partial class Lexer {
Rule(S.Space, '"', S.StringOpen, S.String), Rule(S.Space, '"', S.StringOpen, S.String),
Rule(S.Int, C.DecimalDigitNumber, S.Int), Rule(S.Int, C.DecimalDigitNumber, S.Int),
Rule(S.Int, C.SpaceSeparator, S.Space), // epsilon Rule(S.Int, C.SpaceSeparator, S.Space),
Rule(S.Int, new[]{'.',','}, S.Decimal, S.Int), Rule(S.Int, new[]{'.',','}, S.Decimal, S.Int),
Rule(S.Int, EOF, S.End), // epsilon Rule(S.Decimal, C.SpaceSeparator, S.Space),
Rule(S.Decimal, C.SpaceSeparator, S.Space), // epsilon
Rule(S.String, C.LowercaseLetter, S.String), Rule(S.String, C.LowercaseLetter, S.String),
Rule(S.String, C.UppercaseLetter, S.String), Rule(S.String, C.UppercaseLetter, S.String),
@ -92,8 +91,22 @@ public static partial class Lexer {
public static Dictionary<S, List<Rule>> Dict = public static Dictionary<S, List<Rule>> Dict =
Default Default
.GroupBy(r => r.oldState, r => r) .GroupBy(r => r.oldState, r => r)
.ToDictionary(rs => rs.Key, rs => rs.ToList()) ; .ToDefaultDictionary(
// TODO: upon failure, do an epsilon-transition to the whitespace state, and try again. new List<Rule>(),
rs => rs.Key,
rs => rs.ToList()) ;
// This adds transitions through an implicit empty whitespace.
public static Dictionary<S, List<Rule>> WithEpsilonTransitions =
Dict.ToDefaultDictionary(
new List<Rule>(),
kv => kv.Key,
kv => kv.Value.Any(r => true) // r.test(" ")
// This is a bit of a hack, the lexer tries the rules in
// order so later rules with different results are masked
// by former rules
? kv.Value.Concat(Dict[S.Space]).ToList()
: kv.Value);
} }
public struct Lexeme { public struct Lexeme {
@ -125,7 +138,7 @@ public static partial class Lexer {
return result; return result;
} }
public static void ParseError(StringBuilder context, IEnumerator<GraphemeCluster> stream, S state, List<Rule> possibleNext, GraphemeCluster gc) { public static Exception ParseError(StringBuilder context, IEnumerator<GraphemeCluster> stream, S state, List<Rule> possibleNext, GraphemeCluster gc) {
var rest = var rest =
stream stream
.SingleUseEnumerable() .SingleUseEnumerable()
@ -139,7 +152,7 @@ public static partial class Lexer {
.First() .First()
.Match(some: (x => x.UnicodeCategory(0).ToString()), .Match(some: (x => x.UnicodeCategory(0).ToString()),
none: "None (empty string)"); none: "None (empty string)");
throw new Exception( return new Exception(
$"Unexpected {actual} (Unicode category {cat}) while the lexer was in state {state}: expected one of {expected}{Environment.NewLine}{context} <--HERE {rest}" $"Unexpected {actual} (Unicode category {cat}) while the lexer was in state {state}: expected one of {expected}{Environment.NewLine}{context} <--HERE {rest}"
); );
} }
@ -155,15 +168,13 @@ public static partial class Lexer {
while (e.MoveNext()) { while (e.MoveNext()) {
var c = e.Current; var c = e.Current;
context.Append(c.str); context.Append(c.str);
List<Rule> possibleNext; var possibleNext = Rules.WithEpsilonTransitions
if (Rules.Dict.TryGetValue(state, out possibleNext)) { .GetOrDefault(state, new List<Rule>());
var rule = possibleNext.FirstOrDefault(r => r.test(c)); yield return
if (rule != null) { possibleNext
yield return Transition(ref state, ref lexeme, c, rule); .First(r => r.test(c))
} else { .IfSome(rule => Transition(ref state, ref lexeme, c, rule))
ParseError(context, e, state, possibleNext, c); .ElseThrow(() => ParseError(context, e, state, possibleNext, c));
}
}
} }
} }

View File

@ -56,6 +56,8 @@ public static partial class Lexer {
public override int GetHashCode() { public override int GetHashCode() {
return "C".GetHashCode(); return "C".GetHashCode();
} }
public override string ToString() => "End";
} }
public partial class Visitor<T> { public Func<T> Space { get; set; } } public partial class Visitor<T> { public Func<T> Space { get; set; } }
@ -70,6 +72,8 @@ public static partial class Lexer {
public override int GetHashCode() { public override int GetHashCode() {
return "C".GetHashCode(); return "C".GetHashCode();
} }
public override string ToString() => "Space";
} }
public partial class Visitor<T> { public Func<T> Int { get; set; } } public partial class Visitor<T> { public Func<T> Int { get; set; } }
@ -84,6 +88,8 @@ public static partial class Lexer {
public override int GetHashCode() { public override int GetHashCode() {
return "C".GetHashCode(); return "C".GetHashCode();
} }
public override string ToString() => "Int";
} }
public partial class Visitor<T> { public Func<T> Decimal { get; set; } } public partial class Visitor<T> { public Func<T> Decimal { get; set; } }
@ -98,6 +104,8 @@ public static partial class Lexer {
public override int GetHashCode() { public override int GetHashCode() {
return "C".GetHashCode(); return "C".GetHashCode();
} }
public override string ToString() => "Decimal";
} }
public partial class Visitor<T> { public Func<T> String { get; set; } } public partial class Visitor<T> { public Func<T> String { get; set; } }
@ -112,6 +120,8 @@ public static partial class Lexer {
public override int GetHashCode() { public override int GetHashCode() {
return "C".GetHashCode(); return "C".GetHashCode();
} }
public override string ToString() => "String";
} }
public partial class Visitor<T> { public Func<T> StringOpen { get; set; } } public partial class Visitor<T> { public Func<T> StringOpen { get; set; } }
@ -126,6 +136,8 @@ public static partial class Lexer {
public override int GetHashCode() { public override int GetHashCode() {
return "C".GetHashCode(); return "C".GetHashCode();
} }
public override string ToString() => "StringOpen";
} }
public partial class Visitor<T> { public Func<T> StringClose { get; set; } } public partial class Visitor<T> { public Func<T> StringClose { get; set; } }
@ -140,6 +152,8 @@ public static partial class Lexer {
public override int GetHashCode() { public override int GetHashCode() {
return "C".GetHashCode(); return "C".GetHashCode();
} }
public override string ToString() => "StringClose";
} }
} }

View File

@ -90,6 +90,8 @@ public static class Generator {
o.WriteLine($" return HashCode.Combine(\"{C}\", this.value);"); o.WriteLine($" return HashCode.Combine(\"{C}\", this.value);");
} }
o.WriteLine($" }}"); o.WriteLine($" }}");
o.WriteLine("");
o.WriteLine($" public override string ToString() => \"{C}\";");
o.WriteLine($" }}"); o.WriteLine($" }}");
o.WriteLine(""); o.WriteLine("");
} }

1
Tests/004-foo42.e Normal file
View File

@ -0,0 +1 @@
"foo"42

1
Tests/004-foo42.o Normal file
View File

@ -0,0 +1 @@
foo42

1
Tests/005-42foo.e Normal file
View File

@ -0,0 +1 @@
42"foo"

1
Tests/005-42foo.o Normal file
View File

@ -0,0 +1 @@
42foo

View File

@ -128,6 +128,17 @@ public static class Collection {
} }
} }
public static Option<T> First<T>(this IEnumerable<T> ie, Func<T, bool> predicate) {
var e = ie.GetEnumerator();
bool found = false;
while (e.MoveNext()) {
if (predicate(e.Current)) {
return e.Current.Some();
}
}
return Option.None<T>();
}
public static Option<T> Single<T>(this IEnumerable<T> ie) { public static Option<T> Single<T>(this IEnumerable<T> ie) {
var e = ie.GetEnumerator(); var e = ie.GetEnumerator();
if (e.MoveNext()) { if (e.MoveNext()) {
@ -141,4 +152,41 @@ public static class Collection {
return Option.None<T>(); return Option.None<T>();
} }
} }
public static Option<V> GetValue<K, V>(this Dictionary<K, V> d, K key) {
V result = default(V);
if (d.TryGetValue(key, out result)) {
return result.Some();
} else {
return Option.None<V>();
}
}
public static V GetOrDefault<K, V>(this Dictionary<K, V> d, K key, V defaultValue) {
V result = default(V);
if (d.TryGetValue(key, out result)) {
return result;
} else {
return defaultValue;
}
}
public class DefaultDictionary<TKey, TValue> : Dictionary<TKey, TValue> {
public readonly TValue defaultValue;
//public readonly Dictionary<TKey, TValue> dictionary;
public DefaultDictionary(TValue defaultValue, Dictionary<TKey, TValue> dictionary) : base(dictionary) {
this.defaultValue = defaultValue;
//this.dictionary = dictionary;
}
public TValue this[TKey key] {
get {
return this.GetOrDefault(key, defaultValue);
}
}
}
public static DefaultDictionary<UKey, UValue> ToDefaultDictionary<T, UKey, UValue>(this IEnumerable<T> e, UValue defaultValue, Func<T, UKey> key, Func<T, UValue> value)
=> new DefaultDictionary<UKey, UValue>(defaultValue, e.ToDictionary(key, value));
} }

View File

@ -1,7 +1,7 @@
namespace Immutable { namespace Immutable {
using System; using System;
public interface Option<out T> { public interface Option<out T> : System.Collections.Generic.IEnumerable<T> {
U Match_<U>(Func<T, U> some, Func<U> none); U Match_<U>(Func<T, U> some, Func<U> none);
} }
@ -10,18 +10,30 @@ namespace Immutable {
public static Option<T> None<T>() => new Types.None<T>(); public static Option<T> None<T>() => new Types.None<T>();
private static class Types { private static class Types {
public class Some<T> : Option<T> { public class Some<T> : Option<T>, System.Collections.IEnumerable {
public readonly T value; public readonly T value;
public Some(T value) { this.value = value; } public Some(T value) { this.value = value; }
public U Match_<U>(Func<T, U> Some, Func<U> None) => Some(value); public U Match_<U>(Func<T, U> Some, Func<U> None) => Some(value);
public System.Collections.Generic.IEnumerator<T> GetEnumerator()
=> value.Singleton().GetEnumerator();
System.Collections.IEnumerator System.Collections.IEnumerable.GetEnumerator()
=> this.GetEnumerator();
} }
public class None<T> : Option<T> { public class None<T> : Option<T>, System.Collections.IEnumerable {
public None() { } public None() { }
public U Match_<U>(Func<T, U> Some, Func<U> None) => None(); public U Match_<U>(Func<T, U> Some, Func<U> None) => None();
public System.Collections.Generic.IEnumerator<T> GetEnumerator()
=> System.Linq.Enumerable.Empty<T>().GetEnumerator();
System.Collections.IEnumerator System.Collections.IEnumerable.GetEnumerator()
=> this.GetEnumerator();
} }
} }
} }
@ -34,5 +46,20 @@ namespace Immutable {
public static U Match<T, U>(this Option<T> o, Func<T, U> some, U none) public static U Match<T, U>(this Option<T> o, Func<T, U> some, U none)
=> o.Match_(some, () => none); => o.Match_(some, () => none);
public static Option<U> Map<T, U>(this Option<T> o, Func<T, U> some)
=> o.Match_(value => some(value).Some(), () => Option.None<U>());
public static Option<U> IfSome<T, U>(this Option<T> o, Func<T, U> some)
=> o.Map(some);
public static T Else<T>(this Option<T> o, Func<T> none)
=> o.Match_(some => some, none);
public static Option<T> Else<T>(this Option<T> o, Func<Option<T>> none)
=> o.Match_(value => value.Some(), none);
public static T ElseThrow<T>(this Option<T> o, Func<Exception> none)
=> o.Match_(value => value, () => throw none());
} }
} }

View File

@ -12,6 +12,9 @@ public struct GraphemeCluster {
this.str = str; this.str = str;
this.codePoints = codePoints; this.codePoints = codePoints;
} }
public static implicit operator GraphemeCluster(char c)
=> new GraphemeCluster(false, c.ToString(), c.ToString().Singleton());
} }
public static class UnicodeExtensionMethods { public static class UnicodeExtensionMethods {