From e95cbfd1e5705c7483288adc53b868b8c4bcadcc Mon Sep 17 00:00:00 2001
From: Ruediger Ludwig <github@savinien.de>
Date: Sat, 10 Dec 2022 21:06:18 +0100
Subject: [PATCH] improvements to parser

---
 advent/parser/parser.py      | 37 ++++++++++++--------------
 advent/parser/test_parser.py | 50 ++++++++++++++++++------------------
 2 files changed, 42 insertions(+), 45 deletions(-)

diff --git a/advent/parser/parser.py b/advent/parser/parser.py
index 43b5954..986f867 100644
--- a/advent/parser/parser.py
+++ b/advent/parser/parser.py
@@ -207,7 +207,7 @@ class P(Generic[T]):
     def sep_by_lazy(self, sep: P[Any]) -> P[list[T]]:
         return P.map2(self, P.second(sep, self).many_lazy(), lambda f, r: [f] + r)
 
-    def no(self) -> P[tuple[()]]:
+    def no_match(self) -> P[tuple[()]]:
         def inner(parserPos: ParserInput) -> ParserResult[tuple[()]]:
             result = self.func(parserPos)
             try:
@@ -341,8 +341,10 @@ class P(Generic[T]):
     def choice2(cls, *ps: P[T]) -> P[T]:
         return P.choice(*ps)
 
+    # Start of String functions
+
     @classmethod
-    def one_char(cls) -> P[str]:
+    def any_char(cls) -> P[str]:
         def inner(parserPos: ParserInput) -> ParserResult[str]:
             if parserPos.has_data():
                 yield parserPos.step()
@@ -350,22 +352,19 @@ class P(Generic[T]):
 
     @classmethod
     def eof(cls) -> P[tuple[()]]:
-        def inner(parserPos: ParserInput) -> ParserResult[tuple[()]]:
-            if not parserPos.has_data():
-                yield parserPos, ()
-        return P(inner)
+        return P.any_char().no_match()
 
     @classmethod
     def char_func(cls, cmp: Callable[[str], bool]) -> P[str]:
-        return P.one_char().satisfies(cmp)
+        return P.any_char().satisfies(cmp)
 
     @classmethod
-    def is_char(cls, cmp: str) -> P[str]:
+    def char(cls, cmp: str) -> P[str]:
         return P.char_func(lambda c: c == cmp)
 
     @classmethod
     def string(cls, s: str) -> P[str]:
-        return P.seq(*map(P.is_char, s)).replace(s)
+        return P.seq(*map(P.char, s)).replace(s)
 
     @classmethod
     def one_of(cls, s: str) -> P[str]:
@@ -395,16 +394,14 @@ class P(Generic[T]):
     def space(cls) -> P[str]:
         return P.char_func(lambda c: c.isspace())
 
-    @classmethod
-    def word(cls, p1: P[str]) -> P[str]:
-        return P.first(p1.many().fmap(lambda cs: ''.join(cs)), p1.no())
+    def word(self) -> P[str]:
+        return P.first(self.many().fmap(lambda cs: ''.join(str(c) for c in cs)), self.no_match())
 
     @classmethod
     def unsigned(cls) -> P[int]:
-        return P.either(P.first(P.is_decimal(0), P.any_decimal().no()),
-                        P.map2(P.is_not_decimal(0), P.word(P.any_decimal()),
-                               lambda f, s: f + s)
-                        ).fmap(int)
+        return P.either(P.first(P.is_decimal(0), P.any_decimal().no_match()).replace(0),
+                        P.map2(P.is_not_decimal(0), P.any_decimal().word(),
+                               lambda f, s: int(f + s)))
 
     @classmethod
     def signed(cls) -> P[int]:
@@ -412,16 +409,16 @@ class P(Generic[T]):
                       lambda sign, num: num if sign != '-' else -num)
 
     def in_parens(self) -> P[T]:
-        return self.between(P.is_char('('), P.is_char(')'))
+        return self.between(P.char('('), P.char(')'))
 
     def in_angles(self) -> P[T]:
-        return self.between(P.is_char('<'), P.is_char('>'))
+        return self.between(P.char('<'), P.char('>'))
 
     def in_brackets(self) -> P[T]:
-        return self.between(P.is_char('['), P.is_char(']'))
+        return self.between(P.char('['), P.char(']'))
 
     def in_curleys(self) -> P[T]:
-        return self.between(P.is_char('{'), P.is_char('}'))
+        return self.between(P.char('{'), P.char('}'))
 
     def trim_left(self) -> P[T]:
         return P.second(WHITE_SPACE, self)
diff --git a/advent/parser/test_parser.py b/advent/parser/test_parser.py
index 485fc2d..c8f9817 100644
--- a/advent/parser/test_parser.py
+++ b/advent/parser/test_parser.py
@@ -3,7 +3,7 @@ import pytest
 
 
 def test_one_letter():
-    parser = P.is_char('!')
+    parser = P.char('!')
     input = '!'
     expected = '!'
     result = parser.parse(input).get()
@@ -11,7 +11,7 @@ def test_one_letter():
 
 
 def test_one_letter_longer():
-    parser = P.is_char('!')
+    parser = P.char('!')
     input = '!!'
     expected = '!'
     result = parser.parse(input).get()
@@ -66,7 +66,7 @@ def test_starting_zero():
 
 
 def test_between():
-    parser = P.signed().between(P.is_char('<'), P.is_char('>'))
+    parser = P.signed().between(P.char('<'), P.char('>'))
     input = '<-123456>'
     expected = -123456
     result = parser.parse(input).get()
@@ -74,7 +74,7 @@ def test_between():
 
 
 def test_sep_by():
-    parser = P.signed().sep_by(P.is_char(','))
+    parser = P.signed().sep_by(P.char(','))
     input = '2,3,5'
     expected = [[2, 3, 5], [2, 3], [2]]
     result = list(parser.parse_multi(input))
@@ -82,7 +82,7 @@ def test_sep_by():
 
 
 def test_sep_by_lazy():
-    parser = P.signed().sep_by_lazy(P.is_char(','))
+    parser = P.signed().sep_by_lazy(P.char(','))
     input = '2,3,5'
     expected = [[2], [2, 3], [2, 3, 5]]
     result = list(parser.parse_multi(input))
@@ -98,7 +98,7 @@ def test_trim():
 
 
 def test_sep_by_trim():
-    parser = P.signed().sep_by(P.is_char(',').trim()).trim()
+    parser = P.signed().sep_by(P.char(',').trim()).trim()
     input = ' 1 , 1 , 2 , 3 , 5 , 8 , 13!'
     expected = [1, 1, 2, 3, 5, 8, 13]
     result = parser.parse(input).get()
@@ -106,7 +106,7 @@ def test_sep_by_trim():
 
 
 def test_choice2():
-    parser = P.choice(P.is_char('a'), P.unsigned(), P.string('hallo'))
+    parser = P.choice(P.char('a'), P.unsigned(), P.string('hallo'))
     input = '1'
     expected = 1
     result = parser.parse(input).get()
@@ -120,7 +120,7 @@ def test_choice2():
 
 def test_seq():
     input = '1234'
-    parser = P.seq(P.one_char(), P.one_char(), P.one_char(), P.one_char())
+    parser = P.seq(P.any_char(), P.any_char(), P.any_char(), P.any_char())
     expected = ('1', '2', '3', '4')
     result = parser.parse(input).get()
     assert result == expected
@@ -129,7 +129,7 @@ def test_seq():
 def test_seq_seq():
     input = '1,2,3,4'
     digit = P.char_func(lambda c: c.isdigit(), )
-    parser = P.sep_seq(digit, digit, digit, digit, sep=P.is_char(','))
+    parser = P.sep_seq(digit, digit, digit, digit, sep=P.char(','))
 
     expected = ('1', '2', '3', '4')
     result = parser.parse(input).get()
@@ -138,7 +138,7 @@ def test_seq_seq():
 
 def test_not():
     input = 'a'
-    parser = P.second(P.is_char('!').no(), P.is_char('a'))
+    parser = P.second(P.char('!').no_match(), P.char('a'))
     expected = 'a'
     result = parser.parse(input).get()
     assert result == expected
@@ -150,7 +150,7 @@ def test_not():
 
 def test_multi():
     input = 'aa'
-    parser = P.is_char('a').many()
+    parser = P.char('a').many()
     expected = [['a', 'a'], ['a'], []]
     result = list(parser.parse_multi(input))
     assert result == expected
@@ -160,7 +160,7 @@ def test_either():
     input = 'aab'
     parser = P.either(
         P.seq(
-            P.is_char('a').many(), P.string('b')), P.seq(
+            P.char('a').many(), P.string('b')), P.seq(
             P.string('a'), P.string('ab')))
     expected = [(['a', 'a'], 'b'), ('a', 'ab')]
     result = list(parser.parse_multi(input))
@@ -169,7 +169,7 @@ def test_either():
 
 def test_seq_eof():
     input = 'aa'
-    parser = P.seq(P.is_char('a').many(), P.eof())
+    parser = P.seq(P.char('a').many(), P.eof())
     expected = [(['a', 'a'], ())]
     result = list(parser.parse_multi(input))
     assert result == expected
@@ -177,7 +177,7 @@ def test_seq_eof():
 
 def test_optional():
     input = '12'
-    parser = P.seq(P.is_char('1').optional(), P.unsigned())
+    parser = P.seq(P.char('1').optional(), P.unsigned())
     expected = [('1', 2), (None, 12)]
     result = list(parser.parse_multi(input))
     assert result == expected
@@ -185,7 +185,7 @@ def test_optional():
 
 def test_choice():
     input = '1'
-    parser = P.choice(P.is_char('1'), P.is_char('b'), P.unsigned())
+    parser = P.choice(P.char('1'), P.char('b'), P.unsigned())
     expected = ['1', 1]
     result = list(parser.parse_multi(input))
     assert result == expected
@@ -193,7 +193,7 @@ def test_choice():
 
 def test_times_exact():
     input = 'aaa'
-    parser = P.is_char('a').times(exact=2)
+    parser = P.char('a').times(exact=2)
     expected = [['a', 'a']]
     result = list(parser.parse_multi(input))
     assert result == expected
@@ -201,7 +201,7 @@ def test_times_exact():
 
 def test_times_min():
     input = 'aaa'
-    parser = P.is_char('a').times(min=2)
+    parser = P.char('a').times(min=2)
     expected = [['a', 'a', 'a'], ['a', 'a']]
     result = list(parser.parse_multi(input))
     assert result == expected
@@ -209,7 +209,7 @@ def test_times_min():
 
 def test_times_max():
     input = 'aaa'
-    parser = P.is_char('a').times(max=2)
+    parser = P.char('a').times(max=2)
     expected = [['a', 'a'], ['a'], []]
     result = list(parser.parse_multi(input))
     assert result == expected
@@ -217,7 +217,7 @@ def test_times_max():
 
 def test_some_lazy():
     input = 'aa'
-    parser = P.is_char('a').some_lazy()
+    parser = P.char('a').some_lazy()
     expected = [['a'], ['a', 'a']]
     result = list(parser.parse_multi(input))
     assert result == expected
@@ -225,7 +225,7 @@ def test_some_lazy():
 
 def test_many_lazy():
     input = 'aa'
-    parser = P.is_char('a').many_lazy()
+    parser = P.char('a').many_lazy()
     expected = [[], ['a'], ['a', 'a']]
     result = list(parser.parse_multi(input))
     assert result == expected
@@ -233,7 +233,7 @@ def test_many_lazy():
 
 def test_times_lazy_exact():
     input = 'aaa'
-    parser = P.is_char('a').times_lazy(exact=2)
+    parser = P.char('a').times_lazy(exact=2)
     expected = [['a', 'a']]
     result = list(parser.parse_multi(input))
     assert result == expected
@@ -241,7 +241,7 @@ def test_times_lazy_exact():
 
 def test_times_lazy_min():
     input = 'aaa'
-    parser = P.is_char('a').times_lazy(min=2)
+    parser = P.char('a').times_lazy(min=2)
     expected = [['a', 'a'], ['a', 'a', 'a']]
     result = list(parser.parse_multi(input))
     assert result == expected
@@ -249,7 +249,7 @@ def test_times_lazy_min():
 
 def test_times_lazy_max():
     input = 'aaa'
-    parser = P.is_char('a').times_lazy(max=2)
+    parser = P.char('a').times_lazy(max=2)
     expected = [[], ['a'], ['a', 'a']]
     result = list(parser.parse_multi(input))
     assert result == expected
@@ -257,7 +257,7 @@ def test_times_lazy_max():
 
 def test_word():
     input = '123'
-    parser = P.word(P.any_decimal())
+    parser = P.any_decimal().word()
     expected = ['123']
     result = list(parser.parse_multi(input))
     assert result == expected
@@ -265,7 +265,7 @@ def test_word():
 
 def test_word2():
     input = '123a'
-    parser = P.seq(P.word(P.any_decimal()), P.is_char('a'))
+    parser = P.seq(P.any_decimal().word(), P.char('a'))
     expected = [('123', 'a')]
     result = list(parser.parse_multi(input))
     assert result == expected