Fix LineReader bug (infinite loop)

Add UnitTest to FastLexer revealing bug

Fix LineReader bug (infinite loop)
Add UnitTest to FastLexer revealing bug
Cédric RICARD
1 parent bde59c8c
Showing 9 changed files with 347 additions and 225 deletions Show diff stats
anubis_dev/library/lexical_analysis/fast_lexer.anubis
anubis_dev/library/system/convert.anubis
anubis_dev/library/test/Anubis UnitTest.aproj
anubis_dev/library/test/all_unit_test.anubis
anubis_dev/library/test/lexical_analysis/fast_lexer.ut.anubis
anubis_dev/library/test/predefined/fast_lexer.unit_test.anubis
anubis_dev/library/test/tools/line_reader.ut.anubis
anubis_dev/library/tools/line_reader.anubis
anubis_dev/library/tools/unit_test.anubis
@@ -447,24 +447,24 @@ public define Maybe(LexingStream)   make_lexing_stream(SSL_Connection stream,
    file, in  particular at the  actual definition of  type 'LexingStream', and  write down
    another  such   function  (in  a   file  of  yours   within  which  you  put   a  'read
    fast_lexer.anubis').
-
-
-   To each lexing  stream is attached a function  for counting of type 'One  -> Int'. When
-   applied to  'unique', this function returns the  number of bytes already  read from the
-   lexing  stream,  i.e. the  position  from  which the  reading  of  te  next token  will
-   occur. This function is obtained as follows:
+
+
+   To each lexing  stream is attached a function  for counting of type 'One  -> Int'. When
+   applied to  'unique', this function returns the  number of bytes already  read from the
+   lexing  stream,  i.e. the  position  from  which the  reading  of the  next token  will
+   occur. This function is obtained as follows:
-public define One -> Int
-   offset_counter
-     (
-       LexingStream ls
-     ).
+public define One -> Int
+   offset_counter
+     (
+       LexingStream ls
+     ).
+   
+   If you  need  this function, it is recommended to call  'offset_counter' only once just
+   after the lexing stream is created.
-   If youn need  this function, it is recommended to call  'offset_counter' only once just
-   after the lexing stream is created.
-   
    *** (4) Constructing a lexer. 
       *** (4.1) Construction. 
@@ -580,7 +580,7 @@ public define Printable_tree
 read tools/basis.anubis
 read tools/streams.anubis
-
+read system/convert.anubis
    -------------------------------- Table of Contents ------------------------------------
@@ -740,13 +740,7 @@ define Maybe(ExChar)
          *** [1.5.1] Truncating a Word32 to a Word8. 
-define Word8
-   truncate_to_Word8
-     (
-       Word32 x
-     ) =
-   if x is word32(l1,_) then if l1 is word16(l2,_) then l2. 
-   
+  moved to system/convert.anubis   
          *** [1.5.2] Creating a range of consecutive characters.
@@ -1223,24 +1217,24 @@ public define String
 public type LexingStream:
    lexing_stream
      (
-       Var(ByteArray)               buffer_v,         // the current buffer
-       Var(Int)                     start_v,          // start of lexem in buffer
-       Var(FastLexerLastAccepted)   last_accept_v,    // last accepting position (if any)
-       Var(Int)                     current_v,        // position of reading in buffer
-       Int -> Maybe(One)            reload_buffer,    // command for loading the sequel in the buffer
-       Var(Int)                     current_offset_v  // accumulator for current offset
+       Var(ByteArray)               buffer_v,         // the current buffer
+       Var(Int)                     start_v,          // start of lexem in buffer
+       Var(FastLexerLastAccepted)   last_accept_v,    // last accepting position (if any)
+       Var(Int)                     current_v,        // position of reading in buffer
+       Int -> Maybe(One)            reload_buffer,    // command for loading the sequel in the buffer
+       Var(Int)                     current_offset_v  // accumulator for current offset
      ).
-   
-public define One -> Int
-   offset_counter
-     (
-       LexingStream ls
-     ) =
-   if ls is lexing_stream(_,_,_,_,_,v) then 
-   (One u) |-> *v. 
-   
-   
+   
+public define One -> Int
+   offset_counter
+     (
+       LexingStream ls
+     ) =
+   if ls is lexing_stream(_,_,_,_,_,v) then 
+   (One u) |-> *v. 
+   
+   
    While we are reading a lexeme, we keep the starting position (offset of first character
    of the  current lexeme) in 'start_v'  so as to be  able to extract the  lexeme. We also
    keep the last position at which a lexeme was accepted. This is because the lexer always
@@ -1272,8 +1266,8 @@ public define LexingStream
                  var(0),                // starting position
                  var(none),             // last accepting position
                  var(0),                // current position
-                 (Int u) |-> failure,   // buffer cannot be reloaded
-                 var(0)). 
+                 (Int u) |-> failure,   // buffer cannot be reloaded
+                 var(0)). 
@@ -1308,7 +1302,7 @@ public define Maybe(LexingStream)
                 start_v          = var((Int)0), 
                 last_accepted_v  = var((FastLexerLastAccepted)none),
                 current_v        = var((Int)0), 
-                offset_v         = var((Int)0), 
+                offset_v         = var((Int)0), 
                 reload_buffer    = (Int i) |-> 
                   if read(stream,buffer_size,timeout) is 
                     {
@@ -1317,13 +1311,13 @@ public define Maybe(LexingStream)
                       ok(more)   then 
                         //print("Buffer reloaded ("+abs_to_decimal(length(more))+" bytes).\n"); 
                         if length(more) = 0
-                        then (with old_buffer  = *buffer_v, 
-                                   old_length  = length(old_buffer), 
-                                   dropped     = *start_v, // number of bytes dropped from old buffer
+                        then (with old_buffer  = *buffer_v, 
+                                   old_length  = length(old_buffer), 
+                                   dropped     = *start_v, // number of bytes dropped from old buffer
                               buffer_v <- extract(old_buffer,dropped,old_length); 
                               start_v <- 0; 
                               current_v <- *current_v - dropped; 
-                              /* reloading does not change the current offset */
+                              /* reloading does not change the current offset */
                               last_accepted_v <-
                                 if *last_accepted_v is 
                                   {
@@ -1337,7 +1331,7 @@ public define Maybe(LexingStream)
                               buffer_v <- extract(old_buffer,dropped,old_length)+more; 
                               start_v <- 0; 
                               current_v <- *current_v - dropped; 
-                              /* reloading does not change the current offset */
+                              /* reloading does not change the current offset */
                               last_accepted_v <-
                                 if *last_accepted_v is 
                                   {
@@ -1350,8 +1344,8 @@ public define Maybe(LexingStream)
                                start_v,
                                last_accepted_v,
                                current_v,
-                               reload_buffer,
-                               offset_v))
+                               reload_buffer,
+                               offset_v))
      }.
@@ -1390,7 +1384,7 @@ public define Maybe(LexingStream)
                 start_v          = var((Int)0), 
                 last_accepted_v  = var((FastLexerLastAccepted)none),
                 current_v        = var((Int)0), 
-                offset_v         = var((Int)0), 
+                offset_v         = var((Int)0), 
                 reload_buffer    = (Int i) |-> 
                   if (Maybe(ByteArray))read(stream,buffer_size,timeout) is 
                     {
@@ -1403,7 +1397,7 @@ public define Maybe(LexingStream)
                               buffer_v <- extract(old_buffer,dropped,old_length); 
                               start_v <- 0; 
                               current_v <- *current_v - dropped; 
-                              /* reloading does not change the current offset */
+                              /* reloading does not change the current offset */
                               last_accepted_v <-
                                 if *last_accepted_v is 
                                   {
@@ -1417,7 +1411,7 @@ public define Maybe(LexingStream)
                               buffer_v <- extract(old_buffer,dropped,old_length)+more; 
                               start_v <- 0; 
                               current_v <- *current_v - dropped; 
-                              /* reloading does not change the current offset */
+                              /* reloading does not change the current offset */
                               last_accepted_v <-
                                 if *last_accepted_v is 
                                   {
@@ -1430,8 +1424,8 @@ public define Maybe(LexingStream)
                                start_v,
                                last_accepted_v,
                                current_v,
-                               reload_buffer,
-                               offset_v))
+                               reload_buffer,
+                               offset_v))
      }.
@@ -2289,9 +2283,9 @@ define One -&gt; LexerOutput($Token)
         Word16                      starting_state) -> FastLexerOutput    lexer, 
        MVar(LexerAction($Token))                                          actions       
      ) = 
-   if stream is lexing_stream(buffer_v,start_v,last_accept_v,current_v,reload_buffer,offset_v) then 
-   (One _) |-l-> with old_current = *current_v, 
-                 if lexer(*buffer_v,
+   if stream is lexing_stream(buffer_v,start_v,last_accept_v,current_v,reload_buffer,offset_v) then 
+   (One _) |-l-> with old_current = *current_v, 
+                 if lexer(*buffer_v,
                           *last_accept_v,
                           *current_v,
                           0) // reading a new token always starts in state 0
@@ -2303,7 +2297,7 @@ define One -&gt; LexerOutput($Token)
                 not_at_end_of_input then 
                   with result = (LexerOutput($Token))error(extract(*buffer_v,*start_v,end)),
                   current_v <- end+1; 
-                  offset_v <- *offset_v + (end + 1 - old_current);
+                  offset_v <- *offset_v + (end + 1 - old_current);
                   start_v <- end+1; 
                   last_accept_v <- none;
                   result, 
@@ -2326,7 +2320,7 @@ define One -&gt; LexerOutput($Token)
                     {
                       ignore then 
                         current_v <- end; 
-                        offset_v <- *offset_v + (end - old_current);
+                        offset_v <- *offset_v + (end - old_current);
                         start_v <- end; 
                         last_accept_v <- none; 
                         l(unique),   // ignore and try to read the next token 
@@ -2334,7 +2328,7 @@ define One -&gt; LexerOutput($Token)
                       return(f) then 
                         with result = f(extract(*buffer_v,*start_v,end)),
                         current_v <- end; 
-                        offset_v <- *offset_v + (end - old_current);
+                        offset_v <- *offset_v + (end - old_current);
                         start_v <- end; 
                         last_accept_v <- none; 
                         result
@@ -2351,7 +2345,7 @@ define One -&gt; LexerOutput($Token)
                             return(f)  then 
                               with result = f(extract(*buffer_v,*start_v,end)),
                               current_v <- end; 
-                              offset_v <- *offset_v + (end - old_current);
+                              offset_v <- *offset_v + (end - old_current);
                               start_v <- end; 
                               last_accept_v <- none; 
                               result
@@ -92,18 +92,18 @@ public define inline ByteArray
 // Obsolete name, should be removed
 public define inline Word8
-  truncate_to_word8
-  (
-    Word32 value
-  ) =
-  truncate_to_Word8(to_Int(value)).
+   truncate_to_word8
+     (
+       Word32 x
+     ) =
+   if x is word32(l1,_) then if l1 is word16(l2,_) then l2. 
 public define inline Word8
-  truncate_to_Word8
-  (
-    Word32 value
-  ) =
-  truncate_to_Word8(to_Int(value)).
+   truncate_to_Word8
+     (
+       Word32 x
+     ) =
+   if x is word32(l1,_) then if l1 is word16(l2,_) then l2. 
 public define inline Word32
   word8_to_Word32
@@ -32,6 +32,7 @@
   <Import Project="$(AnubisBinPath)\Anubis.Build.targets" />
   <ItemGroup>
     <Compile Include="all_unit_test.anubis" />
+    <Compile Include="lexical_analysis\fast_lexer.ut.anubis" />
     <Compile Include="predefined\date_and_time.unit_test.anubis" />
     <Compile Include="predefined\decimal_scan.unit_test.anubis" />
     <Compile Include="predefined\fast_lexer.unit_test.anubis" />
@@ -48,6 +49,7 @@
     <Compile Include="tools\utf-8.unit_test.anubis" />
   </ItemGroup>
   <ItemGroup>
+    <Folder Include="lexical_analysis" />
     <Folder Include="predefined" />
     <Folder Include="system" />
     <Folder Include="tools" />
@@ -10,6 +10,7 @@ read test/predefined/sqlite.unit_test.anubis
 read test/predefined/fast_lexer.unit_test.anubis
 read test/system/convert.unit_test.anubis
+read test/lexical_analysis/fast_lexer.ut.anubis
 read test/system/message_queue.unit_test.anubis
 read test/system/message_transceiver.unit_test.anubis
 read test/system/string.unit_test.anubis
@@ -37,7 +38,8 @@ define List(UnitTestSuite)
     make_SQLite_test_suite,
     make_UTF8_test_suite,
     make_line_reader_test_suite,
-    make_fast_lexer_test_suite
+    make_fast_lexer_test_suite,
+    make_fast_lexer_test_suite2,
   ]
   .
+/*
+ * Created by PyramIDE.
+ * User: ricard
+ * Date: 19/09/2008
+ * Time: 14:24
+ * 
+ */
+
+read tools/unit_test.anubis
+read lexical_analysis/fast_lexer.anubis
+
+type InfLoopToken:
+   line(String),
+   eol.   
+   
+define String
+  token_to_string
+  (
+    LexerOutput(InfLoopToken) output
+  ) =  /* textual form of a lexer output; handed to assertIsSame as the formatter */
+  if output is
+  {
+    end_of_input   then /* the lexer found no more input */ 
+      "End of input",
+    
+    error(b)       then
+      /* 'b' holds the bytes carried by the lexer's error output */
+      "Lexer error: ["+to_string(b)+"]",
+    
+    token(t)       then 
+      /* a token has been recognized: show which alternative it is */
+      if t is 
+      {
+        line(l) then
+          "token: line("+l+")",
+        eol then 
+          "token: eol"
+      }
+  }.
+
+
+define One
+   infinite_loop_test
+     (
+       UnitTestContext ut
+     ) =
+  if make_lexer_and_automaton([
+                                lexer_item("#r?#n", return((ByteArray b) |-> token(eol))),
+                                lexer_item("[^\r\n]*", return((ByteArray b) |-> token(line(to_string(b))))),
+                              ],
+                              '#') is
+  {
+    error(msg) then print("Syntax error in regular expression: "+to_English(msg)+"\n"); assertIsTrue(ut, false, "Can't create lexer"),
+    ok(p) then if p is (lexer, automaton) then
+      with next_token = lexer(make_lexing_stream("mon texte\n\r\nla suite")),
+      assertIsSame(ut, next_token(unique), token(line("mon texte")), token_to_string,  "#1 1st line");
+      assertIsSame(ut, next_token(unique), token(eol),               token_to_string,  "#1 1st EOF");
+      //assertIsSame(ut, next_token(unique), token(line("")),          token_to_string,  "#1 2nd line");
+      assertIsSame(ut, next_token(unique), token(eol),               token_to_string,  "#1 2nd EOF");
+      assertIsSame(ut, next_token(unique), token(line("la suite")),   token_to_string, "#1 3rd line");
+      //assertIsSame(ut, next_token(unique), token(eol),               token_to_string,  "#1 3rd EOF");
+      assertIsSame(ut, next_token(unique), end_of_input,            token_to_string,   "#1 EOF");
+
+
+      with next_token = lexer(make_lexing_stream("mon texte\r\n\rla suite")),
+      assertIsSame(ut, next_token(unique), token(line("mon texte")), token_to_string,  "#2 1st line");
+      assertIsSame(ut, next_token(unique), token(eol),               token_to_string,  "#2 1st EOF");
+      assertIsSame(ut, next_token(unique), error(to_byte_array("\r")), token_to_string,  "#2 error");
+      //assertIsSame(ut, next_token(unique), token(line("")),          token_to_string,  "#2 2nd line");
+      //assertIsSame(ut, next_token(unique), token(eol),               token_to_string,  "#2 2nd EOF");
+      //assertIsSame(ut, next_token(unique), token(line("la suite")),   token_to_string, "#2 3rd line");
+      //assertIsSame(ut, next_token(unique), token(eol),               token_to_string,  "#2 3rd EOF");
+      //assertIsSame(ut, next_token(unique), end_of_input,            token_to_string,   "#2 EOF");
+      unique
+  }. 
+
+
+   
+public define UnitTestSuite 
+   make_fast_lexer_test_suite2
+      =
+   ut_suite("lexical_analysis.fast_lexer",
+     [
+       ut_fixture("infinite_loop",  infinite_loop_test)
+     ]).
+   
+   
-
-   
-read tools/unit_test.anubis
-
-   
-define String
-   format
-     (
-       AtEndOfInput a
-     )  =
-   if a is
-     {
-       not_at_end_of_input then "not_at_end_of_input", 
-       at_end_of_input then "at_end_of_input"
-     }.
-   
-   
-define FastLexerOutput
-   test_fast_lexer
-     (
-        List(FastLexerState)        lexer,
-        ByteArray                   input, 
-        FastLexerLastAccepted       last_accepted,
-        Int                         position,
-        Word16                      state
-     ) =
-   if make_fast_lexer(lexer) is 
-     {
-       unknown_state(n) then print("fast lexer unknown state: "+to_decimal(n)+"\n"); alert, 
-       too_many_states  then print("too many states.\n"); alert,
-       ok(fl) then with result = fl(input,last_accepted,position,state),
-         
-         if result is 
-           {
-             rejected(w,e,a) then 
-               print("\nrejected("+to_decimal(w)+","+abs_to_decimal(e)+","+format(a)+")\n"),
-             accepted(w,e,a,_) then 
-               print("\naccepted("+to_decimal(w)+","+abs_to_decimal(e)+","+format(a)+")\n")
-           };
-         
-         result
-     }. 
-   
-
-   
-   A lexer accepting "g+abu", "g+abuzo",
-   
-define List(FastLexerState)   
-   lexer_1 
-     =
-   [
-     /* state 0  */ rejecting([transition('g',1)]),
-     /* state 1  */ rejecting([transition('a',2),transition('g',1)]),
-     /* state 2  */ rejecting([transition('b',3)]),
-     /* state 3  */ rejecting([transition('u',4)]),
-     /* state 4  */ accepting([transition('z',5)]),
-     /* state 5  */ rejecting([transition('o',6)]),
-     /* state 6  */ accepting([ ])
-   ]. 
-   
-   
-define One
-   fast_lexer_test
-     (
-       UnitTestContext ut
-     ) =
-   
-   /* starting in state 0, position 0 */
-   assertIsSame(ut,
-                test_fast_lexer(lexer_1,to_byte_array("gab"),none,0,0),
-                rejected(3,3,at_end_of_input),    "1");
-   unique. 
-   
-   
-   assertIsSame(ut,
-                test_fast_lexer(lexer_1,to_byte_array("gabu"),none,bol,neol,0,0),
-                accepted(4,4,at_end_of_input),    "2");
-   assertIsSame(ut,
-                test_fast_lexer(lexer_1,to_byte_array("ggggabu"),none,bol,neol,0,0),
-                accepted(4,7,at_end_of_input),    "2bis");
-   assertIsSame(ut,
-                test_fast_lexer(lexer_1,to_byte_array("gabuz"),none,bol,neol,0,0),
-                accepted(4,4,at_end_of_input),    "3");
-   assertIsSame(ut,
-                test_fast_lexer(lexer_1,to_byte_array("gmbuz"),none,bol,neol,0,0),
-                rejected(1,1,not_at_end_of_input),"4");
-   assertIsSame(ut,
-                test_fast_lexer(lexer_1,to_byte_array("gabuzo"),none,bol,neol,0,0),
-                accepted(6,6,at_end_of_input),    "5"); 
-   assertIsSame(ut,
-                test_fast_lexer(lexer_1,to_byte_array("gabuzobof"),none,bol,neol,0,0),
-                accepted(6,6,not_at_end_of_input),    "6"); 
-   assertIsSame(ut,
-                test_fast_lexer(lexer_1,to_byte_array("gggggabuzobof"),none,bol,neol,0,0),
-                accepted(6,10,not_at_end_of_input),    "6bis"); 
-   
-   /* restarting from some other state (with or without an already accepted position) */ 
-   
-   assertIsSame(ut,
-                test_fast_lexer(lexer_1,to_byte_array("bu"),none,bol,neol,0,2),
-                accepted(4,2,at_end_of_input),    "7"); 
-   assertIsSame(ut,
-                test_fast_lexer(lexer_1,to_byte_array("gabuzfff"),last(4,4),bol,neol,5,5),
-                accepted(4,4,not_at_end_of_input),    "8"); 
-   assertIsSame(ut,
-                test_fast_lexer(lexer_1,to_byte_array("gabuzomeu"),last(4,4),bol,neol,5,5),
-                accepted(6,6,not_at_end_of_input),    "9"); 
-
-   /* testing bol and eol */ 
-   assertIsSame(ut,
-                test_fast_lexer(lexer_1,to_byte_array("meu"),none,bol,neol,0,0),
-                accepted(6,6,not_at_end_of_input),    "9"); 
-   
-   
-   unique. 
-   
-   
-   
-   
-   
-   
-   
-public define UnitTestSuite 
-   make_fast_lexer_test_suite
-      =
-   ut_suite("predefined.fast_lexer",
-     [
-       ut_fixture("fast lexer",  fast_lexer_test)
-     ]).
-   
-   
-global define One
-  fast_lexer_unit_test
-  (
-    List(String) args
-  )=
-  execute_tests([make_fast_lexer_test_suite], args).
-
-   
 \ No newline at end of file
+
+   
+read tools/unit_test.anubis
+
+   
+define String
+   format
+     (
+       AtEndOfInput a
+     )  =
+   if a is
+     {
+       not_at_end_of_input then "not_at_end_of_input", 
+       at_end_of_input then "at_end_of_input"
+     }.
+   
+   
+define FastLexerOutput
+   test_fast_lexer
+     (
+        List(FastLexerState)        lexer,
+        ByteArray                   input, 
+        FastLexerLastAccepted       last_accepted,
+        Int                         position,
+        Word16                      state
+     ) =
+   if make_fast_lexer(lexer) is 
+     {
+       unknown_state(n) then print("fast lexer unknown state: "+to_decimal(n)+"\n"); alert, 
+       too_many_states  then print("too many states.\n"); alert,
+       ok(fl) then with result = fl(input,last_accepted,position,state),
+         
+         if result is 
+           {
+             rejected(w,e,a) then 
+               print("\nrejected("+to_decimal(w)+","+abs_to_decimal(e)+","+format(a)+")\n"),
+             accepted(w,e,a,_) then 
+               print("\naccepted("+to_decimal(w)+","+abs_to_decimal(e)+","+format(a)+")\n")
+           };
+         
+         result
+     }. 
+   
+
+   
+   A lexer accepting "g+abu", "g+abuzo",
+   
+define List(FastLexerState)   
+   lexer_1 
+     =
+   [
+     /* state 0  */ rejecting([transition('g',1)]),
+     /* state 1  */ rejecting([transition('a',2),transition('g',1)]),
+     /* state 2  */ rejecting([transition('b',3)]),
+     /* state 3  */ rejecting([transition('u',4)]),
+     /* state 4  */ accepting([transition('z',5)]),
+     /* state 5  */ rejecting([transition('o',6)]),
+     /* state 6  */ accepting([ ])
+   ]. 
+   
+   
+define One
+   fast_lexer_test
+     (
+       UnitTestContext ut
+     ) =
+   
+   /* starting in state 0, position 0 */
+   assertIsSame(ut,
+                test_fast_lexer(lexer_1,to_byte_array("gab"),none,0,0),
+                rejected(3,3,at_end_of_input),    "1");
+   unique. 
+   
+   
+   assertIsSame(ut,
+                test_fast_lexer(lexer_1,to_byte_array("gabu"),none,bol,neol,0,0),
+                accepted(4,4,at_end_of_input),    "2");
+   assertIsSame(ut,
+                test_fast_lexer(lexer_1,to_byte_array("ggggabu"),none,bol,neol,0,0),
+                accepted(4,7,at_end_of_input),    "2bis");
+   assertIsSame(ut,
+                test_fast_lexer(lexer_1,to_byte_array("gabuz"),none,bol,neol,0,0),
+                accepted(4,4,at_end_of_input),    "3");
+   assertIsSame(ut,
+                test_fast_lexer(lexer_1,to_byte_array("gmbuz"),none,bol,neol,0,0),
+                rejected(1,1,not_at_end_of_input),"4");
+   assertIsSame(ut,
+                test_fast_lexer(lexer_1,to_byte_array("gabuzo"),none,bol,neol,0,0),
+                accepted(6,6,at_end_of_input),    "5"); 
+   assertIsSame(ut,
+                test_fast_lexer(lexer_1,to_byte_array("gabuzobof"),none,bol,neol,0,0),
+                accepted(6,6,not_at_end_of_input),    "6"); 
+   assertIsSame(ut,
+                test_fast_lexer(lexer_1,to_byte_array("gggggabuzobof"),none,bol,neol,0,0),
+                accepted(6,10,not_at_end_of_input),    "6bis"); 
+   
+   /* restarting from some other state (with or without an already accepted position) */ 
+   
+   assertIsSame(ut,
+                test_fast_lexer(lexer_1,to_byte_array("bu"),none,bol,neol,0,2),
+                accepted(4,2,at_end_of_input),    "7"); 
+   assertIsSame(ut,
+                test_fast_lexer(lexer_1,to_byte_array("gabuzfff"),last(4,4),bol,neol,5,5),
+                accepted(4,4,not_at_end_of_input),    "8"); 
+   assertIsSame(ut,
+                test_fast_lexer(lexer_1,to_byte_array("gabuzomeu"),last(4,4),bol,neol,5,5),
+                accepted(6,6,not_at_end_of_input),    "9"); 
+
+   /* testing bol and eol */ 
+   assertIsSame(ut,
+                test_fast_lexer(lexer_1,to_byte_array("meu"),none,bol,neol,0,0),
+                accepted(6,6,not_at_end_of_input),    "9"); 
+   
+   
+   unique. 
+   
+
+
+   
+   
+   
+public define UnitTestSuite 
+   make_fast_lexer_test_suite
+      =
+   ut_suite("predefined.fast_lexer",
+     [
+       ut_fixture("fast lexer",  fast_lexer_test)
+     ]).
+   
+   
@@ -31,11 +31,39 @@ define One
       }
   }.
+define One 
+  infinite_loop_test
+  (
+    UnitTestContext ut
+  ) =
+  if make_line_reader("mon texte\n\r\nla suite") is
+  {
+    failure then assertIsTrue(ut, false, "#1 make_line_reader"),
+    success(lr) then
+      assertIsSuccessString(ut, read_line(lr), "mon texte", "#1 1st line");
+      assertIsSuccessString(ut, read_line(lr), "",          "#1 2nd line");
+      assertIsSuccessString(ut, read_line(lr), "la suite",  "#1 3rd line");
+      assertIsFailure(ut, read_line(lr), "#1 EOF");
+      unique
+  };
+
+  if make_line_reader("mon texte\r\n\rla suite") is
+  {
+    failure then assertIsTrue(ut, false, "#2 make_line_reader"),
+    success(lr) then
+      assertIsSuccessString(ut, read_line(lr), "mon texte", "#2 1st line");
+      assertIsSuccessString(ut, read_line(lr), "",          "#2 2nd line");
+      assertIsSuccessString(ut, read_line(lr), "la suite",  "#2 3rd line");
+      assertIsFailure(ut, read_line(lr), "#2 EOF");
+      unique
+  }.
+  
 public define UnitTestSuite 
    make_line_reader_test_suite
       =
    ut_suite("tools.line_reader",
      [
        ut_fixture("line_reader",  line_reader_test),
+       ut_fixture("infinite_loop",  infinite_loop_test, false),
      ]).
@@ -30,7 +30,7 @@ public define Maybe(String)
   (
     LineReader   lr,
   ) = 
-  if lr is line_reader(lexer, _) then
+  if lr is line_reader(lexer, offset) then
   if lexer(unique) is 
   {
     end_of_input   then /* no more token: exit the main loop */ 
@@ -46,7 +46,7 @@ public define Maybe(String)
       if t is 
       {
         line(l) then
-          //print("tk: line("+l+")\n");
+          //print("tk: line("+l+") @ "+abs_to_decimal(offset(unique))+"\n");
           forget(lexer(unique)); // reading EOL
           success(l),
         eol then 
@@ -64,6 +64,7 @@ public define Maybe(LineReader)
   ) =
   if make_lexer_and_automaton([
                                 lexer_item("#r?#n", return((ByteArray b) |-> token(eol))),
+                                lexer_item("#r", return((ByteArray b) |-> token(eol))),
                                 lexer_item("[^\r\n]*", return((ByteArray b) |-> token(line(to_string(b))))),
                               ],
                               '#') is
@@ -18,11 +18,13 @@ type UnitTestSuiteResult:
   ut_suite_result(String                    test_suite_name,
                   Word32                       passed_count,
                   Word32                       failed_count,
+                  Word32                       ignored_count,
                   List(UnitTestResult)      fixture_results).
 type UnitTestGlobalResult:
   ut_global_result(Word32                       total_passed,
                    Word32                       total_failed,
+                   Word32                       total_ignored,
                    List(UnitTestSuiteResult) suite_results).
 public type UnitTestContext:
@@ -51,28 +53,34 @@ define UnitTestContext
 public type UnitTestFixture:
   ut_fixture(String                   test_name, 
-             (UnitTestContext) -> One the_test).
+             (UnitTestContext) -> One the_test, 
+             Bool                     active).  // set this to false to ignore this fixture
+
+public define UnitTestFixture
+  ut_fixture(String                   test_name, 
+             (UnitTestContext) -> One the_test) =   ut_fixture(test_name, the_test, true).
 public type UnitTestSuite:
   ut_suite(String                 suite_name,
            List(UnitTestFixture)  fixtures).
-define (Word32 /*passed*/, Word32 /*failed*/, List(UnitTestResult))
+define (Word32 /*passed*/, Word32 /*failed*/, Word32 /*ignored*/, List(UnitTestResult))
   run_test_suite
   (
     List(UnitTestFixture)      tests,
     String                     filter,
     Word32                     passed,
     Word32                     failed,
+    Word32                     ignored,
     List(UnitTestResult)       results
   ) =
   if tests is
     {
-      [ ]         then (passed, failed, reverse(results)), //print("All tests finish"),
+      [ ]         then (passed, failed, ignored, reverse(results)), //print("All tests finish"),
       [test . t]  then
         //print("\nTesting " + test.test_name + "...    (filter = '"+filter+"')\n");
         with ut = make_new_context,
-        if length(filter) = 0 | filter = test.test_name then
+        if (length(filter) = 0 & active(test)) | filter = test.test_name then
           the_test(test)(ut);
           if *ut.failed_tests is
           {
@@ -81,6 +89,7 @@ define (Word32 /*passed*/, Word32 /*failed*/, List(UnitTestResult))
                              filter,
                              passed + 1, 
                              failed, 
+                             ignored,
                              [ut_result(test.test_name, ok(unique)) . results]),
             [h . _] then print("F"); 
@@ -94,13 +103,15 @@ define (Word32 /*passed*/, Word32 /*failed*/, List(UnitTestResult))
                              filter,
                              passed, 
                              failed + 1, 
+                             ignored,
                              map_add(*ut.failed_tests, results))
           }
         else
           run_test_suite(t, 
                          filter,
                          passed, 
-                         failed, 
+                         failed,
+                         ignored + if active(test) then 0 else 1, // only explicitely ignored test are counted
                          results)
      }.
@@ -108,18 +119,19 @@ define (Word32 /*passed*/, Word32 /*failed*/, List(UnitTestResult))
-define (Word32 /* passed */, Word32 /* failed */, List(UnitTestSuiteResult))
+define (Word32 /* passed */, Word32 /* failed */, Word32 /*ignored*/, List(UnitTestSuiteResult))
    execute_tests
      (
        List(UnitTestSuite)          suites,
        String                       filter,
        Word32                       passed,
        Word32                       failed,
+       Word32                       ignored,
        List(UnitTestSuiteResult)    results
      )=
   if suites is
   {
-    [ ]      then (passed, failed, results),
+    [ ]      then (passed, failed, ignored, results),
     [h . t]  then
       with filter_length = length(filter),
            fixture_name_length = length(h.suite_name),
@@ -127,15 +139,16 @@ define (Word32 /* passed */, Word32 /* failed */, List(UnitTestSuiteResult))
               if filter_length = 0 | start_with(filter + ".", h.suite_name + ".") | start_with(h.suite_name + ".", filter + ".") then  //"." is added to avoid partial name match
                 with new_filter = if filter_length > fixture_name_length then force(sub_string(filter, fixture_name_length + 1, filter_length - fixture_name_length - 1), "")
                                                                          else "",
-                run_test_suite(h.fixtures, new_filter, 0, 0, []) 
+                run_test_suite(h.fixtures, new_filter, 0, 0, 0, []) 
               else
-                (0, 0, []),
-      if all_fixture_results is (fixture_passed, fixture_failed, fixture_results) then
+                (0, 0, 0, []),
+      if all_fixture_results is (fixture_passed, fixture_failed, fixture_ignored, fixture_results) then
         execute_tests(t,
                       filter,
                       passed + fixture_passed, 
                       failed + fixture_failed, 
-                      [ut_suite_result(h.suite_name, fixture_passed, fixture_failed, fixture_results) 
+                      ignored + fixture_ignored,
+                      [ut_suite_result(h.suite_name, fixture_passed, fixture_failed, fixture_ignored, fixture_results) 
                          . results])
   }.
@@ -196,7 +209,7 @@ public define One
   )=
   with start_time = (UTime)unow,
        filter = force(nth(0, args), ""),
-  if execute_tests(suites, filter, 0, 0, []) is (passed, failed, results) then
+  if execute_tests(suites, filter, 0, 0, 0, []) is (passed, failed, ignored, results) then
 	println("");
   output_suite_results(results);
   println("----------------------------------------------------------------------");  
@@ -204,9 +217,13 @@ public define One
   println("Ran " + (passed + failed) + " tests in " + 
      to_decimal(duration.seconds) + "." + zero_pad_n(3, duration.microseconds \ 1000) + "s");
   println("");
+  println("Tests passed  = " + passed);
+  println("Tests failed  = " + failed);
+  println("Tests ignored = " + ignored);
+  println("");
   (
   if failed >+ 0 then
-    println("FAILED (failures=" + failed + ")")
+    println("FAILED")
   else
     println("OK")
   );