The R13B03 release.OTP_R13B03

author: Erlang/OTP <[email protected]> 2009-11-20 14:54:40 +0000
committer: Erlang/OTP <[email protected]> 2009-11-20 14:54:40 +0000
commit: 84adefa331c4159d432d22840663c38f155cd4c1 (patch)
tree: bff9a9c66adda4df2106dfd0e5c053ab182a12bd /lib/stdlib/test/erl_scan_SUITE.erl
download: otp-84adefa331c4159d432d22840663c38f155cd4c1.tar.gz
otp-84adefa331c4159d432d22840663c38f155cd4c1.tar.bz2
otp-84adefa331c4159d432d22840663c38f155cd4c1.zip
1 files changed, 1214 insertions, 0 deletions
diff --git a/lib/stdlib/test/erl_scan_SUITE.erl b/lib/stdlib/test/erl_scan_SUITE.erl
new file mode 100644
index 0000000000..32a06d15c7
--- /dev/null
+++ b/lib/stdlib/test/erl_scan_SUITE.erl
@@ -0,0 +1,1214 @@
+%%
+%% %CopyrightBegin%
+%% 
+%% Copyright Ericsson AB 1998-2009. All Rights Reserved.
+%% 
+%% The contents of this file are subject to the Erlang Public License,
+%% Version 1.1, (the "License"); you may not use this file except in
+%% compliance with the License. You should have received a copy of the
+%% Erlang Public License along with this software. If not, it can be
+%% retrieved online at http://www.erlang.org/.
+%% 
+%% Software distributed under the License is distributed on an "AS IS"
+%% basis, WITHOUT WARRANTY OF ANY KIND, either express or implied. See
+%% the License for the specific language governing rights and limitations
+%% under the License.
+%% 
+%% %CopyrightEnd%
+
+-module(erl_scan_SUITE).
+-export([all/1]).
+
+-export([error/1, error_1/1, error_2/1, iso88591/1, otp_7810/1]).
+
+-import(lists, [nth/2,flatten/1]).
+-import(io_lib, [print/1]).
+
+%%
+%% Define to run outside of test server
+%%
+%-define(STANDALONE,1).
+
+-ifdef(STANDALONE).
+-compile(export_all).
+-define(line, put(line, ?LINE), ).
+-define(config(A,B),config(A,B)).
+-define(t, test_server).
+%% config(priv_dir, _) ->    
+%%     ".";
+%% config(data_dir, _) ->
+%%     ".".
+-else.
+-include("test_server.hrl").
+-export([init_per_testcase/2, fin_per_testcase/2]).
+
+init_per_testcase(_Case, Config) when is_list(Config) ->
+    ?line Dog=test_server:timetrap(test_server:seconds(1200)),
+    [{watchdog, Dog}|Config].
+ 
+fin_per_testcase(_Case, Config) ->
+    Dog=?config(watchdog, Config),
+    test_server:timetrap_cancel(Dog),
+    ok.
+-endif.
+
+% Default timetrap timeout (set in init_per_testcase).
+-define(default_timeout, ?t:minutes(1)).
+
+all(doc) ->
+    ["Test cases for the 'erl_scan' module."];
+all(suite) ->
+    [error,iso88591,otp_7810].
+
+error(doc) ->
+    ["Error cases"];
+error(suite) ->
+    [error_1, error_2].
+
+error_1(doc) ->
+    ["(OTP-2347)"];
+error_1(suite) ->
+    [];
+error_1(Config) when is_list(Config) ->
+    ?line {error, _, _} = erl_scan:string("'a"),
+    ok.
+
+error_2(doc) ->
+    ["Checks that format_error works on the error cases."];
+error_2(suite) ->
+    [];
+error_2(Config) when is_list(Config) ->
+    ?line lists:foreach(fun check/1, error_cases()),
+    ok.
+
+error_cases() ->
+    ["'a",
+     "\"a",
+     "'\\",
+     "\"\\",
+     "$",
+     "$\\",
+     "2.3e",
+     "2.3e-",
+     "91#9"
+].
+
+assert_type(N, integer) when is_integer(N) ->
+    ok;
+assert_type(N, atom) when is_atom(N) ->
+    ok.
+    
+check(String) ->
+    Error = erl_scan:string(String),
+    check_error(Error, erl_scan).
+
+%%% (This should be useful for all format_error functions.)
+check_error({error, Info, EndLine}, Module0) ->
+    ?line {ErrorLine, Module, Desc} = Info,
+    ?line true = (Module == Module0),
+    ?line assert_type(EndLine, integer),
+    ?line assert_type(ErrorLine, integer),
+    ?line true = (ErrorLine =< EndLine),
+    ?line String = lists:flatten(Module0:format_error(Desc)),
+    ?line true = io_lib:printable_list(String).
+
+iso88591(doc) -> ["Tests the support for ISO-8859-1 i.e Latin-1"];
+iso88591(suite) -> [];
+iso88591(Config) when is_list(Config) ->
+    ?line ok =
+     case catch begin
+		   %% Some atom and variable names
+		   V1s = [$�,$�,$�,$�],
+		   V2s = [$N,$�,$r],
+		   A1s = [$h,$�,$r],
+		   A2s = [$�,$r,$e],
+		   %% Test parsing atom and variable characters.
+		   {ok,Ts1,_} = erl_scan:string(V1s ++ " " ++ V2s ++
+					       "\327" ++
+					       A1s ++ " " ++ A2s),
+		   V1s = atom_to_list(element(3, nth(1, Ts1))),
+		   V2s = atom_to_list(element(3, nth(2, Ts1))),
+		   A1s = atom_to_list(element(3, nth(4, Ts1))),
+		   A2s = atom_to_list(element(3, nth(5, Ts1))),
+		   %% Test printing atoms
+		   A1s = flatten(print(element(3, nth(4, Ts1)))),
+		   A2s = flatten(print(element(3, nth(5, Ts1)))),
+		   %% Test parsing and printing strings.
+		   S1 = V1s ++ "\327" ++ A1s ++ "\250" ++ A2s,
+		   S1s = "\"" ++ S1 ++ "\"",
+		   {ok,Ts2,_} = erl_scan:string(S1s),
+		   S1 = element(3, nth(1, Ts2)),
+		   S1s = flatten(print(element(3, nth(1, Ts2)))),
+		   ok				%It all worked
+	       end of
+	{'EXIT',R} ->				%Something went wrong!
+	     {error,R};
+	ok -> ok				%Aok
+    end.
+
+otp_7810(doc) -> 
+    ["OTP-7810. White spaces, comments, and more.."];
+otp_7810(suite) ->
+    [];
+otp_7810(Config) when is_list(Config) ->
+    ?line ok = reserved_words(),
+    ?line ok = atoms(),
+    ?line ok = punctuations(),
+    ?line ok = comments(),
+    ?line ok = errors(),
+    ?line ok = integers(),
+    ?line ok = base_integers(),
+    ?line ok = floats(),
+    ?line ok = dots(),
+    ?line ok = chars(),
+    ?line ok = variables(),
+    ?line ok = eof(),
+    ?line ok = illegal(),
+    ?line ok = crashes(),
+
+    ?line ok = options(),
+    ?line ok = token_info(),
+    ?line ok = column_errors(),
+    ?line ok = white_spaces(),
+
+    ?line ok = unicode(),
+
+    ?line ok = more_chars(),
+    ?line ok = more_options(),
+    ?line ok = attributes_info(),
+    ?line ok = set_attribute(),
+
+    ok.
+
+reserved_words() ->
+    L = ['after', 'begin', 'case', 'try', 'cond', 'catch',
+         'andalso', 'orelse', 'end', 'fun', 'if', 'let', 'of',
+         'query', 'receive', 'when', 'bnot', 'not', 'div',
+         'rem', 'band', 'and', 'bor', 'bxor', 'bsl', 'bsr',
+         'or', 'xor', 'spec'] , % 'spec' shouldn't be there...
+    [begin
+         ?line {RW, true} = {RW, erl_scan:reserved_word(RW)},
+         S = atom_to_list(RW),
+         Ts = [{RW,1}],
+         ?line test_string(S, Ts)
+     end || RW <- L],
+    ok.
+
+
+atoms() ->
+    ?line test_string("a
+                 b", [{atom,1,a},{atom,2,b}]),
+    ?line test_string("'a b'", [{atom,1,'a b'}]),
+    ?line test_string("a", [{atom,1,a}]),
+    ?line test_string("a@2", [{atom,1,a@2}]),
+    ?line test_string([39,65,200,39], [{atom,1,'A�'}]),
+    ?line test_string("�rlig �sten", [{atom,1,�rlig},{atom,1,�sten}]),
+    ?line {ok,[{atom,_,'$a'}],{1,6}} = 
+        erl_scan:string("'$\\a'", {1,1}),
+    ?line test("'$\\a'"),
+    ok.
+
+punctuations() ->
+    L = ["<<", "<-", "<=", "<", ">>", ">=", ">", "->", "--",
+         "-", "++", "+", "=:=", "=/=", "=<", "==", "=", "/=",
+         "/", "||", "|", ":-", "::", ":"],
+    %% One token at a time:
+    [begin
+         W = list_to_atom(S),
+         Ts = [{W,1}],
+         ?line test_string(S, Ts)
+     end || S <- L],
+    Three = ["/=:=", "<=:=", "==:=", ">=:="], % three tokens...
+    No = Three ++ L,
+    SL0 = [{S1++S2,{-length(S1),S1,S2}} ||
+              S1 <- L, 
+              S2 <- L, 
+              not lists:member(S1++S2, No)],
+    SL = family_list(SL0),
+    %% Two tokens. When there are several answers, the one with
+    %% the longest first token is chosen:
+    %% [the special case "=<<" is among the tested ones]
+    [begin
+         W1 = list_to_atom(S1),
+         W2 = list_to_atom(S2),
+         Ts = [{W1,1},{W2,1}],
+         ?line test_string(S, Ts)
+     end || {S,[{_,S1,S2}|_]}  <- SL],
+
+    PTs1 = [{'!',1},{'(',1},{')',1},{',',1},{';',1},{'=',1},{'[',1},
+            {']',1},{'{',1},{'|',1},{'}',1}],
+    ?line test_string("!(),;=[]{|}", PTs1),
+
+    PTs2 = [{'#',1},{'&',1},{'*',1},{'+',1},{'/',1},
+            {':',1},{'<',1},{'>',1},{'?',1},{'@',1},
+            {'\\',1},{'^',1},{'`',1},{'~',1}],
+    ?line test_string("#&*+/:<>?@\\^`~", PTs2),
+
+    ok.
+
+comments() ->
+    ?line test("a %%\n b"),
+    ?line {ok,[],1} = erl_scan:string("%"),
+    ?line test("a %%\n b"),
+    ?line {ok,[{atom,_,a},{atom,_,b}],{2,3}} = 
+        erl_scan:string("a %%\n b",{1,1}),
+    ?line {ok,[{atom,_,a},{comment,_,"%%"},{atom,_,b}],{2,3}} = 
+        erl_scan:string("a %%\n b",{1,1}, [return_comments]),
+    ?line {ok,[{atom,_,a},
+               {white_space,_," "},
+               {white_space,_,"\n "},
+               {atom,_,b}],
+           {2,3}} = 
+        erl_scan:string("a %%\n b",{1,1},[return_white_spaces]),
+    ?line {ok,[{atom,_,a},
+               {white_space,_," "},
+               {comment,_,"%%"},
+               {white_space,_,"\n "},
+               {atom,_,b}],
+           {2,3}} = erl_scan:string("a %%\n b",{1,1},[return]),
+    ok.
+
+errors() ->
+    ?line {error,{1,erl_scan,{string,$',"qa"}},1} = erl_scan:string("'qa"), %'
+    ?line {error,{1,erl_scan,{string,$","str"}},1} = %"
+        erl_scan:string("\"str"), %"
+    ?line {error,{1,erl_scan,char},1} = erl_scan:string("$"),
+    ?line test_string([34,65,200,34], [{string,1,"A�"}]),
+    ?line test_string("\\", [{'\\',1}]),
+    ?line {'EXIT',_} = 
+        (catch {foo, erl_scan:string('$\\a', {1,1})}), % type error
+    ?line {'EXIT',_} = 
+        (catch {foo, erl_scan:tokens([], '$\\a', {1,1})}), % type error
+
+    ?line "{a,tuple}" = erl_scan:format_error({a,tuple}),
+    ok.
+    
+integers() ->
+    [begin
+         I = list_to_integer(S),
+         Ts = [{integer,1,I}],
+         ?line test_string(S, Ts)
+     end || S <- [[N] || N <- lists:seq($0, $9)] ++ ["2323","000"] ],
+    ok.
+
+base_integers() ->
+    [begin
+         B = list_to_integer(BS),
+         I = erlang:list_to_integer(S, B),
+         Ts = [{integer,1,I}],
+         ?line test_string(BS++"#"++S, Ts)
+     end || {BS,S} <- [{"2","11"}, {"5","23234"}, {"12","05a"},
+                       {"16","abcdef"}, {"16","ABCDEF"}] ],
+    
+    ?line {error,{1,erl_scan,{base,1}},1} = erl_scan:string("1#000"),
+    
+    ?line test_string("12#bc", [{integer,1,11},{atom,1,c}]),
+    
+    [begin
+         Str = BS ++ "#" ++ S,
+         ?line {error,{1,erl_scan,{illegal,integer}},1} = 
+             erl_scan:string(Str)
+     end || {BS,S} <- [{"3","3"},{"15","f"}, {"12","c"}] ],
+
+    ?line {ok,[{integer,1,239},{'@',1}],1} = erl_scan:string("16#ef@"),
+    ?line {ok,[{integer,1,14},{atom,1,g@}],1} = erl_scan:string("16#eg@"),
+
+    ok.
+
+floats() ->
+    [begin
+         F = list_to_float(FS),
+         Ts = [{float,1,F}],
+         ?line test_string(FS, Ts)
+     end || FS <- ["1.0","001.17","3.31200","1.0e0","1.0E17",
+                   "34.21E-18", "17.0E+14"]],
+    ?line test_string("1.e2", [{integer,1,1},{'.',1},{atom,1,e2}]),
+    
+    ?line {error,{1,erl_scan,{illegal,float}},1} = 
+        erl_scan:string("1.0e400"),
+    [begin
+         ?line {error,{1,erl_scan,{illegal,float}},1} = erl_scan:string(S)
+     end || S <- ["1.14Ea"]],
+
+    ok.
+
+dots() ->
+    Dot = [{".",    {ok,[{dot,1}],1}},
+           {". ",   {ok,[{dot,1}],1}},
+           {".\n",  {ok,[{dot,1}],2}},
+           {".%",   {ok,[{dot,1}],1}},
+           {".\210",{ok,[{dot,1}],1}},
+           {".% �h",{ok,[{dot,1}],1}},
+           {".%\n", {ok,[{dot,1}],2}},
+           {".$",   {error,{1,erl_scan,char},1}},
+           {".$\\", {error,{1,erl_scan,char},1}},
+           {".a",   {ok,[{'.',1},{atom,1,a}],1}}
+          ],
+    ?line [R = erl_scan:string(S) || {S, R} <- Dot],
+    
+    ?line {ok,[{dot,_}=T1],{1,2}} = erl_scan:string(".", {1,1}, text),
+    ?line [{column,1},{length,1},{line,1},{text,"."}] = 
+        erl_scan:token_info(T1, [column, length, line, text]),
+    ?line {ok,[{dot,_}=T2],{1,3}} = erl_scan:string(".%", {1,1}, text),
+    ?line [{column,1},{length,1},{line,1},{text,"."}] = 
+        erl_scan:token_info(T2, [column, length, line, text]),
+    ?line {ok,[{dot,_}=T3],{1,6}} =
+        erl_scan:string(".% �h", {1,1}, text),
+    ?line [{column,1},{length,1},{line,1},{text,"."}] = 
+        erl_scan:token_info(T3, [column, length, line, text]),
+    ?line {error,{{1,2},erl_scan,char},{1,3}} =
+        erl_scan:string(".$", {1,1}),
+    ?line {error,{{1,2},erl_scan,char},{1,4}} =
+        erl_scan:string(".$\\", {1,1}),
+
+    ?line test(". "),
+    ?line test(".  "),
+    ?line test(".\n"),
+    ?line test(".\n\n"),
+    ?line test(".\n\r"),
+    ?line test(".\n\n\n"),
+    ?line test(".\210"),
+    ?line test(".%\n"),
+    ?line test(".a"),
+
+    ?line test("%. \n. "),
+    ?line {more,C} = erl_scan:tokens([], "%. ",{1,1}, return),
+    ?line {done,{ok,[{comment,_,"%. "},
+                     {white_space,_,"\n"},
+                     {dot,_}],
+                 {2,3}}, ""} = 
+        erl_scan:tokens(C, "\n. ", {1,1}, return), % any loc, any options
+
+    ?line [test_string(S, R) || 
+              {S, R} <- [{".$\n",   [{'.',1},{char,1,$\n}]},
+                         {"$\\\n",  [{char,1,$\n}]},
+                         {"'\\\n'", [{atom,1,'\n'}]},
+                         {"$\n",    [{char,1,$\n}]}] ],
+    ok.
+
+chars() ->
+    [begin
+         L = lists:flatten(io_lib:format("$\\~.8b", [C])),
+         Ts = [{char,1,C}],
+         ?line test_string(L, Ts)
+     end || C <- lists:seq(0, 255)],
+    
+    %% Leading zeroes...
+    [begin
+         L = lists:flatten(io_lib:format("$\\~3.8.0b", [C])),
+         Ts = [{char,1,C}],
+         ?line test_string(L, Ts)
+     end || C <- lists:seq(0, 255)],
+
+    %% $\^\n now increments the line...
+    [begin
+         L = "$\\^" ++ [C],
+         Ts = [{char,1,C band 2#11111}],
+         ?line test_string(L, Ts)
+     end || C <- lists:seq(0, 255)],
+    
+    [begin
+         L = "$\\" ++ [C],
+         Ts = [{char,1,V}],
+         ?line test_string(L, Ts)
+     end || {C,V} <- [{$n,$\n}, {$r,$\r}, {$t,$\t}, {$v,$\v}, 
+                      {$b,$\b}, {$f,$\f}, {$e,$\e}, {$s,$\s}, 
+                      {$d,$\d}]],
+
+    EC = [$\n,$\r,$\t,$\v,$\b,$\f,$\e,$\s,$\d],
+    Ds = lists:seq($0, $9),
+    X = [$^,$n,$r,$t,$v,$b,$f,$e,$s,$d],
+    New = [${,$x],
+    No = EC ++ Ds ++ X ++ New,
+    [begin
+         L = "$\\" ++ [C],
+         Ts = [{char,1,C}],
+         ?line test_string(L, Ts)
+     end || C <- lists:seq(0, 255) -- No],
+
+    [begin
+         L = "'$\\" ++ [C] ++ "'",
+         Ts = [{atom,1,list_to_atom("$"++[C])}],
+         ?line test_string(L, Ts)
+     end || C <- lists:seq(0, 255) -- No],
+
+    ?line test_string("\"\\013a\\\n\"", [{string,1,"\va\n"}]),
+
+    ?line test_string("'\n'", [{atom,1,'\n'}]),
+    ?line test_string("\"\n\a\"", [{string,1,"\na"}]),
+
+    %% No escape
+    [begin
+         L = "$" ++ [C],
+         Ts = [{char,1,C}],
+         ?line test_string(L, Ts)
+     end || C <- lists:seq(0, 255) -- (No ++ [$\\])],
+    ?line test_string("$\n", [{char,1,$\n}]),
+
+    ?line {error,{{1,1},erl_scan,char},{1,4}} = 
+        erl_scan:string("$\\^",{1,1}),
+    ?line test_string("$\\\n", [{char,1,$\n}]),
+    %% Robert's scanner returns line 1:
+    ?line test_string("$\\\n", [{char,1,$\n}]),
+    ?line test_string("$\n\n", [{char,1,$\n}]),
+    ?line test("$\n\n"),
+    ok.
+           
+
+variables() ->
+    ?line test_string("     \237_Aou�eiy��", [{var,1,'_Aou�eiy��'}]),
+    ?line test_string("A_b_c@", [{var,1,'A_b_c@'}]),
+    ?line test_string("V@2", [{var,1,'V@2'}]),
+    ?line test_string("ABD�", [{var,1,'ABD�'}]),
+    ?line test_string("�rlig �sten", [{var,1,'�rlig'},{var,1,'�sten'}]),
+    ok.
+
+eof() ->
+    ?line {done,{eof,1},eof} = erl_scan:tokens([], eof, 1),
+    {more, C1} = erl_scan:tokens([],"    \n", 1),
+    ?line {done,{eof,2},eof} = erl_scan:tokens(C1, eof, 1),
+    {more, C2} = erl_scan:tokens([], "abra", 1),
+    %% An error before R13A.
+    %% ?line {done,Err={error,{1,erl_scan,scan},1},eof} = 
+    ?line {done,{ok,[{atom,1,abra}],1},eof} = 
+        erl_scan:tokens(C2, eof, 1),
+
+    %% With column.
+    ?line {more, C3} = erl_scan:tokens([],"    \n",{1,1}),
+    ?line {done,{eof,{2,1}},eof} = erl_scan:tokens(C3, eof, 1),
+    {more, C4} = erl_scan:tokens([], "abra", {1,1}),
+    %% An error before R13A.
+    %% ?line {done,{error,{{1,1},erl_scan,scan},{1,5}},eof} = 
+    ?line {done,{ok,[{atom,_,abra}],{1,5}},eof} =
+        erl_scan:tokens(C4, eof, 1),
+
+    %% Robert's scanner returns "" as LeftoverChars;
+    %% the R12B scanner returns eof as LeftoverChars: (eof is correct)
+    ?line {more, C5} = erl_scan:tokens([], "a", 1),
+    %% An error before R13A.
+    %% ?line {done,{error,{1,erl_scan,scan},1},eof} = 
+    ?line {done,{ok,[{atom,1,a}],1},eof} =
+        erl_scan:tokens(C5,eof,1),
+
+    %% A dot followed by eof is special:
+    ?line {more, C} = erl_scan:tokens([], "a.", 1),
+    ?line {done,{ok,[{atom,1,a},{dot,1}],1},eof} = erl_scan:tokens(C,eof,1),
+    ?line {ok,[{atom,1,foo},{dot,1}],1} = erl_scan:string("foo."),
+
+    ok.
+
+illegal() ->
+    Atom = lists:duplicate(1000, $a),
+    ?line {error,{1,erl_scan,{illegal,atom}},1} = erl_scan:string(Atom),
+    ?line {done,{error,{1,erl_scan,{illegal,atom}},1},". "} =
+        erl_scan:tokens([], Atom++". ", 1),
+    QAtom = "'" ++ Atom ++ "'",
+    ?line {error,{1,erl_scan,{illegal,atom}},1} = erl_scan:string(QAtom),
+    ?line {done,{error,{1,erl_scan,{illegal,atom}},1},". "} =
+        erl_scan:tokens([], QAtom++". ", 1),
+    Var = lists:duplicate(1000, $A),
+    ?line {error,{1,erl_scan,{illegal,var}},1} = erl_scan:string(Var),
+    ?line {done,{error,{1,erl_scan,{illegal,var}},1},". "} =
+        erl_scan:tokens([], Var++". ", 1),
+    Float = "1" ++ lists:duplicate(400, $0) ++ ".0",
+    ?line {error,{1,erl_scan,{illegal,float}},1} = erl_scan:string(Float),
+    ?line {done,{error,{1,erl_scan,{illegal,float}},1},". "} =
+        erl_scan:tokens([], Float++". ", 1),
+    String = "\"43\\x{aaaaaa}34\"",
+    ?line {error,{1,erl_scan,{illegal,character}},1} = erl_scan:string(String),
+    ?line {done,{error,{1,erl_scan,{illegal,character}},1},"34\". "} =
+        %% Would be nice if `34\"' were skipped...
+        %% Maybe, but then the LeftOverChars would not be the characters
+        %% immediately following the end location of the error.
+        erl_scan:tokens([], String++". ", 1),
+
+    ?line {error,{{1,1},erl_scan,{illegal,atom}},{1,1001}} =
+        erl_scan:string(Atom, {1,1}),
+    ?line {done,{error,{{1,5},erl_scan,{illegal,atom}},{1,1005}},". "} =
+        erl_scan:tokens([], "foo "++Atom++". ", {1,1}),
+    ?line {error,{{1,1},erl_scan,{illegal,atom}},{1,1003}} =
+        erl_scan:string(QAtom, {1,1}),
+    ?line {done,{error,{{1,5},erl_scan,{illegal,atom}},{1,1007}},". "} = 
+        erl_scan:tokens([], "foo "++QAtom++". ", {1,1}),
+    ?line {error,{{1,1},erl_scan,{illegal,var}},{1,1001}} =
+        erl_scan:string(Var, {1,1}),
+    ?line {done,{error,{{1,5},erl_scan,{illegal,var}},{1,1005}},". "} =
+        erl_scan:tokens([], "foo "++Var++". ", {1,1}),
+    ?line {error,{{1,1},erl_scan,{illegal,float}},{1,404}} =
+        erl_scan:string(Float, {1,1}),
+    ?line {done,{error,{{1,5},erl_scan,{illegal,float}},{1,408}},". "} =
+        erl_scan:tokens([], "foo "++Float++". ", {1,1}),
+    ?line {error,{{1,4},erl_scan,{illegal,character}},{1,14}} =
+        erl_scan:string(String, {1,1}),
+    ?line {done,{error,{{1,4},erl_scan,{illegal,character}},{1,14}},"34\". "} =
+        erl_scan:tokens([], String++". ", {1,1}),
+    ok.
+
+crashes() ->
+    ?line {'EXIT',_} = (catch {foo, erl_scan:string([-1])}), % type error
+    ?line {'EXIT',_} = (catch {foo, erl_scan:string("$"++[-1])}),
+    ?line {'EXIT',_} = (catch {foo, erl_scan:string("$\\"++[-1])}),
+    ?line {'EXIT',_} = (catch {foo, erl_scan:string("$\\^"++[-1])}),
+    ?line {'EXIT',_} = (catch {foo, erl_scan:string([$",-1,$"],{1,1})}),
+    ?line {'EXIT',_} = (catch {foo, erl_scan:string("\"\\v"++[-1,$"])}), %$"
+    ?line {'EXIT',_} = (catch {foo, erl_scan:string([$",-1,$"])}),
+    ?line {'EXIT',_} = (catch {foo, erl_scan:string("% foo"++[-1])}),
+    ?line {'EXIT',_} = 
+         (catch {foo, erl_scan:string("% foo"++[-1],{1,1})}),
+
+    ?line {'EXIT',_} = (catch {foo, erl_scan:string([a])}), % type error
+    ?line {'EXIT',_} = (catch {foo, erl_scan:string("$"++[a])}),
+    ?line {'EXIT',_} = (catch {foo, erl_scan:string("$\\"++[a])}),
+    ?line {'EXIT',_} = (catch {foo, erl_scan:string("$\\^"++[a])}),
+    ?line {'EXIT',_} = (catch {foo, erl_scan:string([$",a,$"],{1,1})}),
+    ?line {'EXIT',_} = (catch {foo, erl_scan:string("\"\\v"++[a,$"])}), %$"
+    ?line {'EXIT',_} = (catch {foo, erl_scan:string([$",a,$"])}),
+    ?line {'EXIT',_} = (catch {foo, erl_scan:string("% foo"++[a])}),
+    ?line {'EXIT',_} = 
+         (catch {foo, erl_scan:string("% foo"++[a],{1,1})}),
+
+    ?line {'EXIT',_} = (catch {foo, erl_scan:string([3.0])}), % type error
+
+    ok.
+
+options() ->
+    %% line and column are not options, but tested here
+    ?line {ok,[{atom,1,foo},{white_space,1," "},{comment,1,"% bar"}], 1} = 
+        erl_scan:string("foo % bar", 1, return),
+    ?line {ok,[{atom,1,foo},{white_space,1," "}],1} = 
+        erl_scan:string("foo % bar", 1, return_white_spaces),
+    ?line {ok,[{atom,1,foo},{comment,1,"% bar"}],1} = 
+        erl_scan:string("foo % bar", 1, return_comments),
+    ?line {ok,[{atom,17,foo}],17} = 
+        erl_scan:string("foo % bar", 17),
+    ?line {'EXIT',{function_clause,_}} = 
+        (catch {foo, 
+                erl_scan:string("foo % bar", {a,1}, [])}), % type error
+    ?line {ok,[{atom,_,foo}],{17,18}} = 
+        erl_scan:string("foo % bar", {17,9}, []),
+    ?line {'EXIT',{function_clause,_}} = 
+        (catch {foo,
+                erl_scan:string("foo % bar", {1,0}, [])}), % type error
+    ?line {ok,[{foo,1}],1} = 
+        erl_scan:string("foo % bar",1, [{reserved_word_fun,
+                                         fun(W) -> W =:= foo end}]),
+    ?line {'EXIT',{badarg,_}} = 
+        (catch {foo,
+                erl_scan:string("foo % bar",1, % type error
+                                [{reserved_word_fun,
+                                  fun(W,_) -> W =:= foo end}])}),
+    ok.
+
+more_options() ->
+    ?line {ok,[{atom,A1,foo}],{19,20}} =
+        erl_scan:string("foo", {19,17},[]),
+    ?line [{column,17},{line,19}] = erl_scan:attributes_info(A1),
+    ?line {done,{ok,[{atom,A2,foo},{dot,_}],{19,22}},[]} =
+        erl_scan:tokens([], "foo. ", {19,17}, [bad_opt]), % type error
+    ?line [{column,17},{line,19}] = erl_scan:attributes_info(A2),
+    ?line {ok,[{atom,A3,foo}],{19,20}} =
+        erl_scan:string("foo", {19,17},[text]),
+    ?line [{column,17},{length,3},{line,19},{text,"foo"}] =
+        erl_scan:attributes_info(A3),
+
+    ?line {ok,[{atom,A4,foo}],1} = erl_scan:string("foo", 1, [text]),
+    ?line [{length,3},{line,1},{text,"foo"}] = erl_scan:attributes_info(A4),
+
+    ok.
+
+token_info() ->
+    ?line {ok,[T1],_} = erl_scan:string("foo", {1,18}, [text]),
+    {'EXIT',{badarg,_}} = 
+        (catch {foo, erl_scan:token_info(T1, foo)}), % type error
+    ?line {line,1} = erl_scan:token_info(T1, line),
+    ?line {column,18} = erl_scan:token_info(T1, column),
+    ?line {length,3} = erl_scan:token_info(T1, length),
+    ?line {text,"foo"} = erl_scan:token_info(T1, text),
+    ?line [{category,atom},{column,18},{length,3},{line,1},
+           {symbol,foo},{text,"foo"}] = 
+        erl_scan:token_info(T1),
+    ?line [{length,3},{column,18}] =
+        erl_scan:token_info(T1, [length, column]),
+    ?line [{location,{1,18}}] =
+        erl_scan:token_info(T1, [location]),
+    ?line {category,atom} = erl_scan:token_info(T1, category),
+    ?line [{symbol,foo}] = erl_scan:token_info(T1, [symbol]),
+
+    ?line {ok,[T2],_} = erl_scan:string("foo", 1, []),
+    ?line {line,1} = erl_scan:token_info(T2, line),
+    ?line undefined = erl_scan:token_info(T2, column),
+    ?line undefined = erl_scan:token_info(T2, length),
+    ?line undefined = erl_scan:token_info(T2, text),
+    ?line {location,1} = erl_scan:token_info(T2, location),
+    ?line [{category,atom},{line,1},{symbol,foo}] = erl_scan:token_info(T2),
+    ?line [{line,1}] = erl_scan:token_info(T2, [length, line]),
+
+    ?line {ok,[T3],_} = erl_scan:string("=", 1, []),
+    ?line [{line,1}] = erl_scan:token_info(T3, [column, line]),
+    ?line {category,'='} = erl_scan:token_info(T3, category),
+    ?line [{symbol,'='}] = erl_scan:token_info(T3, [symbol]),
+    ok.
+    
+attributes_info() ->
+    ?line {'EXIT',_} = 
+        (catch {foo,erl_scan:attributes_info(foo)}), % type error
+    ?line [{line,18}] = erl_scan:attributes_info(18),
+    ?line {location,19} = erl_scan:attributes_info(19, location),
+    ?line {ok,[{atom,A0,foo}],_} = erl_scan:string("foo", 19, [text]),
+    ?line {location,19} = erl_scan:attributes_info(A0, location),
+
+    ?line {ok,[{atom,A3,foo}],_} = erl_scan:string("foo", {1,3}, [text]),
+    ?line {line,1} = erl_scan:attributes_info(A3, line),
+    ?line {column,3} = erl_scan:attributes_info(A3, column),
+    ?line {location,{1,3}} = erl_scan:attributes_info(A3, location),
+    ?line {text,"foo"} = erl_scan:attributes_info(A3, text),
+
+    ?line {ok,[{atom,A4,foo}],_} = erl_scan:string("foo", 2, [text]),
+    ?line {line,2} = erl_scan:attributes_info(A4, line),
+    ?line undefined = erl_scan:attributes_info(A4, column),
+    ?line {location,2} = erl_scan:attributes_info(A4, location),
+    ?line {text,"foo"} = erl_scan:attributes_info(A4, text),
+
+    ?line {ok,[{atom,A5,foo}],_} = erl_scan:string("foo", {1,3}, []),
+    ?line {line,1} = erl_scan:attributes_info(A5, line),
+    ?line {column,3} = erl_scan:attributes_info(A5, column),
+    ?line {location,{1,3}} = erl_scan:attributes_info(A5, location),
+    ?line undefined = erl_scan:attributes_info(A5, text),
+
+    ?line undefined = erl_scan:attributes_info([], line), % type error
+
+    ok.
+
+set_attribute() ->
+    F = fun(Line) -> -Line end,
+    ?line -2 = erl_scan:set_attribute(line, 2, F),
+    ?line {ok,[{atom,A1,foo}],_} = erl_scan:string("foo", {9,17}),
+    ?line A2 = erl_scan:set_attribute(line, A1, F),
+    ?line {line,-9} = erl_scan:attributes_info(A2, line),
+    ?line {location,{-9,17}} = erl_scan:attributes_info(A2, location),
+    ?line [{line,-9},{column,17}] =
+        erl_scan:attributes_info(A2, [line,column,text]),
+
+    F2 = fun(Line) -> {17,Line} end,
+    ?line Attr1 = erl_scan:set_attribute(line, 2, F2),
+    ?line {line,{17,2}} = erl_scan:attributes_info(Attr1, line),
+    ?line undefined = erl_scan:attributes_info(Attr1, column),
+    ?line {location,{17,2}} = % a bit mixed up
+        erl_scan:attributes_info(Attr1, location),
+
+    ?line A3 = erl_scan:set_attribute(line, A1, F2),
+    ?line {line,{17,9}} = erl_scan:attributes_info(A3, line),
+    ?line {location,{{17,9},17}} = erl_scan:attributes_info(A3, location),
+    ?line [{line,{17,9}},{column,17}] =
+        erl_scan:attributes_info(A3, [line,column,text]),
+
+    ?line {ok,[{atom,A4,foo}],_} = erl_scan:string("foo", {9,17}, [text]),
+    ?line A5 = erl_scan:set_attribute(line, A4, F),
+    ?line {line,-9} = erl_scan:attributes_info(A5, line),
+    ?line {location,{-9,17}} = erl_scan:attributes_info(A5, location),
+    ?line [{line,-9},{column,17},{text,"foo"}] =
+        erl_scan:attributes_info(A5, [line,column,text]),
+
+    ?line {ok,[{atom,A6,foo}],_} = erl_scan:string("foo", 11, [text]),
+    ?line A7 = erl_scan:set_attribute(line, A6, F2),
+    ?line {line,{17,11}} = erl_scan:attributes_info(A7, line),
+    ?line {location,{17,11}} = % mixed up
+        erl_scan:attributes_info(A7, location),
+    ?line [{line,{17,11}},{text,"foo"}] =
+        erl_scan:attributes_info(A7, [line,column,text]),
+
+    ?line {'EXIT',_} = 
+        (catch {foo, erl_scan:set_attribute(line, [], F2)}), % type error
+    ?line {'EXIT',{badarg,_}} = 
+        (catch {foo, erl_scan:set_attribute(column, [], F2)}), % type error
+    ok.
+
+column_errors() ->
+    ?line {error,{{1,1},erl_scan,{string,$',""}},{1,3}} = % $'
+        erl_scan:string("'\\",{1,1}),
+    ?line {error,{{1,1},erl_scan,{string,$",""}},{1,3}} = % $"
+        erl_scan:string("\"\\",{1,1}),
+
+    ?line {error,{{1,1},erl_scan,{string,$',""}},{1,2}} =  % $'
+        erl_scan:string("'",{1,1}),
+    ?line {error,{{1,1},erl_scan,{string,$",""}},{1,2}} =  % $"
+        erl_scan:string("\"",{1,1}),
+
+    ?line {error,{{1,1},erl_scan,char},{1,2}} =
+        erl_scan:string("$",{1,1}),
+
+    ?line {error,{{1,2},erl_scan,{string,$',"1234567890123456"}},{1,20}} = %'
+        erl_scan:string(" '12345678901234567", {1,1}),
+    ?line {error,{{1,2},erl_scan,{string,$',"123456789012345 "}}, {1,20}} = %'
+        erl_scan:string(" '123456789012345\\s", {1,1}),
+    ?line {error,{{1,2},erl_scan,{string,$","1234567890123456"}},{1,20}} = %"
+        erl_scan:string(" \"12345678901234567", {1,1}),
+    ?line {error,{{1,2},erl_scan,{string,$","123456789012345 "}}, {1,20}} = %"
+        erl_scan:string(" \"123456789012345\\s", {1,1}),
+    ?line {error,{{1,2},erl_scan,{string,$',"1234567890123456"}},{2,1}} = %'
+        erl_scan:string(" '12345678901234567\n", {1,1}),
+    ok.
+
+white_spaces() ->
+    ?line {ok,[{white_space,_,"\r"},
+               {white_space,_,"   "},
+               {atom,_,a},
+               {white_space,_,"\n"}],
+           _} = erl_scan:string("\r   a\n", {1,1}, return),
+    ?line test("\r   a\n"),
+    L = "{\"a\nb\", \"a\\nb\",\nabc\r,def}.\n\n",
+    ?line {ok,[{'{',_},
+               {string,_,"a\nb"},
+               {',',_},
+               {white_space,_," "},
+               {string,_,"a\nb"},
+               {',',_},
+               {white_space,_,"\n"},
+               {atom,_,abc},
+               {white_space,_,"\r"},
+               {',',_},
+               {atom,_,def},
+               {'}',_},
+               {dot,_},
+               {white_space,_,"\n"}],
+           _} = erl_scan:string(L, {1,1}, return),
+    ?line test(L),
+    ?line test("\"\n\"\n"),
+    ?line test("\n\r\n"),
+    ?line test("\n\r"),
+    ?line test("\r\n"),
+    ?line test("\n\f"),
+    ?line [test(lists:duplicate(N, $\t)) || N <- lists:seq(1, 20)],
+    ?line [test([$\n|lists:duplicate(N, $\t)]) || N <- lists:seq(1, 20)],
+    ?line [test(lists:duplicate(N, $\s)) || N <- lists:seq(1, 20)],
+    ?line [test([$\n|lists:duplicate(N, $\s)]) || N <- lists:seq(1, 20)],
+    ?line test("\v\f\n\v "),
+    ?line test("\n\e\n\b\f\n\da\n"),
+    ok.
+
+unicode() ->
+    ?line {ok,[{char,1,83},{integer,1,45}],1} =
+        erl_scan:string("$\\12345"), % not unicode
+
+    ?line {error,{1,erl_scan,{illegal,character}},1} = 
+        erl_scan:string([1089]),
+    ?line {error,{{1,1},erl_scan,{illegal,character}},{1,2}} = 
+        erl_scan:string([1089], {1,1}),
+    ?line {error,{1,erl_scan,{illegal,character}},1} =
+    %% ?line {error,{1,erl_scan,{illegal,atom}},1} = 
+        erl_scan:string("'a"++[1089]++"b'"),
+    ?line {error,{{1,3},erl_scan,{illegal,character}},{1,4}} = 
+        erl_scan:string("'a"++[1089]++"b'", {1,1}),
+    ?line test("\"a"++[1089]++"b\""),
+    ?line {ok,[{char,1,1}],1} = erl_scan:string([$$,$\\,$^,1089]),
+
+    ?line {error,{1,erl_scan,Error},1} = erl_scan:string("\"qa\x{aaa}"),
+    ?line "unterminated string starting with \"qa\\x{AAA}\"" =
+        erl_scan:format_error(Error),
+    ?line {error,{{1,1},erl_scan,_},{1,11}} =
+        erl_scan:string("\"qa\\x{aaa}",{1,1}),
+    ?line {error,{{1,4},erl_scan,{illegal,character}},{1,11}} =
+        erl_scan:string("'qa\\x{aaa}'",{1,1}),
+
+    Tags = [category, column, length, line, symbol, text],
+
+    %% Workaround. No character codes greater than 255! To be changed.
+    %% Note: don't remove these tests, just modify them!
+
+    ?line {ok,[{integer,1,1089}],1} = erl_scan:string([$$,1089]),
+    ?line {ok,[{integer,1,1089}],1} = erl_scan:string([$$,$\\,1089]),
+
+    Qs = "$\\x{aaa}",
+    ?line {ok,[{integer,1,16#aaa}],1} = erl_scan:string(Qs),
+    ?line {ok,[Q2],{1,9}} = erl_scan:string("$\\x{aaa}", {1,1}, text),
+    ?line [{category,integer},{column,1},{length,8},
+           {line,1},{symbol,16#aaa},{text,Qs}] = 
+        erl_scan:token_info(Q2),
+
+    U1 = "\"\\x{aaa}\"",
+    ?line {ok,[T1,T2,T3],{1,10}} = erl_scan:string(U1, {1,1}, text),
+    ?line [{category,'['},{column,1},{length,1},{line,1},
+           {symbol,'['},{text,"\""}] = erl_scan:token_info(T1, Tags),
+    ?line [{category,integer},{column,2},{length,7},
+           {line,1},{symbol,16#aaa},{text,"\\x{aaa}"}] = 
+        erl_scan:token_info(T2, Tags),
+    ?line [{category,']'},{column,9},{length,1},{line,1},
+           {symbol,']'},{text,"\""}] = erl_scan:token_info(T3, Tags),
+    ?line  {ok,[{'[',1},{integer,1,16#aaa},{']',1}],1} = 
+        erl_scan:string(U1, 1),
+
+    U2 = "\"\\x41\\x{fff}\\x42\"",
+    ?line {ok,[{'[',1},{char,1,16#41},{',',1},{integer,1,16#fff},
+               {',',1},{char,1,16#42},{']',1}],1} = erl_scan:string(U2, 1),
+
+    U3 = "\"a\n\\x{fff}\n\"",
+    ?line {ok,[{'[',1},{char,1,$a},{',',1},{char,1,$\n},
+               {',',2},{integer,2,16#fff},{',',2},{char,2,$\n},
+               {']',3}],3} = 
+        erl_scan:string(U3, 1),
+
+    U4 = "\"\\^\n\\x{aaa}\\^\n\"",
+    ?line {ok,[{'[',1},{char,1,$\n},{',',2},{integer,2,16#aaa},
+               {',',2},{char,2,$\n},{']',3}],3} = erl_scan:string(U4, 1),
+
+    %% Keep these tests:
+    ?line test(Qs),
+    ?line test(U1),
+    ?line test(U2),
+    ?line test(U3),
+    ?line test(U4),
+
+    Str1 = "\"ab" ++ [1089] ++ "cd\"",
+    ?line {ok,[{'[',1},{char,1,$a},{',',1},{char,1,$b},{',',1},
+               {integer,1,1089},{',',1},{char,1,$c},{',',1},
+               {char,1,$d},{']',1}],1} = erl_scan:string(Str1),
+    ?line {ok,[{'[',_},{char,_,$a},{',',_},{char,_,$b},{',',_},
+               {integer,_,1089},{',',_},{char,_,$c},{',',_},
+               {char,_,$d},{']',_}],{1,8}} = erl_scan:string(Str1, {1,1}),
+    ?line test(Str1),
+    Comment = "%% "++[1089],
+    ?line {ok,[{comment,1,[$%,$%,$\s,1089]}],1} = 
+        erl_scan:string(Comment, 1, return),
+    ?line {ok,[{comment,_,[$%,$%,$\s,1089]}],{1,5}} = 
+        erl_scan:string(Comment, {1,1}, return),                           
+    ok.
+
+more_chars() ->
+    %% Due to unicode, the syntax has been incompatibly augmented:
+    %% $\x{...}, $\xHH
+
+    %% All kinds of tests...
+    ?line {ok,[{char,_,123}],{1,4}} =
+        erl_scan:string("$\\{",{1,1}),
+    ?line {more, C1} = erl_scan:tokens([], "$\\{", {1,1}),
+    ?line {done,{ok,[{char,_,123}],{1,4}},eof} =
+        erl_scan:tokens(C1, eof, 1),
+    ?line {ok,[{char,1,123},{atom,1,a},{'}',1}],1} =
+        erl_scan:string("$\\{a}"),
+    
+    ?line {error,{{1,1},erl_scan,char},{1,4}} =
+        erl_scan:string("$\\x", {1,1}),
+    ?line {error,{{1,1},erl_scan,char},{1,5}} =
+        erl_scan:string("$\\x{",{1,1}),
+    ?line {more, C3} = erl_scan:tokens([], "$\\x", {1,1}),
+    ?line {done,{error,{{1,1},erl_scan,char},{1,4}},eof} =
+        erl_scan:tokens(C3, eof, 1),
+    ?line {error,{{1,1},erl_scan,char},{1,5}} = 
+        erl_scan:string("$\\x{",{1,1}),
+    ?line {more, C2} = erl_scan:tokens([], "$\\x{", {1,1}),
+    ?line {done,{error,{{1,1},erl_scan,char},{1,5}},eof} = 
+        erl_scan:tokens(C2, eof, 1),
+    ?line {error,{1,erl_scan,{illegal,character}},1} = 
+        erl_scan:string("$\\x{g}"),
+    ?line {error,{{1,1},erl_scan,{illegal,character}},{1,5}} =
+        erl_scan:string("$\\x{g}", {1,1}),
+    ?line {error,{{1,1},erl_scan,{illegal,character}},{1,6}} =
+        erl_scan:string("$\\x{}",{1,1}),
+
+    ?line test("\"\\{0}\""),
+    ?line test("\"\\x{0}\""),
+    ?line test("\'\\{0}\'"),
+    ?line test("\'\\x{0}\'"),
+
+    ?line {error,{{2,3},erl_scan,{illegal,character}},{2,6}} =
+        erl_scan:string("\"ab \n $\\x{g}\"",{1,1}),
+    ?line {error,{{2,3},erl_scan,{illegal,character}},{2,6}} =
+        erl_scan:string("\'ab \n $\\x{g}\'",{1,1}),
+
+    ?line test("$\\{34}"),
+    ?line test("$\\x{34}"),
+    ?line test("$\\{377}"),
+    ?line test("$\\x{FF}"),
+    ?line test("$\\{400}"),
+    ?line test("$\\x{100}"),
+    ?line test("$\\x{10FFFF}"),
+    ?line test("$\\x{10ffff}"),
+    ?line test("\"$\n \\{1}\""),
+    ?line {error,{1,erl_scan,{illegal,character}},1} = 
+        erl_scan:string("$\\x{110000}"),
+    ?line {error,{{1,1},erl_scan,{illegal,character}},{1,12}} = 
+        erl_scan:string("$\\x{110000}", {1,1}),
+
+    ?line {error,{{1,1},erl_scan,{illegal,character}},{1,4}} = 
+        erl_scan:string("$\\xfg", {1,1}),
+
+    ?line test("$\\xffg"),
+
+    ?line {error,{{1,1},erl_scan,{illegal,character}},{1,4}} =
+        erl_scan:string("$\\xg", {1,1}),
+    ok.
+
+test_string(String, Expected) ->
+    {ok, Expected, _End} = erl_scan:string(String),
+    test(String).
+
+%% test_string(String, Expected, StartLocation, Options) ->
+%%     {ok, Expected, _End} = erl_scan:string(String, StartLocation, Options),
+%%     test(String).
+
+%% There are no checks of the tags...
+test(String) ->
+    %% io:format("Testing `~ts'~n", [String]),
+    [{Tokens, End},
+     {Wtokens, Wend},
+     {Ctokens, Cend},
+     {CWtokens, CWend},
+     {CWtokens2, _}] = 
+        [scan_string_with_column(String, X) ||
+            X <- [[], 
+                  [return_white_spaces], 
+                  [return_comments], 
+                  [return],
+                  [return]]], % for white space compaction test
+
+    {end1,End,Wend} = {end1,Wend,End},
+    {end2,Wend,Cend} = {end2,Cend,Wend},
+    {end3,Cend,CWend} = {end3,CWend,Cend},
+
+    %% Test that the tokens that are common to two token lists are identical.
+    {none,Tokens} = {none, filter_tokens(CWtokens, [white_space,comment])},
+    {comments,Ctokens} =
+        {comments,filter_tokens(CWtokens, [white_space])},
+    {white_spaces,Wtokens} = 
+        {white_spaces,filter_tokens(CWtokens, [comment])},
+
+    %% Use token attributes to extract parts from the original string,
+    %% and check that the parts are identical to the token strings.
+    {Line,Column} = test_decorated_tokens(String, CWtokens),
+    {deco,{Line,Column},End} = {deco,End,{Line,Column}},
+
+    %% Almost the same again: concat texts to get the original:
+    Text = get_text(CWtokens),
+    {text,Text,String} = {text,String,Text},
+
+    %% Test that white spaces occupy less heap than the worst case.
+    ok = test_white_space_compaction(CWtokens, CWtokens2),
+
+    %% Test that white newlines are always first in text:
+    WhiteTokens = select_tokens(CWtokens, [white_space]),
+    ok = newlines_first(WhiteTokens),
+
+    %% Line attribute only:
+    [Simple,Wsimple,Csimple,WCsimple] = Simples =
+        [element(2, erl_scan:string(String, 1, Opts)) ||
+            Opts <- [[], 
+                     [return_white_spaces], 
+                     [return_comments], 
+                     [return]]],
+    {consistent,true} = {consistent,consistent_attributes(Simples)},
+    {simple_wc,WCsimple} = {simple_wc,simplify(CWtokens)},
+    {simple,Simple} = {simple,filter_tokens(WCsimple, [white_space,comment])},
+    {simple_c,Csimple} = {simple_c,filter_tokens(WCsimple, [white_space])},
+    {simple_w,Wsimple} = {simple_w,filter_tokens(WCsimple, [comment])},
+
+    %% Line attribute only, with text:
+    [SimpleTxt,WsimpleTxt,CsimpleTxt,WCsimpleTxt] = SimplesTxt =
+        [element(2, erl_scan:string(String, 1, [text|Opts])) ||
+            Opts <- [[], 
+                     [return_white_spaces], 
+                     [return_comments], 
+                     [return]]],
+    TextTxt = get_text(WCsimpleTxt),
+    {text_txt,TextTxt,String} = {text_txt,String,TextTxt},
+    {consistent_txt,true} = 
+        {consistent_txt,consistent_attributes(SimplesTxt)},
+    {simple_txt,SimpleTxt} = 
+        {simple_txt,filter_tokens(WCsimpleTxt, [white_space,comment])},
+    {simple_c_txt,CsimpleTxt} = 
+        {simple_c_txt,filter_tokens(WCsimpleTxt, [white_space])},
+    {simple_w_txt,WsimpleTxt} = 
+        {simple_w_txt,filter_tokens(WCsimpleTxt, [comment])},
+
+    ok.
+
+test_white_space_compaction(Tokens, Tokens2) when Tokens =:= Tokens2 ->
+    [WS, WS2] = [select_tokens(Ts, [white_space]) || Ts <- [Tokens, Tokens2]],
+    test_wsc(WS, WS2).
+    
+test_wsc([], []) ->
+    ok;
+test_wsc([Token|Tokens], [Token2|Tokens2]) ->
+    [Text, Text2] = [Text || 
+                        {text, Text} <- 
+                            [erl_scan:token_info(T, text) ||
+                                T <- [Token, Token2]]],
+    Sz = erts_debug:size(Text),
+    Sz2 = erts_debug:size({Text, Text2}),
+    IsCompacted = Sz2 < 2*Sz+erts_debug:size({a,a}),
+    ToBeCompacted = is_compacted(Text),    
+    if
+        IsCompacted =:= ToBeCompacted ->
+            test_wsc(Tokens, Tokens2);
+        true ->
+            {compaction_error, Token}
+    end.
+
+is_compacted("\r") ->
+    true;
+is_compacted("\n\r") ->
+    true;
+is_compacted("\n\f") ->
+    true;
+is_compacted([$\n|String]) ->
+      all_spaces(String) 
+    orelse
+      all_tabs(String);
+is_compacted(String) ->
+      all_spaces(String)
+    orelse
+      all_tabs(String).
+  
+all_spaces(L) ->
+    all_same(L, $\s).
+
+all_tabs(L) ->
+    all_same(L, $\t).
+
+all_same(L, Char) ->
+    lists:all(fun(C) -> C =:= Char end, L).
+
+newlines_first([]) ->
+    ok;
+newlines_first([Token|Tokens]) ->
+    {text,Text} = erl_scan:token_info(Token, text),
+    Nnls = length([C || C <- Text, C =:= $\n]),
+    OK = case Text of
+             [$\n|_] ->
+                 Nnls =:= 1;
+             _ ->
+                 Nnls =:= 0
+         end,
+    if 
+        OK -> newlines_first(Tokens);
+        true -> OK
+    end.
+
+filter_tokens(Tokens, Tags) ->
+    lists:filter(fun(T) -> not lists:member(element(1, T), Tags) end, Tokens).
+
+select_tokens(Tokens, Tags) ->
+    lists:filter(fun(T) -> lists:member(element(1, T), Tags) end, Tokens).
+
+simplify([Token|Tokens]) ->
+    {line,Line} = erl_scan:token_info(Token, line),
+    [setelement(2, Token, Line) | simplify(Tokens)];
+simplify([]) ->
+    [].
+
+get_text(Tokens) ->
+    lists:flatten(
+      [T || 
+          Token <- Tokens,
+          ({text,T} = erl_scan:token_info(Token, text)) =/= []]).
+
+test_decorated_tokens(String, Tokens) ->
+    ToksAttrs = token_attrs(Tokens),
+    test_strings(ToksAttrs, String, 1, 1).
+
+token_attrs(Tokens) ->
+    [{L,C,Len,T} ||
+        Token <- Tokens,
+        ([{line,L},{column,C},{length,Len},{text,T}] = 
+         erl_scan:token_info(Token, [line,column,length,text])) =/= []].
+
+test_strings([], _S, Line, Column) ->
+    {Line,Column};
+test_strings([{L,C,Len,T}=Attr|Attrs], String0, Line0, Column0) ->
+    {String1, Column1} = skip_newlines(String0, L, Line0, Column0),
+    String = skip_chars(String1, C-Column1),
+    {Str,Rest} = lists:split(Len, String),
+    if
+        Str =:= T ->
+            {Line,Column} = string_newlines(T, L, C),
+            test_strings(Attrs, Rest, Line, Column);
+        true ->
+            {token_error, Attr, Str}
+    end.
+
+skip_newlines(String, Line, Line, Column) ->
+    {String, Column};
+skip_newlines([$\n|String], L, Line, _Column) ->
+    skip_newlines(String, L, Line+1, 1);
+skip_newlines([_|String], L, Line, Column) ->
+    skip_newlines(String, L, Line, Column+1).
+
+skip_chars(String, 0) ->
+    String;
+skip_chars([_|String], N) ->
+    skip_chars(String, N-1).
+
+string_newlines([$\n|String], Line, _Column) ->
+    string_newlines(String, Line+1, 1);
+string_newlines([], Line, Column) ->
+    {Line, Column};
+string_newlines([_|String], Line, Column) ->
+    string_newlines(String, Line, Column+1).
+
+scan_string_with_column(String, Options0) ->
+    Options = [text | Options0],
+    StartLoc = {1, 1},
+    {ok, Ts1, End1} = erl_scan:string(String, StartLoc, Options),
+    TString = String ++ ". ",
+    {ok,Ts2,End2} = scan_tokens(TString, Options, [], StartLoc),
+    {ok, Ts3, End3} = 
+        scan_tokens_1({more, []}, TString, Options, [], StartLoc),
+    {end_2,End2,End3} = {end_2,End3,End2},
+    {EndLine1,EndColumn1} = End1,
+    End2 = {EndLine1,EndColumn1+2},
+    {ts_1,Ts2,Ts3} = {ts_1,Ts3,Ts2},
+    Ts2 = Ts1 ++ [lists:last(Ts2)],
+
+    %% Attributes are keylists, but have no text.
+    {ok, Ts7, End7} = erl_scan:string(String, {1,1}, Options),
+    {ok, Ts8, End8} = scan_tokens(TString, Options, [], {1,1}),
+    {end1, End1} = {end1, End7},
+    {end2, End2} = {end2, End8},
+    Ts8 = Ts7 ++ [lists:last(Ts8)],
+    {cons,true} = {cons,consistent_attributes([Ts1,Ts2,Ts3,Ts7,Ts8])},
+
+    {Ts1, End1}.
+
+scan_tokens(String, Options, Rs, Location) ->
+    case erl_scan:tokens([], String, Location, Options) of
+        {done, {ok,Ts,End}, ""} ->
+            {ok, lists:append(lists:reverse([Ts|Rs])), End};
+        {done, {ok,Ts,End}, Rest} ->
+            scan_tokens(Rest, Options, [Ts|Rs], End)
+    end.
+
+scan_tokens_1({done, {ok,Ts,End}, ""}, "", _Options, Rs, _Location) ->
+    {ok,lists:append(lists:reverse([Ts|Rs])),End};
+scan_tokens_1({done, {ok,Ts,End}, Rest}, Cs, Options, Rs, _Location) ->
+    scan_tokens_1({more,[]}, Rest++Cs, Options, [Ts|Rs], End);
+scan_tokens_1({more, Cont}, [C | Cs], Options, Rs, Loc) ->
+    R = erl_scan:tokens(Cont, [C], Loc, Options),
+    scan_tokens_1(R, Cs, Options, Rs, Loc).
+
+consistent_attributes([]) ->
+    true;
+consistent_attributes([Ts | TsL]) ->
+    L = [T || T <- Ts, is_integer(element(2, T))],
+    case L of
+        [] ->
+            TagsL = [[Tag || {Tag,_} <- 
+                                 erl_scan:attributes_info(element(2, T))] || 
+                        T <- Ts],
+            case lists:usort(TagsL) of
+                [_] ->
+                    consistent_attributes(TsL);
+                [] when Ts =:= [] ->
+                    consistent_attributes(TsL);
+                _ ->
+                    Ts
+            end;
+        Ts ->
+            consistent_attributes(TsL);
+        _ ->
+            Ts
+    end.
+
+family_list(L) ->
+    sofs:to_external(family(L)).
+
+family(L) ->
+    sofs:relation_to_family(sofs:relation(L)).
author	Erlang/OTP <[email protected]>	2009-11-20 14:54:40 +0000
committer	Erlang/OTP <[email protected]>	2009-11-20 14:54:40 +0000
commit	84adefa331c4159d432d22840663c38f155cd4c1 (patch)
tree	bff9a9c66adda4df2106dfd0e5c053ab182a12bd /lib/stdlib/test/erl_scan_SUITE.erl
download	otp-84adefa331c4159d432d22840663c38f155cd4c1.tar.gz otp-84adefa331c4159d432d22840663c38f155cd4c1.tar.bz2 otp-84adefa331c4159d432d22840663c38f155cd4c1.zip