1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
|
%%-*-erlang-*-
%%--------------------------------------------------------------------
%% %CopyrightBegin%
%%
%% Copyright Ericsson AB 2008-2017. All Rights Reserved.
%%
%% Licensed under the Apache License, Version 2.0 (the "License");
%% you may not use this file except in compliance with the License.
%% You may obtain a copy of the License at
%%
%% http://www.apache.org/licenses/LICENSE-2.0
%%
%% Unless required by applicable law or agreed to in writing, software
%% distributed under the License is distributed on an "AS IS" BASIS,
%% WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
%% See the License for the specific language governing permissions and
%% limitations under the License.
%%
%% %CopyrightEnd%
%%----------------------------------------------------------------------
%% File : xmerl_sax_parser_utf16be.erl
%% Description : Encoding-specific macro definitions for parsing big-endian UTF-16 input.
%%
%% Created : 26 May 2008
%%----------------------------------------------------------------------
-module(xmerl_sax_parser_utf16be).
%%----------------------------------------------------------------------
%% Macros
%%----------------------------------------------------------------------
%% Encoding-specific building blocks. Every string macro below expands to
%% bit syntax, so the input they match or build is a binary.

%% The empty input: a zero-length binary.
-define(STRING_EMPTY, <<>>).
%% A binary consisting solely of MatchStr encoded as big-endian UTF-16.
-define(STRING(MatchStr), <<MatchStr/big-utf16>>).
%% MatchStr encoded as big-endian UTF-16, followed by the remaining bytes Rest.
-define(STRING_REST(MatchStr, Rest), <<MatchStr/big-utf16, Rest/binary>>).
%% Concatenation of the two binaries Rest and New, in that order.
-define(APPEND_STRING(Rest, New), <<Rest/binary, New/binary>>).
%% Converts Val with unicode:characters_to_binary/3, reading it in the
%% `unicode' input encoding and producing big-endian UTF-16.
-define(TO_INPUT_FORMAT(Val), unicode:characters_to_binary(Val, unicode, {utf16, big})).
%% One big-endian UTF-16 segment MatchChar followed by the remaining bytes
%% Rest. In this file the expansion has the same form as ?STRING_REST.
-define(STRING_UNBOUND_REST(MatchChar, Rest), <<MatchChar/big-utf16, Rest/binary>>).
%% The single byte 16#FE, i.e. the first byte of the mark matched by
%% ?BYTE_ORDER_MARK_REST below.
-define(BYTE_ORDER_MARK_1, <<16#FE>>).
%% The two bytes 16#FE 16#FF (the big-endian UTF-16 byte order mark)
%% followed by the remaining bytes Rest.
-define(BYTE_ORDER_MARK_REST(Rest), <<16#FE, 16#FF, Rest/binary>>).
%% Clause template for parse_byte_order_mark/2 (big-endian UTF-16 input).
%%
%%  * Input starting with the complete mark (16#FE 16#FF): the two mark
%%    bytes are dropped and the remainder goes to parse_xml_decl/2.
%%  * Input that is empty or holds only the first mark byte: handed to
%%    cf/3 together with this function as the fun argument. cf/3 is
%%    defined outside this file; presumably it obtains more input and
%%    resumes parsing - confirm against its definition.
%%  * Any other input: passed unchanged to parse_xml_decl/2.
%%
%% The first three patterns are mutually exclusive, so their relative
%% order does not affect which clause is selected.
-define(PARSE_BYTE_ORDER_MARK(Bytes, State),
        parse_byte_order_mark(?BYTE_ORDER_MARK_REST(Rest), State) ->
            parse_xml_decl(Rest, State);
        parse_byte_order_mark(?STRING_EMPTY = Bytes, State) ->
            cf(Bytes, State, fun parse_byte_order_mark/2);
        parse_byte_order_mark(?BYTE_ORDER_MARK_1 = Bytes, State) ->
            cf(Bytes, State, fun parse_byte_order_mark/2);
        parse_byte_order_mark(Bytes, State) ->
            parse_xml_decl(Bytes, State)).
%% Clause template for parse_xml_decl/2.
%%
%% When the input is a binary and the state is an #xmerl_sax_parser_state{}
%% record, the input is first decoded with unicode:characters_to_list/2
%% using the encoding stored in the state:
%%  * {error, _, _}      -> ?fatal_error with a "Bad character" message;
%%  * {incomplete, _, _} -> cf/3 is called with this function as the fun
%%                          argument (cf/3 is defined outside this file;
%%                          presumably it obtains more input - confirm);
%%  * any other result   -> parse_prolog/2 receives the original,
%%                          still undecoded, input.
%% Everything else falls through to the second clause and goes directly
%% to parse_prolog/2.
-define(PARSE_XML_DECL(Bytes, State),
        parse_xml_decl(Bytes, State = #xmerl_sax_parser_state{encoding = Enc})
          when is_binary(Bytes) ->
            case unicode:characters_to_list(Bytes, Enc) of
                {error, _Encoded, _Rest} ->
                    ?fatal_error(State,
                                 lists:flatten(
                                   io_lib:format("Bad character, not in ~p\n", [Enc])));
                {incomplete, _, _} ->
                    cf(Bytes, State, fun parse_xml_decl/2);
                _ ->
                    parse_prolog(Bytes, State)
            end;
        parse_xml_decl(Bytes, State) ->
            parse_prolog(Bytes, State)).
%% Clause template for whitespace/3.
%%
%% First clause: the input begins with a segment that matches as
%% big-endian UTF-16. The result is {reversed Acc, Bytes, State}, with
%% Bytes returned exactly as received.
%%
%% Second clause: reached for binary input that the first clause did not
%% match. The input is decoded with unicode:characters_to_list/2 using the
%% encoding stored in the state:
%%  * {error, _, _}      -> ?fatal_error with a "Bad character" message;
%%  * {incomplete, _, _} -> cf/4 is called with Acc and this function as
%%                          the fun argument (cf/4 is defined outside this
%%                          file; presumably it obtains more input - confirm).
%% NOTE(review): there is deliberately no branch for a successful decode;
%% such a result would raise case_clause. Presumably the clauses that
%% precede this template at the expansion site make that unreachable -
%% confirm there.
-define(WHITESPACE(Bytes, State, Acc),
        whitespace(Bytes = ?STRING_UNBOUND_REST(_Char, _), State, Acc) ->
            {lists:reverse(Acc), Bytes, State};
        whitespace(Bytes, State = #xmerl_sax_parser_state{encoding = Enc}, Acc)
          when is_binary(Bytes) ->
            case unicode:characters_to_list(Bytes, Enc) of
                {error, _Encoded, _Rest} ->
                    ?fatal_error(State,
                                 lists:flatten(
                                   io_lib:format("Bad character, not in ~p\n", [Enc])));
                {incomplete, _, _} ->
                    cf(Bytes, State, Acc, fun whitespace/3)
            end).
%% Clause template for parse_external_entity_byte_order_mark/2
%% (big-endian UTF-16 input).
%%
%%  * Input starting with the complete mark (16#FE 16#FF): the two mark
%%    bytes are dropped and the remainder goes to parse_external_entity_1/2.
%%  * Input that is empty or holds only the first mark byte: handed to
%%    cf/3 together with this function as the fun argument. cf/3 is
%%    defined outside this file; presumably it obtains more input and
%%    resumes parsing - confirm against its definition.
%%  * Any other input: passed unchanged to parse_external_entity_1/2.
%%
%% The first three patterns are mutually exclusive, so their relative
%% order does not affect which clause is selected.
-define(PARSE_EXTERNAL_ENTITY_BYTE_ORDER_MARK(Bytes, State),
        parse_external_entity_byte_order_mark(?BYTE_ORDER_MARK_REST(Rest), State) ->
            parse_external_entity_1(Rest, State);
        parse_external_entity_byte_order_mark(?STRING_EMPTY = Bytes, State) ->
            cf(Bytes, State, fun parse_external_entity_byte_order_mark/2);
        parse_external_entity_byte_order_mark(?BYTE_ORDER_MARK_1 = Bytes, State) ->
            cf(Bytes, State, fun parse_external_entity_byte_order_mark/2);
        parse_external_entity_byte_order_mark(Bytes, State) ->
            parse_external_entity_1(Bytes, State)).
|