aboutsummaryrefslogtreecommitdiffstats
path: root/lib/xmerl/src/xmerl_otpsgml.erl
diff options
context:
space:
mode:
Diffstat (limited to 'lib/xmerl/src/xmerl_otpsgml.erl')
-rw-r--r--lib/xmerl/src/xmerl_otpsgml.erl162
1 files changed, 162 insertions, 0 deletions
diff --git a/lib/xmerl/src/xmerl_otpsgml.erl b/lib/xmerl/src/xmerl_otpsgml.erl
new file mode 100644
index 0000000000..38688e788f
--- /dev/null
+++ b/lib/xmerl/src/xmerl_otpsgml.erl
@@ -0,0 +1,162 @@
+%%
+%% %CopyrightBegin%
+%%
+%% Copyright Ericsson AB 2004-2009. All Rights Reserved.
+%%
+%% The contents of this file are subject to the Erlang Public License,
+%% Version 1.1, (the "License"); you may not use this file except in
+%% compliance with the License. You should have received a copy of the
+%% Erlang Public License along with this software. If not, it can be
+%% retrieved online at http://www.erlang.org/.
+%%
+%% Software distributed under the License is distributed on an "AS IS"
+%% basis, WITHOUT WARRANTY OF ANY KIND, either express or implied. See
+%% the License for the specific language governing rights and limitations
+%% under the License.
+%%
+%% %CopyrightEnd%
+%%
+
+%%% Description : Callback module for exporting XHTML to OTP-SGML.
+
+-module(xmerl_otpsgml).
+
+-export(['#xml-inheritance#'/0]).
+
+%% Note: we assume XML data, so all tags are lowercase!
+
+-export(['#root#'/4,
+ '#element#'/5,
+ '#text#'/1,
+ p/4]).
+
+-import(xmerl_lib, [markup/3, start_tag/2, is_empty_data/1,
+ export_text/1]).
+
+-include("xmerl.hrl").
+
+
+'#xml-inheritance#'() -> [xmerl_sgml].
+
+
+%% The '#text#' function is called for every text segment.
+
+'#text#'(Text) ->
+ export_text(Text).
+
+
+%% The '#root#' tag is called when the entire structure has been
+%% exported. It does not appear in the structure itself.
+
+'#root#'(Data, _Attrs, [], _E) ->
+ ["<!doctype erlref PUBLIC \"-//Stork//DTD erlref//EN\">\n",Data].
+
+
+%% Note that SGML does not have the <Tag/> empty-element form.
+%% Furthermore, for some element types, the end tag is forbidden. (In
+%% all other cases, we always generate the end tag, to make sure that
+%% the scope of a markup is not extended by mistake.)
+
+'#element#'(Tag, Data, Attrs, _Parents, _E) ->
+% io:format("parents:\n~p\n",[_Parents]),
+ case convert_tag(Tag,Attrs) of
+ {false,NewTag,NewAttrs} ->
+ markup(NewTag, NewAttrs, Data);
+ {true,NewTag,NewAttrs} ->
+ [start_tag(NewTag, NewAttrs), Data]
+ end.
+
+
+%% HTML tags with special handling
+
+p(Data, Attrs, _Parents, _E) ->
+ %% In general, we cannot drop the end tag for paragraph elements;
+ %% that is only allowed if we know that it is immediately followed
+ %% by some other block-level tag.
+ case is_empty_data(Data) of
+ true ->
+ %% Paragraph elements should never be completely empty.
+ markup(p, Attrs, "\s");
+ false ->
+ markup(p, Attrs, Data)
+ end.
+
+
+%% Utility functions
+
+convert_tag(code,Attrs) -> convert_tag(c,Attrs);
+convert_tag(strong,Attrs) -> convert_tag(em,Attrs);
+convert_tag(b,Attrs) -> convert_tag(em,Attrs);
+convert_tag(underline,Attrs) -> convert_tag(em,Attrs); % what is underline in sgml???
+convert_tag(dl,Attrs) -> convert_tag(taglist,Attrs);
+convert_tag(dt,Attrs) -> convert_tag(tag,Attrs);
+convert_tag(dd,Attrs) -> convert_tag(item,Attrs);
+convert_tag(ul,Attrs) -> convert_tag(list,Attrs);
+convert_tag(li,Attrs) -> convert_tag(item,Attrs);
+convert_tag(tt,Attrs) -> convert_tag(c,Attrs);
+%convert_tag(a, Attrs) -> convert_tag(seealso,convert_seealso_attrs(Attrs));
+convert_tag(a, Attrs) -> convert_tag(convert_aref(Attrs),convert_aref_attrs(convert_aref(Attrs),Attrs));
+convert_tag(Tag,Attrs) -> {forbid_end(Tag),Tag,Attrs}.
+
+convert_aref([#xmlAttribute{name = href, value = V}|_Rest]) ->
+ %% search if it is a html link, thus make it a 'url' ref otherwise
+ %% a 'seealso'.
+ case html_content(V) of
+ true ->
+ url;
+ _ ->
+ seealso
+ end;
+convert_aref([#xmlAttribute{name = K}|Rest]) ->
+ io:format("Warning: ignoring attribute \'~p\' for tag \'a\'\n",[K]),
+ convert_aref(Rest).
+convert_aref_attrs(url,Attrs) ->
+ Attrs;
+convert_aref_attrs(SA,[#xmlAttribute{name = href, value = V}=A|Rest]) ->
+ [A#xmlAttribute{name=marker,value=V}|convert_aref_attrs(SA,Rest)];
+convert_aref_attrs(_,[])->
+ [].
+html_content([]) ->
+ false;
+html_content([$.|Rest]) ->
+ case Rest of
+ "htm"++_EmaNfeR ->
+ true;
+ _ -> html_content(Rest)
+ end;
+html_content([_H|T]) ->
+ html_content(T).
+
+% convert_seealso_attrs([#xmlAttribute{name = href, value = V} = A|Rest]) ->
+% [A#xmlAttribute{name=marker,value=normalize_web_ref(V)}|convert_seealso_attrs(Rest)];
+% convert_seealso_attrs([#xmlAttribute{name = K}|Rest]) ->
+% io:format("Warning: ignoring attribute \'~p\' for tag \'a\'\n",[K]),
+% convert_seealso_attrs(Rest);
+% convert_seealso_attrs([]) ->
+% [].
+
+% normalize_web_ref(RefName) ->
+% normalize_web_ref1(lists:reverse(RefName)).
+
+% normalize_web_ref1("lmth."++EmaNfeR) ->
+% lists:reverse(EmaNfeR);
+% normalize_web_ref1("mth"++EmaNfeR) ->
+% lists:reverse(EmaNfeR);
+% normalize_web_ref1(RefName) ->
+% RefName.
+
+forbid_end(area) -> true;
+forbid_end(base) -> true;
+forbid_end(basefont) -> true;
+forbid_end(br) -> true;
+forbid_end(col) -> true;
+forbid_end(frame) -> true;
+forbid_end(hr) -> true;
+forbid_end(img) -> true;
+forbid_end(input) -> true;
+forbid_end(isindex) -> true;
+forbid_end(link) -> true;
+forbid_end(marker) -> true;
+forbid_end(meta) -> true;
+forbid_end(param) -> true;
+forbid_end(_) -> false.