aboutsummaryrefslogtreecommitdiffstats
path: root/lib/xmerl/src/xmerl_html.erl
diff options
context:
space:
mode:
Diffstat (limited to 'lib/xmerl/src/xmerl_html.erl')
-rw-r--r--lib/xmerl/src/xmerl_html.erl122
1 files changed, 122 insertions, 0 deletions
diff --git a/lib/xmerl/src/xmerl_html.erl b/lib/xmerl/src/xmerl_html.erl
new file mode 100644
index 0000000000..38fdeb2205
--- /dev/null
+++ b/lib/xmerl/src/xmerl_html.erl
@@ -0,0 +1,122 @@
+%%
+%% %CopyrightBegin%
+%%
+%% Copyright Ericsson AB 2003-2009. All Rights Reserved.
+%%
+%% The contents of this file are subject to the Erlang Public License,
+%% Version 1.1, (the "License"); you may not use this file except in
+%% compliance with the License. You should have received a copy of the
+%% Erlang Public License along with this software. If not, it can be
+%% retrieved online at http://www.erlang.org/.
+%%
+%% Software distributed under the License is distributed on an "AS IS"
+%% basis, WITHOUT WARRANTY OF ANY KIND, either express or implied. See
+%% the License for the specific language governing rights and limitations
+%% under the License.
+%%
+%% %CopyrightEnd%
+%%
+
+%%% Description : Callback module for exporting XHTML to HTML.
+
+-module(xmerl_html).
+
+-export(['#xml-inheritance#'/0]).
+
+%% Note: we assume XHTML data, so all tags are lowercase!
+
+-export(['#root#'/4,
+ '#element#'/5,
+ '#text#'/1,
+ p/4]).
+
+-import(xmerl_lib, [start_tag/2, end_tag/1, is_empty_data/1,
+ find_attribute/2, export_text/1]).
+
+-include("xmerl.hrl").
+
+
+'#xml-inheritance#'() -> [].
+
+
+%% The '#text#' function is called for every text segment.
+
+'#text#'(Text) ->
+ export_text(Text).
+
+
+%% The '#root#' tag is called when the entire structure has been
+%% exported. It does not appear in the structure itself.
+
+'#root#'(Data, Attrs, [], _E) ->
+ Ver = case find_attribute(version, Attrs) of
+ {value, V} ->
+ V;
+ false ->
+%%% "-//W3C//DTD HTML 4.01//EN" % strict
+ "-//W3C//DTD HTML 4.01 Transitional//EN" % loose
+ end,
+ URI = case find_attribute(uri, Attrs) of
+ {value, U} ->
+ [" \"", U, "\""];
+ false ->
+%%% " \"http://www.w3.org/TR/html4/strict.dtd\""
+%%% " \"http://www.w3.org/TR/html4/loose.dtd\""
+ ""
+ end,
+ ["<!DOCTYPE HTML PUBLIC \"", Ver, "\"", URI, ">\n", Data].
+
+
+%% HTML does not have the <Tag/> empty-element form of XML/XHTML.
+markup(Tag, Attrs, Data) ->
+ [start_tag(Tag, Attrs), Data, end_tag(Tag)].
+
+%% Some HTML elements must not have an end tag at all.
+markup_noend(Tag, Attrs, Data) ->
+ [start_tag(Tag, Attrs), Data].
+
+
+%% For some element types, the end tag is forbidden. (In all other
+%% cases, we always generate the end tag, to make sure that the scope of
+%% a markup is not extended by mistake.)
+
+'#element#'(Tag, Data, Attrs, _Parents, _E) ->
+ case forbid_end(Tag) of
+ false ->
+ markup(Tag, Attrs, Data);
+ true ->
+ markup_noend(Tag, Attrs, Data)
+ end.
+
+
+%% HTML tags with special handling
+
+p(Data, Attrs, _Parents, _E) ->
+ %% In general, we cannot drop the end tag for paragraph elements;
+ %% that is only allowed if we know that it is immediately followed
+ %% by some other block-level tag.
+ case is_empty_data(Data) of
+ true ->
+ %% Paragraph elements should never be completely empty.
+ markup(p, Attrs, "\s");
+ false ->
+ markup(p, Attrs, Data)
+ end.
+
+
+%% Utility functions
+
+forbid_end(area) -> true;
+forbid_end(base) -> true;
+forbid_end(basefont) -> true;
+forbid_end(br) -> true;
+forbid_end(col) -> true;
+forbid_end(frame) -> true;
+forbid_end(hr) -> true;
+forbid_end(img) -> true;
+forbid_end(input) -> true;
+forbid_end(isindex) -> true;
+forbid_end(link) -> true;
+forbid_end(meta) -> true;
+forbid_end(param) -> true;
+forbid_end(_) -> false.