From eec56b21f02368b085b0b1076233448459b4c555 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Bj=C3=B6rn-Egil=20Dahlberg?= <psyeugenic@gmail.com>
Date: Mon, 1 Feb 2010 11:51:06 +0100
Subject: Add lcnt documentation

Documentation for the lock profiling tool
---
 lib/tools/doc/src/Makefile         |   2 +
 lib/tools/doc/src/lcnt.xml         | 465 +++++++++++++++++++++++++++++++++++++
 lib/tools/doc/src/lcnt_chapter.xml | 301 ++++++++++++++++++++++++
 lib/tools/doc/src/part.xml         |   3 +
 lib/tools/doc/src/ref_man.xml      |   6 +
 5 files changed, 777 insertions(+)
 create mode 100644 lib/tools/doc/src/lcnt.xml
 create mode 100644 lib/tools/doc/src/lcnt_chapter.xml
diff --git a/lib/tools/doc/src/Makefile b/lib/tools/doc/src/Makefile
index bab607c4bd..5ac8718b61 100644
--- a/lib/tools/doc/src/Makefile
+++ b/lib/tools/doc/src/Makefile
@@ -41,6 +41,7 @@ XML_REF3_FILES = \
 	eprof.xml \
 	fprof.xml \
 	cprof.xml \
+	lcnt.xml \
 	instrument.xml \
 	make.xml \
 	tags.xml \
@@ -53,6 +54,7 @@ XML_CHAPTER_FILES = \
 	cover_chapter.xml \
 	fprof_chapter.xml \
 	cprof_chapter.xml \
+	lcnt_chapter.xml \
 	erlang_mode_chapter.xml \
 	xref_chapter.xml \
 	notes.xml \
diff --git a/lib/tools/doc/src/lcnt.xml b/lib/tools/doc/src/lcnt.xml
new file mode 100644
index 0000000000..3c55e4e422
--- /dev/null
+++ b/lib/tools/doc/src/lcnt.xml
@@ -0,0 +1,465 @@
+<?xml version="1.0" encoding="latin1" ?>
+<!DOCTYPE erlref SYSTEM "erlref.dtd">
+
+<erlref>
+    <header>
+	<copyright>
+	    <year>2009</year>
+	    <year>2010</year>
+	    <holder>Ericsson AB, All Rights Reserved</holder>
+	</copyright>
+	<legalnotice>
+	    The contents of this file are subject to the Erlang Public License,
+	    Version 1.1, (the "License"); you may not use this file except in
+	    compliance with the License. You should have received a copy of the
+	    Erlang Public License along with this software. If not, it can be
+	    retrieved online at http://www.erlang.org/.
+
+	    Software distributed under the License is distributed on an "AS IS"
+	    basis, WITHOUT WARRANTY OF ANY KIND, either express or implied. See
+	    the License for the specific language governing rights and limitations
+	    under the License.
+
+	    The Initial Developer of the Original Code is Ericsson AB.
+	</legalnotice>
+
+	<title>lcnt</title>
+	<prepared>Björn-Egil Dahlberg</prepared>
+	<responsible>nobody</responsible>
+	<docno></docno>
+	<approved>nobody</approved>
+	<checked></checked>
+	<date>2009-11-26</date>
+	<rev>PA1</rev>
+	<file>lcnt.xml</file>
+    </header>
+    <module>lcnt</module>
+    <modulesummary>A runtime system Lock Profiling tool.</modulesummary>
+    <description>
+	<p>The <c>lcnt</c> module is used to profile the internal ethread locks in the
+	    Erlang Runtime System. With <c>lcnt</c> enabled, Internal counters in the
+	    runtime system are updated each time a lock is taken. The counters stores
+	    information about the number of acquisition tries and the number of collisions
+	    that has occurred during the acquisition tries. The counters also record the
+	    waiting time a lock has caused for a blocked thread when a collision has occurred.
+	</p>
+	<p>
+	    The data produced by the lock counters will give an estimate on how well
+	    the runtime system will behave from a parallelizable view point for the
+	    scenarios tested. This tool was mainly developed to help erlang runtime
+	    developers iron out potential and generic bottlenecks.
+	</p>
+	<p>Locks in the emulator are named after what type of resource they protect and where
+	    in the emulator they are initialized, those are lock 'classes'. Most of those
+	    locks are also instantiated several times, and given unique identifiers, to increase
+	    locking granularity. Typically an instantiated lock protects a disjunct set of
+	    the resource, i.e ets-tables, processes or ports. In other cases it protects a
+	    specific range of a resource, e.g. <c>pix_lock</c> which protects index to process
+	    mappings, and is given a unique number within the class. A unique lock in <c>lcnt</c>
+	    is referenced by a name (class) and an identifier, <c>{Name, Id}</c>.
+	</p>
+	<p>Some locks in the system are static and protects global resources, for example
+	    <c>bif_timers</c> and the <c>run_queue</c> locks. Other locks are dynamic and not
+	    necessarily long lived, for example process locks and ets-table locks. The
+	    statistics data from short lived locks can be stored separately when the locks
+	    are deleted. This behavior is by default turned off to save memory but can be
+	    turned on via <c>lcnt:rt_opt({copy_save, true})</c>. The <c>lcnt:apply/1,2,3</c>
+	    functions enables this behavior during profiling.
+	</p>
+    </description>
+    <funcs>
+
+	<func>
+	    <name>start() -> {ok, Pid} | {error, {already_started, Pid}} </name>
+	    <fsummary>Starts the lock profiler server.</fsummary>
+	    <type>
+		<v>Pid = pid()</v>
+	    </type>
+	    <desc>
+		<p>Starts the lock profiler server. The server only act as a medium for the
+		    user and performs filtering and printing of data collected by <c>lcnt:collect/1</c>.
+		</p>
+	    </desc>
+	</func>
+
+	<func>
+	    <name>stop() -> ok</name>
+	    <fsummary>Stops the lock profiler server.</fsummary>
+	    <desc>
+		<p>Stops the lock profiler server.</p>
+	    </desc>
+	</func>
+
+	<func>
+	    <name>collect() -> ok</name>
+	    <fsummary>Same as <c>collect(node())</c>.</fsummary>
+	    <desc><p>Same as <c>collect(node())</c>.</p></desc>
+	</func>
+
+	<func>
+	    <name>collect(Node) -> ok</name>
+	    <fsummary>Collects lock statistics from the runtime system.</fsummary>
+	    <type>
+		<v>Node = node()</v>
+	    </type>
+	    <desc>
+		<p>Collects lock statistics from the runtime system. The function starts a
+		    server if it is not already started. It then populates the server with lock
+		    statistics. If the server held any lock statistics data before the collect then
+		    that data is lost.
+		</p>
+		<note>
+		    <p>
+			When collection occurs the runtime system transitions to a single thread,
+			blocking all other threads. No other tasks will be scheduled during this
+			operation. Depending on the size of the data this might take a long time
+			(several seconds) and cause timeouts in the system.
+		    </p>
+		</note>
+	    </desc>
+	</func>
+
+	<func>
+	    <name>clear() -> ok</name>
+	    <fsummary>Same as <c>clear(node())</c>.</fsummary>
+	    <desc><p>Same as <c>clear(node())</c>.</p></desc>
+	</func>
+
+	<func>
+	    <name>clear(Node) -> ok</name>
+	    <fsummary>Clears the internal lock statistics from runtime system.</fsummary>
+	    <type>
+		<v>Node = node()</v>
+	    </type>
+	    <desc>
+		<p>Clears the internal lock statistics from the runtime system. This does not clear the
+		    data on the server only on runtime system. All counters for static locks are zeroed,
+		    all dynamic locks currently alive are zeroed and all saved locks now destroyed are removed.
+		    It also resets the duration timer.
+		</p>
+	    </desc>
+	</func>
+	<func>
+	    <name>conflicts() -> ok</name>
+	    <fsummary>Same as <c>conflicts([])</c>.</fsummary>
+	    <desc><p>Same as <c>conflicts([])</c>.</p></desc>
+	</func>
+	<func>
+	    <name>conflicts([Option]) -> ok</name>
+	    <fsummary>Prints a list of internal lock counters.</fsummary>
+	    <type>
+		<v>Option     = {sort, Sort} | {reverse, bool()} | {thresholds, [Thresholds]} | {print, [Print | {Print, integer()}]} | {max_locks, MaxLocks} | {combine, bool()}</v>
+		<v>Sort       = name | id | type | tries | colls | ratio | time | entry</v>
+		<v>Thresholds = {tries, integer()} | {colls, integer()} | {time, integer()}</v>
+		<v>Print      = name | id | type | entry | tries | colls | ratio | time | duration</v>
+		<v>MaxLocks   = integer() | none</v>
+	    </type>
+	    <desc>
+		<p>Prints a list of internal locks and its statistics.</p>
+		<p>For option description, see <seealso marker="#inspect/2">lcnt:inspect/2</seealso>.</p>
+	    </desc>
+	</func>
+
+	<func>
+	    <name>locations() -> ok</name>
+	    <fsummary>Same as <c>locations([])</c>.</fsummary>
+	    <desc>
+		<p>Same as <c>locations([])</c>.</p>
+	    </desc>
+	</func>
+	<func>
+	    <name>locations([Option]) -> ok</name>
+	    <fsummary>Prints a list of internal lock counters by source code locations.</fsummary>
+	    <type>
+		<v>Option     = {sort, Sort} | {thresholds, [Thresholds]} | {print, [Print | {Print, integer()}]} | {max_locks, MaxLocks} | {combine, bool()}</v>
+		<v>Sort       = name | id | type | tries | colls | ratio | time | entry</v>
+		<v>Thresholds = {tries, integer()} | {colls, integer()} | {time, integer()}</v>
+		<v>Print      = name | id | type | entry | tries | colls | ratio | time | duration</v>
+		<v>MaxLocks   = integer() | none</v>
+	    </type>
+	    <desc>
+		<p>Prints a list of internal lock counters by source code locations.</p>
+		<p>For option description, see <seealso marker="#inspect/2">lcnt:inspect/2</seealso>.</p>
+	    </desc>
+	</func>
+
+	<func>
+	    <name>inspect(Lock) -> ok</name>
+	    <fsummary>Same as <c>inspect(Lock, [])</c>.</fsummary>
+	    <desc><p>Same as <c>inspect(Lock, [])</c>.</p></desc>
+	</func>
+	<func>
+	    <name>inspect(Lock, [Option]) -> ok</name>
+	    <fsummary>Prints a list of internal lock counters for a specific lock.</fsummary>
+	    <type>
+		<v>Lock       = Name | {Name, Id | [Id]}</v>
+		<v>Name       = atom() | pid() | port()</v>
+		<v>Id         = atom() | integer() | pid() | port()</v>
+		<v>Option     = {sort, Sort} | {thresholds, [Thresholds]} | {print, [Print | {Print, integer()}]} | {max_locks, MaxLocks} | {combine, bool()} | {locations, bool()}</v>
+		<v>Sort       = name | id | type | tries | colls | ratio | time</v>
+		<v>Thresholds = {tries, integer()} | {colls, integer()} | {time, integer()}</v>
+		<v>Print      = name | id | type | entry | tries | colls | ratio | time | duration</v>
+		<v>MaxLocks   = integer() | none</v>
+	    </type>
+	    <desc>
+		<p>Prints a list of internal lock counters for a specific lock.</p>
+		<p>Lock <c>Name</c> and <c>Id</c> for ports and processes are interchangeable with the use of <c>lcnt:swap_pid_keys/0</c> and is the reason why <c>pid()</c> and <c>port()</c> options can be used in both <c>Name</c> and <c>Id</c> space. Both pids and ports are special identifiers with stripped creation and can be recreated with <seealso marker="#pid/3">lcnt:pid/2,3</seealso> and <seealso marker="#port/2">lcnt:port/1,2</seealso>.  </p>
+		<p>Option description:</p>
+		<taglist>
+		    <tag><c>{combine, bool()}</c></tag>
+		    <item>Combine the statistics from different instances of a lock class.
+			<br/>Default: <c>true</c>
+		    </item>
+
+		    <tag><c>{locations, bool()}</c></tag>
+		    <item>Print the statistics by source file and line numbers.
+			<br/>Default: <c>false</c>
+		    </item>
+
+		    <tag><c>{max_locks, MaxLocks}</c></tag>
+		    <item>Maximum number of locks printed or no limit with <c>none</c>.
+			<br/>Default: <c>20</c>
+		    </item>
+
+		    <tag><c>{print, PrintOptions}</c></tag>
+		    <item>Printing options:
+			<taglist>
+			    <tag><c>name</c></tag>
+			    <item>Named lock or named set of locks (classes). The same name used for initializing the lock in the VM.</item>
+
+			    <tag><c>id</c></tag>
+			    <item>Internal id for set of locks, not always unique. This could be table name for ets tables (db_tab), port id for ports, integer identifiers for allocators, etc.</item>
+
+			    <tag><c>type</c></tag>
+			    <item>Type of lock: <c>rw_mutex</c>, <c>mutex</c>, <c>spinlock</c>, <c>rw_spinlock</c> or <c>proclock</c>.</item>
+
+			    <tag><c>entry</c></tag>
+			    <item>In combination with <c>{locations, true}</c> this option prints the lock operations source file and line number entry-points along with statistics for each entry. </item>
+
+			    <tag><c>tries</c></tag>
+			    <item>Number of acquisitions of this lock.</item>
+
+			    <tag><c>colls</c></tag>
+			    <item>Number of collisions when a thread tried to acquire this lock. This is when a trylock is EBUSY, a write try on read held rw_lock, a try read on write held rw_lock, a thread tries to lock an already locked lock. (Internal states supervises this).</item>
+
+			    <tag><c>ratio</c></tag>
+			    <item>The ratio between the number of collisions and the number of tries (acquisitions) in percentage.</item>
+
+			    <tag><c>time</c></tag>
+			    <item>Accumulated waiting time for this lock. This could be greater than actual wall clock time, it is accumulated for all threads. Trylock conflicts does not accumulate time.</item>
+
+			    <tag><c>duration</c></tag>
+			    <item>Percentage of accumulated waiting time of wall clock time. This percentage can be higher than 100% since accumulated time is from all threads.</item>
+			</taglist>
+			<br/>Default: <c>[name,id,tries,colls,ratio,time,duration]</c>
+		    </item>
+
+		    <tag><c>{reverse, bool()}</c></tag>
+		    <item>Reverses the order of sorting.
+			<br/>Default: <c>false</c>
+		    </item>
+
+		    <tag><c>{sort, Sort}</c></tag>
+		    <item>Column sorting orders.
+			<br/>Default: <c>time</c>
+		    </item>
+
+		    <tag><c>{thresholds, Thresholds}</c></tag>
+		    <item>Filtering thresholds. Anything values above the threshold value are passed through.
+			<br/>Default: <c>[{tries, 0}, {colls, 0}, {time, 0}]</c>
+		    </item>
+
+		</taglist>
+
+	    </desc>
+	</func>
+
+	<func>
+	    <name>information() -> ok</name>
+	    <fsummary>Prints lcnt server state and generic information about collected lock statistics.</fsummary>
+	    <desc>
+		<p>Prints lcnt server state and generic information about collected lock statistics.</p>
+	    </desc>
+	</func>
+
+	<func>
+	    <name>swap_pid_keys() -> ok</name>
+	    <fsummary>Swaps places on <c>Name</c> and <c>Id</c> space for ports and processes.</fsummary>
+	    <desc>
+		<p>Swaps places on <c>Name</c> and <c>Id</c> space for ports and processes.</p>
+	    </desc>
+	</func>
+
+	<func>
+	    <name>load(Filename) -> ok</name>
+	    <fsummary>Restores previously saved data to the server.</fsummary>
+	    <type>
+		<v>Filename = filename()</v>
+	    </type>
+	    <desc>
+		<p>Restores previously saved data to the server.</p>
+	    </desc>
+	</func>
+
+	<func>
+	    <name>save(Filename) -> ok</name>
+	    <fsummary>Saves the collected data to file.</fsummary>
+	    <type>
+		<v>Filename = filename()</v>
+	    </type>
+	    <desc>
+		<p>Saves the collected data to file.</p>
+	    </desc>
+	</func>
+    </funcs>
+
+    <section>
+	<title>Convenience functions</title>
+	<p>The following functions are used for convenience.</p>
+    </section>
+    <funcs>
+	<func>
+	    <name>apply(Fun) -> term()</name>
+	    <fsummary>Same as <c>apply(Fun, [])</c>.</fsummary>
+	    <desc>
+		<p>Same as <c>apply(Fun, [])</c>.</p>
+	    </desc>
+	</func>
+	<func>
+	    <name>apply(Fun, Args) -> term()</name>
+	    <fsummary>Clears counters, applies function and collects the profiling results.</fsummary>
+	    <type>
+		<v>Fun = fun()</v>
+		<v>Args = [term()]</v>
+	    </type>
+	    <desc>
+		<p> Clears the lock counters and then setups the instrumentation to save all destroyed locks.
+		    After setup the fun is called, passing the elements in <c>Args</c> as arguments.
+		    When the fun returns the statistics are immediately collected to the server. After the
+		    collection the instrumentation is returned to its previous behavior.
+		    The result of the applied fun is returned.
+		</p>
+	    </desc>
+	</func>
+	<func>
+	    <name>apply(Module, Function, Args) -> term()</name>
+	    <fsummary>Clears counters, applies function and collects the profiling results.</fsummary>
+	    <type>
+		<v>Module = atom()</v>
+		<v>Function = atom()</v>
+		<v>Args = [term()]</v>
+	    </type>
+	    <desc>
+		<p> Clears the lock counters and then setups the instrumentation to save all destroyed locks.
+		    After setup the function is called, passing the elements in <c>Args</c> as arguments.
+		    When the function returns the statistics are immediately collected to the server. After the
+		    collection the instrumentation is returned to its previous behavior.
+		    The result of the applied function is returned.
+		</p>
+	    </desc>
+	</func>
+
+	<func>
+	    <name>pid(Id, Serial) -> pid()</name>
+	    <fsummary>Same as <c>pid(node(), Id, Serial)</c>.</fsummary>
+	    <desc><p>Same as <c>pid(node(), Id, Serial)</c>.</p></desc>
+	</func>
+	<func>
+	    <name>pid(Node, Id, Serial) -> pid()</name>
+	    <fsummary>Creates a process id with creation 0.</fsummary>
+	    <type>
+		<v>Node = node()</v>
+		<v>Id = integer()</v>
+		<v>Serial = integer()</v>
+	    </type>
+	    <desc>
+		<p>Creates a process id with creation 0. Example:</p>
+	    </desc>
+	</func>
+
+	<func>
+	    <name>port(Id) -> port()</name>
+	    <fsummary>Same as <c>port(node(), Id)</c>.</fsummary>
+	    <desc><p>Same as <c>port(node(), Id)</c>.</p></desc>
+	</func>
+	<func>
+	    <name>port(Node, Id) -> port()</name>
+	    <fsummary>Creates a port id with creation 0.</fsummary>
+	    <type>
+		<v>Node = node()</v>
+		<v>Id = integer()</v>
+	    </type>
+	    <desc><p>Creates a port id with creation 0.</p></desc>
+	</func>
+
+    </funcs>
+
+    <section>
+	<title>Internal runtime lock counter controllers</title>
+	<p> The following functions control the behavior of the internal counters.  </p>
+    </section>
+
+    <funcs>
+	<func>
+	    <name>rt_collect() -> [lock_counter_data()]</name>
+	    <fsummary>Same as <c>rt_collect(node())</c>.</fsummary>
+	    <desc> <p>Same as <c>rt_collect(node())</c>.</p> </desc>
+	</func>
+	<func>
+	    <name>rt_collect(Node) -> [lock_counter_data()]</name>
+	    <fsummary>Returns a list of raw lock counter data.</fsummary>
+	    <type>
+		<v>Node = node()</v>
+	    </type>
+	    <desc> <p>Returns a list of raw lock counter data.</p> </desc>
+	</func>
+
+	<func>
+	    <name>rt_clear() -> ok</name>
+	    <fsummary>Same as <c>rt_clear(node())</c>.</fsummary>
+	    <desc> <p>Same as <c>rt_clear(node())</c>.</p> </desc>
+	</func>
+	<func>
+	    <name>rt_clear(Node) -> ok</name>
+	    <fsummary>Clears the internal counters.</fsummary>
+	    <type>
+		<v>Node = node()</v>
+	    </type>
+	    <desc> <p>Clear the internal counters. Same as <c>lcnt:clear(Node)</c>.</p></desc>
+	</func>
+
+	<func>
+	    <name>rt_opt({Type, bool()}) -> bool()</name>
+	    <fsummary>Same as <c>rt_opt(node(), {Type, Opt})</c>.</fsummary>
+	    <desc> <p>Same as <c>rt_opt(node(), {Type, Opt})</c>.</p> </desc>
+	</func>
+	<func>
+	    <name>rt_opt(Node, {Type, bool()}) -> bool()</name>
+	    <fsummary>Changes the lock counter behavior and returns the previous behaviour.</fsummary>
+	    <type>
+		<v>Node = node()</v>
+		<v>Type = copy_save | process_locks</v>
+	    </type>
+	    <desc>
+		<p>Changes the lock counter behavior and returns the previous behaviour.</p>
+		<p>Option description:</p>
+		<taglist>
+		    <tag><c>{copy_save, bool()}</c></tag>
+		    <item>Enable statistics saving from destroyed locks by copying. This might consume a lot of memory.
+			<br/>Default: <c>false</c>
+		    </item>
+
+		    <tag><c>{process_locks, bool()}</c></tag>
+		    <item>Profile process locks.
+			<br/>Default: <c>true</c>
+		    </item>
+		</taglist>
+	    </desc>
+	</func>
+    </funcs>
+
+    <section>
+	<title>See Also</title>
+	<p> <seealso marker="lcnt_chapter">LCNT User's Guide</seealso></p>
+    </section>
+</erlref>
diff --git a/lib/tools/doc/src/lcnt_chapter.xml b/lib/tools/doc/src/lcnt_chapter.xml
new file mode 100644
index 0000000000..8f44b23f59
--- /dev/null
+++ b/lib/tools/doc/src/lcnt_chapter.xml
@@ -0,0 +1,301 @@
+<?xml version="1.0" encoding="latin1" ?>
+<!DOCTYPE chapter SYSTEM "chapter.dtd">
+
+<chapter>
+    <header>
+	<copyright>
+	    <year>2009</year><year>2010</year>
+	    <holder>Ericsson AB. All Rights Reserved.</holder>
+	</copyright>
+	<legalnotice>
+	    The contents of this file are subject to the Erlang Public License,
+	    Version 1.1, (the "License"); you may not use this file except in
+	    compliance with the License. You should have received a copy of the
+	    Erlang Public License along with this software. If not, it can be
+	    retrieved online at http://www.erlang.org/.
+
+	    Software distributed under the License is distributed on an "AS IS"
+	    basis, WITHOUT WARRANTY OF ANY KIND, either express or implied. See
+	    the License for the specific language governing rights and limitations
+	    under the License.
+
+	</legalnotice>
+
+	<title>lcnt - The Lock Profiler</title>
+	<prepared>Björn-Egil Dahlberg</prepared>
+	<responsible>nobody</responsible>
+	<docno></docno>
+	<approved>nobody</approved>
+	<checked>no</checked>
+	<date>2009-11-26</date>
+	<rev>PA1</rev>
+	<file>lcnt_chapter.xml</file>
+    </header>
+    <p>
+	Internally in the Erlang runtime system locks are used to protect resources from being updated from multiple threads in a fatal way. Locks are necessary
+	to ensure that the runtime system works properly but it also introduces a couple of limitations. Lock contention and locking overhead.
+    </p>
+    <p>
+	With lock contention we mean when one thread locks a resource and another thread, or threads, tries to acquire the same resource at the same time. The lock will deny
+	the other thread access to the resource and the thread will be blocked from continuing its execution. The second thread has to wait until the first thread has
+	completed its access to the resource and unlocked it. The <c>lcnt</c> tool measures these lock conflicts.
+    </p>
+    <p>
+	Locks has an inherent cost in execution time and memory space. It takes time initialize, destroy, aquiring or releasing locks. To decrease lock contention it
+	some times necessary to use finer grained locking strategies. This will usually also increase the locking overhead and hence there is a tradeoff
+	between lock contention and overhead. In general, lock contention increases with the number of threads running concurrently. The <c>lcnt</c> tool does not measure locking overhead.
+    </p>
+    <section>
+	<title> Enabling lock-counting </title>
+	<p>For investigation of locks in the emulator we use an internal tool called <c>lcnt</c> (short for lock-count). The VM needs to be compiled with this option enabled. To enable this, use:</p>
+
+	<pre>
+cd $ERL_TOP
+./configure --enable-lock-counter
+	</pre>
+
+	<p>
+	    Another way to enable this alongside a normal VM is to compile it at emulator directory level, much like a debug build. To compile it this way do the following,
+	</p>
+	<pre>
+cd $ERL_TOP/erts/emulator
+make lcnt FLAVOR=smp
+	</pre>
+	<p> and then starting Erlang with,</p>
+	<pre>
+$ERL_TOP/bin/cerl -lcnt
+	</pre>
+	<p>To verify that you lock-counting enabled check that <c>[lock-counting]</c> appears in the status text when the VM is started.</p>
+	<pre>
+Erlang R13B03 (erts-5.7.4) [source] [64-bit] [smp:8:8] [rq:8] [async-threads:0] [hipe]
+ [kernel-poll:false] [lock-counting]
+	</pre>
+    </section>
+    <section>
+	<title>Getting started</title>
+	<p>Once you have a lock counting enabled VM the module <c>lcnt</c> can be used. The module is intended to be used from the current running nodes shell. To access remote nodes use <c>lcnt:clear(Node)</c> and <c>lcnt:collect(Node)</c>. </p>
+
+	<p>All locks are continuously monitored and its statistics updated. Use <c>lcnt:clear/0</c> to initially clear all counters before running any specific tests. This command will also reset the duration timer internally.</p>
+	<p>To retrieve lock statistics information use, <c>lcnt:collect/0,1</c>. The collect operation will start a <c>lcnt</c> server if it not already started. All collected data will be built into an erlang term and uploaded to the server and a duration time will also be uploaded. This duration is the time between <c>lcnt:clear/0,1</c> and <c>lcnt:collect/0,1</c>.</p>
+
+	<p>Once the data is collected to the server it can be filtered, sorted and printed in many different ways.</p>
+	<p>See the <seealso marker="lcnt">reference manual</seealso> for a description of each function.</p>
+    </section>
+    <section>
+	<title> Example of usage </title>
+	<p>From the Erlang shell:</p>
+	<pre>
+Erlang R13B03 (erts-5.7.4) [source] [smp:8:8] [rq:8] [async-threads:0] [hipe]
+ [kernel-poll:false] [lock-counting]
+1> lcnt:rt_opt({copy_save, true}).
+false
+2> lcnt:clear(), big:bang(1000), lcnt:collect().
+ok
+3> lcnt:conflicts().
+                   lock   id  #tries  #collisions  collisions [%]  time [us]  duration [%]
+                  -----  --- ------- ------------ --------------- ---------- -------------
+         alcu_allocator   50 4113692       158921          3.8632     215464        4.4962
+               pix_lock  256 4007140         4882          0.1218      12221        0.2550
+              run_queue    8 2287246         6949          0.3038       9825        0.2050
+              proc_main 1029 3115778        25755          0.8266       1199        0.0250
+              proc_msgq 1029 2467022         1910          0.0774       1048        0.0219
+            proc_status 1029 5708439         2435          0.0427        706        0.0147
+ message_pre_alloc_lock    8 2008569          134          0.0067         90        0.0019
+              timeofday    1   54065            8          0.0148         22        0.0005
+                gc_info    1    7071            7          0.0990          5        0.0001
+ok
+</pre>
+<p>
+    Another way to to profile a specific function is to use <c>lcnt:apply/3</c> or <c>lcnt:apply/1</c> which does <c>lcnt:clear/0</c> before the function and <c>lcnt:collect/0</c> after its invocation.
+    It also sets <c>copy_save</c> to <c>true</c> for the duration of the function call
+</p>
+<pre>
+Erlang R13B03 (erts-5.7.4) [source] [smp:8:8] [rq:8] [async-threads:0] [hipe]
+ [kernel-poll:false] [lock-counting]
+1> lcnt:apply(fun() -> big:bang(1000) end).
+4384.338
+2> lcnt:conflicts().
+                   lock   id  #tries  #collisions  collisions [%]  time [us]  duration [%]
+                  -----  --- ------- ------------ --------------- ---------- -------------
+         alcu_allocator   50 4117913       183091          4.4462     234232        5.1490
+              run_queue    8 2050398         3801          0.1854       6700        0.1473
+               pix_lock  256 4007080         4943          0.1234       2847        0.0626
+              proc_main 1028 3000178        28247          0.9415       1022        0.0225
+              proc_msgq 1028 2293677         1352          0.0589        545        0.0120
+            proc_status 1028 5258029         1744          0.0332        442        0.0097
+ message_pre_alloc_lock    8 2009322          147          0.0073         82        0.0018
+              timeofday    1   48616            9          0.0185         13        0.0003
+                gc_info    1    7455           12          0.1610          9        0.0002
+ok
+</pre>
+<p> The process locks are sorted after its class like all other locks. It is convenient to look at specific processes and ports as classes. We can do this by swapping class and class identifiers with <c>lcnt:swap_pid_keys/0</c>.  </p>
+<pre>
+3> lcnt:swap_pid_keys().
+ok
+4> lcnt:conflicts([{print, [name, tries, ratio, time]}]).
+                   lock  #tries  collisions [%]  time [us]
+                  ----- ------- --------------- ----------
+         alcu_allocator 4117913          4.4462     234232
+              run_queue 2050398          0.1854       6700
+               pix_lock 4007080          0.1234       2847
+ message_pre_alloc_lock 2009322          0.0073         82
+  &lt;nonode@nohost.660.0&gt;   13493          1.4452         41
+  &lt;nonode@nohost.724.0&gt;   13504          1.1404         36
+  &lt;nonode@nohost.803.0&gt;   13181          1.6235         35
+  &lt;nonode@nohost.791.0&gt;   13534          0.8202         22
+   &lt;nonode@nohost.37.0&gt;    8744          5.8326         22
+  &lt;nonode@nohost.876.0&gt;   13335          1.1174         19
+  &lt;nonode@nohost.637.0&gt;   13452          1.3678         19
+  &lt;nonode@nohost.799.0&gt;   13497          1.8745         18
+  &lt;nonode@nohost.469.0&gt;   11009          2.5343         18
+  &lt;nonode@nohost.862.0&gt;   13131          1.2566         16
+  &lt;nonode@nohost.642.0&gt;   13216          1.7327         15
+  &lt;nonode@nohost.582.0&gt;   13156          1.1098         15
+  &lt;nonode@nohost.622.0&gt;   13420          0.7303         14
+  &lt;nonode@nohost.596.0&gt;   13141          1.6437         14
+  &lt;nonode@nohost.592.0&gt;   13346          1.2064         13
+  &lt;nonode@nohost.526.0&gt;   13076          1.1701         13
+ok
+</pre>
+      </section>
+      <section>
+	<title> Example with Mnesia Transaction Benchmark </title>
+	<p>From the Erlang shell:</p>
+<pre>
+Erlang R13B03 (erts-5.7.4) [source] [smp:8:8] [rq:8] [async-threads:0] [hipe]
+ [kernel-poll:false] [lock-counting]
+
+Eshell V5.7.4  (abort with ^G)
+1> Conf=[{db_nodes, [node()]}, {driver_nodes, [node()]}, {replica_nodes, [node()]},
+ {n_drivers_per_node, 10}, {n_branches, 1000}, {n_accounts_per_branch, 10},
+ {replica_type, ram_copies}, {stop_after, 60000}, {reuse_history_id, true}].
+[{db_nodes,[nonode@nohost]},
+ {driver_nodes,[nonode@nohost]},
+ {replica_nodes,[nonode@nohost]},
+ {n_drivers_per_node,10},
+ {n_branches,1000},
+ {n_accounts_per_branch,10},
+ {replica_type,ram_copies},
+ {stop_after,60000},
+ {reuse_history_id,true}]
+2> mnesia_tpcb:init([{use_running_mnesia, false}|Conf]).
+ignore
+</pre>
+<p>Initial configuring of the benchmark is done. It is time to profile the actual benchmark and Mnesia</p>
+<pre>
+3> lcnt:apply(fun() -> {ok,{time, Tps,_,_,_,_}} = mnesia_tpcb:run([{use_running_mnesia,
+ true}|Conf]), Tps/60 end).
+12037.483333333334
+ok
+4> lcnt:swap_pid_keys().
+ok
+</pre>
+<p>The <c>id</c> header represents the number of unique identifiers under a class when the option <c>{combine, true}</c> is used (which is on by default). It will otherwise show the specific identifier.
+The <c>db_tab</c> listing shows 722287 unique locks, it is one for each ets-table created and Mnesia creates one for each transaction.
+</p>
+<pre>
+5> lcnt:conflicts().
+                   lock     id   #tries  #collisions  collisions [%]  time [us]  duration [%]
+                  -----    ---  ------- ------------ --------------- ---------- -------------
+         alcu_allocator     50 56355118       732662          1.3001    2934747        4.8862
+                 db_tab 722287 94513441        63203          0.0669    1958797        3.2613
+              timeofday      1  2701048       175854          6.5106    1746079        2.9071
+               pix_lock    256 24306168       163214          0.6715     918309        1.5289
+              run_queue      8 11813811       152637          1.2920     357040        0.5945
+ message_pre_alloc_lock      8 17671449        57203          0.3237     263043        0.4380
+          mnesia_locker      4 17477633      1618548          9.2607      97092        0.1617
+              mnesia_tm      4  9891408       463788          4.6888      86353        0.1438
+                gc_info      1   823460          628          0.0763      24826        0.0413
+     meta_main_tab_slot     16 41393400         7193          0.0174      11393        0.0190
+ &lt;nonode@nohost.1108.0&gt;      4  4331412          333          0.0077       7148        0.0119
+            timer_wheel      1   203185           30          0.0148       3108        0.0052
+ &lt;nonode@nohost.1110.0&gt;      4  4291098          210          0.0049        885        0.0015
+ &lt;nonode@nohost.1114.0&gt;      4  4294702          288          0.0067        442        0.0007
+ &lt;nonode@nohost.1113.0&gt;      4  4346066          235          0.0054        390        0.0006
+ &lt;nonode@nohost.1106.0&gt;      4  4348159          287          0.0066        379        0.0006
+ &lt;nonode@nohost.1111.0&gt;      4  4279309          290          0.0068        325        0.0005
+ &lt;nonode@nohost.1107.0&gt;      4  4292190          302          0.0070        315        0.0005
+ &lt;nonode@nohost.1112.0&gt;      4  4208858          265          0.0063        276        0.0005
+ &lt;nonode@nohost.1109.0&gt;      4  4377502          267          0.0061        276        0.0005
+ok
+</pre>
+<p>The listing shows <c>mnesia_locker</c>, a process, has highly contended locks.</p>
+<pre>
+6> lcnt:inspect(mnesia_locker).
+          lock          id  #tries  #collisions  collisions [%]  time [us]  duration [%]
+         -----         --- ------- ------------ --------------- ---------- -------------
+ mnesia_locker   proc_msgq 5449930        59374          1.0894      69781        0.1162
+ mnesia_locker   proc_main 4462782      1487374         33.3284      14398        0.0240
+ mnesia_locker proc_status 7564921        71800          0.9491      12913        0.0215
+ mnesia_locker   proc_link       0            0          0.0000          0        0.0000
+ok
+</pre>
+<p>Listing without class combiner.</p>
+
+<pre>
+7> lcnt:conflicts([{combine, false}, {print, [name, id, tries, ratio, time]}]).
+                   lock                        id   #tries  collisions [%]  time [us]
+                  -----                       ---  ------- --------------- ----------
+                 db_tab mnesia_transient_decision   722250          3.9463    1856852
+              timeofday                 undefined  2701048          6.5106    1746079
+         alcu_allocator                 ets_alloc  7490696          2.2737     692655
+         alcu_allocator                 ets_alloc  7081771          2.3294     664522
+         alcu_allocator                 ets_alloc  7047750          2.2520     658495
+         alcu_allocator                 ets_alloc  5883537          2.3177     610869
+               pix_lock                        58 11011355          1.1924     564808
+               pix_lock                        60  4426484          0.7120     262490
+         alcu_allocator                 ets_alloc  1897004          2.4248     219543
+ message_pre_alloc_lock                 undefined  4211267          0.3242     128299
+              run_queue                         3  2801555          1.3003     116792
+              run_queue                         2  2799988          1.2700     100091
+              run_queue                         1  2966183          1.2712      78834
+          mnesia_locker                 proc_msgq  5449930          1.0894      69781
+ message_pre_alloc_lock                 undefined  3495672          0.3262      65773
+ message_pre_alloc_lock                 undefined  4189752          0.3174      58607
+              mnesia_tm                 proc_msgq  2094144          1.7184      56361
+              run_queue                         4  2343585          1.3115      44300
+                 db_tab                    branch  1446529          0.5229      38244
+                gc_info                 undefined   823460          0.0763      24826
+ok
+</pre>
+<p>
+In this scenario the lock that protects ets-table <c>mnesia_transient_decision</c> has spent most of its waiting for. That is 1.8 seconds in a test that run for 60 seconds. The time is also spread on eight different scheduler threads.
+</p>
+<pre>
+8> lcnt:inspect(db_tab, [{print, [name, id, tries, colls, ratio, duration]}]).
+   lock                        id  #tries  #collisions  collisions [%]  duration [%]
+  -----                       --- ------- ------------ --------------- -------------
+ db_tab mnesia_transient_decision  722250        28502          3.9463        3.0916
+ db_tab                    branch 1446529         7564          0.5229        0.0637
+ db_tab                   account 1464500         8203          0.5601        0.0357
+ db_tab                    teller 1464529         8110          0.5538        0.0291
+ db_tab                   history  722250         3767          0.5216        0.0232
+ db_tab              mnesia_stats  750332         7057          0.9405        0.0180
+ db_tab        mnesia_trans_store      61            0          0.0000        0.0000
+ db_tab        mnesia_trans_store      61            0          0.0000        0.0000
+ db_tab        mnesia_trans_store      53            0          0.0000        0.0000
+ db_tab        mnesia_trans_store      53            0          0.0000        0.0000
+ db_tab        mnesia_trans_store      53            0          0.0000        0.0000
+ db_tab        mnesia_trans_store      53            0          0.0000        0.0000
+ db_tab        mnesia_trans_store      53            0          0.0000        0.0000
+ db_tab        mnesia_trans_store      53            0          0.0000        0.0000
+ db_tab        mnesia_trans_store      53            0          0.0000        0.0000
+ db_tab        mnesia_trans_store      53            0          0.0000        0.0000
+ db_tab        mnesia_trans_store      53            0          0.0000        0.0000
+ db_tab        mnesia_trans_store      53            0          0.0000        0.0000
+ db_tab        mnesia_trans_store      53            0          0.0000        0.0000
+ db_tab        mnesia_trans_store      53            0          0.0000        0.0000
+ok
+</pre>
+
+    </section>
+    <section>
+	<title> Deciphering the output </title>
+	<p> Typically high <c>time</c> values are bad and this is often the thing to look for. However, one should also look for high lock acquisition frequencies (#tries) since locks generate overhead and because high frequency could become problematic if they begin to have conflicts even if it is not shown in a particular test.  </p>
+    </section>
+
+    <section>
+	<title>See Also</title>
+	<p> <seealso marker="lcnt">LCNT Reference Manual</seealso></p>
+    </section>
+</chapter>
diff --git a/lib/tools/doc/src/part.xml b/lib/tools/doc/src/part.xml
index 3e02086b80..19f0763410 100644
--- a/lib/tools/doc/src/part.xml
+++ b/lib/tools/doc/src/part.xml
@@ -55,6 +55,8 @@
       <tag><em>instrument</em></tag>
       <item>Utility functions for obtaining and analysing resource usage
        in an instrumented Erlang runtime system.</item>
+      <tag><em>lcnt</em></tag>
+      <item>A lock profiling tool for the Erlang runtime system.</item>
       <tag><em>make</em></tag>
       <item>A make utility for Erlang similar to UNIX make.</item>
       <tag><em>tags</em></tag>
@@ -69,6 +71,7 @@
   <xi:include href="cprof_chapter.xml"/>
   <xi:include href="erlang_mode_chapter.xml"/>
   <xi:include href="fprof_chapter.xml"/>
+  <xi:include href="lcnt_chapter.xml"/>
   <xi:include href="xref_chapter.xml"/>
 </part>
 
diff --git a/lib/tools/doc/src/ref_man.xml b/lib/tools/doc/src/ref_man.xml
index aea74e3746..6cd4975075 100644
--- a/lib/tools/doc/src/ref_man.xml
+++ b/lib/tools/doc/src/ref_man.xml
@@ -51,9 +51,14 @@
        Erlang programs. Uses trace to file to minimize runtime
        performance impact, and displays time for calling and called 
        functions.</item>
+
       <tag><em>instrument</em></tag>
       <item>Utility functions for obtaining and analysing resource usage
        in an instrumented Erlang runtime system.</item>
+
+      <tag><em>lcnt</em></tag>
+      <item>A lock profiling tool for the Erlang runtime system.</item>
+
       <tag><em>make</em></tag>
       <item>A make utility for Erlang similar to UNIX make.</item>
       <tag><em>tags</em></tag>
@@ -70,6 +75,7 @@
   <xi:include href="erlang_mode.xml"/>
   <xi:include href="fprof.xml"/>
   <xi:include href="instrument.xml"/>
+  <xi:include href="lcnt.xml"/>
   <xi:include href="make.xml"/>
   <xi:include href="tags.xml"/>
   <xi:include href="xref.xml"/>
-- 
cgit v1.2.3