From a64fd47f6196f769f19a205885a8ca5a4a0388c5 Mon Sep 17 00:00:00 2001 From: June McEnroe Date: Tue, 7 Sep 2021 16:53:43 -0400 Subject: Add dehtml --- bin/man1/dehtml.1 | 35 +++++++++++++++++++++++++++++++++++ 1 file changed, 35 insertions(+) create mode 100644 bin/man1/dehtml.1 (limited to 'bin/man1/dehtml.1') diff --git a/bin/man1/dehtml.1 b/bin/man1/dehtml.1 new file mode 100644 index 00000000..a0c5a8c4 --- /dev/null +++ b/bin/man1/dehtml.1 @@ -0,0 +1,35 @@ +.Dd September 7, 2021 +.Dt DEHTML 1 +.Os +. +.Sh NAME +.Nm dehtml +.Nd extract text from HTML +. +.Sh SYNOPSIS +.Nm +.Op Fl s +.Op Ar +. +.Sh DESCRIPTION +The +.Nm +utility extracts text +from HTML documents. +Text inside +.Sy , +.Sy <style> +and +.Sy <script> +tags is discarded. +Numeric and common named HTML entities +are converted. +. +.Pp +The arguments are as follows: +.Bl -tag -width Ds +.It Fl s +Collapse whitespace outside of +.Sy <pre> +tags. +.El -- cgit 1.4.1 ='/src/'>summary</a> <a href='/src/refs/?id=399db92745bcbaa8a9345eed26848d39dc3ea220'>refs</a> <a class='active' href='/src/log/bin/dash/configure.ac?follow=1'>log</a> <a href='/src/tree/bin/dash/configure.ac?id=399db92745bcbaa8a9345eed26848d39dc3ea220'>tree</a> <a href='/src/commit/bin/dash/configure.ac?id=399db92745bcbaa8a9345eed26848d39dc3ea220&follow=1'>commit</a> <a href='/src/diff/bin/dash/configure.ac?id=399db92745bcbaa8a9345eed26848d39dc3ea220&follow=1'>diff</a></td><td class='form'><form class='right' method='get' action='/src/log/bin/dash/configure.ac'> <input type='hidden' name='id' value='399db92745bcbaa8a9345eed26848d39dc3ea220'/><select name='qt'> <option value='grep'>log msg</option> <option value='author'>author</option> <option value='committer'>committer</option> <option value='range'>range</option> </select> <input class='txt' type='search' size='10' name='q' value=''/> <input type='submit' value='search'/> </form> </td></tr></table> <div class='path'>path: <a href='/src/log/?id=399db92745bcbaa8a9345eed26848d39dc3ea220&follow=1'>root</a>/<a href='/src/log/bin?id=399db92745bcbaa8a9345eed26848d39dc3ea220&follow=1'>bin</a>/<a href='/src/log/bin/dash?id=399db92745bcbaa8a9345eed26848d39dc3ea220&follow=1'>dash</a>/<a href='/src/log/bin/dash/configure.ac?id=399db92745bcbaa8a9345eed26848d39dc3ea220&follow=1'>configure.ac</a> (<a href='/src/log/bin/dash/configure.ac?id=399db92745bcbaa8a9345eed26848d39dc3ea220'>unfollow</a>)</div><div class='content'><table class='list nowrap'><tr class='nohover'><th></th><th class='left'>Commit message (<a href='/src/log/bin/dash/configure.ac?id=399db92745bcbaa8a9345eed26848d39dc3ea220&showmsg=1&follow=1'>Expand</a>)</th><th class='left'>Author</th></tr> <tr><td><span title='2021-01-19 20:15:13 -0500'>2021-01-19</span></td><td><a href='/src/commit/bin/man1/hilex.1?id=f44f549f0caf9bcf41c68c9fdd694b36adace996&follow=1'>Support BSD make syntax and match *.am</a></td><td>June McEnroe</td></tr> <tr><td><span title='2021-01-19 19:40:31 -0500'>2021-01-19</span></td><td><a href='/src/commit/bin/make.l?id=5426534a897c735e3906788a94a5d61a3bd00701&follow=1'>Match tab following escaped newline in make assignments</a></td><td>June McEnroe</td></tr> <tr><td><span title='2021-01-18 21:33:21 -0500'>2021-01-18</span></td><td><a href='/src/commit/bin/man1/hilex.1?id=6c4a03e8fb0d6df2e244177500f4820efc6f7876&follow=1'>Allow matching lexers using first input line</a></td><td>June McEnroe