From 95ae2be15891eae0b62a83d1adcc8380548c9290 Mon Sep 17 00:00:00 2001 From: June McEnroe Date: Fri, 18 Dec 2020 22:59:41 -0500 Subject: Add scripts to download, compress and tag IETF RFCs --- rfc/.gitignore | 3 +++ rfc/Makefile | 11 +++++++++++ rfc/rfctags.pl | 26 ++++++++++++++++++++++++++ 3 files changed, 40 insertions(+) create mode 100644 rfc/.gitignore create mode 100644 rfc/Makefile create mode 100644 rfc/rfctags.pl diff --git a/rfc/.gitignore b/rfc/.gitignore new file mode 100644 index 00000000..808cd63e --- /dev/null +++ b/rfc/.gitignore @@ -0,0 +1,3 @@ +*.txt +*.txt.gz +tags diff --git a/rfc/Makefile b/rfc/Makefile new file mode 100644 index 00000000..ed89a4e4 --- /dev/null +++ b/rfc/Makefile @@ -0,0 +1,11 @@ +tags: rfctags.pl + perl rfctags.pl > $@ + +sync: + rsync -z ftp.rfc-editor.org::rfcs-text-only/'rfc[0-9]*.txt' . + +compress: + gzip -9f *.txt + +clean: + rm -f *.txt *.txt.gz tags diff --git a/rfc/rfctags.pl b/rfc/rfctags.pl new file mode 100644 index 00000000..cd3ba288 --- /dev/null +++ b/rfc/rfctags.pl @@ -0,0 +1,26 @@ +use strict; +use warnings; +use open ':encoding(ISO-8859-1)'; + +use IO::Uncompress::Gunzip qw($GunzipError); + +($,, $\) = ("\t", "\n"); +for my $rfc (<*.txt.gz>) { + my $handle = new IO::Uncompress::Gunzip $rfc + or die "${rfc}: ${GunzipError}"; + while (<$handle>) { + chomp; + # Section headings + if (/^([\d.]+|[A-Z][.])\s+([^\t]+)/) { + print $1, $rfc, $.; + print $2, $rfc, $.; + } + # References + if (/^\s*(\[[\w-]+\])\s{2,}/) { + print $1, $rfc, $.; + print "\\$1", $rfc, $.; # vim ^] prepends \ to [ + } + } + die "${rfc}: $!" if $!; + close $handle; +} -- cgit 1.4.1