#!/usr/bin/perl

# extract and decode mediawiki content from HTML source view
#
# Usage: mediawiki-extract INFILE [OUTFILE]
#
# Reads INFILE as UTF-8 HTML, keeps only the text found inside the
# <textarea> element, decodes the HTML entities in that text, and writes
# the result as UTF-8 to OUTFILE.  When OUTFILE is omitted (or is a false
# value such as the empty string), INFILE is overwritten in place.
#
# Provenance: commit 6f98b4dfb2b80e3eb3072dd3f140351581746db2 by
# Jonas Smedegaard, 2014-12-30, "Move mediawiki tweaks to separate scripts."
#
# NOTE(review): the two substitutions and the decode step below were
# reconstructed from a copy of the patch in which everything between "<"
# and ">" had been stripped -- confirm against the upstream repository.

use warnings;
use strict;

use Path::Tiny;
use HTML::Entities;

my $infile = shift;

# Fail early with a readable message rather than letting Path::Tiny
# complain about an undefined path.
die "Usage: $0 INFILE [OUTFILE]\n"
    unless defined $infile && length $infile;

my $outfile = shift || $infile;

my $content = path($infile)->slurp_utf8;

# Drop everything up to and including the opening <textarea ...> tag.
# With /s the greedy .* also spans newlines, so if the document holds
# several such tags the last one is the one that is kept.
$content =~ s!.*<textarea[^>]*>!!s;

# Drop the closing tag and everything that follows it.
$content =~ s!</textarea.*!!s;

# Turn HTML entities in the extracted text back into plain characters.
$content = decode_entities($content);

path($outfile)->spew_utf8($content);

1;