From 4d3abe74035d7d3c2c5d6927cc0cbb9032486b30 Mon Sep 17 00:00:00 2001
From: Jonas Smedegaard
Date: Fri, 31 Aug 2012 15:12:31 +0200
Subject: Add tidying scripts.
---
report/normalize-html.pl | 29 +++++++++++++++++++++++++++++
1 file changed, 29 insertions(+)
create mode 100755 report/normalize-html.pl
(limited to 'report/normalize-html.pl')
diff --git a/report/normalize-html.pl b/report/normalize-html.pl
new file mode 100755
index 0000000..7245a4e
--- /dev/null
+++ b/report/normalize-html.pl
@@ -0,0 +1,29 @@
+#!/usr/bin/perl
+
+use File::Slurp;
+
+local $_ = read_file( $ARGV[0] ); # slurp the file named by the first argument into $_, the implicit target of every s/// below ("my $_" no longer compiles since Perl 5.24)
+
+#s!( )! !g; # filler horisontal space
+s!( )+! !g; # filler horisontal space
+#s!(\s*
\s*)+!
!g; # filler vertical space
+s!(\s*
\s*)+!
!g; # filler vertical space
+s,
(?=(?:)?
),,ig; # filler horizontal space
+s,\s*
,,ig; # filler horizontal space
+s!\s*\s*\s*!!g; # filler vertical space
+s!!!gi; # page dividers
+#s!]+>\K
(.+?)!$1
!i; # H1
+#s!
(.+?)!$1
!i; # H1
+s!\.(ft\d+){font\-size:52px;.*?\K]*\bclass="\1"[^>]*>(.*?)
!$2
!is;
+s!\.(ft\d+){font\-size:19px;.*?\K]*\bclass="\1"[^>]*>(.*?)
!$2
!isg;
+s!\.(ft\d+){font\-size:16px;.*?\K]*\bclass="\1"[^>]*>(.*?)
!$2
!isg;
+s!]*>([^<\s][^<]*?)
!$1
!isg;
+s,]*>(?!),
,isg;
+s,,,isg;
+s,,,isg;
+s,