summaryrefslogtreecommitdiff
path: root/ikiwiki
blob: 72b1021eca97a323bc14724f98c29cab8d285b3e (plain)
  1. #!/usr/bin/perl -T
  2. use warnings;
  3. use strict;
  4. use File::Find;
  5. use Memoize;
  6. use File::Spec;
  7. BEGIN {
  8. $blosxom::version="is a proper perl module too much to ask?";
  9. do "/usr/bin/markdown";
  10. }
  11. memoize('pagename');
  12. memoize('bestlink');
  13. sub usage {
  14. die "usage: ikiwiki [options] source dest\n";
  15. }
  16. my $link=qr/\[\[([^\s]+)\]\]/;
  17. my $verbose=0;
  18. my $rebuild=0;
  19. my $wikiname="wiki";
  20. if (grep /^-/, @ARGV) {
  21. eval {use Getopt::Long};
  22. GetOptions(
  23. "wikiname=s" => \$wikiname,
  24. "verbose|v" => \$verbose,
  25. "rebuild" => \$rebuild,
  26. ) || usage();
  27. }
  28. usage() unless @ARGV == 2;
  29. my ($srcdir) = shift =~ /(.*)/; # untaint
  30. my ($destdir) = shift =~ /(.*)/; # untaint
  31. my %links;
  32. my %oldlinks;
  33. my %oldpagemtime;
  34. my %renderedfiles;
  35. my %pagesources;
  36. sub error ($) {
  37. die @_;
  38. }
  39. sub debug ($) {
  40. print "@_\n" if $verbose;
  41. }
  42. sub mtime ($) {
  43. my $page=shift;
  44. return (stat($page))[9];
  45. }
  46. sub basename {
  47. my $file=shift;
  48. $file=~s!.*/!!;
  49. return $file;
  50. }
  51. sub dirname {
  52. my $file=shift;
  53. $file=~s!/?[^/]+$!!;
  54. return $file;
  55. }
  56. sub pagetype ($) {
  57. my $page=shift;
  58. if ($page =~ /\.mdwn$/) {
  59. return ".mdwn";
  60. }
  61. else {
  62. return "unknown";
  63. }
  64. }
  65. sub pagename ($) {
  66. my $file=shift;
  67. my $type=pagetype($file);
  68. my $page=$file;
  69. $page=~s/\Q$type\E*$// unless $type eq 'unknown';
  70. return $page;
  71. }
  72. sub htmlpage ($) {
  73. my $page=shift;
  74. return $page.".html";
  75. }
  76. sub readpage ($) {
  77. my $page=shift;
  78. local $/=undef;
  79. open (PAGE, "$srcdir/$page") || error("failed to read $page: $!");
  80. my $ret=<PAGE>;
  81. close PAGE;
  82. return $ret;
  83. }
  84. sub writepage ($$) {
  85. my $page=shift;
  86. my $content=shift;
  87. my $dir=dirname("$destdir/$page");
  88. if (! -d $dir) {
  89. my $d="";
  90. foreach my $s (split(m!/+!, $dir)) {
  91. $d.="$s/";
  92. if (! -d $d) {
  93. mkdir($d) || error("failed to create directory $d: $!");
  94. }
  95. }
  96. }
  97. open (PAGE, ">$destdir/$page") || error("failed to write $page: $!");
  98. print PAGE $content;
  99. close PAGE;
  100. }
  101. sub findlinks {
  102. my $content=shift;
  103. my @links;
  104. while ($content =~ /$link/g) {
  105. push @links, lc($1);
  106. }
  107. return @links;
  108. }
  109. # Given a page and the text of a link on the page, determine which existing
  110. # page that link best points to. Prefers pages under a subdirectory with
  111. # the same name as the source page, failing that goes down the directory tree
  112. # to the base looking for matching pages.
  113. sub bestlink ($$) {
  114. my $page=shift;
  115. my $link=lc(shift);
  116. my $cwd=$page;
  117. do {
  118. my $l=$cwd;
  119. $l.="/" if length $l;
  120. $l.=$link;
  121. if (exists $links{$l}) {
  122. #debug("for $page, \"$link\", use $l");
  123. return $l;
  124. }
  125. } while $cwd=~s!/?[^/]+$!!;
  126. #print STDERR "warning: page $page, broken link: $link\n";
  127. return "";
  128. }
  129. sub isinlinableimage ($) {
  130. my $file=shift;
  131. $file=~/\.(png|gif|jpg|jpeg)$/;
  132. }
  133. sub htmllink ($$) {
  134. my $page=shift;
  135. my $link=shift;
  136. my $bestlink=bestlink($page, $link);
  137. return $link if $page eq $bestlink;
  138. # TODO BUG: %renderedfiles may not have it, if the linked to page
  139. # was also added and isn't yet rendered! Note that this bug is
  140. # masked by the bug mentioned below that makes all new files
  141. # be rendered twice.
  142. if (! grep { $_ eq $bestlink } values %renderedfiles) {
  143. $bestlink=htmlpage($bestlink);
  144. }
  145. if (! grep { $_ eq $bestlink } values %renderedfiles) {
  146. return "<a href=\"?\">?</a>$link"
  147. }
  148. $bestlink=File::Spec->abs2rel($bestlink, dirname($page));
  149. if (isinlinableimage($bestlink)) {
  150. return "<img src=\"$bestlink\">";
  151. }
  152. return "<a href=\"$bestlink\">$link</a>";
  153. }
  154. sub linkify ($$) {
  155. my $content=shift;
  156. my $file=shift;
  157. $content =~ s/$link/htmllink(pagename($file), $1)/eg;
  158. return $content;
  159. }
  160. sub htmlize ($$) {
  161. my $type=shift;
  162. my $content=shift;
  163. if ($type eq '.mdwn') {
  164. return Markdown::Markdown($content);
  165. }
  166. else {
  167. error("htmlization of $type not supported");
  168. }
  169. }
  170. sub linkbacks ($$) {
  171. my $content=shift;
  172. my $page=shift;
  173. my @links;
  174. foreach my $p (keys %links) {
  175. next if bestlink($page, $p) eq $page;
  176. if (grep { length $_ && bestlink($p, $_) eq $page } @{$links{$p}}) {
  177. my $href=File::Spec->abs2rel(htmlpage($p), dirname($page));
  178. # Trim common dir prefixes from both pages.
  179. my $p_trimmed=$p;
  180. my $page_trimmed=$page;
  181. my $dir;
  182. 1 while (($dir)=$page_trimmed=~m!^([^/]+/)!) &&
  183. defined $dir &&
  184. $p_trimmed=~s/^\Q$dir\E// &&
  185. $page_trimmed=~s/^\Q$dir\E//;
  186. push @links, "<a href=\"$href\">$p_trimmed</a>";
  187. }
  188. }
  189. $content.="<hr><p>Links: ".join(" ", sort @links)."</p>\n" if @links;
  190. return $content;
  191. }
  192. sub finalize ($$) {
  193. my $content=shift;
  194. my $page=shift;
  195. my $title=basename($page);
  196. $title=~s/_/ /g;
  197. my $pagelink="";
  198. my $path="";
  199. foreach my $dir (reverse split("/", $page)) {
  200. if (length($pagelink)) {
  201. $pagelink="<a href=\"$path$dir.html\">$dir</a>/ $pagelink";
  202. }
  203. else {
  204. $pagelink=$dir;
  205. }
  206. $path.="../";
  207. }
  208. $path=~s/\.\.\/$/index.html/;
  209. $pagelink="<a href=\"$path\">$wikiname</a>/ $pagelink";
  210. $content="<html>\n<head><title>$title</title></head>\n<body>\n".
  211. "<h1>$pagelink</h1>\n".
  212. $content.
  213. "</body>\n</html>\n";
  214. return $content;
  215. }
  216. sub render ($) {
  217. my $file=shift;
  218. my $type=pagetype($file);
  219. my $content=readpage($file);
  220. if ($type ne 'unknown') {
  221. my $page=pagename($file);
  222. $links{$page}=[findlinks($content)];
  223. $content=linkify($content, $file);
  224. $content=htmlize($type, $content);
  225. $content=linkbacks($content, $page);
  226. $content=finalize($content, $page);
  227. writepage(htmlpage($page), $content);
  228. $oldpagemtime{$page}=time;
  229. $renderedfiles{$page}=htmlpage($page);
  230. }
  231. else {
  232. $links{$file}=[];
  233. writepage($file, $content);
  234. $oldpagemtime{$file}=time;
  235. $renderedfiles{$file}=$file;
  236. }
  237. }
  238. sub loadindex () {
  239. open (IN, "$srcdir/.index") || return;
  240. while (<IN>) {
  241. ($_)=/(.*)/; # untaint
  242. chomp;
  243. my ($mtime, $file, $rendered, @links)=split(' ', $_);
  244. my $page=pagename($file);
  245. $pagesources{$page}=$file;
  246. $oldpagemtime{$page}=$mtime;
  247. $oldlinks{$page}=[@links];
  248. $links{$page}=[@links];
  249. $renderedfiles{$page}=$rendered;
  250. }
  251. close IN;
  252. }
  253. sub saveindex () {
  254. open (OUT, ">$srcdir/.index") || error("cannot write to .index: $!");
  255. foreach my $page (keys %oldpagemtime) {
  256. print OUT "$oldpagemtime{$page} $pagesources{$page} $renderedfiles{$page} ".
  257. join(" ", @{$links{$page}})."\n"
  258. if $oldpagemtime{$page};
  259. }
  260. close OUT;
  261. }
  262. sub prune ($) {
  263. my $file=shift;
  264. unlink($file);
  265. my $dir=dirname($file);
  266. while (rmdir($dir)) {
  267. $dir=dirname($dir);
  268. }
  269. }
  270. sub refresh () {
  271. # Find existing pages.
  272. my %exists;
  273. my @files;
  274. find({
  275. no_chdir => 1,
  276. wanted => sub {
  277. if (/\/\.svn\//) {
  278. $File::Find::prune=1;
  279. }
  280. elsif (! -d $_ && ! /\.html$/ && ! /\/\./) {
  281. my ($f)=/(^[-A-Za-z0-9_.:\/+]+$)/; # untaint
  282. if (! defined $f) {
  283. warn("skipping bad filename $_\n");
  284. }
  285. else {
  286. $f=~s/^\Q$srcdir\E\/?//;
  287. push @files, $f;
  288. $exists{pagename($f)}=1;
  289. }
  290. }
  291. },
  292. }, $srcdir);
  293. my %rendered;
  294. # check for added or removed pages
  295. my @add;
  296. foreach my $file (@files) {
  297. my $page=pagename($file);
  298. if (! $oldpagemtime{$page}) {
  299. debug("new page $page");
  300. push @add, $file;
  301. $links{$page}=[];
  302. $pagesources{$page}=$file;
  303. }
  304. }
  305. my @del;
  306. foreach my $page (keys %oldpagemtime) {
  307. if (! $exists{$page}) {
  308. debug("removing old page $page");
  309. push @del, $renderedfiles{$page};
  310. prune($destdir."/".$renderedfiles{$page});
  311. delete $renderedfiles{$page};
  312. $oldpagemtime{$page}=0;
  313. delete $pagesources{$page};
  314. }
  315. }
  316. # render any updated files
  317. foreach my $file (@files) {
  318. my $page=pagename($file);
  319. if (! exists $oldpagemtime{$page} ||
  320. mtime("$srcdir/$file") > $oldpagemtime{$page}) {
  321. debug("rendering changed file $file");
  322. render($file);
  323. $rendered{$file}=1;
  324. }
  325. }
  326. # if any files were added or removed, check to see if each page
  327. # needs an update due to linking to them
  328. # TODO: inefficient; pages may get rendered above and again here;
  329. # problem is the bestlink may have changed and we won't know until
  330. # now
  331. if (@add || @del) {
  332. FILE: foreach my $file (@files) {
  333. my $page=pagename($file);
  334. foreach my $f (@add, @del) {
  335. my $p=pagename($f);
  336. foreach my $link (@{$links{$page}}) {
  337. if (bestlink($page, $link) eq $p) {
  338. debug("rendering $file, which links to $p");
  339. render($file);
  340. $rendered{$file}=1;
  341. next FILE;
  342. }
  343. }
  344. }
  345. }
  346. }
  347. # handle linkbacks; if a page has added/removed links, update the
  348. # pages it links to
  349. # TODO: inefficient; pages may get rendered above and again here;
  350. # problem is the linkbacks could be wrong in the first pass render
  351. # above
  352. if (%rendered) {
  353. my %linkchanged;
  354. foreach my $file (keys %rendered, @del) {
  355. my $page=pagename($file);
  356. if (exists $links{$page}) {
  357. foreach my $link (@{$links{$page}}) {
  358. $link=bestlink($page, $link);
  359. if (length $link &&
  360. ! exists $oldlinks{$page} ||
  361. ! grep { $_ eq $link } @{$oldlinks{$page}}) {
  362. $linkchanged{$link}=1;
  363. }
  364. }
  365. }
  366. if (exists $oldlinks{$page}) {
  367. foreach my $link (@{$oldlinks{$page}}) {
  368. $link=bestlink($page, $link);
  369. if (length $link &&
  370. ! exists $links{$page} ||
  371. ! grep { $_ eq $link } @{$links{$page}}) {
  372. $linkchanged{$link}=1;
  373. }
  374. }
  375. }
  376. }
  377. foreach my $link (keys %linkchanged) {
  378. my $linkfile=$pagesources{$link};
  379. if (defined $linkfile) {
  380. debug("rendering $linkfile, to update its linkbacks");
  381. render($linkfile);
  382. }
  383. }
  384. }
  385. }
  386. loadindex() unless $rebuild;
  387. refresh();
  388. saveindex();