summaryrefslogtreecommitdiff
path: root/IkiWiki/Render.pm
blob: e863141070b802db6b2f824c65fe0ca9e8afe1e5 (plain)
  1. #!/usr/bin/perl
  2. package IkiWiki;
  3. use warnings;
  4. use strict;
  5. use IkiWiki;
  6. use Encode;
  # Link bookkeeping shared by the subs in this file.
  # %backlinks: resolved target page => { linking page => 1 }.
  my %backlinks;
  # %rendered: source file => 1 once render() has handled it in this run.
  my %rendered;
  # %brokenlinks: link text that resolves to no page => list of pages using it.
  our %brokenlinks;
  # True once calculate_links() has populated the two link tables.
  my $links_calculated = 0;
  # Populate %backlinks and %brokenlinks from %links.  Runs at most once;
  # later calls return immediately.
  sub calculate_links () {
      return if $links_calculated;

      %brokenlinks = ();
      %backlinks   = ();
      for my $source (keys %links) {
          for my $text (@{ $links{$source} }) {
              my $target = bestlink($source, $text);
              unless (length $target) {
                  # The link text resolves to no page at all.
                  push @{ $brokenlinks{$text} }, $source;
                  next;
              }
              # A page linking to itself is not recorded as a backlink.
              next if $target eq $source;
              $backlinks{$target}{$source} = 1;
          }
      }
      $links_calculated = 1;
  }
  # Return the names of the pages that link to $page, making sure the
  # backlink table has been calculated first.
  sub backlink_pages ($) {
      my ($page) = @_;

      calculate_links();

      return keys %{ $backlinks{$page} };
  }
  # Return a list of { url => ..., page => ... } hashes, one for each page
  # that links to $page.  The displayed page title has any leading directory
  # components it shares with $page stripped off.
  sub backlinks ($) {
      my ($page) = @_;

      my @result;
      for my $linker (backlink_pages($page)) {
          my $url = urlto($linker, $page);

          # Trim common dir prefixes from both pages.
          my ($linker_rest, $page_rest) = ($linker, $page);
          while ($page_rest =~ m!^([^/]+/)!) {
              my $prefix = $1;
              # Stop at the first directory the two pages do not share.
              last unless $linker_rest =~ s/^\Q$prefix\E//;
              $page_rest =~ s/^\Q$prefix\E//;
          }

          push @result, { url => $url, page => pagetitle($linker_rest) };
      }

      return @result;
  }
  # Wrap already-htmlized $content for $page in the page template and
  # return the final output, after running the pagetemplate, postscan and
  # format hooks.
  sub genpage ($$) {
      my ($page, $content) = @_;

      # The first templatefile hook that names an existing template wins.
      my $chosen;
      run_hooks(templatefile => sub {
          return if defined $chosen;
          my $candidate = shift->(page => $page);
          if (defined $candidate && defined template_file($candidate)) {
              $chosen = $candidate;
          }
      });
      my $template = template(
          defined $chosen ? $chosen : 'page.tmpl',
          blind_cache => 1,
      );

      # Count the action links so the template knows whether to show any.
      my $actions = 0;

      if (length $config{cgiurl}) {
          if (IkiWiki->can("cgi_editpage")) {
              $template->param(editurl => cgiurl(do => "edit", page => $page));
          }
          if (exists $hooks{auth}) {
              $template->param(prefsurl => cgiurl(do => "prefs"));
          }
          $actions++;
      }

      my $historyurl = $config{historyurl};
      if (defined $historyurl && length $historyurl) {
          $historyurl =~ s/\[\[file\]\]/$pagesources{$page}/g;
          $template->param(historyurl => $historyurl);
          $actions++;
      }

      # No discussion link on a discussion page itself; otherwise offer it
      # when the page can be created via CGI or is already linked.
      if ($config{discussion} &&
          $page !~ /.*\/\Q$config{discussionpage}\E$/ &&
          (length $config{cgiurl} ||
           exists $links{$page."/".$config{discussionpage}})) {
          $template->param(discussionlink => htmllink($page, $page, $config{discussionpage}, noimageinline => 1, forcesubpage => 1));
          $actions++;
      }

      $template->param(have_actions => 1) if $actions;

      # Split the sorted backlinks into the visible part and the overflow;
      # a false numbacklinks means "show them all".
      my @sorted = sort { $a->{page} cmp $b->{page} } backlinks($page);
      my ($shown, $overflow);
      if (@sorted > $config{numbacklinks} && $config{numbacklinks}) {
          my $limit = $config{numbacklinks};
          $shown    = [ @sorted[0 .. $limit - 1] ];
          $overflow = [ @sorted[$limit .. $#sorted] ];
      }
      else {
          $shown    = \@sorted;
          $overflow = [];
      }

      $template->param(
          title => $page eq 'index'
              ? $config{wikiname}
              : pagetitle(basename($page)),
          wikiname => $config{wikiname},
          content => $content,
          backlinks => $shown,
          more_backlinks => $overflow,
          mtime => displaytime($pagemtime{$page}),
          ctime => displaytime($pagectime{$page}),
          baseurl => baseurl($page),
      );

      run_hooks(pagetemplate => sub {
          shift->(page => $page, destpage => $page, template => $template);
      });

      $content = $template->output;

      run_hooks(postscan => sub {
          shift->(page => $page, content => $content);
      });

      # Each format hook receives the output of the previous one.
      run_hooks(format => sub {
          $content = shift->(
              page => $page,
              content => $content,
          );
      });

      return $content;
  }
  # Scan source file $file: register what it will render and, for files
  # with a page type, reset and re-collect the page's links via the scan
  # hooks and a scan-only preprocess pass.
  sub scan ($) {
      my ($file) = @_;

      debug(sprintf(gettext("scanning %s"), $file));

      my $type = pagetype($file);
      if (! defined $type) {
          # Not a page: it is rendered under its own name.
          will_render($file, $file, 1);
      }
      else {
          my $srcfile = srcfile($file);
          my $content = readfile($srcfile);
          my $page = pagename($file);
          will_render($page, htmlpage($page), 1);

          # Discussion links are a special case since they're
          # not in the text of the page, but on its template.
          $links{$page} = $config{discussion}
              ? [ $page."/".lc($config{discussionpage}) ]
              : [];

          run_hooks(scan => sub {
              shift->(
                  page => $page,
                  content => $content,
              );
          });

          # Preprocess in scan-only mode.
          preprocess($page, $page, $content, 1);
      }
  }
  # Copy everything readable from $srcfd to $destfd in 16 KiB blocks using
  # unbuffered sysread/syswrite.
  #
  # Arguments: source file name, destination file name (both used only in
  # error messages), source handle, destination handle, and a cleanup value
  # that is passed through to error() on failure.
  #
  # A failed read or write is reported through error(); reads and writes
  # interrupted by a signal (EINTR) are retried.
  sub fast_file_copy (@) {
      my ($srcfile, $destfile, $srcfd, $destfd, $cleanup) = @_;

      my $blksize = 16384;
      my $buf;

      while (1) {
          my $len = sysread $srcfd, $buf, $blksize;

          # sysread returns undef on error and 0 at end of file.  These
          # must be told apart explicitly: testing the value for truth
          # would treat a read error as a normal end of file.
          if (! defined $len) {
              next if $!{EINTR};
              error("failed to read $srcfile: $!", $cleanup);
              # NOTE(review): error() is expected to die; stop regardless.
              return;
          }
          last if $len == 0;

          # syswrite may write less than requested, so keep going until
          # the whole block is out.
          my $offset = 0;
          while ($len) {
              my $written = syswrite $destfd, $buf, $len, $offset;
              if (! defined $written) {
                  next if $!{EINTR};
                  error("failed to write $destfile: $!", $cleanup);
                  return;
              }
              $len -= $written;
              $offset += $written;
          }
      }

      return;
  }
  # Render source file $file into the destination directory unless it has
  # already been rendered in this run.  The second argument is the message
  # passed to debug().  Pages go through filter, preprocess, linkify and
  # htmlize before genpage(); other files are hardlinked or copied.
  sub render ($$) {
      my $file = shift;
      return if $rendered{$file};
      debug(shift);
      $rendered{$file} = 1;

      my $type = pagetype($file);
      my $srcfile = srcfile($file);

      if (defined $type) {
          my $page = pagename($file);

          # Dependencies are re-registered while the page is rebuilt.
          delete $depends{$page};
          delete $depends_simple{$page};
          will_render($page, htmlpage($page), 1);

          # Types starting with an underscore produce no output file.
          return if $type =~ /^_/;

          my $content = htmlize($page, $page, $type,
              linkify($page, $page,
              preprocess($page, $page,
              filter($page, $page,
              readfile($srcfile)))));

          my $output = htmlpage($page);
          writefile($output, $config{destdir}, genpage($page, $content));
      }
      else {
          delete $depends{$file};
          delete $depends_simple{$file};
          will_render($file, $file, 1);

          if ($config{hardlink}) {
              # only hardlink if owned by same user
              my $owner = (stat($srcfile))[4];
              if ($owner == $>) {
                  my $dest = $config{destdir}."/".$file;
                  prep_writefile($file, $config{destdir});
                  unlink($dest);
                  return if link($srcfile, $dest);
              }
              # if hardlink fails, fall back to copying
          }

          my $srcfd = readfile($srcfile, 1, 1);
          writefile($file, $config{destdir}, undef, 1, sub {
              fast_file_copy($srcfile, $file, $srcfd, @_);
          });
      }
  }
  # Delete $file, then remove its parent directories from the innermost
  # outwards until an rmdir fails.
  sub prune ($) {
      my ($file) = @_;

      unlink($file);

      my $dir = dirname($file);
      $dir = dirname($dir) while rmdir($dir);
  }
  # Security check: report an error if any component of the srcdir path is
  # a symlink, unless allow_symlinks_before_srcdir is set.
  sub srcdir_check () {
      my $path = $config{srcdir};

      while (length $path) {
          error(sprintf(gettext("symlink found in srcdir path (%s) -- set allow_symlinks_before_srcdir to allow this"), $path))
              if -l $path && ! $config{allow_symlinks_before_srcdir};

          # Strip trailing slashes first; only when there were none does
          # the path move up one directory level.
          next if $path =~ s/\/+$//;
          $path = dirname($path);
      }
  }
  # Walk the srcdir and then every underlay directory, collecting source
  # files.  Returns (\@files, \%pages): file names relative to the directory
  # they were found in, and the set of page names they map to.  Symlinks,
  # directories and pruned files are skipped.
  sub find_src_files () {
      my (@files, %pages);

      eval q{use File::Find};
      error($@) if $@;

      find({
          no_chdir => 1,
          wanted => sub {
              $_ = decode_utf8($_);
              if (file_pruned($_, $config{srcdir})) {
                  $File::Find::prune = 1;
                  return;
              }
              return if -l $_ || -d _;

              my ($f) = /$config{wiki_file_regexp}/; # untaint
              unless (defined $f) {
                  warn(sprintf(gettext("skipping bad filename %s"), $_)."\n");
                  return;
              }

              $f =~ s/^\Q$config{srcdir}\E\/?//;
              push @files, $f;

              my $page = pagename($f);
              debug(sprintf(gettext("%s has multiple possible source pages"), $page))
                  if $pages{$page};
              $pages{$page} = 1;
          },
      }, $config{srcdir});

      foreach my $dir (@{$config{underlaydirs}}, $config{underlaydir}) {
          find({
              no_chdir => 1,
              wanted => sub {
                  $_ = decode_utf8($_);
                  if (file_pruned($_, $dir)) {
                      $File::Find::prune = 1;
                      return;
                  }
                  return if -l $_ || -d _;

                  my ($f) = /$config{wiki_file_regexp}/; # untaint
                  unless (defined $f) {
                      warn(sprintf(gettext("skipping bad filename %s"), $_)."\n");
                      return;
                  }

                  $f =~ s/^\Q$dir\E\/?//;

                  # avoid underlaydir override attacks; see security.mdwn
                  return if -l "$config{srcdir}/$f" || -e _;

                  # A page already found earlier takes precedence.
                  my $page = pagename($f);
                  return if $pages{$page};
                  push @files, $f;
                  $pages{$page} = 1;
              },
          }, $dir);
      };

      return \@files, \%pages;
  }
  # Register every file in @$files in %pagesources and work out which ones
  # are new (have no recorded mtime).  Returns (\@new, \@internal_new).
  # New pages also get a %pagecase entry and an initial creation time.
  sub find_new_files ($) {
      my ($files) = @_;

      my (@new, @internal_new);
      for my $file (@$files) {
          my $page = pagename($file);

          # the page has changed its type
          $forcerebuild{$page} = 1
              if exists $pagesources{$page} && $pagesources{$page} ne $file;
          $pagesources{$page} = $file;

          # A true recorded mtime means the page is already known.
          next if $pagemtime{$page};

          if (isinternal($page)) {
              push @internal_new, $file;
          }
          else {
              push @new, $file;
              if ($config{getctime} && -e "$config{srcdir}/$file") {
                  # A failure to get the time from the RCS is reported
                  # but is not fatal.
                  eval {
                      my $time = rcs_getctime("$config{srcdir}/$file");
                      $pagectime{$page} = $time;
                  };
                  print STDERR $@ if $@;
              }
          }

          $pagecase{lc $page} = $page;
          $pagectime{$page} = (srcfile_stat($file))[10]
              unless exists $pagectime{$page};
      }

      return \@new, \@internal_new;
  }
  # Find pages with a recorded mtime that are no longer in %$pages, prune
  # their old output files and reset their state.  Returns
  # (\@del, \@internal_del), the lists of the removed pages' source files.
  sub find_del_files ($) {
      my ($pages) = @_;

      my (@del, @internal_del);
      for my $page (keys %pagemtime) {
          next if $pages->{$page};

          if (isinternal($page)) {
              push @internal_del, $pagesources{$page};
          }
          else {
              debug(sprintf(gettext("removing old page %s"), $page));
              push @del, $pagesources{$page};
          }

          $links{$page} = [];
          $renderedfiles{$page} = [];
          $pagemtime{$page} = 0;

          foreach my $old (@{$oldrenderedfiles{$page}}) {
              prune($config{destdir}."/".$old);
          }

          delete $pagesources{$page};

          # Forget every destination file that this page produced.
          delete @destsources{
              grep { $destsources{$_} eq $page } keys %destsources
          };
      }

      return \@del, \@internal_del;
  }
  # Find the files in @$files whose page is unknown, has a newer mtime than
  # recorded, or is flagged in %forcerebuild.  Records the new mtime and
  # returns (\@changed, \@internal_changed).
  sub find_changed ($) {
      my ($files) = @_;

      my (@changed, @internal_changed);
      for my $file (@$files) {
          my $page = pagename($file);
          my ($srcfile, @stat) = srcfile_stat($file);
          my $mtime = $stat[9];

          next unless ! exists $pagemtime{$page}
              || $mtime > $pagemtime{$page}
              || $forcerebuild{$page};

          $pagemtime{$page} = $mtime;

          if (isinternal($page)) {
              # Preprocess internal page in scan-only mode.
              preprocess($page, $page, readfile($srcfile), 1);
              push @internal_changed, $file;
          }
          else {
              push @changed, $file;
          }
      }

      return \@changed, \@internal_changed;
  }
  # For each changed or deleted file, record what every link in %oldlinks
  # for its page currently resolves to.  Returns a hash ref of the form
  # { page => { link text => bestlink result } }.
  sub calculate_old_links ($$) {
      my ($changed, $del) = @_;

      my %targets_of;
      for my $file (@$changed, @$del) {
          my $page = pagename($file);
          next unless exists $oldlinks{$page};

          for my $text (@{ $oldlinks{$page} }) {
              $targets_of{$page}{$text} = bestlink($page, $text);
          }
      }

      return \%targets_of;
  }
  # Drop the dependency and rendered-file records of the page that
  # internal source file $file maps to.
  sub derender_internal ($) {
      my ($file) = @_;
      my $page = pagename($file);

      delete $depends{$page};
      delete $depends_simple{$page};

      delete $destsources{$_} for @{ $renderedfiles{$page} };
      $renderedfiles{$page} = [];
  }
  # Render every page recorded in %backlinks as linking to the page that
  # file $f maps to.
  sub render_linkers ($) {
      my ($f) = @_;
      my $target = pagename($f);

      for my $linker (keys %{ $backlinks{$target} }) {
          my $src = $pagesources{$linker};
          render($src, sprintf(gettext("building %s, which links to %s"), $src, $target));
      }
  }
  # For every source rendered in this run, prune the destination files
  # listed in %oldrenderedfiles that %renderedfiles no longer lists.
  sub remove_unrendered () {
      for my $src (keys %rendered) {
          my $page = pagename($src);

          for my $old (@{ $oldrenderedfiles{$page} }) {
              next if grep { $_ eq $old } @{$renderedfiles{$page}};

              debug(sprintf(gettext("removing %s, no longer built by %s"), $old, $page));
              prune($config{destdir}."/".$old);
          }
      }
  }
  # Compare the current links of every changed or deleted page against the
  # link targets recorded before the change.
  #
  # Arguments: array ref of changed files, array ref of deleted files, and
  # the hash ref built by calculate_old_links
  # ({ page => { link text => old target page } }), which is consumed
  # (entries are deleted) as links are matched up.
  #
  # Returns two hash refs:
  #   \%backlinkchanged - pages whose set of backlinks changed
  #   \%linkchangers    - lowercased names of pages whose links changed
  sub calculate_changed_links ($$$) {
      my ($changed, $del, $oldlink_targets) = @_;

      my (%backlinkchanged, %linkchangers);
      foreach my $file (@$changed, @$del) {
          my $page = pagename($file);

          if (exists $links{$page}) {
              foreach my $l (@{$links{$page}}) {
                  my $target = bestlink($page, $l);
                  if (! exists $oldlink_targets->{$page}{$l} ||
                      $target ne $oldlink_targets->{$page}{$l}) {
                      # Key by the resolved target page, not the raw link
                      # text: render_backlinks looks the keys up in
                      # %pagesources, which is indexed by page name.  A
                      # link that resolves nowhere has no page to rebuild.
                      $backlinkchanged{$target} = 1 if length $target;
                      $linkchangers{lc($page)} = 1;
                  }
                  delete $oldlink_targets->{$page}{$l};
              }
          }

          # Whatever is left are links the page used to have and no longer
          # does; the pages they pointed at (the hash values) lose a
          # backlink.
          if (exists $oldlink_targets->{$page} &&
              %{$oldlink_targets->{$page}}) {
              foreach my $target (values %{$oldlink_targets->{$page}}) {
                  $backlinkchanged{$target} = 1 if length $target;
              }
              $linkchangers{lc($page)} = 1;
          }
      }

      return \%backlinkchanged, \%linkchangers;
  }
  # Find the first not-yet-rendered file whose dependencies are affected by
  # this run's changes, render it, and return 1.  Returns 0 when no such
  # file is left, so callers can loop until nothing more needs rebuilding.
  #
  # Arguments (all array refs except the last): all source files, new
  # files, new internal files, deleted files, deleted internal files,
  # changed internal files, and a hash ref of lowercased page names whose
  # links changed.
  sub render_dependent ($$$$$$$) {
      my ($files, $new, $internal_new, $del, $internal_del,
          $internal_changed, $linkchangers) = @_;

      # Content changes: everything rendered so far plus deletions.
      # Presence changes: only additions and deletions.
      my @changed = (keys %rendered, @$del);
      my @exists_changed = (@$new, @$del);

      my %lc_changed = map { lc(pagename($_)) => 1 } @changed;
      my %lc_exists_changed = map { lc(pagename($_)) => 1 } @exists_changed;

      foreach my $f (@$files) {
          next if $rendered{$f};
          my $p = pagename($f);
          my $reason = undef;

          # Simple dependencies name a single page and can be checked with
          # plain hash lookups.
          if (exists $depends_simple{$p}) {
              foreach my $d (keys %{$depends_simple{$p}}) {
                  if (($depends_simple{$p}{$d} & $IkiWiki::DEPEND_CONTENT &&
                       $lc_changed{$d})
                      ||
                      ($depends_simple{$p}{$d} & $IkiWiki::DEPEND_PRESENCE &&
                       $lc_exists_changed{$d})
                      ||
                      ($depends_simple{$p}{$d} & $IkiWiki::DEPEND_LINKS &&
                       $linkchangers->{$d})
                  ) {
                      $reason = $d;
                      last;
                  }
              }
          }

          # Pagespec dependencies have to be matched against each
          # candidate file in turn.
          if (exists $depends{$p} && ! defined $reason) {
              D: foreach my $d (keys %{$depends{$p}}) {
                  my $sub = pagespec_translate($d);
                  next if $@ || ! defined $sub;

                  # only consider internal files
                  # if the page explicitly depends
                  # on such files
                  my $internal_dep = $d =~ /internal\(/;

                  my @candidates;
                  if ($depends{$p}{$d} & $IkiWiki::DEPEND_PRESENCE) {
                      @candidates = @exists_changed;
                      push @candidates, @$internal_new, @$internal_del
                          if $internal_dep;
                  }
                  if (($depends{$p}{$d} & ($IkiWiki::DEPEND_CONTENT | $IkiWiki::DEPEND_LINKS))) {
                      @candidates = @changed;
                      push @candidates, @$internal_new, @$internal_del, @$internal_changed
                          if $internal_dep;
                  }

                  foreach my $file (@candidates) {
                      next if $file eq $f;
                      my $page = pagename($file);
                      if ($sub->($page, location => $p)) {
                          # A links-only dependency is affected only when
                          # the matched page's links changed.  The
                          # parentheses matter: "!" binds tighter than "&",
                          # so without them the test is always false.
                          if ($depends{$p}{$d} & $IkiWiki::DEPEND_LINKS &&
                              ! ($depends{$p}{$d} & $IkiWiki::DEPEND_CONTENT)) {
                              next unless $linkchangers->{lc($page)};
                          }
                          $reason = $page;
                          last D;
                      }
                  }
              }
          }

          if (defined $reason) {
              render($f, sprintf(gettext("building %s, which depends on %s"), $f, $reason));
              return 1;
          }
      }

      return 0;
  }
  # Render each page named as a key of %$backlinkchanged that has a known
  # source file, so that its backlinks are brought up to date.
  sub render_backlinks ($) {
      my ($backlinkchanged) = @_;

      for my $link (keys %$backlinkchanged) {
          my $src = $pagesources{$link};
          next unless defined $src;
          render($src, sprintf(gettext("building %s, to update its backlinks"), $src));
      }
  }
  # Bring the rendered wiki up to date: find new, deleted and changed
  # sources, scan and render the changed ones, then rebuild whatever links
  # to or depends on them, and finally run the delete and change hooks.
  sub refresh () {
      srcdir_check();
      run_hooks(refresh => sub { shift->() });

      # Work out what happened to the source files since the last run.
      my ($files, $pages) = find_src_files();
      my ($new, $internal_new) = find_new_files($files);
      my ($del, $internal_del) = find_del_files($pages);
      my ($changed, $internal_changed) = find_changed($files);
      run_hooks(needsbuild => sub { shift->($changed) });

      # Old link targets must be captured before scanning replaces %links.
      my $oldlink_targets = calculate_old_links($changed, $del);

      scan($_) for @$changed;
      calculate_links();

      for my $file (@$changed) {
          render($file, sprintf(gettext("building %s"), $file));
      }

      derender_internal($_)
          for @$internal_new, @$internal_del, @$internal_changed;

      my ($backlinkchanged, $linkchangers) =
          calculate_changed_links($changed, $del, $oldlink_targets);

      render_linkers($_) for @$new, @$del;

      # render_dependent renders one page per call; repeat until it finds
      # nothing more to do.
      if (@$changed || @$internal_changed ||
          @$del || @$internal_del || @$internal_new) {
          1 while render_dependent($files, $new, $internal_new,
              $del, $internal_del, $internal_changed,
              $linkchangers);
      }

      render_backlinks($backlinkchanged);
      remove_unrendered();

      run_hooks(delete => sub { shift->(@$del) }) if @$del;
      run_hooks(change => sub { shift->(keys %rendered) }) if %rendered;
  }
  # Render the single file named by $config{render} and print the
  # resulting page to standard output, then exit.  Dies if the file has no
  # page type.
  sub commandline_render () {
      # The lock is held only while the index is loaded.
      lockwiki();
      loadindex();
      unlockwiki();

      my $srcfile = possibly_foolish_untaint($config{render});
      (my $file = $srcfile) =~ s/\Q$config{srcdir}\E\/?//;

      my $type = pagetype($file);
      defined $type
          or die sprintf(gettext("ikiwiki: cannot build %s"), $srcfile)."\n";

      my $content = readfile($srcfile);
      my $page = pagename($file);
      $pagesources{$page} = $file;

      # Same pipeline as render(), one stage at a time.
      $content = filter($page, $page, $content);
      $content = preprocess($page, $page, $content);
      $content = linkify($page, $page, $content);
      $content = htmlize($page, $page, $type, $content);

      $pagemtime{$page} = (stat($srcfile))[9];
      $pagectime{$page} = $pagemtime{$page}
          unless exists $pagectime{$page};

      print genpage($page, $content);
      exit 0;
  }
  591. 1