summaryrefslogtreecommitdiff
path: root/IkiWiki/Plugin/meta.pm
blob: 73bc2128cb6cf4304eebcbca0358cbf4cdf9db1c (plain)
  1. #!/usr/bin/perl
  2. # Ikiwiki metadata plugin.
  3. package IkiWiki::Plugin::meta;
  4. use warnings;
  5. use strict;
  6. use IkiWiki 3.00;
  7. my %metaheaders;
  8. sub import {
  9. hook(type => "getsetup", id => "meta", call => \&getsetup);
  10. hook(type => "needsbuild", id => "meta", call => \&needsbuild);
  11. hook(type => "preprocess", id => "meta", call => \&preprocess, scan => 1);
  12. hook(type => "pagetemplate", id => "meta", call => \&pagetemplate);
  13. }
  14. sub getsetup () {
  15. return
  16. plugin => {
  17. safe => 1,
  18. rebuild => undef,
  19. section => "core",
  20. },
  21. }
  22. sub needsbuild (@) {
  23. my $needsbuild=shift;
  24. foreach my $page (keys %pagestate) {
  25. if (exists $pagestate{$page}{meta}) {
  26. if (exists $pagesources{$page} &&
  27. grep { $_ eq $pagesources{$page} } @$needsbuild) {
  28. # remove state, it will be re-added
  29. # if the preprocessor directive is still
  30. # there during the rebuild
  31. delete $pagestate{$page}{meta};
  32. }
  33. }
  34. }
  35. return $needsbuild;
  36. }
  37. sub scrub ($$$) {
  38. if (IkiWiki::Plugin::htmlscrubber->can("sanitize")) {
  39. return IkiWiki::Plugin::htmlscrubber::sanitize(
  40. content => shift, page => shift, destpage => shift);
  41. }
  42. else {
  43. return shift;
  44. }
  45. }
  46. sub safeurl ($) {
  47. my $url=shift;
  48. if (exists $IkiWiki::Plugin::htmlscrubber::{safe_url_regexp} &&
  49. defined $IkiWiki::Plugin::htmlscrubber::safe_url_regexp) {
  50. return $url=~/$IkiWiki::Plugin::htmlscrubber::safe_url_regexp/;
  51. }
  52. else {
  53. return 1;
  54. }
  55. }
  56. sub htmlize ($$$) {
  57. my $page = shift;
  58. my $destpage = shift;
  59. return IkiWiki::htmlize($page, $destpage, pagetype($pagesources{$page}),
  60. IkiWiki::linkify($page, $destpage,
  61. IkiWiki::preprocess($page, $destpage, shift)));
  62. }
  63. sub preprocess (@) {
  64. return "" unless @_;
  65. my %params=@_;
  66. my $key=shift;
  67. my $value=$params{$key};
  68. delete $params{$key};
  69. my $page=$params{page};
  70. delete $params{page};
  71. my $destpage=$params{destpage};
  72. delete $params{destpage};
  73. delete $params{preview};
  74. eval q{use HTML::Entities};
  75. # Always decode, even if encoding later, since it might not be
  76. # fully encoded.
  77. $value=decode_entities($value);
  78. # Metadata collection that needs to happen during the scan pass.
  79. if ($key eq 'title') {
  80. $pagestate{$page}{meta}{title}=$value;
  81. if (exists $params{sortas}) {
  82. $pagestate{$page}{meta}{titlesort}=$params{sortas};
  83. }
  84. else {
  85. delete $pagestate{$page}{meta}{titlesort};
  86. }
  87. return "";
  88. }
  89. elsif ($key eq 'description') {
  90. $pagestate{$page}{meta}{description}=$value;
  91. # fallthrough
  92. }
  93. elsif ($key eq 'guid') {
  94. $pagestate{$page}{meta}{guid}=$value;
  95. # fallthrough
  96. }
  97. elsif ($key eq 'license') {
  98. push @{$metaheaders{$page}}, '<link rel="license" href="#pagelicense" />';
  99. $pagestate{$page}{meta}{license}=$value;
  100. return "";
  101. }
  102. elsif ($key eq 'copyright') {
  103. push @{$metaheaders{$page}}, '<link rel="copyright" href="#pagecopyright" />';
  104. $pagestate{$page}{meta}{copyright}=$value;
  105. return "";
  106. }
  107. elsif ($key eq 'link' && ! %params) {
  108. # hidden WikiLink
  109. add_link($page, $value);
  110. return "";
  111. }
  112. elsif ($key eq 'enclosure') {
  113. my $link=bestlink($page, $value);
  114. if (! length $link) {
  115. error gettext("enclosure not found")
  116. }
  117. add_depends($page, $link, deptype("presence"));
  118. $value=urlto($link, $page, 1);
  119. $pagestate{$page}{meta}{enclosure}=$value;
  120. $pagestate{$page}{meta}{enclosurefile}=$link;
  121. # fallthrough
  122. }
  123. elsif ($key eq 'author') {
  124. $pagestate{$page}{meta}{author}=$value;
  125. if (exists $params{sortas}) {
  126. $pagestate{$page}{meta}{authorsort}=$params{sortas};
  127. }
  128. else {
  129. delete $pagestate{$page}{meta}{authorsort};
  130. }
  131. # fallthorough
  132. }
  133. elsif ($key eq 'authorurl') {
  134. $pagestate{$page}{meta}{authorurl}=$value if safeurl($value);
  135. # fallthrough
  136. }
  137. elsif ($key eq 'permalink') {
  138. $pagestate{$page}{meta}{permalink}=$value if safeurl($value);
  139. # fallthrough
  140. }
  141. elsif ($key eq 'date') {
  142. eval q{use Date::Parse};
  143. if (! $@) {
  144. my $time = str2time($value);
  145. if (defined $time) {
  146. $IkiWiki::pagectime{$page}=$time;
  147. }
  148. else {
  149. error(sprintf(gettext('cannot parse date/time: %s'), $value));
  150. }
  151. }
  152. else {
  153. error $@;
  154. }
  155. }
  156. elsif ($key eq 'updated') {
  157. eval q{use Date::Parse};
  158. if (! $@) {
  159. my $time = str2time($value);
  160. if (defined $time) {
  161. $pagestate{$page}{meta}{updated}=$time;
  162. }
  163. else {
  164. error(sprintf(gettext('cannot parse date/time: %s'), $value));
  165. }
  166. }
  167. else {
  168. error $@;
  169. }
  170. }
  171. if (! defined wantarray) {
  172. # avoid collecting duplicate data during scan pass
  173. return;
  174. }
  175. # Metadata handling that happens only during preprocessing pass.
  176. if ($key eq 'permalink') {
  177. if (safeurl($value)) {
  178. push @{$metaheaders{$page}}, scrub('<link rel="bookmark" href="'.encode_entities($value).'" />', $page, $destpage);
  179. }
  180. }
  181. elsif ($key eq 'stylesheet') {
  182. my $rel=exists $params{rel} ? $params{rel} : "alternate stylesheet";
  183. my $title=exists $params{title} ? $params{title} : $value;
  184. # adding .css to the value prevents using any old web
  185. # editable page as a stylesheet
  186. my $stylesheet=bestlink($page, $value.".css");
  187. if (! length $stylesheet) {
  188. error gettext("stylesheet not found")
  189. }
  190. push @{$metaheaders{$page}}, scrub('<link href="'.urlto($stylesheet, $page).
  191. '" rel="'.encode_entities($rel).
  192. '" title="'.encode_entities($title).
  193. "\" type=\"text/css\" />", $page, $destpage);
  194. }
  195. elsif ($key eq 'script') {
  196. my $defer=exists $params{defer} ? ' defer="defer"' : '';
  197. my $async=exists $params{async} ? ' async="async"' : '';
  198. my $srcurl=$value;
  199. my $js=bestlink($page, $value.".js");
  200. if (length $js) {
  201. $srcurl=urlto($js, $page);
  202. }
  203. push @{$metaheaders{$page}}, scrub('<script src="'. $srcurl .
  204. '"' . $defer . $async . ' type="text/javascript"></script>',
  205. $page, $destpage);
  206. }
  207. elsif ($key eq 'openid') {
  208. my $delegate=0; # both by default
  209. if (exists $params{delegate}) {
  210. $delegate = 1 if lc $params{delegate} eq 'openid';
  211. $delegate = 2 if lc $params{delegate} eq 'openid2';
  212. }
  213. if (exists $params{server} && safeurl($params{server})) {
  214. push @{$metaheaders{$page}}, '<link href="'.encode_entities($params{server}).
  215. '" rel="openid.server" />' if $delegate ne 2;
  216. push @{$metaheaders{$page}}, '<link href="'.encode_entities($params{server}).
  217. '" rel="openid2.provider" />' if $delegate ne 1;
  218. }
  219. if (safeurl($value)) {
  220. push @{$metaheaders{$page}}, '<link href="'.encode_entities($value).
  221. '" rel="openid.delegate" />' if $delegate ne 2;
  222. push @{$metaheaders{$page}}, '<link href="'.encode_entities($value).
  223. '" rel="openid2.local_id" />' if $delegate ne 1;
  224. }
  225. if (exists $params{"xrds-location"} && safeurl($params{"xrds-location"})) {
  226. # force url absolute
  227. eval q{use URI};
  228. error($@) if $@;
  229. my $url=URI->new_abs($params{"xrds-location"}, $config{url});
  230. push @{$metaheaders{$page}}, '<meta http-equiv="X-XRDS-Location" '.
  231. 'content="'.encode_entities($url).'" />';
  232. }
  233. }
  234. elsif ($key eq 'foaf') {
  235. if (safeurl($value)) {
  236. push @{$metaheaders{$page}}, '<link rel="meta" '.
  237. 'type="application/rdf+xml" title="FOAF" '.
  238. 'href="'.encode_entities($value).'" />';
  239. }
  240. }
  241. elsif ($key eq 'redir') {
  242. return "" if $page ne $destpage;
  243. my $safe=0;
  244. if ($value !~ /^\w+:\/\//) {
  245. my ($redir_page, $redir_anchor) = split /\#/, $value;
  246. my $link=bestlink($page, $redir_page);
  247. if (! length $link) {
  248. error gettext("redir page not found")
  249. }
  250. add_depends($page, $link, deptype("presence"));
  251. $value=urlto($link, $page);
  252. $value.='#'.$redir_anchor if defined $redir_anchor;
  253. $safe=1;
  254. # redir cycle detection
  255. $pagestate{$page}{meta}{redir}=$link;
  256. my $at=$page;
  257. my %seen;
  258. while (exists $pagestate{$at}{meta}{redir}) {
  259. if ($seen{$at}) {
  260. error gettext("redir cycle is not allowed")
  261. }
  262. $seen{$at}=1;
  263. $at=$pagestate{$at}{meta}{redir};
  264. }
  265. }
  266. else {
  267. $value=encode_entities($value);
  268. }
  269. my $delay=int(exists $params{delay} ? $params{delay} : 0);
  270. my $redir="<meta http-equiv=\"refresh\" content=\"$delay; URL=$value\" />";
  271. if (! $safe) {
  272. $redir=scrub($redir, $page, $destpage);
  273. }
  274. push @{$metaheaders{$page}}, $redir;
  275. }
  276. elsif ($key eq 'link') {
  277. if (%params) {
  278. push @{$metaheaders{$page}}, scrub("<link href=\"".encode_entities($value)."\" ".
  279. join(" ", map {
  280. encode_entities($_)."=\"".encode_entities(decode_entities($params{$_}))."\""
  281. } keys %params).
  282. " />\n", $page, $destpage);
  283. }
  284. }
  285. elsif ($key eq 'robots') {
  286. push @{$metaheaders{$page}}, '<meta name="robots"'.
  287. ' content="'.encode_entities($value).'" />';
  288. }
  289. elsif ($key eq 'description' || $key eq 'author') {
  290. push @{$metaheaders{$page}}, '<meta name="'.$key.
  291. '" content="'.encode_entities($value).'" />';
  292. }
  293. elsif ($key eq 'name') {
  294. push @{$metaheaders{$page}}, scrub('<meta name="'.
  295. encode_entities($value).
  296. '" '.
  297. join(' ', map { "$_=\"$params{$_}\"" } keys %params).
  298. ' />', $page, $destpage);
  299. }
  300. elsif ($key eq 'keywords') {
  301. # Make sure the keyword string is safe: only allow alphanumeric
  302. # characters, space and comma and strip the rest.
  303. $value =~ s/[^[:alnum:], ]+//g;
  304. push @{$metaheaders{$page}}, '<meta name="keywords"'.
  305. ' content="'.encode_entities($value).'" />';
  306. }
  307. else {
  308. push @{$metaheaders{$page}}, scrub('<meta name="'.
  309. encode_entities($key).'" content="'.
  310. encode_entities($value).'" />', $page, $destpage);
  311. }
  312. return "";
  313. }
  314. sub pagetemplate (@) {
  315. my %params=@_;
  316. my $page=$params{page};
  317. my $destpage=$params{destpage};
  318. my $template=$params{template};
  319. if (exists $metaheaders{$page} && $template->query(name => "meta")) {
  320. # avoid duplicate meta lines
  321. my %seen;
  322. $template->param(meta => join("\n", grep { (! $seen{$_}) && ($seen{$_}=1) } @{$metaheaders{$page}}));
  323. }
  324. if (exists $pagestate{$page}{meta}{title} && $template->query(name => "title")) {
  325. eval q{use HTML::Entities};
  326. $template->param(title => HTML::Entities::encode_numeric($pagestate{$page}{meta}{title}));
  327. $template->param(title_overridden => 1);
  328. }
  329. if (exists $pagestate{$page}{meta}{enclosure}) {
  330. $template->param(enclosure => HTML::Entities::encode_entities(IkiWiki::urlabs($pagestate{$page}{meta}{enclosure}, $config{url})));
  331. }
  332. foreach my $field (qw{authorurl}) {
  333. eval q{use HTML::Entities};
  334. $template->param($field => HTML::Entities::encode_entities($pagestate{$page}{meta}{$field}))
  335. if exists $pagestate{$page}{meta}{$field} && $template->query(name => $field);
  336. }
  337. foreach my $field (qw{permalink}) {
  338. if (exists $pagestate{$page}{meta}{$field} && $template->query(name => $field)) {
  339. eval q{use HTML::Entities};
  340. $template->param($field => HTML::Entities::encode_entities(IkiWiki::urlabs($pagestate{$page}{meta}{$field}, $config{url})));
  341. }
  342. }
  343. foreach my $field (qw{description author}) {
  344. eval q{use HTML::Entities};
  345. $template->param($field => HTML::Entities::encode_numeric($pagestate{$page}{meta}{$field}))
  346. if exists $pagestate{$page}{meta}{$field} && $template->query(name => $field);
  347. }
  348. foreach my $field (qw{license copyright}) {
  349. if (exists $pagestate{$page}{meta}{$field} && $template->query(name => $field) &&
  350. ($page eq $destpage || ! exists $pagestate{$destpage}{meta}{$field} ||
  351. $pagestate{$page}{meta}{$field} ne $pagestate{$destpage}{meta}{$field})) {
  352. $template->param($field => htmlize($page, $destpage, $pagestate{$page}{meta}{$field}));
  353. }
  354. }
  355. }
  356. sub get_sort_key {
  357. my $page = shift;
  358. my $meta = shift;
  359. # e.g. titlesort (also makes sense for author)
  360. my $key = $pagestate{$page}{meta}{$meta . "sort"};
  361. return $key if defined $key;
  362. # e.g. title
  363. $key = $pagestate{$page}{meta}{$meta};
  364. return $key if defined $key;
  365. # fall back to closer-to-core things
  366. if ($meta eq 'title') {
  367. return pagetitle(IkiWiki::basename($page));
  368. }
  369. elsif ($meta eq 'date') {
  370. return $IkiWiki::pagectime{$page};
  371. }
  372. elsif ($meta eq 'updated') {
  373. return $IkiWiki::pagemtime{$page};
  374. }
  375. else {
  376. return '';
  377. }
  378. }
  379. sub match {
  380. my $field=shift;
  381. my $page=shift;
  382. # turn glob into a safe regexp
  383. my $re=IkiWiki::glob2re(shift);
  384. my $val;
  385. if (exists $pagestate{$page}{meta}{$field}) {
  386. $val=$pagestate{$page}{meta}{$field};
  387. }
  388. elsif ($field eq 'title') {
  389. $val = pagetitle($page);
  390. }
  391. if (defined $val) {
  392. if ($val=~$re) {
  393. return IkiWiki::SuccessReason->new("$re matches $field of $page", $page => $IkiWiki::DEPEND_CONTENT, "" => 1);
  394. }
  395. else {
  396. return IkiWiki::FailReason->new("$re does not match $field of $page", $page => $IkiWiki::DEPEND_CONTENT, "" => 1);
  397. }
  398. }
  399. else {
  400. return IkiWiki::FailReason->new("$page does not have a $field", $page => $IkiWiki::DEPEND_CONTENT);
  401. }
  402. }
  403. package IkiWiki::PageSpec;
  404. sub match_title ($$;@) {
  405. IkiWiki::Plugin::meta::match("title", @_);
  406. }
  407. sub match_author ($$;@) {
  408. IkiWiki::Plugin::meta::match("author", @_);
  409. }
  410. sub match_authorurl ($$;@) {
  411. IkiWiki::Plugin::meta::match("authorurl", @_);
  412. }
  413. sub match_license ($$;@) {
  414. IkiWiki::Plugin::meta::match("license", @_);
  415. }
  416. sub match_copyright ($$;@) {
  417. IkiWiki::Plugin::meta::match("copyright", @_);
  418. }
  419. sub match_guid ($$;@) {
  420. IkiWiki::Plugin::meta::match("guid", @_);
  421. }
  422. package IkiWiki::SortSpec;
  423. sub cmp_meta {
  424. my $meta = shift;
  425. error(gettext("sort=meta requires a parameter")) unless defined $meta;
  426. if ($meta eq 'updated' || $meta eq 'date') {
  427. return IkiWiki::Plugin::meta::get_sort_key($a, $meta)
  428. <=>
  429. IkiWiki::Plugin::meta::get_sort_key($b, $meta);
  430. }
  431. return IkiWiki::Plugin::meta::get_sort_key($a, $meta)
  432. cmp
  433. IkiWiki::Plugin::meta::get_sort_key($b, $meta);
  434. }
  435. # A prototype of how sort=title could behave in 4.0 or something
  436. sub cmp_meta_title {
  437. $_[0] = 'title';
  438. return cmp_meta(@_);
  439. }
  440. 1