2006-04-25 01:09:26 +02:00
|
|
|
#!/usr/bin/perl
|
|
|
|
|
2006-03-23 07:51:15 +01:00
|
|
|
package IkiWiki;
|
|
|
|
|
|
|
|
use warnings;
|
|
|
|
use strict;
|
2006-05-02 08:53:33 +02:00
|
|
|
use IkiWiki;
|
2006-07-03 22:18:16 +02:00
|
|
|
use Encode;
|
2006-03-23 07:51:15 +01:00
|
|
|
|
2006-10-28 07:07:56 +02:00
|
|
|
# Reverse link index, filled in by calculate_links():
# $backlinks{$target}{$linking_page}=1.
my %backlinks;
|
2009-08-14 07:11:53 +02:00
|
|
|
# Links that bestlink() could not resolve, filled in by calculate_links():
# $brokenlinks{$link} is a list of the pages that contain that link.
our %brokenlinks;
|
|
|
|
# Set to 1 once calculate_links() has built the two indexes above, so that
# later calls return immediately.
my $links_calculated=0;
|
2006-10-28 07:07:56 +02:00
|
|
|
|
2009-08-14 07:11:53 +02:00
|
|
|
# Builds the %backlinks and %brokenlinks indexes from %links.
#
# Every link of every page is resolved with bestlink(). A link that resolves
# to another page is recorded as a backlink of that page; a link that does
# not resolve at all is recorded as broken. Links from a page to itself are
# ignored. The work is done only once; later calls return immediately.
sub calculate_links () {
    if ($links_calculated) {
        return;
    }

    %backlinks=();
    %brokenlinks=();

    for my $source (keys %links) {
        for my $target (@{$links{$source}}) {
            my $resolved=bestlink($source, $target);

            unless (length $resolved) {
                # nothing to link to: remember who wanted it
                push @{$brokenlinks{$target}}, $source;
                next;
            }

            # a page does not count as a backlink of itself
            next if $resolved eq $source;
            $backlinks{$resolved}{$source}=1;
        }
    }

    $links_calculated=1;
}
|
2006-10-28 07:07:56 +02:00
|
|
|
|
2009-06-18 19:27:00 +02:00
|
|
|
# Returns the names of the pages that link to $page (in no particular
# order), making sure the link indexes have been calculated first.
sub backlink_pages ($) {
    my ($page)=@_;

    calculate_links();

    return keys %{$backlinks{$page}};
}
|
|
|
|
|
|
|
|
# Returns one hash ref per page linking to $page, each with:
#   url  - urlto() the linking page, relative to $page
#   page - pagetitle() of the linking page's name, with the leading
#          directory components it shares with $page removed
sub backlinks ($) {
    my ($page)=@_;

    my @links=map {
        my $linker=$_;
        my $href=urlto($linker, $page);

        # Trim common dir prefixes from both pages.
        my ($linker_rest, $page_rest)=($linker, $page);
        while (my ($dir)=$page_rest=~m!^([^/]+/)!) {
            # stop at the first component the two pages do not share
            last unless $linker_rest=~s/^\Q$dir\E//;
            last unless $page_rest=~s/^\Q$dir\E//;
        }

        +{ url => $href, page => pagetitle($linker_rest) };
    } backlink_pages($page);

    return @links;
}
|
2006-03-23 07:51:15 +01:00
|
|
|
|
2008-12-17 21:22:16 +01:00
|
|
|
# Wraps the htmlized $content of $page in the page template and returns the
# finished html.
#
# Parameters:
#   $page    - name of the page being generated
#   $content - body of the page, already converted to html
#
# Steps: pick a template (the first templatefile hook that names a template
# template_file() can find wins, otherwise page.tmpl), fill in the action
# links, backlinks, titles and times, let pagetemplate hooks adjust the
# template, then pass the output through the postscan and format hooks.
sub genpage ($$) {
    my $page=shift;
    my $content=shift;

    my $templatefile;
    run_hooks(templatefile => sub {
        # an earlier hook already chose a template
        return if defined $templatefile;
        my $file=shift->(page => $page);
        if (defined $file && defined template_file($file)) {
            $templatefile=$file;
        }
    });
    my $template=template(defined $templatefile ? $templatefile : 'page.tmpl', blind_cache => 1);

    # counts the action links offered, to decide whether to set have_actions
    my $actions=0;

    if (length $config{cgiurl}) {
        $template->param(editurl => cgiurl(do => "edit", page => $page))
            if IkiWiki->can("cgi_editpage");
        $template->param(prefsurl => cgiurl(do => "prefs"))
            if exists $hooks{auth};
        $actions++;
    }

    if (defined $config{historyurl} && length $config{historyurl}) {
        # [[file]] in the configured url stands for the page's source file
        my $u=$config{historyurl};
        $u=~s/\[\[file\]\]/$pagesources{$page}/g;
        $template->param(historyurl => $u);
        $actions++;
    }

    if ($config{discussion}) {
        # scan() records the discussion link as
        # $page."/".lc($config{discussionpage}), so the checks here must
        # not depend on the case of the configured name: a page that is
        # itself a discussion page is recognised case-insensitively, and
        # an existing discussion page is looked up under both the
        # configured and the lower-cased name.
        my $discussion=$config{discussionpage};
        if ($page !~ /.*\/\Q$discussion\E$/i &&
            (length $config{cgiurl} ||
             exists $links{$page."/".$discussion} ||
             exists $links{$page."/".lc($discussion)})) {
            $template->param(discussionlink => htmllink($page, $page, $config{discussionpage}, noimageinline => 1, forcesubpage => 1));
            $actions++;
        }
    }

    if ($actions) {
        $template->param(have_actions => 1);
    }

    # Backlinks are sorted by title; at most numbacklinks of them go in
    # the main list and the rest in more_backlinks. A false numbacklinks
    # disables the split.
    my @backlinks=sort { $a->{page} cmp $b->{page} } backlinks($page);
    my ($backlinks, $more_backlinks);
    if (@backlinks <= $config{numbacklinks} || ! $config{numbacklinks}) {
        $backlinks=\@backlinks;
        $more_backlinks=[];
    }
    else {
        $backlinks=[@backlinks[0..$config{numbacklinks}-1]];
        $more_backlinks=[@backlinks[$config{numbacklinks}..$#backlinks]];
    }

    $template->param(
        title => $page eq 'index'
            ? $config{wikiname}
            : pagetitle(basename($page)),
        wikiname => $config{wikiname},
        content => $content,
        backlinks => $backlinks,
        more_backlinks => $more_backlinks,
        mtime => displaytime($pagemtime{$page}),
        ctime => displaytime($pagectime{$page}),
        baseurl => baseurl($page),
    );

    run_hooks(pagetemplate => sub {
        shift->(page => $page, destpage => $page, template => $template);
    });

    $content=$template->output;

    # postscan hooks only look at the finished page ...
    run_hooks(postscan => sub {
        shift->(page => $page, content => $content);
    });

    # ... while each format hook replaces it with what it returns
    run_hooks(format => sub {
        $content=shift->(
            page => $page,
            content => $content,
        );
    });

    return $content;
}
|
2006-03-23 07:51:15 +01:00
|
|
|
|
2008-12-17 21:22:16 +01:00
|
|
|
# First pass over a source file: registers what it will render to and
# collects the links of a page, without generating any output.
#
# A file with no page type is only registered with will_render() under its
# own name. For a page, %links is reset (to just the discussion link when
# discussion is enabled), the scan hooks are run on the raw content, and
# the content is preprocessed in scan-only mode.
sub scan ($) {
    my ($file)=@_;

    my $type=pagetype($file);
    if (! defined $type) {
        will_render($file, $file, 1);
    }
    else {
        my $srcfile=srcfile($file);
        my $content=readfile($srcfile);
        my $page=pagename($file);
        will_render($page, htmlpage($page), 1);

        # Discussion links are a special case since they're
        # not in the text of the page, but on its template.
        $links{$page}=$config{discussion}
            ? [ $page."/".lc($config{discussionpage}) ]
            : [];

        run_hooks(scan => sub {
            my $hook=shift;
            $hook->(
                page => $page,
                content => $content,
            );
        });

        # Preprocess in scan-only mode.
        preprocess($page, $page, $content, 1);
    }
}
|
2006-03-23 07:51:15 +01:00
|
|
|
|
2008-12-17 21:22:16 +01:00
|
|
|
# Copies everything that can be read from $srcfd to $destfd in 16k blocks.
#
# Parameters:
#   $srcfile  - name of the source file, used in error messages only
#   $destfile - name of the destination file, used in error messages only
#   $srcfd    - filehandle to read from
#   $destfd   - filehandle to write to
#   $cleanup  - passed through to error() as its second argument
#
# A failed read or write is reported with error(). A read that was merely
# interrupted by a signal is retried.
sub fast_file_copy (@) {
    my ($srcfile, $destfile, $srcfd, $destfd, $cleanup)=@_;

    my $blksize = 16384;
    my $buf;
    while (1) {
        my $len = sysread $srcfd, $buf, $blksize;

        # sysread returns undef on error and 0 at end of file. The two
        # must be told apart before deciding to stop, or a read error
        # would silently end the copy and leave a truncated file.
        if (! defined $len) {
            # %! tests the errno itself rather than its
            # locale-dependent message text
            next if $!{EINTR};
            error("failed to read $srcfile: $!", $cleanup);
            # error() is expected not to return; stop rather than
            # spin on the same failure if it ever does
            return;
        }
        last if $len == 0;

        # syswrite may write less than requested; keep going until the
        # whole block is out
        my $offset = 0;
        while ($len) {
            my $written = syswrite $destfd, $buf, $len, $offset;
            defined $written
                or error("failed to write $destfile: $!", $cleanup);
            $len -= $written;
            $offset += $written;
        }
    }
}
|
|
|
|
|
2008-12-17 21:22:16 +01:00
|
|
|
# Builds the output for one source file.
#
# A file with no page type is copied into the destdir unchanged (hardlinked
# when hardlink is configured, the source is owned by the effective user
# and the link succeeds). A page is filtered, preprocessed, linkified and
# htmlized, then written out wrapped by genpage(); pages whose type starts
# with an underscore are registered but produce no output. In both cases
# the dependencies recorded for the file are forgotten first.
sub render ($) {
    my ($file)=@_;

    my $type=pagetype($file);
    my $srcfile=srcfile($file);
    if (! defined $type) {
        delete $depends{$file};
        delete $depends_simple{$file};
        will_render($file, $file, 1);

        if ($config{hardlink}) {
            # only hardlink if owned by same user
            my $owner=(stat($srcfile))[4];
            if ($owner == $>) {
                my $dest=$config{destdir}."/".$file;
                prep_writefile($file, $config{destdir});
                unlink($dest);
                return if link($srcfile, $dest);
            }
            # if hardlink fails, fall back to copying
        }

        my $srcfd=readfile($srcfile, 1, 1);
        writefile($file, $config{destdir}, undef, 1, sub {
            # writefile passes on whatever else the copy needs
            fast_file_copy($srcfile, $file, $srcfd, @_);
        });
    }
    else {
        my $page=pagename($file);
        delete $depends{$page};
        delete $depends_simple{$page};
        will_render($page, htmlpage($page), 1);
        return if $type=~/^_/;

        # innermost call runs first: read, filter, preprocess,
        # linkify, htmlize
        my $content=htmlize($page, $page, $type,
            linkify($page, $page,
                preprocess($page, $page,
                    filter($page, $page,
                        readfile($srcfile)))));

        my $dest=htmlpage($page);
        writefile($dest, $config{destdir}, genpage($page, $content));
    }
}
|
2006-03-23 07:51:15 +01:00
|
|
|
|
2008-12-17 21:22:16 +01:00
|
|
|
# Deletes $file, then removes its parent directories from the innermost
# outwards for as long as rmdir succeeds (that is, until one is not empty
# or cannot be removed).
sub prune ($) {
    my ($file)=@_;

    unlink($file);

    my $dir=dirname($file);
    $dir=dirname($dir) while rmdir($dir);
}
|
2006-03-23 07:51:15 +01:00
|
|
|
|
2009-07-20 05:23:16 +02:00
|
|
|
# Security check: walks from the srcdir up through each of its parent
# directories and calls error() if any of them is a symlink, unless
# allow_symlinks_before_srcdir is set.
sub srcdir_check () {
    # security check, avoid following symlinks in the srcdir path by default
    my $test=$config{srcdir};
    while (length $test) {
        if (-l $test && ! $config{allow_symlinks_before_srcdir}) {
            error(sprintf(gettext("symlink found in srcdir path (%s) -- set allow_symlinks_before_srcdir to allow this"), $test));
        }

        # Strip trailing slashes first; only when there are none, step
        # up to the parent directory. An absolute path ends up as "/",
        # which the substitution empties, ending the loop.
        unless ($test=~s/\/+$//) {
            my $parent=dirname($test);
            # A relative path bottoms out at ".", whose dirname is
            # "." again; stop there instead of looping forever.
            last if $parent eq $test;
            $test=$parent;
        }
    }
}
|
2007-11-26 21:30:44 +01:00
|
|
|
|
2009-07-20 05:23:16 +02:00
|
|
|
# Walks the srcdir and then each underlay directory looking for source
# files.
#
# Returns two references: a list of the files found (paths relative to the
# directory they were found in) and a hash whose keys are the corresponding
# page names.
#
# Pruned files, symlinks and directories are skipped, and a file name that
# does not match wiki_file_regexp is skipped with a warning. A file from an
# underlay is only used when nothing exists at the same path in the srcdir
# and no earlier file already provides its page.
sub find_src_files () {
    my (@files, %pages);

    eval q{use File::Find};
    error($@) if $@;

    find({
        no_chdir => 1,
        wanted => sub {
            $_=decode_utf8($_);
            if (file_pruned($_, $config{srcdir})) {
                $File::Find::prune=1;
                return;
            }
            return if -l $_ || -d _;

            my ($f)=/$config{wiki_file_regexp}/; # untaint
            unless (defined $f) {
                warn(sprintf(gettext("skipping bad filename %s"), $_)."\n");
                return;
            }

            $f=~s/^\Q$config{srcdir}\E\/?//;
            push @files, $f;

            my $pagename = pagename($f);
            debug(sprintf(gettext("%s has multiple possible source pages"), $pagename))
                if $pages{$pagename};
            $pages{$pagename}=1;
        },
    }, $config{srcdir});

    foreach my $dir (@{$config{underlaydirs}}, $config{underlaydir}) {
        find({
            no_chdir => 1,
            wanted => sub {
                $_=decode_utf8($_);
                if (file_pruned($_, $dir)) {
                    $File::Find::prune=1;
                    return;
                }
                return if -l $_ || -d _;

                my ($f)=/$config{wiki_file_regexp}/; # untaint
                unless (defined $f) {
                    warn(sprintf(gettext("skipping bad filename %s"), $_)."\n");
                    return;
                }

                $f=~s/^\Q$dir\E\/?//;

                # avoid underlaydir
                # override attacks; see
                # security.mdwn
                return if -l "$config{srcdir}/$f" || -e _;

                my $page=pagename($f);
                return if $pages{$page};
                push @files, $f;
                $pages{$page}=1;
            },
        }, $dir);
    }

    # Returns a list of all source files found, and a hash of
    # the corresponding page names.
    return \@files, \%pages;
}
|
|
|
|
|
|
|
|
# Brings the rendered wiki up to date with its source files.
#
# In order:
#   1. note added and removed pages, pruning the output of removed ones
#   2. collect files that are new, newer than recorded, or forced to rebuild
#   3. scan and then render those files
#   4. render pages that link to an added or removed page
#   5. render pages with a dependency on something that changed
#   6. render pages whose backlinks changed
#   7. prune output files that pages no longer produce
#   8. run the delete and change hooks
# Internal pages are never rendered; they are only scanned, and their
# dependency and rendered-file records are reset.
sub refresh () {
    srcdir_check();
    run_hooks(refresh => sub { shift->() });
    my ($files, $exists)=find_src_files();

    my (%rendered, @add, @del, @internal);

    # check for added or removed pages
    foreach my $file (@$files) {
        my $page=pagename($file);
        if (exists $pagesources{$page} && $pagesources{$page} ne $file) {
            # the page has changed its type
            $forcerebuild{$page}=1;
        }
        $pagesources{$page}=$file;

        # a page with a recorded mtime is not new
        next if $pagemtime{$page};

        if (isinternal($page)) {
            push @internal, $file;
        }
        else {
            push @add, $file;
            if ($config{getctime} && -e "$config{srcdir}/$file") {
                eval {
                    $pagectime{$page}=rcs_getctime("$config{srcdir}/$file");
                };
                print STDERR $@ if $@;
            }
        }
        $pagecase{lc $page}=$page;
        if (! exists $pagectime{$page}) {
            $pagectime{$page}=(srcfile_stat($file))[10];
        }
    }
    foreach my $page (keys %pagemtime) {
        next if $exists->{$page};

        if (isinternal($page)) {
            push @internal, $pagesources{$page};
        }
        else {
            debug(sprintf(gettext("removing old page %s"), $page));
            push @del, $pagesources{$page};
        }
        $links{$page}=[];
        $renderedfiles{$page}=[];
        $pagemtime{$page}=0;
        prune($config{destdir}."/".$_)
            foreach @{$oldrenderedfiles{$page}};
        delete $pagesources{$page};
        foreach my $dest (keys %destsources) {
            delete $destsources{$dest}
                if $destsources{$dest} eq $page;
        }
    }

    # find changed and new files
    my @needsbuild;
    foreach my $file (@$files) {
        my $page=pagename($file);
        my ($srcfile, @stat)=srcfile_stat($file);
        next unless ! exists $pagemtime{$page} ||
                    $stat[9] > $pagemtime{$page} ||
                    $forcerebuild{$page};

        $pagemtime{$page}=$stat[9];
        if (isinternal($page)) {
            push @internal, $file;
            # Preprocess internal page in scan-only mode.
            preprocess($page, $page, readfile($srcfile), 1);
        }
        else {
            push @needsbuild, $file;
        }
    }
    run_hooks(needsbuild => sub { shift->(\@needsbuild) });

    # scan and render files
    foreach my $file (@needsbuild) {
        debug(sprintf(gettext("scanning %s"), $file));
        scan($file);
    }
    calculate_links();
    foreach my $file (@needsbuild) {
        debug(sprintf(gettext("building %s"), $file));
        render($file);
        $rendered{$file}=1;
    }
    foreach my $file (@internal) {
        # internal pages are not rendered
        my $page=pagename($file);
        delete $depends{$page};
        delete $depends_simple{$page};
        delete $destsources{$_}
            foreach @{$renderedfiles{$page}};
        $renderedfiles{$page}=[];
    }

    # rebuild pages that link to added or removed pages
    if (@add || @del) {
        foreach my $f (@add, @del) {
            my $p=pagename($f);
            foreach my $page (keys %{$backlinks{$p}}) {
                my $file=$pagesources{$page};
                next if $rendered{$file};
                debug(sprintf(gettext("building %s, which links to %s"), $file, $p));
                render($file);
                $rendered{$file}=1;
            }
        }
    }

    if (%rendered || @del || @internal) {
        my @changed=(keys %rendered, @del);

        # lower-cased names of the changed pages, for looking up the
        # simple dependencies
        my %lcchanged;
        $lcchanged{lc(pagename($_))}=1 foreach @changed;

        # rebuild dependant pages
        foreach my $f (@$files) {
            next if $rendered{$f};
            my $p=pagename($f);
            my $reason = undef;

            # cheap check first: plain hash lookups
            if (exists $depends_simple{$p}) {
                foreach my $d (keys %{$depends_simple{$p}}) {
                    next unless exists $lcchanged{$d};
                    $reason = $d;
                    last;
                }
            }

            # otherwise match every changed page against each of the
            # page's pagespec dependencies
            if (exists $depends{$p} && ! defined $reason) {
                D: foreach my $d (keys %{$depends{$p}}) {
                    my $sub=pagespec_translate($d);
                    next if $@ || ! defined $sub;

                    # only consider internal files
                    # if the page explicitly depends
                    # on such files
                    foreach my $file (@changed, $d =~ /internal\(/ ? @internal : ()) {
                        next if $file eq $f;
                        my $page=pagename($file);
                        next unless $sub->($page, location => $p);
                        $reason = $page;
                        last D;
                    }
                }
            }

            if (defined $reason) {
                debug(sprintf(gettext("building %s, which depends on %s"), $f, $reason));
                render($f);
                $rendered{$f}=1;
            }
        }

        # handle backlinks; if a page has added/removed links,
        # update the pages it links to
        my %linkchanged;

        # Marks every resolvable link that $page has in %$from but not
        # (after resolving) in %$against.
        my $mark_differences = sub {
            my ($page, $from, $against)=@_;
            return unless exists $from->{$page};
            foreach my $link (map { bestlink($page, $_) } @{$from->{$page}}) {
                next unless length $link;
                if (! exists $against->{$page} ||
                    ! grep { bestlink($page, $_) eq $link } @{$against->{$page}}) {
                    $linkchanged{$link}=1;
                }
            }
        };
        foreach my $file (@changed) {
            my $page=pagename($file);
            $mark_differences->($page, \%links, \%oldlinks);
            $mark_differences->($page, \%oldlinks, \%links);
        }

        foreach my $link (keys %linkchanged) {
            my $linkfile=$pagesources{$link};
            next unless defined $linkfile;
            next if $rendered{$linkfile};
            debug(sprintf(gettext("building %s, to update its backlinks"), $linkfile));
            render($linkfile);
            $rendered{$linkfile}=1;
        }
    }

    # remove no longer rendered files
    foreach my $src (keys %rendered) {
        my $page=pagename($src);
        foreach my $file (@{$oldrenderedfiles{$page}}) {
            next if grep { $_ eq $file } @{$renderedfiles{$page}};
            debug(sprintf(gettext("removing %s, no longer built by %s"), $file, $page));
            prune($config{destdir}."/".$file);
        }
    }

    if (@del) {
        run_hooks(delete => sub { shift->(@del) });
    }
    if (%rendered) {
        run_hooks(change => sub { shift->(keys %rendered) });
    }
}
|
2006-03-23 07:51:15 +01:00
|
|
|
|
2008-12-17 21:22:16 +01:00
|
|
|
# Renders the single file named by $config{render} and prints the resulting
# html to standard output, then exits with status 0.
#
# The index is loaded under the wiki lock first. Dies if the file has no
# page type.
sub commandline_render () {
    lockwiki();
    loadindex();
    unlockwiki();

    my $srcfile=possibly_foolish_untaint($config{render});
    # name of the file with the srcdir part removed
    (my $file=$srcfile)=~s/\Q$config{srcdir}\E\/?//;

    my $type=pagetype($file);
    if (! defined $type) {
        die sprintf(gettext("ikiwiki: cannot build %s"), $srcfile)."\n";
    }

    my $content=readfile($srcfile);
    my $page=pagename($file);
    $pagesources{$page}=$file;

    # same pipeline as a regular render, one stage at a time
    $content=filter($page, $page, $content);
    $content=preprocess($page, $page, $content);
    $content=linkify($page, $page, $content);
    $content=htmlize($page, $page, $type, $content);

    $pagemtime{$page}=(stat($srcfile))[9];
    # a page with no recorded creation time gets its mtime
    unless (exists $pagectime{$page}) {
        $pagectime{$page}=$pagemtime{$page};
    }

    print genpage($page, $content);
    exit 0;
}
|
2006-09-21 23:34:29 +02:00
|
|
|
|
2006-03-23 07:51:15 +01:00
|
|
|
1
|