aboutsummaryrefslogtreecommitdiff
path: root/IkiWiki/Plugin/htmltidy.pm
blob: da77e60f1cb6198278e87897522fd74b553f95e9 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
#!/usr/bin/perl
# HTML Tidy plugin
# requires 'tidy' binary, found in Debian or http://tidy.sf.net/
# mostly a proof-of-concept on how to use external filters.
# It is particularly useful when the html plugin is used.
#
# by Faidon Liambotis
package IkiWiki::Plugin::htmltidy;

use warnings;
use strict;
use IkiWiki 3.00;
use IPC::Open2;

# Called when the plugin is loaded: registers this plugin's getsetup,
# sanitize and checkconfig handlers with IkiWiki, all under the id "tidy".
sub import {
	# Hook type paired with its handler, kept in registration order.
	my @registrations=(
		[getsetup => \&getsetup],
		[sanitize => \&sanitize],
		[checkconfig => \&checkconfig],
	);

	foreach my $registration (@registrations) {
		my ($hook_type, $handler)=@{$registration};
		hook(type => $hook_type, id => "tidy", call => $handler);
	}
}

# getsetup hook: describes this plugin and its single setting.
#
# Returns an ordered key/value list:
#   plugin   => metadata about the plugin itself
#   htmltidy => description of the "htmltidy" setting (the command line
#               that sanitize() runs)
sub getsetup () {
	my %plugin_info=(
		safe => 1,
		rebuild => undef,
	);

	my %htmltidy_setting=(
		type => "string",
		description => "tidy command line",
		safe => 0, # path
		rebuild => undef,
	);

	return (
		plugin => \%plugin_info,
		htmltidy => \%htmltidy_setting,
	);
}

# checkconfig hook: supplies the default tidy command line when the
# "htmltidy" setting has not been defined. An existing value is never
# overwritten.
sub checkconfig () {
	return if defined $config{htmltidy};

	$config{htmltidy}="tidy -quiet -asxhtml -utf8 --show-body-only yes --show-warnings no --tidy-mark no --markup yes";
}

# sanitize hook: pipes a page's HTML through the external command
# configured in $config{htmltidy} and returns that command's output.
#
# Parameters (named, passed as a flat key/value list):
#   content - the HTML text to filter
#
# Returns:
#   - the content unchanged when $config{htmltidy} is not defined;
#   - the command's standard output otherwise;
#   - a translated error message when the command closed its input early
#     (SIGPIPE was raised while writing) or no output could be read.
#
# The command's stderr is discarded. open2() throws if the child cannot
# be started; that exception is not caught here.
sub sanitize (@) {
	my %params=@_;

	return $params{content} unless defined $config{htmltidy};

	# Record a SIGPIPE instead of letting it kill the process. "local"
	# restores whatever handler the surrounding program had installed
	# when this sub returns, rather than forcing the disposition back
	# to DEFAULT.
	my $sigpipe=0;
	local $SIG{PIPE}=sub { $sigpipe=1 };

	# Lexical handles (autovivified by open2) instead of the package-global
	# barewords IN/OUT, so nothing else in the package can collide with
	# them and they are released automatically on every exit path.
	my ($from_tidy, $to_tidy);
	my $pid=open2($from_tidy, $to_tidy, "$config{htmltidy} 2>/dev/null");

	# open2 doesn't respect "use open ':utf8'"
	binmode($from_tidy, ':utf8');
	binmode($to_tidy, ':utf8');

	# NOTE(review): all input is written before any output is read; if the
	# child produces more output than the pipe can buffer before it has
	# consumed its input, both sides could block -- confirm whether page
	# sizes make this a practical concern.
	print {$to_tidy} $params{content};
	close $to_tidy;

	# Slurp the whole output in one read.
	local $/ = undef;
	my $ret=<$from_tidy>;
	close $from_tidy;

	# Reap the child so it does not linger as a zombie.
	# NOTE(review): the exit status left in $? is not inspected, so a
	# command that exits with an error but writes nothing yields an empty
	# result rather than the failure message -- confirm this is intended.
	waitpid $pid, 0;

	if ($sigpipe || ! defined $ret) {
		return gettext("htmltidy failed to parse this html");
	}

	return $ret;
}

1