forked from github/kensanata.oddmuse
There were some files that did not offer "or (at your option) any later version" in their license and these had to be left alone. This should solve the incorrect FSF address issue #4 on GitHub.
80 lines
2.5 KiB
Perl
Executable File
80 lines
2.5 KiB
Perl
Executable File
#! /usr/bin/perl
|
|
# Copyright (C) 2004 Alex Schroeder <alex@emacswiki.org>
|
|
#
|
|
# This program is free software; you can redistribute it and/or modify
|
|
# it under the terms of the GNU General Public License as published by
|
|
# the Free Software Foundation; either version 3 of the License, or
|
|
# (at your option) any later version.
|
|
#
|
|
# This program is distributed in the hope that it will be useful,
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
# GNU General Public License for more details.
|
|
#
|
|
# You should have received a copy of the GNU General Public License
|
|
# along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
use CGI qw/:standard/;
|
|
use CGI::Carp qw(fatalsToBrowser);
|
|
use LWP::UserAgent;
|
|
use Encode;
|
|
|
|
# Without a "url" parameter there is nothing to translate: answer with a
# small HTML page holding the input form and stop.
unless (param('url')) {
    my $heading = 'PHP Wiki Search RSS 3.0';

    print header(-charset=>'utf-8');
    print start_html($heading);
    print h1($heading);
    print p('Translates a PHP Wiki Search result into RSS 3.0 usable by Oddmuse.');

    # The form is submitted with GET and carries two fields: the search URL
    # and the "latin-1" checkbox.
    print start_form(-method=>'GET');
    print p('Search URL: ', textfield('url', '', 40), checkbox('latin-1'), submit());
    print end_form();

    print end_html();
    exit;
}
|
|
|
|
# Everything printed from here on is the plain-text feed.
print header(-type=>'text/plain; charset=UTF-8');

# The URL to fetch. When the "latin-1" option is set it is rewritten so that
# it is sent as percent-escaped Latin-1 bytes.
my $url = param('url');
if (param('latin-1')) {
    # Resolve percent-escapes, then convert the UTF-8 text to Latin-1 bytes.
    $url =~ s/%([0-9a-f][0-9a-f])/chr(hex($1))/ige;
    $url = encode('latin-1', decode('utf-8', $url));
    # Percent-escape (uppercase hex) every character outside the safe set:
    # ASCII letters, digits and - _ . ! ~ * ' ( ) : / ? ; & =
    $url =~ s{([^a-zA-Z0-9\-_.!~*'():/?;&=])}{sprintf('%%%02X', ord($1))}ge;
}
|
|
|
|
# Fetch the search result page.
# The URL comes straight from the request, so the agent is limited to http
# and https; without this LWP would also accept schemes such as file:.
my $ua = LWP::UserAgent->new(protocols_allowed => ['http', 'https']);
my $request = HTTP::Request->new('GET', $url);
my $response = $ua->request($request);

# A failed fetch is logged but not fatal: whatever body came back is still
# handed on to the parsing code.
warn 'Fetching the search result failed: ' . $response->status_line . "\n"
    unless $response->is_success;

my $data = $response->content;
# With the "latin-1" option the page is treated as Latin-1 and converted,
# because the feed is sent as UTF-8.
$data = encode('utf-8', decode('latin-1', $data)) if param('latin-1');
|
|
|
|
# Print the feed: a head section (title, link, debug), a blank line, then one
# title/description pair per search hit, each followed by a blank line.

# Looked up once; the option cannot change while the hits are printed.
my $latin1 = param('latin-1');

# Feed title: the text of the page's <title>. The capture is only used when
# the match succeeded, and whitespace is collapsed so that a line break
# inside the title cannot split the field across lines.
if ($data =~ m{<title>([^<]*)}i) {
    my $feed_title = $1;
    $feed_title =~ s/\s+/ /g;
    $feed_title =~ s/^ | $//g;
    print "title: $feed_title\n" if length $feed_title;
}

# The link is the search URL as submitted. The parameter name must be the
# quoted string 'url': a bare url here is a call to the url() function that
# CGI exports, which looks up a parameter named after this script's own URL.
print "link: " . param('url') . "\n";
print "debug: $url\n"; # FIXME
print "\n";

# A hit is a <dt> line containing a link, followed by zero or more
# <dd>...</dd> lines that make up its description.
while ($data =~ m|<dt>.*?<a href="([^"]*)".*\n((?:<dd>.*</dd>\n)*)|g) {
    my ($title, $desc) = ($1, $2);

    # The item title is the link target with its percent-escapes resolved.
    $title =~ s/%([0-9a-f][0-9a-f])/chr(hex($1))/ige;
    $title = encode('utf-8', decode('latin-1', $title)) if $latin1;
    print "title: $title\n";

    # Remove the markup that wraps the description text.
    $desc =~ s|<dd>||g;
    $desc =~ s|<small[^>]*>||g;
    $desc =~ s|<strong[^>]*>||g;
    $desc =~ s|</strong>||g;
    $desc =~ s|</small>||g;
    $desc =~ s|</dd>||g;
    # Drop trailing newlines and indent the remaining lines with a tab so
    # they read as continuation lines of the description field.
    $desc =~ s|\n+$||g;
    $desc =~ s|\n|\n\t|g;
    print "description: $desc\n";
    print "\n";
}
|