forked from github/kensanata.oddmuse
83 lines
2.6 KiB
Perl
Executable File
83 lines
2.6 KiB
Perl
Executable File
#! /usr/bin/perl
|
|
# Copyright (C) 2004 Alex Schroeder <alex@emacswiki.org>
|
|
#
|
|
# This program is free software; you can redistribute it and/or modify
|
|
# it under the terms of the GNU General Public License as published by
|
|
# the Free Software Foundation; either version 2 of the License, or
|
|
# (at your option) any later version.
|
|
#
|
|
# This program is distributed in the hope that it will be useful,
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
# GNU General Public License for more details.
|
|
#
|
|
# You should have received a copy of the GNU General Public License
|
|
# along with this program; if not, write to the
|
|
# Free Software Foundation, Inc.
|
|
# 59 Temple Place, Suite 330
|
|
# Boston, MA 02111-1307 USA
|
|
|
|
use CGI qw/:standard/;
|
|
use CGI::Carp qw(fatalsToBrowser);
|
|
use LWP::UserAgent;
|
|
use Encode;
|
|
|
|
if (not param('url')) {
|
|
print header(-charset=>'utf-8'),
|
|
start_html('PHP Wiki Search RSS 3.0'),
|
|
h1('PHP Wiki Search RSS 3.0'),
|
|
p('Translates a PHP Wiki Search result into RSS 3.0 usable by Oddmuse.'),
|
|
start_form(-method=>'GET'),
|
|
p('Search URL: ', textfield('url', '', 40), checkbox('latin-1'), submit()),
|
|
end_form(),
|
|
end_html();
|
|
exit;
|
|
}
|
|
|
|
print header(-type=>'text/plain; charset=UTF-8');
|
|
|
|
my $url = param('url');
|
|
if (param('latin-1')) {
|
|
$url =~ s/%([0-9a-f][0-9a-f])/chr(hex($1))/ige;
|
|
$url = encode('latin-1', decode('utf-8', $url));
|
|
my @letters = split(//, $url);
|
|
my @safe = ('a' .. 'z', 'A' .. 'Z', '0' .. '9', '-', '_', '.', '!', '~', '*', "'", '(', ')',
|
|
':', '/', '?', ';', '&', '=');
|
|
foreach my $letter (@letters) {
|
|
my $pattern = quotemeta($letter);
|
|
if (not grep(/$pattern/, @safe)) {
|
|
$letter = uc(sprintf("%%%02x", ord($letter)));
|
|
}
|
|
}
|
|
$url = join('', @letters);
|
|
}
|
|
|
|
my $ua = new LWP::UserAgent;
|
|
my $request = HTTP::Request->new('GET', $url);
|
|
my $response = $ua->request($request);
|
|
my $data = $response->content;
|
|
$data = encode('utf-8', decode('latin-1', $data)) if param('latin-1');
|
|
|
|
$data =~ /\<title\>([^<]*)/i;
|
|
print "title: $1\n" if $1;
|
|
print "link: " . param(url) . "\n";
|
|
print "debug: $url\n"; # FIXME
|
|
print "\n";
|
|
while ($data =~ m|<dt>.*?<a href="([^"]*)".*\n((<dd>.*</dd>\n)*)|g) {
|
|
my ($title, $desc) = ($1, $2);
|
|
$title =~ s/%([0-9a-f][0-9a-f])/chr(hex($1))/ige;
|
|
$title = encode('utf-8', decode('latin-1', $title)) if param('latin-1');
|
|
print "title: $title\n";
|
|
$_ = $desc;
|
|
s|<dd>||g;
|
|
s|<small[^>]*>||g;
|
|
s|<strong[^>]*>||g;
|
|
s|</strong>||g;
|
|
s|</small>||g;
|
|
s|</dd>||g;
|
|
s|\n+$||g;
|
|
s|\n|\n\t|g;
|
|
print "description: $_\n";
|
|
print "\n";
|
|
}
|