[Pmwiki-users] rss-feed
Patrick R. Michaud
pmichaud
Fri Dec 31 11:45:48 CST 2004
On Fri, Dec 31, 2004 at 05:41:53PM +0100, Philipp H?gelmeyer wrote:
>
> I fixed the date format and some other stuff and now in validates
> (rss1.0 & rss2.0) and works in the news readers, that I use (sage &
> newsfire).
>
> I also started a table of character entities, feel free to complete it.
I've gone ahead and reworked rss.php to convert all of the named
character entities defined by XHTML. It's lengthy but it works.
In the process I'm also able to eliminate the RSS "<!DOCTYPE ...>",
so that feeds appear to now validate (at least they do according to
feedvalidator.org).
The new rss.php will be provided in the next beta release; I'm attaching
it to this email for anyone who wants to start using it immediately.
Pm
-------------- next part --------------
<?php if (!defined('PmWiki')) exit();
/* Copyright 2002-2004 Patrick R. Michaud (pmichaud at pobox.com)
This file is part of PmWiki; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published
by the Free Software Foundation; either version 2 of the License, or
(at your option) any later version. See pmwiki.php for full details.
This script defines "?action=rss". It will read the current page
for a WikiTrail, and then output an RSS 2.0 document with the current
page as the channel and the pages in the WikiTrail as the items.
To add RSS capabilities to your site, simply add to config.php:
include_once('scripts/rss.php');
To avoid the cost of loading this script and initializing RSS variables
when you aren't going to generate a feed, use this instead:
if ($action == 'rss' || $action == 'rdf')
include_once('scripts/rss.php');
*/
SDV($HandleActions['rss'],'HandleRss');
SDV($HandleActions['rdf'],'HandleRss');
SDV($RssMaxItems,20); # maximum items to display
SDV($RssSourceSize,400); # max size to build desc from
SDV($RssDescSize,200); # max desc size
SDV($RssItems,array()); # RSS item elements
SDV($RssItemsRDFList,array()); # RDF <items> elements
if ($action=='rdf') {
### RSS 1.0 (RDF) definitions
SDV($RssTimeFmt,'%Y-%m-%dT%H:%MZ'); # time format
SDV($RssItemsRDFListFmt,"<rdf:li rdf:resource=\"\$PageUrl\" />\n");
SDV($RssChannelFmt,array('<?xml version="1.0"?'.'>
<rdf:RDF xmlns="http://purl.org/rss/1.0/"
xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
xmlns:dc="http://purl.org/dc/elements/1.1/">
<channel rdf:about="$PageUrl">
<title>$WikiTitle - $Group.$Name</title>
<link>$PageUrl</link>
<description>$RssChannelDesc</description>
<dc:date>$RssChannelBuildDate</dc:date>
<items>
<rdf:Seq>',&$RssItemsRDFList,'
</rdf:Seq>
</items>
</channel>'));
SDV($RssItemFmt,'
<item rdf:about="$PageUrl">
<title>$WikiTitle - $Group.$Name</title>
<link>$PageUrl</link>
<description>$RssItemDesc</description>
<dc:date>$RssItemPubDate</dc:date>
</item>');
SDV($HandleRssFmt,array(&$RssChannelFmt,&$RssItems,'</rdf:RDF>'));
}
### RSS 2.0 definitions
SDV($RssTimeFmt,'%Y-%m-%dT%H:%MZ');
SDV($RssChannelFmt,'<?xml version="1.0"?'.'>
<rss version="2.0" xmlns:dc="http://purl.org/dc/elements/1.1/">
<channel>
<title>$WikiTitle - $Group.$Name</title>
<link>$PageUrl</link>
<description>$RssChannelDesc</description>
<lastBuildDate>$RssChannelBuildDate</lastBuildDate>
<generator>$Version</generator>');
SDV($RssItemFmt,'
<item>
<title>$FullName</title>
<link>$PageUrl</link>
<description>$RssItemDesc</description>
<dc:contributor>$RssItemAuthor</dc:contributor>
<dc:date>$RssItemPubDate</dc:date>
</item>');
SDV($HandleRssFmt,array(&$RssChannelFmt,&$RssItems,'</channel></rss>'));
function HandleRss($pagename) {
global $RssMaxItems,$RssSourceSize,$RssDescSize,
$RssChannelFmt,$RssChannelDesc,$RssTimeFmt,$RssChannelBuildDate,
$RssItemsRDFList,$RssItemsRDFListFmt,$RssItems,$RssItemFmt,
$HandleRssFmt,$FmtV;
$t = ReadTrail($pagename,$pagename);
$page = RetrieveAuthPage($pagename,'read',false);
if (!$page) Abort("?cannot read $pagename");
$cbgmt = $page['time'];
$r = array();
for($i=0;$i<count($t) && count($r)<$RssMaxItems;$i++) {
if (!PageExists($t[$i]['pagename'])) continue;
$page = RetrieveAuthPage($t[$i]['pagename'],'read',false); Lock(0);
if (!$page) continue;
$text =
MarkupToHTML($t[$i]['pagename'],substr($page['text'],0,$RssSourceSize));
$text = entityencode(preg_replace("/<.*?>/s","",$text));
preg_match("/^(.{0,$RssDescSize}\\s)/s",$text,$match);
$r[] = array('name' => $t[$i]['pagename'],'time' => $page['time'],
'desc' => $match[1]." ...", 'author' => $page['author']);
if ($page['time']>$cbgmt) $cbgmt=$page['time'];
}
SDV($RssChannelBuildDate,
entityencode(gmdate('D, d M Y H:i:s \G\M\T', $cbgmt)));
SDV($RssChannelDesc,entityencode(FmtPageName('$Group.$Title',$pagename)));
foreach($r as $page) {
$FmtV['$RssItemPubDate'] = gmstrftime($RssTimeFmt,$page['time']);
$FmtV['$RssItemDesc'] = $page['desc'];
$FmtV['$RssItemAuthor'] = $page['author'];
$RssItemsRDFList[] =
entityencode(FmtPageName($RssItemsRDFListFmt,$page['name']));
$RssItems[] =
entityencode(FmtPageName($RssItemFmt,$page['name']));
}
header("Content-type: text/xml");
PrintFmt($pagename,$HandleRssFmt);
exit();
}
# entityencode() and $EntitiesTable are used to convert non-ASCII characters
# and named entities into numeric entities, since the RSS and RDF
# specifications don't have a good way of incorporating them by default.
function entityencode($s) {
global $EntitiesTable;
$s = str_replace(array_keys($EntitiesTable),array_values($EntitiesTable),$s);
return preg_replace('/([\\x80-\\xff])/e',"'&#'.ord('\$1').';'",$s);
}
SDVA($EntitiesTable, array(
# entities defined in "http://www.w3.org/TR/xhtml1/DTD/xhtml-lat1.ent"
' ' => ' ',
'¡' => '¡',
'¢' => '¢',
'£' => '£',
'¤' => '¤',
'¥' => '¥',
'¦' => '¦',
'§' => '§',
'¨' => '¨',
'©' => '©',
'ª' => 'ª',
'«' => '«',
'¬' => '¬',
'­' => '­',
'®' => '®',
'¯' => '¯',
'°' => '°',
'±' => '±',
'²' => '²',
'³' => '³',
'´' => '´',
'µ' => 'µ',
'¶' => '¶',
'·' => '·',
'¸' => '¸',
'¹' => '¹',
'º' => 'º',
'»' => '»',
'¼' => '¼',
'½' => '½',
'¾' => '¾',
'¿' => '¿',
'À' => 'À',
'Á' => 'Á',
'Â' => 'Â',
'Ã' => 'Ã',
'Ä' => 'Ä',
'Å' => 'Å',
'Æ' => 'Æ',
'Ç' => 'Ç',
'È' => 'È',
'É' => 'É',
'Ê' => 'Ê',
'Ë' => 'Ë',
'Ì' => 'Ì',
'Í' => 'Í',
'Î' => 'Î',
'Ï' => 'Ï',
'Ð' => 'Ð',
'Ñ' => 'Ñ',
'Ò' => 'Ò',
'Ó' => 'Ó',
'Ô' => 'Ô',
'Õ' => 'Õ',
'Ö' => 'Ö',
'×' => '×',
'Ø' => 'Ø',
'Ù' => 'Ù',
'Ú' => 'Ú',
'Û' => 'Û',
'Ü' => 'Ü',
'Ý' => 'Ý',
'Þ' => 'Þ',
'ß' => 'ß',
'à' => 'à',
'á' => 'á',
'â' => 'â',
'ã' => 'ã',
'ä' => 'ä',
'å' => 'å',
'æ' => 'æ',
'ç' => 'ç',
'è' => 'è',
'é' => 'é',
'ê' => 'ê',
'ë' => 'ë',
'ì' => 'ì',
'í' => 'í',
'î' => 'î',
'ï' => 'ï',
'ð' => 'ð',
'ñ' => 'ñ',
'ò' => 'ò',
'ó' => 'ó',
'ô' => 'ô',
'õ' => 'õ',
'ö' => 'ö',
'÷' => '÷',
'ø' => 'ø',
'ù' => 'ù',
'ú' => 'ú',
'û' => 'û',
'ü' => 'ü',
'ý' => 'ý',
'þ' => 'þ',
'ÿ' => 'ÿ',
# entities defined in "http://www.w3.org/TR/xhtml1/DTD/xhtml-special.ent"
'"' => '"',
#'&' => '&#38;',
#'<' => '&#60;',
#'>' => '>',
''' => ''',
'Œ' => 'Œ',
'œ' => 'œ',
'Š' => 'Š',
'š' => 'š',
'Ÿ' => 'Ÿ',
'ˆ' => 'ˆ',
'˜' => '˜',
' ' => ' ',
' ' => ' ',
' ' => ' ',
'‌' => '‌',
'‍' => '‍',
'‎' => '‎',
'‏' => '‏',
'–' => '–',
'—' => '—',
'‘' => '‘',
'’' => '’',
'‚' => '‚',
'“' => '“',
'”' => '”',
'„' => '„',
'†' => '†',
'‡' => '‡',
'‰' => '‰',
'‹' => '‹',
'›' => '›',
'€' => '€',
# entities defined in "http://www.w3.org/TR/xhtml1/DTD/xhtml-symbol.ent"
'ƒ' => 'ƒ',
'Α' => 'Α',
'Β' => 'Β',
'Γ' => 'Γ',
'Δ' => 'Δ',
'Ε' => 'Ε',
'Ζ' => 'Ζ',
'Η' => 'Η',
'Θ' => 'Θ',
'Ι' => 'Ι',
'Κ' => 'Κ',
'Λ' => 'Λ',
'Μ' => 'Μ',
'Ν' => 'Ν',
'Ξ' => 'Ξ',
'Ο' => 'Ο',
'Π' => 'Π',
'Ρ' => 'Ρ',
'Σ' => 'Σ',
'Τ' => 'Τ',
'Υ' => 'Υ',
'Φ' => 'Φ',
'Χ' => 'Χ',
'Ψ' => 'Ψ',
'Ω' => 'Ω',
'α' => 'α',
'β' => 'β',
'γ' => 'γ',
'δ' => 'δ',
'ε' => 'ε',
'ζ' => 'ζ',
'η' => 'η',
'θ' => 'θ',
'ι' => 'ι',
'κ' => 'κ',
'λ' => 'λ',
'μ' => 'μ',
'ν' => 'ν',
'ξ' => 'ξ',
'ο' => 'ο',
'π' => 'π',
'ρ' => 'ρ',
'ς' => 'ς',
'σ' => 'σ',
'τ' => 'τ',
'υ' => 'υ',
'φ' => 'φ',
'χ' => 'χ',
'ψ' => 'ψ',
'ω' => 'ω',
'ϑ' => 'ϑ',
'ϒ' => 'ϒ',
'ϖ' => 'ϖ',
'•' => '•',
'…' => '…',
'′' => '′',
'″' => '″',
'‾' => '‾',
'⁄' => '⁄',
'℘' => '℘',
'ℑ' => 'ℑ',
'ℜ' => 'ℜ',
'™' => '™',
'ℵ' => 'ℵ',
'←' => '←',
'↑' => '↑',
'→' => '→',
'↓' => '↓',
'↔' => '↔',
'↵' => '↵',
'⇐' => '⇐',
'⇑' => '⇑',
'⇒' => '⇒',
'⇓' => '⇓',
'⇔' => '⇔',
'∀' => '∀',
'∂' => '∂',
'∃' => '∃',
'∅' => '∅',
'∇' => '∇',
'∈' => '∈',
'∉' => '∉',
'∋' => '∋',
'∏' => '∏',
'∑' => '∑',
'−' => '−',
'∗' => '∗',
'√' => '√',
'∝' => '∝',
'∞' => '∞',
'∠' => '∠',
'∧' => '∧',
'∨' => '∨',
'∩' => '∩',
'∪' => '∪',
'∫' => '∫',
'∴' => '∴',
'∼' => '∼',
'≅' => '≅',
'≈' => '≈',
'≠' => '≠',
'≡' => '≡',
'≤' => '≤',
'≥' => '≥',
'⊂' => '⊂',
'⊃' => '⊃',
'⊄' => '⊄',
'⊆' => '⊆',
'⊇' => '⊇',
'⊕' => '⊕',
'⊗' => '⊗',
'⊥' => '⊥',
'⋅' => '⋅',
'⌈' => '⌈',
'⌉' => '⌉',
'⌊' => '⌊',
'⌋' => '⌋',
'⟨' => '〈',
'⟩' => '〉',
'◊' => '◊',
'♠' => '♠',
'♣' => '♣',
'♥' => '♥',
'♦' => '♦'));
?>
More information about the pmwiki-users
mailing list