- Rewrote the headline module from scratch. Note that the old headline code is still in place until the new code has proven to be stable. See "syndication.module" for the new code. Changes: + Improved the parser and tested it against RSS 0.9, RSS 0.91, RSS 0.92, RSS 1.0, RDF and XML feeds. + Improved the administration interface. It might be a bit fuzzy at first. Maybe some native English speakers like Julian, Michael (or anyone else with knowledge in the field) can help out by suggesting better naming, terminology or descriptions - as well as by writing the help section for this module? I'd have no idea how much this would be appreciated. + We can *easily* recognize new tags or extensions: we parse out "link", "title", "description" and "author" right now, but we will have to revise which tags to support and which not. New tags can be added in less than 10 minutes (if you are familiar with the code). Read: we have something we can build on. + Within each item, tags can now appear in random order, which was not the case with the old headline code where we expected <link>s prior to <description>s, for example. + Feed updates only (i.e. always) happen through cron. Neither do we use one global cron for updating all feeds; instead, every feed can specify its own update-interval. + Newly fetched headlines are "appended" to the pool of existing headlines (read: we don't replace the whole feed), and headlines automatically "expire" after x days or hours. (Every headline has a timestamp.) + Got rid of backend.class; it is integrated in the module. + Switched to more generic names: "headline" became "item" and "backend" became "feed". This should ease future non-headline oriented syndication. + You can associate attributes or keyword lists with every feed. At the moment new items will automatically inherit their feed's attributes but in future we can use heuristics to make these attributes "mutate" when and where we see fit. The attributes can be maintained by hand as well. 
+ We don't export any blocks yet; we will do so as soon as this new code has been tested a bit more. We will only export bundles though, so if you want to export by feed/source, you will have to make a source-specific bundle. - Polished a few other modules a bit: nothing major.
2001-05-26 18:26:56 +00:00
2005-08-11 13:02:08 +00:00
// $Id$
* @file
* Used to aggregate syndicated content (RSS and RDF).
* Implementation of hook_help().
/**
 * Returns help text for the aggregator module, selected by $section.
 *
 * @param $section
 *   The help section identifier; it is matched against the case labels below.
 * @return
 *   An HTML string built with t() for the matching section.
 *
 * NOTE(review): no closing braces are visible for this function, and the
 * list items in the 'admin/help#aggregator' text have no enclosing list
 * element. Lines appear to have been lost in extraction; confirm against
 * version control before relying on this block.
 */
function aggregator_help($section) {
switch ($section) {
// Main help page: assembled from several t() fragments. Internal links are
// supplied through url() placeholders rather than hard-coded paths.
case 'admin/help#aggregator':
$output = '<p>'. t('The news aggregator is a powerful on-site RSS syndicator/news reader that can gather fresh content from news sites and weblogs around the web.') .'</p>';
$output .= '<p>'. t('Users can view the latest news chronologically in the <a href="%aggregator">main news aggregator display</a> or by <a href="%aggregator-sources">source</a>. Administrators can add, edit and delete feeds and choose how often to check for newly updated news for each individual feed. Administrators can also tag individual feeds with categories, offering selective grouping of some feeds into separate displays. Listings of the latest news for individual sources or categorized sources can be enabled as blocks for display in the sidebar through the <a href="%admin-block">block administration page</a>. The news aggregator requires cron to check for the latest news from the sites to which you have subscribed. Drupal also provides a <a href="%aggregator-opml">machine-readable OPML file</a> of all of your subscribed feeds.', array('%aggregator' => url('aggregator'), '%aggregator-sources' => url('aggregator/sources'), '%admin-block' => url('admin/block'), '%aggregator-opml' => url('aggregator/opml'))) .'</p>';
// Task list linking to the administration pages. The whole multi-line
// literal is a single t() string, so nothing may be inserted inside it.
$output .= t('<p>You can</p>
<li>administer your list of news feeds <a href="%admin-aggregator">administer &gt;&gt; aggregator</a>.</li>
<li>add a new feed <a href="%admin-aggregator-add-feed">administer &gt;&gt; aggregator &gt;&gt; add feed</a>.</li>
<li>add a new category <a href="%admin-aggregator-add-category">administer &gt;&gt; aggregator &gt;&gt; add category</a>.</li>
<li>configure global settings for the news aggregator <a href="%admin-settings-aggregator">administer &gt;&gt; settings &gt;&gt; aggregator</a>.</li>
<li>control access to the aggregator module through access permissions <a href="%admin-access">administer &gt;&gt; access control &gt;&gt; permissions</a>.</li>
<li>set permissions to access new feeds for user roles such as anonymous users at <a href="%admin-access">administer &gt;&gt; access control</a>.</li>
<li>view the <a href="%aggregator">aggregator page</a>.</li>
', array('%admin-aggregator' => url('admin/aggregator'), '%admin-aggregator-add-feed' => url('admin/aggregator/add/feed'), '%admin-aggregator-add-category' => url('admin/aggregator/add/category'), '%admin-settings-aggregator' => url('admin/settings/aggregator'), '%admin-access' => url('admin/access'), '%aggregator' => url('aggregator')));
// Pointer to the external handbook page; here %aggregator is an absolute URL
// and is not passed through url().
$output .= '<p>'. t('For more information please read the configuration and customization handbook <a href="%aggregator">Aggregator page</a>.', array('%aggregator' => 'http://www.drupal.org/handbook/modules/aggregator/')) .'</p>';
return $output;
// Short one-line description of the module.
case 'admin/modules#description':
return t('Aggregates syndicated content (RSS and RDF feeds).');
// Introductory text for the aggregator administration overview.
case 'admin/aggregator':
return t('<p>Thousands of sites (particularly news sites and weblogs) publish their latest headlines and/or stories in a machine-readable format so that other sites can easily link to them. This content is usually in the form of an <a href="http://blogs.law.harvard.edu/tech/rss">RSS</a> feed (which is an XML-based syndication standard). To display the feed or category in a block you must decide how many items to show by editing the feed or block and turning on the <a href="%block">feed\'s block</a>.</p>', array('%block' => url('admin/block')));
// Help shown on the "add feed" form.
case 'admin/aggregator/add/feed':
return t('<p>Add a site that has an RSS/RDF feed. The URL is the full path to the RSS feed file. For the feed to update automatically you must run "cron.php" on a regular basis. If you already have a feed with the URL you are planning to use, the system will not accept another feed with the same URL.</p>');
// Help shown on the "add category" form.
case 'admin/aggregator/add/category':
return t('<p>Categories provide a way to group items from different news feeds together. Each news category has its own feed page and block. For example, you could tag various sport-related feeds as belonging to a category called <em>Sports</em>. News items can be added to a category automatically by setting a feed to automatically place its item into that category, or by using the categorize items link in any listing of news items.</p>');
2001-05-26 18:26:56 +00:00
/**
 * Builds the settings form for the aggregator module.
 *
 * Every element takes its default from variable_get() using the same name as
 * its form key, so the form keys double as the stored variable names.
 *
 * @return
 *   A form array with four elements: the allowed HTML tags (textfield), the
 *   number of items on summary pages (select), the age after which items are
 *   discarded (select) and the category selection widget type (radios).
 */
function aggregator_settings() {
  // Item-count choices: 0 is labelled "none"; the other counts are labelled
  // through _aggregator_items().
  $items = array(0 => t('none')) + drupal_map_assoc(array(3, 5, 10, 15, 20, 25), '_aggregator_items');
  // Age choices, labelled through format_interval().
  // NOTE(review): the values look like seconds (3600 .. 9676800) — confirm.
  $period = drupal_map_assoc(array(3600, 10800, 21600, 32400, 43200, 86400, 172800, 259200, 604800, 1209600, 2419200, 4838400, 9676800), 'format_interval');

  $form = array();

  $form['aggregator_allowed_html_tags'] = array(
    '#type' => 'textfield', '#title' => t('Allowed HTML tags'), '#size' => 80, '#maxlength' => 255,
    '#default_value' => variable_get('aggregator_allowed_html_tags', '<a> <b> <br> <dd> <dl> <dt> <em> <i> <li> <ol> <p> <strong> <u> <ul>'),
    '#description' => t('The list of tags which are allowed in feeds, i.e., which will not be removed by Drupal.')
  );

  $form['aggregator_summary_items'] = array(
    '#type' => 'select', '#title' => t('Items shown in sources and categories pages') ,
    '#default_value' => variable_get('aggregator_summary_items', 3), '#options' => $items,
    '#description' => t('The number of items which will be shown with each feed or category in the feed and category summary pages.')
  );

  $form['aggregator_clear'] = array(
    '#type' => 'select', '#title' => t('Discard news items older than'),
    '#default_value' => variable_get('aggregator_clear', 9676800), '#options' => $period,
    '#description' => t('Older news items will be automatically discarded. Requires crontab.')
  );

  $form['aggregator_category_selector'] = array(
    '#type' => 'radios', '#title' => t('Category selection type'), '#default_value' => variable_get('aggregator_category_selector', 'check'),
    '#options' => array('check' => t('checkboxes'), 'select' => t('multiple selector')),
    '#description' => t('The type of category selection widget which is shown on categorization pages. Checkboxes are easier to use; a multiple selector is good for working with large numbers of categories.')
  );

  return $form;
}
/**
 * Helper function for drupal_map_assoc().
 *
 * Used by aggregator_settings() to label the item-count options.
 *
 * @param $count
 *   The number of items to describe.
 * @return
 *   The result of format_plural() for $count, using '1 item' as the singular
 *   form and '%count items' as the plural form.
 */
function _aggregator_items($count) {
  return format_plural($count, '1 item', '%count items');
}
/**
 * Implementation of hook_perm().
 *
 * @return
 *   The permission names defined by this module. aggregator_menu() checks
 *   both of them with user_access().
 */
function aggregator_perm() {
  return array('administer news feeds', 'access news feeds');
}
* Implementation of hook_menu().
/**
 * Builds the menu items for the aggregator module.
 *
 * @param $may_cache
 *   When true, the fixed administration and public paths are returned. When
 *   false, per-feed or per-category items are built for the current request
 *   path, based on arg(0), arg(1) and arg(2).
 * @return
 *   An array of menu item definitions.
 *
 * NOTE(review): closing braces are not visible, and the 'aggregator/categories'
 * item (after its 'access' entry) ends on a trailing comma with no closing
 * parenthesis. Lines appear to have been lost in extraction; confirm against
 * version control.
 */
function aggregator_menu($may_cache) {
$items = array();
// Resolve both permissions once; they are reused as the 'access' value of
// every item below.
$edit = user_access('administer news feeds');
$view = user_access('access news feeds');
if ($may_cache) {
// Administration pages (all require the 'administer news feeds' permission).
$items[] = array('path' => 'admin/aggregator', 'title' => t('aggregator'),
'callback' => 'aggregator_admin_overview', 'access' => $edit);
$items[] = array('path' => 'admin/aggregator/edit/feed', 'title' => t('edit feed'),
'callback' => 'aggregator_admin_edit_feed', 'access' => $edit,
'type' => MENU_CALLBACK);
$items[] = array('path' => 'admin/aggregator/edit/category', 'title' => t('edit category'),
'callback' => 'aggregator_admin_edit_category', 'access' => $edit,
'type' => MENU_CALLBACK);
$items[] = array('path' => 'admin/aggregator/remove', 'title' => t('remove items'),
'callback' => 'aggregator_admin_remove_feed', 'access' => $edit,
'type' => MENU_CALLBACK);
$items[] = array('path' => 'admin/aggregator/update', 'title' => t('update items'),
'callback' => 'aggregator_admin_refresh_feed', 'access' => $edit,
'type' => MENU_CALLBACK);
$items[] = array('path' => 'admin/aggregator/list', 'title' => t('list'),
'type' => MENU_DEFAULT_LOCAL_TASK, 'weight' => -10);
// The "add" tabs reuse the same callbacks as the matching "edit" paths.
$items[] = array('path' => 'admin/aggregator/add/feed', 'title' => t('add feed'),
'callback' => 'aggregator_admin_edit_feed', 'access' => $edit,
'type' => MENU_LOCAL_TASK);
$items[] = array('path' => 'admin/aggregator/add/category', 'title' => t('add category'),
'callback' => 'aggregator_admin_edit_category', 'access' => $edit,
'type' => MENU_LOCAL_TASK);
// Public pages (all require the 'access news feeds' permission).
$items[] = array('path' => 'aggregator', 'title' => t('news aggregator'),
'callback' => 'aggregator_page_last', 'access' => $view,
'weight' => 5);
$items[] = array('path' => 'aggregator/sources', 'title' => t('sources'),
'callback' => 'aggregator_page_sources', 'access' => $view);
$items[] = array('path' => 'aggregator/categories', 'title' => t('categories'),
'callback' => 'aggregator_page_categories', 'access' => $view,
$items[] = array('path' => 'aggregator/rss', 'title' => t('RSS feed'),
'callback' => 'aggregator_page_rss', 'access' => $view,
'type' => MENU_CALLBACK);
$items[] = array('path' => 'aggregator/opml', 'title' => t('OPML feed'),
'callback' => 'aggregator_page_opml', 'access' => $view,
'type' => MENU_CALLBACK);
else {
// Dynamic items: only built for aggregator/<section>/<numeric id> paths.
if (arg(0) == 'aggregator' && is_numeric(arg(2))) {
if (arg(1) == 'sources') {
// Items are only added when the feed id exists in {aggregator_feed}.
$feed = db_fetch_object(db_query('SELECT title, fid FROM {aggregator_feed} WHERE fid = %d', arg(2)));
if ($feed) {
$items[] = array('path' => 'aggregator/sources/'. $feed->fid, 'title' => $feed->title,
'callback' => 'aggregator_page_source', 'access' => $view);
$items[] = array('path' => 'aggregator/sources/'. $feed->fid .'/view', 'title' => t('view'),
'type' => MENU_DEFAULT_LOCAL_TASK, 'weight' => -10);
// The "categorize" and "configure" tabs require the administer permission.
$items[] = array('path' => 'aggregator/sources/'. $feed->fid .'/categorize', 'title' => t('categorize'),
'callback' => 'aggregator_page_source', 'access' => $edit,
'type' => MENU_LOCAL_TASK);
$items[] = array('path' => 'aggregator/sources/'. $feed->fid .'/configure', 'title' => t('configure'),
'callback' => 'aggregator_edit', 'access' => $edit,
'type' => MENU_LOCAL_TASK,
'weight' => 1);
else if (arg(1) == 'categories') {
// Same set of items as for a feed, keyed by category id.
$category = db_fetch_object(db_query('SELECT title, cid FROM {aggregator_category} WHERE cid = %d', arg(2)));
if ($category) {
$items[] = array('path' => 'aggregator/categories/'. $category->cid, 'title' => $category->title,
'callback' => 'aggregator_page_category', 'access' => $view);
$items[] = array('path' => 'aggregator/categories/'. $category->cid .'/view', 'title' => t('view'),
'type' => MENU_DEFAULT_LOCAL_TASK, 'weight' => -10);
$items[] = array('path' => 'aggregator/categories/'. $category->cid .'/categorize', 'title' => t('categorize'),
'callback' => 'aggregator_page_category', 'access' => $edit,
'type' => MENU_LOCAL_TASK);
$items[] = array('path' => 'aggregator/categories/'. $category->cid .'/configure', 'title' => t('configure'),
'callback' => 'aggregator_edit', 'access' => $edit,
'type' => MENU_LOCAL_TASK,
'weight' => 1);
return $items;
2001-05-26 18:26:56 +00:00
* Implementation of hook_cron().
* Checks news feeds for updates once their refresh interval has elapsed.
/**
 * Cron hook: walks over the feeds that are due for a check.
 *
 * NOTE(review): the body of the while loop and all closing braces are not
 * visible here. The loop presumably hands each row to aggregator_refresh(),
 * which takes a feed array — confirm against version control.
 */
function aggregator_cron() {
// Select every feed whose last check time plus its refresh interval lies
// before the current time.
$result = db_query('SELECT * FROM {aggregator_feed} WHERE checked + refresh < %d', time());
// Rows are fetched as arrays, not objects.
while ($feed = db_fetch_array($result)) {
* Implementation of hook_block().
* Generates blocks for the latest news items in each category and feed.
2005-03-02 08:13:15 +00:00
/**
 * Block hook: lists, configures, saves and renders "latest items" blocks.
 *
 * Block deltas have the form "category-<cid>" or "feed-<fid>"; they are
 * created in the 'list' branch and split on '-' in the other branches.
 *
 * @param $op
 *   One of 'list', 'configure', 'save' or 'view'.
 * @param $delta
 *   The block identifier (see above).
 * @param $edit
 *   Submitted values; only $edit['block'] is read, in the 'save' branch.
 * @return
 *   The $form array for 'configure'; otherwise the $block array built by the
 *   matching branch.
 *
 * NOTE(review): closing braces and any `break;` statements of the inner
 * switch are not visible, so the exact nesting of the trailing statements
 * cannot be confirmed from this view.
 */
function aggregator_block($op, $delta = 0, $edit = array()) {
// Nothing is done at all for users without the view permission.
if (user_access('access news feeds')) {
if ($op == 'list') {
// One block per category, then one per feed.
$result = db_query('SELECT cid, title FROM {aggregator_category} ORDER BY title');
while ($category = db_fetch_object($result)) {
$block['category-'. $category->cid]['info'] = t('%title category latest items', array('%title' => theme('placeholder', $category->title)));
$result = db_query('SELECT fid, title FROM {aggregator_feed} ORDER BY fid');
while ($feed = db_fetch_object($result)) {
$block['feed-'. $feed->fid]['info'] = t('%title feed latest items', array('%title' => theme('placeholder', $feed->title)));
else if ($op == 'configure') {
list($type, $id) = explode('-', $delta);
// The current item count is stored in the "block" column of the category
// or feed row.
if ($type == 'category') {
$value = db_result(db_query('SELECT block FROM {aggregator_category} WHERE cid = %d', $id));
else {
$value = db_result(db_query('SELECT block FROM {aggregator_feed} WHERE fid = %d', $id));
$form['block'] = array('#type' => 'select', '#title' => t('Number of news items in block'), '#default_value' => $value, '#options' => drupal_map_assoc(array(2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20)));
return $form;
else if ($op == 'save') {
list($type, $id) = explode('-', $delta);
// Write the chosen item count back to the same "block" column.
if ($type == 'category') {
$value = db_query('UPDATE {aggregator_category} SET block = %d WHERE cid = %d', $edit['block'], $id);
else {
$value = db_query('UPDATE {aggregator_feed} SET block = %d WHERE fid = %d', $edit['block'], $id);
else if ($op == 'view') {
list($type, $id) = explode('-', $delta);
switch ($type) {
case 'feed':
if ($feed = db_fetch_object(db_query('SELECT fid, title, block FROM {aggregator_feed} WHERE fid = %d', $id))) {
$block['subject'] = check_plain($feed->title);
// Newest items first, limited to the configured item count.
$result = db_query_range('SELECT * FROM {aggregator_item} WHERE fid = %d ORDER BY timestamp DESC, iid DESC', $feed->fid, 0, $feed->block);
// Only the "more" link is stored here; the item list is prepended below.
$block['content'] = '<div class="more-link">'. l(t('more'), 'aggregator/sources/'. $feed->fid, array('title' => t('View this feed\'s recent news.'))) .'</div>';
case 'category':
if ($category = db_fetch_object(db_query('SELECT cid, title, block FROM {aggregator_category} WHERE cid = %d', $id))) {
$block['subject'] = check_plain($category->title);
$result = db_query_range('SELECT i.* FROM {aggregator_category_item} ci LEFT JOIN {aggregator_item} i ON ci.iid = i.iid WHERE ci.cid = %d ORDER BY i.timestamp DESC, i.iid DESC', $category->cid, 0, $category->block);
$block['content'] = '<div class="more-link">'. l(t('more'), 'aggregator/categories/'. $category->cid, array('title' => t('View this category\'s recent news.'))) .'</div>';
// Theme every fetched item and put the resulting list in front of the
// "more" link.
$items = array();
while ($item = db_fetch_object($result)) {
$items[] = theme('aggregator_block_item', $item);
$block['content'] = theme('item_list', $items) . $block['content'];
return $block;
/**
 * Removes all stored news items of a feed and resets its check state.
 *
 * @param $feed
 *   A feed array; 'fid' and 'title' are read.
 */
function aggregator_remove($feed) {
  // Collect the item ids first so that their category assignments can be
  // deleted before the items themselves.
  $iids = array();
  $result = db_query('SELECT iid FROM {aggregator_item} WHERE fid = %d', $feed['fid']);
  while ($item = db_fetch_object($result)) {
    $iids[] = (int)$item->iid;
  }

  // An empty list would produce invalid SQL, so skip the query for a feed
  // without items.
  if ($iids) {
    db_query('DELETE FROM {aggregator_category_item} WHERE iid IN ('. implode(', ', $iids) .')');
  }

  db_query('DELETE FROM {aggregator_item} WHERE fid = %d', $feed['fid']);
  // Clearing checked, etag and modified drops the values that
  // aggregator_refresh() uses to build its conditional GET headers.
  db_query("UPDATE {aggregator_feed} SET checked = 0, etag = '', modified = 0 WHERE fid = %d", $feed['fid']);
  drupal_set_message(t('The news items from %site have been removed.', array('%site' => theme('placeholder', $feed['title']))));
}
* Call-back function used by the XML parser.
/**
 * Start-element handler registered with the XML parser in
 * aggregator_parse_feed().
 *
 * Tracks the parsing context in globals: $element (the enclosing section),
 * $item (index into $items) and $tag (the most recently opened tag).
 *
 * @param $parser
 *   The XML parser resource (not used in the visible code).
 * @param $name
 *   The element name; compared against upper-case labels.
 * @param $attributes
 *   The element attributes; 'REL' and 'HREF' are read for LINK elements.
 *
 * NOTE(review): `break;` statements and closing braces are not visible, so
 * it cannot be told from this view whether the 'ID' case falls through into
 * 'LINK'. Confirm against version control before restructuring.
 */
function aggregator_element_start($parser, $name, $attributes) {
global $item, $element, $tag, $items, $channel;
switch ($name) {
// These elements become the current context as-is.
case 'IMAGE':
case 'CONTENT':
case 'SUMMARY':
case 'TAGLINE':
case 'SUBTITLE':
case 'LOGO':
case 'INFO':
$element = $name;
// An ID only becomes the context when it is not inside an item.
case 'ID':
if ($element != 'ITEM') {
$element = $name;
// A LINK whose REL attribute is 'alternate' carries its URL in HREF; it is
// stored on the current item or, outside an item, on the channel.
// NOTE(review): 'REL' and 'HREF' are read without an isset() check.
case 'LINK':
if ($attributes['REL'] == 'alternate') {
if ($element == 'ITEM') {
$items[$item]['LINK'] = $attributes['HREF'];
else {
$channel['LINK'] = $attributes['HREF'];
// ITEM and ENTRY both open a new item: the context becomes 'ITEM' and the
// item index advances.
case 'ITEM':
$element = $name;
$item += 1;
case 'ENTRY':
$element = 'ITEM';
$item += 1;
// Remember the tag name; aggregator_element_data() uses it as array key.
$tag = $name;
/**
 * Call-back function used by the XML parser (end-element handler).
 *
 * Clears the global parsing context $element when a context-defining
 * element is closed.
 *
 * @param $parser
 *   The XML parser resource (unused).
 * @param $name
 *   The name of the element being closed.
 */
function aggregator_element_end($parser, $name) {
  global $element;

  switch ($name) {
    case 'IMAGE':
    case 'ITEM':
    case 'ENTRY':
    case 'CONTENT':
    case 'INFO':
      $element = '';
      break;
    case 'ID':
      // A closing ID only resets the context it opened itself; an ID nested
      // in an item must leave the 'ITEM' context in place.
      if ($element == 'ID') {
        $element = '';
      }
      break;
  }
}
* Call-back function used by the XML parser.
/**
 * Character-data handler registered with the XML parser in
 * aggregator_parse_feed().
 *
 * Appends $data to one of the globals $items, $image or $channel, chosen by
 * the current context $element and the current tag $tag.
 *
 * @param $parser
 *   The XML parser resource (not used in the visible code).
 * @param $data
 *   A chunk of character data. Every branch appends with `.=`, so the
 *   handler accumulates text across repeated calls.
 *
 * NOTE(review): `break;` statements, closing braces and apparently a case
 * label in front of the final `$channel[$tag] .= $data;` are not visible.
 * That statement sits right after a comment saying INFO/ID content must NOT
 * be stored, so it presumably belongs to a separate default branch — confirm
 * against version control.
 */
function aggregator_element_data($parser, $data) {
global $channel, $element, $items, $item, $image, $tag;
switch ($element) {
// Inside an item: store under the current tag name.
case 'ITEM':
$items[$item][$tag] .= $data;
// Inside an image or logo: collect into $image under the current tag name.
case 'IMAGE':
case 'LOGO':
$image[$tag] .= $data;
case 'LINK':
if ($data) {
$items[$item][$tag] .= $data;
// CONTENT and SUMMARY are stored under fixed keys instead of $tag.
case 'CONTENT':
$items[$item]['CONTENT'] .= $data;
case 'SUMMARY':
$items[$item]['SUMMARY'] .= $data;
// TAGLINE and SUBTITLE are both stored as the channel description.
case 'TAGLINE':
case 'SUBTITLE':
$channel['DESCRIPTION'] .= $data;
case 'INFO':
case 'ID':
// The sub-element is not supported. However, we must recognize
// it or its contents will end up in the item array.
$channel[$tag] .= $data;
* Checks a news feed for new items.
/**
 * Fetches one feed over HTTP and, when the response carries content, parses
 * it and updates the stored feed row.
 *
 * @param $feed
 *   A feed array; 'etag', 'modified', 'url', 'fid' and 'title' are read.
 *
 * NOTE(review): closing braces, `break;` statements and possibly further
 * statements (some bare "** ..." comment remnants have no code after them)
 * are not visible. The nesting of the switch branches therefore cannot be
 * confirmed from this view.
 */
function aggregator_refresh($feed) {
// Filled by the XML handlers while aggregator_parse_feed() runs.
global $channel, $image;
// Generate conditional GET headers.
$headers = array();
if ($feed['etag']) {
$headers['If-None-Match'] = $feed['etag'];
if ($feed['modified']) {
$headers['If-Modified-Since'] = gmdate('D, d M Y H:i:s', $feed['modified']) .' GMT';
// Request feed.
$result = drupal_http_request($feed['url'], $headers);
// Process HTTP response code.
switch ($result->code) {
// 304: only the check time is recorded.
case 304:
db_query('UPDATE {aggregator_feed} SET checked = %d WHERE fid = %d', time(), $feed['fid']);
drupal_set_message(t('There is no new syndicated content from %site.', array('%site' => theme('placeholder', $feed['title']))));
// 301: adopt the new URL; it is written back by the UPDATE further down.
case 301:
$feed['url'] = $result->redirect_url;
watchdog('aggregator', t('Updated URL for feed %title to %url.', array('%title' => theme('placeholder', $feed['title']), '%url' => theme('placeholder', $feed['url']))));
case 200:
case 302:
case 307:
// Filter the input data:
if (aggregator_parse_feed($result->data, $feed)) {
2001-05-26 18:26:56 +00:00
// NOTE(review): $modified is only assigned when a Last-Modified header is
// present, yet the UPDATE below always reads it.
if ($result->headers['Last-Modified']) {
$modified = strtotime($result->headers['Last-Modified']);
2003-03-23 19:12:38 +00:00
** Prepare the channel data:
foreach ($channel as $key => $value) {
$channel[$key] = trim(strip_tags($value));
** Prepare the image data (if any):
foreach ($image as $key => $value) {
$image[$key] = trim($value);
// The image is stored as a ready-made HTML link, and only when link, URL and
// title are all present.
// NOTE(review): the values are concatenated into HTML after trim() only.
if ($image['LINK'] && $image['URL'] && $image['TITLE']) {
$image = '<a href="'. $image['LINK'] .'"><img src="'. $image['URL'] .'" alt="'. $image['TITLE'] .'" /></a>';
else {
$image = NULL;
** Update the feed data:
db_query("UPDATE {aggregator_feed} SET url = '%s', checked = %d, link = '%s', description = '%s', image = '%s', etag = '%s', modified = %d WHERE fid = %d", $feed['url'], time(), $channel['LINK'], $channel['DESCRIPTION'], $image, $result->headers['ETag'], $modified, $feed['fid']);
** Clear the cache:
// NOTE(review): the next two messages read $feed['#title'], whereas every
// other message in this function reads $feed['title'] — looks like a typo
// that leaves %site empty; confirm and fix.
watchdog('aggregator', t('There is new syndicated content from %site.', array('%site' => theme('placeholder', $feed['#title']))));
drupal_set_message(t('There is new syndicated content from %site.', array('%site' => theme('placeholder', $feed['#title']))));
// Failure report with the HTTP code and error text; presumably the branch
// for all other response codes (its case label is not visible).
watchdog('aggregator', t('The RSS-feed from %site seems to be broken, due to "%error".', array('%site' => theme('placeholder', $feed['title']), '%error' => theme('placeholder', $result->code .' '. $result->error))), WATCHDOG_WARNING);
drupal_set_message(t('The RSS-feed from %site seems to be broken, because of error "%error".', array('%site' => theme('placeholder', $feed['title']), '%error' => theme('placeholder', $result->code .' '. $result->error))));
/**
 * Parse the W3C date/time format, a subset of ISO 8601. PHP date parsing
 * functions do not handle this format.
 * See http://www.w3.org/TR/NOTE-datetime for more information.
 * Originally from MagpieRSS (http://magpierss.sourceforge.net/).
 *
 * Accepted shape: YYYY-MM-DDThh:mm[:ss][Z|(+|-)hh[:]mm]. A value without a
 * timezone designator is treated as GMT.
 *
 * @param $date_str A string with a potentially W3C DTF date.
 * @return A timestamp if parsed successfully or FALSE if not.
 */
function aggregator_parse_w3cdtf($date_str) {
  // Capture groups: 1 year, 2 month, 3 day, 4 hours, 5 minutes, 6 ":ss",
  // 7 seconds, 8 offset sign, 9 offset hours, 10 offset minutes, 11 "Z".
  if (!preg_match('/(\d{4})-(\d{2})-(\d{2})T(\d{2}):(\d{2})(:(\d{2}))?(?:([-+])(\d{2}):?(\d{2})|(Z))?/', $date_str, $match)) {
    return FALSE;
  }

  // preg_match() drops trailing groups that did not take part in the match,
  // so every optional group has to be checked before it is read. The seconds
  // live in group 7; group 6 still carries the leading colon.
  $seconds = (isset($match[7]) && $match[7] !== '') ? (int)$match[7] : 0;

  // calc epoch for current date assuming GMT
  $epoch = gmmktime((int)$match[4], (int)$match[5], $seconds, (int)$match[2], (int)$match[3], (int)$match[1]);

  // A numeric offset is present exactly when the sign group matched; "Z"
  // (zulu time, aka GMT) and a missing designator both mean no adjustment.
  if (isset($match[8]) && $match[8] !== '') {
    $offset_secs = (((int)$match[9] * 60) + (int)$match[10]) * 60;

    // is timezone ahead of GMT? then subtract offset
    if ($match[8] == '+') {
      $offset_secs *= -1;
    }
    $epoch += $offset_secs;
  }

  return $epoch;
}
/**
 * Parses feed XML, stores its items and purges items past the age limit.
 *
 * @param $data
 *   The raw feed XML; taken by reference and handed to the XML parser.
 * @param $feed
 *   A feed array; 'title', 'link', 'url' and 'fid' are read.
 * @return
 *   0 when xml_parse() reports an error, 1 otherwise.
 *
 * NOTE(review): closing braces are not visible, and the body contains
 * timestamps and commit-message text that are not PHP (annotate/blame
 * residue). The nesting of the statements below cannot be confirmed from
 * this view.
 */
function aggregator_parse_feed(&$data, $feed) {
global $items, $image, $channel;
// Unset the global variables before we use them:
unset($GLOBALS['element'], $GLOBALS['item'], $GLOBALS['tag']);
$items = array();
$image = array();
$channel = array();
// parse the data:
$xml_parser = drupal_xml_parser_create($data);
xml_set_element_handler($xml_parser, 'aggregator_element_start', 'aggregator_element_end');
xml_set_character_data_handler($xml_parser, 'aggregator_element_data');
// The third argument marks $data as the final (and only) chunk.
if (!xml_parse($xml_parser, $data, 1)) {
watchdog('aggregator', t('The RSS-feed from %site seems to be broken, due to an error "%error" on line %line.', array('%site' => theme('placeholder', $feed['title']), '%error' => xml_error_string(xml_get_error_code($xml_parser)), '%line' => xml_get_current_line_number($xml_parser))), WATCHDOG_WARNING);
drupal_set_message(t('The RSS-feed from %site seems to be broken, because of error "%error" on line %line.', array('%site' => theme('placeholder', $feed['title']), '%error' => xml_error_string(xml_get_error_code($xml_parser)), '%line' => xml_get_current_line_number($xml_parser))), 'error');
return 0;
** We reverse the array such that we store the first item last,
** and the last item first. In the database, the newest item
** should be at the top.
$items = array_reverse($items);
foreach ($items as $item) {
// Clear per-item values left over from the previous iteration.
unset($title, $link, $author, $description);
2001-05-26 18:26:56 +00:00
// Prepare the item:
// Each value is entity-decoded and trimmed, reduced to the configured tag
// whitelist, and finally passed through filter_xss().
foreach ($item as $key => $value) {
$value = decode_entities(trim($value));
$value = strip_tags($value, variable_get('aggregator_allowed_html_tags', '<a> <b> <br> <dd> <dl> <dt> <em> <i> <li> <ol> <p> <strong> <u> <ul>'));
2005-11-30 11:03:58 +00:00
$value = filter_xss($value);
The Input formats - filter patch has landed. I still need to make update instructions for modules and update the hook docs. Here's an overview of the changes: 1) Multiple Input formats: they are complete filter configurations (what filters to use, in what order and with which settings). Input formats are admin-definable, and usage of them is role-dependant. For example, you can set it up so that regular users can only use limited HTML, while admins can free HTML without any tag limitations. The input format can be chosen per content item (nodes, comments, blocks, ...) when you add/edit them. If only a single format is available, there is no choice, and nothing changes with before. The default install (and the upgrade) contains a basic set of formats which should satisfy the average user's needs. 2) Filters have toggles Because now you might want to enable a filter only on some input formats, an explicit toggle is provided by the filter system. Modules do not need to worry about it and filters that still have their own on/off switch should get rid of it. 3) Multiple filters per module This was necessary to accomodate the next change, and it's also a logical extension of the filter system. 4) Embedded PHP is now a filter Thanks to the multiple input formats, I was able to move the 'embedded PHP' feature from block.module, page.module and book.module into a simple filter which executes PHP code. This filter is part of filter.module, and by default there is an input format 'PHP', restricted to the administrator only, which contains this filter. This change means that block.module now passes custom block contents through the filter system. As well as from reducing code duplication and avoiding two type selectors for page/book nodes, you can now combine PHP code with other filters. 5) User-supplied PHP code now requires <?php ?> tags. This is required for teasers to work with PHP code. 
Because PHP evaluation is now just another step in the filter process, we can't do this. Also, because teasers are generated before filtering, this would result in errors when the teaser generation would cut off a piece of PHP code. Also, regular PHP syntax explicitly includes the <?php ?> tags for PHP files, so it makes sense to use the same convention for embedded PHP in Drupal. 6) Filter caching was added. Benchmarking shows that even for a simple setup (basic html filtering + legacy URL rewriting), filtercache can offer speedups. Unlike the old filtercache, this uses the normal cache table. 7) Filtertips were moved from help into a hook_filter_tips(). This was required to accomodate the fact that there are multiple filters per module, and that filter settings are format dependant. Shoehorning filter tips into _help was ugly and silly. The display of the filter tips is done through the input format selector, so filter_tips_short() no longer exists. 8) A more intelligent linebreak convertor was added, which doesn't stop working if you use block-level tags and which adds <p> tags.
2004-08-10 18:34:29 +00:00
$item[$key] = $value;
2005-11-30 11:03:58 +00:00
** Resolve the item's title. If no title is found, we use
** up to 40 characters of the description ending at a word
** boundary but not splitting potential entities.
if ($item['TITLE']) {
$title = $item['TITLE'];
else {
$title = preg_replace('/^(.*)[^\w;&].*?$/', "\\1", truncate_utf8($item['DESCRIPTION'], 40));
** Resolve the items link.
// Order of preference: the item's LINK, then a GUID starting with
// "http://", then the link of the feed itself.
if ($item['LINK']) {
$link = $item['LINK'];
elseif ($item['GUID'] && (strncmp($item['GUID'], 'http://', 7) == 0)) {
$link = $item['GUID'];
else {
$link = $feed['link'];
* Atom feeds have a CONTENT and/or SUMMARY tag instead of a DESCRIPTION tag
// NOTE(review): the title fallback above reads DESCRIPTION before this
// CONTENT/SUMMARY mapping runs.
if ($item['CONTENT']) {
$item['DESCRIPTION'] = $item['CONTENT'];
else if ($item['SUMMARY']) {
$item['DESCRIPTION'] = $item['SUMMARY'];
** Try to resolve and parse the item's publication date. If no
** date is found, we use the current date instead.
if ($item['PUBDATE']) $date = $item['PUBDATE']; // RSS 2.0
else if ($item['DC:DATE']) $date = $item['DC:DATE']; // Dublin core
else if ($item['DCTERMS:ISSUED']) $date = $item['DCTERMS:ISSUED']; // Dublin core
else if ($item['DCTERMS:CREATED']) $date = $item['DCTERMS:CREATED']; // Dublin core
else if ($item['DCTERMS:MODIFIED']) $date = $item['DCTERMS:MODIFIED']; // Dublin core
else if ($item['ISSUED']) $date = $item['ISSUED']; // Atom XML
else if ($item['CREATED']) $date = $item['CREATED']; // Atom XML
else if ($item['MODIFIED']) $date = $item['MODIFIED']; // Atom XML
else $date = 'now';
// Two-stage parse: strtotime() first, then the W3C date parser for values
// strtotime() rejects, and finally the current time.
$timestamp = strtotime($date); // As of PHP 5.1.0, strtotime returns FALSE on failure instead of -1.
if ($timestamp <= 0) {
$timestamp = aggregator_parse_w3cdtf($date); // Returns FALSE on failure
if (!$timestamp) {
$timestamp = time(); // better than nothing
- Rewrote the headline module from scratch. Note that the old headline code is still in place 'till the new code has proven to be stable. See "syndication.module" for the new code. Changes: + Improved the parser and tested it against RSS 0.9, RSS 0.91, RSS 0.92, RSS 1.0, RDF and XML feeds. + Improved the administration interface. It might be a bit fuzzy at first. Maybe some native English like Julian, Michael (or any one else with knowledge in the field) can help out by suggesting better naming, terminology or descriptions - as well as by writing the help section for this module? I'd have no idea how much this would be appreciated. + We can *easily* recognize new tags or extensions: we parse out "link", "title", "description" and "author" right now, but we will have to revise which tags to support and which not. New tags can be added in less than 10 minutes (if you are familiar with the code). Read: we have something we can build on. + Within each item, tags can now appear is random order which is or was not the case with the old headline code where we expect <link>s prior to <description>s for example. + Feed updates only (ie. always) happen through cron. Neither do we use one global cron for updating all feeds; instead, every feed can specify his own update-interval. + Newly fetched headlines are "appended" to the pool of existing headlines (read: we don't replace the whole feed), and headlines automatically "expire" after x days or hours. (Every headline has a timestamp.) + Got rid of backend.class; it is integrated in the module. + Switched to more generic names: "headline" became "item" and "backend" became "feed". This should ease future non-headline oriented syndication. + You can associate attributes or keyword lists with every feed. At the moment new items will automatically inherit their feeds attributes but in future we can use heuristics to make these attributes "mutate" when and where we see fit. The attributes can be maintained by hand as well. 
+ We don't export any blocks yet; we will soon do as soon this new code has been tested for a bit more. We will only export bundles though so if you want to export by feed/source, you will have to make a source-specific bundle. - Polished a bit on a few other modules: nothing major.
2001-05-26 18:26:56 +00:00
** Save this item. Try to avoid duplicate entries as much as
** possible. If we find a duplicate entry, we resolve it and
** pass along it's ID such that we can update it if needed.
// An item-specific link identifies duplicates; when the link is empty or
// merely the feed's own link or URL, the title is compared instead.
if ($link && $link != $feed['link'] && $link != $feed['url']) {
$entry = db_fetch_object(db_query("SELECT iid FROM {aggregator_item} WHERE fid = %d AND link = '%s'", $feed['fid'], $link));
else {
$entry = db_fetch_object(db_query("SELECT iid FROM {aggregator_item} WHERE fid = %d AND title = '%s'", $feed['fid'], $title));
2005-11-30 11:03:58 +00:00
// $entry->iid is passed through even when no existing row was found.
aggregator_save_item(array('iid' => $entry->iid, 'fid' => $feed['fid'], 'timestamp' => $timestamp, 'title' => $title, 'link' => $link, 'author' => $item['AUTHOR'], 'description' => $item['DESCRIPTION']));
** Remove all items that are older than flush item timer:
// The cutoff is the current time minus the 'aggregator_clear' setting.
$age = time() - variable_get('aggregator_clear', 9676800);
$result = db_query('SELECT iid FROM {aggregator_item} WHERE fid = %d AND timestamp < %d', $feed['fid'], $age);
if (db_num_rows($result)) {
// Category assignments of the expired items are deleted before the items.
$items = array();
while ($item = db_fetch_object($result)) {
$items[] = $item->iid;
db_query('DELETE FROM {aggregator_category_item} WHERE iid IN ('. implode(', ', $items) .')');
db_query('DELETE FROM {aggregator_item} WHERE fid = %d AND timestamp < %d', $feed['fid'], $age);
return 1;
2001-05-26 18:26:56 +00:00
function aggregator_save_item($edit) {
if ($edit['iid'] && $edit['title']) {
db_query('UPDATE {aggregator_item} SET title = \'%s\', link = \'%s\', author = \'%s\', description = \'%s\' WHERE iid = %d', $edit['title'], $edit['link'], $edit['author'], $edit['description'], $edit['iid']);
- Rewrote the headline module from scratch. Note that the old headline code is still in place until the new code has proven to be stable. See "syndication.module" for the new code. Changes: + Improved the parser and tested it against RSS 0.9, RSS 0.91, RSS 0.92, RSS 1.0, RDF and XML feeds. + Improved the administration interface. It might be a bit fuzzy at first. Maybe some native English speakers like Julian, Michael (or anyone else with knowledge in the field) can help out by suggesting better naming, terminology or descriptions - as well as by writing the help section for this module? You'd have no idea how much this would be appreciated. + We can *easily* recognize new tags or extensions: we parse out "link", "title", "description" and "author" right now, but we will have to revise which tags to support and which not. New tags can be added in less than 10 minutes (if you are familiar with the code). Read: we have something we can build on. + Within each item, tags can now appear in random order, which was not the case with the old headline code, where we expected <link>s prior to <description>s, for example. + Feed updates only (i.e. always) happen through cron. Neither do we use one global cron for updating all feeds; instead, every feed can specify its own update interval. + Newly fetched headlines are "appended" to the pool of existing headlines (read: we don't replace the whole feed), and headlines automatically "expire" after x days or hours. (Every headline has a timestamp.) + Got rid of backend.class; it is integrated in the module. + Switched to more generic names: "headline" became "item" and "backend" became "feed". This should ease future non-headline-oriented syndication. + You can associate attributes or keyword lists with every feed. At the moment new items will automatically inherit their feed's attributes, but in the future we can use heuristics to make these attributes "mutate" when and where we see fit. The attributes can be maintained by hand as well.
+ We don't export any blocks yet; we will do so as soon as this new code has been tested a bit more. We will only export bundles, though, so if you want to export by feed/source, you will have to make a source-specific bundle. - Polished a bit on a few other modules: nothing major.
2001-05-26 18:26:56 +00:00
else if ($edit['iid']) {
db_query('DELETE FROM {aggregator_item} WHERE iid = %d', $edit['iid']);
db_query('DELETE FROM {aggregator_category_item} WHERE iid = %d', $edit['iid']);
- Rewrote the headline module from scratch. Note that the old headline code is still in place until the new code has proven to be stable. See "syndication.module" for the new code. Changes: + Improved the parser and tested it against RSS 0.9, RSS 0.91, RSS 0.92, RSS 1.0, RDF and XML feeds. + Improved the administration interface. It might be a bit fuzzy at first. Maybe some native English speakers like Julian, Michael (or anyone else with knowledge in the field) can help out by suggesting better naming, terminology or descriptions - as well as by writing the help section for this module? You'd have no idea how much this would be appreciated. + We can *easily* recognize new tags or extensions: we parse out "link", "title", "description" and "author" right now, but we will have to revise which tags to support and which not. New tags can be added in less than 10 minutes (if you are familiar with the code). Read: we have something we can build on. + Within each item, tags can now appear in random order, which was not the case with the old headline code, where we expected <link>s prior to <description>s, for example. + Feed updates only (i.e. always) happen through cron. Neither do we use one global cron for updating all feeds; instead, every feed can specify its own update interval. + Newly fetched headlines are "appended" to the pool of existing headlines (read: we don't replace the whole feed), and headlines automatically "expire" after x days or hours. (Every headline has a timestamp.) + Got rid of backend.class; it is integrated in the module. + Switched to more generic names: "headline" became "item" and "backend" became "feed". This should ease future non-headline-oriented syndication. + You can associate attributes or keyword lists with every feed. At the moment new items will automatically inherit their feed's attributes, but in the future we can use heuristics to make these attributes "mutate" when and where we see fit. The attributes can be maintained by hand as well.
+ We don't export any blocks yet; we will do so as soon as this new code has been tested a bit more. We will only export bundles, though, so if you want to export by feed/source, you will have to make a source-specific bundle. - Polished a bit on a few other modules: nothing major.
2001-05-26 18:26:56 +00:00
else if ($edit['title'] && $edit['link']) {
$edit['iid'] = db_next_id('{aggregator_item}_iid');
db_query('INSERT INTO {aggregator_item} (iid, fid, title, link, author, description, timestamp) VALUES (%d, %d, \'%s\', \'%s\', \'%s\', \'%s\', %d)', $edit['iid'], $edit['fid'], $edit['title'], $edit['link'], $edit['author'], $edit['description'], $edit['timestamp']);
// file the items in the categories indicated by the feed
$categories = db_query('SELECT cid FROM {aggregator_category_feed} WHERE fid = %d', $edit['fid']);
while ($category = db_fetch_object($categories)) {
db_query('INSERT INTO {aggregator_category_item} (cid, iid) VALUES (%d, %d)', $category->cid, $edit['iid']);
- Rewrote the headline module from scratch. Note that the old headline code is still in place until the new code has proven to be stable. See "syndication.module" for the new code. Changes: + Improved the parser and tested it against RSS 0.9, RSS 0.91, RSS 0.92, RSS 1.0, RDF and XML feeds. + Improved the administration interface. It might be a bit fuzzy at first. Maybe some native English speakers like Julian, Michael (or anyone else with knowledge in the field) can help out by suggesting better naming, terminology or descriptions - as well as by writing the help section for this module? You'd have no idea how much this would be appreciated. + We can *easily* recognize new tags or extensions: we parse out "link", "title", "description" and "author" right now, but we will have to revise which tags to support and which not. New tags can be added in less than 10 minutes (if you are familiar with the code). Read: we have something we can build on. + Within each item, tags can now appear in random order, which was not the case with the old headline code, where we expected <link>s prior to <description>s, for example. + Feed updates only (i.e. always) happen through cron. Neither do we use one global cron for updating all feeds; instead, every feed can specify its own update interval. + Newly fetched headlines are "appended" to the pool of existing headlines (read: we don't replace the whole feed), and headlines automatically "expire" after x days or hours. (Every headline has a timestamp.) + Got rid of backend.class; it is integrated in the module. + Switched to more generic names: "headline" became "item" and "backend" became "feed". This should ease future non-headline-oriented syndication. + You can associate attributes or keyword lists with every feed. At the moment new items will automatically inherit their feed's attributes, but in the future we can use heuristics to make these attributes "mutate" when and where we see fit. The attributes can be maintained by hand as well.
+ We don't export any blocks yet; we will do so as soon as this new code has been tested a bit more. We will only export bundles, though, so if you want to export by feed/source, you will have to make a source-specific bundle. - Polished a bit on a few other modules: nothing major.
2001-05-26 18:26:56 +00:00
function aggregator_form_category($edit = array()) {
$form['title'] = array('#type' => 'textfield', '#title' => t('Title'), '#default_value' => $edit['title'], '#maxlength' => 64);
$form['description'] = array('#type' => 'textarea', '#title' => t('Description'), '#default_value' => $edit['description']);
$form['submit'] = array('#type' => 'submit', '#value' =>t('Submit'));
2001-05-26 18:26:56 +00:00
if ($edit['cid']) {
$form['delete'] = array('#type' => 'submit', '#value' =>t('Delete'));
$form['cid'] = array('#type' => 'hidden', '#value' => $edit['cid']);
2001-05-26 18:26:56 +00:00
return drupal_get_form('aggregator_form_category', $form);
2001-05-26 18:26:56 +00:00
function aggregator_save_category($edit) {
if ($edit['cid'] && $edit['title']) {
db_query('UPDATE {aggregator_category} SET title = \'%s\', description = \'%s\' WHERE cid = %d', $edit['title'], $edit['description'], $edit['cid']);
2001-05-26 18:26:56 +00:00
else if ($edit['cid']) {
db_query('DELETE FROM {aggregator_category} WHERE cid = %d', $edit['cid']);
2001-05-26 18:26:56 +00:00
else if ($edit['title']) {
// a single unique id for bundles and feeds, to use in blocks
$next_id = db_next_id('{aggregator_category}_cid');
db_query('INSERT INTO {aggregator_category} (cid, title, description, block) VALUES (%d, \'%s\', \'%s\', 5)', $next_id, $edit['title'], $edit['description']);
2001-05-26 18:26:56 +00:00
function aggregator_form_feed($edit = array()) {
$period = drupal_map_assoc(array(900, 1800, 3600, 7200, 10800, 21600, 32400, 43200, 64800, 86400, 172800, 259200, 604800, 1209600, 2419200), 'format_interval');
2001-05-26 18:26:56 +00:00
if ($edit['refresh'] == '') {
$edit['refresh'] = 3600;
- import.module: + Improved input filtering; this should make the news items look more consistent in terms of mark-up. + Quoted all array indices: converted all instances of $foo[bar] to $foo["bar"]. Made various other changes to make the import module compliant with the coding style. - theme.inc: + Fixed a small XHTML glitch. - comment system: + Made it possible for users to edit their comments (when certain criteria are met). + Renamed the SQL table field "lid" to "nid" and updated the code to reflect this change: this is a rather /annoying/ change that has been asked for a few times. It will impact the contributed BBS/forum modules and requires a tiny SQL update: sql> ALTER TABLE comments CHANGE lid nid int(10) NOT NULL; + Moved most (all?) of the comment-related logic from node.php to comment.module where it belongs. This also marks a first step towards removing/reducing "node.php". + Added a delete button to the comment admin form and made it so that Drupal prompts for confirmation prior to deleting a comment from the database. This behavior is similar to that of deleting nodes. + Disabled comment moderation for now. + Some of the above changes will make it easier to integrate the upcoming mail-to-web and web-to-mail gateways. They are part of a bigger plan. ;) - node system: + Made it so that updating nodes (like for instance updating blog entries) won't trigger the submission rate throttle. + Fixed a small glitch where a node's title wasn't always passed to the $theme->header() function. + Made "node_array()" and "node_object()" more generic and named them "object2array()" and "array2object()". + Moved most (all?) of the comment-related logic from node.php to comment.module where it belongs. This also marks a first step towards removing/reducing "node.php". - misc: + Applied three patches by Foxen. One to improve performance of the book module, and two other patches to fix small glitches in common.inc. Thanks, Foxen!
2001-12-30 16:16:38 +00:00
$form['title'] = array('#type' => 'textfield', '#title' => t('Title'), '#default_value' => $edit['title'], '#maxlength' => 64, '#description' => t('The name of the feed; typically the name of the web site you syndicate content from.'));
$form['url'] = array('#type' => 'textfield', '#title' => t('URL'), '#default_value' => $edit['url'], '#maxlength' => 255, '#description' => t('The fully-qualified URL of the feed.'));
$form['refresh'] = array('#type' => 'select', '#title' => t('Update interval'), '#default_value' => $edit['refresh'], '#options' => $period, '#description' => t('The refresh interval indicating how often you want to update this feed. Requires crontab.'));
// Handling of categories:
$options = array();
$values = array();
$categories = db_query('SELECT c.cid, c.title, f.fid FROM {aggregator_category} c LEFT JOIN {aggregator_category_feed} f ON c.cid = f.cid AND f.fid = %d ORDER BY title', $edit['fid']);
while ($category = db_fetch_object($categories)) {
$options[$category->cid] = $category->title;
if ($category->fid) $values[] = check_plain($category->cid);
if ($options) {
$form['category'] = array('#type' => 'checkboxes', '#title' => t('Categorize news items'), '#default_value' => $values, '#options' => $options, '#description' => t('New items in this feed will be automatically filed in the checked categories as they are received.'));
$form['submit'] = array('#type' => 'submit', '#value' =>t('Submit'));
if ($edit['fid']) {
$form['delete'] = array('#type' => 'submit', '#value' =>t('Delete'));
$form['fid'] = array('#type' => 'hidden', '#value' => $edit['fid']);
2001-05-26 18:26:56 +00:00
return drupal_get_form('aggregator_form_feed', $form);
2001-05-26 18:26:56 +00:00
function aggregator_save_feed($edit) {
if ($edit['fid']) {
// an existing feed is being modified, delete the category listings
db_query('DELETE FROM {aggregator_category_feed} WHERE fid = %d', $edit['fid']);
2001-05-26 18:26:56 +00:00
if ($edit['fid'] && $edit['title']) {
db_query('UPDATE {aggregator_feed} SET title = \'%s\', url = \'%s\', refresh = %d WHERE fid = %d', $edit['title'], $edit['url'], $edit['refresh'], $edit['fid']);
2001-05-26 18:26:56 +00:00
else if ($edit['fid']) {
$result = db_query('SELECT iid FROM {aggregator_item} WHERE fid = %d', $edit['fid']);
while ($item = db_fetch_object($result)) {
$items[] = "iid = $item->iid";
if ($items) {
db_query('DELETE FROM {aggregator_category_item} WHERE '. implode(' OR ', $items));
db_query('DELETE FROM {aggregator_feed} WHERE fid = %d', $edit['fid']);
db_query('DELETE FROM {aggregator_item} WHERE fid = %d', $edit['fid']);
2001-05-26 18:26:56 +00:00
else if ($edit['title']) {
// a single unique id for bundles and feeds, to use in blocks
$edit['fid'] = db_next_id('{aggregator_feed}_fid');
db_query('INSERT INTO {aggregator_feed} (fid, title, url, refresh, block) VALUES (%d, \'%s\', \'%s\', %d, 5)', $edit['fid'], $edit['title'], $edit['url'], $edit['refresh']);
if ($edit['title']) {
// the feed is being saved, save the categories as well
2004-05-17 22:11:12 +00:00
if ($edit['category']) {
foreach ($edit['category'] as $cid => $value) {
db_query('INSERT INTO {aggregator_category_feed} (fid, cid) VALUES (%d, %d)', $edit['fid'], $cid);
2001-05-26 18:26:56 +00:00
function aggregator_get_feed($fid) {
return db_fetch_array(db_query('SELECT * FROM {aggregator_feed} WHERE fid = %d', $fid));
2001-05-26 18:26:56 +00:00
function aggregator_get_category($cid) {
return db_fetch_array(db_query('SELECT * FROM {aggregator_category} WHERE cid = %d', $cid));
2001-05-26 18:26:56 +00:00
function aggregator_view() {
$result = db_query('SELECT f.*, COUNT(i.iid) AS items FROM {aggregator_feed} f LEFT JOIN {aggregator_item} i ON f.fid = i.fid GROUP BY f.fid, f.title, f.url, f.refresh, f.checked, f.link, f.description, f.etag, f.modified, f.image, f.block ORDER BY f.title');
- Rewrote the headline module from scratch. Note that the old headline code is still in place until the new code has proven to be stable. See "syndication.module" for the new code. Changes: + Improved the parser and tested it against RSS 0.9, RSS 0.91, RSS 0.92, RSS 1.0, RDF and XML feeds. + Improved the administration interface. It might be a bit fuzzy at first. Maybe some native English speakers like Julian, Michael (or anyone else with knowledge in the field) can help out by suggesting better naming, terminology or descriptions - as well as by writing the help section for this module? You'd have no idea how much this would be appreciated. + We can *easily* recognize new tags or extensions: we parse out "link", "title", "description" and "author" right now, but we will have to revise which tags to support and which not. New tags can be added in less than 10 minutes (if you are familiar with the code). Read: we have something we can build on. + Within each item, tags can now appear in random order, which was not the case with the old headline code, where we expected <link>s prior to <description>s, for example. + Feed updates only (i.e. always) happen through cron. Neither do we use one global cron for updating all feeds; instead, every feed can specify its own update interval. + Newly fetched headlines are "appended" to the pool of existing headlines (read: we don't replace the whole feed), and headlines automatically "expire" after x days or hours. (Every headline has a timestamp.) + Got rid of backend.class; it is integrated in the module. + Switched to more generic names: "headline" became "item" and "backend" became "feed". This should ease future non-headline-oriented syndication. + You can associate attributes or keyword lists with every feed. At the moment new items will automatically inherit their feed's attributes, but in the future we can use heuristics to make these attributes "mutate" when and where we see fit. The attributes can be maintained by hand as well.
+ We don't export any blocks yet; we will do so as soon as this new code has been tested a bit more. We will only export bundles, though, so if you want to export by feed/source, you will have to make a source-specific bundle. - Polished a bit on a few other modules: nothing major.
$output .= '<h3>'. t('Feed overview') .'</h3>';
$header = array(t('Title'), t('Items'), t('Last update'), t('Next update'), array('data' => t('Operations'), 'colspan' => '3'));
$rows = array();
2001-05-26 18:26:56 +00:00
while ($feed = db_fetch_object($result)) {
$rows[] = array(l($feed->title, "aggregator/sources/$feed->fid"), format_plural($feed->items, '1 item', '%count items'), ($feed->checked ? t('%time ago', array('%time' => format_interval(time() - $feed->checked))) : t('never')), ($feed->checked ? t('%time left', array('%time' => format_interval($feed->checked + $feed->refresh - time()))) : t('never')), l(t('edit'), "admin/aggregator/edit/feed/$feed->fid"), l(t('remove items'), "admin/aggregator/remove/$feed->fid"), l(t('update items'), "admin/aggregator/update/$feed->fid"));
- Rewrote the headline module from scratch. Note that the old headline code is still in place until the new code has proven to be stable. See "syndication.module" for the new code. Changes: + Improved the parser and tested it against RSS 0.9, RSS 0.91, RSS 0.92, RSS 1.0, RDF and XML feeds. + Improved the administration interface. It might be a bit fuzzy at first. Maybe some native English speakers like Julian, Michael (or anyone else with knowledge in the field) can help out by suggesting better naming, terminology or descriptions - as well as by writing the help section for this module? You'd have no idea how much this would be appreciated. + We can *easily* recognize new tags or extensions: we parse out "link", "title", "description" and "author" right now, but we will have to revise which tags to support and which not. New tags can be added in less than 10 minutes (if you are familiar with the code). Read: we have something we can build on. + Within each item, tags can now appear in random order, which was not the case with the old headline code, where we expected <link>s prior to <description>s, for example. + Feed updates only (i.e. always) happen through cron. Neither do we use one global cron for updating all feeds; instead, every feed can specify its own update interval. + Newly fetched headlines are "appended" to the pool of existing headlines (read: we don't replace the whole feed), and headlines automatically "expire" after x days or hours. (Every headline has a timestamp.) + Got rid of backend.class; it is integrated in the module. + Switched to more generic names: "headline" became "item" and "backend" became "feed". This should ease future non-headline-oriented syndication. + You can associate attributes or keyword lists with every feed. At the moment new items will automatically inherit their feed's attributes, but in the future we can use heuristics to make these attributes "mutate" when and where we see fit. The attributes can be maintained by hand as well.
+ We don't export any blocks yet; we will do so as soon as this new code has been tested a bit more. We will only export bundles, though, so if you want to export by feed/source, you will have to make a source-specific bundle. - Polished a bit on a few other modules: nothing major.
2001-05-26 18:26:56 +00:00
$output .= theme('table', $header, $rows);
2001-05-26 18:26:56 +00:00
$result = db_query('SELECT c.cid, c.title, count(ci.iid) as items FROM {aggregator_category} c LEFT JOIN {aggregator_category_item} ci ON c.cid = ci.cid GROUP BY c.cid, c.title ORDER BY title');
- Rewrote the headline module from scratch. Note that the old headline code is still in place until the new code has proven to be stable. See "syndication.module" for the new code. Changes: + Improved the parser and tested it against RSS 0.9, RSS 0.91, RSS 0.92, RSS 1.0, RDF and XML feeds. + Improved the administration interface. It might be a bit fuzzy at first. Maybe some native English speakers like Julian, Michael (or anyone else with knowledge in the field) can help out by suggesting better naming, terminology or descriptions - as well as by writing the help section for this module? You'd have no idea how much this would be appreciated. + We can *easily* recognize new tags or extensions: we parse out "link", "title", "description" and "author" right now, but we will have to revise which tags to support and which not. New tags can be added in less than 10 minutes (if you are familiar with the code). Read: we have something we can build on. + Within each item, tags can now appear in random order, which was not the case with the old headline code, where we expected <link>s prior to <description>s, for example. + Feed updates only (i.e. always) happen through cron. Neither do we use one global cron for updating all feeds; instead, every feed can specify its own update interval. + Newly fetched headlines are "appended" to the pool of existing headlines (read: we don't replace the whole feed), and headlines automatically "expire" after x days or hours. (Every headline has a timestamp.) + Got rid of backend.class; it is integrated in the module. + Switched to more generic names: "headline" became "item" and "backend" became "feed". This should ease future non-headline-oriented syndication. + You can associate attributes or keyword lists with every feed. At the moment new items will automatically inherit their feed's attributes, but in the future we can use heuristics to make these attributes "mutate" when and where we see fit. The attributes can be maintained by hand as well.
+ We don't export any blocks yet; we will do so as soon as this new code has been tested a bit more. We will only export bundles, though, so if you want to export by feed/source, you will have to make a source-specific bundle. - Polished a bit on a few other modules: nothing major.
2001-05-26 18:26:56 +00:00
$output .= '<h3>'. t('Category overview') .'</h3>';
$header = array(t('Title'), t('Items'), t('Operations'));
$rows = array();
while ($category = db_fetch_object($result)) {
$rows[] = array(l($category->title, "aggregator/categories/$category->cid"), format_plural($category->items, '1 item', '%count items'), l(t('edit'), "admin/aggregator/edit/category/$category->cid"));
- Rewrote the headline module from scratch. Note that the old headline code is still in place until the new code has proven to be stable. See "syndication.module" for the new code. Changes: + Improved the parser and tested it against RSS 0.9, RSS 0.91, RSS 0.92, RSS 1.0, RDF and XML feeds. + Improved the administration interface. It might be a bit fuzzy at first. Maybe some native English speakers like Julian, Michael (or anyone else with knowledge in the field) can help out by suggesting better naming, terminology or descriptions - as well as by writing the help section for this module? You'd have no idea how much this would be appreciated. + We can *easily* recognize new tags or extensions: we parse out "link", "title", "description" and "author" right now, but we will have to revise which tags to support and which not. New tags can be added in less than 10 minutes (if you are familiar with the code). Read: we have something we can build on. + Within each item, tags can now appear in random order, which was not the case with the old headline code, where we expected <link>s prior to <description>s, for example. + Feed updates only (i.e. always) happen through cron. Neither do we use one global cron for updating all feeds; instead, every feed can specify its own update interval. + Newly fetched headlines are "appended" to the pool of existing headlines (read: we don't replace the whole feed), and headlines automatically "expire" after x days or hours. (Every headline has a timestamp.) + Got rid of backend.class; it is integrated in the module. + Switched to more generic names: "headline" became "item" and "backend" became "feed". This should ease future non-headline-oriented syndication. + You can associate attributes or keyword lists with every feed. At the moment new items will automatically inherit their feed's attributes, but in the future we can use heuristics to make these attributes "mutate" when and where we see fit. The attributes can be maintained by hand as well.
+ We don't export any blocks yet; we will do so as soon as this new code has been tested a bit more. We will only export bundles, though, so if you want to export by feed/source, you will have to make a source-specific bundle. - Polished a bit on a few other modules: nothing major.
2001-05-26 18:26:56 +00:00
$output .= theme('table', $header, $rows);
2001-05-26 18:26:56 +00:00
return $output;
function aggregator_edit() {
if ($_POST['op'] == t('Submit')) {
if (arg(1) == 'categories') {
drupal_set_message(t('The category has been updated.'));
else {
drupal_set_message(t('The feed has been updated.'));
else if ($_POST['op'] == t('Delete')) {
// Unset the title:
if (arg(1) == 'categories') {
drupal_set_message(t('The category has been deleted.'));
else {
drupal_set_message(t('The feed has been deleted.'));
drupal_goto('aggregator/'. arg(1));
if (arg(1) == 'categories') {
$output = aggregator_form_category(aggregator_get_category(arg(2)));
else {
$output = aggregator_form_feed(aggregator_get_feed(arg(2)));
return $output;
2004-05-17 22:00:06 +00:00
* Menu callback; displays the category edit form, or saves changes and
* redirects to the overview page.
function aggregator_admin_edit_category($category = 0) {
$edit = $_POST['edit'];
$op = $_POST['op'];
switch ($op) {
case t('Delete'):
$edit['title'] = 0;
// Fall through:
case t('Submit'):
drupal_set_message($edit['title'] ? t('The category has been updated.') : t('The category has been removed.'));
if ($category) {
$output = aggregator_form_category(aggregator_get_category($category));
else {
$output = aggregator_form_category();
return $output;
2004-05-17 22:00:06 +00:00
* Menu callback; displays the feed edit form.
* After editing, saves changes and redirects to the overview page.
function aggregator_admin_edit_feed($feed = 0) {
$edit = $_POST['edit'];
$op = $_POST['op'];
switch ($op) {
case t('Delete'):
$edit['title'] = 0;
// Fall through:
case t('Submit'):
drupal_set_message($edit['title'] ? t('The feed has been updated.') : t('The feed has been removed.'));
if ($feed) {
$output = aggregator_form_feed(aggregator_get_feed($feed));
else {
$output = aggregator_form_feed();
2001-05-26 18:26:56 +00:00
return $output;
* Menu callback; removes all items from a feed, then redirects to the overview page.
function aggregator_admin_remove_feed($feed) {
* Menu callback; refreshes a feed, then redirects to the overview page.
function aggregator_admin_refresh_feed($feed) {
2004-05-17 22:00:06 +00:00
* Menu callback; displays the aggregator administration page.
function aggregator_admin_overview() {
return aggregator_view();
2001-05-26 18:26:56 +00:00
2004-05-17 22:00:06 +00:00
* Menu callback; displays the most recent items gathered from any feed.
function aggregator_page_last() {
return _aggregator_page_list('SELECT i.*, f.title AS ftitle, f.link AS flink FROM {aggregator_item} i INNER JOIN {aggregator_feed} f ON i.fid = f.fid ORDER BY i.timestamp DESC, i.iid DESC', arg(1));
2004-05-17 22:00:06 +00:00
* Menu callback; displays all the items captured from a particular feed.
function aggregator_page_source() {
$feed = db_fetch_object(db_query('SELECT * FROM {aggregator_feed} WHERE fid = %d', arg(2)));
$info = theme('aggregator_feed', $feed);
return _aggregator_page_list('SELECT * FROM {aggregator_item} WHERE fid = '. $feed->fid .' ORDER BY timestamp DESC, iid DESC', arg(3), "<div class=\"feed\">$info</div>");
2004-05-17 22:00:06 +00:00
* Menu callback; displays all the items aggregated in a particular category.
function aggregator_page_category() {
$category = db_fetch_object(db_query('SELECT cid, title FROM {aggregator_category} WHERE cid = %d', arg(2)));
return _aggregator_page_list('SELECT i.*, f.title AS ftitle, f.link AS flink FROM {aggregator_category_item} c LEFT JOIN {aggregator_item} i ON c.iid = i.iid LEFT JOIN {aggregator_feed} f ON i.fid = f.fid WHERE cid = '. $category->cid .' ORDER BY timestamp DESC, iid DESC', arg(3));
* Prints an aggregator page listing a number of feed items. Various
* menu callbacks use this function to print their feeds.
function _aggregator_page_list($sql, $op, $header = '') {
$categorize = (user_access('administer news feeds') && ($op == 'categorize'));
$output = '<div id="aggregator">';
$form['header'] = array('#value' => $header);
$output .= $form['header']['#value'];
$result = pager_query($sql, 20);
$categories = array();
while ($item = db_fetch_object($result)) {
$form['items'][$item->iid] = array('#value' => theme('aggregator_page_item', $item));
$output .= $form['items'][$item->iid]['#value'];
$form['categories'][$item->iid] = array();
if ($categorize) {
$categories_result = db_query('SELECT c.cid, c.title, ci.iid FROM {aggregator_category} c LEFT JOIN {aggregator_category_item} ci ON c.cid = ci.cid AND ci.iid = %d', $item->iid);
$selected = array();
while ($category = db_fetch_object($categories_result)) {
if (!$done) {
$categories[$category->cid] = check_plain($category->title);
if ($category->iid) {
$selected[] = $category->cid;
$done = true;
$form['categories'][$item->iid] = array(
'#type' => variable_get('aggregator_category_selector', 'checkboxes'),
'#default_value' => $selected, '#options' => $categories,
'#size' => 10, '#multiple' => true
$output .= '</div>';
$form['submit'] = array('#type' => 'submit', '#value' => t('Save categories'));
$form['pager'] = array('#value' => theme('pager', NULL, 20, 0));
$output .= $form['pager']['#value'];
// arg(1) is undefined if we are at the top aggregator URL
// is there a better way to do this?
if (!arg(1)) {
$form['xml_icon'] = array('#value' => theme('xml_icon', url('aggregator/rss')));
elseif (arg(1) == 'categories' && arg(2) && !arg(3)) {
$form['xml_icon'] = array('#value' => theme('xml_icon', url('aggregator/rss/' . arg(2))));
$output .= $form['xml_icon']['#value'];
return ($categorize) ? drupal_get_form('aggregator_page_list', $form) : $output;
function theme_aggregator_page_list($form) {
$output = '<div id="aggregator">';
$output .= form_render($form['header']);
$rows = array();
if ($form['items']) {
foreach (element_children($form['items']) as $key) {
if (is_array($form['items'][$key])) {
$rows[] = array(form_render($form['items'][$key]), array('data' => form_render($form['categories'][$key]), 'class' => 'categorize-item'));
$output .= theme('table', array('', t('Categorize')), $rows);
$output .= form_render($form['submit']);
$output .= '</div>';
$output .= form_render($form);
return $output;
/**
 * Validate the categorization form.
 *
 * Flags a form error unless the current user has the
 * 'administer news feeds' permission.
 */
function aggregator_page_list_validate($form_id, &$form) {
  if (user_access('administer news feeds')) {
    return;
  }

  form_error($form, t('You are not allowed to categorize this feed item.'));
}
/**
 * Submit handler for the categorization form.
 *
 * For every item in the submitted 'categories' values, the existing
 * category assignments are deleted and the selected ones are inserted.
 */
function aggregator_page_list_submit($form_id, $form) {
  global $form_values;

  foreach ($form_values['categories'] as $iid => $selection) {
    // Replace rather than merge: wipe the item's rows first.
    db_query('DELETE FROM {aggregator_category_item} WHERE iid = %d', $iid);

    // array_filter() without a callback drops the empty (unselected) entries.
    foreach (array_filter($selection) as $cid) {
      db_query('INSERT INTO {aggregator_category_item} (cid, iid) VALUES (%d, %d)', $cid, $iid);
    }
  }

  drupal_set_message(t('The categories have been saved.'));
}
2004-05-17 22:00:06 +00:00
/**
 * Menu callback; displays all the feeds used by the aggregator.
 *
 * @return
 *   HTML with one heading per feed, a list of its most recent items, a
 *   "more" link to the feed's own page, and an XML icon for the OPML export.
 */
function aggregator_page_sources() {
  $summary_limit = variable_get('aggregator_summary_items', 3);
  $feeds = db_query('SELECT f.fid, f.title, f.description, f.image, MAX(i.timestamp) AS last FROM {aggregator_feed} f LEFT JOIN {aggregator_item} i ON f.fid = i.fid GROUP BY f.fid, f.title, f.description, f.image');

  $output = "<div id=\"aggregator\">\n";
  while ($feed = db_fetch_object($feeds)) {
    $output .= '<h2>'. check_plain($feed->title) ."</h2>\n";

    // Most recent items; the list stays empty when the limit is zero.
    $recent = array();
    if ($summary_limit) {
      $rows = db_query_range('SELECT i.title, i.timestamp, i.link FROM {aggregator_item} i WHERE i.fid = %d ORDER BY i.timestamp DESC', $feed->fid, 0, $summary_limit);
      while ($row = db_fetch_object($rows)) {
        $recent[] = theme('aggregator_summary_item', $row);
      }
    }
    $output .= theme('item_list', $recent);

    $more = l(t('more'), 'aggregator/sources/'. $feed->fid);
    $output .= '<div class="links">'. theme('links', array($more)) ."</div>\n";
  }
  $output .= theme('xml_icon', url('aggregator/opml')) .'</div>';

  return $output;
}
/**
 * Menu callback; generate an RSS 2.0 feed of aggregator items or categories.
 *
 * Without a third path argument the newest items across all feeds are
 * exported. With one, it is used as a category ID and only items filed in
 * that category are exported. The XML document is printed directly; nothing
 * is returned.
 */
function aggregator_page_rss() {
  global $base_url;

  // Initialised up front: the default (non-category) branch never sets $url
  // or $title, and $items is only ever appended to.
  $url = '';
  $title = '';
  $items = '';

  // arg(2) is the passed cid, only select for that category
  $result = NULL;
  if (arg(2)) {
    $category = db_fetch_object(db_query('SELECT cid, title FROM {aggregator_category} WHERE cid = %d', arg(2)));
    $url = '/categories/' . $category->cid;
    $title = ' ' . t('in category') . ' ' . $category->title;
    $sql = 'SELECT i.*, f.title AS ftitle, f.link AS flink FROM {aggregator_category_item} c LEFT JOIN {aggregator_item} i ON c.iid = i.iid LEFT JOIN {aggregator_feed} f ON i.fid = f.fid WHERE cid = %d ORDER BY timestamp DESC, iid DESC';
    $result = db_query_range($sql, $category->cid, 0, variable_get('feed_default_items', 10));
  }
  // or, get the default aggregator items
  else {
    $sql = 'SELECT i.*, f.title AS ftitle, f.link AS flink FROM {aggregator_item} i INNER JOIN {aggregator_feed} f ON i.fid = f.fid ORDER BY i.timestamp DESC, i.iid DESC';
    $result = db_query_range($sql, 0, variable_get('feed_default_items', 10));
  }

  while ($item = db_fetch_object($result)) {
    // Each case ends in a break so that 'teaser' does not fall through to
    // 'title' and blank the description it has just built.
    switch (variable_get('feed_item_length', 'teaser')) {
      case 'teaser':
        $teaser = node_teaser($item->description);
        // Link to the full item only when the teaser differs from the
        // complete description.
        if ($teaser != $item->description) {
          $teaser .= '<p><a href="'. check_url($item->link) .'">'. t('read more') ."</a></p>\n";
        }
        $item->description = $teaser;
        break;
      case 'title':
        $item->description = '';
        break;
    }
    $items .= format_rss_item($item->ftitle . ': ' . $item->title, $item->link, $item->description, array('pubDate' => date('r', $item->timestamp)));
  }

  $output = "<?xml version=\"1.0\" encoding=\"utf-8\"?>\n";
  $output .= "<rss version=\"2.0\">\n";
  $output .= format_rss_channel(variable_get('site_name', t('Drupal')) . ' ' . t('aggregator'), $base_url . '/' . url('aggregator' . $url), variable_get('site_name', t('Drupal')) . ' - ' . t('aggregated feeds') . $title, $items, 'en');
  $output .= "</rss>\n";

  drupal_set_header('Content-Type: text/xml; charset=utf-8');
  print $output;
}
2004-05-17 22:00:06 +00:00
/**
 * Menu callback; generates an OPML representation of all feeds.
 *
 * The document is printed directly with a text/xml content type; nothing is
 * returned.
 *
 * @param $cid
 *   If set, only feeds assigned to the category with this ID are exported.
 *   Otherwise all feeds are exported.
 */
function aggregator_page_opml($cid = NULL) {
  $feeds = $cid
    ? db_query('SELECT f.title, f.url FROM {aggregator_feed} f LEFT JOIN {aggregator_category_feed} c on f.fid = c.fid WHERE c.cid = %d ORDER BY title', $cid)
    : db_query('SELECT * FROM {aggregator_feed} ORDER BY title');

  // Collect the document piece by piece and join once at the end.
  $xml = array();
  $xml[] = "<?xml version=\"1.0\" encoding=\"utf-8\"?>\n";
  $xml[] = "<opml version=\"1.1\">\n";
  $xml[] = "<head>\n";
  $xml[] = '<title>'. check_plain(variable_get('site_name', 'Drupal')) ."</title>\n";
  $xml[] = '<dateModified>'. gmdate('r') ."</dateModified>\n";
  $xml[] = "</head>\n";
  $xml[] = "<body>\n";

  // One <outline> element per feed.
  while ($feed = db_fetch_object($feeds)) {
    $xml[] = '<outline text="'. check_plain($feed->title) .'" xmlUrl="'. check_url($feed->url) ."\" />\n";
  }

  $xml[] = "</body>\n";
  $xml[] = "</opml>\n";

  drupal_set_header('Content-Type: text/xml; charset=utf-8');
  print implode('', $xml);
}
2004-05-17 22:00:06 +00:00
/**
 * Menu callback; displays all the categories used by the aggregator.
 *
 * @return
 *   HTML with one heading per category, a list of its most recent items
 *   (when summaries are enabled) and a "more" link to the category page.
 */
function aggregator_page_categories() {
  $summary_limit = variable_get('aggregator_summary_items', 3);
  $categories = db_query('SELECT c.cid, c.title, c.description FROM {aggregator_category} c LEFT JOIN {aggregator_category_item} ci ON c.cid = ci.cid LEFT JOIN {aggregator_item} i ON ci.iid = i.iid GROUP BY c.cid, c.title, c.description');

  $output = "<div id=\"aggregator\">\n";
  while ($category = db_fetch_object($categories)) {
    $output .= '<h2>'. check_plain($category->title) ."</h2>\n";

    // The item list is only produced when a non-zero limit is configured.
    if ($summary_limit) {
      $summaries = array();
      $rows = db_query_range('SELECT i.title, i.timestamp, i.link, f.title as feed_title, f.link as feed_link FROM {aggregator_category_item} ci LEFT JOIN {aggregator_item} i ON i.iid = ci.iid LEFT JOIN {aggregator_feed} f ON i.fid = f.fid WHERE ci.cid = %d ORDER BY i.timestamp DESC', $category->cid, 0, $summary_limit);
      while ($row = db_fetch_object($rows)) {
        $summaries[] = theme('aggregator_summary_item', $row);
      }
      $output .= theme('item_list', $summaries);
    }

    $more = l(t('more'), 'aggregator/categories/'. $category->cid);
    $output .= '<div class="links">'. theme('links', array($more)) ."</div>\n";
  }

  return $output .'</div>';
}
/**
 * Format a news feed.
 *
 * @param $feed
 *   The feed object; its image, description, url, link and checked
 *   properties are read.
 * @return
 *   A string containing the output.
 * @ingroup themeable
 */
function theme_aggregator_feed($feed) {
  $output = '';

  // NOTE(review): image and description are emitted without escaping here --
  // presumably they are sanitized before being stored; confirm.
  if ($feed->image) {
    $output .= $feed->image;
  }

  $output .= $feed->description;
  $output .= '<h3>'. t('URL') ."</h3>\n";
  $output .= theme('xml_icon', $feed->url);
  $output .= '<a href="'. check_url($feed->link) .'">'. check_plain($feed->link) ."</a>\n";
  $output .= '<h3>'. t('Last update') ."</h3>\n";

  // An empty 'checked' value would otherwise be reported as the time elapsed
  // since the Unix epoch.
  if ($feed->checked) {
    $updated = t('%time ago', array('%time' => format_interval(time() - $feed->checked)));
  }
  else {
    $updated = t('never');
  }

  // Feed administrators get a link to the administration page.
  if (user_access('administer news feeds')) {
    $output .= l($updated, 'admin/aggregator');
  }
  else {
    $output .= $updated;
  }

  return $output;
}
/**
 * Format an individual feed item for display in the block.
 *
 * @param $item
 *   The item object; its iid, link and title properties are read.
 * @param $feed
 *   Not used by this implementation.
 * @return
 *   A string containing the output.
 * @ingroup themeable
 */
function theme_aggregator_block_item($item, $feed = 0) {
  global $user;

  // Start from an empty string: both appends below may be the first write.
  $output = '';

  // Logged-in users who may write blog entries get a "blog it" icon.
  if ($user->uid && module_exist('blog') && user_access('edit own blog')) {
    if ($image = theme('image', 'misc/blog.png', t('blog it'), t('blog it'))) {
      $output .= '<div class="icon">'. l($image, 'node/add/blog', array('title' => t('Comment on this news item in your personal blog.'), 'class' => 'blog-it'), "iid=$item->iid", NULL, FALSE, TRUE) .'</div>';
    }
  }

  // Display the external link to the item.
  $output .= '<a href="'. check_url($item->link) .'">'. check_plain($item->title) ."</a>\n";

  return $output;
}
/**
 * Return a themed item heading for summary pages located at "aggregator/sources"
 * and "aggregator/categories".
 *
 * @param $item
 *   The item object from the aggregator module. Its link, title and
 *   timestamp are always read; feed_link and feed_title are optional and,
 *   when feed_link is present, add a link to the originating feed.
 * @return
 *   A string containing the output.
 * @ingroup themeable
 */
function theme_aggregator_summary_item($item) {
  $output = '<a href="'. check_url($item->link) .'">'. check_plain($item->title) .'</a> <span class="age">'. t('%age old', array('%age' => format_interval(time() - $item->timestamp))) .'</span>';

  // Not every caller selects the feed columns, so test with empty(). The feed
  // link and title are escaped the same way as the item link and title above.
  if (!empty($item->feed_link)) {
    $output .= ', <span class="source"><a href="'. check_url($item->feed_link) .'">'. check_plain($item->feed_title) .'</a></span>';
  }

  return $output ."\n";
}
/**
 * Format an individual feed item for display on the aggregator page.
 *
 * A date heading is emitted whenever the item's day differs from the day of
 * the item formatted by the previous call; that day is kept in a static
 * variable between calls.
 *
 * @param $item
 *   The item object; its timestamp, link, title, description and iid are
 *   read, plus ftitle and fid when a source link should be shown.
 * @return
 *   A string containing the output.
 * @ingroup themeable
 */
function theme_aggregator_page_item($item) {
  static $last;

  // Start from an empty string: the heading below is only added on a date
  // change, so either append may be the first write.
  $output = '';

  $date = format_date($item->timestamp, 'custom', 'Ymd');
  if ($date != $last) {
    $last = $date;
    $output .= '<h3>'. format_date($item->timestamp, 'custom', 'F j, Y') ."</h3>\n";
  }

  $output .= "<div class=\"news-item\">\n";
  $output .= ' <div class="date">'. format_date($item->timestamp, 'custom', 'H:i') ."</div>\n";
  $output .= " <div class=\"body\">\n";

  // Prefix the title with a link to the source feed when it is known.
  $source = '';
  if ($item->ftitle && $item->fid) {
    $source = '<span class="source">'. l($item->ftitle, "aggregator/sources/$item->fid") .":</span>\n";
  }
  $output .= ' <div class="title">'. $source .'<a href="'. check_url($item->link) .'">'. check_plain($item->title) ."</a></div>\n";

  // NOTE(review): the description is emitted without escaping here --
  // presumably it is sanitized before being stored; confirm.
  if ($item->description) {
    $output .= ' <div class="description">'. $item->description ."</div>\n";
  }

  // List the categories this item has been filed under, if any.
  $result = db_query('SELECT c.title, c.cid FROM {aggregator_category_item} ci LEFT JOIN {aggregator_category} c ON ci.cid = c.cid WHERE ci.iid = %d ORDER BY c.title', $item->iid);
  $categories = array();
  while ($category = db_fetch_object($result)) {
    $categories[] = l($category->title, 'aggregator/categories/'. $category->cid);
  }
  if ($categories) {
    $output .= ' <div class="categories">'. t('Categories') .': '. implode(', ', $categories) ."</div>\n";
  }

  $output .= " </div>\n";
  $output .= "</div>\n";

  return $output;
}