function aggregator_parse_feed

Parses a feed and stores its items.


Parameters

$data: The feed data.

$feed: An object describing the feed to be parsed.

Return value

FALSE on error, TRUE otherwise.

1 call to aggregator_parse_feed()
aggregator_aggregator_parse in modules/aggregator/aggregator.parser.inc
Implements hook_aggregator_parse().


modules/aggregator/aggregator.parser.inc, line 67


/**
 * Parses a feed and stores its items.
 *
 * The XML in $data is pushed through an XML parser whose element and
 * character-data callbacks are aggregator_element_start(),
 * aggregator_element_end() and aggregator_element_data(). This function
 * resets the global $items, $image and $channel arrays before parsing and
 * reads $items afterwards, so the callbacks are expected to populate them.
 * Every collected item is then normalized (title, link, guid, description,
 * timestamp, author) and appended to $feed->items.
 *
 * @param $data
 *   The feed data.
 * @param $feed
 *   An object describing the feed to be parsed. Its title and link properties
 *   are read; its items property is overwritten with the parsed items.
 *
 * @return
 *   FALSE on error, TRUE otherwise.
 */
function aggregator_parse_feed(&$data, $feed) {
    global $items, $image, $channel;

    // Unset the global variables before we use them.
    unset($GLOBALS['element'], $GLOBALS['item'], $GLOBALS['tag']);
    $items = array();
    $image = array();
    $channel = array();

    // Parse the data.
    $xml_parser = drupal_xml_parser_create($data);
    if (!$xml_parser) {
        // NOTE(review): drupal_xml_parser_create() is documented to return FALSE
        // when the feed encoding cannot be handled; there is nothing to parse
        // with in that case, so report failure instead of using a bad handle.
        return FALSE;
    }
    xml_set_element_handler($xml_parser, 'aggregator_element_start', 'aggregator_element_end');
    xml_set_character_data_handler($xml_parser, 'aggregator_element_data');

    if (!xml_parse($xml_parser, $data, 1)) {
        // Collect the error details once; they feed both the log entry and the
        // on-screen message.
        $error_args = array(
            '%site' => $feed->title,
            '%error' => xml_error_string(xml_get_error_code($xml_parser)),
            '%line' => xml_get_current_line_number($xml_parser),
        );
        watchdog('aggregator', 'The feed from %site seems to be broken, due to an error "%error" on line %line.', $error_args, WATCHDOG_WARNING);
        drupal_set_message(t('The feed from %site seems to be broken, because of error "%error" on line %line.', $error_args), 'error');
        return FALSE;
    }

    // We reverse the array such that we store the first item last, and the last
    // item first. In the database, the newest item should be at the top.
    $items = array_reverse($items);

    // Tags that may carry an item's publication date, in order of preference.
    $date_keys = array(
        'pubdate',
        'dc:date',
        'dcterms:issued',
        'dcterms:created',
        'dcterms:modified',
        'issued',
        'created',
        'modified',
        'published',
        'updated',
    );

    // Initialize items array.
    $feed->items = array();
    foreach ($items as $item) {
        // Prepare the item:
        foreach ($item as $key => $value) {
            $item[$key] = trim($value);
        }

        // Resolve the item's title. If no title is found, we use up to 40
        // characters of the description ending at a word boundary, but not
        // splitting potential entities.
        if (empty($item['title'])) {
            if (!empty($item['description'])) {
                $item['title'] = preg_replace('/^(.*)[^\\w;&].*?$/', "\\1", truncate_utf8($item['description'], 40));
            }
            else {
                $item['title'] = '';
            }
        }

        // Resolve the item's link, falling back to the feed's own link.
        if (empty($item['link'])) {
            $item['link'] = $feed->link;
        }

        // Atom feeds have an ID tag instead of a GUID tag.
        if (!isset($item['guid'])) {
            $item['guid'] = isset($item['id']) ? $item['id'] : '';
        }

        // Atom feeds have a content and/or summary tag instead of a description tag.
        if (!empty($item['content:encoded'])) {
            $item['description'] = $item['content:encoded'];
        }
        elseif (!empty($item['summary'])) {
            $item['description'] = $item['summary'];
        }
        elseif (!empty($item['content'])) {
            $item['description'] = $item['content'];
        }

        // Try to resolve and parse the item's publication date. The first
        // non-empty tag in the preference list wins.
        $date = '';
        foreach ($date_keys as $key) {
            if (!empty($item[$key])) {
                $date = $item[$key];
                break;
            }
        }

        $item['timestamp'] = strtotime($date);
        if ($item['timestamp'] === FALSE) {
            // Aggregator_parse_w3cdtf() returns FALSE on failure.
            $item['timestamp'] = aggregator_parse_w3cdtf($date);
        }

        // Resolve dc:creator tag as the item author if author tag is not set.
        if (empty($item['author']) && !empty($item['dc:creator'])) {
            $item['author'] = $item['dc:creator'];
        }

        // Guarantee the optional keys exist without overwriting parsed values.
        $item += array(
            'author' => '',
            'description' => '',
        );

        // Store on $feed object. This is where processors will look for parsed items.
        $feed->items[] = $item;
    }

    return TRUE;
}

