You are here

abstract class FeedsExBase in Feeds extensible parsers 7.2

Same name and namespace in other branches
  1. 7 src/ \FeedsExBase

The Feeds extensible parser.


Expanded class hierarchy of FeedsExBase

2 string references to 'FeedsExBase'
feeds_ex_feeds_plugins in ./
Implements hook_feeds_plugins().
feeds_ex_test_feeds_plugins in tests/feeds_ex_test.module
Implements hook_feeds_plugins().


src/, line 11
Contains FeedsExBase.

View source
abstract class FeedsExBase extends FeedsParser {

   * Whether the current system handles mb_* functions.
   * @var bool
  protected $isMultibyte;

   * The object used to display messages to the user.
   * @var FeedsExMessengerInterface
  protected $messenger;

   * Returns rows to be parsed.
   * @param FeedsSource $source
   *   Source information.
   * @param FeedsFetcherResult $fetcher_result
   *   The result returned by the fetcher.
   * @return array|Traversable
   *   Some iterable that returns rows.
  protected abstract function executeContext(FeedsSource $source, FeedsFetcherResult $fetcher_result);

   * Executes a single source expression.
   * @param string $machine_name
   *   The source machine name being executed.
   * @param string $expression
   *   The expression to execute.
   * @param mixed $row
   *   The row to execute on.
   * @return scalar|scalar[]
   *   Either a scalar, or a list of scalars. If null, the value will be
   *   ignored.
  protected abstract function executeSourceExpression($machine_name, $expression, $row);

   * Validates an expression.
   * @param string &$expression
   *   The expression to validate.
   * @return string|null
   *   Return the error string, or null if validation was passed.
  protected abstract function validateExpression(&$expression);

   * Returns the errors after parsing.
   * @return array
   *   A structured array with keys:
   *   - message: The error message.
   *   - variables: The variables for the message.
   *   - severity: The severity of the message.
   * @see watchdog()
  protected abstract function getErrors();

   * Allows subclasses to prepare for parsing.
   * @param FeedsSource $source
   *   The feed source.
   * @param FeedsFetcherResult $fetcher_result
   *   The result of the fetching stage.
  protected function setUp(FeedsSource $source, FeedsFetcherResult $fetcher_result) {

   * Allows subclasses to cleanup after parsing.
   * @param FeedsSource $source
   *   The feed source.
   * @param FeedsParserResult $parser_result
   *   The result of parsing.
  protected function cleanUp(FeedsSource $source, FeedsParserResult $parser_result) {

   * Starts internal error handling.
   * Subclasses can override this to begin error handling.
  protected function startErrorHandling() {

   * Stops internal error handling.
   * Subclasses can override this to end error handling.
  protected function stopErrorHandling() {

   * Loads the necessary library.
   * Subclasses can override this to load the necessary library. It will be
   * called automatically.
   * @throws RuntimeException
   *   Thrown if the library does not exist.
  protected function loadLibrary() {

   * Returns whether or not this parser uses a context query.
   * Sub-classes can return false here if they don't require a user-configured
   * context query.
   * @return bool
   *   True if the parser uses a context query and false if not.
  protected function hasConfigurableContext() {
    return TRUE;

   * Returns the list of table headers.
   * @return array
   *   A list of header names keyed by the form keys.
  protected function configFormTableHeader() {
    return array();

   * Returns a form element for a specific column.
   * @param array &$form_state
   *   The current form state.
   * @param string $column_name
   *   The name of the column.
   * @param array $source
   *   The individual source item.
   * @return array
   *   A single form element.
  protected function configFormTableColumn(array &$form_state, $column_name, array $source) {
    return array();

   * {@inheritdoc}
  protected function __construct($id) {
    $this->isMultibyte = $GLOBALS['multibyte'] == UNICODE_MULTIBYTE;

   * {@inheritdoc}
  public function parse(FeedsSource $source, FeedsFetcherResult $fetcher_result) {
    try {
      $result = $this
        ->delegateParsing($source, $fetcher_result);
    } catch (FeedsExEmptyException $e) {

      // The feed is empty.
        ->setMessage(t('The feed is empty.'), 'warning', FALSE);
      $result = new FeedsParserResult();
    } catch (Expcetion $exception) {

      // Do nothing. Store for later.

    // Show some warnings.
    $errors = $this
    if ($this->config['display_errors']) {
        ->printErrors($errors, WATCHDOG_DEBUG);
    else {

      // Always print fatal errors.

    // Log any fatal errors.
      ->logErrors($source, $errors);
    if (isset($exception)) {
      throw $exception;
    return $result;

   * Delegates parsing to the subclass.
   * @param FeedsSource $source
   *   The feed source.
   * @param FeedsFetcherResult $fetcher_result
   *   The fetcher result.
   * @return FeedsParserResult
   *   The populated parser result.
   * @throws FeedsExEmptyException
   *   Thrown if the feed is empty.
   * @throws Exception
   *   Thrown if an error occurred during parsing.
  protected function delegateParsing(FeedsSource $source, FeedsFetcherResult $fetcher_result) {
    $result = new FeedsParserResult();

    // Set link.
    $fetcher_config = $source
    $result->link = is_string($fetcher_config['source']) ? $fetcher_config['source'] : '';
    $expressions = $this
    $variable_map = $this
      ->setUp($source, $fetcher_result);
    foreach ($this
      ->executeContext($source, $fetcher_result) as $row) {
      if ($item = $this
        ->executeSources($row, $expressions, $variable_map)) {
        $result->items[] = $item;
      ->cleanUp($source, $result);
    return $result;

   * Prepares the expressions for parsing.
   * At this point we just remove empty expressions.
   * @return array
   *   A map of machine name to expression.
  protected function prepareExpressions() {
    $expressions = array();
    foreach ($this->config['sources'] as $machine_name => $source) {
      if (strlen($source['value'])) {
        $expressions[$machine_name] = $source['value'];
    return $expressions;

   * Prepares the variable map used for substitution.
   * @param array $expressions
   *   The expressions being parsed.
   * @return array
   *   A map of machine name to variable name.
  protected function prepareVariables(array $expressions) {
    $variable_map = array();
    foreach ($expressions as $machine_name => $expression) {
      $variable_map[$machine_name] = '$' . $machine_name;
    return $variable_map;

   * Executes the source expressions.
   * @param mixed $row
   *   A single item returned from the context expression.
   * @param array $expressions
   *   A map of machine name to expression.
   * @param array $variable_map
   *   A map of machine name to variable name.
   * @return array
   *   The fully-parsed item array.
  protected function executeSources($row, array $expressions, array $variable_map) {
    $item = array();
    $variables = array();
    foreach ($expressions as $machine_name => $expression) {

      // Variable substitution.
      $expression = strtr($expression, $variables);
      $result = $this
        ->executeSourceExpression($machine_name, $expression, $row);
      if (!empty($this->config['sources'][$machine_name]['debug'])) {
          ->debug($result, $machine_name);
      if ($result === NULL) {
        $variables[$variable_map[$machine_name]] = '';
      $item[$machine_name] = $result;
      $variables[$variable_map[$machine_name]] = is_array($result) ? reset($result) : $result;
    return $item;

   * Prints errors to the screen.
   * @param array $errors
   *   A list of errors as returned by getErrors(). Each error is an array with
   *   the keys 'message', 'variables' and 'severity'.
   * @param int $severity
   *   (optional) Limit to only errors of the specified severity. Defaults to
   *   WATCHDOG_ERROR.
   * @see watchdog()
  protected function printErrors(array $errors, $severity = WATCHDOG_ERROR) {
    foreach ($errors as $error) {
      if ($error['severity'] > $severity) {
        ->setMessage(t($error['message'], $error['variables']), $error['severity'] <= WATCHDOG_ERROR ? 'error' : 'warning', FALSE);

   * Logs errors.
   * @param FeedsSource $source
   *   The feed source being imported.
   * @param array $errors
   *   A list of errors as returned by getErrors(). Each error is an array with
   *   the keys 'message', 'variables' and 'severity'.
   * @param int $severity
   *   (optional) Limit to only errors of the specified severity. Defaults to
   *   WATCHDOG_ERROR.
   * @see watchdog()
  protected function logErrors(FeedsSource $source, array $errors, $severity = WATCHDOG_ERROR) {
    foreach ($errors as $error) {
      if ($error['severity'] > $severity) {
        ->log('feeds_ex', $error['message'], $error['variables'], $error['severity']);

   * Detects the encoding of a string.
   * @param string $data
   *   The string to guess the encoding for.
   * @return string|bool
   *   Returns the encoding, or false if one could not be detected.
   * @todo Add other methods of encoding detection.
  protected function detectEncoding($data) {
    if ($this->isMultibyte) {
      return mb_detect_encoding($data, $this->config['source_encoding'], TRUE);
    return FALSE;

   * Converts a string to UTF-8.
   * Requires the iconv, GNU recode or mbstring PHP extension.
   * @param string $data
   *   The string to convert.
   * @param string $encoding
   *   The source encoding to convert from.
   * @return string
   *   The encoded string, or the original string if encoding failed.
   * @see drupal_convert_to_utf8()
  protected function convertEncoding($data, $encoding) {
    $php_supported = array(
    if (in_array(strtolower($encoding), $php_supported)) {
      return $data;
    $converted = drupal_convert_to_utf8($data, $encoding);
    if ($converted === FALSE) {
      return $data;
    return $converted;

   * Renders our debug messages into a list.
   * @param mixed $data
   *   The result of an expression. Either a scalar or a list of scalars.
   * @param string $machine_name
   *   The source key that produced this query.
  protected function debug($data, $machine_name) {
    $name = $machine_name;
    if ($this->config['sources'][$machine_name]['name']) {
      $name = $this->config['sources'][$machine_name]['name'];
    $output = '<strong>' . $name . ':</strong>';
    $data = is_array($data) ? $data : array(
    foreach ($data as $key => $value) {
      $data[$key] = check_plain($value);
    $output .= theme('item_list', array(
      'items' => $data,

   * {@inheritdoc}
  public function getMappingSources() {
    return parent::getMappingSources() + $this->config['sources'];

   * {@inheritdoc}
  public function configDefaults() {
    return array(
      'sources' => array(),
      'context' => array(
        'value' => '',
      'display_errors' => FALSE,
      'source_encoding' => array(
      'debug_mode' => FALSE,

   * {@inheritdoc}
  public function configForm(&$form_state) {
    $form = array(
      '#tree' => TRUE,
      '#theme' => 'feeds_ex_configuration_table',
      '#prefix' => '<div id="feeds-ex-configuration-wrapper">',
      '#suffix' => '</div>',
    if ($this
      ->hasConfigurableContext()) {
      $form['context']['name'] = array(
        '#type' => 'markup',
        '#markup' => t('Context'),
      $form['context']['value'] = array(
        '#type' => 'textfield',
        '#title' => t('Context value'),
        '#title_display' => 'invisible',
        '#default_value' => $this->config['context']['value'],
        '#size' => 50,
        '#required' => TRUE,
        // We're hiding the title, so add a little hint.
        '#description' => '<span class="form-required">*</span>',
        '#attributes' => array(
          'class' => array(
    $form['sources'] = array(
      '#id' => 'feeds-ex-source-table',
    $max_weight = 0;
    foreach ($this->config['sources'] as $machine_name => $source) {
      $form['sources'][$machine_name]['name'] = array(
        '#type' => 'textfield',
        '#title' => t('Name'),
        '#title_display' => 'invisible',
        '#default_value' => $source['name'],
        '#size' => 20,
      $form['sources'][$machine_name]['machine_name'] = array(
        '#title' => t('Machine name'),
        '#title_display' => 'invisible',
        '#markup' => $machine_name,
      $form['sources'][$machine_name]['value'] = array(
        '#type' => 'textfield',
        '#title' => t('Value'),
        '#title_display' => 'invisible',
        '#default_value' => $source['value'],
        '#size' => 50,
      foreach ($this
        ->configFormTableHeader() as $column => $name) {
        $form['sources'][$machine_name][$column] = $this
          ->configFormTableColumn($form_state, $column, $source);
      $form['sources'][$machine_name]['debug'] = array(
        '#type' => 'checkbox',
        '#title' => t('Debug'),
        '#title_display' => 'invisible',
        '#default_value' => $source['debug'],
      $form['sources'][$machine_name]['remove'] = array(
        '#type' => 'checkbox',
        '#title' => t('Remove'),
        '#title_display' => 'invisible',
      $form['sources'][$machine_name]['weight'] = array(
        '#type' => 'textfield',
        '#default_value' => $source['weight'],
        '#size' => 3,
        '#attributes' => array(
          'class' => array(
      $max_weight = $source['weight'];
    $form['add']['name'] = array(
      '#type' => 'textfield',
      '#title' => t('Add new source'),
      '#id' => 'edit-sources-add-name',
      '#description' => t('Name'),
      '#size' => 20,
    $form['add']['machine_name'] = array(
      '#title' => t('Machine name'),
      '#title_display' => 'invisible',
      '#type' => 'machine_name',
      '#machine_name' => array(
        'exists' => 'feeds_ex_source_exists',
        'source' => array(
        'standalone' => TRUE,
        'label' => '',
      '#field_prefix' => '<span dir="ltr">',
      '#field_suffix' => '</span>&lrm;',
      '#feeds_importer' => $this->id,
      '#required' => FALSE,
      '#maxlength' => 32,
      '#size' => 15,
      '#description' => t('A unique machine-readable name containing letters, numbers, and underscores.'),
    $form['add']['value'] = array(
      '#type' => 'textfield',
      '#description' => t('Value'),
      '#title' => '&nbsp;',
      '#size' => 50,
    foreach ($this
      ->configFormTableHeader() as $column => $name) {
      $form['add'][$column] = $this
        ->configFormTableColumn($form_state, $column, array());
    $form['add']['debug'] = array(
      '#type' => 'checkbox',
      '#title' => t('Debug'),
      '#title_display' => 'invisible',
    $form['add']['weight'] = array(
      '#type' => 'textfield',
      '#default_value' => ++$max_weight,
      '#size' => 3,
      '#attributes' => array(
        'class' => array(
    $form['display_errors'] = array(
      '#type' => 'checkbox',
      '#title' => t('Display errors'),
      '#description' => t('Display all error messages after parsing. Fatal errors will always be displayed.'),
      '#default_value' => $this->config['display_errors'],
    $form['debug_mode'] = array(
      '#type' => 'checkbox',
      '#title' => t('Enable debug mode'),
      '#description' => t('Displays the configuration form on the feed source page to ease figuring out the expressions. Any values entered on that page will be saved here.'),
      '#default_value' => $this->config['debug_mode'],
    if ($this->isMultibyte) {
      $args = array(
        '%encodings' => implode(', ', mb_detect_order()),
      $form['source_encoding'] = array(
        '#type' => 'textfield',
        '#title' => t('Source encoding'),
        '#description' => t('The possible encodings of the source files. auto: %encodings', $args),
        '#default_value' => implode(', ', $this->config['source_encoding']),
        '#autocomplete_path' => '_feeds_ex/encoding_autocomplete',
    $form['#attached']['drupal_add_tabledrag'][] = array(
    $form['#attached']['css'][] = drupal_get_path('module', 'feeds_ex') . '/feeds_ex.css';
    $form['#header'] = $this
    return $form;

   * {@inheritdoc}
  public function configFormValidate(&$values) {

    // Throwing an exception during validation shows a nasty error to users.
    try {
    } catch (RuntimeException $e) {
        ->getMessage(), 'error', FALSE);

    // @todo We should do this in Feeds automatically.
    $values += $this

    // Remove sources.
    foreach ($values['sources'] as $machine_name => $source) {
      if (!empty($source['remove'])) {

    // Validate context.
    if ($this
      ->hasConfigurableContext()) {
      if ($message = $this
        ->validateExpression($values['context']['value'])) {
        form_set_error('context', $message);

    // Validate expressions.
    foreach (array_keys($values['sources']) as $machine_name) {
      if ($message = $this
        ->validateExpression($values['sources'][$machine_name]['value'])) {
        form_set_error('sources][' . $machine_name . '][value', $message);

    // Add new source.
    if (strlen($values['add']['machine_name']) && strlen($values['add']['name'])) {
      if ($message = $this
        ->validateExpression($values['add']['value'])) {
        form_set_error('add][value', $message);
      else {
        $values['sources'][$values['add']['machine_name']] = $values['add'];

    // Rebuild sources to keep the configuration values clean.
    $columns = $this
    unset($columns['remove'], $columns['machine_name']);
    $columns = array_keys($columns);
    foreach ($values['sources'] as $machine_name => $source) {
      $new_value = array();
      foreach ($columns as $column) {
        $new_value[$column] = $source[$column];
      $values['sources'][$machine_name] = $new_value;

    // Sort by weight.
    uasort($values['sources'], 'ctools_plugin_sort');
    if (!$this->isMultibyte) {

    // Normalize encodings. Make them exactly as they are defined in
    // mb_list_encodings(), but maintain user-defined order.
    $encodings = array_map('drupal_strtolower', array_map('trim', explode(',', $values['source_encoding'])));
    $values['source_encoding'] = array();
    foreach (mb_list_encodings() as $encoding) {

      // Maintain order.
      $pos = array_search(drupal_strtolower($encoding), $encodings);
      if ($pos !== FALSE) {
        $values['source_encoding'][$pos] = $encoding;

    // Make sure there's some value set.
    if (!$values['source_encoding']) {
      $values['source_encoding'][] = 'auto';

   * {@inheritdoc}
  public function hasConfigForm() {
    return TRUE;

   * {@inheritdoc}
  public function sourceDefaults() {
    return array();

   * {@inheritdoc}
  public function sourceForm($source_config) {
    if (!$this
      ->hasSourceConfig()) {
      return array();
    $form_state = array();
    $form = $this
    $form['add']['machine_name']['#machine_name']['source'] = array(
    return $form;

   * {@inheritdoc}
  public function sourceFormValidate(&$source_config) {

   * {@inheritdoc}
  public function sourceSave(FeedsSource $source) {
    $config = $source
      ->setConfigFor($this, array());
    if ($this
      ->hasSourceConfig() && $config) {

   * {@inheritdoc}
  public function hasSourceConfig() {
    return !empty($this->config['debug_mode']);

   * Returns the configuration form table header.
   * @return array
   *   The header array.
  protected function getFormHeader() {
    $header = array(
      'name' => t('Name'),
      'machine_name' => t('Machine name'),
      'value' => t('Value'),
    $header += $this
    $header += array(
      'debug' => t('Debug'),
      'remove' => t('Remove'),
      'weight' => t('Weight'),
    return $header;

   * Sets the multibyte handling.
   * @param bool $is_multibyte
   *   Whether this parser should assume multibyte handling exists.
   * @internal Used only during testing to force handling.
  public function setMultibyte($is_multibyte) {
    $this->isMultibyte = (bool) $is_multibyte;

   * Sets the messenger to be used to display messages.
   * @param FeedsExMessengerInterface $messenger
   *   The messenger.
  public function setMessenger(FeedsExMessengerInterface $messenger) {
    $this->messenger = $messenger;

   * Returns the messenger.
   * @return FeedsExMessengerInterface
   *   The messenger.
  public function getMessenger() {
    if (!isset($this->messenger)) {
      $this->messenger = new FeedsExMessenger();
    return $this->messenger;



Namesort descending Modifiers Type Description Overrides
FeedsExBase::$isMultibyte protected property Whether the current system handles mb_* functions.
FeedsExBase::$messenger protected property The object used to display messages to the user.
FeedsExBase::cleanUp protected function Allows subclasses to cleanup after parsing. 3
FeedsExBase::configDefaults public function 1
FeedsExBase::configForm public function 1
FeedsExBase::configFormTableColumn protected function Returns a form element for a specific column. 1
FeedsExBase::configFormTableHeader protected function Returns the list of table headers. 1
FeedsExBase::configFormValidate public function
FeedsExBase::convertEncoding protected function Converts a string to UTF-8. 1
FeedsExBase::debug protected function Renders our debug messages into a list.
FeedsExBase::delegateParsing protected function Delegates parsing to the subclass.
FeedsExBase::detectEncoding protected function Detects the encoding of a string.
FeedsExBase::executeContext abstract protected function Returns rows to be parsed. 4
FeedsExBase::executeSourceExpression abstract protected function Executes a single source expression. 4
FeedsExBase::executeSources protected function Executes the source expressions.
FeedsExBase::getErrors abstract protected function Returns the errors after parsing. 4
FeedsExBase::getFormHeader protected function Returns the configuration form table header.
FeedsExBase::getMappingSources public function
FeedsExBase::getMessenger public function Returns the messenger.
FeedsExBase::hasConfigForm public function
FeedsExBase::hasConfigurableContext protected function Returns whether or not this parser uses a context query. 2
FeedsExBase::hasSourceConfig public function
FeedsExBase::loadLibrary protected function Loads the necessary library. 2
FeedsExBase::logErrors protected function Logs errors.
FeedsExBase::parse public function
FeedsExBase::prepareExpressions protected function Prepares the expressions for parsing.
FeedsExBase::prepareVariables protected function Prepares the variable map used for substitution.
FeedsExBase::printErrors protected function Prints errors to the screen.
FeedsExBase::setMessenger public function Sets the messenger to be used to display messages.
FeedsExBase::setMultibyte public function Sets the multibyte handling.
FeedsExBase::setUp protected function Allows subclasses to prepare for parsing. 3
FeedsExBase::sourceDefaults public function
FeedsExBase::sourceForm public function
FeedsExBase::sourceFormValidate public function
FeedsExBase::sourceSave public function
FeedsExBase::startErrorHandling protected function Starts internal error handling. 1
FeedsExBase::stopErrorHandling protected function Stops internal error handling. 1
FeedsExBase::validateExpression abstract protected function Validates an expression. 4
FeedsExBase::__construct protected function 1