feeds_ex-8.x-1.0-alpha4/tests/src/Unit/Feeds/Parser/HtmlParserTest.php
tests/src/Unit/Feeds/Parser/HtmlParserTest.php
<?php namespace Drupal\Tests\feeds_ex\Unit\Feeds\Parser; use Drupal\feeds\Result\RawFetcherResult; use Drupal\feeds_ex\Feeds\Parser\HtmlParser; use Drupal\feeds_ex\Messenger\TestMessenger; use Drupal\feeds_ex\Utility\XmlUtility; /** * @coversDefaultClass \Drupal\feeds_ex\Feeds\Parser\HtmlParser * @group feeds_ex */ class HtmlParserTest extends ParserTestBase { /** * {@inheritdoc} */ public function setUp(): void { parent::setUp(); $configuration = ['feed_type' => $this->feedType]; $utility = new XmlUtility(); $this->parser = new HtmlParser($configuration, 'html', [], $utility); $this->parser->setStringTranslation($this->getStringTranslationStub()); $this->parser->setFeedsExMessenger(new TestMessenger()); } /** * Tests simple parsing. */ public function testSimpleParsing() { $fetcher_result = new RawFetcherResult(file_get_contents($this->moduleDir . '/tests/resources/test.html'), $this->fileSystem); $config = [ 'context' => [ 'value' => '//div[@class="post"]', ], ] + $this->parser->defaultConfiguration(); $this->parser->setConfiguration($config); $this->feedType->expects($this->any()) ->method('getCustomSources') ->willReturn([ 'title' => [ 'label' => 'Title', 'value' => 'h3', ], 'description' => [ 'label' => 'Description', 'value' => 'p', ], ]); $result = $this->parser->parse($this->feed, $fetcher_result, $this->state); $this->assertCount(3, $result); $this->assertSame('I am a title<thing>Stuff</thing>', $result[0]->get('title')); $this->assertSame('I am a description0', $result[0]->get('description')); $this->assertSame('I am a title1', $result[1]->get('title')); $this->assertSame('I am a description1', $result[1]->get('description')); $this->assertSame('I am a title2', $result[2]->get('title')); $this->assertSame('I am a description2', $result[2]->get('description')); } /** * Tests getting the raw value. */ public function testRaw() { $fetcher_result = new RawFetcherResult(file_get_contents($this->moduleDir . '/tests/resources/test.html'), $this->fileSystem); $config = [ 'context' => [ 'value' => '//div[@class="post"]', ], ] + $this->parser->defaultConfiguration(); $this->parser->setConfiguration($config); $this->feedType->expects($this->any()) ->method('getCustomSources') ->willReturn([ 'title' => [ 'label' => 'Title', 'value' => 'h3', ], 'description' => [ 'label' => 'Description', 'value' => 'p', 'raw' => TRUE, ], ]); $result = $this->parser->parse($this->feed, $fetcher_result, $this->state); $this->assertCount(3, $result); $this->assertSame('I am a title<thing>Stuff</thing>', $result[0]->get('title')); $this->assertSame('<p>I am a description0</p>', $result[0]->get('description')); $this->assertSame('I am a title1', $result[1]->get('title')); $this->assertSame('<p>I am a description1</p>', $result[1]->get('description')); $this->assertSame('I am a title2', $result[2]->get('title')); $this->assertSame('<p>I am a description2</p>', $result[2]->get('description')); } /** * Tests innerxml. */ public function testInner() { $fetcher_result = new RawFetcherResult(file_get_contents($this->moduleDir . '/tests/resources/test.html'), $this->fileSystem); $config = [ 'context' => [ 'value' => '//div[@class="post"]', ], ] + $this->parser->defaultConfiguration(); $this->parser->setConfiguration($config); $this->feedType->expects($this->any()) ->method('getCustomSources') ->willReturn([ 'title' => [ 'label' => 'Title', 'value' => 'h3', ], 'description' => [ 'label' => 'Description', 'value' => 'p', 'raw' => TRUE, 'inner' => TRUE, ], ]); $result = $this->parser->parse($this->feed, $fetcher_result, $this->state); $this->assertCount(3, $result); $this->assertSame('I am a title<thing>Stuff</thing>', $result[0]->get('title')); $this->assertSame('I am a description0', $result[0]->get('description')); $this->assertSame('I am a title1', $result[1]->get('title')); $this->assertSame('I am a description1', $result[1]->get('description')); $this->assertSame('I am a title2', $result[2]->get('title')); $this->assertSame('I am a description2', $result[2]->get('description')); } /** * Tests parsing a CP866 (Russian) encoded file. */ public function testCp866Encoded() { $fetcher_result = new RawFetcherResult(file_get_contents($this->moduleDir . '/tests/resources/test_ru.html'), $this->fileSystem); $config = [ 'context' => [ 'value' => '//div[@class="post"]', ], ] + $this->parser->defaultConfiguration(); $this->parser->setConfiguration($config); $this->feedType->expects($this->any()) ->method('getCustomSources') ->willReturn([ 'title' => [ 'label' => 'Title', 'value' => 'h3', ], 'description' => [ 'label' => 'Description', 'value' => 'p', ], ]); $result = $this->parser->parse($this->feed, $fetcher_result, $this->state); $this->assertCount(3, $result); foreach ($result as $delta => $item) { $this->assertSame('Я название' . $delta, $item->get('title')); $this->assertSame('Я описание' . $delta, $item->get('description')); } } /** * Tests a EUC-JP (Japanese) encoded file without the encoding declaration. * * This implicitly tests Base's encoding conversion. */ public function testEucJpEncodedNoDeclaration() { $fetcher_result = new RawFetcherResult(file_get_contents($this->moduleDir . '/tests/resources/test_jp.html'), $this->fileSystem); $config = [ 'context' => [ 'value' => '//div[@class="post"]', ], 'source_encoding' => ['EUC-JP'], ] + $this->parser->defaultConfiguration(); $this->parser->setConfiguration($config); $this->feedType->expects($this->any()) ->method('getCustomSources') ->willReturn([ 'title' => [ 'label' => 'Title', 'value' => 'h3', ], 'description' => [ 'label' => 'Description', 'value' => 'p', ], ]); $result = $this->parser->parse($this->feed, $fetcher_result, $this->state); $this->assertCount(3, $result); foreach ($result as $delta => $item) { $this->assertSame('私はタイトルです' . $delta, $item->get('title')); $this->assertSame('私が説明してい' . $delta, $item->get('description')); } } /** * Tests that the link property is set. * * @todo turned off, because unsure if this is still needed. */ public function testLinkIsSet() { $this->markTestIncomplete(); $this->setProperty($this->feed, 'config', [ 'FeedsFileFetcher' => [ 'source' => 'file fetcher source path', ], ]); $config = ['context' => ['value' => '/beep']]; $result = $this->parser->parse($this->feed, new RawFetcherResult('<?xml version="1.0" encoding="UTF-8"?><item></item>', $this->fileSystem)); $this->assertSame($result->link, 'file fetcher source path'); } /** * Tests empty feed handling. */ public function testEmptyFeed() { $this->feedType->expects($this->any()) ->method('getCustomSources') ->willReturn([]); $this->parser->parse($this->feed, new RawFetcherResult(' ', $this->fileSystem), $this->state); $this->assertEmptyFeedMessage($this->parser->getMessenger()->getMessages()); } }