484 lines
		
	
	
		
			17 KiB
		
	
	
	
		
			PHP
		
	
	
	
	
	
			
		
		
	
	
			484 lines
		
	
	
		
			17 KiB
		
	
	
	
		
			PHP
		
	
	
	
	
	
| <?php
 | |
| 
 | |
| namespace Masterminds\HTML5\Tests;
 | |
| 
 | |
| use Masterminds\HTML5;
 | |
| 
 | |
| class Html5Test extends TestCase
 | |
| {
 | |
|     /**
 | |
|      * @var HTML5
 | |
|      */
 | |
|     private $html5;
 | |
| 
 | |
|     public function setUp()
 | |
|     {
 | |
|         $this->html5 = $this->getInstance();
 | |
|     }
 | |
| 
 | |
|     /**
 | |
|      * Parse and serialize a string.
 | |
|      */
 | |
|     protected function cycle($html)
 | |
|     {
 | |
|         $dom = $this->html5->loadHTML('<!DOCTYPE html><html><body>' . $html . '</body></html>');
 | |
|         $out = $this->html5->saveHTML($dom);
 | |
| 
 | |
|         return $out;
 | |
|     }
 | |
| 
 | |
|     protected function cycleFragment($fragment)
 | |
|     {
 | |
|         $dom = $this->html5->loadHTMLFragment($fragment);
 | |
|         $out = $this->html5->saveHTML($dom);
 | |
| 
 | |
|         return $out;
 | |
|     }
 | |
| 
 | |
|     public function testImageTagsInSvg()
 | |
|     {
 | |
|         $html = '<!DOCTYPE html>
 | |
|                     <html>
 | |
|                         <head>
 | |
|                             <title>foo</title>
 | |
|                         </head>
 | |
|                         <body>
 | |
|                             <svg>
 | |
|                                 <image height="10" width="10"></image>
 | |
|                             </svg>
 | |
|                         </body>
 | |
|                     </html>';
 | |
|         $doc = $this->html5->loadHTML($html);
 | |
|         $this->assertInstanceOf('DOMElement', $doc->getElementsByTagName('image')->item(0));
 | |
|         $this->assertEmpty($this->html5->getErrors());
 | |
|     }
 | |
| 
 | |
|     public function testLoadOptions()
 | |
|     {
 | |
|         // doc
 | |
|         $dom = $this->html5->loadHTML($this->wrap('<t:tag/>'), array(
 | |
|             'implicitNamespaces' => array('t' => 'http://example.com'),
 | |
|             'xmlNamespaces' => true,
 | |
|         ));
 | |
|         $this->assertInstanceOf('\DOMDocument', $dom);
 | |
|         $this->assertEmpty($this->html5->getErrors());
 | |
|         $this->assertFalse($this->html5->hasErrors());
 | |
| 
 | |
|         $xpath = new \DOMXPath($dom);
 | |
|         $xpath->registerNamespace('t', 'http://example.com');
 | |
|         $this->assertEquals(1, $xpath->query('//t:tag')->length);
 | |
| 
 | |
|         // doc fragment
 | |
|         $frag = $this->html5->loadHTMLFragment('<t:tag/>', array(
 | |
|             'implicitNamespaces' => array('t' => 'http://example.com'),
 | |
|             'xmlNamespaces' => true,
 | |
|         ));
 | |
|         $this->assertInstanceOf('\DOMDocumentFragment', $frag);
 | |
|         $this->assertEmpty($this->html5->getErrors());
 | |
|         $this->assertFalse($this->html5->hasErrors());
 | |
| 
 | |
|         $frag->ownerDocument->appendChild($frag);
 | |
|         $xpath = new \DOMXPath($frag->ownerDocument);
 | |
|         $xpath->registerNamespace('t', 'http://example.com');
 | |
|         $this->assertEquals(1, $xpath->query('//t:tag', $frag)->length);
 | |
|     }
 | |
| 
 | |
|     public function testEncodingUtf8()
 | |
|     {
 | |
|         $dom = $this->html5->load(__DIR__ . '/Fixtures/encoding/utf-8.html');
 | |
|         $this->assertInstanceOf('\DOMDocument', $dom);
 | |
|         $this->assertEmpty($this->html5->getErrors());
 | |
|         $this->assertFalse($this->html5->hasErrors());
 | |
| 
 | |
|         $this->assertContains('Žťčýů', $dom->saveHTML());
 | |
|     }
 | |
| 
 | |
|     public function testEncodingWindows1252()
 | |
|     {
 | |
|         $dom = $this->html5->load(__DIR__ . '/Fixtures/encoding/windows-1252.html', array(
 | |
|             'encoding' => 'Windows-1252',
 | |
|         ));
 | |
| 
 | |
|         $this->assertInstanceOf('\DOMDocument', $dom);
 | |
|         $this->assertEmpty($this->html5->getErrors());
 | |
|         $this->assertFalse($this->html5->hasErrors());
 | |
| 
 | |
|         $dumpedAsUtf8 = mb_convert_encoding($dom->saveHTML(), 'UTF-8', 'Windows-1252');
 | |
|         $this->assertNotFalse(mb_strpos($dumpedAsUtf8, 'Ž'));
 | |
|         $this->assertNotFalse(mb_strpos($dumpedAsUtf8, 'è'));
 | |
|         $this->assertNotFalse(mb_strpos($dumpedAsUtf8, 'ý'));
 | |
|         $this->assertNotFalse(mb_strpos($dumpedAsUtf8, 'ù'));
 | |
|     }
 | |
| 
 | |
|     public function testErrors()
 | |
|     {
 | |
|         $dom = $this->html5->loadHTML('<xx as>');
 | |
|         $this->assertInstanceOf('\DOMDocument', $dom);
 | |
| 
 | |
|         $this->assertNotEmpty($this->html5->getErrors());
 | |
|         $this->assertTrue($this->html5->hasErrors());
 | |
|     }
 | |
| 
 | |
|     public function testLoad()
 | |
|     {
 | |
|         $dom = $this->html5->load(__DIR__ . '/Html5Test.html');
 | |
|         $this->assertInstanceOf('\DOMDocument', $dom);
 | |
|         $this->assertEmpty($this->html5->getErrors());
 | |
|         $this->assertFalse($this->html5->hasErrors());
 | |
| 
 | |
|         $file = fopen(__DIR__ . '/Html5Test.html', 'r');
 | |
|         $dom = $this->html5->load($file);
 | |
|         $this->assertInstanceOf('\DOMDocument', $dom);
 | |
|         $this->assertEmpty($this->html5->getErrors());
 | |
| 
 | |
|         $dom = $this->html5->loadHTMLFile(__DIR__ . '/Html5Test.html');
 | |
|         $this->assertInstanceOf('\DOMDocument', $dom);
 | |
|         $this->assertEmpty($this->html5->getErrors());
 | |
|     }
 | |
| 
 | |
|     public function testLoadHTML()
 | |
|     {
 | |
|         $contents = file_get_contents(__DIR__ . '/Html5Test.html');
 | |
|         $dom = $this->html5->loadHTML($contents);
 | |
|         $this->assertInstanceOf('\DOMDocument', $dom);
 | |
|         $this->assertEmpty($this->html5->getErrors());
 | |
|     }
 | |
| 
 | |
|     public function testLoadHTMLWithComments()
 | |
|     {
 | |
|         $contents = '<!--[if lte IE 8]> <html class="no-js lt-ie9" lang="en"> <![endif]-->
 | |
| <!--[if gt IE 8]> <!--><html class="no-js" lang="en"><!--<![endif]-->
 | |
| </html>';
 | |
| 
 | |
|         $dom = $this->html5->loadHTML($contents);
 | |
|         $this->assertInstanceOf('\DOMDocument', $dom);
 | |
| 
 | |
|         $expected = '<!DOCTYPE html>
 | |
| <!--[if lte IE 8]> <html class="no-js lt-ie9" lang="en"> <![endif]--><!--[if gt IE 8]> <!--><html class="no-js" lang="en"><!--<![endif]--></html>
 | |
| ';
 | |
|         $this->assertEquals($expected, $this->html5->saveHTML($dom));
 | |
|     }
 | |
| 
 | |
|     public function testLoadHTMLFragment()
 | |
|     {
 | |
|         $fragment = '<section id="Foo"><div class="Bar">Baz</div></section>';
 | |
|         $dom = $this->html5->loadHTMLFragment($fragment);
 | |
|         $this->assertInstanceOf('\DOMDocumentFragment', $dom);
 | |
|         $this->assertEmpty($this->html5->getErrors());
 | |
|     }
 | |
| 
 | |
|     public function testSaveHTML()
 | |
|     {
 | |
|         $dom = $this->html5->load(__DIR__ . '/Html5Test.html');
 | |
|         $this->assertInstanceOf('\DOMDocument', $dom);
 | |
|         $this->assertEmpty($this->html5->getErrors());
 | |
| 
 | |
|         $saved = $this->html5->saveHTML($dom);
 | |
|         $this->assertRegExp('|<p>This is a test.</p>|', $saved);
 | |
|     }
 | |
| 
 | |
|     public function testSaveHTMLFragment()
 | |
|     {
 | |
|         $fragment = '<section id="Foo"><div class="Bar">Baz</div></section>';
 | |
|         $dom = $this->html5->loadHTMLFragment($fragment);
 | |
| 
 | |
|         $string = $this->html5->saveHTML($dom);
 | |
|         $this->assertEquals($fragment, $string);
 | |
|     }
 | |
| 
 | |
|     public function testSave()
 | |
|     {
 | |
|         $dom = $this->html5->load(__DIR__ . '/Html5Test.html');
 | |
|         $this->assertInstanceOf('\DOMDocument', $dom);
 | |
|         $this->assertEmpty($this->html5->getErrors());
 | |
| 
 | |
|         // Test resource
 | |
|         $file = fopen('php://temp', 'w');
 | |
|         $this->html5->save($dom, $file);
 | |
|         $content = stream_get_contents($file, -1, 0);
 | |
|         $this->assertRegExp('|<p>This is a test.</p>|', $content);
 | |
| 
 | |
|         // Test file
 | |
|         $tmpfname = tempnam(sys_get_temp_dir(), 'html5-php');
 | |
|         $this->html5->save($dom, $tmpfname);
 | |
|         $content = file_get_contents($tmpfname);
 | |
|         $this->assertRegExp('|<p>This is a test.</p>|', $content);
 | |
|         unlink($tmpfname);
 | |
|     }
 | |
| 
 | |
|     // This test reads a document into a dom, turn the dom into a document,
 | |
|     // then tries to read that document again. This makes sure we are reading,
 | |
|     // and generating a document that works at a high level.
 | |
|     public function testItWorks()
 | |
|     {
 | |
|         $dom = $this->html5->load(__DIR__ . '/Html5Test.html');
 | |
|         $this->assertInstanceOf('\DOMDocument', $dom);
 | |
|         $this->assertEmpty($this->html5->getErrors());
 | |
| 
 | |
|         $saved = $this->html5->saveHTML($dom);
 | |
| 
 | |
|         $dom2 = $this->html5->loadHTML($saved);
 | |
|         $this->assertInstanceOf('\DOMDocument', $dom2);
 | |
|         $this->assertEmpty($this->html5->getErrors());
 | |
|     }
 | |
| 
 | |
|     public function testConfig()
 | |
|     {
 | |
|         $html5 = $this->getInstance();
 | |
|         $options = $html5->getOptions();
 | |
|         $this->assertEquals(false, $options['encode_entities']);
 | |
| 
 | |
|         $html5 = $this->getInstance(array(
 | |
|             'foo' => 'bar',
 | |
|             'encode_entities' => true,
 | |
|         ));
 | |
|         $options = $html5->getOptions();
 | |
|         $this->assertEquals('bar', $options['foo']);
 | |
|         $this->assertEquals(true, $options['encode_entities']);
 | |
| 
 | |
|         // Need to reset to original so future tests pass as expected.
 | |
|         // $this->getInstance()->setOption('encode_entities', false);
 | |
|     }
 | |
| 
 | |
|     public function testSvg()
 | |
|     {
 | |
|         $dom = $this->html5->loadHTML(
 | |
|             '<!doctype html>
 | |
|       <html lang="en">
 | |
|         <body>
 | |
|           <div id="foo" class="bar baz">foo bar baz</div>
 | |
|           <svg width="150" height="100" viewBox="0 0 3 2">
 | |
|             <rect width="1" height="2" x="0" fill="#008d46" />
 | |
|             <rect width="1" height="2" x="1" fill="#ffffff" />
 | |
|             <rect width="1" height="2" x="2" fill="#d2232c" />
 | |
|             <text font-family="Verdana" font-size="32">
 | |
|               <textPath xlink:href="#Foo">
 | |
|                 Test Text.
 | |
|               </textPath>
 | |
|             </text>
 | |
|           </svg>
 | |
|         </body>
 | |
|       </html>');
 | |
| 
 | |
|         $this->assertEmpty($this->html5->getErrors());
 | |
| 
 | |
|         // Test a mixed case attribute.
 | |
|         $list = $dom->getElementsByTagName('svg');
 | |
|         $this->assertNotEmpty($list->length);
 | |
|         $svg = $list->item(0);
 | |
|         $this->assertEquals('0 0 3 2', $svg->getAttribute('viewBox'));
 | |
|         $this->assertFalse($svg->hasAttribute('viewbox'));
 | |
| 
 | |
|         // Test a mixed case tag.
 | |
|         // Note: getElementsByTagName is not case sensitive.
 | |
|         $list = $dom->getElementsByTagName('textPath');
 | |
|         $this->assertNotEmpty($list->length);
 | |
|         $textPath = $list->item(0);
 | |
|         $this->assertEquals('textPath', $textPath->tagName);
 | |
|         $this->assertNotEquals('textpath', $textPath->tagName);
 | |
| 
 | |
|         $html = $this->html5->saveHTML($dom);
 | |
|         $this->assertRegExp('|<svg width="150" height="100" viewBox="0 0 3 2">|', $html);
 | |
|         $this->assertRegExp('|<rect width="1" height="2" x="0" fill="#008d46" />|', $html);
 | |
|     }
 | |
| 
 | |
|     public function testMathMl()
 | |
|     {
 | |
|         $dom = $this->html5->loadHTML(
 | |
|             '<!doctype html>
 | |
|       <html lang="en">
 | |
|         <body>
 | |
|           <div id="foo" class="bar baz" definitionURL="http://example.com">foo bar baz</div>
 | |
|           <math>
 | |
|             <mi>x</mi>
 | |
|             <csymbol definitionURL="http://www.example.com/mathops/multiops.html#plusminus">
 | |
|               <mo>±</mo>
 | |
|             </csymbol>
 | |
|             <mi>y</mi>
 | |
|           </math>
 | |
|         </body>
 | |
|       </html>');
 | |
| 
 | |
|         $this->assertEmpty($this->html5->getErrors());
 | |
|         $list = $dom->getElementsByTagName('math');
 | |
|         $this->assertNotEmpty($list->length);
 | |
| 
 | |
|         $list = $dom->getElementsByTagName('div');
 | |
|         $this->assertNotEmpty($list->length);
 | |
|         $div = $list->item(0);
 | |
|         $this->assertEquals('http://example.com', $div->getAttribute('definitionurl'));
 | |
|         $this->assertFalse($div->hasAttribute('definitionURL'));
 | |
|         $list = $dom->getElementsByTagName('csymbol');
 | |
|         $csymbol = $list->item(0);
 | |
|         $this->assertEquals('http://www.example.com/mathops/multiops.html#plusminus', $csymbol->getAttribute('definitionURL'));
 | |
|         $this->assertFalse($csymbol->hasAttribute('definitionurl'));
 | |
| 
 | |
|         $html = $this->html5->saveHTML($dom);
 | |
|         $this->assertRegExp('|<csymbol definitionURL="http://www.example.com/mathops/multiops.html#plusminus">|', $html);
 | |
|         $this->assertRegExp('|<mi>y</mi>|', $html);
 | |
|     }
 | |
| 
 | |
|     public function testUnknownElements()
 | |
|     {
 | |
|         // The : should not have special handling accourding to section 2.9 of the
 | |
|         // spec. This is differenant than XML. Since we don't know these elements
 | |
|         // they are handled as normal elements. Note, to do this is really
 | |
|         // an invalid example and you should not embed prefixed xml in html5.
 | |
|         $dom = $this->html5->loadHTMLFragment(
 | |
|             '<f:rug>
 | |
|       <f:name>Big rectangle thing</f:name>
 | |
|       <f:width>40</f:width>
 | |
|       <f:length>80</f:length>
 | |
|     </f:rug>
 | |
|     <sarcasm>um, yeah</sarcasm>');
 | |
| 
 | |
|         $this->assertEmpty($this->html5->getErrors());
 | |
|         $markup = $this->html5->saveHTML($dom);
 | |
|         $this->assertRegExp('|<f:name>Big rectangle thing</f:name>|', $markup);
 | |
|         $this->assertRegExp('|<sarcasm>um, yeah</sarcasm>|', $markup);
 | |
|     }
 | |
| 
 | |
|     public function testElements()
 | |
|     {
 | |
|         // Should have content.
 | |
|         $res = $this->cycle('<div>FOO</div>');
 | |
|         $this->assertRegExp('|<div>FOO</div>|', $res);
 | |
| 
 | |
|         // Should be empty
 | |
|         $res = $this->cycle('<span></span>');
 | |
|         $this->assertRegExp('|<span></span>|', $res);
 | |
| 
 | |
|         // Should have content.
 | |
|         $res = $this->cycleFragment('<div>FOO</div>');
 | |
|         $this->assertRegExp('|<div>FOO</div>|', $res);
 | |
| 
 | |
|         // Should be empty
 | |
|         $res = $this->cycleFragment('<span></span>');
 | |
|         $this->assertRegExp('|<span></span>|', $res);
 | |
| 
 | |
|         // Elements with dashes and underscores
 | |
|         $res = $this->cycleFragment('<sp-an></sp-an>');
 | |
|         $this->assertRegExp('|<sp-an></sp-an>|', $res);
 | |
|         $res = $this->cycleFragment('<sp_an></sp_an>');
 | |
|         $this->assertRegExp('|<sp_an></sp_an>|', $res);
 | |
| 
 | |
|         // Should have no closing tag.
 | |
|         $res = $this->cycle('<hr>');
 | |
|         $this->assertRegExp('|<hr></body>|', $res);
 | |
|     }
 | |
| 
 | |
|     public function testAttributes()
 | |
|     {
 | |
|         $res = $this->cycle('<use xlink:href="#svg-track" xmlns:xlink="http://www.w3.org/1999/xlink"></use>');
 | |
|         $this->assertContains('<use xlink:href="#svg-track" xmlns:xlink="http://www.w3.org/1999/xlink"></use>', $res);
 | |
| 
 | |
|         $res = $this->cycle('<div attr="val">FOO</div>');
 | |
|         $this->assertRegExp('|<div attr="val">FOO</div>|', $res);
 | |
| 
 | |
|         // XXX: Note that spec does NOT require attrs in the same order.
 | |
|         $res = $this->cycle('<div attr="val" class="even">FOO</div>');
 | |
|         $this->assertRegExp('|<div attr="val" class="even">FOO</div>|', $res);
 | |
| 
 | |
|         $res = $this->cycle('<div xmlns:foo="http://example.com">FOO</div>');
 | |
|         $this->assertRegExp('|<div xmlns:foo="http://example.com">FOO</div>|', $res);
 | |
| 
 | |
|         $res = $this->cycleFragment('<div attr="val">FOO</div>');
 | |
|         $this->assertRegExp('|<div attr="val">FOO</div>|', $res);
 | |
| 
 | |
|         // XXX: Note that spec does NOT require attrs in the same order.
 | |
|         $res = $this->cycleFragment('<div attr="val" class="even">FOO</div>');
 | |
|         $this->assertRegExp('|<div attr="val" class="even">FOO</div>|', $res);
 | |
| 
 | |
|         $res = $this->cycleFragment('<div xmlns:foo="http://example.com">FOO</div>');
 | |
|         $this->assertRegExp('|<div xmlns:foo="http://example.com">FOO</div>|', $res);
 | |
|     }
 | |
| 
 | |
|     public function testPCData()
 | |
|     {
 | |
|         $res = $this->cycle('<a>This is a test.</a>');
 | |
|         $this->assertRegExp('|This is a test.|', $res);
 | |
| 
 | |
|         $res = $this->cycleFragment('<a>This is a test.</a>');
 | |
|         $this->assertRegExp('|This is a test.|', $res);
 | |
| 
 | |
|         $res = $this->cycle('This
 | |
|       is
 | |
|       a
 | |
|       test.');
 | |
| 
 | |
|         // Check that newlines are there, but don't count spaces.
 | |
|         $this->assertRegExp('|This\n\s*is\n\s*a\n\s*test.|', $res);
 | |
| 
 | |
|         $res = $this->cycleFragment('This
 | |
|       is
 | |
|       a
 | |
|       test.');
 | |
| 
 | |
|         // Check that newlines are there, but don't count spaces.
 | |
|         $this->assertRegExp('|This\n\s*is\n\s*a\n\s*test.|', $res);
 | |
| 
 | |
|         $res = $this->cycle('<a>This <em>is</em> a test.</a>');
 | |
|         $this->assertRegExp('|This <em>is</em> a test.|', $res);
 | |
| 
 | |
|         $res = $this->cycleFragment('<a>This <em>is</em> a test.</a>');
 | |
|         $this->assertRegExp('|This <em>is</em> a test.|', $res);
 | |
|     }
 | |
| 
 | |
|     public function testUnescaped()
 | |
|     {
 | |
|         $res = $this->cycle('<script>2 < 1</script>');
 | |
|         $this->assertRegExp('|2 < 1|', $res);
 | |
| 
 | |
|         $res = $this->cycle('<style>div>div>div</style>');
 | |
|         $this->assertRegExp('|div>div>div|', $res);
 | |
| 
 | |
|         $res = $this->cycleFragment('<script>2 < 1</script>');
 | |
|         $this->assertRegExp('|2 < 1|', $res);
 | |
| 
 | |
|         $res = $this->cycleFragment('<style>div>div>div</style>');
 | |
|         $this->assertRegExp('|div>div>div|', $res);
 | |
|     }
 | |
| 
 | |
|     public function testEntities()
 | |
|     {
 | |
|         $res = $this->cycle('<a>Apples & bananas.</a>');
 | |
|         $this->assertRegExp('|Apples & bananas.|', $res);
 | |
| 
 | |
|         $res = $this->cycleFragment('<a>Apples & bananas.</a>');
 | |
|         $this->assertRegExp('|Apples & bananas.|', $res);
 | |
| 
 | |
|         $res = $this->cycleFragment('<p>R&D</p>');
 | |
|         $this->assertRegExp('|R&D|', $res);
 | |
|     }
 | |
| 
 | |
|     public function testCaseSensitiveTags()
 | |
|     {
 | |
|         $dom = $this->html5->loadHTML(
 | |
|             '<html><body><Button color="red">Error</Button></body></html>',
 | |
|             array(
 | |
|                 'xmlNamespaces' => true,
 | |
|             )
 | |
|         );
 | |
|         $out = $this->html5->saveHTML($dom);
 | |
|         $this->assertRegExp('|<html><body><Button color="red">Error</Button></body></html>|', $out);
 | |
|     }
 | |
| 
 | |
|     public function testComment()
 | |
|     {
 | |
|         $res = $this->cycle('a<!-- This is a test. -->b');
 | |
|         $this->assertRegExp('|<!-- This is a test. -->|', $res);
 | |
| 
 | |
|         $res = $this->cycleFragment('a<!-- This is a test. -->b');
 | |
|         $this->assertRegExp('|<!-- This is a test. -->|', $res);
 | |
|     }
 | |
| 
 | |
|     public function testCDATA()
 | |
|     {
 | |
|         $res = $this->cycle('a<![CDATA[ This <is> a test. ]]>b');
 | |
|         $this->assertRegExp('|<!\[CDATA\[ This <is> a test\. \]\]>|', $res);
 | |
| 
 | |
|         $res = $this->cycleFragment('a<![CDATA[ This <is> a test. ]]>b');
 | |
|         $this->assertRegExp('|<!\[CDATA\[ This <is> a test\. \]\]>|', $res);
 | |
|     }
 | |
| }
 |