-
-
Notifications
You must be signed in to change notification settings - Fork 9.6k
[Serializer] Add a data: URI normalizer #16164
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from 6 commits
efa58f4
28b1e13
790ad3a
b0fe18c
7e5e845
f207713
f4ee396
53e2b26
c03aa28
68869f5
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,121 @@ | ||
<?php | ||
|
||
/* | ||
* This file is part of the Symfony package. | ||
* | ||
* (c) Fabien Potencier <fabien@symfony.com> | ||
* | ||
* For the full copyright and license information, please view the LICENSE | ||
* file that was distributed with this source code. | ||
*/ | ||
|
||
namespace Symfony\Component\Serializer\Normalizer; | ||
|
||
use Symfony\Component\HttpFoundation\File\File; | ||
use Symfony\Component\HttpFoundation\File\MimeType\MimeTypeGuesser; | ||
use Symfony\Component\HttpFoundation\File\MimeType\MimeTypeGuesserInterface; | ||
use Symfony\Component\Serializer\Exception\UnexpectedValueException; | ||
|
||
/** | ||
* Normalizes a {@see \SplFileInfo} object to a data URI. | ||
* Denormalizes a data URI to a {@see \SplFileObject} object. | ||
* | ||
* @author Kévin Dunglas <dunglas@gmail.com> | ||
*/ | ||
class DataUriNormalizer implements NormalizerInterface, DenormalizerInterface | ||
{ | ||
/** | ||
* @var MimeTypeGuesserInterface | ||
*/ | ||
private $mimeTypeGuesser; | ||
|
||
public function __construct(MimeTypeGuesserInterface $mimeTypeGuesser = null) | ||
{ | ||
if (null === $mimeTypeGuesser && class_exists('Symfony\Component\HttpFoundation\File\MimeType\MimeTypeGuesser')) { | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. The There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. It is not useless in the following case: The constructor argument is optional, so the existence of the interface will not be checked and you cannot know if |
||
$mimeTypeGuesser = MimeTypeGuesser::getInstance(); | ||
} | ||
|
||
$this->mimeTypeGuesser = $mimeTypeGuesser; | ||
} | ||
|
||
/** | ||
* {@inheritdoc} | ||
*/ | ||
public function normalize($object, $format = null, array $context = array()) | ||
{ | ||
if ($object instanceof File) { | ||
$mimeType = $object->getMimeType(); | ||
} elseif ($this->mimeTypeGuesser) { | ||
$mimeType = $this->mimeTypeGuesser->guess($object->getPathname()); | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. We would need a type-check on this to make sure it's an There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. The pro as you pointed out is clarity. As dealing with |
||
} else { | ||
$mimeType = 'application/octet-stream'; | ||
} | ||
|
||
list($typeName) = explode('/', $mimeType, 2); | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Why you limit There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Because it won't work:
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. minutiae detail, but I'd like this line moved right before the |
||
|
||
if (!$object instanceof \SplFileObject) { | ||
$object = $object->openFile(); | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. What if the object does not have an There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. It is not possible because of https://github.com/symfony/symfony/pull/16164/files#diff-b7fc65c7d852312152e353f395fc70a8R77 There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. So when can There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. When it's an instance of There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I agree thought that this reads weird to me. The entire class suffers a little bit of complexity since we're handling SplFileInfo, SplFileObject and File (even though they are all instances of After looking for awhile, I don't think there is a problem - it can just be more clear :) There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Splitting this class in 3 normalizers is not convenient for users using the component. It will require to instantiate and register 3 normalizers only to have a correct |
||
} | ||
|
||
$data = ''; | ||
|
||
$object->rewind(); | ||
while (!$object->eof()) { | ||
$data .= $object->fgets(); | ||
} | ||
|
||
if ('text' === $typeName) { | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Making this decision seems a little bit arbitrary... but it kind of makes sense. |
||
return sprintf('data:%s,%s', $mimeType, rawurlencode($data)); | ||
} | ||
|
||
return sprintf('data:%s;base64,%s', $mimeType, base64_encode($data)); | ||
} | ||
|
||
/** | ||
* {@inheritdoc} | ||
*/ | ||
public function supportsNormalization($data, $format = null) | ||
{ | ||
return $data instanceof \SplFileInfo; | ||
} | ||
|
||
/** | ||
* {@inheritdoc} | ||
* | ||
* Regex adapted from Brian Grinstead code. | ||
* | ||
* @see https://gist.github.com/bgrins/6194623 | ||
* | ||
* @throws UnexpectedValueException | ||
*/ | ||
public function denormalize($data, $class, $format = null, array $context = array()) | ||
{ | ||
if (!preg_match('/^data:([a-z0-9]+\/[a-z0-9]+(;[a-z0-9\-]+\=[a-z0-9\-]+)?)?(;base64)?,[a-z0-9\!\$\&\\\'\,\(\)\*\+\,\;\=\-\.\_\~\:\@\/\?\%\s]*\s*$/i', $data)) { | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
...could be made posessive/greedy for better performance...
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. On the other hand, is matching the string all the way to the end really necessary (with a large list of allowed characters)? I mean we're not validating if the actual data corresponds with the encoding specification, the user could still (for example) use the base64 option but not send base64 encoded data. We're taking the correctness of the data (more or less) for granted -- so why allow the regex engine to even bother scanning it? There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. There is two main reasons:
However 👍 to make the regex as fast as possible There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Uh-oh, i can't imagine how the /etc/shadow file could get exposed since the On 20:14, Thu, Feb 4, 2016 Kévin Dunglas notifications@github.com wrote:
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. @dunglas the original RegEx does not match Which means the DataUriNormalizer can't match a Also there's an issue in the I could submit a PR with the aforementioned speedups as well as some logic to make the mime type guessing part optional (ex.: supply a mime type via There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I'm checking out this list and apparently literal dots and underscores are also (sometimes) used in mime-type names (especially in the second part) and dashes are (sometimes) used in the first part. So the RegEx needs to allow for those too. |
||
throw new UnexpectedValueException('The provided "data:" URI is not valid.'); | ||
} | ||
|
||
try { | ||
if ('Symfony\Component\HttpFoundation\File\File' === $class) { | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I think we should check for other class values to an throw an exception if we don't support the given class. That makes it easier for users to spot errors (for example, referring a normalizer they didn't intend to use). |
||
return new File($data, false); | ||
} | ||
|
||
return new \SplFileObject($data); | ||
} catch (\RuntimeException $exception) { | ||
throw new UnexpectedValueException($exception->getMessage(), $exception->getCode(), $exception); | ||
} | ||
} | ||
|
||
/** | ||
* {@inheritdoc} | ||
*/ | ||
public function supportsDenormalization($data, $type, $format = null) | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Why not applying the regex to the data here too? There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Why not but will it be easy to debug that this validator is skipped regardless of the |
||
{ | ||
$supportedTypes = array( | ||
'SplFileInfo' => true, | ||
'SplFileObject' => true, | ||
'Symfony\Component\HttpFoundation\File\File' => true, | ||
); | ||
|
||
return isset($supportedTypes[$type]); | ||
} | ||
} |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1 @@ | ||
Kévin Dunglas |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,176 @@ | ||
<?php | ||
|
||
/* | ||
* This file is part of the Symfony package. | ||
* | ||
* (c) Fabien Potencier <fabien@symfony.com> | ||
* | ||
* For the full copyright and license information, please view the LICENSE | ||
* file that was distributed with this source code. | ||
*/ | ||
|
||
namespace Symfony\Component\Serializer\Tests\Normalizer; | ||
|
||
use Symfony\Component\HttpFoundation\File\File; | ||
use Symfony\Component\Serializer\Normalizer\DataUriNormalizer; | ||
|
||
/** | ||
* @author Kévin Dunglas <dunglas@gmail.com> | ||
*/ | ||
class DataUriNormalizerTest extends \PHPUnit_Framework_TestCase | ||
{ | ||
const TEST_GIF_DATA = ''; | ||
const TEST_TXT_DATA = 'data:text/plain,K%C3%A9vin%20Dunglas%0A'; | ||
const TEST_TXT_CONTENT = "Kévin Dunglas\n"; | ||
|
||
/** | ||
* @var DataUriNormalizer | ||
*/ | ||
private $normalizer; | ||
|
||
public function setUp() | ||
{ | ||
$this->normalizer = new DataUriNormalizer(); | ||
} | ||
|
||
public function testInterface() | ||
{ | ||
$this->assertInstanceOf('Symfony\Component\Serializer\Normalizer\NormalizerInterface', $this->normalizer); | ||
$this->assertInstanceOf('Symfony\Component\Serializer\Normalizer\DenormalizerInterface', $this->normalizer); | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. This test looks useless to me. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I agree with you that it's not very useful but it guaranties that nobody remove the |
||
} | ||
|
||
public function testSupportNormalization() | ||
{ | ||
$this->assertFalse($this->normalizer->supportsNormalization(new \stdClass())); | ||
$this->assertTrue($this->normalizer->supportsNormalization(new \SplFileObject('data:,Hello%2C%20World!'))); | ||
} | ||
|
||
public function testNormalizeHttpFoundationFile() | ||
{ | ||
$file = new File(__DIR__.'/../Fixtures/test.gif'); | ||
|
||
$this->assertSame(self::TEST_GIF_DATA, $this->normalizer->normalize($file)); | ||
} | ||
|
||
public function testNormalizeSplFileInfo() | ||
{ | ||
$file = new \SplFileInfo(__DIR__.'/../Fixtures/test.gif'); | ||
|
||
$this->assertSame(self::TEST_GIF_DATA, $this->normalizer->normalize($file)); | ||
} | ||
|
||
public function testNormalizeText() | ||
{ | ||
$file = new \SplFileObject(__DIR__.'/../Fixtures/test.txt'); | ||
|
||
$data = $this->normalizer->normalize($file); | ||
|
||
$this->assertSame(self::TEST_TXT_DATA, $data); | ||
$this->assertSame(self::TEST_TXT_CONTENT, file_get_contents($data)); | ||
} | ||
|
||
public function testSupportsDenormalization() | ||
{ | ||
$this->assertFalse($this->normalizer->supportsDenormalization('foo', 'Bar')); | ||
$this->assertTrue($this->normalizer->supportsDenormalization(self::TEST_GIF_DATA, 'SplFileInfo')); | ||
$this->assertTrue($this->normalizer->supportsDenormalization(self::TEST_GIF_DATA, 'SplFileObject')); | ||
$this->assertTrue($this->normalizer->supportsDenormalization(self::TEST_TXT_DATA, 'Symfony\Component\HttpFoundation\File\File')); | ||
} | ||
|
||
public function testDenormalizeSplFileInfo() | ||
{ | ||
$file = $this->normalizer->denormalize(self::TEST_TXT_DATA, 'SplFileInfo'); | ||
|
||
$this->assertInstanceOf('SplFileInfo', $file); | ||
$this->assertSame(file_get_contents(self::TEST_TXT_DATA), $this->getContent($file)); | ||
} | ||
|
||
public function testDenormalizeSplFileObject() | ||
{ | ||
$file = $this->normalizer->denormalize(self::TEST_TXT_DATA, 'SplFileObject'); | ||
|
||
$this->assertInstanceOf('SplFileObject', $file); | ||
$this->assertEquals(file_get_contents(self::TEST_TXT_DATA), $this->getContent($file)); | ||
} | ||
|
||
public function testDenormalizeHttpFoundationFile() | ||
{ | ||
$file = $this->normalizer->denormalize(self::TEST_GIF_DATA, 'Symfony\Component\HttpFoundation\File\File'); | ||
|
||
$this->assertInstanceOf('Symfony\Component\HttpFoundation\File\File', $file); | ||
$this->assertSame(file_get_contents(self::TEST_GIF_DATA), $this->getContent($file->openFile())); | ||
} | ||
|
||
/** | ||
* @expectedException \Symfony\Component\Serializer\Exception\UnexpectedValueException | ||
* @expectedExceptionMessage The provided "data:" URI is not valid. | ||
*/ | ||
public function testGiveNotAccessToLocalFiles() | ||
{ | ||
$this->normalizer->denormalize('/etc/shadow', 'SplFileObject'); | ||
} | ||
|
||
/** | ||
* @expectedException \Symfony\Component\Serializer\Exception\UnexpectedValueException | ||
* @dataProvider invalidUriProvider | ||
*/ | ||
public function testInvalidData($uri) | ||
{ | ||
$this->normalizer->denormalize($uri, 'SplFileObject'); | ||
} | ||
|
||
public function invalidUriProvider() | ||
{ | ||
return array( | ||
array('dataxbase64'), | ||
array('data:HelloWorld'), | ||
array('data:text/html;charset=,%3Ch1%3EHello!%3C%2Fh1%3E'), | ||
array('data:text/html;charset,%3Ch1%3EHello!%3C%2Fh1%3E'), | ||
array('data:base64,iVBORw0KGgoAAAANSUhEUgAAABAAAAAQAQMAAAAlPW0iAAAABlBMVEUAAAD///+l2Z/dAAAAM0lEQVR4nGP4/5/h/1+G/58ZDrAz3D/McH8yw83NDDeNGe4Ug9C9zwz3gVLMDA/A6P9/AFGGFyjOXZtQAAAAAElFTkSuQmCC'), | ||
array(''), | ||
array('http://wikipedia.org'), | ||
array('base64'), | ||
array('iVBORw0KGgoAAAANSUhEUgAAABAAAAAQAQMAAAAlPW0iAAAABlBMVEUAAAD///+l2Z/dAAAAM0lEQVR4nGP4/5/h/1+G/58ZDrAz3D/McH8yw83NDDeNGe4Ug9C9zwz3gVLMDA/A6P9/AFGGFyjOXZtQAAAAAElFTkSuQmCC'), | ||
array(' '), | ||
array(' '), | ||
); | ||
} | ||
|
||
/** | ||
* @dataProvider validUriProvider | ||
*/ | ||
public function testValidData($uri) | ||
{ | ||
$this->assertInstanceOf('SplFileObject', $this->normalizer->denormalize($uri, 'SplFileObject')); | ||
} | ||
|
||
public function validUriProvider() | ||
{ | ||
$data = array( | ||
array(''), | ||
array(''), | ||
array(' '), | ||
array('data:,Hello%2C%20World!'), | ||
array('data:text/html,%3Ch1%3EHello%2C%20World!%3C%2Fh1%3E'), | ||
array('data:,A%20brief%20note'), | ||
array('data:text/html;charset=US-ASCII,%3Ch1%3EHello!%3C%2Fh1%3E'), | ||
); | ||
|
||
if (!defined('HHVM_VERSION')) { | ||
// See https://github.com/facebook/hhvm/issues/6354 | ||
$data[] = array('data:text/plain;charset=utf-8;base64,SGVsbG8gV29ybGQh'); | ||
} | ||
|
||
return $data; | ||
} | ||
|
||
private function getContent(\SplFileObject $file) | ||
{ | ||
$buffer = ''; | ||
while (!$file->eof()) { | ||
$buffer .= $file->fgets(); | ||
} | ||
|
||
return $buffer; | ||
} | ||
} |
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
an
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
a SplFileInfo [...] no?
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
an SplFileInfo afaik