2 class IPTCTest
extends MediaWikiTestCase
{
3 public function testRecognizeUtf8() {
4 // utf-8 is the only one used in practise.
5 $res = IPTC
::getCharset( "\x1b%G" );
6 $this->assertEquals( 'UTF-8', $res );
9 public function testIPTCParseNoCharset88591() {
10 // basically IPTC for keyword with value of 0xBC which is 1/4 in iso-8859-1
11 // This data doesn't specify a charset. We're supposed to guess
12 // (which basically means utf-8 if valid, windows 1252 (iso 8859-1) if not)
13 $iptcData = "Photoshop 3.0\08BIM\4\4\0\0\0\0\0\x06\x1c\x02\x19\x00\x01\xBC";
14 $res = IPTC
::Parse( $iptcData );
15 $this->assertEquals( array( '¼' ), $res['Keywords'] );
18 /* This one contains a sequence that's valid iso 8859-1 but not valid utf8 */
19 /* \xC3 = Ã, \xB8 = ¸ */
20 public function testIPTCParseNoCharset88591b() {
21 $iptcData = "Photoshop 3.0\08BIM\4\4\0\0\0\0\0\x09\x1c\x02\x19\x00\x04\xC3\xC3\xC3\xB8";
22 $res = IPTC
::Parse( $iptcData );
23 $this->assertEquals( array( 'ÃÃø' ), $res['Keywords'] );
26 /* Same as testIPTCParseNoCharset88591b, but forcing the charset to utf-8.
27 * What should happen is the first "\xC3\xC3" should be dropped as invalid,
28 * leaving \xC3\xB8, which is ø
30 public function testIPTCParseForcedUTFButInvalid() {
31 $iptcData = "Photoshop 3.0\08BIM\4\4\0\0\0\0\0\x11\x1c\x02\x19\x00\x04\xC3\xC3\xC3\xB8"
32 . "\x1c\x01\x5A\x00\x03\x1B\x25\x47";
33 $res = IPTC
::Parse( $iptcData );
34 $this->assertEquals( array( 'ø' ), $res['Keywords'] );
37 public function testIPTCParseNoCharsetUTF8() {
38 $iptcData = "Photoshop 3.0\08BIM\4\4\0\0\0\0\0\x07\x1c\x02\x19\x00\x02¼";
39 $res = IPTC
::Parse( $iptcData );
40 $this->assertEquals( array( '¼' ), $res['Keywords'] );
43 // Testing something that has 2 values for keyword
44 public function testIPTCParseMulti() {
45 $iptcData = /* identifier */ "Photoshop 3.0\08BIM\4\4"
46 /* length */ . "\0\0\0\0\0\x0D"
47 . "\x1c\x02\x19" . "\x00\x01" . "\xBC"
48 . "\x1c\x02\x19" . "\x00\x02" . "\xBC\xBD";
49 $res = IPTC
::Parse( $iptcData );
50 $this->assertEquals( array( '¼', '¼½' ), $res['Keywords'] );
53 public function testIPTCParseUTF8() {
54 // This has the magic "\x1c\x01\x5A\x00\x03\x1B\x25\x47" which marks content as UTF8.
55 $iptcData = "Photoshop 3.0\08BIM\4\4\0\0\0\0\0\x0F\x1c\x02\x19\x00\x02¼\x1c\x01\x5A\x00\x03\x1B\x25\x47";
56 $res = IPTC
::Parse( $iptcData );
57 $this->assertEquals( array( '¼' ), $res['Keywords'] );