3 * Formatting of image metadata values into human readable form.
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
15 * You should have received a copy of the GNU General Public License along
16 * with this program; if not, write to the Free Software Foundation, Inc.,
17 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
18 * http://www.gnu.org/copyleft/gpl.html
21 * @author Ævar Arnfjörð Bjarmason <avarab@gmail.com>
22 * @copyright Copyright © 2005, Ævar Arnfjörð Bjarmason, 2009 Brent Garber, 2010 Brian Wolff
23 * @license GPL-2.0-or-later
24 * @see http://exif.org/Exif2-2.PDF The Exif 2.2 specification
27 use MediaWiki\MediaWikiServices
;
28 use Wikimedia\Timestamp\TimestampException
;
31 * Format Image metadata values into a human readable form.
33 * Note lots of these messages use the prefix 'exif' even though
34 * they may not be exif properties. For example 'exif-ImageDescription'
35 * can be the Exif ImageDescription, or it could be the iptc-iim caption
36 * property, or it could be the xmp dc:description property. This
37 * is because these messages should be independent of how the data is
38 * stored, since the user doesn't care if the description is stored in xmp,
39 * exif, etc only that it's a description. (Additionally many of these properties
40 * are merged together following the MWG standard, such that for example,
41 * exif properties override XMP properties that mean the same thing if
42 * there is a conflict).
44 * It should perhaps use a prefix like 'metadata' instead, but there
45 * is already a large number of messages using the 'exif' prefix.
48 * @since 1.23 the class extends ContextSource and various formerly-public
49 * internal methods are private
51 class FormatMetadata
extends ContextSource
{
53 * Only output a single language for multi-language fields
57 protected $singleLang = false;
60 * Trigger only outputting single language for multilanguage fields
65 public function setSingleLanguage( $val ) {
66 $this->singleLang
= $val;
70 * Numbers given by Exif user agents are often magical, that is they
71 * should be replaced by a detailed explanation depending on their
72 * value which most of the time are plain integers. This function
73 * formats Exif (and other metadata) values into human readable form.
75 * This is the usual entry point for this class.
77 * @param array $tags The Exif data to format ( as returned by
78 * Exif::getFilteredData() or BitmapMetadataHandler )
79 * @param bool|IContextSource $context Context to use (optional)
82 public static function getFormattedData( $tags, $context = false ) {
83 $obj = new FormatMetadata
;
85 $obj->setContext( $context );
88 return $obj->makeFormattedData( $tags );
92 * Numbers given by Exif user agents are often magical, that is they
93 * should be replaced by a detailed explanation depending on their
94 * value which most of the time are plain integers. This function
95 * formats Exif (and other metadata) values into human readable form.
97 * @param array $tags The Exif data to format ( as returned by
98 * Exif::getFilteredData() or BitmapMetadataHandler )
102 public function makeFormattedData( $tags ) {
103 $resolutionunit = !isset( $tags['ResolutionUnit'] ) ||
$tags['ResolutionUnit'] == 2 ?
2 : 3;
104 unset( $tags['ResolutionUnit'] );
106 foreach ( $tags as $tag => &$vals ) {
107 // This seems ugly to wrap non-arrays in an array just to unwrap again,
108 // especially when most of the time it is not an array
109 if ( !is_array( $tags[$tag] ) ) {
113 // _type is a special value to say what array type
114 if ( isset( $tags[$tag]['_type'] ) ) {
115 $type = $tags[$tag]['_type'];
116 unset( $vals['_type'] );
118 $type = 'ul'; // default unordered list.
121 // This is done differently as the tag is an array.
122 if ( $tag == 'GPSTimeStamp' && count( $vals ) === 3 ) {
123 // hour min sec array
125 $h = explode( '/', $vals[0] );
126 $m = explode( '/', $vals[1] );
127 $s = explode( '/', $vals[2] );
129 // this should already be validated
130 // when loaded from file, but it could
131 // come from a foreign repo, so be
142 $tags[$tag] = str_pad( intval( $h[0] / $h[1] ), 2, '0', STR_PAD_LEFT
)
143 . ':' . str_pad( intval( $m[0] / $m[1] ), 2, '0', STR_PAD_LEFT
)
144 . ':' . str_pad( intval( $s[0] / $s[1] ), 2, '0', STR_PAD_LEFT
);
147 $time = wfTimestamp( TS_MW
, '1971:01:01 ' . $tags[$tag] );
148 // the 1971:01:01 is just a placeholder, and not shown to user.
149 if ( $time && intval( $time ) > 0 ) {
150 $tags[$tag] = $this->getLanguage()->time( $time );
152 } catch ( TimestampException
$e ) {
153 // This shouldn't happen, but we've seen bad formats
154 // such as 4-digit seconds in the wild.
155 // leave $tags[$tag] as-is
160 // The contact info is a multi-valued field
161 // instead of the other props which are single
162 // valued (mostly) so handle as a special case.
163 if ( $tag === 'Contact' ) {
164 $vals = $this->collapseContactInfo( $vals );
168 foreach ( $vals as &$val ) {
183 $val = $this->exifMsg( $tag, $val );
186 /* If not recognized, display as is. */
191 case 'PhotometricInterpretation':
205 $val = $this->exifMsg( $tag, $val );
208 /* If not recognized, display as is. */
223 $val = $this->exifMsg( $tag, $val );
226 /* If not recognized, display as is. */
231 case 'PlanarConfiguration':
235 $val = $this->exifMsg( $tag, $val );
238 /* If not recognized, display as is. */
243 // TODO: YCbCrSubSampling
244 case 'YCbCrPositioning':
248 $val = $this->exifMsg( $tag, $val );
251 /* If not recognized, display as is. */
258 switch ( $resolutionunit ) {
260 $val = $this->exifMsg( 'XYResolution', 'i', $this->formatNum( $val ) );
263 $val = $this->exifMsg( 'XYResolution', 'c', $this->formatNum( $val ) );
266 /* If not recognized, display as is. */
271 // TODO: YCbCrCoefficients #p27 (see annex E)
273 case 'FlashpixVersion':
274 $val = (int)$val / 100;
281 $val = $this->exifMsg( $tag, $val );
284 /* If not recognized, display as is. */
289 case 'ComponentsConfiguration':
298 $val = $this->exifMsg( $tag, $val );
301 /* If not recognized, display as is. */
307 case 'DateTimeOriginal':
308 case 'DateTimeDigitized':
309 case 'DateTimeReleased':
310 case 'DateTimeExpires':
313 case 'DateTimeMetadata':
314 if ( $val == '0000:00:00 00:00:00' ||
$val == ' : : : : ' ) {
315 $val = $this->msg( 'exif-unknowndate' )->text();
316 } elseif ( preg_match(
317 '/^(?:\d{4}):(?:\d\d):(?:\d\d) (?:\d\d):(?:\d\d):(?:\d\d)$/D',
321 $time = wfTimestamp( TS_MW
, $val );
322 if ( $time && intval( $time ) > 0 ) {
323 $val = $this->getLanguage()->timeanddate( $time );
325 } elseif ( preg_match( '/^(?:\d{4}):(?:\d\d):(?:\d\d) (?:\d\d):(?:\d\d)$/D', $val ) ) {
326 // No second field. Still format the same
327 // since timeanddate doesn't include seconds anyways,
328 // but second still available in api
329 $time = wfTimestamp( TS_MW
, $val . ':00' );
330 if ( $time && intval( $time ) > 0 ) {
331 $val = $this->getLanguage()->timeanddate( $time );
333 } elseif ( preg_match( '/^(?:\d{4}):(?:\d\d):(?:\d\d)$/D', $val ) ) {
334 // If only the date but not the time is filled in.
335 $time = wfTimestamp( TS_MW
, substr( $val, 0, 4 )
336 . substr( $val, 5, 2 )
337 . substr( $val, 8, 2 )
339 if ( $time && intval( $time ) > 0 ) {
340 $val = $this->getLanguage()->date( $time );
343 // else it will just output $val without formatting it.
346 case 'ExposureProgram':
357 $val = $this->exifMsg( $tag, $val );
360 /* If not recognized, display as is. */
365 case 'SubjectDistance':
366 $val = $this->exifMsg( $tag, '', $this->formatNum( $val ) );
380 $val = $this->exifMsg( $tag, $val );
383 /* If not recognized, display as is. */
411 $val = $this->exifMsg( $tag, $val );
414 /* If not recognized, display as is. */
421 'fired' => $val & 0b00000001
,
422 'return' => ( $val & 0b00000110
) >> 1,
423 'mode' => ( $val & 0b00011000
) >> 3,
424 'function' => ( $val & 0b00100000
) >> 5,
425 'redeye' => ( $val & 0b01000000
) >> 6,
426 // 'reserved' => ( $val & 0b10000000 ) >> 7,
429 # We do not need to handle unknown values since all are used.
430 foreach ( $flashDecode as $subTag => $subValue ) {
431 # We do not need any message for zeroed values.
432 if ( $subTag != 'fired' && $subValue == 0 ) {
435 $fullTag = $tag . '-' . $subTag;
436 $flashMsgs[] = $this->exifMsg( $fullTag, $subValue );
438 $val = $this->getLanguage()->commaList( $flashMsgs );
441 case 'FocalPlaneResolutionUnit':
444 $val = $this->exifMsg( $tag, $val );
447 /* If not recognized, display as is. */
452 case 'SensingMethod':
461 $val = $this->exifMsg( $tag, $val );
464 /* If not recognized, display as is. */
472 $val = $this->exifMsg( $tag, $val );
475 /* If not recognized, display as is. */
483 $val = $this->exifMsg( $tag, $val );
486 /* If not recognized, display as is. */
491 case 'CustomRendered':
495 $val = $this->exifMsg( $tag, $val );
498 /* If not recognized, display as is. */
508 $val = $this->exifMsg( $tag, $val );
511 /* If not recognized, display as is. */
520 $val = $this->exifMsg( $tag, $val );
523 /* If not recognized, display as is. */
528 case 'SceneCaptureType':
534 $val = $this->exifMsg( $tag, $val );
537 /* If not recognized, display as is. */
549 $val = $this->exifMsg( $tag, $val );
552 /* If not recognized, display as is. */
562 $val = $this->exifMsg( $tag, $val );
565 /* If not recognized, display as is. */
575 $val = $this->exifMsg( $tag, $val );
578 /* If not recognized, display as is. */
588 $val = $this->exifMsg( $tag, $val );
591 /* If not recognized, display as is. */
596 case 'SubjectDistanceRange':
602 $val = $this->exifMsg( $tag, $val );
605 /* If not recognized, display as is. */
610 // The GPS...Ref values are kept for compatibility, probably won't be reached.
611 case 'GPSLatitudeRef':
612 case 'GPSDestLatitudeRef':
616 $val = $this->exifMsg( 'GPSLatitude', $val );
619 /* If not recognized, display as is. */
624 case 'GPSLongitudeRef':
625 case 'GPSDestLongitudeRef':
629 $val = $this->exifMsg( 'GPSLongitude', $val );
632 /* If not recognized, display as is. */
639 $val = $this->exifMsg( 'GPSAltitude', 'below-sealevel', $this->formatNum( -$val, 3 ) );
641 $val = $this->exifMsg( 'GPSAltitude', 'above-sealevel', $this->formatNum( $val, 3 ) );
649 $val = $this->exifMsg( $tag, $val );
652 /* If not recognized, display as is. */
657 case 'GPSMeasureMode':
661 $val = $this->exifMsg( $tag, $val );
664 /* If not recognized, display as is. */
670 case 'GPSImgDirectionRef':
671 case 'GPSDestBearingRef':
675 $val = $this->exifMsg( 'GPSDirection', $val );
678 /* If not recognized, display as is. */
684 case 'GPSDestLatitude':
685 $val = $this->formatCoords( $val, 'latitude' );
688 case 'GPSDestLongitude':
689 $val = $this->formatCoords( $val, 'longitude' );
697 $val = $this->exifMsg( 'GPSSpeed', $val );
700 /* If not recognized, display as is. */
705 case 'GPSDestDistanceRef':
710 $val = $this->exifMsg( 'GPSDestDistance', $val );
713 /* If not recognized, display as is. */
719 // See https://en.wikipedia.org/wiki/Dilution_of_precision_(GPS)
721 $val = $this->exifMsg( $tag, 'excellent', $this->formatNum( $val ) );
722 } elseif ( $val <= 5 ) {
723 $val = $this->exifMsg( $tag, 'good', $this->formatNum( $val ) );
724 } elseif ( $val <= 10 ) {
725 $val = $this->exifMsg( $tag, 'moderate', $this->formatNum( $val ) );
726 } elseif ( $val <= 20 ) {
727 $val = $this->exifMsg( $tag, 'fair', $this->formatNum( $val ) );
729 $val = $this->exifMsg( $tag, 'poor', $this->formatNum( $val ) );
733 // This is not in the Exif standard, just a special
734 // case for our purposes which enables wikis to wikify
735 // the make, model and software name to link to their articles.
738 $val = $this->exifMsg( $tag, '', $val );
742 if ( is_array( $val ) ) {
743 if ( count( $val ) > 1 ) {
744 // if it's a [software, version] array.
745 $val = $this->msg( 'exif-software-version-value', $val[0], $val[1] )->text();
747 // https://phabricator.wikimedia.org/T178130
748 $val = $this->exifMsg( $tag, '', $val[0] );
751 $val = $this->exifMsg( $tag, '', $val );
756 // Show the pretty fraction as well as decimal version
757 $val = $this->msg( 'exif-exposuretime-format',
758 $this->formatFraction( $val ), $this->formatNum( $val ) )->text();
760 case 'ISOSpeedRatings':
761 // If it's 65535, that means it's at the
762 // limit of the size of Exif::short and
764 if ( $val == '65535' ) {
765 $val = $this->exifMsg( $tag, 'overflow' );
767 $val = $this->formatNum( $val );
771 $val = $this->msg( 'exif-fnumber-format',
772 $this->formatNum( $val ) )->text();
776 case 'FocalLengthIn35mmFilm':
777 $val = $this->msg( 'exif-focallength-format',
778 $this->formatNum( $val ) )->text();
781 case 'MaxApertureValue':
782 if ( strpos( $val, '/' ) !== false ) {
783 // need to expand this earlier to calculate fNumber
784 list( $n, $d ) = explode( '/', $val );
785 if ( is_numeric( $n ) && is_numeric( $d ) ) {
789 if ( is_numeric( $val ) ) {
790 $fNumber = 2 ** ( $val / 2 );
791 if ( $fNumber !== false ) {
792 $val = $this->msg( 'exif-maxaperturevalue-value',
793 $this->formatNum( $val ),
794 $this->formatNum( $fNumber, 2 )
801 switch ( strtolower( $val ) ) {
802 // See pg 29 of IPTC photo
803 // metadata standard.
821 $val = $this->exifMsg(
827 case 'SubjectNewsCode':
828 // Essentially like iimCategory.
829 // 8 (numeric) digit hierarchical
830 // classification. We decode the
831 // first 2 digits, which provide
833 $val = $this->convertNewsCode( $val );
836 // 1-8 with 1 being highest, 5 normal
837 // 0 is reserved, and 9 is 'user-defined'.
839 if ( $val == 0 ||
$val == 9 ) {
841 } elseif ( $val < 5 && $val > 1 ) {
843 } elseif ( $val == 5 ) {
845 } elseif ( $val <= 8 && $val > 5 ) {
849 if ( $urgency !== '' ) {
850 $val = $this->exifMsg( 'urgency',
856 // Things that have a unit of pixels.
857 case 'OriginalImageHeight':
858 case 'OriginalImageWidth':
859 case 'PixelXDimension':
860 case 'PixelYDimension':
863 $val = $this->formatNum( $val ) . ' ' . $this->msg( 'unit-pixel' )->text();
866 // Do not transform fields with pure text.
867 // For some languages the formatNum()
868 // conversion results to wrong output like
869 // foo,bar@example,com or foo٫bar@example٫com.
870 // Also some 'numeric' things like Scene codes
871 // are included here as we really don't want
873 case 'ImageDescription':
877 case 'RelatedSoundFile':
878 case 'ImageUniqueID':
879 case 'SpectralSensitivity':
880 case 'GPSSatellites':
884 case 'WorldRegionDest':
886 case 'CountryCodeDest':
887 case 'ProvinceOrStateDest':
889 case 'SublocationDest':
890 case 'WorldRegionCreated':
891 case 'CountryCreated':
892 case 'CountryCodeCreated':
893 case 'ProvinceOrStateCreated':
895 case 'SublocationCreated':
897 case 'SpecialInstructions':
902 case 'FixtureIdentifier':
904 case 'LocationDestCode':
906 case 'JPEGFileComment':
907 case 'iimSupplementalCategory':
908 case 'OriginalTransmissionRef':
910 case 'dc-contributor':
919 case 'CameraOwnerName':
922 case 'RightsCertificate':
923 case 'CopyrightOwner':
926 case 'OriginalDocumentID':
928 case 'MorePermissionsUrl':
929 case 'AttributionUrl':
930 case 'PreferredAttributionName':
931 case 'PNGFileComment':
933 case 'ContentWarning':
934 case 'GIFFileComment':
936 case 'IntellectualGenre':
938 case 'OrginisationInImage':
939 case 'PersonInImage':
941 $val = htmlspecialchars( $val );
949 $val = $this->exifMsg( $tag, $val );
952 $val = htmlspecialchars( $val );
960 $val = $this->exifMsg( $tag, $val );
965 if ( $val == '-1' ) {
966 $val = $this->exifMsg( $tag, 'rejected' );
968 $val = $this->formatNum( $val );
973 $lang = Language
::fetchLanguageName( strtolower( $val ), $this->getLanguage()->getCode() );
974 $val = htmlspecialchars( $lang ?
: $val );
978 $val = $this->formatNum( $val );
982 // End formatting values, start flattening arrays.
983 $vals = $this->flattenArrayReal( $vals, $type );
990 * Flatten an array, using the content language for any messages.
992 * @param array $vals Array of values
993 * @param string $type Type of array (either lang, ul, ol).
994 * lang = language assoc array with keys being the lang code
995 * ul = unordered list, ol = ordered list
996 * type can also come from the '_type' member of $vals.
997 * @param bool $noHtml If to avoid returning anything resembling HTML.
998 * (Ugly hack for backwards compatibility with old MediaWiki).
999 * @param bool|IContextSource $context
1000 * @return string Single value (in wiki-syntax).
1003 public static function flattenArrayContentLang( $vals, $type = 'ul',
1004 $noHtml = false, $context = false
1006 $obj = new FormatMetadata
;
1008 $obj->setContext( $context );
1010 $context = new DerivativeContext( $obj->getContext() );
1011 $context->setLanguage( MediaWikiServices
::getInstance()->getContentLanguage() );
1012 $obj->setContext( $context );
1014 return $obj->flattenArrayReal( $vals, $type, $noHtml );
1018 * A function to collapse multivalued tags into a single value.
1019 * This turns an array of (for example) authors into a bulleted list.
1021 * This is public on the basis it might be useful outside of this class.
1023 * @param array $vals Array of values
1024 * @param string $type Type of array (either lang, ul, ol).
1025 * lang = language assoc array with keys being the lang code
1026 * ul = unordered list, ol = ordered list
1027 * type can also come from the '_type' member of $vals.
1028 * @param bool $noHtml If to avoid returning anything resembling HTML.
1029 * (Ugly hack for backwards compatibility with old mediawiki).
1030 * @return string Single value (in wiki-syntax).
1033 public function flattenArrayReal( $vals, $type = 'ul', $noHtml = false ) {
1034 if ( !is_array( $vals ) ) {
1035 return $vals; // do nothing if not an array;
1038 if ( isset( $vals['_type'] ) ) {
1039 $type = $vals['_type'];
1040 unset( $vals['_type'] );
1043 if ( !is_array( $vals ) ) {
1044 return $vals; // do nothing if not an array;
1045 } elseif ( count( $vals ) === 1 && $type !== 'lang' && isset( $vals[0] ) ) {
1047 } elseif ( count( $vals ) === 0 ) {
1048 wfDebug( __METHOD__
. " metadata array with 0 elements!\n" );
1050 return ""; // paranoia. This should never happen
1052 /* @todo FIXME: This should hide some of the list entries if there are
1053 * say more than four. Especially if a field is translated into 20
1054 * languages, we don't want to show them all by default
1058 // Display default, followed by ContentLanguage,
1059 // followed by the rest in no particular
1062 // Todo: hide some items if really long list.
1066 $priorityLanguages = $this->getPriorityLanguages();
1067 $defaultItem = false;
1068 $defaultLang = false;
1070 // If default is set, save it for later,
1071 // as we don't know if it's equal to
1072 // one of the lang codes. (In xmp
1073 // you specify the language for a
1074 // default property by having both
1075 // a default prop, and one in the language
1076 // that are identical)
1077 if ( isset( $vals['x-default'] ) ) {
1078 $defaultItem = $vals['x-default'];
1079 unset( $vals['x-default'] );
1081 foreach ( $priorityLanguages as $pLang ) {
1082 if ( isset( $vals[$pLang] ) ) {
1084 if ( $vals[$pLang] === $defaultItem ) {
1085 $defaultItem = false;
1088 $content .= $this->langItem(
1089 $vals[$pLang], $pLang,
1090 $isDefault, $noHtml );
1092 unset( $vals[$pLang] );
// NOTE(review): $vals[$pLang] is unset() just above, yet the single-language
// return below still reads $vals[$pLang] as the element content, which looks
// like it yields an empty <span> (plus an undefined-index notice). Confirm, and
// if so capture the value in a local before the unset().
1094 if ( $this->singleLang
) {
1095 return Html
::rawElement( 'span',
1096 [ 'lang' => $pLang ], $vals[$pLang] );
1102 foreach ( $vals as $lang => $item ) {
1103 if ( $item === $defaultItem ) {
1104 $defaultLang = $lang;
1107 $content .= $this->langItem( $item,
1108 $lang, false, $noHtml );
1109 if ( $this->singleLang
) {
1110 return Html
::rawElement( 'span',
1111 [ 'lang' => $lang ], $item );
1114 if ( $defaultItem !== false ) {
1115 $content = $this->langItem( $defaultItem,
1116 $defaultLang, true, $noHtml ) .
1118 if ( $this->singleLang
) {
1119 return $defaultItem;
1126 return '<ul class="metadata-langlist">' .
1131 return "\n#" . implode( "\n#", $vals );
1134 return "<ol><li>" . implode( "</li>\n<li>", $vals ) . '</li></ol>';
1138 return "\n*" . implode( "\n*", $vals );
1141 return "<ul><li>" . implode( "</li>\n<li>", $vals ) . '</li></ul>';
1146 /** Helper function for creating lists of translations.
1148 * @param string $value Value (this is not escaped)
1149 * @param string|bool $lang Lang code of item, or false if there is none
1150 * @param bool $default If it is default value.
1151 * @param bool $noHtml If to avoid html (for back-compat)
1152 * @throws MWException
1153 * @return string Language item (Note: despite how this looks, this is
1154 * treated as wikitext, not as HTML).
1156 private function langItem( $value, $lang, $default = false, $noHtml = false ) {
1157 if ( $lang === false && $default === false ) {
1158 throw new MWException( '$lang and $default cannot both '
1163 $wrappedValue = $value;
1165 $wrappedValue = '<span class="mw-metadata-lang-value">'
1166 . $value . '</span>';
1169 if ( $lang === false ) {
1170 $msg = $this->msg( 'metadata-langitem-default', $wrappedValue );
1172 return $msg->text() . "\n\n";
1175 return '<li class="mw-metadata-lang-default">'
1180 $lowLang = strtolower( $lang );
1181 $langName = Language
::fetchLanguageName( $lowLang );
1182 if ( $langName === '' ) {
1183 // try just the base language name. (aka en-US -> en ).
1184 $langPrefix = explode( '-', $lowLang, 2 )[0];
1185 $langName = Language
::fetchLanguageName( $langPrefix );
1186 if ( $langName === '' ) {
1191 // else we have a language specified
1193 $msg = $this->msg( 'metadata-langitem', $wrappedValue, $langName, $lang );
1195 return '*' . $msg->text();
1198 $item = '<li class="mw-metadata-lang-code-'
1201 $item .= ' mw-metadata-lang-default';
1203 $item .= '" lang="' . $lang . '">';
1204 $item .= $msg->text();
1211 * Convenience function for getFormattedData()
1213 * @param string $tag The tag name to pass on
1214 * @param string $val The value of the tag
1215 * @param string $arg An argument to pass ($1)
1216 * @param string $arg2 A 2nd argument to pass ($2)
1217 * @return string The text content of the "exif-$tag-$val" message (the message key is lower-cased)
1219 private function exifMsg( $tag, $val, $arg = null, $arg2 = null ) {
1220 if ( $val === '' ) {
1225 MediaWikiServices
::getInstance()->getContentLanguage()->lc( "exif-$tag-$val" ),
1232 * Format a number, convert numbers from fractions into floating point
1233 * numbers, joins arrays of numbers with commas.
1235 * @param mixed $num The value to format
1236 * @param float|int|bool $round Digits to round to or false.
1237 * @return mixed A floating point number or whatever we were fed
1239 private function formatNum( $num, $round = false ) {
1241 if ( is_array( $num ) ) {
1243 foreach ( $num as $number ) {
1244 $out[] = $this->formatNum( $number );
1247 return $this->getLanguage()->commaList( $out );
1249 if ( preg_match( '/^(-?\d+)\/(\d+)$/', $num, $m ) ) {
1251 $newNum = $m[1] / $m[2];
1252 if ( $round !== false ) {
1253 $newNum = round( $newNum, $round );
1259 return $this->getLanguage()->formatNum( $newNum );
1261 if ( is_numeric( $num ) && $round !== false ) {
1262 $num = round( $num, $round );
1265 return $this->getLanguage()->formatNum( $num );
1270 * Format a rational number, reducing fractions
1272 * @param mixed $num The value to format
1273 * @return mixed A reduced "numerator/denominator" string, or the formatNum() result if $num is not a fraction
1275 private function formatFraction( $num ) {
1277 if ( preg_match( '/^(-?\d+)\/(\d+)$/', $num, $m ) ) {
1278 $numerator = intval( $m[1] );
1279 $denominator = intval( $m[2] );
1280 $gcd = $this->gcd( abs( $numerator ), $denominator );
1282 // 0 shouldn't happen! ;)
1283 return $this->formatNum( $numerator / $gcd ) . '/' . $this->formatNum( $denominator / $gcd );
1287 return $this->formatNum( $num );
1291 * Calculate the greatest common divisor of two integers.
1293 * @param int $a Numerator
1294 * @param int $b Denominator
1297 private function gcd( $a, $b ) {
1299 // https://en.wikipedia.org/wiki/Euclidean_algorithm
1300 // Recursive form would be:
1304 return gcd( $b, $a % $b );
1307 $remainder = $a %
$b;
1309 // tail recursion...
1318 * Fetch the human readable version of a news code.
1319 * A news code is an 8 digit code. The first two
1320 * digits are a general classification, so we just
1323 * Note, leading 0's are significant, so this is
1324 * a string, not an int.
1326 * @param string $val The 8 digit news code.
1327 * @return string The human readable form
1329 private function convertNewsCode( $val ) {
1330 if ( !preg_match( '/^\d{8}$/D', $val ) ) {
1331 // Not a valid news code.
1335 switch ( substr( $val, 0, 2 ) ) {
1388 if ( $cat !== '' ) {
1389 $catMsg = $this->exifMsg( 'iimcategory', $cat );
1390 $val = $this->exifMsg( 'subjectnewscode', '', $val, $catMsg );
1397 * Format a coordinate value, convert numbers from floating point
1398 * into degree minute second representation.
1400 * @param float $coord Coordinate as a decimal number of degrees
1401 * @param string $type Latitude or longitude (selects the N/S or E/W reference)
1402 * @return string The formatted coordinate (text of the exif-coordinate-format message)
1404 private function formatCoords( $coord, $type ) {
1408 if ( $type === 'latitude' ) {
1410 } elseif ( $type === 'longitude' ) {
1415 if ( $type === 'latitude' ) {
1417 } elseif ( $type === 'longitude' ) {
1422 $deg = floor( $nCoord );
1423 $min = floor( ( $nCoord - $deg ) * 60.0 );
1424 $sec = round( ( ( $nCoord - $deg ) - $min / 60 ) * 3600, 2 );
1426 $deg = $this->formatNum( $deg );
1427 $min = $this->formatNum( $min );
1428 $sec = $this->formatNum( $sec );
1430 return $this->msg( 'exif-coordinate-format', $deg, $min, $sec, $ref, $coord )->text();
1434 * Format the contact info field into a single value.
1436 * This function might be called from
1437 * JpegHandler::convertMetadataVersion which is why it is
1440 * @param array $vals Array with fields of the ContactInfo
1441 * struct defined in the IPTC4XMP spec. Or potentially
1442 * an array with one element that is a free form text
1443 * value from the older iptc iim 1:118 prop.
1444 * @return string HTML-ish looking wikitext
1445 * @since 1.23 no longer static
1447 public function collapseContactInfo( $vals ) {
1448 if ( !( isset( $vals['CiAdrExtadr'] )
1449 ||
isset( $vals['CiAdrCity'] )
1450 ||
isset( $vals['CiAdrCtry'] )
1451 ||
isset( $vals['CiEmailWork'] )
1452 ||
isset( $vals['CiTelWork'] )
1453 ||
isset( $vals['CiAdrPcode'] )
1454 ||
isset( $vals['CiAdrRegion'] )
1455 ||
isset( $vals['CiUrlWork'] )
1457 // We don't have any sub-properties
1458 // This could happen if it's using old
1459 // iptc that just had this as a free-form
1461 // Note: We run this through htmlspecialchars
1462 // partially to be consistent, and partially
1463 // because people often insert >, etc into
1464 // the metadata which should not be interpreted
1465 // but we still want to auto-link urls.
1466 foreach ( $vals as &$val ) {
1467 $val = htmlspecialchars( $val );
1470 return $this->flattenArrayReal( $vals );
1472 // We have a real ContactInfo field.
1473 // It's unclear if all these fields have to be
1474 // set, so assume they do not.
1475 $url = $tel = $street = $city = $country = '';
1476 $email = $postal = $region = '';
1478 // Also note, some of the class names this uses
1479 // are similar to those used by hCard. This is
1480 // mostly because they're sensible names. This
1481 // does not (and does not attempt to) output
1482 // stuff in the hCard microformat. However it
1483 // might output in the adr microformat.
1485 if ( isset( $vals['CiAdrExtadr'] ) ) {
1486 // Todo: This can potentially be multi-line.
1487 // Need to check how that works in XMP.
1488 $street = '<span class="extended-address">'
1490 $vals['CiAdrExtadr'] )
1493 if ( isset( $vals['CiAdrCity'] ) ) {
1494 $city = '<span class="locality">'
1495 . htmlspecialchars( $vals['CiAdrCity'] )
1498 if ( isset( $vals['CiAdrCtry'] ) ) {
1499 $country = '<span class="country-name">'
1500 . htmlspecialchars( $vals['CiAdrCtry'] )
1503 if ( isset( $vals['CiEmailWork'] ) ) {
1505 // Have to split multiple emails at commas/new lines.
1506 $splitEmails = explode( "\n", $vals['CiEmailWork'] );
1507 foreach ( $splitEmails as $e1 ) {
1508 // Also split on comma
1509 foreach ( explode( ',', $e1 ) as $e2 ) {
1510 $finalEmail = trim( $e2 );
1511 if ( $finalEmail == ',' ||
$finalEmail == '' ) {
1514 if ( strpos( $finalEmail, '<' ) !== false ) {
1515 // Don't do fancy formatting to
1516 // "My name" <foo@bar.com> style stuff
1517 $emails[] = $finalEmail;
1519 $emails[] = '[mailto:'
1521 . ' <span class="email">'
1527 $email = implode( ', ', $emails );
1529 if ( isset( $vals['CiTelWork'] ) ) {
1530 $tel = '<span class="tel">'
1531 . htmlspecialchars( $vals['CiTelWork'] )
1534 if ( isset( $vals['CiAdrPcode'] ) ) {
1535 $postal = '<span class="postal-code">'
1537 $vals['CiAdrPcode'] )
1540 if ( isset( $vals['CiAdrRegion'] ) ) {
1541 // Note this is province/state.
1542 $region = '<span class="region">'
1544 $vals['CiAdrRegion'] )
1547 if ( isset( $vals['CiUrlWork'] ) ) {
1548 $url = '<span class="url">'
1549 . htmlspecialchars( $vals['CiUrlWork'] )
1553 return $this->msg( 'exif-contact-value', $email, $url,
1554 $street, $city, $region, $postal, $country,
1560 * Get a list of fields that are visible by default.
1565 public static function getVisibleFields() {
1567 $lines = explode( "\n", wfMessage( 'metadata-fields' )->inContentLanguage()->text() );
1568 foreach ( $lines as $line ) {
1570 if ( preg_match( '/^\\*\s*(.*?)\s*$/', $line, $matches ) ) {
1571 $fields[] = $matches[1];
1574 $fields = array_map( 'strtolower', $fields );
1580 * Get an array of extended metadata. (See the imageinfo API for format.)
1582 * @param File $file File to use
1583 * @return array [<property name> => ['value' => <value>]], or [] on error
1586 public function fetchExtendedMetadata( File
$file ) {
1587 $cache = MediaWikiServices
::getInstance()->getMainWANObjectCache();
1589 // If revision deleted, exit immediately
1590 if ( $file->isDeleted( File
::DELETED_FILE
) ) {
1594 $cacheKey = $cache->makeKey(
1595 'getExtendedMetadata',
1596 $this->getLanguage()->getCode(),
1597 (int)$this->singleLang
,
1601 $cachedValue = $cache->get( $cacheKey );
1604 && Hooks
::run( 'ValidateExtendedMetadataCache', [ $cachedValue['timestamp'], $file ] )
1606 $extendedMetadata = $cachedValue['data'];
1608 $maxCacheTime = ( $file instanceof ForeignAPIFile
) ?
60 * 60 * 12 : 60 * 60 * 24 * 30;
1609 $fileMetadata = $this->getExtendedMetadataFromFile( $file );
1610 $extendedMetadata = $this->getExtendedMetadataFromHook( $file, $fileMetadata, $maxCacheTime );
1611 if ( $this->singleLang
) {
1612 $this->resolveMultilangMetadata( $extendedMetadata );
1614 $this->discardMultipleValues( $extendedMetadata );
1615 // Make sure the metadata won't break the API when an XML format is used.
1616 // This is an API-specific function so it would be cleaner to call it from
1617 // outside fetchExtendedMetadata, but this way we don't need to redo the
1618 // computation on a cache hit.
1619 $this->sanitizeArrayForAPI( $extendedMetadata );
1620 $valueToCache = [ 'data' => $extendedMetadata, 'timestamp' => wfTimestampNow() ];
1621 $cache->set( $cacheKey, $valueToCache, $maxCacheTime );
1624 return $extendedMetadata;
/**
 * Get file-based metadata in standardized format.
 *
 * Note that for a remote file, this might return metadata supplied by extensions.
 *
 * @param File $file File to use
 * @return array [<property name> => ['value' => <value>]], or [] on error
 */
protected function getExtendedMetadataFromFile( File $file ) {
	if ( $file instanceof ForeignAPIFile ) {
		// Remote file accessed via an API request: the remote metadata is already
		// available, so any local metadata is ignored. In case of error we pretend
		// there is no metadata - this will get cached. Might or might not be a good idea.
		$remoteMetadata = $file->getExtendedMetadata();

		return $remoteMetadata ?: [];
	}

	$metadata = [];

	// This is modification time, which is close to "upload" time.
	$metadata['DateTime'] = [
		'value' => wfTimestamp( TS_ISO_8601, $file->getTimestamp() ),
		'source' => 'mediawiki-metadata',
	];

	$title = $file->getTitle();
	if ( !$title ) {
		return $metadata;
	}

	// ObjectName is the title text up to its last dot. When there is no dot, or
	// the only dot is the very first character, the whole text is used.
	$text = $title->getText();
	$dotPos = strrpos( $text, '.' );
	$metadata['ObjectName'] = [
		'value' => $dotPos ? substr( $text, 0, $dotPos ) : $text,
		'source' => 'mediawiki-metadata',
	];

	return $metadata;
}
/**
 * Get additional metadata from hooks in standardized format.
 *
 * Runs the GetExtendedMetadata hook on the given metadata, then marks every
 * field whose lowercased name is not in self::getVisibleFields() as hidden.
 *
 * @param File $file File to use
 * @param array $extendedMetadata
 * @param int &$maxCacheTime Hook handlers might use this parameter to override cache time
 *
 * @return array [<property name> => ['value' => <value>]], or [] on error
 */
protected function getExtendedMetadataFromHook( File $file, array $extendedMetadata,
	&$maxCacheTime
) {
	// The metadata and the cache time are passed by reference so that hook
	// handlers can modify them in place.
	$hookArgs = [
		&$extendedMetadata,
		$file,
		$this->getContext(),
		$this->singleLang,
		&$maxCacheTime
	];
	Hooks::run( 'GetExtendedMetadata', $hookArgs );

	// Flip the list so that membership becomes a key lookup.
	$visibleFields = array_flip( self::getVisibleFields() );
	foreach ( array_keys( $extendedMetadata ) as $name ) {
		if ( !isset( $visibleFields[strtolower( $name )] ) ) {
			$extendedMetadata[$name]['hidden'] = '';
		}
	}

	return $extendedMetadata;
}
/**
 * Turns an XMP-style multilang array into a single value.
 * If the value is not a multilang array, it is returned unchanged.
 * See mediawiki.org/wiki/Manual:File_metadata_handling#Multi-language_array_format
 *
 * A multilang array is an array whose '_type' entry is exactly the string 'lang'.
 *
 * @param mixed $value
 * @return mixed Value in best language, null if there were no languages at all
 */
protected function resolveMultilangValue( $value ) {
	// Strict comparison, matching resolveMultivalueValue(). With a loose "!=",
	// a non-string marker such as true compares equal to 'lang' and the array
	// would wrongly be treated as a multilang one.
	if (
		!is_array( $value )
		|| !isset( $value['_type'] )
		|| $value['_type'] !== 'lang'
	) {
		return $value; // do nothing if not a multilang array
	}

	// choose the language best matching user or site settings
	foreach ( $this->getPriorityLanguages() as $lang ) {
		if ( isset( $value[$lang] ) ) {
			return $value[$lang];
		}
	}

	// otherwise go with the default language, if set
	if ( isset( $value['x-default'] ) ) {
		return $value['x-default'];
	}

	// otherwise just return any one language; the type marker is not a language
	unset( $value['_type'] );
	if ( !empty( $value ) ) {
		return reset( $value );
	}

	// this should not happen; signal error
	return null;
}
/**
 * Turns an XMP-style multivalue array into a single value by dropping all but the first
 * value. If the value is not a multivalue array (or a multivalue array inside a multilang
 * array), it is returned unchanged.
 * See mediawiki.org/wiki/Manual:File_metadata_handling#Multi-language_array_format
 *
 * @param mixed $value
 * @return mixed The value, or the first value if there were multiple ones
 */
protected function resolveMultivalueValue( $value ) {
	if ( !is_array( $value ) ) {
		return $value;
	}

	if ( isset( $value['_type'] ) && $value['_type'] === 'lang' ) {
		// Multilang array: reduce every entry on its own, keeping the keys.
		// The '_type' entry is a plain string and so passes through unchanged.
		return array_map( [ $this, 'resolveMultivalueValue' ], $value );
	}

	// _type is 'ul' or 'ol' or missing in which case it defaults to 'ul'.
	// Take the first entry, stepping over the type marker when it comes first.
	$first = reset( $value );

	return key( $value ) === '_type' ? next( $value ) : $first;
}
/**
 * Takes an array returned by the getExtendedMetadata* functions,
 * and resolves multi-language values in it.
 *
 * Only the 'value' entry of each field is touched; anything that is not an
 * array is left alone.
 *
 * @param array &$metadata
 */
protected function resolveMultilangMetadata( &$metadata ) {
	if ( !is_array( $metadata ) ) {
		return;
	}

	foreach ( array_keys( $metadata ) as $name ) {
		if ( isset( $metadata[$name]['value'] ) ) {
			$metadata[$name]['value'] =
				$this->resolveMultilangValue( $metadata[$name]['value'] );
		}
	}
}
/**
 * Takes an array returned by the getExtendedMetadata* functions,
 * and turns all fields into single-valued ones by dropping extra values.
 *
 * The 'Software' and 'Contact' fields are left as they are.
 *
 * @param array &$metadata
 */
protected function discardMultipleValues( &$metadata ) {
	if ( !is_array( $metadata ) ) {
		return;
	}

	foreach ( array_keys( $metadata ) as $name ) {
		// we skip some fields which have composite values. They are not particularly
		// interesting and you can get them via the metadata / commonmetadata APIs anyway.
		$isComposite = $name === 'Software' || $name === 'Contact';

		if ( !$isComposite && isset( $metadata[$name]['value'] ) ) {
			$metadata[$name]['value'] =
				$this->resolveMultivalueValue( $metadata[$name]['value'] );
		}
	}
}
/**
 * Makes sure the given array is a valid API response fragment
 *
 * Every key is passed through sanitizeKeyForAPI(), nested arrays are processed
 * recursively, and keys that ApiResult::isMetadataKey() accepts are registered
 * with ApiResult::setPreserveKeysList(). Non-array input is ignored.
 *
 * @param array &$arr
 */
protected function sanitizeArrayForAPI( &$arr ) {
	if ( !is_array( $arr ) ) {
		return;
	}

	$suffix = 1;
	foreach ( $arr as $rawKey => &$item ) {
		$cleanKey = $this->sanitizeKeyForAPI( $rawKey );
		if ( $cleanKey !== $rawKey ) {
			if ( isset( $arr[$cleanKey] ) ) {
				// Make the sanitized keys hopefully unique.
				// To make it definitely unique would be too much effort, given that
				// sanitizing is only needed for misformatted metadata anyway, but
				// this at least covers the case when $arr is numeric.
				$cleanKey .= $suffix++;
			}
			// Move the entry over to its sanitized key.
			$arr[$cleanKey] = $arr[$rawKey];
			unset( $arr[$rawKey] );
		}
		// NOTE(review): after a rename $item no longer aliases the entry stored under
		// the new key; the moved entry is presumably processed when this by-reference
		// loop reaches the appended key - confirm before restructuring the loop.
		if ( is_array( $item ) ) {
			$this->sanitizeArrayForAPI( $item );
		}
	}

	// Handle API metadata keys (particularly "_type")
	$metadataKeys = array_filter( array_keys( $arr ), 'ApiResult::isMetadataKey' );
	if ( $metadataKeys ) {
		ApiResult::setPreserveKeysList( $arr, $metadataKeys );
	}
}
/**
 * Turns a string into a valid API identifier.
 *
 * Keeps only ASCII letters, digits and the characters "_", ":", "." and "-",
 * then strips any leading digits, dots and hyphens. An empty result becomes
 * "_", and the internal keyword "_element" becomes "element".
 *
 * @param string $key
 * @return string
 */
protected function sanitizeKeyForAPI( $key ) {
	// drop all characters which are not valid in an XML tag name
	// a bunch of non-ASCII letters would be valid but probably won't
	// be used so we take the easy way.
	// The range must be A-Z: "A-z" would also let through the punctuation
	// that sits between "Z" and "a" in ASCII ("[", "\", "]", "^", "`").
	// Casting covers integer array keys and a null result from preg_replace().
	$key = (string)preg_replace( '/[^a-zA-Z0-9_:.\-]/', '', (string)$key );
	// drop characters which are invalid at the first position
	$key = (string)preg_replace( '/^[\d\-.]+/', '', $key );

	if ( $key === '' ) {
		$key = '_';
	}

	// special case for an internal keyword
	if ( $key === '_element' ) {
		$key = 'element';
	}

	return $key;
}
/**
 * Returns a list of languages (first is best) to use when formatting multilang fields,
 * based on user and site preferences.
 *
 * The list starts with the code of $this->getLanguage(), followed by the two
 * lists returned by Language::getFallbacksIncludingSiteLanguage() for that code.
 *
 * @return array
 */
protected function getPriorityLanguages() {
	$code = $this->getLanguage()->getCode();
	$fallbacks = Language::getFallbacksIncludingSiteLanguage( $code );

	return array_merge( (array)$code, $fallbacks[0], $fallbacks[1] );
}