#------------------------------------------------------------------------------
# File:         CBOR.pm
#
# Description:  Read CBOR format metadata
#
# Revisions:    2021-09-30 - P. Harvey Created
#
# References:   1) https://c2pa.org/public-draft/
#               2) https://datatracker.ietf.org/doc/html/rfc7049
#------------------------------------------------------------------------------
package Image::ExifTool::CBOR;

use strict;
use vars qw($VERSION);
use Image::ExifTool qw(:DataAccess :Utils);
use Image::ExifTool::JSON;

$VERSION = '1.01';

sub ProcessCBOR($$$);
sub ReadCBORValue($$$$);

# optional CBOR type code (tag numbers of major type 6)
my %cborType6 = (
    0 => 'date/time string',
    1 => 'epoch-based date/time',
    2 => 'positive bignum',
    3 => 'negative bignum',
    4 => 'decimal fraction',
    5 => 'bigfloat',
    21 => 'expected base64url encoding',
    22 => 'expected base64 encoding',
    23 => 'expected base16 encoding',
    24 => 'encoded CBOR data',
    32 => 'URI',
    33 => 'base64url',
    34 => 'base64',
    35 => 'regular expression',
    36 => 'MIME message',
    55799 => 'CBOR magic number',
);

# simple values of major type 7
my %cborType7 = (
    20 => 'False',
    21 => 'True',
    22 => 'null',
    23 => 'undef',
);

%Image::ExifTool::CBOR::Main = (
    GROUPS => { 0 => 'JUMBF', 1 => 'CBOR', 2 => 'Other' },
    VARS => { NO_ID => 1 },
    PROCESS_PROC => \&ProcessCBOR,
    NOTES => q{
        The tags below are extracted from CBOR (Concise Binary Object
        Representation) metadata. The C2PA specification uses this format for some
        metadata. As well as these tags, ExifTool will read any existing tags.
    },
    'dc:title'      => 'Title',
    'dc:format'     => 'Format',
    # my sample file has the following 2 tags in CBOR, but they should be JSON
    authorName      => { Name => 'AuthorName', Groups => { 2 => 'Author' } },
    authorIdentifier=> { Name => 'AuthorIdentifier', Groups => { 2 => 'Author' } },
    documentID      => { },
    instanceID      => { },
    thumbnailHash   => { List => 1 },
    thumbnailUrl    => { Name => 'ThumbnailURL' },
    relationship    => { }
);

#------------------------------------------------------------------------------
# Read CBOR value
# Inputs: 0) ExifTool ref, 1) data ref, 2) position in data, 3) data end
# Returns: 0) value, 1) error string, 2) new data position
# Notes: - the value is a scalar for integers, text and type-7 values, a SCALAR
#          reference for byte strings, an ARRAY reference for lists, and a HASH
#          reference for maps (with the key order saved in '_ordered_keys_')
#        - an undefined value with no error means a "break" code was read
#        - recursive; uses $$et{cbor_pre} to pass the verbose-output prefix of
#          the next value, and deepens $$et{INDENT} while inside a container
sub ReadCBORValue($$$$)
{
    my ($et, $dataPt, $pos, $end) = @_;

    return(undef, 'Truncated CBOR data', $pos) if $pos >= $end;
    my $verbose = $$et{OPTIONS}{Verbose};
    my $indent = $$et{INDENT};
    my $dumpStart = $pos;
    # initial byte: major type in the high 3 bits, additional info in the low 5
    my $fmt = Get8u($dataPt, $pos++);
    my $dat = $fmt & 0x1f;
    my ($num, $val, $err, $size);
    $fmt >>= 5;
    if ($dat < 24) {
        $num = $dat;    # (argument is stored directly in the initial byte)
    } elsif ($dat == 31) {  # indefinite count (not used in C2PA)
        $num = -1;  # (flag for indefinite count)
        $et->VPrint(1, "$$et{INDENT} (indefinite count):\n");
    } else {
        # argument follows the initial byte as a 1, 2, 4 or 8-byte unsigned integer
        my $format = { 24 => 'int8u', 25 => 'int16u', 26 => 'int32u', 27 => 'int64u' }->{$dat};
        return(undef, "Invalid CBOR integer type $dat", $pos) unless $format;
        $size = Image::ExifTool::FormatSize($format);
        return(undef, 'Truncated CBOR integer value', $pos) if $pos + $size > $end;
        $num = ReadValue($dataPt, $pos, $format, 1, $size);
        $pos += $size;
    }
    # pick up the verbose prefix set by the enclosing list/hash (an optional
    # tag leaves it in place so that it applies to the tagged value instead)
    my $pre = '';
    if (defined $$et{cbor_pre} and $fmt != 6) {
        $pre = $$et{cbor_pre};
        delete $$et{cbor_pre};
    }
    if ($fmt == 0) {        # positive integer
        $val = $num;
        $et->VPrint(1, "$$et{INDENT} ${pre}int+: $val\n");
    } elsif ($fmt == 1) {   # negative integer
        # (RFC 7049 2.1: the value is -1 minus the encoded unsigned integer)
        $val = -1 - $num;
        $et->VPrint(1, "$$et{INDENT} ${pre}int-: $val\n");
    } elsif ($fmt == 2 or $fmt == 3) {  # byte/UTF8 string
        return(undef, 'Truncated CBOR string value', $pos) if $pos + $num > $end;
        if ($num < 0) { # (should not happen in C2PA)
            # indefinite-length string: concatenate chunks until the break
            my $string = '';
            $$et{INDENT} .= ' ';
            for (;;) {
                ($val, $err, $pos) = ReadCBORValue($et, $dataPt, $pos, $end);
                if ($err) {
                    $$et{INDENT} = $indent; # (don't leave the indent deepened)
                    return(undef, $err, $pos);
                }
                last if not defined $val;   # hit the break?
                # (note: strictly we should be checking that this was a string we read)
                $string .= $val;
            }
            $$et{INDENT} = $indent;
            return($string, undef, $pos);   # return concatenated byte/text string
        } else {
            $val = substr($$dataPt, $pos, $num);
        }
        $pos += $num;
        if ($fmt == 2) {    # (byte string)
            $et->VPrint(1, "$$et{INDENT} ${pre}byte: <binary data ".length($val)." bytes>\n");
            my $dat = $val;
            $val = \$dat;   # use scalar reference for binary data
        } else {            # (text string)
            $val = $et->Decode($val, 'UTF8');
            $et->VPrint(1, "$$et{INDENT} ${pre}text: '${val}'\n");
        }
    } elsif ($fmt == 4 or $fmt == 5) {  # list/hash
        if ($fmt == 4) {
            $et->VPrint(1, "$$et{INDENT} ${pre}list: <$num elements>\n");
        } else {
            $et->VPrint(1, "$$et{INDENT} ${pre}hash: <$num pairs>\n");
            $num *= 2;  # (a hash is read as a flat list of key/value items)
        }
        $$et{INDENT} .= ' ';
        my $i = 0;
        my @list;
        Image::ExifTool::HexDump($dataPt, $pos - $dumpStart,
            Start   => $dumpStart,
            DataPos => $$et{cbor_datapos},
            Prefix  => $$et{INDENT},
        ) if $verbose > 2;
        # ($num counts down to zero, or stays negative for an indefinite
        # count, in which case the loop ends when the break code is read)
        while ($num) {
            $$et{cbor_pre} = "$i) ";
            if ($fmt == 4) {
                ++$i;
            } elsif ($num & 0x01) {
                # odd remaining count = hash value: blank out the index prefix
                $$et{cbor_pre} = ' ' x length($$et{cbor_pre});
                ++$i;
            }
            ($val, $err, $pos) = ReadCBORValue($et, $dataPt, $pos, $end);
            if ($err) {
                $$et{INDENT} = $indent; # (don't leave the indent deepened)
                return(undef, $err, $pos);
            }
            if (not defined $val) {
                unless ($num < 0) {
                    $$et{INDENT} = $indent;
                    return(undef, 'Unexpected list terminator', $pos);
                }
                last;
            }
            push @list, $val;
            --$num;
        }
        $dumpStart = $pos;
        $$et{INDENT} = $indent;
        if ($fmt == 5) {
            my ($i, @keys);
            my %hash = ( _ordered_keys_ => \@keys );
            for ($i=0; $i<@list-1; $i+=2) {
                $hash{$list[$i]} = $list[$i+1];
                push @keys, $list[$i];  # save ordered list of keys
            }
            $val = \%hash;
        } else {
            $val = \@list;
        }
    } elsif ($fmt == 6) {   # optional tag
        if ($verbose) {
            my $str = "$num (" . ($cborType6{$num} || 'unknown') . ')';
            my $spc = $$et{cbor_pre} ? (' ' x length $$et{cbor_pre}) : '';
            $et->VPrint(1, "$$et{INDENT} $spc<CBOR optional type $str>\n");
            Image::ExifTool::HexDump($dataPt, $pos - $dumpStart,
                Start   => $dumpStart,
                DataPos => $$et{cbor_datapos},
                Prefix  => $$et{INDENT} . ' ',
            ) if $verbose > 2;
        }
        # read next value (note: in the case of multiple tags,
        # this nesting will apply the tags in the correct order)
        ($val, $err, $pos) = ReadCBORValue($et, $dataPt, $pos, $end);
        # (don't attempt to convert the value if it couldn't be read)
        return(undef, $err, $pos) if $err;
        $dumpStart = $pos;
        # convert some values according to the optional tag number (untested)
        if ($num == 0 and not ref $val) {       # date/time string
            require Image::ExifTool::XMP;
            $val = Image::ExifTool::XMP::ConvertXMPDate($val);
        } elsif ($num == 1 and not ref $val) {  # epoch-based date/time
            if (Image::ExifTool::IsFloat($val)) {
                my $dec = ($val == int($val)) ? undef : 6;
                $val = Image::ExifTool::ConvertUnixTime($val, 1, $dec);
            }
        } elsif (($num == 2 or $num == 3) and ref($val) eq 'SCALAR') { # pos/neg bignum
            # (the byte string is accumulated most-significant byte first)
            my $big = 0;
            $big = 256 * $big + Get8u($val,$_) foreach 0..(length($$val) - 1);
            $val = $num==2 ? $big : -$big;
        } elsif (($num == 4 or $num == 5) and   # decimal fraction or bigfloat
            ref($val) eq 'ARRAY' and @$val == 2 and
            Image::ExifTool::IsInt($$val[0]) and Image::ExifTool::IsInt($$val[1]))
        {
            # array is [exponent, mantissa], with base 10 (decimal) or 2 (bigfloat)
            $val = $$val[1] * ($num == 4 ? 10 : 2) ** $$val[0];
        }
    } elsif ($fmt == 7) {
        if ($dat == 31) {
            undef $val; # "break" = end of indefinite array/hash (not used in C2PA)
        } elsif ($dat < 24) {
            $val = $cborType7{$num};
            $val = "Unknown ($num)" unless defined $val;
        } elsif ($dat == 25) {  # half-precision float
            # decode as in RFC 7049 Appendix D, where ldexp(m,e) = m * 2**e
            my $exp = ($num >> 10) & 0x1f;
            my $mant = $num & 0x3ff;
            if ($exp == 0) {            # (subnormal number or zero)
                $val = $mant * 2 ** -24;
                $val *= -1 if $num & 0x8000;
            } elsif ($exp != 31) {      # (normal number)
                $val = ($mant + 1024) * 2 ** ($exp - 25);
                $val *= -1 if $num & 0x8000;
            } else {
                $val = $mant == 0 ? '<inf>' : '<nan>';
            }
        } elsif ($dat == 26) {  # float
            $val = GetFloat($dataPt, $pos - $size);
        } elsif ($dat == 27) {  # double
            $val = GetDouble($dataPt, $pos - $size);
        } else {
            return(undef, "Invalid CBOR type 7 variant $num", $pos);
        }
        $et->VPrint(1, "$$et{INDENT} ${pre}typ7: ".(defined $val ? $val : '<break>')."\n");
    } else {
        return(undef, "Unknown CBOR format $fmt", $pos);
    }
    # dump the bytes of this value that haven't already been dumped
    Image::ExifTool::HexDump($dataPt, $pos - $dumpStart,
        Start   => $dumpStart,
        DataPos => $$et{cbor_datapos},
        Prefix  => $$et{INDENT} . ' ',
        MaxLen  => $verbose < 5 ? ($verbose == 3 ? 96 : 2048) : undef,
    ) if $verbose > 2;
    return($val, $err, $pos);
}

#------------------------------------------------------------------------------
# Read CBOR box
# Inputs: 0) ExifTool ref, 1) dirInfo ref, 2) tag table ref
# Returns: 1 on success
# Notes: - top-level hash entries are processed as tags named by their keys,
#          and top-level list entries as tags named "Item0", "Item1", etc
#        - a top-level integer zero is treated as padding and ends processing
#        - a decoding error is issued as a warning (this still returns 1)
sub ProcessCBOR($$$)
{
    my ($et, $dirInfo, $tagTablePtr) = @_;
    my $dataPt = $$dirInfo{DataPt};
    # (default to processing all of the data if the directory isn't specified)
    my $pos = $$dirInfo{DirStart} || 0;
    my $dirLen = $$dirInfo{DirLen};
    $dirLen = length($$dataPt) - $pos unless defined $dirLen;
    my $end = $pos + $dirLen;
    my ($val, $err, $tag, $i);

    $et->VerboseDir('CBOR', undef, $dirLen);

    # absolute offset of the data (used for addresses in the verbose hex dump)
    $$et{cbor_datapos} = ($$dirInfo{DataPos} || 0) + ($$dirInfo{Base} || 0);

    while ($pos < $end) {
        ($val, $err, $pos) = ReadCBORValue($et, $dataPt, $pos, $end);
        $err and $et->Warn($err), last;
        if (ref $val eq 'HASH') {
            foreach $tag (@{$$val{_ordered_keys_}}) {
                Image::ExifTool::JSON::ProcessTag($et, $tagTablePtr, $tag, $$val{$tag});
            }
        } elsif (ref $val eq 'ARRAY') {
            for ($i=0; $i<@$val; ++$i) {
                Image::ExifTool::JSON::ProcessTag($et, $tagTablePtr, "Item$i", $$val[$i]);
            }
        } elsif (defined $val and $val eq '0') {
            $et->VPrint(1, "$$et{INDENT} <CBOR end>\n");
            last;   # (treat as padding)
        } else {
            # (the value is undefined if a stray "break" code was read)
            $et->VPrint(1, "$$et{INDENT} Unknown value: ".(defined $val ? $val : '')."\n");
        }
    }
    return 1;
}

1;  # end

__END__

=head1 NAME

Image::ExifTool::CBOR - Read CBOR format metadata

=head1 SYNOPSIS

This module is used by Image::ExifTool

=head1 DESCRIPTION

This module contains definitions required by Image::ExifTool to read Concise
Binary Object Representation (CBOR) formatted metadata, used by the C2PA
specification.

=head1 AUTHOR

Copyright 2003-2022, Phil Harvey (philharvey66 at gmail.com)

This library is free software; you can redistribute it and/or modify it
under the same terms as Perl itself.

=head1 REFERENCES

=over 4

=item L<https://c2pa.org/public-draft/>

=item L<https://datatracker.ietf.org/doc/html/rfc7049>

=back

=head1 SEE ALSO

L<Image::ExifTool::TagNames/CBOR Tags>,
L<Image::ExifTool(3pm)|Image::ExifTool>

=cut