test_pie/external/exiftool/lib/Image/ExifTool/VCard.pm

444 lines
17 KiB
Perl

#------------------------------------------------------------------------------
# File: VCard.pm
#
# Description: Read vCard and iCalendar meta information
#
# Revisions: 2015/04/05 - P. Harvey Created
# 2015/05/02 - PH Added iCalendar support
#
# References: 1) http://en.m.wikipedia.org/wiki/VCard
# 2) http://tools.ietf.org/html/rfc6350
# 3) http://tools.ietf.org/html/rfc5545
#------------------------------------------------------------------------------
package Image::ExifTool::VCard;
use strict;
use vars qw($VERSION);
use Image::ExifTool qw(:DataAccess :Utils);
$VERSION = '1.06';
my %unescapeVCard = ( '\\'=>'\\', ','=>',', 'n'=>"\n", 'N'=>"\n" );
# lookup for iCalendar components (used to generate family 1 group names if top level)
my %isComponent = ( Event=>1, Todo=>1, Journal=>1, Freebusy=>1, Timezone=>1, Alarm=>1 );
my %timeInfo = (
# convert common date/time formats to EXIF style
ValueConv => q{
$val =~ s/(\d{4})(\d{2})(\d{2})T(\d{2})(\d{2})(\d{2})(Z?)/$1:$2:$3 $4:$5:$6$7/g;
$val =~ s/(\d{4})(\d{2})(\d{2})/$1:$2:$3/g;
$val =~ s/(\d{4})-(\d{2})-(\d{2})/$1:$2:$3/g;
return $val;
},
PrintConv => '$self->ConvertDateTime($val)',
);
# vCard tags (ref 1/2/PH)
# Note: The case of all tag ID's is normalized to lowercase with uppercase first letter
%Image::ExifTool::VCard::Main = (
GROUPS => { 2 => 'Document' },
VARS => { NO_LOOKUP => 1 }, # omit tags from lookup
NOTES => q{
This table lists common vCard tags, but ExifTool will also extract any other
vCard tags found. Tag names may have "Pref" added to indicate the preferred
instance of a vCard property, and other "TYPE" parameters may also added to
the tag name. VCF files may contain multiple vCard entries which are
distinguished by the ExifTool family 3 group name (document number). See
L<http://tools.ietf.org/html/rfc6350> for the vCard 4.0 specification.
},
Version => { Name => 'VCardVersion', Description => 'VCard Version' },
Fn => { Name => 'FormattedName', Groups => { 2 => 'Author' } },
N => { Name => 'Name', Groups => { 2 => 'Author' } },
Bday => { Name => 'Birthday', Groups => { 2 => 'Time' }, %timeInfo },
Tz => { Name => 'TimeZone', Groups => { 2 => 'Time' } },
Adr => { Name => 'Address', Groups => { 2 => 'Location' } },
Geo => {
Name => 'Geolocation',
Groups => { 2 => 'Location' },
# when used as a parameter, VCard 4.0 adds a "geo:" prefix that we need to remove
ValueConv => '$val =~ s/^geo://; $val',
},
Anniversary => { },
Email => { },
Gender => { },
Impp => 'IMPP',
Lang => 'Language',
Logo => { },
Nickname => { },
Note => { },
Org => 'Organization',
Photo => { Groups => { 2 => 'Preview' } },
Prodid => 'Software',
Rev => 'Revision',
Sound => { },
Tel => 'Telephone',
Title => 'JobTitle',
Uid => 'UID',
Url => 'URL',
'X-ablabel' => { Name => 'ABLabel', PrintConv => '$val =~ s/^_\$!<(.*)>!\$_$/$1/; $val' },
'X-abdate' => { Name => 'ABDate', Groups => { 2 => 'Time' }, %timeInfo },
'X-aim' => 'AIM',
'X-icq' => 'ICQ',
'X-abuid' => 'AB_UID',
'X-abrelatednames' => 'ABRelatedNames',
'X-socialprofile' => 'SocialProfile',
);
%Image::ExifTool::VCard::VCalendar = (
GROUPS => { 1 => 'VCalendar', 2 => 'Document' },
VARS => {
NO_LOOKUP => 1, # omit tags from lookup
LONG_TAGS => 6, # some X-microsoft tags have unavoidably long ID's
},
NOTES => q{
The VCard module is also used to process iCalendar ICS files since they use
a format similar to vCard. The following table lists standard iCalendar
tags, but any existing tags will be extracted. Top-level iCalendar
components (eg. Event, Todo, Timezone, etc.) are used for the family 1 group
names, and embedded components (eg. Alarm) are added as a prefix to the tag
name. See L<http://tools.ietf.org/html/rfc5545> for the official iCalendar
2.0 specification.
},
Version => { Name => 'VCalendarVersion', Description => 'VCalendar Version' },
Calscale => 'CalendarScale',
Method => { },
Prodid => 'Software',
Attach => 'Attachment',
Categories => { },
Class => 'Classification',
Comment => { },
Description => { },
Geo => {
Name => 'Geolocation',
Groups => { 2 => 'Location' },
ValueConv => '$val =~ s/^geo://; $val',
},
Location => { Name => 'Location', Groups => { 2 => 'Location' } },
'Percent-complete' => 'PercentComplete',
Priority => { },
Resources => { },
Status => { },
Summary => { },
Completed => { Name => 'DateTimeCompleted', Groups => { 2 => 'Time' }, %timeInfo },
Dtend => { Name => 'DateTimeEnd', Groups => { 2 => 'Time' }, %timeInfo },
Due => { Name => 'DateTimeDue', Groups => { 2 => 'Time' }, %timeInfo },
Dtstart => { Name => 'DateTimeStart', Groups => { 2 => 'Time' }, %timeInfo },
Duration => { },
Freebusy => 'FreeBusyTime',
Transp => 'TimeTransparency',
Tzid => { Name => 'TimezoneID', Groups => { 2 => 'Time' } },
Tzname => { Name => 'TimezoneName', Groups => { 2 => 'Time' } },
Tzoffsetfrom=> { Name => 'TimezoneOffsetFrom', Groups => { 2 => 'Time' } },
Tzoffsetto => { Name => 'TimezoneOffsetTo', Groups => { 2 => 'Time' } },
Tzurl => { Name => 'TimeZoneURL', Groups => { 2 => 'Time' } },
Attendee => { },
Contact => { },
Organizer => { },
'Recurrence-id' => 'RecurrenceID',
'Related-to' => 'RelatedTo',
Url => 'URL',
Uid => 'UID',
Exdate => { Name => 'ExceptionDateTimes', Groups => { 2 => 'Time' }, %timeInfo },
Rdate => { Name => 'RecurrenceDateTimes', Groups => { 2 => 'Time' }, %timeInfo },
Rrule => { Name => 'RecurrenceRule', Groups => { 2 => 'Time' } },
Action => { },
Repeat => { },
Trigger => { },
Created => { Name => 'DateCreated', Groups => { 2 => 'Time' }, %timeInfo },
Dtstamp => { Name => 'DateTimeStamp', Groups => { 2 => 'Time' }, %timeInfo },
'Last-modified' => { Name => 'ModifyDate', Groups => { 2 => 'Time' }, %timeInfo },
Sequence => 'SequenceNumber',
'Request-status' => 'RequestStatus',
Acknowledged=> { Name => 'Acknowledged', Groups => { 2 => 'Time' }, %timeInfo },
#
# Observed X-tags (not a comprehensive list):
#
'X-apple-calendar-color'=> 'CalendarColor',
'X-apple-default-alarm' => 'DefaultAlarm',
'X-apple-local-default-alarm' => 'LocalDefaultAlarm',
'X-microsoft-cdo-appt-sequence' => 'AppointmentSequence',
'X-microsoft-cdo-ownerapptid' => 'OwnerAppointmentID',
'X-microsoft-cdo-busystatus' => 'BusyStatus',
'X-microsoft-cdo-intendedstatus' => 'IntendedBusyStatus',
'X-microsoft-cdo-alldayevent' => 'AllDayEvent',
'X-microsoft-cdo-importance' => {
Name => 'Importance',
PrintConv => {
0 => 'Low',
1 => 'Normal',
2 => 'High',
},
},
'X-microsoft-cdo-insttype' => {
Name => 'InstanceType',
PrintConv => {
0 => 'Non-recurring Appointment',
1 => 'Recurring Appointment',
2 => 'Single Instance of Recurring Appointment',
3 => 'Exception to Recurring Appointment',
},
},
'X-microsoft-donotforwardmeeting' => 'DoNotForwardMeeting',
'X-microsoft-disallow-counter' => 'DisallowCounterProposal',
'X-microsoft-locations' => { Name => 'MeetingLocations', Groups => { 2 => 'Location' } },
'X-wr-caldesc' => 'CalendarDescription',
'X-wr-calname' => 'CalendarName',
'X-wr-relcalid' => 'CalendarID',
'X-wr-timezone' => { Name => 'TimeZone2', Groups => { 2 => 'Time' } },
'X-wr-alarmuid' => 'AlarmUID',
);
#------------------------------------------------------------------------------
# Get vCard tag, creating if necessary
# Inputs: 0) ExifTool ref, 1) tag table ref, 2) tag ID, 3) tag Name,
# 4) source tagInfo ref, 5) lang code
# Returns: tagInfo ref
sub GetVCardTag($$$$;$$)
{
my ($et, $tagTablePtr, $tag, $name, $srcInfo, $langCode) = @_;
my $tagInfo = $$tagTablePtr{$tag};
unless ($tagInfo) {
if ($srcInfo) {
$tagInfo = { %$srcInfo };
} else {
$tagInfo = { };
$et->VPrint(0, $$et{INDENT}, "[adding $tag]\n");
}
$$tagInfo{Name} = $name;
delete $$tagInfo{Description}; # create new description
AddTagToTable($tagTablePtr, $tag, $tagInfo);
}
# handle alternate languages (the "language" parameter)
$tagInfo = Image::ExifTool::GetLangInfo($tagInfo, $langCode) if $langCode;
return $tagInfo;
}
#------------------------------------------------------------------------------
# Decode vCard text
# Inputs: 0) ExifTool ref, 1) vCard text, 2) encoding
# Returns: decoded text (or array ref for a list of values)
sub DecodeVCardText($$;$)
{
my ($et, $val, $enc) = @_;
$enc = defined($enc) ? lc $enc : '';
if ($enc eq 'b' or $enc eq 'base64') {
require Image::ExifTool::XMP;
$val = Image::ExifTool::XMP::DecodeBase64($val);
} else {
if ($enc eq 'quoted-printable') {
# convert "=HH" hex codes to characters
$val =~ s/=([0-9a-f]{2})/chr(hex($1))/ige;
}
$val = $et->Decode($val, 'UTF8'); # convert from UTF-8
# convert unescaped commas to nulls to separate list items
$val =~ s/(\\.)|(,)/$1 || "\0"/sge;
# unescape necessary characters in value
$val =~ s/\\(.)/$unescapeVCard{$1}||$1/sge;
# split into list if necessary
my @vals = split /\0/, $val;
$val = \@vals if @vals > 1;
}
return $val;
}
#------------------------------------------------------------------------------
# Read information in a vCard file
# Inputs: 0) ExifTool ref, 1) dirInfo ref
# Returns: 1 on success, 0 if this wasn't a valid vCard file
sub ProcessVCard($$)
{
local $_;
my ($et, $dirInfo) = @_;
my $raf = $$dirInfo{RAF};
my ($buff, $val, $ok, $component, %compNum, @count);
return 0 unless $raf->Read($buff, 24) and $raf->Seek(0,0) and $buff=~/^BEGIN:(VCARD|VCALENDAR)\r\n/i;
my ($type, $lbl, $tbl, $ext) = uc($1) eq 'VCARD' ? qw(VCard vCard Main VCF) : qw(ICS iCalendar VCalendar ICS);
$et->SetFileType($type, undef, $ext);
return 1 if $$et{OPTIONS}{FastScan} and $$et{OPTIONS}{FastScan} == 3;
local $/ = "\r\n";
my $tagTablePtr = GetTagTable("Image::ExifTool::VCard::$tbl");
my $more = $raf->ReadLine($buff); # read first line
chomp $buff if $more;
while ($more) {
# retrieve previous line from $buff
$val = $buff if defined $buff;
# read ahead to next line to see if is a continuation
$more = $raf->ReadLine($buff);
if ($more) {
chomp $buff;
# add continuation line if necessary
$buff =~ s/^[ \t]// and $val .= $buff, undef($buff), next;
}
if ($val =~ /^(BEGIN|END):(V?)(\w+)$/i) {
my ($begin, $v, $what) = ((lc($1) eq 'begin' ? 1 : 0), $2, ucfirst lc $3);
if ($what eq 'Card' or $what eq 'Calendar') {
if ($begin) {
@count = ( { } ); # reset group counters
} else {
$ok = 1; # ok if we read at least on full VCARD or VCALENDAR
}
next;
}
# absorb top-level component into family 1 group name
if ($isComponent{$what}) {
if ($begin) {
unless ($component) {
# begin a new top-level component
@count = ( { } );
$component = $what;
$compNum{$component} = ($compNum{$component} || 0) + 1;
next;
}
} elsif ($component and $component eq $what) {
# this top-level component has ended
undef $component;
next;
}
}
# keep count of each component at this level
if ($begin) {
$count[-1]{$what} = ($count[-1]{$what} || 0) + 1 if $v;
push @count, { obj => $what };
} elsif (@count > 1) {
pop @count;
}
next;
} elsif ($ok) {
$ok = 0;
$$et{DOC_NUM} = ++$$et{DOC_COUNT}; # read next card as a new document
}
unless ($val =~ s/^([-A-Za-z0-9.]+)//) {
$et->WarnOnce("Unrecognized line in $lbl file");
next;
}
my $tag = $1;
# set group if it exists
if ($tag =~ s/^([-A-Za-z0-9]+)\.//) {
$$et{SET_GROUP1} = ucfirst lc $1;
} elsif ($component) {
$$et{SET_GROUP1} = $component . $compNum{$component};
} else {
delete $$et{SET_GROUP1};
}
my ($name, %param, $p, @val);
# vCard tag ID's are case-insensitive, so normalize to lowercase with
# an uppercase first letter for use as a tag name
$name = ucfirst $tag if $tag =~ /[a-z]/; # preserve mixed case in name if it exists
$tag = ucfirst lc $tag;
# get source tagInfo reference
my $srcInfo = $et->GetTagInfo($tagTablePtr, $tag);
if ($srcInfo) {
$name = $$srcInfo{Name}; # use our name
} else {
$name or $name = $tag;
# remove leading "X-" from name if it exists
$name =~ s/^X-// and $name = ucfirst $name;
}
# add object name(s) to tag if necessary
if (@count > 1) {
my $i;
for ($i=$#count-1; $i>=0; --$i) {
my $pre = $count[$i-1]{obj}; # use containing object name as tag prefix
my $c = $count[$i]{$pre}; # add index for object number
$c = '' unless defined $c;
$tag = $pre . $c . $tag;
$name = $pre . $c . $name;
}
}
# parse parameters
while ($val =~ s/^;([-A-Za-z0-9]*)(=?)//) {
$p = ucfirst lc $1;
# convert old vCard 2.x parameters to the new "TYPE=" format
$2 or $val = $1 . $val, $p = 'Type';
# read parameter value
for (;;) {
last unless $val =~ s/^"([^"]*)",?// or $val =~ s/^([^";:,]+,?)//;
my $v = $p eq 'Type' ? ucfirst lc $1 : $1;
$param{$p} = defined($param{$p}) ? $param{$p} . $v : $v;
}
if (defined $param{$p}) {
$param{$p} =~ s/\\(.)/$unescapeVCard{$1}||$1/sge;
} else {
$param{$p} = '';
}
}
$val =~ s/^:// or $et->WarnOnce("Invalid line in $lbl file"), next;
# add 'Type' parameter to id and name if it exists
$param{Type} and $tag .= $param{Type}, $name .= $param{Type};
# convert base64-encoded data
if ($val =~ s{^data:(\w+)/(\w+);base64,}{}) {
my $xtra = ucfirst(lc $1) . ucfirst(lc $2);
$tag .= $xtra;
$name .= $xtra;
$param{Encoding} = 'base64';
}
$val = DecodeVCardText($et, $val, $param{Encoding});
my $tagInfo = GetVCardTag($et, $tagTablePtr, $tag, $name, $srcInfo, $param{Language});
$et->HandleTag($tagTablePtr, $tag, $val, TagInfo => $tagInfo);
# handle some other parameters that we care about (ignore the rest for now)
foreach $p (qw(Geo Label Tzid)) {
next unless defined $param{$p};
# use tag attributes from our table if it exists
my $srcTag2 = $et->GetTagInfo($tagTablePtr, $p);
my $pn = $srcTag2 ? $$srcTag2{Name} : $p;
$val = DecodeVCardText($et, $param{$p});
# add parameter to tag ID and name
my ($tg, $nm) = ($tag . $p, $name . $pn);
$tagInfo = GetVCardTag($et, $tagTablePtr, $tg, $nm, $srcTag2, $param{Language});
$et->HandleTag($tagTablePtr, $tg, $val, TagInfo => $tagInfo);
}
}
delete $$et{SET_GROUP1};
delete $$et{DOC_NUM};
$ok or $et->Warn("Missing $lbl end");
return 1;
}
1; # end
__END__
=head1 NAME
Image::ExifTool::VCard - Read vCard and iCalendar meta information
=head1 SYNOPSIS
This module is used by Image::ExifTool
=head1 DESCRIPTION
This module contains definitions required by Image::ExifTool to read meta
information from vCard VCF and iCalendar ICS files.
=head1 AUTHOR
Copyright 2003-2018, Phil Harvey (phil at owl.phy.queensu.ca)
This library is free software; you can redistribute it and/or modify it
under the same terms as Perl itself.
=head1 REFERENCES
=over 4
=item L<http://en.m.wikipedia.org/wiki/VCard>
=item L<http://tools.ietf.org/html/rfc6350>
=item L<http://tools.ietf.org/html/rfc5545>
=back
=head1 SEE ALSO
L<Image::ExifTool::TagNames/VCard Tags>,
L<Image::ExifTool::TagNames/VCard VCalendar Tags>,
L<Image::ExifTool(3pm)|Image::ExifTool>
=cut