#------------------------------------------------------------------------------
# File: Vorbis.pm
#
# Description: Read Ogg Vorbis meta information
#
# Revisions: 11/10/2006 - P. Harvey Created
#
# References: 1) http://www.xiph.org/vorbis/doc/
# 2) http://flac.sourceforge.net/ogg_mapping.html
#------------------------------------------------------------------------------
package Image::ExifTool::Vorbis;
use strict;
use vars qw($VERSION);
use Image::ExifTool qw(:DataAccess :Utils);
$VERSION = '1.01';
# Packet budget for the scan at the start of the file: ProcessOGG stops looking
# for header packets once the packet count exceeds this value multiplied by
# the number of streams seen so far.
my $MAX_PACKETS = 2; # maximum packets to scan from each stream at start of file
# forward declaration (ProcessComments is referenced by the Comments table
# before its definition appears)
sub ProcessComments($$$);
# NOTE(review): no definition of DecodeCoverArt is visible in this file --
# confirm whether this forward declaration is still needed
sub DecodeCoverArt($);
# Vorbis header packets, keyed by the packet-type byte that precedes the
# "vorbis" signature.  ProcessPacket looks up ord() of that byte in this table
# and dispatches to the SubDirectory table; ProcessOGG only saves packets
# whose type has an entry here.
%Image::ExifTool::Vorbis::Main = (
NOTES => q{
ExifTool extracts the following Vorbis information from Ogg files. As well
as this, ExifTool also extracts FLAC and ID3 information from Ogg files.
},
# packet type 1: decoded with the Identification table
1 => {
Name => 'Identification',
SubDirectory => { TagTable => 'Image::ExifTool::Vorbis::Identification' },
},
# packet type 3: decoded with the Comments table
3 => {
Name => 'Comments',
SubDirectory => { TagTable => 'Image::ExifTool::Vorbis::Comments' },
},
);
# Binary layout of the identification packet.  Keys are byte offsets from the
# directory start; ProcessPacket sets DirStart to 7, i.e. just past the
# packet-type byte and the 6-byte "vorbis" signature.
%Image::ExifTool::Vorbis::Identification = (
PROCESS_PROC => \&Image::ExifTool::ProcessBinaryData,
GROUPS => { 2 => 'Audio' },
0 => {
Name => 'VorbisVersion',
Format => 'int32u',
},
# no Format given for this entry (presumably the table default of one
# unsigned byte applies -- TODO confirm against ProcessBinaryData)
4 => 'AudioChannels',
5 => {
Name => 'SampleRate',
Format => 'int32u',
},
# the three bitrate fields below map a raw value of 0 to undef via RawConv
# (presumably so an unset bitrate is not reported -- confirm)
9 => {
Name => 'MaximumBitrate',
Format => 'int32u',
RawConv => '$val || undef',
},
13 => {
Name => 'NominalBitrate',
Format => 'int32u',
RawConv => '$val || undef',
},
17 => {
Name => 'MinimumBitrate',
Format => 'int32u',
RawConv => '$val || undef',
},
);
# Vorbis comment fields, keyed by field name.  The table is parsed by
# ProcessComments, which also adds an entry on the fly for any field name
# that is not listed here.
%Image::ExifTool::Vorbis::Comments = (
PROCESS_PROC => \&ProcessComments,
GROUPS => { 2 => 'Audio' },
NOTES => q{
The tags below are only some common tags found in the Vorbis comments of Ogg
Vorbis and Ogg FLAC audio files, however ExifTool will extract values from
any tag found, even if not listed here.
},
# pseudo-tag: ProcessComments stores the leading vendor string under this key
vendor => { Notes => 'from comment header' },
TITLE => { Name => 'Title' },
VERSION => { Name => 'Version' },
ALBUM => { Name => 'Album' },
TRACKNUMBER=>{ Name => 'TrackNumber' },
ARTIST => { Name => 'Artist', Groups => { 2 => 'Author' }, List => 1 },
PERFORMER => { Name => 'Performer', Groups => { 2 => 'Author' }, List => 1 },
COPYRIGHT => { Name => 'Copyright', Groups => { 2 => 'Author' } },
LICENSE => { Name => 'License', Groups => { 2 => 'Author' } },
ORGANIZATION=>{Name => 'Organization', Groups => { 2 => 'Author' } },
DESCRIPTION=>{ Name => 'Description' },
GENRE => { Name => 'Genre' },
DATE => { Name => 'Date', Groups => { 2 => 'Time' } },
LOCATION => { Name => 'Location', Groups => { 2 => 'Location' } },
CONTACT => { Name => 'Contact', Groups => { 2 => 'Author' }, List => 1 },
ISRC => { Name => 'ISRCNumber' },
COVERARTMIME => { Name => 'CoverArtMIMEType' },
# cover art is stored as base64 text; the ValueConv passes it through the
# XMP module's DecodeBase64
COVERART => {
Name => 'CoverArt',
Notes => 'base64-encoded image',
ValueConv => q{
require Image::ExifTool::XMP;
Image::ExifTool::XMP::DecodeBase64($val);
},
},
REPLAYGAIN_TRACK_PEAK => { Name => 'ReplayGainTrackPeak' },
REPLAYGAIN_TRACK_GAIN => { Name => 'ReplayGainTrackGain' },
REPLAYGAIN_ALBUM_PEAK => { Name => 'ReplayGainAlbumPeak' },
REPLAYGAIN_ALBUM_GAIN => { Name => 'ReplayGainAlbumGain' },
# observed in "Xiph.Org libVorbis I 20020717" ogg:
ENCODED_USING => { Name => 'EncodedUsing' },
ENCODED_BY => { Name => 'EncodedBy' },
COMMENT => { Name => 'Comment' },
);
#------------------------------------------------------------------------------
# Process Vorbis Comments
# Inputs: 0) ExifTool object ref, 1) dirInfo ref, 2) tag table ref
# Returns: 1 on success, otherwise returns 0 and sets a Warning
# Notes: The data is a length-prefixed vendor string, a 32-bit comment count,
#        then that many length-prefixed "NAME=value" entries (all lengths are
#        little-endian 32-bit integers).
#      - Field names are case-insensitive in the Vorbis comment specification,
#        so they are folded to upper case before the table lookup.
#      - A field whose name collides with a housekeeping key of the tag table
#        (eg. NOTES, GROUPS or PROCESS_PROC) is stored under the name plus a
#        trailing underline so that the table entry is not mistaken for a tag.
sub ProcessComments($$$)
{
    my ($exifTool, $dirInfo, $tagTablePtr) = @_;
    my $dataPt = $$dirInfo{DataPt};
    my $dataPos = $$dirInfo{DataPos};
    my $pos = $$dirInfo{DirStart} || 0;
    my $end = $$dirInfo{DirLen} ? $pos + $$dirInfo{DirLen} : length $$dataPt;
    my ($num, $index);

    SetByteOrder('II');
    for (;;) {
        # each entry is a 4-byte length followed by that many bytes of data
        last if $pos + 4 > $end;
        my $len = Get32u($dataPt, $pos);
        last if $pos + 4 + $len > $end;
        my $start = $pos + 4;
        my $buff = substr($$dataPt, $start, $len);
        $pos = $start + $len;
        my ($tag, $val, $rawName);
        if (defined $num) {
            # regular comment entry: split at the first '='
            $buff =~ /(.*?)=(.*)/s or last;
            ($rawName, $val) = ($1, $2);
            # field names are case-insensitive; the table uses upper case
            $tag = uc $rawName;
            # a tag definition in this table is a hash with a Name (or a list
            # of them); anything else stored under this key is table
            # housekeeping which must not be used as (or replaced by) a tag
            my $entry = $$tagTablePtr{$tag};
            if (defined $entry and ref($entry) ne 'ARRAY' and
                not (ref($entry) eq 'HASH' and defined $$entry{Name}))
            {
                $tag .= '_';
            }
        } else {
            # the first entry is the vendor string, followed by the count
            $rawName = $tag = 'vendor';
            $val = $buff;
            # (the 4-byte count may end exactly at the end of the data)
            $num = ($pos + 4 <= $end) ? Get32u($dataPt, $pos) : 0;
            $exifTool->VPrint(0, " + [Vorbis comments with $num entries]\n");
            $pos += 4;
        }
        # add tag to table unless it exists already
        unless ($$tagTablePtr{$tag}) {
            my $name = ucfirst(lc($rawName));
            # remove invalid characters in tag name and capitalize following letters
            $name =~ s/[^\w-]+(.?)/\U$1/sg;
            $name =~ s/([a-z0-9])_([a-z])/$1\U$2/g;
            Image::ExifTool::AddTagToTable($tagTablePtr, $tag, { Name => $name });
        }
        $exifTool->HandleTag($tagTablePtr, $tag, $val,
            Index   => $index,
            DataPt  => $dataPt,
            DataPos => $dataPos,
            Start   => $start,
            Size    => $len,
        );
        # all done if this was our last tag
        $num-- or return 1;
        $index = (defined $index) ? $index + 1 : 0;
    }
    # get here only if the data ran out or an entry had no '='
    $exifTool->Warn('Format error in Vorbis comments');
    return 0;
}
#------------------------------------------------------------------------------
# Process Ogg packet
# Inputs: 0) ExifTool object ref, 1) data ref, 2) tag table ref
# Returns: result of ProcessDirectory for a recognized Vorbis header packet,
#          or 0 if the packet isn't a Vorbis header or has no SubDirectory
sub ProcessPacket($$$)
{
    my ($exifTool, $dataPt, $tagTablePtr) = @_;

    # a Vorbis header packet is one type byte followed by "vorbis"
    return 0 unless $$dataPt =~ /^(.)vorbis/s;
    my $packetType = ord($1);

    # the packet type must map to a tag which defines a subdirectory
    my $tagInfo = $exifTool->GetTagInfo($tagTablePtr, $packetType);
    return 0 unless $tagInfo;
    my $subdir = $$tagInfo{SubDirectory} or return 0;

    my $subTable = GetTagTable($$subdir{TagTable});
    my %dirInfo = (
        DataPt   => $dataPt,
        DirName  => $$tagInfo{Name},
        DirStart => 7,      # skip the type byte and "vorbis" signature
    );
    return $exifTool->ProcessDirectory(\%dirInfo, $subTable);
}
#------------------------------------------------------------------------------
# Extract information from an Ogg Vorbis or Ogg FLAC file
# Inputs: 0) ExifTool object reference, 1) dirInfo reference
# Returns: 1 on success, 0 if this wasn't a valid Ogg Vorbis file
# Notes: Pages are read sequentially.  Vorbis header packets are accumulated
#        per stream in %val and passed to ProcessPacket once the following
#        page shows that the packet is complete.  Ogg FLAC header packets are
#        accumulated and then passed to the FLAC module.
#      - A page with no segments has a 27-byte header, so the extra byte read
#        with the fixed 28-byte header is returned to the file.
#      - Page sequence numbers are tracked separately for each stream.
sub ProcessOGG($$)
{
    my ($exifTool, $dirInfo) = @_;

    # must first check for leading/trailing ID3 information
    unless ($exifTool->{DONE_ID3}) {
        require Image::ExifTool::ID3;
        Image::ExifTool::ID3::ProcessID3($exifTool, $dirInfo) and return 1;
    }
    my $raf = $$dirInfo{RAF};
    my $verbose = $exifTool->Options('Verbose');
    my $out = $exifTool->Options('TextOut');
    my ($success, $packets, $streams) = (0,0,0);
    my ($buff, $tagTablePtr, $flag, $stream, %val, $numFlac);
    my $checkPages = 1;     # cleared after the first missing-page warning
    my %nextPage;           # expected page sequence number for each stream

    for (;;) {
        # must read ahead to next page to see if it is a continuation
        # (this code would be a lot simpler if the continuation flag
        # was on the leading instead of the trailing page!)
        if ($raf and $raf->Read($buff, 28) == 28) {
            # validate magic number
            unless ($buff =~ /^OggS/) {
                $success and $exifTool->Warn('Lost synchronization');
                last;
            }
            unless ($success) {
                # set file type and initialize on first page
                $success = 1;
                $exifTool->SetFileType();
                SetByteOrder('II');
                $tagTablePtr = GetTagTable('Image::ExifTool::Vorbis::Main');
            }
            $flag = Get8u(\$buff, 5);       # page flag
            $stream = Get32u(\$buff, 14);   # stream serial number
            ++$streams if $flag & 0x02;     # count start-of-stream pages
            ++$packets unless $flag & 0x01; # keep track of packet count
        } else {
            # all done unless we have to process our last packet
            last unless %val;
            ($stream) = sort keys %val;     # take a stream
            $flag = 0;                      # no continuation
            undef $raf;                     # flag for done reading
        }

        if (defined $numFlac) {
            # stop to process FLAC headers if we hit the end of file
            last unless $raf;
            --$numFlac;     # one less header packet to read
        } else {
            # can finally process previous packet from this stream
            # unless this is a continuation page
            if (defined $val{$stream} and not $flag & 0x01) {
                ProcessPacket($exifTool, \$val{$stream}, $tagTablePtr);
                delete $val{$stream};
                # only read the first $MAX_PACKETS packets from each stream
                if ($packets > $MAX_PACKETS * $streams or not defined $raf) {
                    last unless %val;   # all done (success!)
                    # at end of file: go back to flush the remaining stream(s)
                    next unless $raf;
                    # otherwise fall through to consume the rest of this page:
                    # only its fixed header has been read so far, and looping
                    # now would start the next header read in mid-page
                }
            }
            # stop processing Ogg Vorbis if we have scanned enough packets
            last if $packets > $MAX_PACKETS * $streams and not %val;
        }

        # continue processing the current page
        my $pageNum = Get32u(\$buff, 18);   # page sequence number
        my $nseg = Get8u(\$buff, 26);       # number of segments
        # calculate total data length (sum of the segment table entries)
        my $dataLen = 0;
        if ($nseg) {
            # the first segment length was read with the fixed header
            $dataLen = Get8u(\$buff, 27);
            $raf->Read($buff, $nseg-1) == $nseg-1 or last;
            # could check that all these (but the last) are 255...
            foreach (unpack('C*', $buff)) { $dataLen += $_ }
        } else {
            # no segment table: the 28th byte we read belongs to whatever
            # follows this page, so step back over it (whence 1 = relative)
            $raf->Seek(-1, 1) or last;
        }
        if ($checkPages) {
            # sequence numbers count separately within each logical stream
            my $expected = $nextPage{$stream} || 0;
            if ($pageNum == $expected) {
                $nextPage{$stream} = $pageNum + 1;
            } else {
                $exifTool->Warn('Missing page(s) in Ogg file');
                $checkPages = 0;
            }
        }
        # read page data
        $raf->Read($buff, $dataLen) == $dataLen or last;
        if ($verbose > 1) {
            printf $out "Page %d, stream 0x%x, flag 0x%x (%d bytes)\n",
                        $pageNum, $stream, $flag, $dataLen;
            $exifTool->VerboseDump(\$buff, DataPos => $raf->Tell() - $dataLen);
        }
        if (defined $val{$stream}) {
            $val{$stream} .= $buff;     # add this continuation page
        } elsif (not $flag & 0x01) {    # ignore remaining pages of a continued packet
            # ignore the first page of any packet we aren't parsing
            if ($buff =~ /^(.)vorbis/s and $$tagTablePtr{ord($1)}) {
                $val{$stream} = $buff;  # save this page
            } elsif ($buff =~ /^\x7fFLAC..(..)/s) {
                # Ogg FLAC: the captured 16-bit big-endian value is the
                # number of header packets; keep the data after the first
                # 9 bytes of this packet
                $numFlac = unpack('n',$1);
                $val{$stream} = substr($buff, 9);
            }
        }
        if (defined $numFlac) {
            # stop to process FLAC headers if we have them all
            last if $numFlac <= 0;
        } elsif (defined $val{$stream} and $flag & 0x04) {
            # process Ogg Vorbis packet now if end-of-stream bit is set
            ProcessPacket($exifTool, \$val{$stream}, $tagTablePtr);
            delete $val{$stream};
        }
    }
    if (defined $numFlac and defined $val{$stream}) {
        # process FLAC headers as if it was a complete FLAC file
        require Image::ExifTool::FLAC;
        my %dirInfo = ( RAF => File::RandomAccess->new(\$val{$stream}) );
        Image::ExifTool::FLAC::ProcessFLAC($exifTool, \%dirInfo);
    }
    return $success;
}
1; # end
__END__
=head1 NAME
Image::ExifTool::Vorbis - Read Ogg Vorbis meta information
=head1 SYNOPSIS
This module is used by Image::ExifTool
=head1 DESCRIPTION
This module contains definitions required by Image::ExifTool to extract meta
information from Ogg Vorbis and Ogg FLAC audio files.
=head1 AUTHOR
Copyright 2003-2008, Phil Harvey (phil at owl.phy.queensu.ca)
This library is free software; you can redistribute it and/or modify it
under the same terms as Perl itself.
=head1 REFERENCES
=over 4
=item L<http://www.xiph.org/vorbis/doc/>
=item L<http://flac.sourceforge.net/ogg_mapping.html>
=back
=head1 SEE ALSO
L<Image::ExifTool::TagNames/Vorbis Tags>,
L<Image::ExifTool(3pm)|Image::ExifTool>
=cut