summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rwxr-xr-xtools/mp3info.pm2184
-rwxr-xr-xtools/songdb.pl448
-rw-r--r--tools/vorbiscomm.pm732
3 files changed, 3364 insertions, 0 deletions
diff --git a/tools/mp3info.pm b/tools/mp3info.pm
new file mode 100755
index 0000000000..d900777266
--- /dev/null
+++ b/tools/mp3info.pm
@@ -0,0 +1,2184 @@
1package mp3info;
2
3require 5.006;
4
5use overload;
6use strict;
7use Carp;
8
9use vars qw(
10 @ISA @EXPORT @EXPORT_OK %EXPORT_TAGS $VERSION $REVISION
11 @mp3_genres %mp3_genres @winamp_genres %winamp_genres $try_harder
12 @t_bitrate @t_sampling_freq @frequency_tbl %v1_tag_fields
13 @v1_tag_names %v2_tag_names %v2_to_v1_names $AUTOLOAD
14 @mp3_info_fields %rva2_channel_types
15);
16
# Exporter supplies import(); load it explicitly instead of relying on
# some other module having pulled it in already.
require Exporter;
@ISA = 'Exporter';

# Symbols exported by default.  Names inside qw() are separated by
# whitespace only: a comma there becomes part of the symbol name, which
# would export "use_winamp_genres," instead of the real function.
@EXPORT = qw(
    set_mp3tag get_mp3tag get_mp3info remove_mp3tag
    use_winamp_genres use_mp3_utf8
);

# Symbols exported on request.
@EXPORT_OK = qw(@mp3_genres %mp3_genres use_mp3_utf8);

# Export groups: ":genres", ":utf8" and ":all".
%EXPORT_TAGS = (
    genres => [qw(@mp3_genres %mp3_genres)],
    utf8   => [qw(use_mp3_utf8)],
    all    => [@EXPORT, @EXPORT_OK]
);

# $Id$
($REVISION) = ' $Revision$ ' =~ /\$Revision:\s+([^\s]+)/;
$VERSION = '1.20';
32
33=pod
34
35=head1 NAME
36
37MP3::Info - Manipulate / fetch info from MP3 audio files
38
39=head1 SYNOPSIS
40
41 #!perl -w
42 use MP3::Info;
43 my $file = 'Pearls_Before_Swine.mp3';
44 set_mp3tag($file, 'Pearls Before Swine', q"77's",
45 'Sticks and Stones', '1990',
46 q"(c) 1990 77's LTD.", 'rock & roll');
47
48 my $tag = get_mp3tag($file) or die "No TAG info";
49 $tag->{GENRE} = 'rock';
50 set_mp3tag($file, $tag);
51
52 my $info = get_mp3info($file);
53 printf "$file length is %d:%d\n", $info->{MM}, $info->{SS};
54
55=cut
56
{
    # Build the name => index lookup tables.  Each genre is registered
    # twice, under its regular spelling and under its lower-case spelling;
    # both keys map to the genre's position in the corresponding list.
    %mp3_genres = ();
    for my $idx (0 .. $#mp3_genres) {
        my $genre = $mp3_genres[$idx];
        $mp3_genres{$genre}    = $idx;
        $mp3_genres{lc $genre} = $idx;
    }

    # Same again for the WinAmp genre list.
    %winamp_genres = ();
    for my $idx (0 .. $#winamp_genres) {
        my $genre = $winamp_genres[$idx];
        $winamp_genres{$genre}    = $idx;
        $winamp_genres{lc $genre} = $idx;
    }
}
67
68=pod
69
70 my $mp3 = new MP3::Info $file;
71 $mp3->title('Perls Before Swine');
72 printf "$file length is %s, title is %s\n",
73 $mp3->time, $mp3->title;
74
75
76=head1 DESCRIPTION
77
78=over 4
79
80=item $mp3 = MP3::Info-E<gt>new(FILE)
81
82OOP interface to the rest of the module. The same keys
83available via get_mp3info and get_mp3tag are available
84via the returned object (using upper case or lower case;
85but note that all-caps "VERSION" will return the module
86version, not the MP3 version).
87
88Passing a value to one of the methods will set the value
89for that tag in the MP3 file, if applicable.
90
91=cut
92
# Constructor for the OOP interface.
#
#   $pack  class to bless the object into
#   $file  MP3 file to inspect
#
# Returns a blessed hash holding the get_mp3info fields and the ID3v1 tag
# fields (plus FILE, TRY_HARDER and a lower-case 'file' key), or undef
# when get_mp3info() returns a false value for the file.
sub new {
    my($pack, $file) = @_;

    # Stream information is mandatory.
    my $info = get_mp3info($file);
    return undef unless $info;

    # Tag information is optional: fall back to a hash in which every
    # v1 field is undefined.
    my $tags = get_mp3tag($file);
    $tags = { map { ($_ => undef) } @v1_tag_names } unless $tags;

    my %self = (FILE => $file, TRY_HARDER => 0);

    $self{$_} = $info->{$_} for @mp3_info_fields;
    $self{$_} = $tags->{$_} for @v1_tag_names;
    $self{'file'} = $file;

    return bless \%self, $pack;
}
111
# can() override for the OOP interface.
#
# Called on a class name it defers to the inherited can().  Called on an
# object it looks up the upper-cased method name among the object's keys
# and returns a code reference invoking that method on the object, or
# undef when the object has no such key.
sub can {
    my($self, @args) = @_;

    return $self->SUPER::can(@args) unless ref $self;

    my $name = uc shift @args;
    return undef unless exists $self->{$name};

    return sub { $self->$name(@_) };
}
119
# Generates accessors on demand.
#
# The requested method name is upper-cased and looked up among the
# object's keys.  If the key exists, an accessor is installed under the
# requested name and control jumps to it:
#   - keys listed in %v1_tag_fields get a read/write accessor that stores
#     a defined new value and writes the tag back with set_mp3tag();
#   - every other key gets a read-only accessor.
# If the key does not exist a warning is issued via carp.
sub AUTOLOAD {
    my($self) = @_;

    # keep only what follows the last ':' of the qualified name
    my $name = uc $AUTOLOAD;
    $name =~ s/^.*://;

    if (!exists $self->{$name}) {
        return carp(sprintf "No method '$name' available in package %s.",
            __PACKAGE__);
    }

    my $accessor;
    if (exists $v1_tag_fields{$name}) {
        $accessor = sub {
            my($obj, $value) = @_;
            if (defined $value) {
                $obj->{$name} = $value;
                set_mp3tag($obj->{FILE}, $obj);
            }
            return $obj->{$name};
        };
    } else {
        $accessor = sub {
            return $_[0]->{$name}
        };
    }

    # install the accessor so later calls bypass AUTOLOAD, then run it
    # with the current argument list
    no strict 'refs';
    *{$AUTOLOAD} = $accessor;
    goto &$AUTOLOAD;
}
146
# Deliberately does nothing.  Having an explicit DESTROY keeps object
# destruction from being dispatched to this package's AUTOLOAD.
sub DESTROY {
    return;
}
150
151
152=item use_mp3_utf8([STATUS])
153
154Tells MP3::Info to (or not) return TAG info in UTF-8.
155TRUE is 1, FALSE is 0. Default is TRUE, if available.
156
157Will only be able to turn it on if Encode is available. ID3v2
158tags will be converted to UTF-8 according to the encoding specified
159in each tag; ID3v1 tags will be assumed Latin-1 and converted
160to UTF-8.
161
162Function returns status (TRUE/FALSE). If no argument is supplied,
163or an unaccepted argument is supplied, function merely returns status.
164
165This function is exported by default; it may also be requested explicitly
166with the C<:utf8> or C<:all> export tag.
167
168=cut
169
# True when both Encode and Encode::Guess could be loaded.
my $unicode_module = eval { require Encode; require Encode::Guess };

# Current UTF-8 conversion status; switched on at load time when the
# Encode modules are available.
my $UNICODE = use_mp3_utf8($unicode_module ? 1 : 0);

# Query or change whether tag data is converted to UTF-8.
#
#   $val  1 to switch conversion on (only honoured when Encode is
#         available), 0 to switch it off; anything else leaves the
#         setting untouched
#
# Returns the resulting status (1 or 0).
sub use_mp3_utf8 {
    my($val) = @_;

    # A missing or non-numeric argument must only report the status.
    # Comparing such a value with == would treat it as 0 and silently
    # switch conversion off.
    require Scalar::Util;
    return $UNICODE
        unless defined $val && Scalar::Util::looks_like_number($val);

    if ($val == 1) {
        if ($unicode_module) {
            $UNICODE = 1;
            $Encode::Guess::NoUTFAutoGuess = 1;
        }
    } elsif ($val == 0) {
        $UNICODE = 0;
    }

    return $UNICODE;
}
185
186=pod
187
188=item use_winamp_genres()
189
190Puts WinAmp genres into C<@mp3_genres> and C<%mp3_genres>
191(adds 68 additional genres to the default list of 80).
192This is a separate function because these are non-standard
193genres, but they are included because they are widely used.
194
195You can import the data structures with one of:
196
197 use MP3::Info qw(:genres);
198 use MP3::Info qw(:DEFAULT :genres);
199 use MP3::Info qw(:all);
200
201=cut
202
# Replace the active genre list and its lookup table with the WinAmp
# variants.  Always returns 1.
sub use_winamp_genres {
    @mp3_genres = @winamp_genres;
    %mp3_genres = %winamp_genres;

    return 1;
}
208
209=pod
210
211=item remove_mp3tag (FILE [, VERSION, BUFFER])
212
213Can remove ID3v1 or ID3v2 tags. VERSION should be C<1> for ID3v1
214(the default), C<2> for ID3v2, and C<ALL> for both.
215
216For ID3v1, removes last 128 bytes from file if those last 128 bytes begin
217with the text 'TAG'. File will be 128 bytes shorter.
218
219For ID3v2, removes ID3v2 tag. Because an ID3v2 tag is at the
220beginning of the file, we rewrite the file after removing the tag data.
221The buffer for rewriting the file is 4MB. BUFFER (in bytes) can
222change the buffer size.
223
224Returns the number of bytes removed, or -1 if no tag removed,
225or undef if there is an error.
226
227=cut
228
# Strip an ID3v1 and/or ID3v2 tag from a file.
#
#   $file     file name, or an already opened filehandle
#   $version  1 (default) for ID3v1, 2 for ID3v2, 'ALL' for both
#   $buf      chunk size in bytes used while moving the remaining data
#             towards the start of the file after an ID3v2 tag is
#             dropped (default 4096*1024)
#
# Returns the number of bytes removed, -1 when nothing was removed, or
# undef with $@ set when no file was given, the file is empty or it
# cannot be opened.
sub remove_mp3tag {
    my($file, $version, $buf) = @_;
    my($fh, $return);

    $version ||= 1;
    $buf     ||= 4096*1024;    # the bigger the faster

    unless (defined $file && $file ne '') {
        $@ = "No file specified";
        return undef;
    }

    unless (-s $file) {
        $@ = "File is empty";
        return undef;
    }

    if (ref $file) {           # filehandle passed
        $fh = $file;
    } elsif (not open $fh, '+<', $file) {
        $@ = "Can't open $file: $!";
        return undef;
    }

    binmode $fh;

    my $want_v1 = $version eq 1 || $version eq 'ALL';
    my $want_v2 = $version eq 2 || $version eq 'ALL';

    if ($want_v1) {
        # the v1 tag, if any, occupies the last 128 bytes
        seek $fh, -128, 2;
        my $tag_start = tell $fh;
        my $chunk     = <$fh>;

        if ($chunk =~ /^TAG/) {
            truncate $fh, $tag_start or carp "Can't truncate '$file': $!";
            $return += 128;
        }
    }

    if ($want_v2) {
        if (my $v2h = _get_v2head($fh)) {
            local $\;

            seek $fh, 0, 2;
            my $eof   = tell $fh;
            my $shift = $v2h->{tag_size};

            # copy everything behind the tag $shift bytes towards the
            # start of the file, one chunk at a time
            for (my $src = $shift; $src < $eof; $src += $buf) {
                seek $fh, $src, 0;
                read $fh, my($bytes), $buf;
                seek $fh, $src - $shift, 0;
                print $fh $bytes;
            }

            truncate $fh, $eof - $shift
                or carp "Can't truncate '$file': $!";
            $return += $shift;
        }
    }

    _close($file, $fh);

    return $return || -1;
}
292
293
294=pod
295
296=item set_mp3tag (FILE, TITLE, ARTIST, ALBUM, YEAR, COMMENT, GENRE [, TRACKNUM])
297
298=item set_mp3tag (FILE, $HASHREF)
299
300Adds/changes tag information in an MP3 audio file. Will clobber
301any existing information in file.
302
303Fields are TITLE, ARTIST, ALBUM, YEAR, COMMENT, GENRE. All fields have
304a 30-byte limit, except for YEAR, which has a four-byte limit, and GENRE,
305which is one byte in the file. The GENRE passed in the function is a
306case-insensitive text string representing a genre found in C<@mp3_genres>.
307
308Will accept either a list of values, or a hashref of the type
309returned by C<get_mp3tag>.
310
311If TRACKNUM is present (for ID3v1.1), then the COMMENT field can only be
31228 bytes.
313
314ID3v2 support may come eventually. Note that if you set a tag on a file
315with ID3v2, the set tag will be for ID3v1[.1] only, and if you call
316C<get_mp3tag> on the file, it will show you the (unchanged) ID3v2 tags,
317unless you specify ID3v1.
318
319=cut
320
# Write an ID3v1 / ID3v1.1 tag to a file, replacing an existing v1 tag or
# appending a new one.
#
#   $file     file name, or an already opened read/write filehandle
#   $title    either the title string, followed by ARTIST, ALBUM, YEAR,
#             COMMENT, GENRE and optionally TRACKNUM, or a hash reference
#             keyed by those field names (as returned by get_mp3tag)
#
# GENRE is a genre name looked up in %mp3_genres; the spelling as given
# is tried first and then its lower-case form, so the match is
# case-insensitive.  Unknown genres are stored as 255.
#
# Returns 1 on success.  Returns undef after a usage warning when the
# second argument is a reference other than a hash, and undef with $@
# set when no file was given, the file is empty or it cannot be opened.
sub set_mp3tag {
    my($file, $title, $artist, $album, $year, $comment, $genre, $tracknum) = @_;
    my(%info, $ref, $fh);

    # private copy: the COMMENT width is narrowed below for ID3v1.1
    local %v1_tag_fields = %v1_tag_fields;

    # set each to '' if undef
    for ($title, $artist, $album, $year, $comment, $tracknum, $genre,
        (@info{@v1_tag_names}))
    {
        $_ = '' unless defined $_;
    }

    # find out what kind of reference (if any) was passed as 2nd argument
    ($ref) = (overload::StrVal($title) =~ /^(?:.*\=)?([^=]*)\((?:[^\(]*)\)$/)
        if ref $title;

    # populate data to hashref if hashref is not passed
    if (!$ref) {
        (@info{@v1_tag_names}) =
            ($title, $artist, $album, $year, $comment, $tracknum, $genre);

    # put data from hashref into hashref if hashref is passed
    } elsif ($ref eq 'HASH') {
        %info = %$title;

    # return otherwise
    } else {
        carp(<<'EOT');
Usage: set_mp3tag (FILE, TITLE, ARTIST, ALBUM, YEAR, COMMENT, GENRE [, TRACKNUM])
       set_mp3tag (FILE, $HASHREF)
EOT
        return undef;
    }

    if (not (defined $file && $file ne '')) {
        $@ = "No file specified";
        return undef;
    }

    if (not -s $file) {
        $@ = "File is empty";
        return undef;
    }

    # comment field length 28 if ID3v1.1
    $v1_tag_fields{COMMENT} = 28 if $info{TRACKNUM};

    # Genre names are matched case-insensitively: try the spelling as
    # given, then fall back to its lower-case form (%mp3_genres carries a
    # lower-case key for every genre name).
    my $genre_key = $info{GENRE};
    if ($genre_key
        && !exists $mp3_genres{$genre_key}
        && exists $mp3_genres{lc $genre_key})
    {
        $genre_key = lc $genre_key;
    }

    # only if -w is on
    if ($^W) {
        # warn if fields too long
        foreach my $field (keys %v1_tag_fields) {
            $info{$field} = '' unless defined $info{$field};
            if (length($info{$field}) > $v1_tag_fields{$field}) {
                carp "Data too long for field $field: truncated to " .
                     "$v1_tag_fields{$field}";
            }
        }

        if ($info{GENRE}) {
            carp "Genre `$info{GENRE}' does not exist\n"
                unless exists $mp3_genres{$genre_key};
        }
    }

    if ($info{TRACKNUM}) {
        # accept "track/total" and keep only the track number
        $info{TRACKNUM} =~ s/^(\d+)\/(\d+)$/$1/;
        unless ($info{TRACKNUM} =~ /^\d+$/ &&
                $info{TRACKNUM} > 0 && $info{TRACKNUM} < 256) {
            carp "Tracknum `$info{TRACKNUM}' must be an integer " .
                 "from 1 and 255\n" if $^W;
            $info{TRACKNUM} = '';
        }
    }

    if (ref $file) {           # filehandle passed
        $fh = $file;
    } else {
        if (not open $fh, '+<', $file) {
            $@ = "Can't open $file: $!";
            return undef;
        }
    }

    binmode $fh;
    seek $fh, -128, 2;
    # position on the existing tag if there is one (overwrite it),
    # otherwise at the end of the file (append)
    seek $fh, (<$fh> =~ /^TAG/ ? -128 : 0), 2;

    # get genre value
    $info{GENRE} = $genre_key && exists $mp3_genres{$genre_key} ?
        $mp3_genres{$genre_key} : 255;    # some default genre

    local $\;
    # print TAG to file
    if ($info{TRACKNUM}) {
        print {$fh} pack 'a3a30a30a30a4a28xCC', 'TAG', @info{@v1_tag_names};
    } else {
        print {$fh} pack 'a3a30a30a30a4a30C', 'TAG', @info{@v1_tag_names[0..4, 6]};
    }

    _close($file, $fh);

    return 1;
}
425
426=pod
427
428=item get_mp3tag (FILE [, VERSION, RAW_V2])
429
430Returns hash reference containing tag information in MP3 file. The keys
431returned are the same as those supplied for C<set_mp3tag>, except in the
432case of RAW_V2 being set.
433
434If VERSION is C<1>, the information is taken from the ID3v1 tag (if present).
435If VERSION is C<2>, the information is taken from the ID3v2 tag (if present).
436If VERSION is not supplied, or is false, the ID3v1 tag is read if present, and
437then, if present, the ID3v2 tag information will override any existing ID3v1
438tag info.
439
440If RAW_V2 is C<1>, the raw ID3v2 tag data is returned, without any manipulation
441of text encoding. The key name is the same as the frame ID (ID to name mappings
442are in the global %v2_tag_names).
443
444If RAW_V2 is C<2>, the ID3v2 tag data is returned, manipulating for Unicode if
445necessary, etc. It also takes multiple values for a given key (such as comments)
446and puts them in an arrayref.
447
448If the ID3v2 version is older than ID3v2.2.0 or newer than ID3v2.4.0, it will
449not be read.
450
451Strings returned will be in Latin-1, unless UTF-8 is specified (L<use_mp3_utf8>),
452(unless RAW_V2 is C<1>).
453
454Also returns a TAGVERSION key, containing the ID3 version used for the returned
455data (if VERSION argument is C<0>, may contain two versions).
456
457=cut
458
# Read tag information from a file.
#
#   $file      file name, or an already opened filehandle
#   $ver       1 = ID3v1 only, 2 = ID3v2 only, anything else = both, with
#              ID3v2 parsed after ID3v1 into the same result hash
#   $raw_v2    1 = return the raw ID3v2 frames (only together with
#              $ver == 2), 2 = parsed ID3v2 frames keyed by frame ID;
#              defaults to 0
#   $find_ape  when true, an APE tag is looked for as well
#
# Returns a reference to a hash of tag fields, including TAGVERSION, or
# undef (with $@ set on the error paths) when nothing could be read.
sub get_mp3tag {
    my ($file, $ver, $raw_v2, $find_ape) = @_;
    my ($v2h, $fh);

    my ($v1, $v2, $ape) = ({}, {}, {});
    my %info = ();

    $raw_v2 ||= 0;

    # anything but 1 or 2 means "both versions"
    $ver = 0 unless $ver && ($ver == 2 || $ver == 1);

    unless (defined $file && $file ne '') {
        $@ = "No file specified";
        return undef;
    }

    my $filesize = -s $file;

    unless ($filesize) {
        $@ = "File is empty";
        return undef;
    }

    if (ref $file) {           # filehandle passed
        $fh = $file;
    } elsif (not open $fh, '<', $file) {
        $@ = "Can't open $file: $!";
        return undef;
    }

    binmode $fh;

    # Try and find an APE Tag - this is where FooBar2k & others
    # store ReplayGain information
    $ape = _parse_ape_tag($fh, $filesize, \%info) if $find_ape;

    if ($ver < 2) {
        $v1 = _get_v1tag($fh, \%info);

        if ($ver == 1 && !$v1) {
            _close($file, $fh);
            $@ = "No ID3v1 tag found";
            return undef;
        }
    }

    my $v2_wanted = $ver == 2 || $ver == 0;

    ($v2, $v2h) = _get_v2tag($fh) if $v2_wanted;

    # NOTE(review): $ape starts out as a (true) hash reference and is only
    # reassigned when $find_ape is set, so this test can only succeed for
    # calls that asked for APE tags - confirm that this is intended.
    if (!$v1 && !$v2 && !$ape) {
        _close($file, $fh);
        $@ = "No ID3 tag found";
        return undef;
    }

    if ($v2_wanted && $v2) {
        if ($raw_v2 == 1 && $ver == 2) {
            # raw mode: hand back the frames untouched
            %info = %$v2;
            $info{'TAGVERSION'} = $v2h->{'version'};
        } else {
            _parse_v2tag($raw_v2, $v2, \%info);

            # when both tag versions were read, report both
            if ($ver == 0 && $info{'TAGVERSION'}) {
                $info{'TAGVERSION'} .= ' / ' . $v2h->{'version'};
            } else {
                $info{'TAGVERSION'} = $v2h->{'version'};
            }
        }
    }

    unless ($raw_v2 && $ver == 2) {
        # cut each value at its first NUL and drop trailing whitespace
        for my $value (grep { defined } values %info) {
            $value =~ s/\000+.*//g;
            $value =~ s/\s+$//;
        }

        # every v1 field is present in the result, if only as ''
        for my $name (@v1_tag_names) {
            $info{$name} = '' unless defined $info{$name};
        }
    }

    if (exists $info{'GENRE'} && !defined $info{'GENRE'}) {
        $info{'GENRE'} = '';
    }

    _close($file, $fh);

    return undef unless keys %info;
    return {%info};
}
564
# Read the ID3v1 / ID3v1.1 tag from the last 128 bytes of a file.
#
#   $fh    open filehandle
#   $info  hash reference that receives the tag fields and TAGVERSION
#
# Returns 1 when a tag was found and stored in %$info, 0 otherwise.
# When UTF-8 conversion is enabled the stored values are decoded, using
# Encode::Guess with a fall back to iso-8859-1.
sub _get_v1tag {
    my ($fh, $info) = @_;

    seek $fh, -128, 2;
    read($fh, my $tag, 128);

    if (!defined($tag) || $tag !~ /^TAG/) {
        return 0;
    }

    # ID3v1.1: the next-to-last comment byte is NUL and the byte after it
    # (the track number) is not
    if (substr($tag, -3, 2) =~ /\000[^\000]/) {

        (undef, @{$info}{@v1_tag_names}) =
            (unpack('a3a30a30a30a4a28', $tag),
            ord(substr($tag, -2, 1)),
            $mp3_genres[ord(substr $tag, -1)]);

        $info->{'TAGVERSION'} = 'ID3v1.1';

    } else {

        (undef, @{$info}{@v1_tag_names[0..4, 6]}) =
            (unpack('a3a30a30a30a4a30', $tag),
            $mp3_genres[ord(substr $tag, -1)]);

        $info->{'TAGVERSION'} = 'ID3v1';
    }

    if ($UNICODE) {

        # Remember the NAMES of the current suspects.  iso-8859-1 may be
        # added below and must be gone again before any ID3v2 parsing.
        # A snapshot of the names is needed: a reference to the suspects
        # hash would alias the live data, and "restoring" from it would
        # put iso-8859-1 straight back.
        my @old_suspects =
            keys %{ $Encode::Encoding{'Guess'}->{'Suspects'} || {} };

        for my $key (keys %{$info}) {

            next unless $info->{$key};

            # Try and guess the encoding.
            my $value = $info->{$key};
            my $icode = Encode::Guess->guess($value);

            unless (ref($icode)) {

                # Often Latin1 bytes are
                # stuffed into a 1.1 tag.
                Encode::Guess->add_suspects('iso-8859-1');

                while (length($value)) {

                    $icode = Encode::Guess->guess($value);

                    last if ref($icode);

                    # Remove garbage and retry
                    # (string is truncated in the
                    # middle of a multibyte char?)
                    $value =~ s/(.)$//;
                }
            }

            $info->{$key} = Encode::decode(ref($icode) ? $icode->name : 'iso-8859-1', $info->{$key});
        }

        Encode::Guess->set_suspects(@old_suspects);
    }

    return 1;
}
636
# Turn raw ID3v2 frames into entries of the result hash.
#
#   $raw_v2  2 = store every frame known to %v2_tag_names under its own
#            frame ID, collecting repeated frames in array references;
#            any other value = store only the frames listed in
#            %v2_to_v1_names, under their mapped names
#   $v2      hash reference of raw frames (frame ID => data, or array
#            reference of data); modified in place
#   $info    hash reference receiving the parsed values
#
# Frame handling:
#   UFI/UFID          identifier after the first NUL
#   RVA/RVAD/RVA2     expanded into nested REPLAYGAIN_* hashes
#   PIC/APIC          first picture only, as { DATA => ..., FORMAT => ... }
#   everything else   treated as text: encoding byte stripped, decoded
#                     when UTF-8 conversion is on, genre numbers resolved
sub _parse_v2tag {
    my ($raw_v2, $v2, $info) = @_;

    # Make sure any existing TXXX flags are an array.
    # As we might need to append comments to it below.
    if ($v2->{'TXXX'} && ref($v2->{'TXXX'}) ne 'ARRAY') {

        $v2->{'TXXX'} = [ $v2->{'TXXX'} ];
    }

    # J.River Media Center sticks RG tags in comments.
    # Ugh. Make them look like TXXX tags, which is really what they are.
    if (ref($v2->{'COMM'}) eq 'ARRAY' && grep { /Media Jukebox/ } @{$v2->{'COMM'}}) {

        for my $comment (@{$v2->{'COMM'}}) {

            if ($comment =~ /Media Jukebox/) {

                # we only want one null to lead.
                $comment =~ s/^\000+//g;

                push @{$v2->{'TXXX'}}, "\000$comment";
            }
        }
    }

    # frame ID => key under which the value is stored in %$info
    my $hash = $raw_v2 == 2 ? { map { ($_, $_) } keys %v2_tag_names } : \%v2_to_v1_names;

    for my $id (keys %$hash) {

        next if !exists $v2->{$id};

        if ($id =~ /^UFID?$/) {

            my @ufid_list = split(/\0/, $v2->{$id});

            $info->{$hash->{$id}} = $ufid_list[1] if ($#ufid_list > 0);

        } elsif ($id =~ /^RVA[D2]?$/) {

            # Expand these binary fields. See the ID3 spec for Relative Volume Adjustment.
            if ($id eq 'RVA2') {

                # ID is a text string
                ($info->{$hash->{$id}}->{'ID'}, my $rvad) = split /\0/, $v2->{$id};

                my $channel = $rva2_channel_types{ ord(substr($rvad, 0, 1, '')) };

                $info->{$hash->{$id}}->{$channel}->{'REPLAYGAIN_TRACK_GAIN'} =
                    sprintf('%f', _grab_int_16(\$rvad) / 512);

                my $peakBytes = ord(substr($rvad, 0, 1, ''));

                if (int($peakBytes / 8)) {

                    $info->{$hash->{$id}}->{$channel}->{'REPLAYGAIN_TRACK_PEAK'} =
                        sprintf('%f', _grab_int_16(\$rvad) / 512);
                }

            } elsif ($id eq 'RVAD' || $id eq 'RVA') {

                my $rvad  = $v2->{$id};
                my $flags = ord(substr($rvad, 0, 1, ''));
                my $desc  = ord(substr($rvad, 0, 1, ''));

                # iTunes appears to be the only program that actually writes
                # out a RVA/RVAD tag. Everyone else punts.
                for my $type (qw(REPLAYGAIN_TRACK_GAIN REPLAYGAIN_TRACK_PEAK)) {

                    for my $channel (qw(RIGHT LEFT)) {

                        my $val = _grab_uint_16(\$rvad) / 256;

                        # iTunes uses a range of -255 to 255
                        # to be -100% (silent) to 100% (+6dB)
                        # NOTE(review): _grab_uint_16 presumably yields an
                        # unsigned value, in which case the -255 branch
                        # can never be taken - confirm.
                        if ($val == -255) {
                            $val = -96.0;
                        } else {
                            $val = 20.0 * log(($val+255)/255)/log(10);
                        }

                        $info->{$hash->{$id}}->{$channel}->{$type} = $flags & 0x01 ? $val : -$val;
                    }
                }
            }

        } elsif ($id =~ /^A?PIC$/) {

            my $pic = $v2->{$id};

            # if there is more than one picture, just grab the first one.
            if (ref($pic) eq 'ARRAY') {
                $pic = (@$pic)[0];
            }

            use bytes;

            my $valid_pic  = 0;
            my $pic_len    = 0;    # length of the header preceding the image
            my $pic_format = '';

            if ($pic && $id eq 'PIC') {

                # look for ID3 v2.2 picture
                my ($encoding, $format, $picture_type, $description) = unpack 'Ca3CZ*', $pic;
                $pic_len = length($description) + 1 + 5;

                # skip extra terminating null if unicode
                if ($encoding) { $pic_len++; }

                if ($pic_len < length($pic)) {
                    $valid_pic  = 1;
                    $pic_format = $format;
                }

            } elsif ($pic && $id eq 'APIC') {

                # look for ID3 v2.3 picture
                my ($encoding, $format) = unpack 'C Z*', $pic;

                $pic_len = length($format) + 2;

                if ($pic_len < length($pic)) {

                    my ($picture_type, $description) = unpack "x$pic_len C Z*", $pic;

                    $pic_len += 1 + length($description) + 1;

                    # skip extra terminating null if unicode
                    if ($encoding) { $pic_len++; }

                    $valid_pic  = 1;
                    $pic_format = $format;
                }
            }

            # Proceed if we have a valid picture.
            if ($valid_pic && $pic_format) {

                # 'a*', not 'A*': the image is binary data, and 'A' would
                # strip trailing spaces and NUL bytes from it.
                my ($data) = unpack("x$pic_len a*", $pic);

                if (length($data) && $pic_format) {

                    $info->{$hash->{$id}} = {
                        'DATA'   => $data,
                        'FORMAT' => $pic_format,
                    }
                }
            }

        } else {
            my $data1 = $v2->{$id};

            # this is tricky ... if this is an arrayref,
            # we want to only return one, so we pick the
            # first one.  but if it is a comment, we pick
            # the first one where the first character after
            # the language is NULL and not an additional
            # sub-comment, because that is most likely to be
            # the user-supplied comment
            if (ref $data1 && !$raw_v2) {
                if ($id =~ /^COMM?$/) {
                    my($newdata) = grep /^(....\000)/, @{$data1};
                    $data1 = $newdata || $data1->[0];
                } elsif ($id !~ /^(?:TXXX?|PRIV)$/) {
                    # We can get multiple User Defined Text frames in a mp3 file
                    $data1 = $data1->[0];
                }
            }

            $data1 = [ $data1 ] if ! ref $data1;

            for my $data (@$data1) {
                # TODO : this should only be done for certain frames;
                # using RAW still gives you access, but we should be smarter
                # about how individual frame types are handled.  it's not
                # like the list is infinitely long.

                # strip first char (text encoding); take the capture only
                # when the substitution matched, so that an empty frame
                # does not pick up a stale $1
                my $encoding = $data =~ s/^(.)// ? $1 : '';
                my $desc;

                # Comments & Unsynchronized Lyrics have the same format.
                if ($id =~ /^(COM[M ]?|USLT)$/) { # space for iTunes brokenness

                    $data =~ s/^(?:...)//;        # strip language
                }

                if ($UNICODE) {

                    if ($encoding eq "\001" || $encoding eq "\002") {  # UTF-16, UTF-16BE
                        # text fields can be null-separated lists;
                        # UTF-16 therefore needs special care
                        #
                        # foobar2000 encodes tags in UTF-16LE
                        # (which is apparently illegal)
                        # Encode dies on a bad BOM, so it is
                        # probably wise to wrap it in an eval
                        # anyway
                        $data = eval { Encode::decode('utf16', $data) } || Encode::decode('utf16le', $data);

                    } elsif ($encoding eq "\003") { # UTF-8

                        # make sure string is UTF8, and set flag appropriately
                        $data = Encode::decode('utf8', $data);

                    } elsif ($encoding eq "\000") {

                        # Only guess if it's not ascii.
                        if ($data && $data !~ /^[\x00-\x7F]+$/) {

                            # Try and guess the encoding, otherwise just use latin1
                            my $dec = Encode::Guess->guess($data);

                            if (ref $dec) {
                                $data = $dec->decode($data);
                            } else {
                                # Best try
                                $data = Encode::decode('iso-8859-1', $data);
                            }
                        }
                    }

                } else {

                    # If the string starts with an
                    # UTF-16 little endian BOM, use a hack to
                    # convert to ASCII per best-effort
                    my $pat;
                    if ($data =~ s/^\xFF\xFE//) {
                        $pat = 'v';
                    } elsif ($data =~ s/^\xFE\xFF//) {
                        $pat = 'n';
                    }

                    if ($pat) {
                        $data = pack 'C*', map {
                            (chr =~ /[[:ascii:]]/ && chr =~ /[[:print:]]/)
                                ? $_
                                : ord('?')
                        } unpack "$pat*", $data;
                    }
                }

                # We do this after decoding so we could be certain we're dealing
                # with 8-bit text.
                if ($id =~ /^(COM[M ]?|USLT)$/) { # space for iTunes brokenness

                    # strip up to first NULL(s), for sub-comments
                    # (TODO: handle all comment data).  Without a NUL there
                    # is no description: leave $desc undefined instead of
                    # reading the capture of the frame ID match above.
                    if ($data =~ s/^(.*?)\000//) {
                        $desc = $1;
                    }

                } elsif ($id =~ /^TCON?$/) {

                    my ($index, $name);

                    # Turn multiple nulls into a single.
                    $data =~ s/\000+/\000/g;

                    # Handle the ID3v2.x spec -
                    #
                    # just an index number, possibly
                    # paren enclosed - refer to the v1 genres.
                    if ($data =~ /^ \(? (\d+) \)?\000?$/sx) {

                        $index = $1;

                    # Paren enclosed index with refinement.
                    # (4)Eurodisco
                    } elsif ($data =~ /^ \( (\d+) \)\000? ([^\(].+)$/x) {

                        ($index, $name) = ($1, $2);

                    # List of indexes: (37)(38)
                    } elsif ($data =~ /^ \( (\d+) \)\000?/x) {

                        my @genres = ();

                        while ($data =~ s/^ \( (\d+) \)\000?//x) {

                            push @genres, $mp3_genres[$1];
                        }

                        $data = \@genres;
                    }

                    # Text based genres will fall through.
                    if ($name && $name ne "\000") {
                        $data = $name;
                    } elsif (defined $index) {
                        $data = $mp3_genres[$index];
                    }
                }

                if ($raw_v2 == 2 && $desc) {
                    $data = { $desc => $data };
                }

                if ($raw_v2 == 2 && exists $info->{$hash->{$id}}) {

                    # repeated frame: collect the values in an array
                    if (ref $info->{$hash->{$id}} eq 'ARRAY') {
                        push @{$info->{$hash->{$id}}}, $data;
                    } else {
                        $info->{$hash->{$id}} = [ $info->{$hash->{$id}}, $data ];
                    }

                } else {

                    # User defined frame
                    if ($id eq 'TXXX') {

                        my ($key, $val) = split(/\0/, $data);
                        $info->{uc($key)} = $val;

                    } elsif ($id eq 'PRIV') {

                        my ($key, $val) = split(/\0/, $data);
                        $info->{uc($key)} = unpack('v', $val);

                    } else {

                        $info->{$hash->{$id}} = $data;
                    }
                }
            }
        }
    }
}
966
# Read the ID3v2 tag of a file and split it into raw frames.
#
#   $fh  open filehandle
#
# Returns ($frames, $header): $frames maps each frame ID to its raw data
# (an array reference when the frame occurs more than once), $header is
# what _get_v2head() returned.  Returns nothing when there is no ID3v2
# header or its major version is below 2.
sub _get_v2tag {
    my($fh) = @_;

    my $v2  = {};
    my $v2h = _get_v2head($fh) or return;

    if ($v2h->{major_version} < 2) {
        carp "This is $v2h->{version}; " .
             "ID3v2 versions older than ID3v2.2.0 not supported\n"
            if $^W;
        return;
    }

    # use syncsafe bytes if using version 2.4
    # my $bytesize = ($v2h->{major_version} > 3) ? 128 : 256;

    # alas, that's what the spec says, but iTunes and others don't syncsafe
    # the length, which breaks MP3 files with v2.4 tags longer than 128 bytes,
    # like every image file.
    my $bytesize = 256;

    # v2.2 frame headers: 3-byte ID + 3-byte size;
    # later versions: 4-byte ID + 4-byte size + 2 flag bytes
    my $is_v22 = $v2h->{major_version} == 2;
    my $hlen   = $is_v22 ? 6 : 10;
    my $num    = $is_v22 ? 3 : 4;

    my $off = $v2h->{ext_header_size} + 10;
    my $end = $v2h->{tag_size} + 10;    # should we read in the footer too?

    my $wholetag;
    seek $fh, $v2h->{offset}, 0;
    read $fh, $wholetag, $end;

    # undo tag-level unsynchronisation
    $wholetag =~ s/\xFF\x00/\xFF/gs if $v2h->{unsync};

    # Decode the frame header at the current offset.  Returns the frame
    # ID, the total frame size (header included) and a flags hash, or
    # nothing when no frame header is found there.
    my $frame_head = sub {
        my $bytes = substr($wholetag, $off, $hlen);
        return unless $bytes =~ /^([A-Z0-9]{$num})/
            || ($num == 4 && $bytes =~ /^(COM )/);    # stupid iTunes
        my($id, $size) = ($1, $hlen);

        # big-endian size field, least significant byte first after reverse
        my @digits = reverse unpack "C$num", substr($bytes, $num, $num);
        $size += $digits[$_] * $bytesize ** $_ for 0 .. ($num - 1);

        my $flags = {};
        if ($v2h->{major_version} > 3) {
            my @bits = split //, unpack 'B16', substr($bytes, 8, 2);
            $flags->{frame_unsync}       = $bits[14];
            $flags->{data_len_indicator} = $bits[15];
        }

        return($id, $size, $flags);
    };

    while ($off < $end) {
        my($id, $size, $flags) = $frame_head->() or last;

        my $payload = substr($wholetag, $off+$hlen, $size-$hlen);

        # optional 4-byte (7 bits per byte) data length in front of the data
        my $data_len;
        if ($flags->{data_len_indicator}) {
            my @len_bytes = reverse unpack 'C4', substr($payload, 0, 4);
            $payload  = substr($payload, 4);
            $data_len = 0;
            $data_len += $len_bytes[$_] * 128 ** $_ for 0 .. 3;
        }

        # perform frame-level unsync if needed (skip if already done for whole tag)
        $payload =~ s/\xFF\x00/\xFF/gs if $flags->{frame_unsync} && !$v2h->{unsync};

        # if we know the data length, sanity check it now.
        if ($flags->{data_len_indicator} && defined $data_len) {
            carp "Size mismatch on $id\n" unless $data_len == length($payload);
        }

        # first occurrence is stored as a scalar, repeats as an array
        if (!exists $v2->{$id}) {
            $v2->{$id} = $payload;
        } elsif (ref $v2->{$id} eq 'ARRAY') {
            push @{$v2->{$id}}, $payload;
        } else {
            $v2->{$id} = [$v2->{$id}, $payload];
        }

        $off += $size;
    }

    return($v2, $v2h);
}
1063
1064
1065=pod
1066
1067=item get_mp3info (FILE)
1068
1069Returns hash reference containing file information for MP3 file.
1070This data cannot be changed. Returned data:
1071
1072 VERSION MPEG audio version (1, 2, 2.5)
1073 LAYER MPEG layer description (1, 2, 3)
1074 STEREO boolean for audio is in stereo
1075
1076 VBR boolean for variable bitrate
1077 BITRATE bitrate in kbps (average for VBR files)
1078 FREQUENCY frequency in kHz
1079 SIZE bytes in audio stream
1080 OFFSET bytes offset that stream begins
1081
1082 SECS total seconds
1083 MM minutes
1084 SS leftover seconds
1085 MS leftover milliseconds
1086 TIME time in MM:SS
1087
1088 COPYRIGHT boolean for audio is copyrighted
1089 PADDING boolean for MP3 frames are padded
1090 MODE channel mode (0 = stereo, 1 = joint stereo,
1091 2 = dual channel, 3 = single channel)
1092 FRAMES approximate number of frames
1093 FRAME_LENGTH approximate length of a frame
1094 VBR_SCALE VBR scale from VBR header
1095
1096On error, returns nothing and sets C<$@>.
1097
1098=cut
1099
# Collect stream information for an MP3 file.
#
#   $file  file name, or an already opened filehandle
#
# Looks for the first MPEG audio frame header (directly behind an ID3v2
# tag if there is one, otherwise by scanning the following bytes), reads
# VBR information, and passes both to _get_info().
#
# Returns the hash reference built by _get_info(), or undef with $@ set
# when no file was given, the file is empty, it cannot be opened or the
# header search gave up.
sub get_mp3info {
    my($file) = @_;
    my($byte, $eof, $h, $fh);

    unless (defined $file && $file ne '') {
        $@ = "No file specified";
        return undef;
    }

    unless (-s $file) {
        $@ = "File is empty";
        return undef;
    }

    if (ref $file) {           # filehandle passed
        $fh = $file;
    } elsif (not open $fh, '<', $file) {
        $@ = "Can't open $file: $!";
        return undef;
    }

    my $off = 0;
    my $tot = 8192;

    # Let the caller change how far we seek in looking for a header.
    $tot *= $try_harder if $try_harder;

    binmode $fh;
    seek $fh, $off, 0;
    read $fh, $byte, 4;

    if ($off == 0) {
        if (my $v2h = _get_v2head($fh)) {
            # skip the ID3v2 tag and extend the search window accordingly
            $off += $v2h->{tag_size};
            $tot += $off;
            seek $fh, $off, 0;
            read $fh, $byte, 4;
        }
    }

    $h = _get_head($byte);
    my $is_mp3 = _is_mp3($h);

    # the head wasn't where we were expecting it.. dig deeper.
    if (!$is_mp3) {

        # do only one read - it's _much_ faster
        $off++;
        seek $fh, $off, 0;
        read $fh, $byte, $tot;

        # now walk the bytes looking for the head
        my $i = 0;
        while ($i < $tot) {

            last if ($tot - $i) < 4;

            my $head = substr($byte, $i, 4) || last;

            # a frame header starts with a 0xff byte
            if (ord($head) == 0xff) {
                $h      = _get_head($head);
                $is_mp3 = _is_mp3($h);
                last if $is_mp3;
            }

            $i++;
        }

        # adjust where we are for _get_vbr()
        $off += $i;

        # NOTE(review): this compares the file offset with the size of the
        # search window rather than testing $is_mp3 - confirm that a
        # failed search is always caught here.
        if ($off > $tot && !$try_harder) {
            _close($file, $fh);
            $@ = "Couldn't find MP3 header (perhaps set " .
                 '$MP3::Info::try_harder and retry)';
            return undef;
        }
    }

    my $vbr = _get_vbr($fh, $h, \$off);

    # the audio data ends at EOF, or in front of a trailing ID3v1 tag
    seek $fh, 0, 2;
    $eof = tell $fh;
    seek $fh, -128, 2;
    my $tail = <$fh>;
    $eof -= 128 if $tail =~ /^TAG/;

    _close($file, $fh);

    $h->{size}   = $eof - $off;
    $h->{offset} = $off;

    return _get_info($h, $vbr);
}
1195
# Derive the public information hash from a decoded frame header.
#
#   $h    header hash as built by _get_head(), with 'size' and 'offset'
#         added by the caller
#   $vbr  VBR information hash, or undef for constant bitrate
#
# Returns a hash reference with the keys VERSION, LAYER, VBR, COPYRIGHT,
# PADDING, STEREO, MODE, SIZE, OFFSET, FRAMES, SECS, MM, SS, MS, TIME,
# BITRATE, FREQUENCY and, where available, VBR_SCALE and FRAME_LENGTH.
# Returns an empty hash reference when the header has no bitrate or
# sample rate, and undef (with $@ set) when the average bitrate of a VBR
# stream cannot be determined.
sub _get_info {
    my($h, $vbr) = @_;
    my $i;

    # No bitrate or sample rate?  Something's wrong.
    unless ($h->{bitrate} && $h->{fs}) {
        return {};
    }

    $i->{VERSION}   = $h->{IDR} == 2 ? 2 : $h->{IDR} == 3 ? 1 :
                      $h->{IDR} == 0 ? 2.5 : 0;
    $i->{LAYER}     = 4 - $h->{layer};
    $i->{VBR}       = defined $vbr ? 1 : 0;

    $i->{COPYRIGHT} = $h->{copyright} ? 1 : 0;
    $i->{PADDING}   = $h->{padding_bit} ? 1 : 0;
    $i->{STEREO}    = $h->{mode} == 3 ? 0 : 1;
    $i->{MODE}      = $h->{mode};

    # prefer the sizes recorded in the VBR header, when present
    $i->{SIZE}      = $vbr && $vbr->{bytes} ? $vbr->{bytes} : $h->{size};
    $i->{OFFSET}    = $h->{offset};

    my $mfs         = $h->{fs} / ($h->{ID} ? 144000 : 72000);
    $i->{FRAMES}    = int($vbr && $vbr->{frames}
                        ? $vbr->{frames}
                        : $i->{SIZE} / ($h->{bitrate} / $mfs)
                      );

    if ($vbr) {
        $i->{VBR_SCALE} = $vbr->{scale} if $vbr->{scale};

        # Average bitrate over all frames.  With zero frames it cannot be
        # computed; report that through the error path below instead of
        # dying with a division by zero.
        $h->{bitrate} = $i->{FRAMES}
            ? $i->{SIZE} / $i->{FRAMES} * $mfs
            : 0;

        if (not $h->{bitrate}) {
            $@ = "Couldn't determine VBR bitrate";
            return undef;
        }
    }

    # 'length' is in hundredths of a second
    $h->{'length'}  = ($i->{SIZE} * 8) / $h->{bitrate} / 10;
    $i->{SECS}      = $h->{'length'} / 100;
    $i->{MM}        = int $i->{SECS} / 60;
    $i->{SS}        = int $i->{SECS} % 60;
    $i->{MS}        = (($i->{SECS} - ($i->{MM} * 60) - $i->{SS}) * 1000);
#   $i->{LF}        = ($i->{MS} / 1000) * ($i->{FRAMES} / $i->{SECS});
#   int($i->{MS} / 100 * 75);  # is this right?
    $i->{TIME}      = sprintf "%.2d:%.2d", @{$i}{'MM', 'SS'};

    $i->{BITRATE}   = int $h->{bitrate};
    # should we just return if ! FRAMES?
    $i->{FRAME_LENGTH} = int($h->{size} / $i->{FRAMES}) if $i->{FRAMES};
    $i->{FREQUENCY} = $frequency_tbl[3 * $h->{IDR} + $h->{sampling_freq}];

    return $i;
}
1249
# Decode a 4-byte frame header into a hashref of its bit fields.
#
# The raw bytes are turned into one integer by _unpack_head() and each field
# is masked out of it.  'bitrate' and 'fs' are then looked up in @t_bitrate
# and @t_sampling_freq; either is undef when the indexes point at an entry
# that does not exist.
sub _get_head {
    my ($raw) = @_;

    my $word = _unpack_head($raw);

    my $h = {
        IDR            => ($word >> 19) & 3,
        ID             => ($word >> 19) & 1,
        layer          => ($word >> 17) & 3,
        protection_bit => ($word >> 16) & 1,

        bitrate_index  => ($word >> 12) & 15,
        sampling_freq  => ($word >> 10) & 3,
        padding_bit    => ($word >> 9)  & 1,
        private_bit    => ($word >> 8)  & 1,

        mode           => ($word >> 6)  & 3,
        mode_extension => ($word >> 4)  & 3,
        copyright      => ($word >> 3)  & 1,
        original       => ($word >> 2)  & 1,

        emphasis       => $word & 3,
        version_index  => ($word >> 19) & 3,
        bytes          => $word,
    };

    my $layer_row = 3 - $h->{layer};
    $h->{bitrate} = $t_bitrate[ $h->{ID} ][$layer_row][ $h->{bitrate_index} ];
    $h->{fs}      = $t_sampling_freq[ $h->{IDR} ][ $h->{sampling_freq} ];

    return $h;
}
1270
# Decide whether a header hashref (as built by _get_head) looks like a valid
# MP3 frame header.  Returns undef when no header is given, otherwise a
# boolean: true only if none of the rejection tests below fires.
sub _is_mp3 {
    my $h = $_[0] or return undef;

    my $no  = !1;
    my $yes = !0;

    # Each test below disqualifies the header; they run in a fixed order and
    # the first hit wins.
    return $no if $h->{bitrate_index} == 0;
    return $no if $h->{version_index} == 1;
    return $no if ($h->{bytes} & 0xFFE00000) != 0xFFE00000;
    return $no if !$h->{fs};
    return $no if !$h->{bitrate};
    return $no if $h->{bitrate_index} == 15;
    return $no if !$h->{layer};
    return $no if $h->{sampling_freq} == 3;
    return $no if $h->{emphasis} == 2;
    return $no if !$h->{bitrate_index};
    return $no if ($h->{bytes} & 0xFFFF0000) == 0xFFFE0000;
    return $no
        if $h->{ID} == 1 && $h->{layer} == 3 && $h->{protection_bit} == 1;

    # mode extension should only be applicable when mode = 1
    # however, failing just because mode extension is used when unneeded is
    # a bit strict, so this test stays disabled:
    #   ($h->{mode_extension} != 0 && $h->{mode} != 1)

    return $yes;
}
1303
# Read $n bytes (default 4) from $fh at the absolute position held in $$off,
# store them in $$bytes and advance $$off past them.  Returns the new offset.
sub _vbr_seek {
    my ($fh, $off, $bytes, $n) = @_;
    $n ||= 4;

    seek($fh, ${$off}, 0);
    read($fh, ${$bytes}, $n);

    ${$off} += $n;
    return ${$off};
}
1315
# Look for a 'Xing' marker at a fixed distance past the frame header that
# starts at $$roff and, when it is there, decode the fields announced by its
# flags word.
#
# Returns nothing when the marker is absent ($$roff is left alone), otherwise
# a hashref with 'flags', optionally 'frames' and 'bytes', and 'scale' (-1
# when the file does not provide one); $$roff is moved past what was read.
sub _get_vbr {
    my ($fh, $h, $roff) = @_;
    my (%vbr, $chunk);

    # Distance from the end of the 4-byte header to the marker depends on
    # the MPEG version bit and on whether mode is 3.
    my $skip = $h->{ID}
        ? ($h->{mode} == 3 ? 17 : 32)    # MPEG1
        : ($h->{mode} == 3 ?  9 : 17);   # MPEG2

    my $pos = $$roff + 4 + $skip;

    _vbr_seek($fh, \$pos, \$chunk);
    return unless $chunk eq 'Xing';

    _vbr_seek($fh, \$pos, \$chunk);
    $vbr{flags} = _unpack_head($chunk);

    # Flag bit 1 announces a frame count, bit 2 a byte count.
    for my $field ([1, 'frames'], [2, 'bytes']) {
        my ($bit, $name) = @{$field};
        next unless $vbr{flags} & $bit;

        _vbr_seek($fh, \$pos, \$chunk);
        $vbr{$name} = _unpack_head($chunk);
    }

    # Flag bit 4: a 100-byte table follows.  It is skipped, not decoded.
    if ($vbr{flags} & 4) {
        _vbr_seek($fh, \$pos, \$chunk, 100);
#       Not used right now ...
#       $vbr{toc} = _unpack_head($chunk);
    }

    # Flag bit 8: (quality ind., 0=best 100=worst)
    if ($vbr{flags} & 8) {
        _vbr_seek($fh, \$pos, \$chunk);
        $vbr{scale} = _unpack_head($chunk);
    }
    else {
        $vbr{scale} = -1;
    }

    $$roff = $pos;
    return \%vbr;
}
1362
# Read the ID3v2 tag header from the start of $fh (or from the ID3 chunk of a
# RIFF/AIFF container).
#
# Returns nothing when no handle is given or no 'ID3' marker is found,
# otherwise a hashref with: offset, version, major_version, minor_version,
# unsync, ext_header, experimental, tag_size, ext_header_size, plus
# 'compression' for v2.2 tags and 'footer' for v2.4 tags.
sub _get_v2head {
    my $fh = $_[0] or return;
    my($v2h, $bytes, @bytes);
    $v2h->{offset} = 0;

    # check first three bytes for 'ID3'
    seek $fh, 0, 0;
    read $fh, $bytes, 3;

    # TODO: add support for tags at the end of the file
    if ($bytes eq 'RIF' || $bytes eq 'FOR') {
        _find_id3_chunk($fh, $bytes) or return;
        $v2h->{offset} = tell $fh;
        read $fh, $bytes, 3;
    }

    return unless $bytes eq 'ID3';

    # get version
    read $fh, $bytes, 2;
    $v2h->{version} = sprintf "ID3v2.%d.%d",
        @$v2h{qw[major_version minor_version]} =
            unpack 'c2', $bytes;

    # get flags
    # 'b8' lists the bits least-significant first, so the list has exactly
    # eight elements and $bits[7] is the top bit of the flags byte.
    read $fh, $bytes, 1;
    my @bits = split //, unpack 'b8', $bytes;
    if ($v2h->{major_version} == 2) {
        $v2h->{unsync}       = $bits[7];
        # The compression flag is the bit just below unsync.  (Index 8 does
        # not exist in an 8-element list and always read back as undef.)
        $v2h->{compression}  = $bits[6];
        $v2h->{ext_header}   = 0;
        $v2h->{experimental} = 0;
    } else {
        $v2h->{unsync}       = $bits[7];
        $v2h->{ext_header}   = $bits[6];
        $v2h->{experimental} = $bits[5];
        $v2h->{footer}       = $bits[4] if $v2h->{major_version} == 4;
    }

    # get ID3v2 tag length from bytes 7-10
    $v2h->{tag_size} = 10;  # include ID3v2 header size
    $v2h->{tag_size} += 10 if $v2h->{footer};
    read $fh, $bytes, 4;
    @bytes = reverse unpack 'C4', $bytes;
    foreach my $i (0 .. 3) {
        # seven significant bits per byte, least significant byte first
        $v2h->{tag_size} += $bytes[$i] * 128 ** $i;
    }

    # get extended header size
    $v2h->{ext_header_size} = 0;
    if ($v2h->{ext_header}) {
        read $fh, $bytes, 4;
        @bytes = reverse unpack 'C4', $bytes;

        # use syncsafe bytes if using version 2.4
        my $bytesize = ($v2h->{major_version} > 3) ? 128 : 256;
        for my $i (0..3) {
            $v2h->{ext_header_size} += $bytes[$i] * $bytesize ** $i;
        }
    }

    return $v2h;
}
1427
# Position $fh at the start of the data of the ID3 chunk inside a RIFF (WAV)
# or FORM (AIFF) container.
#
#   $fh       - handle positioned just after the first three bytes
#   $filetype - those three bytes: 'RIF' or 'FOR'
#
# Returns 1 with $fh positioned right after the chunk's 8-byte header when
# the chunk is found, 0 otherwise.
sub _find_id3_chunk {
    my($fh, $filetype) = @_;
    my($bytes, $size, $tag, $pat, $mat);

    # The fourth byte completes the container magic.
    read $fh, $bytes, 1;
    if ($filetype eq 'RIF') {  # WAV
        return 0 if $bytes ne 'F';
        $pat = 'a4V';          # chunk id + little-endian size
        $mat = 'id3 ';
    } elsif ($filetype eq 'FOR') { # AIFF
        return 0 if $bytes ne 'M';
        $pat = 'a4N';          # chunk id + big-endian size
        $mat = 'ID3 ';
    } else {
        # Unknown container: without a template every chunk would compare
        # equal to the (undefined) target and be reported as a match.
        return 0;
    }
    seek $fh, 12, 0;  # skip to the first chunk

    while ((read $fh, $bytes, 8) == 8) {
        ($tag, $size)  = unpack $pat, $bytes;
        return 1 if $tag eq $mat;

        # Chunk data is padded to an even length, and the pad byte is not
        # counted in the size field; skip it so the next header lines up.
        seek $fh, $size + ($size % 2), 1;
    }

    return 0;
}
1452
# Interpret the first four bytes of the argument as a big-endian 32-bit
# integer and return it as a signed value.
sub _unpack_head {
    my @word = unpack('N', $_[0]);           # big-endian, unsigned
    return unpack('l', pack('L', @word));    # same 32 bits, read as signed
}
1456
# Remove the first two bytes from the string referenced by the argument and
# return them decoded as a signed 16-bit integer in the machine's native byte
# order (pack template 's').
sub _grab_int_16 {
    my ($buf) = @_;

    my $head = substr(${$buf}, 0, 2);
    ${$buf}  = substr(${$buf}, 2);

    return scalar unpack('s', $head);
}
1463
# Remove the first two bytes from the string referenced by the argument and
# return them decoded as an unsigned 16-bit integer in the machine's native
# byte order (pack template 'S').
sub _grab_uint_16 {
    my ($buf) = @_;

    my $head = substr(${$buf}, 0, 2);
    ${$buf}  = substr(${$buf}, 2);

    return scalar unpack('S', $head);
}
1470
# Remove the first four bytes from the string referenced by the argument and
# return them decoded as a little-endian unsigned 32-bit integer (pack
# template 'V').
sub _grab_int_32 {
    my ($buf) = @_;

    my $head = substr(${$buf}, 0, 4);
    ${$buf}  = substr(${$buf}, 4);

    return scalar unpack('V', $head);
}
1477
# Look for an APE tag at the end of the file and copy its items into $info.
#
#   $fh       - open, seekable handle on the file
#   $filesize - size of the file in bytes
#   $info     - hashref that receives one entry per tag item, keyed by the
#               upper-cased item name
#
# Returns 0 when the quick probe finds no 'APETAGEX' marker, 1 otherwise.
# The handle is rewound to the start of the file before returning.
sub _parse_ape_tag {
    my ($fh, $filesize, $info) = @_;

    my $ape_tag_id = 'APETAGEX';

    seek $fh, -256, 2;
    read($fh, my $tag, 256);
    my $pre_tag = substr($tag, 0, 128, '');

    # Try and bail early if there's no ape tag.  The marker is looked for 32
    # bytes before the end of each 128-byte half of the last 256 bytes.
    if (substr($pre_tag, 96, 8) ne $ape_tag_id && substr($tag, 96, 8) ne $ape_tag_id) {

        seek($fh, 0, 0);
        return 0;
    }

    my $id3v1_tag_size      = 128;
    my $ape_tag_header_size = 32;
    my $lyrics3_tag_size    = 10;
    my $tag_offset_start    = 0;
    my $tag_offset_end      = 0;

    seek($fh, (0 - $id3v1_tag_size - $ape_tag_header_size - $lyrics3_tag_size), 2);

    read($fh, my $ape_footer_id3v1, $id3v1_tag_size + $ape_tag_header_size + $lyrics3_tag_size);

    if (substr($ape_footer_id3v1, (length($ape_footer_id3v1) - $id3v1_tag_size - $ape_tag_header_size), 8) eq $ape_tag_id) {

        # footer sits in front of a 128-byte trailer
        $tag_offset_end = $filesize - $id3v1_tag_size;

    } elsif (substr($ape_footer_id3v1, (length($ape_footer_id3v1) - $ape_tag_header_size), 8) eq $ape_tag_id) {

        # footer is the very last thing in the file
        $tag_offset_end = $filesize;
    }

    seek($fh, $tag_offset_end - $ape_tag_header_size, 0);

    read($fh, my $ape_footer_data, 32);

    my $ape_footer = _parse_ape_header_or_footer($ape_footer_data);

    if (keys %{$ape_footer}) {

        my $ape_tag_data = '';
        my $tag_items;

        if ($ape_footer->{'flags'}->{'header'}) {

            seek($fh, ($tag_offset_end - $ape_footer->{'tag_size'} - $ape_tag_header_size), 0);

            $tag_offset_start = tell($fh);

            read($fh, $ape_tag_data, $ape_footer->{'tag_size'} + $ape_tag_header_size);

            # The first 32 bytes are the header; it supplies the item count.
            my $ape_header_data = substr($ape_tag_data, 0, $ape_tag_header_size, '');
            my $ape_header      = _parse_ape_header_or_footer($ape_header_data);

            $tag_items = $ape_header->{'tag_items'};

        } else {

            $tag_offset_start = $tag_offset_end - $ape_footer->{'tag_size'};

            seek($fh, $tag_offset_start, 0);

            read($fh, $ape_tag_data, $ape_footer->{'tag_size'});

            # No header in front of the items: nothing to strip, and the
            # item count has to come from the footer.
            $tag_items = $ape_footer->{'tag_items'};
        }

        for (my $c = 0; $c < ($tag_items || 0); $c++) {

            # A damaged item count must not run past the data we read.
            last if length($ape_tag_data) < 8;

            # Loop through the tag items
            my $tag_len = _grab_int_32(\$ape_tag_data);
            _grab_int_32(\$ape_tag_data);    # item flags, not used

            # The key is NUL-terminated.  Only trust $1 when the match
            # succeeded; otherwise it would still hold the previous key.
            last unless $ape_tag_data =~ s/^(.*?)\0//s;

            my $tag_item_key = uc($1 || 'UNKNOWN');

            $info->{$tag_item_key} = substr($ape_tag_data, 0, $tag_len, '');
        }
    }

    seek($fh, 0, 0);

    return 1;
}
1561
# Decode a 32-byte APE tag header or footer.
#
# Returns a reference to an empty hash when the data does not start with
# 'APETAGEX'; otherwise a hashref with version, tag_size, tag_items,
# global_flags and a 'flags' sub-hash (header, footer, is_header) derived
# from the top three bits of global_flags.
sub _parse_ape_header_or_footer {
    my ($bytes) = @_;
    my %data    = ();

    return \%data unless substr($bytes, 0, 8, '') eq 'APETAGEX';

    # Four little-endian 32-bit fields follow the marker; the eight reserved
    # bytes after them are ignored.
    @data{qw(version tag_size tag_items global_flags)} = unpack('V4', $bytes);

    my @flag_bits = (
        [ header    => 0x80000000 ],
        [ footer    => 0x40000000 ],
        [ is_header => 0x20000000 ],
    );
    for my $flag (@flag_bits) {
        my ($name, $mask) = @{$flag};
        $data{'flags'}->{$name} = ($data{'global_flags'} & $mask) ? 1 : 0;
    }

    return \%data;
}
1584
# Close $fh unless the caller originally handed us a filehandle: when $file
# is a reference the handle is left open, when it is a plain name the handle
# is closed and a failure is reported with carp.
sub _close {
    my ($file, $fh) = @_;

    # filehandle passed => nothing to do; otherwise close and complain on error
    ref($file) or close($fh) or carp "Problem closing '$file': $!";
}
1591
# Static lookup tables.  They are filled in a BEGIN block so they exist as
# soon as this part of the file has been compiled.
BEGIN {
    # Genre names; a genre's number is its position in this list (0-79).
    @mp3_genres = (
        # 0 - 9
        'Blues', 'Classic Rock', 'Country', 'Dance', 'Disco',
        'Funk', 'Grunge', 'Hip-Hop', 'Jazz', 'Metal',
        # 10 - 19
        'New Age', 'Oldies', 'Other', 'Pop', 'R&B',
        'Rap', 'Reggae', 'Rock', 'Techno', 'Industrial',
        # 20 - 29
        'Alternative', 'Ska', 'Death Metal', 'Pranks', 'Soundtrack',
        'Euro-Techno', 'Ambient', 'Trip-Hop', 'Vocal', 'Jazz+Funk',
        # 30 - 39
        'Fusion', 'Trance', 'Classical', 'Instrumental', 'Acid',
        'House', 'Game', 'Sound Clip', 'Gospel', 'Noise',
        # 40 - 49
        'AlternRock', 'Bass', 'Soul', 'Punk', 'Space',
        'Meditative', 'Instrumental Pop', 'Instrumental Rock', 'Ethnic', 'Gothic',
        # 50 - 59
        'Darkwave', 'Techno-Industrial', 'Electronic', 'Pop-Folk', 'Eurodance',
        'Dream', 'Southern Rock', 'Comedy', 'Cult', 'Gangsta',
        # 60 - 69
        'Top 40', 'Christian Rap', 'Pop/Funk', 'Jungle', 'Native American',
        'Cabaret', 'New Wave', 'Psychadelic', 'Rave', 'Showtunes',
        # 70 - 79
        'Trailer', 'Lo-Fi', 'Tribal', 'Acid Punk', 'Acid Jazz',
        'Polka', 'Retro', 'Musical', 'Rock & Roll', 'Hard Rock',
    );

    # The list above followed by the additional genres numbered 80-147.
    @winamp_genres = (
        @mp3_genres,
        # 80 - 89
        'Folk', 'Folk-Rock', 'National Folk', 'Swing', 'Fast Fusion',
        'Bebop', 'Latin', 'Revival', 'Celtic', 'Bluegrass',
        # 90 - 99
        'Avantgarde', 'Gothic Rock', 'Progressive Rock', 'Psychedelic Rock', 'Symphonic Rock',
        'Slow Rock', 'Big Band', 'Chorus', 'Easy Listening', 'Acoustic',
        # 100 - 109
        'Humour', 'Speech', 'Chanson', 'Opera', 'Chamber Music',
        'Sonata', 'Symphony', 'Booty Bass', 'Primus', 'Porn Groove',
        # 110 - 119
        'Satire', 'Slow Jam', 'Club', 'Tango', 'Samba',
        'Folklore', 'Ballad', 'Power Ballad', 'Rhythmic Soul', 'Freestyle',
        # 120 - 129
        'Duet', 'Punk Rock', 'Drum Solo', 'Acapella', 'Euro-House',
        'Dance Hall', 'Goa', 'Drum & Bass', 'Club-House', 'Hardcore',
        # 130 - 139
        'Terror', 'Indie', 'BritPop', 'Negerpunk', 'Polsk Punk',
        'Beat', 'Christian Gangsta Rap', 'Heavy Metal', 'Black Metal', 'Crossover',
        # 140 - 147
        'Contemporary Christian', 'Christian Rock', 'Merengue', 'Salsa', 'Thrash Metal',
        'Anime', 'JPop', 'Synthpop',
    );

    # Bitrate table, read by _get_head() as
    #   $t_bitrate[ID][3 - layer][bitrate_index]
    @t_bitrate = ([
        [0, 32, 48, 56,  64,  80,  96, 112, 128, 144, 160, 176, 192, 224, 256],
        [0,  8, 16, 24,  32,  40,  48,  56,  64,  80,  96, 112, 128, 144, 160],
        [0,  8, 16, 24,  32,  40,  48,  56,  64,  80,  96, 112, 128, 144, 160]
    ],[
        [0, 32, 64, 96, 128, 160, 192, 224, 256, 288, 320, 352, 384, 416, 448],
        [0, 32, 48, 56,  64,  80,  96, 112, 128, 160, 192, 224, 256, 320, 384],
        [0, 32, 40, 48,  56,  64,  80,  96, 112, 128, 160, 192, 224, 256, 320]
    ]);

    # Sampling-rate table, read by _get_head() as
    #   $t_sampling_freq[IDR][sampling_freq]
    @t_sampling_freq = (
        [11025, 12000,  8000],
        [undef, undef, undef],  # reserved
        [22050, 24000, 16000],
        [44100, 48000, 32000]
    );

    # The same rates divided by 1000, flattened row by row so that
    # _get_info() can index them with 3 * IDR + sampling_freq; reserved
    # entries become 0.  Plain division replaces the former string eval of
    # "<rate>e-3", which computed the same quotient.
    @frequency_tbl = map { $_ ? $_ / 1000 : 0 }
        map { @$_ } @t_sampling_freq;

    # Names of the fields an info hash can carry.
    @mp3_info_fields = qw(
        VERSION
        LAYER
        STEREO
        VBR
        BITRATE
        FREQUENCY
        SIZE
        OFFSET
        SECS
        MM
        SS
        MS
        TIME
        COPYRIGHT
        PADDING
        MODE
        FRAMES
        FRAME_LENGTH
        VBR_SCALE
    );

    # Channel-type byte of an RVA2 frame => symbolic name.
    %rva2_channel_types = (
        0x00 => 'OTHER',
        0x01 => 'MASTER',
        0x02 => 'FRONT_RIGHT',
        0x03 => 'FRONT_LEFT',
        0x04 => 'BACK_RIGHT',
        0x05 => 'BACK_LEFT',
        0x06 => 'FRONT_CENTER',
        0x07 => 'BACK_CENTER',
        0x08 => 'SUBWOOFER',
    );

    # ID3v1 text field => its width in bytes.
    %v1_tag_fields =
        (TITLE => 30, ARTIST => 30, ALBUM => 30, COMMENT => 30, YEAR => 4);

    @v1_tag_names = qw(TITLE ARTIST ALBUM YEAR COMMENT TRACKNUM GENRE);

    # ID3v2 frame id => the v1-style name it is reported under.
    %v2_to_v1_names = (
        # v2.2 tags
        'TT2' => 'TITLE',
        'TP1' => 'ARTIST',
        'TAL' => 'ALBUM',
        'TYE' => 'YEAR',
        'COM' => 'COMMENT',
        'TRK' => 'TRACKNUM',
        'TCO' => 'GENRE', # not clean mapping, but ...
        # v2.3 tags
        'TIT2' => 'TITLE',
        'TPE1' => 'ARTIST',
        'TALB' => 'ALBUM',
        'TYER' => 'YEAR',
        'COMM' => 'COMMENT',
        'TRCK' => 'TRACKNUM',
        'TCON' => 'GENRE',
        # v2.3 tags - needed for MusicBrainz
        'UFID' => 'Unique file identifier',
        'TXXX' => 'User defined text information frame',
    );

    # ID3v2 frame id => human-readable description.
    %v2_tag_names = (
        # v2.2 tags
        'BUF' => 'Recommended buffer size',
        'CNT' => 'Play counter',
        'COM' => 'Comments',
        'CRA' => 'Audio encryption',
        'CRM' => 'Encrypted meta frame',
        'ETC' => 'Event timing codes',
        'EQU' => 'Equalization',
        'GEO' => 'General encapsulated object',
        'IPL' => 'Involved people list',
        'LNK' => 'Linked information',
        'MCI' => 'Music CD Identifier',
        'MLL' => 'MPEG location lookup table',
        'PIC' => 'Attached picture',
        'POP' => 'Popularimeter',
        'REV' => 'Reverb',
        'RVA' => 'Relative volume adjustment',
        'SLT' => 'Synchronized lyric/text',
        'STC' => 'Synced tempo codes',
        'TAL' => 'Album/Movie/Show title',
        'TBP' => 'BPM (Beats Per Minute)',
        'TCM' => 'Composer',
        'TCO' => 'Content type',
        'TCR' => 'Copyright message',
        'TDA' => 'Date',
        'TDY' => 'Playlist delay',
        'TEN' => 'Encoded by',
        'TFT' => 'File type',
        'TIM' => 'Time',
        'TKE' => 'Initial key',
        'TLA' => 'Language(s)',
        'TLE' => 'Length',
        'TMT' => 'Media type',
        'TOA' => 'Original artist(s)/performer(s)',
        'TOF' => 'Original filename',
        'TOL' => 'Original Lyricist(s)/text writer(s)',
        'TOR' => 'Original release year',
        'TOT' => 'Original album/Movie/Show title',
        'TP1' => 'Lead artist(s)/Lead performer(s)/Soloist(s)/Performing group',
        'TP2' => 'Band/Orchestra/Accompaniment',
        'TP3' => 'Conductor/Performer refinement',
        'TP4' => 'Interpreted, remixed, or otherwise modified by',
        'TPA' => 'Part of a set',
        'TPB' => 'Publisher',
        'TRC' => 'ISRC (International Standard Recording Code)',
        'TRD' => 'Recording dates',
        'TRK' => 'Track number/Position in set',
        'TSI' => 'Size',
        'TSS' => 'Software/hardware and settings used for encoding',
        'TT1' => 'Content group description',
        'TT2' => 'Title/Songname/Content description',
        'TT3' => 'Subtitle/Description refinement',
        'TXT' => 'Lyricist/text writer',
        'TXX' => 'User defined text information frame',
        'TYE' => 'Year',
        'UFI' => 'Unique file identifier',
        'ULT' => 'Unsychronized lyric/text transcription',
        'WAF' => 'Official audio file webpage',
        'WAR' => 'Official artist/performer webpage',
        'WAS' => 'Official audio source webpage',
        'WCM' => 'Commercial information',
        'WCP' => 'Copyright/Legal information',
        'WPB' => 'Publishers official webpage',
        'WXX' => 'User defined URL link frame',

        # v2.3 tags
        'AENC' => 'Audio encryption',
        'APIC' => 'Attached picture',
        'COMM' => 'Comments',
        'COMR' => 'Commercial frame',
        'ENCR' => 'Encryption method registration',
        'EQUA' => 'Equalization',
        'ETCO' => 'Event timing codes',
        'GEOB' => 'General encapsulated object',
        'GRID' => 'Group identification registration',
        'IPLS' => 'Involved people list',
        'LINK' => 'Linked information',
        'MCDI' => 'Music CD identifier',
        'MLLT' => 'MPEG location lookup table',
        'OWNE' => 'Ownership frame',
        'PCNT' => 'Play counter',
        'POPM' => 'Popularimeter',
        'POSS' => 'Position synchronisation frame',
        'PRIV' => 'Private frame',
        'RBUF' => 'Recommended buffer size',
        'RVAD' => 'Relative volume adjustment',
        'RVRB' => 'Reverb',
        'SYLT' => 'Synchronized lyric/text',
        'SYTC' => 'Synchronized tempo codes',
        'TALB' => 'Album/Movie/Show title',
        'TBPM' => 'BPM (beats per minute)',
        'TCOM' => 'Composer',
        'TCON' => 'Content type',
        'TCOP' => 'Copyright message',
        'TDAT' => 'Date',
        'TDLY' => 'Playlist delay',
        'TENC' => 'Encoded by',
        'TEXT' => 'Lyricist/Text writer',
        'TFLT' => 'File type',
        'TIME' => 'Time',
        'TIT1' => 'Content group description',
        'TIT2' => 'Title/songname/content description',
        'TIT3' => 'Subtitle/Description refinement',
        'TKEY' => 'Initial key',
        'TLAN' => 'Language(s)',
        'TLEN' => 'Length',
        'TMED' => 'Media type',
        'TOAL' => 'Original album/movie/show title',
        'TOFN' => 'Original filename',
        'TOLY' => 'Original lyricist(s)/text writer(s)',
        'TOPE' => 'Original artist(s)/performer(s)',
        'TORY' => 'Original release year',
        'TOWN' => 'File owner/licensee',
        'TPE1' => 'Lead performer(s)/Soloist(s)',
        'TPE2' => 'Band/orchestra/accompaniment',
        'TPE3' => 'Conductor/performer refinement',
        'TPE4' => 'Interpreted, remixed, or otherwise modified by',
        'TPOS' => 'Part of a set',
        'TPUB' => 'Publisher',
        'TRCK' => 'Track number/Position in set',
        'TRDA' => 'Recording dates',
        'TRSN' => 'Internet radio station name',
        'TRSO' => 'Internet radio station owner',
        'TSIZ' => 'Size',
        'TSRC' => 'ISRC (international standard recording code)',
        'TSSE' => 'Software/Hardware and settings used for encoding',
        'TXXX' => 'User defined text information frame',
        'TYER' => 'Year',
        'UFID' => 'Unique file identifier',
        'USER' => 'Terms of use',
        'USLT' => 'Unsychronized lyric/text transcription',
        'WCOM' => 'Commercial information',
        'WCOP' => 'Copyright/Legal information',
        'WOAF' => 'Official audio file webpage',
        'WOAR' => 'Official artist/performer webpage',
        'WOAS' => 'Official audio source webpage',
        'WORS' => 'Official internet radio station homepage',
        'WPAY' => 'Payment',
        'WPUB' => 'Publishers official webpage',
        'WXXX' => 'User defined URL link frame',

        # v2.4 additional tags
        # note that we don't restrict tags from 2.3 or 2.4,
        'ASPI' => 'Audio seek point index',
        'EQU2' => 'Equalisation (2)',
        'RVA2' => 'Relative volume adjustment (2)',
        'SEEK' => 'Seek frame',
        'SIGN' => 'Signature frame',
        'TDEN' => 'Encoding time',
        'TDOR' => 'Original release time',
        'TDRC' => 'Recording time',
        'TDRL' => 'Release time',
        'TDTG' => 'Tagging time',
        'TIPL' => 'Involved people list',
        'TMCL' => 'Musician credits list',
        'TMOO' => 'Mood',
        'TPRO' => 'Produced notice',
        'TSOA' => 'Album sort order',
        'TSOP' => 'Performer sort order',
        'TSOT' => 'Title sort order',
        'TSST' => 'Set subtitle',

        # grrrrrrr
        'COM ' => 'Broken iTunes comments',
    );
}
1996
19971;
1998
1999__END__
2000
2001=pod
2002
2003=back
2004
2005=head1 TROUBLESHOOTING
2006
2007If you find a bug, please send me a patch (see the project page in L<"SEE ALSO">).
2008If you cannot figure out why it does not work for you, please put the MP3 file in
2009a place where I can get it (preferably via FTP, or HTTP, or .Mac iDisk) and send me
2010mail regarding where I can get the file, with a detailed description of the problem.
2011
2012If I download the file, after debugging the problem I will not keep the MP3 file
2013if it is not legal for me to have it. Just let me know if it is legal for me to
2014keep it or not.
2015
2016
2017=head1 TODO
2018
2019=over 4
2020
2021=item ID3v2 Support
2022
2023Still need to do more for reading tags, such as using Compress::Zlib to decompress
2024compressed tags. But until I see this in use more, I won't bother. If something
2025does not work properly with reading, follow the instructions above for
2026troubleshooting.
2027
2028ID3v2 I<writing> is coming soon.
2029
2030=item Get data from scalar
2031
2032Instead of passing a file spec or filehandle, pass the
2033data itself. Would take some work, converting the seeks, etc.
2034
2035=item Padding bit ?
2036
2037Do something with padding bit.
2038
2039=item Test suite
2040
2041Test suite could use a bit of an overhaul and update. Patches very welcome.
2042
2043=over 4
2044
2045=item *
2046
2047Revamp getset.t. Test all the various get_mp3tag args.
2048
2049=item *
2050
2051Test Unicode.
2052
2053=item *
2054
2055Test OOP API.
2056
2057=item *
2058
2059Test error handling, check more for missing files, bad MP3s, etc.
2060
2061=back
2062
2063=item Other VBR
2064
2065Right now, only Xing VBR is supported.
2066
2067=back
2068
2069
2070=head1 THANKS
2071
2072Edward Allen,
2073Vittorio Bertola,
2074Michael Blakeley,
2075Per Bolmstedt,
2076Tony Bowden,
2077Tom Brown,
2078Sergio Camarena,
2079Chris Dawson,
2080Anthony DiSante,
2081Luke Drumm,
2082Kyle Farrell,
2083Jeffrey Friedl,
2084brian d foy,
2085Ben Gertzfield,
2086Brian Goodwin,
2087Todd Hanneken,
2088Todd Harris,
2089Woodrow Hill,
2090Kee Hinckley,
2091Roman Hodek,
2092Ilya Konstantinov,
2093Peter Kovacs,
2094Johann Lindvall,
2095Alex Marandon,
2096Peter Marschall,
2097michael,
2098Trond Michelsen,
2099Dave O'Neill,
2100Christoph Oberauer,
2101Jake Palmer,
2102Andrew Phillips,
2103David Reuteler,
2104John Ruttenberg,
2105Matthew Sachs,
2106scfc_de,
2107Hermann Schwaerzler,
2108Chris Sidi,
2109Roland Steinbach,
2110Brian S. Stephan,
2111Stuart,
2112Dan Sully,
2113Jeffery Sumler,
2114Predrag Supurovic,
2115Bogdan Surdu,
2116Pierre-Yves Thoulon,
2117tim,
2118Pass F. B. Travis,
2119Tobias Wagener,
2120Ronan Waide,
2121Andy Waite,
2122Ken Williams,
2123Ben Winslow,
2124Meng Weng Wong.
2125
2126
2127=head1 CURRENT AUTHOR
2128
2129Dan Sully E<lt>dan | at | slimdevices.comE<gt> & Slim Devices, Inc.
2130
2131=head1 AUTHOR EMERITUS
2132
2133Chris Nandor E<lt>pudge@pobox.comE<gt>, http://pudge.net/
2134
2135=head1 COPYRIGHT AND LICENSE
2136
2137Copyright (c) 2006 Dan Sully & Slim Devices, Inc. All rights reserved.
2138
2139Copyright (c) 1998-2005 Chris Nandor. All rights reserved.
2140
2141This program is free software; you can redistribute it and/or modify it under
2142the same terms as Perl itself.
2143
2144=head1 SEE ALSO
2145
2146=over 4
2147
2148=item Slim Devices
2149
2150 http://www.slimdevices.com/
2151
2152=item mp3tools
2153
2154 http://www.zevils.com/linux/mp3tools/
2155
2156=item mpgtools
2157
2158 http://www.dv.co.yu/mpgscript/mpgtools.htm
2159 http://www.dv.co.yu/mpgscript/mpeghdr.htm
2160
2161=item mp3tool
2162
2163 http://www.dtek.chalmers.se/~d2linjo/mp3/mp3tool.html
2164
2165=item ID3v2
2166
2167 http://www.id3.org/
2168
2169=item Xing Variable Bitrate
2170
2171 http://www.xingtech.com/support/partner_developer/mp3/vbr_sdk/
2172
2173=item MP3Ext
2174
2175 http://rupert.informatik.uni-stuttgart.de/~mutschml/MP3ext/
2176
2177=item Xmms
2178
2179 http://www.xmms.org/
2180
2181
2182=back
2183
2184=cut
diff --git a/tools/songdb.pl b/tools/songdb.pl
new file mode 100755
index 0000000000..cba30492da
--- /dev/null
+++ b/tools/songdb.pl
@@ -0,0 +1,448 @@
1#!/usr/bin/perl
2#
3# Rockbox song database docs:
4# http://www.rockbox.org/twiki/bin/view/Main/TagCache
5#
6
7use mp3info;
8use vorbiscomm;
9
# configuration settings
my $db = "tagcache";
my $dir;
my $strip;
my $add;
my $verbose;
my $help;
my $dirisalbum;
my $littleendian = 0;
my $dbver = 0x54434804;

# file data
my %entries;

# Options that consume the following argument, and the variable each sets.
my %value_option = (
    "--path"  => \$dir,
    "--db"    => \$db,
    "--strip" => \$strip,
    "--add"   => \$add,
);

# Switches that simply turn a setting on.
my %flag_option = (
    "--dirisalbum"   => \$dirisalbum,
    "--littleendian" => \$littleendian,
    "--verbose"      => \$verbose,
    "--help"         => \$help,
    "-h"             => \$help,
);

# Walk the whole argument list.  Looping on @ARGV rather than on the truth of
# $ARGV[0] keeps a stray "0" or empty argument from ending option processing
# early.  Unknown arguments are skipped silently.
while (@ARGV) {
    my $arg = shift @ARGV;

    if (my $target = $value_option{$arg}) {
        $$target = shift @ARGV;
    }
    elsif (my $switch = $flag_option{$arg}) {
        $$switch = 1;
    }
}
65
# Print the usage text and exit when --help was given or when --path does not
# name an existing directory.  The "is not a directory" line is only printed
# when a path was actually supplied.
if(! -d $dir or $help) {
    print "'$dir' is not a directory\n" if ($dir ne "" and ! -d $dir);
    print <<MOO

songdb --path <dir> [--db <file>] [--strip <path>] [--add <path>] [--dirisalbum] [--littleendian] [--verbose] [--help]

Options:

 --path <dir> Where your music collection is found
 --db <file> Prefix for output files. Defaults to tagcache.
 --strip <path> Removes this string from the left of all file names
 --add <path> Adds this string to the left of all file names
 --dirisalbum Use dir name as album name if the album name is missing in the
 tags
 --littleendian Write out data as little endian (for simulator)
 --verbose Shows more details while working
 --help This text
MOO
;
    exit;
}
87
# Read the artist, album and title comments of an Ogg file.
#
# Returns a hashref keyed ARTIST / ALBUM / TITLE, the same key names the id3
# parser hash uses.  The hash is empty when the file cannot be loaded or
# carries none of these comments.  When a comment occurs more than once the
# last value wins.
sub get_oggtag {
    my $fn = shift;
    my %hash;

    # vorbiscomm->new returns undef for a missing or unreadable file.
    my $ogg = vorbiscomm->new($fn);
    return \%hash unless $ogg;

    $ogg->load;

    # Convert this format into the same format used by the id3 parser hash

    # comment_tags() can hand back an undefined entry when there are no
    # comments; skip it.
    foreach my $k (grep { defined } $ogg->comment_tags())
    {
        next unless $k =~ /^(artist|album|title)$/i;
        my $n = uc $1;

        foreach my $cmmt ($ogg->comment($k))
        {
            $hash{$n} = $cmmt;
        }
    }

    return \%hash;
}
118
# Return the INFO hashref of an Ogg file as stored by vorbiscomm, or nothing
# when the file cannot be loaded.
sub get_ogginfo {
    my $fn = shift;

    # vorbiscomm->new returns undef for a missing or unreadable file.
    my $ogg = vorbiscomm->new($fn);
    return unless $ogg;

    $ogg->load;

    return $ogg->{'INFO'};
}
129
# return ALL directory entries in the given dir
#
# A trailing slash is removed from the name first (except for "/").  When the
# directory cannot be opened a warning is printed and an empty list is
# returned, so callers never see a bogus entry.
sub getdir {
    my ($dir) = @_;

    $dir =~ s|/$|| if ($dir ne "/");

    my $dh;
    unless (opendir($dh, $dir)) {
        warn "can't opendir $dir: $!\n";
        return;
    }

    my @all = readdir($dh);
    closedir $dh;
    return @all;
}
145
# From the entry names in @files keep those ending in .mp2, .mp3 or .ogg
# (any case) that are plain files inside $dir; order is preserved.
sub extractmp3 {
    my ($dir, @files) = @_;

    my @mp3 = grep {
        (/\.mp[23]$/i || /\.ogg$/i) && -f "$dir/$_"
    } @files;

    return @mp3;
}
156
# From the entry names in @files keep those that are directories inside $dir,
# leaving out "." and ".."; order is preserved.
sub extractdirs {
    my ($dir, @files) = @_;
    $dir =~ s|/$||;

    my @dirs = grep {
        -d "$dir/$_" && ($_ !~ /^\.(|\.)$/)
    } @files;

    return @dirs;
}
168
# Collect the tags of one music file.
#
# .ogg files go through get_oggtag()/get_ogginfo(); everything else goes
# through get_mp3tag()/get_mp3info(), and for those the BITRATE and SECS
# values of the info hash are copied into the tag hash when defined.
# Returns the tag hash.
sub singlefile {
    my ($file) = @_;

    if ($file =~ /\.ogg$/i) {
        my $tags = get_oggtag($file);
        my $info = get_ogginfo($file);    # fetched, but nothing is taken from it
        return $tags;
    }

    my $tags = get_mp3tag($file);
    my $info = get_mp3info($file);

    for my $field ('BITRATE', 'SECS') {
        if (defined $$info{$field}) {
            $$tags{$field} = $$info{$field};
        }
    }

    return $tags;
}
192
# Scan one directory: record every music file in %entries (keyed by the
# stored path) with defaults filled in for missing tags, then recurse into
# each subdirectory.  The directory name is printed as progress output.
sub dodir {
    my ($dir)=@_;

    # First spelling seen (in this directory) of each artist / album name,
    # keyed by its lower-case form.
    my %lcartists;
    my %lcalbums;

    print "$dir\n";

    # getdir() returns all entries in the given dir
    my @a = getdir($dir);

    # extractmp3 filters out only the mp3 files from all given entries
    my @m = extractmp3($dir, @a);

    for my $f (sort @m) {

        # singlefile() may come back empty-handed for an unreadable file.
        my $id3 = singlefile("$dir/$f") || {};

        if (not defined $$id3{'ARTIST'} or $$id3{'ARTIST'} eq "") {
            $$id3{'ARTIST'} = "<Untagged>";
        }

        # Only use one case-variation of each artist
        if (exists($lcartists{lc($$id3{'ARTIST'})})) {
            $$id3{'ARTIST'} = $lcartists{lc($$id3{'ARTIST'})};
        }
        else {
            $lcartists{lc($$id3{'ARTIST'})} = $$id3{'ARTIST'};
        }

        if (not defined $$id3{'ALBUM'} or $$id3{'ALBUM'} eq "") {
            $$id3{'ALBUM'} = $dirisalbum ? $dir : "<Untagged>";
        }

        # Only use one case-variation of each album
        if (exists($lcalbums{lc($$id3{'ALBUM'})})) {
            $$id3{'ALBUM'} = $lcalbums{lc($$id3{'ALBUM'})};
        }
        else {
            $lcalbums{lc($$id3{'ALBUM'})} = $$id3{'ALBUM'};
        }

        if (not defined $$id3{'TITLE'} or $$id3{'TITLE'} eq "") {
            # fall back on basename of the file if no title tag.
            ($$id3{'TITLE'} = $f) =~ s/\.\w+$//;
        }

        # --strip names a literal string, so quote it before it goes into
        # the pattern; otherwise characters such as ( ) + [ in a path would
        # be read as regex syntax.
        my $path = "$dir/$f";
        if ($strip ne "" and $path =~ /^\Q$strip\E(.*)/s) {
            $path = $1;
        }

        if ($add ne "") {
            $path = $add . $path;
        }

        # Remaining fields get a fixed placeholder when missing or empty.
        my %placeholder = (
            'GENRE'    => "<Untagged>",
            'COMPOSER' => "<Untagged>",
            'YEAR'     => "-1",
            'TRACKNUM' => "-1",
            'BITRATE'  => "-1",
            'SECS'     => "-1",
        );
        for my $field (keys %placeholder) {
            if (not defined $$id3{$field} or $$id3{$field} eq "") {
                $$id3{$field} = $placeholder{$field};
            }
        }

        $$id3{'PATH'} = $path;
        $entries{$path} = $id3;
    }

    # extractdirs filters out only subdirectories from all given entries
    my @d = extractdirs($dir, @a);

    for my $d (sort @d) {
        $dir =~ s|/$||;
        dodir("$dir/$d");
    }
}
301
# Scan the music tree given with --path; dodir() fills %entries as it goes.
# use_mp3_utf8 is exported by mp3info and not defined in this script
# (presumably it switches tag output to UTF-8 -- confirm in mp3info.pm).
use_mp3_utf8(1);
dodir($dir);
print "\n";
305
# Write $num to the DB filehandle as a 16-bit integer, little-endian when
# $littleendian is set and big-endian otherwise.
sub dumpshort {
    my ($num) = @_;

    # print "int: $num\n";

    my $template = $littleendian ? "v" : "n";
    print DB pack($template, $num);
}
318
# Write $num to the DB filehandle as a 32-bit integer, little-endian when
# $littleendian is set and big-endian otherwise.
sub dumpint {
    my ($num) = @_;

    # print "int: $num\n";

    my $template = $littleendian ? "V" : "N";
    print DB pack($template, $num);
}
331
# Write one string record to DB: a 16-bit length, the 16-bit $index, the
# string with a terminating NUL, and enough "X" bytes to make the recorded
# length (string + NUL + padding) a multiple of four.
sub dump_tag_string {
    my ($s, $index) = @_;

    my $strlen  = length($s) + 1;          # the NUL counts
    my $padding = (4 - $strlen % 4) % 4;   # 0..3 filler bytes

    dumpshort($strlen + $padding);
    dumpshort($index);
    print DB $s . "\0" . ("X" x $padding);
}
350
# (Re)write the 12-byte header at the start of DB: the database version, the
# number of bytes that followed the header when this was called, and the
# entry count.  The size is taken from the current file position, so the
# call made after all records are written records the real data size.
sub dump_tag_header {
    my ($entry_count) = @_;

    my $data_size = tell(DB) - 12;
    seek(DB, 0, 0);

    for my $field ($dbver, $data_size, $entry_count) {
        dumpint($field);
    }
}
361
# Open $f for writing on the shared DB filehandle, in binary mode; dies when
# the file cannot be created.
sub openfile {
    my ($f) = @_;

    # Three-argument open: the name is taken literally, so whitespace or
    # mode characters in it cannot change what gets opened.
    open(DB, '>', $f) || die "couldn't open $f";
    binmode(DB);
}
367
# Write the tag file "<db>_<index>.tcd" for one tag.
#
#   $index  - number used in the file name
#   $key    - which field of each %entries record to write
#   $unique - true: each distinct string is written once, with 0xFFFF as its
#             index; false: one record per entry, carrying the entry's INDEX
#
# Every entry gets "<key>_OFFSET" set to the file position of the record
# holding its string.
sub create_tagcache_index_file {
    my ($index, $key, $unique) = @_;

    my $num = 0;
    my $prev = "";
    my $offset = 12;

    openfile($db ."_".$index.".tcd");
    dump_tag_header(0);

    # Case-insensitive order first.  The exact string breaks ties so equal
    # strings always sit next to each other (the duplicate check below only
    # compares with the previous one), and the path makes the order fully
    # repeatable from run to run.
    my @paths = sort {
           uc($entries{$a}->{$key}) cmp uc($entries{$b}->{$key})
        or $entries{$a}->{$key} cmp $entries{$b}->{$key}
        or $a cmp $b
    } keys %entries;

    for my $path (@paths) {
        my $value = $entries{$path}->{$key};

        if (!$unique || !($value eq $prev)) {
            $num++;
            $prev = $value;
            $offset = tell(DB);
            printf(" %s\n", $prev) if ($verbose);

            my $entry_index = $unique ? 0xFFFF : $entries{$path}->{'INDEX'};
            dump_tag_string($prev, $entry_index);
        }
        $entries{$path}->{$key."_OFFSET"} = $offset;
    }

    # Go back and fill in the real size and record count.
    dump_tag_header($num);
    close(DB);
}
401
# Nothing scanned: say so and stop.
unless (keys %entries) {
    print "No songs found. Did you specify the right --path ?\n";
    print "Use the --help parameter to see all options.\n";
    exit;
}

# Number the entries in path order.
my $i = 0;
$entries{$_}->{'INDEX'} = $i++ for sort keys %entries;

if ($db) {
    # One tag file per tag: [ file number, entry field, unique strings only ]
    my @tag_files = (
        [0, 'ARTIST',   1],    # Artists
        [1, 'ALBUM',    1],    # Albums
        [2, 'GENRE',    1],    # Genres
        [3, 'TITLE',    0],    # Titles
        [4, 'PATH',     0],    # Filenames
        [5, 'COMPOSER', 1],    # Composers
    );
    for my $spec (@tag_files) {
        create_tagcache_index_file(@{$spec});
    }

    # Master index file
    openfile($db ."_idx.tcd");
    dump_tag_header(0);

    # Per entry: the six string offsets, four numeric fields, and a zero.
    my @fields = qw(
        ARTIST_OFFSET ALBUM_OFFSET GENRE_OFFSET
        TITLE_OFFSET PATH_OFFSET COMPOSER_OFFSET
        YEAR TRACKNUM BITRATE SECS
    );
    for my $path (sort keys %entries) {
        my $entry = $entries{$path};
        for my $field (@fields) {
            dumpint($entry->{$field});
        }
        dumpint(0);
    }

    dump_tag_header(scalar keys %entries);
    close(DB);
}
diff --git a/tools/vorbiscomm.pm b/tools/vorbiscomm.pm
new file mode 100644
index 0000000000..f2e48e8632
--- /dev/null
+++ b/tools/vorbiscomm.pm
@@ -0,0 +1,732 @@
1#############################################################################
2# This is
3# http://search.cpan.org/~amolloy/Ogg-Vorbis-Header-PurePerl-0.07/PurePerl.pm
4# written by Andrew Molloy
5# Code under GNU GENERAL PUBLIC LICENCE v2
6# $Id$
7#############################################################################
8
9package vorbiscomm;
10
11use 5.005;
12use strict;
13use warnings;
14
15use Fcntl qw/SEEK_END/;
16
17our $VERSION = '0.07';
18
# Constructor. Delegates straight to load(), so the file is parsed as soon
# as the object is created.
#   $class - class name
#   $file  - path of the Ogg Vorbis file
# Returns whatever load() returns.
sub new
{
    my ($class, $file) = @_;

    return load($class, $file);
}
# Open an Ogg Vorbis file and parse its information and comment headers.
#
# May be called as a class method (creates a new object) or on an existing
# instance (fills that instance in; a no-op if it is already loaded).
#   $class - class name or existing object
#   $file  - path of the file to read
# Returns the object, or undef (after a warning) when the file is missing
# or cannot be opened.
sub load
{
    my ($class, $file) = @_;

    # Reuse the invocant when it is already an object, otherwise bless a
    # fresh hash into whatever class we were given (subclasses included).
    my $self = ref($class) ? $class : bless({}, $class);

    # An already loaded object is returned untouched.
    return $self if $self->{'FILE_LOADED'};

    # check that the file exists and is readable
    unless (defined $file && -e $file && -r _)
    {
        warn "File does not exist or cannot be read.";
        # file does not exist, can't do anything
        return undef;
    }

    # Lexical handle + three-argument open: no global FILE glob shared
    # between objects and no mode injection through the file name.
    my $fh;
    unless (open($fh, '<', $file))
    {
        warn "File does not exist or cannot be read.";
        return undef;
    }
    # make sure dos-type systems can handle it...
    binmode $fh;

    # Only mark the object as loaded once the file is really open, so a
    # failed attempt on an instance can be retried.
    $self->{'FILE_LOADED'} = 1;

    # The parsers write straight into the object, so the parsed data is
    # available whether load() was reached via the class or an instance.
    $self->{'filename'} = $file;
    $self->{'fileHandle'} = $fh;

    if (_init($self)) {
        _loadInfo($self);
        _loadComments($self);
        _calculateTrackLength($self);
    }

    close $fh;

    return $self;
}
77
# Accessor for the stream information header.
#   $key - optional field name (case-insensitive)
# Without a (true) key the whole INFO hash reference is returned; with a
# key, the value stored under its lower-cased form.
sub info
{
    my ($self, $key) = @_;

    # no key supplied: hand back the entire hash
    return $self->{'INFO'} unless $key;

    return $self->{'INFO'}{lc $key};
}
92
# Return the list of comment keys found in the file (lower-cased, in file
# order, one entry per comment).
#
# When no comments were loaded this returns an empty list in list context
# (undef in scalar context), so "foreach ($ogg->comment_tags)" simply does
# not iterate instead of looping once over undef.
sub comment_tags
{
    my $self = shift;

    if ( $self && $self->{'COMMENT_KEYS'} ) {
        return @{$self->{'COMMENT_KEYS'}};
    }

    # bare return: empty list / undef depending on context
    return;
}
103
# Return every value stored for one comment key.
#   $key - comment name (case-insensitive)
# Returns the list of values. If the key is unknown the result is an empty
# list in list context (undef in scalar context), so callers looping over
# the result do not see a spurious undef element.
sub comment
{
    my $self = shift;
    my $key = shift;

    # if the user supplied key does not exist, return nothing
    unless($self->{'COMMENTS'}{lc $key})
    {
        return;
    }

    return @{$self->{'COMMENTS'}{lc $key}};
}
117
# Placeholder: this module is read-only, so adding comments only emits a
# warning. Returns the result of warn().
sub add_comments
{
    return warn("Ogg::Vorbis::Header::PurePerl add_comments() unimplemented.");
}
122
# Placeholder: this module is read-only, so editing a comment only emits a
# warning. Returns the result of warn().
sub edit_comment
{
    return warn("Ogg::Vorbis::Header::PurePerl edit_comment() unimplemented.");
}
127
# Placeholder: this module is read-only, so deleting a comment only emits a
# warning. Returns the result of warn().
sub delete_comment
{
    return warn("Ogg::Vorbis::Header::PurePerl delete_comment() unimplemented.");
}
132
# Placeholder: this module is read-only, so clearing comments only emits a
# warning. Returns the result of warn().
sub clear_comments
{
    return warn("Ogg::Vorbis::Header::PurePerl clear_comments() unimplemented.");
}
137
# Return the path/filename of the file this object represents.
#
# load() records the name under the key 'filename'; the historical spelling
# 'fileName' is still consulted as a fallback for objects that were
# populated that way.
sub path
{
    my $self = shift;

    return defined $self->{'filename'}
        ? $self->{'filename'}
        : $self->{'fileName'};
}
144
# Placeholder: this module is read-only, so writing the file only emits a
# warning. Returns the result of warn().
sub write_vorbis
{
    return warn("Ogg::Vorbis::Header::PurePerl write_vorbis unimplemented.");
}
149
150# "private" methods
151
# Validate the start of the file and remember where the identification
# header's fields begin.
#   $data - hash ref holding at least 'fileHandle'
# Returns 1 on success, undef when _checkHeader() rejects the file.
sub _init
{
    my $data = shift;

    # _checkHeader() reports how many bytes it consumed, or a false value
    # if this is not an Ogg Vorbis file
    my $headerBytes = _checkHeader($data);

    # not a usable file, we can't do anything
    return undef unless $headerBytes;

    $data->{'startInfoHeader'} = $headerBytes;
    return 1; # Success
}
170
# Verify that the file handle is positioned at the start of an Ogg Vorbis
# stream and skip over the first page header plus the packet signature.
#   $data - hash ref holding 'fileHandle'
# Returns the number of bytes consumed (so later reads can skip right past
# the header), or undef after a warning if a check fails.
sub _checkHeader
{
    my $data = shift;
    my $fh = $data->{'fileHandle'};
    my $chunk;
    my $consumed = 0;

    # read the next $len bytes into $chunk and add them to the running total
    my $take = sub {
        my $len = shift;
        read($fh, $chunk, $len);
        $consumed += $len;
        return $chunk;
    };

    # the first four bytes must be the capture pattern 'OggS'
    if ($take->(4) ne 'OggS')
    {
        warn "This is not an Ogg bitstream (no OggS header).";
        return undef;
    }

    # stream structure version (1 byte, should be 0x00)
    if (ord($take->(1)) != 0x00)
    {
        warn "This is not an Ogg bitstream (invalid structure version).";
        return undef;
    }

    # header type flag. It is a bitfield, but the only value expected at
    # the beginning of a proper Ogg-Vorbis file is 0x02, so that is all we
    # test for; anything else is reported and then tolerated.
    if (ord($take->(1)) != 0x02)
    {
        warn "Invalid header type flag (trying to go ahead anyway).";
    }

    # skip to the page_segments count; these 20 bytes are not used
    $take->(20);

    # number of page segments, followed by that many bytes we throw out
    my $segments = ord($take->(1));
    $take->($segments);

    # packet type, should be 0x01 (identification header)
    if (ord($take->(1)) != 0x01)
    {
        warn "Wrong vorbis header type, giving up.";
        return undef;
    }

    # the packet must identify itself as 'vorbis'
    if ($take->(6) ne 'vorbis')
    {
        warn "This does not appear to be a vorbis stream, giving up.";
        return undef;
    }

    # at this point, we assume the bitstream is valid
    return $consumed;
}
247
# Parse the fields of the Vorbis identification header.
#   $data - hash ref holding 'fileHandle' and 'startInfoHeader' (the byte
#           offset recorded by _init)
# Stores the decoded fields as a hash ref under $data->{'INFO'} and the
# offset of the byte following the header under
# $data->{'startCommentHeader'}.
sub _loadInfo
{
    my $data = shift;
    my $start = $data->{'startInfoHeader'};
    my $fh = $data->{'fileHandle'};
    my $buffer;
    my $byteCount = $start;
    my %info;

    seek $fh, $start, 0;

    # read the vorbis version
    read($fh, $buffer, 4);
    $info{'version'} = _decodeInt($buffer);
    $byteCount += 4;

    # read the number of audio channels
    read($fh, $buffer, 1);
    $info{'channels'} = ord($buffer);
    $byteCount += 1;

    # read the sample rate
    read($fh, $buffer, 4);
    $info{'rate'} = _decodeInt($buffer);
    $byteCount += 4;

    # read the bitrate maximum
    read($fh, $buffer, 4);
    $info{'bitrate_upper'} = _decodeInt($buffer);
    $byteCount += 4;

    # read the bitrate nominal
    read($fh, $buffer, 4);
    $info{'bitrate_nominal'} = _decodeInt($buffer);
    $byteCount += 4;

    # read the bitrate minimal
    read($fh, $buffer, 4);
    $info{'bitrate_lower'} = _decodeInt($buffer);
    $byteCount += 4;

    # read the blocksize_0 and blocksize_1
    read($fh, $buffer, 1);
    # These are two 4 bit fields packed in one byte; the actual value is
    # 2 to the power of the field. Vorbis packs bits least-significant
    # first, so blocksize_0 is the low nibble and blocksize_1 the high one.
    my $exponents = ord($buffer);
    $info{'blocksize_0'} = 1 << ($exponents & 0x0F);
    $info{'blocksize_1'} = 1 << (($exponents & 0xF0) >> 4);
    $byteCount += 1;

    # read the framing_flag
    read($fh, $buffer, 1);
    $info{'framing_flag'} = ord($buffer);
    $byteCount += 1;

    # bitrate_window is -1 in the current version of vorbisfile
    $info{'bitrate_window'} = -1;

    $data->{'startCommentHeader'} = $byteCount;

    $data->{'INFO'} = \%info;
}
309
# Parse the Vorbis comment header and locate the first audio page.
#   $data - hash ref holding 'fileHandle' and 'startCommentHeader'
# Stores:
#   $data->{'COMMENTS'}            hash ref: lower-cased key => array ref of
#                                  values, plus the plain string 'vendor'
#   $data->{'COMMENT_KEYS'}        array ref of lower-cased keys, one per
#                                  comment, in file order
#   $data->{'INFO'}{'offset'}      byte offset just past the comment header
#   $data->{'INFO'}{'audio_offset'} byte offset of the first audio page found
# Returns undef early (after a warning) when the comment page is missing.
sub _loadComments
{
    my $data = shift;
    my $fh = $data->{'fileHandle'};
    my $start = $data->{'startCommentHeader'};
    my $buffer;
    my $page_segments;
    my $vendor_length;
    my $user_comment_count;
    my $byteCount = $start;
    my %comments;

    seek $fh, $start, 0;

    # check that the first four bytes are 'OggS'
    read($fh, $buffer, 4);
    if ($buffer ne 'OggS')
    {
        warn "No comment header?";
        return undef;
    }
    $byteCount += 4;

    # skip over next ten bytes
    read($fh, $buffer, 10);
    $byteCount += 10;

    # read the stream serial number
    read($fh, $buffer, 4);
    push @{$data->{'commentSerialNumber'}}, _decodeInt($buffer);
    $byteCount += 4;

    # read the page sequence number (should be 0x01)
    read($fh, $buffer, 4);
    if (_decodeInt($buffer) != 0x01)
    {
        # string concatenation, not numeric '+', so the text survives
        warn "Comment header page sequence number is not 0x01: " .
            _decodeInt($buffer);
        warn "Going to keep going anyway.";
    }
    $byteCount += 4;

    # and ignore the page checksum for now
    read($fh, $buffer, 4);
    $byteCount += 4;

    # get the number of entries in the segment_table...
    read($fh, $buffer, 1);
    $page_segments = _decodeInt($buffer);
    $byteCount += 1;
    # then skip on past it
    read($fh, $buffer, $page_segments);
    $byteCount += $page_segments;

    # check the header type (should be 0x03)
    read($fh, $buffer, 1);
    if (ord($buffer) != 0x03)
    {
        warn "Wrong header type: " . ord($buffer);
    }
    $byteCount += 1;

    # now we should see 'vorbis'
    read($fh, $buffer, 6);
    if ($buffer ne 'vorbis')
    {
        warn "Missing comment header. Should have found 'vorbis', found " .
            $buffer;
    }
    $byteCount += 6;

    # get the vendor length
    read($fh, $buffer, 4);
    $vendor_length = _decodeInt($buffer);
    $byteCount += 4;

    # read in the vendor
    read($fh, $buffer, $vendor_length);
    $comments{'vendor'} = $buffer;
    $byteCount += $vendor_length;

    # read in the number of user comments
    read($fh, $buffer, 4);
    $user_comment_count = _decodeInt($buffer);
    $byteCount += 4;

    $data->{'COMMENT_KEYS'} = [];

    # finally, read the comments
    for (my $i = 0; $i < $user_comment_count; $i++)
    {
        # first read the length; stop if the file ends early so a corrupt
        # comment count cannot keep us looping at end of file
        my $got = read($fh, $buffer, 4);
        last unless $got && $got == 4;
        my $comment_length = _decodeInt($buffer);
        $byteCount += 4;

        # then the comment itself
        read($fh, $buffer, $comment_length);
        $byteCount += $comment_length;

        # "KEY=value": split on the first '=' only, so values may contain
        # further '=' characters as well as newlines
        my ($key, $value) = split /=/, $buffer, 2;

        push @{$comments{lc $key}}, $value;
        push @{$data->{'COMMENT_KEYS'}}, lc $key;
    }

    # read past the framing_bit
    read($fh, $buffer, 1);
    $byteCount += 1;

    $data->{'INFO'}{'offset'} = $byteCount;

    $data->{'COMMENTS'} = \%comments;

    # Now find the offset of the first page
    # with audio data.
    while(_findPage($fh))
    {
        # _findPage leaves us just past the 4 byte 'OggS' marker
        $byteCount = tell($fh) - 4;

        # version flag
        read($fh, $buffer, 1);
        if (ord($buffer) != 0x00)
        {
            warn "Invalid stream structure version: " .
                sprintf("%x", ord($buffer));
            return;
        }

        # header type flag
        read($fh, $buffer, 1);
        # Audio data starts as a fresh packet on a new page, so
        # if header_type is odd it's not a fresh packet
        next if ( ord($buffer) % 2 );

        # skip past granule position, stream_serial_number,
        # page_sequence_number, and crc
        read($fh, $buffer, 20);

        # page_segments
        read($fh, $buffer, 1);
        my $page_segments = ord($buffer);

        # skip past the segment table
        read($fh, $buffer, $page_segments);

        # read packet_type byte
        read($fh, $buffer, 1);

        # Not an audio packet. All audio packet numbers are even
        next if ( ord($buffer) % 2 );

        # Found the first audio packet
        last;
    }

    $data->{'INFO'}{'audio_offset'} = $byteCount;
}
469
# Work out the track length in whole seconds from the granule position of
# the last Ogg page in the file.
#   $data - hash ref holding 'fileHandle' and $data->{'INFO'}{'rate'}
# Stores the result under $data->{'INFO'}{'length'}. When no usable page or
# sample rate is available the length is stored as 0 after a warning.
sub _calculateTrackLength
{
    my $data = shift;
    my $fh = $data->{'fileHandle'};
    my $buffer;
    my $pageSize;
    my $granule_position;

    # that magic number is from vorbisfile.c in the constant CHUNKSIZE,
    # which comes with the comment /* a shade over 8k; anyone using pages
    # well over 8k gets what they deserve */
    unless (seek($fh, -8500, SEEK_END))
    {
        # the file is shorter than the chunk: scan it from the beginning
        seek($fh, 0, 0);
    }

    # we just keep looking through the headers until we get to the last one
    # (there might be a couple of blocks here)
    while(_findPage($fh))
    {
        # stream structure version - must be 0x00
        read($fh, $buffer, 1);
        if (ord($buffer) != 0x00)
        {
            warn "Invalid stream structure version: " .
                sprintf("%x", ord($buffer));
            return;
        }

        # header type flag
        read($fh, $buffer, 1);
        # we should check this, but for now we'll just ignore it

        # absolute granule position - this is what we need!
        read($fh, $buffer, 8);
        # an all-ones granule (-1) marks a page on which no packet ends;
        # it carries no position, so keep the one from the previous page
        if ($buffer ne ("\xFF" x 8))
        {
            $granule_position = _decodeInt($buffer);
        }

        # skip past stream_serial_number, page_sequence_number, and crc
        read($fh, $buffer, 12);

        # page_segments
        read($fh, $buffer, 1);
        my $page_segments = ord($buffer);

        # reset pageSize
        $pageSize = 0;

        # calculate approx. page size
        for (my $i = 0; $i < $page_segments; $i++)
        {
            read($fh, $buffer, 1);
            $pageSize += ord($buffer);
        }

        # jump over the page body to the next page header
        seek $fh, $pageSize, 1;
    }

    my $rate = $data->{'INFO'}{'rate'};

    # no page found or no sample rate: avoid the undefined-value warning
    # and the division by zero, and report a zero length instead
    unless (defined $granule_position && $rate)
    {
        warn "Unable to determine track length.";
        $data->{'INFO'}{'length'} = 0;
        return;
    }

    $data->{'INFO'}{'length'} = int($granule_position / $rate);
}
528
# Search forward in the file for the next 'OggS' page marker.
#   $fh - file handle to read from, one byte at a time
# Returns 1 with the handle positioned just after the marker, or undef if
# the end of the file is reached first.
sub _findPage
{
    my $fh = shift;
    my $byte;
    my $window = '';

    while (read($fh, $byte, 1))
    {
        # keep a sliding window of the last four bytes seen
        $window .= $byte;
        $window = substr($window, 1) if length($window) > 4;

        return 1 if $window eq 'OggS';
    }

    return undef;
}
552
# Decode a little-endian unsigned integer of any byte length.
#   $bytes - raw byte string, least significant byte first
# Returns the numeric value (0 for an empty string).
sub _decodeInt
{
    my $bytes = shift;
    my $value = 0;
    my $weight = 1;

    # each successive byte is worth 256 times the previous one
    foreach my $octet (split //, $bytes)
    {
        $value += ord($octet) * $weight;
        $weight *= 256;
    }

    return $value;
}
569
# Extract the top five bits of a byte.
#   argument - one-character string
# Returns a value in 0..31: the bottom 3 bits are masked off and the rest
# shifted down to where it belongs.
sub _decodeInt5Bit
{
    my $char = shift;

    return (ord($char) & 0xF8) >> 3;
}
579
# Extract the top four bits (high nibble) of a byte.
#   argument - one-character string
# Returns a value in 0..15.
sub _decodeInt4Bit
{
    my $char = shift;

    # Mask off the bottom 4 bits, then shift the nibble down. (Any low
    # bits left by a looser mask would be discarded by the shift anyway.)
    return (ord($char) & 0xF0) >> 4;
}
589
# Count how many right shifts it takes to reduce a value to zero, i.e. the
# number of bits needed to represent a positive integer.
#   argument - number to measure
# Returns 0 for anything that is not greater than zero.
sub _ilog
{
    my $value = shift;
    my $bits = 0;

    # the loop body never runs for zero or negative input
    for (; $value > 0; $value = $value >> 1)
    {
        $bits++;
    }

    return $bits;
}
608
6091;
610__DATA__
611
612=head1 NAME
613
614Ogg::Vorbis::Header::PurePerl - An object-oriented interface to Ogg Vorbis
615information and comment fields, implemented entirely in Perl. Intended to be
616a drop in replacement for Ogg::Vorbis::Header.
617
618Unlike Ogg::Vorbis::Header, this module will go ahead and fill in all of the
619information fields as soon as you construct the object. In other words,
620the C<new> and C<load> constructors have identical behavior.
621
622=head1 SYNOPSIS
623
624 use Ogg::Vorbis::Header::PurePerl;
625 my $ogg = Ogg::Vorbis::Header::PurePerl->new("song.ogg");
626 while (my ($k, $v) = each %{$ogg->info}) {
627 print "$k: $v\n";
628 }
629 foreach my $com ($ogg->comment_tags) {
630 print "$com: $_\n" foreach $ogg->comment($com);
631 }
632
633=head1 DESCRIPTION
634
635This module is intended to be a drop in replacement for Ogg::Vorbis::Header,
636implemented entirely in Perl. It provides an object-oriented interface to
637Ogg Vorbis information and comment fields. (NOTE: This module currently
638supports only read operations).
639
640=head1 CONSTRUCTORS
641
642=head2 C<new ($filename)>
643
644Opens an Ogg Vorbis file, ensuring that it exists and is actually an
645Ogg Vorbis stream, then loads the information and comment fields and
646closes the file. In this module C<new> behaves identically to C<load>.
647
648=head2 C<load ([$filename])>
649
650Opens an Ogg Vorbis file, ensuring that it exists and is actually an
651Ogg Vorbis stream, then loads the information and comment fields. This
652method can also be used without a filename to load the information
653and fields of an already constructed instance.
654
655=head1 INSTANCE METHODS
656
657=head2 C<info ([$key])>
658
659Returns a hashref containing information about the Ogg Vorbis file from
660the file's information header. Hash fields are: version, channels, rate,
661bitrate_upper, bitrate_nominal, bitrate_lower, bitrate_window, and length.
662The bitrate_window value is not currently used by the vorbis codec, and
663will always be -1.
664
665The optional parameter, key, allows you to retrieve a single value from
666the object's hash. Returns C<undef> if the key is not found.
667
668=head2 C<comment_tags ()>
669
670Returns an array containing the key values for the comment fields.
671These values can then be passed to C<comment> to retrieve their values.
672
673=head2 C<comment ($key)>
674
675Returns an array of comment values associated with the given key.
676
677=head2 C<add_comments ($key, $value, [$key, $value, ...])>
678
679Unimplemented.
680
681=head2 C<edit_comment ($key, $value, [$num])>
682
683Unimplemented.
684
685=head2 C<delete_comment ($key, [$num])>
686
687Unimplemented.
688
689=head2 C<clear_comments ([@keys])>
690
691Unimplemented.
692
693=head2 C<write_vorbis ()>
694
695Unimplemented.
696
697=head2 C<path ()>
698
699Returns the path/filename of the file the object represents.
700
701=head1 NOTE
702
703This is ALPHA SOFTWARE. It may very well be very broken. Do not use it in
704a production environment. You have been warned.
705
706=head1 ACKNOWLEDGEMENTS
707
708Dave Brown <cpan@dagbrown.com> made this module significantly faster
709at calculating the length of ogg files.
710
711Robert Moser II <rlmoser@earthlink.net> fixed a problem with files that
712have no comments.
713
714=head1 AUTHOR
715
716Andrew Molloy E<lt>amolloy@kaizolabs.comE<gt>
717
718=head1 COPYRIGHT
719
720Copyright (c) 2003, Andrew Molloy. All Rights Reserved.
721
722This program is free software; you can redistribute it and/or modify it
723under the terms of the GNU General Public License as published by the
724Free Software Foundation; either version 2 of the License, or (at
725your option) any later version. A copy of this license is included
726with this module (LICENSE.GPL).
727
728=head1 SEE ALSO
729
730L<Ogg::Vorbis::Header>, L<Ogg::Vorbis::Decoder>
731
732=cut