4 # Copyright (C) 2003 Rainer Typke
5 # Copyright (C) 2010 Reinhold Kainhofer <reinhold@kainhofer.com>
6 #pae2xml is licensed under the terms of the GNU General Public License Version
7 #2 as published by the <a href="http://www.fsf.org/" target="_top">Free Software Foundation</a>.
8 #This gives you legal permission to copy, distribute and/or modify <em>pae2xml</em> under
9 #certain conditions. Read
10 #the <a href="http://www.gnu.org/copyleft/gpl.html" target="_top">online version of the license</a>
11 #for more details. pae2xml is provided AS IS with NO WARRANTY OF ANY KIND,
12 #INCLUDING THE WARRANTY OF DESIGN, MERCHANTABILITY, AND FITNESS FOR A PARTICULAR PURPOSE.
# Name of this script; it is interpolated into the version banner printed below.
14 our $script = "pae2xml.pl";
17 ### Handle command-line options
26 print 'pae2xml.pl [OPTIONS...] FILE
28 Converts the Plaine & Easie file FILE to MusicXML. If FILE is -, STDIN is used.
31 -h, --help Prints out this help message
32 --format=FORMAT, -f FORMAT
33 Interprets input file as FORMAT. Possible values are
34 rism, pae (default: rism)
35 -v, -- version Prints out version information
39 print "$script $version
40 Copyright (C) 2003 Rainer Typke
41 Copyright (C) 2010 Reinhold Kainhofer <reinhold\@kainhofer.com>
46 my $print_version = 0;
# Option table: -f/--format takes a value, -h/--help and -v/--version set flags.
47 my $result = GetOptions
("f|format=s" => \
$format, "help|h" => \
$print_help, "version|v" => \
$print_version);
# Condition: help was requested, or no FILE argument is left after option parsing.
52 if ($print_help || (@ARGV == 0)) {
# Seed for notes without an explicit duration: duration() returns $old_duration
# unchanged when it is called with neither a duration digit nor dots.
62 $old_duration = $divisions;
# Today's date as YYYY-MM-DD; it is written into the <encoding-date> element.
65 ($mday, $mon, $year) = (localtime()) [3..5];
66 $encoding_date = sprintf("%4d-%02d-%02d", $year + 1900, $mon+1, $mday);
# RISM format: first unwrap "== text ==" decorations, then drop the leading
# "included ... -----" section together with the whitespace around it.
73 if ($format eq "rism") {
74 $p =~ s/\s*\=\=+\s*(.*?)\s*\=\=+\s*/$1/sg;
75 $p =~ s/\s*included.*?-------------*\s*(.*?)\s*/$1/s;
78 if ($q !~ /^.*1\.1\.1.*$/gsx && $r =~ /^.*plain.*$/gsx) {
79 print_error
("$a contains 'plain', but not 1.1.1!\n");
# A record consists of: first line (composer), title text, one or more numbered
# incipit lines containing "plain", free text, and two trailing lines
# (library signature and RISM signature).
81 if ($p =~ /^\s*([^\n]+)\n(.*?)\n((\d+\.\d+\.\d.*?plain.*?\n)+)(.*?)\n?([^\n]+)\n([^\n]+)\s*$/gs) {
82 my ($comp, $title, $incipits, $sonst, $libsig, $rismsig) = ($1, $2, $3, $5, $6, $7);
90 RISM SIGN.: $rismsig\n\n";
91 parse_rism_incipits
($incipits, $comp, $title, $sonst, $libsig, $rismsig);
# Text that mentions plain&easy here is reported to the user as ignored.
94 if (index($p,"plain&easy") > -1) {
95 print_error
("Ignoring the following text:\n\n\n$p\n\n\n");
100 # Just a plaine & easie snippet, without any further RISM fields
# Output name: either the fixed "out.xml" or the input name with a trailing
# ".pae" replaced by ".xml".
102 $filename = "out.xml";
104 $filename = basename
($a, ".pae") . ".xml";
# No RISM metadata exists in this mode, so every descriptive field is passed empty.
106 parse_pe
($filename, $p, "", "", "", "", "", "", "");
111 ##############################################################################
112 ### RISM file parsing
113 ##############################################################################
# parse_rism_incipits($incipits, $comp, $title, $sonst, $libsig, $rismsig)
#
# Takes the block of numbered incipits ("n.n.n ...") from one RISM record and
# passes incipits to parse_rism_incipit together with the record's shared
# metadata (composer, title, free text, library signature, RISM signature).
115 sub parse_rism_incipits
{
116 my ($incipits, $comp, $title, $sonst, $libsig, $rismsig) = @_;
# $toprint collects context that print_error shows when something goes wrong.
118 $toprint .= "parsing: $incipits\n";
# While a second "n.n." number follows, $1 is the leading incipit and $2 the rest.
# NOTE(review): presumably $inc1 receives $1 and $incipits is shortened to $2 on
# each pass - confirm against the loop body.
120 while ($incipits =~ /^(\d+\.\d+\..+?)(\d+\.\d+\..*)$/gs) {
123 parse_rism_incipit
($inc1, $comp, $title, $sonst, $libsig, $rismsig);
# Handles whatever $incipits still holds at this point.
125 parse_rism_incipit
($incipits, $comp, $title, $sonst, $libsig, $rismsig);
# parse_rism_incipit($pe, $comp, $title, $sonst, $libsig, $rismsig)
#
# Handles a single numbered incipit: extracts its number, instrument text and
# Plaine & Easie code, derives an output file name and calls parse_pe.
# Input that does not match the expected layout is reported via print_error.
128 sub parse_rism_incipit
{
129 my ($pe, $comp, $title, $sonst, $libsig, $rismsig) = @_;
# Expected layout: "<n.n.n>" followed by "." or ":", the instrument text, a
# newline, and then "plain&easy:" followed by the code itself.
131 if ($pe =~ /^\s*(\d+\.\d+\.\d)(\.|:)\s*(.*?)\nplain&easy:\s*(.*)$/gs) {
132 my ($inr, $instr, $pecode) = ($1, $3, $4);
# File name is "<RISM signature>-<incipit number>.xml" with any "RISM A/II:" text removed.
134 my $filename="$rismsig-$inr.xml";
135 $filename =~ s/RISM\s*A\/II\s*:?\s*//gs
;
# NOTE(review): each metadata field is visited through $_ here, presumably to
# make it safe for embedding in XML - confirm against the loop body.
137 foreach $_ ($rismsig,$title,$inr,$instr,$comp,$libsig,$sonst)
145 parse_pe
($filename, $pecode, $inr, $instr, $comp, $title, $sonst, $libsig, $rismsig);
148 print_error
("could not parse $pe\n");
153 ##############################################################################
154 ### pure Plaine & Easie data parsing
155 ##############################################################################
# Arguments: output file name, Plaine & Easie code, incipit number, instrument,
# composer, title, free-text field, library signature, RISM signature.
# The code below writes a MusicXML score-partwise document to $filename through
# the OUT handle and hands the note data to parse_notes.
158 my ($filename, $pe, $inr, $instr, $comp, $title, $sonst, $libsig, $rismsig) = @_;
160 $pe =~ s/@ü/@0ü/gs; # make missing time signature explicit
161 while ($pe =~ s/([^\-])(\d+)(\'|\,)(A|B|C|D|E|F|G)/$1$3$2$4/gs) {}; # octave first, then duration. Truly global.
# Header layout: optional clef (%...), optional time signature (@...), optional
# key signature ($...), then the separator character followed by the note data.
163 if ($pe =~ /\s*(%([\w\-\+\d]+))?(@([\d\w\/]+))?\s
*&?\s
*(\
$([^ü
]+))?ü
(.*)$/gs
) {
164 my ($clef, $timesig, $keysig, $rest) = ($2, $4, $6, $7);
166 print "Writing $filename...\n";
# NOTE(review): two-argument open on a bareword handle whose result is not
# checked in this statement - a failed open would go unnoticed here.
167 open(OUT
, ">$filename");
# Key-signature spelling ("x" + sharpened pitches, "b" + flattened pitches)
# mapped to the signed count that is written into <fifths>.
169 my %fif=("", 0, "xF", 1, "xFC", 2, "xFCG",3, "xFCGD",4, "xFCGDA",5, "xFCGDAE",6, "xFCGDAEB",7, "bB",-1, "bBE",-2, "bBEA",-3, "bBEAD",-4, "bBEADG",-5, "bBEADGC",-6, "bBEADGCF",-7);
170 $keysig =~ s/(\s+)|&//gs; # it is unclear what the & means, so we'll ignore it for now.
171 $keysig =~ s/\[|\]//gs; # IGNORING brackets around a key sig.
172 $fifths = $fif{$keysig};
175 print_error
("Strange key signature '$keysig'.\n");
# XML prolog and the MusicXML 2.0 partwise DOCTYPE.
178 print OUT
'<?xml version="1.0" encoding="iso-8859-1" standalone="no"?>
179 <!DOCTYPE score-partwise PUBLIC "-//Recordare//DTD MusicXML 2.0 Partwise//EN" "http://www.musicxml.org/dtds/partwise.dtd">
182 print OUT
" <work>\n" if ($rismsig || $title);
183 print OUT
" <work-number>$rismsig</work-number>\n" if ($rismsig);
184 print OUT
" <work-title>$title</work-title>\n" if ($title);
185 print OUT
" </work>\n" if ($rismsig || $title);
# Movement number/title carry the incipit number and the instrument text.
186 print OUT
" <movement-number>$inr</movement-number>\n" if ($inr);
187 print OUT
" <movement-title>$instr</movement-title>\n" if ($instr);
# <identification>: composer, encoding information and the source library.
188 print OUT
" <identification>\n";
189 print OUT
" <creator type=\"composer\">$comp</creator>\n" if ($comp);
190 print OUT
' <encoding>
191 <software>pae2xml by R. Typke</software>
192 <encoding-date>'.$encoding_date.'</encoding-date>
195 print OUT
" <source>$libsig</source>\n" if ($libsig);
196 print OUT
' </identification>
199 <part-name>'.$sonst.'</part-name>
205 <divisions>'.$divisions.'</divisions>
207 <fifths>'.$fifths.'</fifths>
209 '.timesignature
($timesig)
# The remaining note data is converted by parse_notes, which prints to OUT itself.
220 parse_notes
($rest, $keysig);
222 else { print_error
("could not parse $pe\n"); }
224 </score-partwise>\n";
228 # Repeat $1 by a count of $2
# Arguments: the text to repeat ($e) and the number of repetitions ($count).
# parse_notes calls this from its "!...!f" substitution with
# count = number of "f" marks + 1.
230 (my $e, my $count) = @_;
# Runs $count times, with $i going from 1 to $count.
232 for (my $i=1; $i <= $count; ++$i)
# Arguments: the note data of one incipit ($notes) and its key signature string
# ($keysig, passed through to parse_note). The code first normalises the
# notation with a series of substitutions and then consumes $notes token by
# token, printing the matching MusicXML to OUT.
240 my ($notes, $keysig) = @_;
241 my $qq = 0; # in group of cue notes
243 my $meas = 2; # measure number
244 my $mopen = 1; # measure tag still open
# Captures the note data without leading and trailing whitespace.
246 if ($notes =~ /^\s*(.*?)\s*$/) {
250 $notes =~ s/!([^!]*)!(f*)/repeat($1, length($2)+1)/gse; # write out repetitions
251 $notes =~ s/\{([^\}]*)\}/$1/gs; # ignore beamings
252 while ( $notes =~ s/(:?\/+:?|^)([^\/:]*)(:?\
/+:?)i(:?\/+:?
)/$1$2$3$2$4/gs) {}; # replace whole-measure repeats (i notation)
# Reordering passes: bring durations and accidentals into a fixed position so
# that the token patterns in the loop below can match them.
254 $notes =~ s/(\d+)\(([^;]+\))/\($1$2/gs; # pull note lengths into fermatas or triplets
255 $notes =~ s/(xx|x|bb|b|n)\(/\($1/gs; # pull accidentals into tuplets or fermatas:
256 $notes =~ s/(\d+)(xx|x|bb|b|n)(A|B|C|D|E|F|G)/$2$1$3/gs; # accidentals first, then duration
258 # $notes =~ s/x\(/\(x/gs; # pull accidentals into tuplets or fermatas
259 # $notes =~ s/bb\(/\(bb/gs; # pull accidentals into tuplets or fermatas
260 # $notes =~ s/b\(/\(b/gs; # pull accidentals into tuplets or fermatas
261 # $notes =~ s/n\(/\(n/gs; # pull accidentals into tuplets or fermatas
262 # $notes =~ s/(\'+|\,+)\(/\($1/g; # pull octave marks into tuplets or fermatas
264 $notes =~ s/(\.|\d|\,|\')qq/qq$1/gs; # pull beginning mark of group of grace notes in front of corresponding notes
265 $notes =~ s/(xx|x|bb|b|n)qq/qq$1/gs; # qq first, then parts of notes
# Tokenizer loop: each branch matches one construct at the start of $notes and
# continues with the unmatched remainder until nothing is left.
267 while ($notes ne "") {
268 if ($notes =~ /^(\'+|\,+)(.*)$/) { # Octave marks
269 ($oct, $notes) = ($1, $2);
271 } elsif ($notes =~ /^qq(.*)$/) { # Begin grace
274 } elsif ($notes =~ /^r(.*)$/) { # End grace
277 } elsif ($notes =~ /^\=(\d*)(\/.*)$/) { # multi-measure rests
280 if ($measrest eq '') {
283 $toprint .= "$measrest measures of rest.\n";
285 # Create a real multi-bar rest
286 print OUT
' <attributes>
288 <multiple-rest>'.$measrest.'</multiple-rest>
293 # Now create the measures
294 for $n (1..$measrest) {
297 <duration>'.($beats*$divisions*4/$beattype).'</duration
>
300 if ($n < $measrest) {
301 print OUT " </measure>\n";
303 print OUT ' <measure number
="'.$meas.'">
311 } elsif ($notes =~ /^((\,|\')*(x|xx|b|bb|n)?\d*\.*(g|q)?(\-|A|B|C|D|E|F|G)t?\+?)(.*)$/) { # a note
312 ($note, $notes) = ($1,$6);
313 parse_note($note, $keysig, "", "", $qq);
314 } elsif ($notes =~ /^(\((\,|\')*(x|xx|b|bb|n)?\d*\.*(g|q)?(\-|A|B|C|D|E|F|G)t?\+?\))(.*)$/) { # one note with a fermata
315 ($note, $notes) = ($1,$6);
316 parse_note($note, $keysig, "", "", $qq);
317 } elsif ($notes =~ /^(\(((\,|\')*(x|xx|b|bb|n)?\d*\.*(g|q)?(\-|A|B|C|D|E|F|G)t?\+?){3}\))(.*)$/) { # a triplet
318 ($triplet, $notes) = ($1,$7);
319 # print "TRIPLET: ".$triplet." -> ";
320 $triplet =~ /^\(((\,|\')*(x|xx|b|bb|n)?\d*\.*(g|q)?(\-|A|B|C|D|E|F|G)t?\+?)(.*)\)$/gs;
321 ($note, $triplet) = ($1,$6);
322 #print "$note $triplet\n";
323 parse_note($note, $keysig, '<tuplet type
="start"/>', ' <time-modification
>
324 <actual
-notes
>3</actual
-notes
>
325 <normal
-notes
>2</normal
-notes
>
326 </time-modification
>', $qq);
327 $triplet =~ /^((\,|\')*(x|xx|b|bb|n)?\d*\.*(g|q)?(\-|A|B|C|D|E|F|G)t?\+?)(.*)$/gs;
328 ($note, $triplet) = ($1,$6);
329 #print "$note $triplet\n";
330 parse_note($note, $keysig, '', ' <time-modification
>
331 <actual
-notes
>3</actual
-notes
>
332 <normal
-notes
>2</normal
-notes
>
333 </time-modification
>', $qq);
334 parse_note($triplet, $keysig, '<tuplet type
="stop"/>', ' <time-modification
>
335 <actual
-notes
>3</actual
-notes
>
336 <normal
-notes
>2</normal
-notes
>
337 </time-modification
>', $qq);
338 } elsif ($notes =~ /^((\d+)\(((\,|\')*(x|xx|b|bb|n)?\d*\.*(g|q)?(\-|A|B|C|D|E|F|G)t?\+?)+\;(\d+)\))(.*)$/) { # an n-tuplet
339 ($tuplet, $notes) = ($1,$9);
340 # print "N-TUPLET: ".$tuplet." -> ";
341 $tuplet =~ /^(\d+)\(((\,|\')*(x|xx|b|bb|n)?\d*\.*(g|q)?(\-|A|B|C|D|E|F|G)t?\+?)(.*);(\d)\)$/gs;
342 ($combdur, $note, $tuplet, $numval) = ($1,$2,$7,$8);
343 #print "i=$combdur, n=$numval; $note / $tuplet\n";
# Length of one tuplet member: the combined duration divided by the note count.
344 my $ind_dur = duration($combdur)/$numval;
346 my $act_notes = $numval;
347 parse_note($note, $keysig, '<tuplet type
="start"/>', ' <time-modification
>
348 <actual
-notes
>'.$act_notes.'</actual
-notes
>
349 <normal
-notes
>1</normal
-notes
>
350 </time-modification
>', $qq);
351 while ($tuplet =~ /^((\,|\')*(x|xx|b|bb|n)?\d*\.*(g|q)?(\-|A|B|C|D|E|F|G)t?\+?)(.+)$/gs) {
352 ($note, $tuplet) = ($1,$6);
353 #print "$note / $tuplet\n";
354 parse_note($note, $keysig, '', ' <time-modification
>
355 <actual
-notes
>'.$act_notes.'</actual
-notes
>
356 <normal
-notes
>1</normal
-notes
>
357 </time-modification
>', $qq);
359 parse_note($tuplet, $keysig, '<tuplet type
="stop"/>', ' <time-modification
>
360 <actual
-notes
>'.$act_notes.'</actual
-notes
>
361 <normal
-notes
>1</normal
-notes
>
362 </time-modification
>', $qq);
363 } elsif ($notes =~ /^(%(\w(-|\+)\d))(.*)$/) { # Clef change
364 ($clef,$notes) = ($2,$4);
365 $clef = clef ($clef);
366 print OUT " <attributes>\n";
368 print OUT " </attributes>\n";
369 } elsif ($notes =~ /^@(\d\/\d|c\/?)\s*(.*)$/) { # time signature change
371 ($timesig,$notes) = ($1,$2);
372 #print "-> $timesig / $notes\n"; exit;
373 $timesig = timesignature($timesig);
374 print OUT " <attributes>\n$timesig
376 } elsif ($notes =~ /^(:?\/+:?)(.*)$/) { # Barline (and repeats)
# Right-hand barline of the measure being closed, chosen by the barline token.
379 if ($barline =~ /^:\/\/:/) {
380 print OUT ' <barline location
="right">
381 <bar
-style
>light
-light
</bar
-style
>
382 <repeat direction
="backward"/>
385 } elsif ($barline =~ /^:\/\/$/ ) {
386 print OUT ' <barline location
="right">
387 <bar
-style
>light
-heavy
</bar
-style
>
388 <repeat direction
="backward"/>
391 } elsif ($barline =~ /^\/\/$/) {
392 print OUT ' <barline location
="right">
393 <bar
-style
>light
-light
</bar
-style
>
394 <repeat direction
="backward"/>
398 print OUT " </measure>\n";
400 print OUT ' <measure number
="'.$meas.'">
402 if ($barline =~ /^\/\/:$/) {
403 print OUT ' <barline location
="left">
404 <bar
-style
>heavy
-light
</bar
-style
>
405 <repeat direction
="forward"/>
408 } elsif ($barline =~ /^:\/\/:$/) {
409 print OUT ' <barline location
="left">
410 <repeat direction
="forward"/>
419 $toprint .= "bar line\n";
420 } #elsif ($notes =~ /^(\d*\.*\-)(.*)$/) {
421 #($rst, $notes) = ($1, $2);
422 #$toprint .= "rest: $rst\n";
423 #$rst =~ /^(\d*)(\.*)\-$/;
424 #($rst, $dots) =($1,$2);
427 # <duration>'.duration($rst, $dots).'</duration>
428 #'.# <type>quarter</type>
432 elsif ($notes =~ /^\((\=)\)(.*)$/) { # a bar of rest with a fermata
433 ($rst, $notes) = ($1, $2);
434 $toprint .= "rest: $rst\n";
437 <duration>'.($beats*$divisions*4/$beattype).'</duration
>
439 <fermata type
="upright"/>
444 elsif ($notes =~ s/(\d+\.*)\(((\,|\')*(x|xx|b|bb|n)?\d*\.*(g|q)?(\-|A|B|C|D|E|F|G)t?\+?)\)/\($1$2\)/gs) { # pull duration into fermata parentheses
445 # print "after replacement: $notes\n"; exit;
447 elsif ($notes =~ /^ +(.*)$/) {
449 print("Invalid space encountered in notes before $notes\n");
452 print_error("got stuck with $notes\n");
457 print OUT " </measure>\n";
# Arguments: one note token ($note), the key signature string ($keysig), XML to
# place inside <notations> ($notation), a <time-modification> snippet
# ($addition) and a flag that is true inside a qq group ($in_qq_group).
# The code below prints the pieces of one MusicXML note to OUT.
463 my($note, $keysig, $notation, $addition, $in_qq_group) = @_;
466 my ($actualnotes, $normalnotes) = (1,1);
# Recover the tuplet ratio from the snippet so the duration can be scaled below.
468 if ($addition =~ /^\s*<time-modification>\s*<actual-notes>\s*(\d+)\s*<\/actual-notes>\s*<normal-notes>\s*(\d+)\s*<\/normal-notes>\s*<\/time-modification>\s*$/) {
469 ($actualnotes, $normalnotes) = ($1, $2);
# A token wrapped in parentheses is the "one note with a fermata" form that
# parse_notes passes in.
472 if ($note =~ /^\((.*)\)$/) {
# Split the token into octave marks, accidental, duration digits, dots,
# grace/cue flag (g or q), pitch letter or "-", trill flag (t) and tie flag (+).
477 $note =~ /^((\,|\')*)(x|xx|b|bb|n)?(\d*)(\.*)(g|q)?(\-|A|B|C|D|E|F|G)(t?)(\+?)$/;
478 my ($oct, $acc, $dur, $dot, $gracecue, $pitch, $trill, $tie) = ($1, $3, $4, $5, $6, $7, $8, $9);
482 if ($gracecue eq "g") {
483 print OUT ' <grace steal
-time-following
="33"/>
486 if ($gracecue eq "q" || $in_qq_group) {
491 print OUT " <rest />\n";
494 <step
>'.$pitch.'</step
>
495 '.alter($pitch, $acc, $keysig)
496 .' <octave
>'.octave($oct).'</octave
>
# Only tokens without the "g" flag get a <duration>; it is scaled by
# normal/actual notes, which is 1/1 unless a tuplet ratio was found above.
500 if ($gracecue ne "g") {
501 print OUT ' <duration
>'.(duration($dur, $dot)*$normalnotes/$actualnotes).'</duration
>
508 print OUT ' <tie type
="start"/>
513 print OUT ' <tie type
="stop"/>
# The <notations> wrapper is written only when a fermata, a trill or a
# caller-supplied notation has to go inside it.
521 my $notationbracket = $fermata || ($trill eq "t") || ($notation ne "");
522 if ($notationbracket) {
523 print OUT " <notations>\n";
525 if ($fermata) { print OUT '
526 <fermata type
="upright"/>'."\n"; }
527 if ($trill eq "t") { print OUT ' <ornaments
>
532 if ($notation ne "") {
533 print OUT " $notation\n";
535 if ($notationbracket) {
536 print OUT " </notations>\n";
542 $toprint .= "note: oct. $oct/acc. $acc/dur. $dur/dots $dot/grace,cue $gracecue/pitch $pitch\n";
# Arguments: pitch letter, accidental token and key signature string.
# Returns the <alter> element for the note as a string.
546 my ($pitch, $acc, $keysig) = @_;
# The pitch letter occurs in the key signature: capture the signature's first
# character ("x" or "b" in the key table used by parse_pe).
550 if (index ($keysig,$pitch) > -1) {
551 $keysig =~ /^(.).*$/gs;
# An accidental written on the note maps directly to a semitone offset and
# replaces any value assigned to $alt before this point.
557 my %acc_alt = ("n", 0, "b", -1, "bb", -2, "x", 1, "xx", 2);
558 if ($acc_alt{$acc} ne "") {
559 $alt = $acc_alt{$acc};
563 return "\t\t\t\t\t<alter>$alt</alter>\n";
# Arguments: a duration digit and a string of dots (either may be empty).
# Returns a length expressed in $divisions units. When both arguments are
# empty, the global $old_duration is returned unchanged, so a note without an
# explicit duration inherits the most recently computed one.
569 my ($duration, $dots) = @_;
571 if ($duration.$dots ne "") {
# Duration digit -> length, relative to $divisions (the length of digit "4").
572 my %du=("1",4*$divisions,"2",2*$divisions,"4",$divisions,
573 "8",$divisions/2,"6",$divisions/4,"3",$divisions/8,
574 "5",$divisions/16,"7",$divisions/32,
575 "9",$divisions*8,"0",$divisions*16); # breve/long
576 $old_duration = $du{$duration};
577 if ($old_duration eq "") {
578 print_error("strange duration '$duration'\n");
# Dots lengthen the note; the pattern at the end of the loop splits off one dot.
# NOTE(review): $add is presumably halved for every dot before it is added -
# confirm against the loop body.
580 my $add = $old_duration;
581 while ($dots ne "") {
583 $old_duration += $add;
584 $dots =~ /^.(.*)$/gs;
588 return $old_duration;
# Derives $old_octave from a run of octave marks: the first character is
# captured separately from the rest, and a run of N marks gives either
# 4 - N or 3 + N.
# NOTE(review): presumably commas count down from 4 and apostrophes count up
# from 3 - confirm against the branch conditions.
595 $octave =~ /^(.)(.*)$/gs;
597 $old_octave = 4 - length $octave;
599 $old_octave = 3 + length $octave;
# Builds the XML for a clef from a clef string of the form
# <letter><"-" or "+"><digit>; the letter becomes the sign and the digit the line.
608 if ($clef =~ /^(\w)(\-|\+)(\d)$/) {
609 ($clefsign, $clefline) = ($1, $3);
611 print "Warning: Mensural clefs are not supported by MusicXML, using modern clef (input: $clef)\n";
# This clef sign is given a <clef-octave-change> of -1.
613 if ($clefsign eq 'g
') {
615 $clefoctave = " <clef-octave-change>-1</clef-octave-change>\n";
# NOTE(review): a G clef on line 2, presumably the fallback for a clef string
# that does not match the pattern above - confirm.
618 ($clefsign, $clefline) = ("G", 2);
621 <sign
>'.$clefsign.'</sign
>
622 <line
>'.$clefline.'</line
>
623 '.$clefoctave.' </clef
>
# Turns a time signature string into the XML of a time element and records the
# meter in the globals $beats and $beattype, which parse_notes uses to compute
# the length of whole-measure rests.
630 if ($timesig eq "c3") {
631 $timesig = "3/2"; # it would be better to display it as "C". Example: 451.023.814
# A "c" prefix before a numeric signature is dropped.
633 if ($timesig =~ /^c(\d+)\/(\d+)$/gs) {
634 $timesig = "$1/$2"; # it would be better to show the "C"
637 if ($timesig eq "0" || $timesig eq "") { # unclear how to handle absence of time signature.
638 $timesig =' <time symbol
="common">
640 <beat
-type
>4</beat
-type
>
642 '; # using 4/4 for now.
643 ($beats, $beattype) = (4,4);
# "c" or "c/" (case-insensitive): the two results below are the cut symbol with
# 2/2 and the common symbol with 4/4.
644 } elsif ($timesig =~ /^c(\/?)$/gi) {
646 $timesig = ' <time symbol
="cut">
648 <beat
-type
>2</beat
-type
>
651 ($beats, $beattype) = (2,2);
653 $timesig = ' <time symbol
="common">
655 <beat
-type
>4</beat
-type
>
658 ($beats, $beattype) = (4,4);
# Plain numeric signature of the form beats/beat-type.
660 } elsif ($timesig =~ /^(\d+)\/(\d+)$/gs) {
661 ($beats, $beattype) = ($1, $2);
663 <beats
>'.$beats.'</beats
>
664 <beat
-type
>'.$beattype.'</beat
-type
>
668 print_error("Time signature '$timesig' looks strange.\n");
669 # $timesig = ""; we assume 4/4 just to get something legible:
670 ($beats, $beattype) = (4,4);
672 <beats
>'.$beats.'</beats
>
673 <beat
-type
>'.$beattype.'</beat
-type
>
# Error report: starts with the context accumulated in the global $toprint
# (appended to by the parsing routines as they go).
683 print "\nAn error occurred; context:\n\n$toprint\n
# Reads the complete input into $res, either from STDIN or from the file
# named by $fn.
691 while (<STDIN>) { $res .= $_; } # read all lines
# NOTE(review): two-argument open on a bareword handle; characters in $fn such
# as a leading ">" or a trailing "|" are interpreted as an open mode. A
# three-argument open with an explicit "<" mode would avoid that.
693 if (!(open FH, $fn)) {
696 while (<FH>) { $res .= $_; } # read all lines