my
%default_macros
= (
jan
=>
"January"
,
feb
=>
"February"
,
mar
=>
"March"
,
apr
=>
"April"
,
may
=>
"May"
,
jun
=>
"June"
,
jul
=>
"July"
,
aug
=>
"August"
,
sep
=>
"September"
,
oct
=>
"October"
,
nov
=>
"November"
,
dec
=>
"December"
,
acmcs
=>
"ACM Computing Surveys"
,
acta
=>
"Acta Informatica"
,
cacm
=>
"Communications of the ACM"
,
ibmjrd
=>
"IBM Journal of Research and Development"
,
ibmsj
=>
"IBM Systems Journal"
,
ieeese
=>
"IEEE Transactions on Software Engineering"
,
ieeetc
=>
"IEEE Transactions on Computers"
,
ieeetcad
=>
"IEEE Transactions on Computer-Aided Design of Integrated Circuits"
,
ipl
=>
"Information Processing Letters"
,
jacm
=>
"Journal of the ACM"
,
jcss
=>
"Journal of Computer and System Sciences"
,
scp
=>
"Science of Computer Programming"
,
sicomp
=>
"SIAM Journal on Computing"
,
tocs
=>
"ACM Transactions on Computer Systems"
,
tods
=>
"ACM Transactions on Database Systems"
,
tog
=>
"ACM Transactions on Graphics"
,
toms
=>
"ACM Transactions on Mathematical Software"
,
toois
=>
"ACM Transactions on Office Information Systems"
,
toplas
=>
"ACM Transactions on Programming Languages and Systems"
,
tcs
=>
"Theoretical Computer Science"
);
sub
newFromFile {
my
(
$class
,
$bibname
) =
@_
;
my
$self
= {
source
=>
$bibname
,
preamble
=> [],
entries
=> [],
macros
=> {
%default_macros
} };
bless
$self
,
$class
;
my
$paths
=
$STATE
->lookupValue(
'SEARCHPATHS'
);
my
$file
= pathname_find(
$bibname
,
types
=> [
'bib'
],
paths
=>
$paths
);
Fatal(
'missing_file'
,
$bibname
,
undef
,
"Can't find BibTeX file $bibname"
,
"SEACHPATHS is "
.
join
(
', '
,
@$paths
))
unless
$file
;
my
$BIB
;
$$self
{file} =
$bibname
;
open
(
$BIB
,
'<'
,
$file
) or Fatal(
'I/O'
,
$file
,
undef
,
"Can't open BibTeX $file for reading"
, $!);
$$self
{lines} = [<
$BIB
>];
close
(
$BIB
);
$$self
{line} =
shift
(@{
$$self
{lines} }) ||
''
;
$$self
{lineno} = 1;
return
$self
; }
sub
newFromString {
my
(
$class
,
$string
) =
@_
;
my
$self
= {
source
=>
"<Unknown>"
,
preamble
=> [],
entries
=> [],
macros
=> {
%default_macros
} };
bless
$self
,
$class
;
$$self
{file} =
"<anonymous>"
;
$$self
{lines} = [
split
(/\n/,
$string
)];
$$self
{line} =
shift
(@{
$$self
{lines} });
$$self
{lineno} = 1;
return
$self
; }
sub
newFromGullet {
my
(
$class
,
$name
,
$gullet
) =
@_
;
my
$self
= {
source
=>
$name
,
preamble
=> [],
entries
=> [],
macros
=> {
%default_macros
} };
bless
$self
,
$class
;
my
@lines
= ();
while
(
$gullet
->getMouth->hasMoreInput) {
while
(
defined
(
my
$line
=
$gullet
->readRawLine)) {
push
(
@lines
,
$line
.
"\n"
); }
$gullet
->closeMouth; }
$$self
{file} =
$name
;
$$self
{lines} = [
@lines
];
$$self
{line} =
shift
(@{
$$self
{lines} });
$$self
{lineno} = 1;
return
$self
; }
sub
toString {
my
(
$self
) =
@_
;
return
"Bibliography[$$self{source}]"
; }
sub
toTeX {
my
(
$self
) =
@_
;
$self
->parseTopLevel
unless
$$self
{parsed};
foreach
my
$entry
(@{
$$self
{entries} }) {
$STATE
->assignValue(
'BIBENTRY@'
.
lc
(
$entry
->getKey) =>
$entry
); }
return
join
(
"\n"
,
@{
$$self
{preamble} },
'\begin{bibtex@bibliography}'
,
(
map
{
'\ProcessBibTeXEntry{'
.
$_
->getKey .
'}'
} @{
$$self
{entries} }),
'\end{bibtex@bibliography}'
); }
sub
getLocator {
my
(
$self
) =
@_
;
return
"at $$self{source}; line $$self{lineno}\n $$self{line}"
; }
sub
parseTopLevel {
my
(
$self
) =
@_
;
NoteBegin(
"Preparsing Bibliography $$self{source}"
);
while
(
$self
->skipJunk) {
my
$type
=
$self
->parseEntryType;
if
(
$type
eq
'preamble'
) {
$self
->parsePreamble; }
elsif
(
$type
eq
'string'
) {
$self
->parseMacro; }
elsif
(
$type
eq
'comment'
) {
$self
->parseComment; }
else
{
$self
->parseEntry(
$type
); }
}
NoteEnd(
"Preparsing Bibliography $$self{source}"
);
$$self
{parsed} = 1;
return
; }
my
%CLOSE
= (
"{"
=>
"}"
,
"("
=>
")"
);
sub
parsePreamble {
my
(
$self
) =
@_
;
my
$open
=
$self
->parseMatch(
"({"
);
my
(
$value
,
$rawvalue
) =
$self
->parseValue();
push
(@{
$$self
{preamble} },
$value
);
$self
->parseMatch(
$CLOSE
{
$open
});
return
; }
sub
parseMacro {
my
(
$self
) =
@_
;
my
$open
=
$self
->parseMatch(
"({"
);
my
(
$fields
,
$rawfields
) =
$self
->parseFields(
'@string'
,
$open
);
foreach
my
$macro
(
@$fields
) {
$$self
{macros}{
$$macro
[0] } =
$$macro
[1]; }
return
; }
sub
parseComment {
my
(
$self
) =
@_
;
my
$comment
=
$self
->parseString();
return
; }
sub
parseEntry {
my
(
$self
,
$type
) =
@_
;
my
$open
=
$self
->parseMatch(
"({"
);
my
$key
=
$self
->parseEntryName();
$self
->parseMatch(
','
);
my
(
$fields
,
$rawfields
) =
$self
->parseFields(
'@string'
,
$open
);
push
(@{
$$self
{entries} }, LaTeXML::Pre::BibTeX::Entry->new(
$type
,
$key
,
$fields
,
$rawfields
));
return
; }
sub
parseFields {
my
(
$self
,
$for
,
$open
) =
@_
;
my
@fields
= ();
my
@rawfields
= ();
do
{
my
$name
=
$self
->parseFieldName;
$self
->parseMatch(
'='
);
my
(
$value
,
$rawvalue
) =
$self
->parseValue;
push
(
@fields
, [
$name
,
$value
]);
push
(
@rawfields
, [
$name
,
$rawvalue
]);
$self
->skipWhite;
}
while
((
$$self
{line} =~ s/^,//)
&&
$self
->skipWhite && (
$$self
{line} !~ /^\Q
$CLOSE
{
$open
}\E/));
$self
->parseMatch(
$CLOSE
{
$open
});
return
([
@fields
], [
@rawfields
]); }
my
$BIBNAME_re
=
q/a-zA-Z0-9/
;
my
$BIBNOISE_re
=
q/\.\+\-\*\/
\^\_\:\;\@\`\?\!\~\|\<\>\$\[\]/;
sub
parseEntryType {
my
(
$self
) =
@_
;
$self
->skipWhite;
return
(
$$self
{line} =~ s/^([
$BIBNAME_re
$BIBNOISE_re
]*)//x ?
lc
($1) :
undef
); }
sub
parseEntryName {
my
(
$self
) =
@_
;
$self
->skipWhite;
return
(
$$self
{line} =~ s/^([\"\
sub
parseFieldName {
my
(
$self
) =
@_
;
$self
->skipWhite;
return
(
$$self
{line} =~ s/^([\
&$BIBNAME_re
$BIBNOISE_re
]*)//x ?
lc
($1) :
undef
); }
sub
parseMatch {
my
(
$self
,
$delims
) =
@_
;
$self
->skipWhite;
if
(!
$delims
) {
return
; }
elsif
(
$$self
{line} =~ s/^([\Q
$delims
\E])//) {
return
$1; }
else
{
Error(
'expected'
,
$delims
,
undef
,
"Expected one of "
.
join
(
' '
,
split
(//,
$delims
)));
return
; } }
sub
parseString {
my
(
$self
) =
@_
;
$self
->skipWhite;
my
$string
;
if
(
$$self
{line} =~ s/^\
"//) { # If opening "
(and remove it!)
while
(
$$self
{line} !~ s/^\
"//) { # Until we've found the closing "
if
(!
$$self
{line}) {
$self
->extendLine; }
elsif
(
$$self
{line} =~ /^\{/) {
$string
.=
$self
->parseBalancedBraces; }
elsif
(
$$self
{line} =~ s/^([^
"\{]*)//) { # else pull off everything except a brace or "
$string
.= $1; } }
}
elsif
(
$$self
{line} =~ /^\{/) {
$string
=
$self
->parseBalancedBraces;
$string
=~ s/^.//;
$string
=~ s/.$//; }
else
{
Error(
'expected'
,
'<delimitedstring>'
,
undef
,
"Expected a string delimited by \"..\", (..) or {..}"
); }
$string
=~ s/^\s+//;
$string
=~ s/\s+$//;
return
$string
; }
sub
parseBalancedBraces {
my
(
$self
) =
@_
;
my
$string
;
while
((
$$self
{line} !~ /\}/) &&
$self
->extendLine) { }
while
((!
defined
(
$string
= extract_bracketed(
$$self
{line},
'{}'
))) &&
$self
->extendLine) { }
return
$string
; }
sub
extendLine {
my
(
$self
) =
@_
;
my
$nextline
=
shift
(@{
$$self
{lines} });
if
(
defined
$nextline
) {
$$self
{line} .=
$nextline
;
$$self
{lineno}++;
return
1; }
else
{
Error(
'unexpected'
,
'<EOF>'
,
undef
,
"Input ended while parsing string"
);
return
; } }
sub
parseValue {
my
(
$self
) =
@_
;
my
$value
=
""
;
do
{
$self
->skipWhite;
if
(
$$self
{line} =~ /^[\"\{]/) {
$value
.=
$self
->parseString; }
elsif
(
my
$name
=
$self
->parseFieldName) {
my
$macro
= (
$name
=~ /^\d+$/ ?
$name
:
$$self
{macros}{
$name
});
if
(!
defined
$macro
) {
Error(
'unexpected'
,
$name
,
undef
,
"The BibTeX macro '$name' is not defined"
);
$macro
=
$name
; }
$value
.=
$macro
; }
else
{
Error(
'expected'
,
'<value>'
,
undef
,
"Expected a BibTeX value"
); }
$self
->skipWhite;
}
while
(
$$self
{line} =~ s/^
return
$value
; }
sub
skipWhite {
my
(
$self
) =
@_
;
my
$nextline
;
do
{
$$self
{line} =~ s/^(\s+)//s;
return
1
if
$$self
{line};
$nextline
=
shift
(@{
$$self
{lines} });
$$self
{line} =
$nextline
||
""
;
$$self
{lineno}++;
}
while
defined
$nextline
;
return
; }
sub
skipJunk {
my
(
$self
) =
@_
;
while
(1) {
$$self
{line} =~ s/^[^@%]*//;
return
'@'
if
$$self
{line} =~ s/^@//;
my
$nextline
=
shift
(@{
$$self
{lines} });
$$self
{line} =
$nextline
||
""
;
$$self
{lineno}++;
return
unless
defined
$nextline
; }
return
; }
1;