our
@EXPORT
= (
@LaTeXML::Common::Error::EXPORT
);
sub
new {
my
(
$class
,
%options
) =
@_
;
my
$self
=
bless
{
status
=> {},
%options
},
$class
;
$$self
{state} = LaTeXML::Core::State->new();
return
$self
; }
sub
ProcessChain {
my
(
$self
,
$doc
,
@postprocessors
) =
@_
;
return
$self
->withState(
sub
{
return
$self
->ProcessChain_internal(
$doc
,
@postprocessors
); }); }
sub
ProcessChain_internal {
my
(
$self
,
$doc
,
@postprocessors
) =
@_
;
local
$LaTeXML::POST
=
$self
;
local
$LaTeXML::Post::NOTEINFO
=
undef
;
local
$LaTeXML::Post::DOCUMENT
=
$doc
;
my
@docs
= (
$doc
);
ProgressSpinup(
"post-processing"
);
foreach
my
$processor
(
@postprocessors
) {
local
$LaTeXML::Post::PROCESSOR
=
$processor
;
my
@newdocs
= ();
foreach
my
$doc
(
@docs
) {
local
$LaTeXML::Post::DOCUMENT
=
$doc
;
if
(
my
@nodes
=
grep
{
$_
}
$processor
->toProcess(
$doc
)) {
my
$n
=
scalar
(
@nodes
);
my
$msg
=
join
(
' '
,
$processor
->getName ||
''
,
$doc
->siteRelativeDestination ||
''
,
(
$n
> 1 ?
"$n to process"
:
'processing'
));
ProgressSpinup(
$msg
);
push
(
@newdocs
,
$processor
->process(
$doc
,
@nodes
));
ProgressSpindown(
$msg
); }
else
{
push
(
@newdocs
,
$doc
); } }
@docs
=
@newdocs
; }
ProgressSpindown(
"post-processing"
);
return
@docs
; }
sub
withState {
my
(
$self
,
$closure
) =
@_
;
local
$STATE
=
$$self
{state};
local
$SIG
{__DIE__} = \
&LaTeXML::Common::Error::perl_die_handler
;
local
$SIG
{INT} = \
&LaTeXML::Common::Error::perl_interrupt_handler
;
local
$SIG
{__WARN__} = \
&LaTeXML::Common::Error::perl_warn_handler
;
local
$SIG
{
'ALRM'
} = \
&LaTeXML::Common::Error::perl_timeout_handler
;
local
$SIG
{
'TERM'
} = \
&LaTeXML::Common::Error::perl_terminate_handler
;
local
$LaTeXML::DUAL_BRANCH
=
''
;
return
&$closure
(
$STATE
); }
sub
getStatusCode {
my
(
$self
) =
@_
;
return
$$self
{state}->getStatusCode; }
sub
getStatusMessage {
my
(
$self
) =
@_
;
return
$$self
{state}->getStatusMessage; }
sub
getsorter {
my
(
$self
,
$lang
) =
@_
;
my
$collator
;
if
(
$collator
=
$$self
{collatorcache}{
$lang
}) { }
elsif
(
$collator
=
eval
{
local
$LaTeXML::IGNORE_ERRORS
= 1;
require
'Unicode/Collate/Locale.pm'
;
Unicode::Collate::Locale->new(
locale
=>
$lang
,
variable
=>
'non-ignorable'
,
upper_before_lower
=> 1); }) { }
elsif
(
$collator
=
eval
{
local
$LaTeXML::IGNORE_ERRORS
= 1;
require
'Unicode/Collate.pm'
;
Unicode::Collate->new(
variable
=>
'non-ignorable'
,
upper_before_lower
=> 1); }) {
Info(
'expected'
,
'Unicode::Collate::Locale'
,
undef
,
"No Unicode::Collate::Locale found;"
,
"using Unicode::Collate; ignoring language='$lang'"
); }
else
{
$collator
= LaTeXML::Post::DumbCollator->new();
Info(
'expected'
,
'Unicode::Collate::Locale'
,
undef
,
"No Unicode::Collate::Locale or Unicode::Collate"
,
"using perl's sort; ignoring language='$lang'"
); }
$$self
{collatorcache}{
$lang
} =
$collator
;
return
$collator
; }
sub
new {
my
(
$class
) =
@_
;
return
bless
{},
$class
; }
sub
sort
{
my
(
$self
,
@things
) =
@_
;
return
(
sort
@things
); }
sub
new {
my
(
$class
,
%options
) =
@_
;
my
$self
=
bless
{
%options
},
$class
;
$$self
{resource_directory} =
$options
{resource_directory};
$$self
{resource_prefix} =
$options
{resource_prefix};
my
$name
=
$class
;
$name
=~ s/^LaTeXML::Post:://;
$$self
{name} =
$name
;
return
$self
; }
sub
getName {
my
(
$self
) =
@_
;
return
$$self
{name}; }
sub
toProcess {
my
(
$self
,
$doc
) =
@_
;
return
$doc
->getDocumentElement; }
sub
process {
my
(
$self
,
$doc
,
@toprocess
) =
@_
;
Fatal(
"misdefined"
,
$self
,
$doc
,
"This post-processor is abstract; does not implement ->process"
);
return
$doc
; }
sub
desiredResourcePathname {
my
(
$self
,
$doc
,
$node
,
$source
,
$type
) =
@_
;
return
; }
sub
generateResourcePathname {
my
(
$self
,
$doc
,
$node
,
$source
,
$type
) =
@_
;
my
$subdir
=
$$self
{resource_directory} ||
''
;
my
$prefix
=
$$self
{resource_prefix} ||
"x"
;
my
$counter
=
join
(
'_'
,
"_max"
,
$subdir
,
$prefix
,
"counter_"
);
my
$n
=
$doc
->cacheLookup(
$counter
) || 0;
my
$name
=
$prefix
. ++
$n
;
$doc
->cacheStore(
$counter
,
$n
);
return
pathname_make(
dir
=>
$subdir
,
name
=>
$name
,
type
=>
$type
); }
sub
find_documentclass_and_packages {
my
(
$self
,
$doc
) =
@_
;
my
(
$class
,
$classoptions
,
$oldstyle
,
@packages
);
foreach
my
$pi
(
$doc
->findnodes(
".//processing-instruction('latexml')"
)) {
my
$data
=
$pi
->textContent;
my
$entry
= {};
while
(
$data
=~ s/\s*([\w\-\_]*)=([\"\'])(.*?)\2//) {
$$entry
{$1} = $3; }
if
(
$$entry
{class}) {
$class
=
$$entry
{class};
$classoptions
=
$$entry
{options} ||
'onecolumn'
;
$oldstyle
=
$$entry
{oldstyle}; }
elsif
(
$$entry
{
package
}) {
my
@p
=
grep
{
$_
; }
split
(/\s*,\s*/,
$$entry
{
package
});
foreach
my
$package
(
@p
) {
push
(
@packages
, [
$package
,
$$entry
{options} ||
''
]); } } }
if
(!
$class
) {
Warn(
'expected'
,
'class'
,
undef
,
"No document class found; using article"
);
$class
=
'article'
; }
return
([
$class
,
$classoptions
,
$oldstyle
],
@packages
); }
sub
find_preambles {
my
(
$self
,
$doc
) =
@_
;
my
@preambles
= ();
foreach
my
$pi
(
$doc
->findnodes(
".//processing-instruction('latexml')"
)) {
my
$data
=
$pi
->textContent;
while
(
$data
=~ s/\s*([\w\-\_]*)=([\"\'])(.*?)\2//) {
if
($1 eq
'preamble'
) {
push
(
@preambles
, $3); } } }
return
join
(
"\n"
,
@preambles
); }
sub
copy_foreign_attributes {
my
(
$self
,
$newnode
,
$node
) =
@_
;
my
%attr
= ();
if
(
ref
$node
eq
'ARRAY'
) {
%attr
= %{
$$node
[1] }; }
else
{
foreach
my
$attr
(
$node
->attributes()) {
if
(
$attr
->nodeType == XML_ATTRIBUTE_NODE) {
$attr
{
$attr
->nodeName } =
$attr
->getValue; } } }
foreach
my
$key
(
keys
%attr
) {
next
if
$key
=~ /^xml:/;
next
unless
$key
=~ /:/;
my
$value
=
$attr
{
$key
};
if
(
ref
$newnode
eq
'ARRAY'
) {
$$newnode
[1]{
$key
} =
$value
unless
defined
$$newnode
[1]{
$key
}; }
else
{
$newnode
->setAttribute(
$key
=>
$value
)
unless
$newnode
->hasAttribute(
$key
); } }
return
; }
sub
toProcess {
my
(
$self
,
$doc
) =
@_
;
return
$doc
->findnodes(
'//ltx:Math[not(ancestor::ltx:Math)]'
); }
sub
process {
my
(
$self
,
$doc
,
@maths
) =
@_
;
local
$LaTeXML::Post::MATHPROCESSOR
=
$self
;
$doc
->markXMNodeVisibility;
$self
->preprocess(
$doc
,
@maths
);
if
(
$$self
{parallel}) {
my
@secondaries
= @{
$$self
{secondary_processors} };
my
(
$proc1
,
@ignore
) =
grep
{
$_
->can(
'addCrossref'
) }
@secondaries
;
if
(
$self
->can(
'addCrossref'
) &&
$proc1
) {
$$self
{crossreferencing} = 1;
$$proc1
{crossreferencing} = 1; }
foreach
my
$proc
(
@secondaries
) {
local
$LaTeXML::Post::MATHPROCESSOR
=
$proc
;
$proc
->preprocess(
$doc
,
@maths
); } }
@maths
=
$self
->toProcess(
$doc
);
my
$n
= 0;
foreach
my
$math
(
reverse
(
@maths
)) {
my
@preceding
=
$doc
->findnodes(
"parent::ltx:MathBranch/preceding-sibling::*"
,
$math
);
local
$LaTeXML::Post::MathProcessor::FORK
=
scalar
(
@preceding
);
$self
->processNode(
$doc
,
$math
);
$n
++; }
if
(
$$self
{parallel}) {
my
(
$proc1
,
$proc2
,
@ignore
)
=
grep
{
$_
->can(
'addCrossref'
) }
$self
, @{
$$self
{secondary_processors} };
if
(
$proc1
&&
$proc2
) {
my
$ids
= {};
my
$pos
= 0;
foreach
my
$n
(
$doc
->findnodes(
'descendant-or-self::ltx:Math/descendant::*[@xml:id]'
)) {
$$ids
{
$n
->getAttribute(
'xml:id'
) } =
$pos
++; }
$$proc1
{crossreferencing_ids} =
$ids
;
$$proc2
{crossreferencing_ids} =
$ids
;
$proc1
->addCrossrefs(
$doc
,
$proc2
);
$proc2
->addCrossrefs(
$doc
,
$proc1
); } }
NoteLog(
"converted $n Maths"
);
return
$doc
; }
sub
canConvert {
return
1; }
sub
setParallel {
my
(
$self
,
@moreprocessors
) =
@_
;
if
(
@moreprocessors
) {
$$self
{parallel} = 1;
map
{
$$_
{is_secondary} = 1 }
@moreprocessors
;
$$self
{secondary_processors} = [
@moreprocessors
];
$$self
{name} .=
'[w/'
.
join
(
'+'
,
map
{
$_
->getName }
@moreprocessors
) .
']'
; }
else
{
$$self
{parallel} = 0; }
return
; }
sub
preprocess {
my
(
$self
,
$doc
,
@nodes
) =
@_
;
return
; }
sub
processNode {
my
(
$self
,
$doc
,
$math
) =
@_
;
my
$xmath
=
$doc
->findnode(
'ltx:XMath'
,
$math
);
return
unless
$xmath
;
local
$LaTeXML::Post::MATHPROCESSOR
=
$self
;
my
$conversion
;
$doc
->preremoveNodes(
$xmath
);
if
(
$$self
{parallel}) {
my
$primary
=
$self
->convertNode(
$doc
,
$xmath
);
my
@secondaries
= ();
foreach
my
$proc
(@{
$$self
{secondary_processors} }) {
next
unless
$proc
->canConvert(
$doc
,
$math
);
local
$LaTeXML::Post::MATHPROCESSOR
=
$proc
;
my
$secondary
=
$proc
->convertNode(
$doc
,
$xmath
);
$self
->maybeSetMathImage(
$math
,
$secondary
);
push
(
@secondaries
,
$secondary
); }
$conversion
=
$self
->combineParallel(
$doc
,
$xmath
,
$primary
,
@secondaries
); }
else
{
$conversion
=
$self
->convertNode(
$doc
,
$xmath
);
$self
->maybeSetMathImage(
$math
,
$conversion
); }
if
(
my
$xml
=
$$conversion
{xml}) {
$$conversion
{xml} =
$self
->outerWrapper(
$doc
,
$xmath
,
$xml
); }
elsif
(
my
$string
=
$$conversion
{string}) {
my
$mimetype
=
$$conversion
{mimetype} ||
'unknown'
;
$$conversion
{xml} = [
'ltx:text'
, {
class
=>
'ltx_math_'
.
$mimetype
},
$string
]; }
$doc
->removeNodes(
$xmath
);
if
(
$$conversion
{mimetype} && (
$$conversion
{mimetype} ne
'application/x-latexml'
)) {
map
{
$_
->removeAttribute(
'xml:id'
) }
$doc
->findnodes(
'descendant-or-self::*[@xml:id]'
,
$xmath
); }
$doc
->removeBlankNodes(
$math
);
if
(
my
$new
=
$$conversion
{xml}) {
$doc
->addNodes(
$math
,
$new
); }
return
; }
sub
maybeSetMathImage {
my
(
$self
,
$math
,
$conversion
) =
@_
;
if
(((
$$conversion
{mimetype} ||
''
) =~ /^image\//)
&& !
$math
->getAttribute(
'imagesrc'
)) {
if
(
my
$src
=
$$conversion
{src}) {
$math
->setAttribute(
imagesrc
=> pathname_to_url(
$src
));
$math
->setAttribute(
imagewidth
=>
$$conversion
{width});
$math
->setAttribute(
imageheight
=>
$$conversion
{height});
$math
->setAttribute(
imagedepth
=>
$$conversion
{depth}); } }
return
; }
sub
outerWrapper {
my
(
$self
,
$doc
,
$xmath
,
$conversion
) =
@_
;
return
$conversion
; }
sub
convertNode {
my
(
$self
,
$doc
,
$node
) =
@_
;
Fatal(
'misdefined'
, (
ref
$self
),
undef
,
"Abstract package: math conversion has not been defined for this MathProcessor"
);
return
; }
sub
combineParallel {
my
(
$self
,
$doc
,
$xmath
,
$primary
,
@secondaries
) =
@_
;
Error(
'misdefined'
, (
ref
$self
),
undef
,
"Abstract package: combining parallel markup has not been defined for this MathProcessor"
,
"dropping the extra markup from: "
.
join
(
','
,
map
{
$$_
{processor} }
@secondaries
));
return
$primary
; }
my
$NBSP
=
pack
(
'U'
, 0xA0);
sub
convertXMTextContent {
my
(
$self
,
$doc
,
$convertspaces
,
@nodes
) =
@_
;
my
@result
= ();
foreach
my
$node
(
@nodes
) {
if
(
$node
->nodeType == XML_TEXT_NODE) {
my
$string
=
$node
->textContent;
if
(
$convertspaces
) {
$string
=~ s/^\s+/
$NBSP
/;
$string
=~ s/\s+$/
$NBSP
/; }
push
(
@result
,
$string
); }
else
{
my
$tag
=
$doc
->getQName(
$node
);
if
(
$tag
eq
'ltx:XMath'
) {
my
$conversion
=
$self
->convertNode(
$doc
,
$node
);
my
$xml
=
$$conversion
{xml};
push
(
@result
,
$self
->outerWrapper(
$doc
,
$node
,
$xml
)); }
else
{
my
%attr
= ();
foreach
my
$attr
(
$node
->attributes) {
my
$atype
=
$attr
->nodeType;
if
(
$atype
== XML_ATTRIBUTE_NODE) {
my
$key
=
$attr
->nodeName;
my
$value
=
$attr
->getValue;
if
(
$key
=~ /^_/) { }
elsif
(
$key
eq
'xml:id'
) { }
elsif
(
$key
eq
'fragid'
) {
my
$id
=
$doc
->uniquifyID(
$value
,
$self
->IDSuffix);
$attr
{
'xml:id'
} =
$id
; }
else
{
$attr
{
$key
} =
$attr
->value; } } }
push
(
@result
,
[
$tag
, {
%attr
},
$self
->convertXMTextContent(
$doc
,
$convertspaces
,
$node
->childNodes)]); } } }
return
@result
; }
sub
IDSuffix {
my
(
$self
) =
@_
;
return
(
$$self
{is_secondary} ?
$self
->rawIDSuffix :
''
); }
sub
rawIDSuffix {
return
''
; }
sub
associateNode {
my
(
$self
,
$node
,
$currentnode
,
$noxref
) =
@_
;
my
$r
=
ref
$node
;
return
unless
$currentnode
&&
$r
&& (
$r
eq
'ARRAY'
||
$r
eq
'XML::LibXML::Element'
);
$self
->copy_foreign_attributes(
$node
,
$currentnode
);
my
$document
=
$LaTeXML::Post::DOCUMENT
;
my
$isarray
=
ref
$node
eq
'ARRAY'
;
my
$ispresentation
=
$self
->rawIDSuffix eq
'.pmml'
;
my
$iscontainer
= 0;
my
$container
;
if
(
$isarray
) {
return
if
$$node
[1]{
'_sourced'
};
$$node
[1]{
'_sourced'
} = 1;
my
(
$tag
,
$attr
,
@children
) =
@$node
;
$iscontainer
=
grep
{
ref
$_
}
@children
; }
else
{
return
if
$node
->getAttribute(
'_sourced'
);
$node
->setAttribute(
'_sourced'
=> 1);
$iscontainer
=
scalar
(element_nodes(
$node
)); }
my
$sourcenode
=
$currentnode
;
if
(
$currentnode
->getAttribute(
'decl_id'
)) { }
elsif
(
$iscontainer
) {
my
$sid
=
$sourcenode
->getAttribute(
'xml:id'
);
if
(
$container
=
$document
->findnode(
'parent::ltx:XMDual[1]'
,
$sourcenode
)
|| (
$sid
&&
$document
->findnode(
"ancestor-or-self::ltx:XMDual[ltx:XMRef[\@idref='$sid']][1]"
,
$sourcenode
))) {
$sourcenode
=
$container
; } }
elsif
(
$container
=
$document
->findnode(
'ancestor::ltx:XMApp[@decl_id or @meaning][1]'
,
$sourcenode
)) {
$sourcenode
=
$container
; }
elsif
(
$currentnode
->getAttribute((
$ispresentation
?
'_cvis'
:
'_pvis'
))) { }
elsif
(
$container
=
$document
->findnode(
'ancestor-or-self::ltx:XMDual[1]'
,
$sourcenode
)) {
my
(
$op
) = element_nodes(
$container
);
my
$q
=
$document
->getQName(
$op
) ||
'unknown'
;
if
(
$container
->hasAttribute(
'decl_id'
)) {
$op
=
undef
; }
elsif
(
$q
eq
'ltx:XMTok'
) { }
elsif
(
$q
eq
'ltx:XMApp'
) {
while
((
$q
eq
'ltx:XMApp'
) && !
$op
->hasAttribute(
'meaning'
)) {
(
$op
) = element_nodes(
$op
);
$q
=
$document
->getQName(
$op
) ||
'unknown'
; } }
if
(
$q
eq
'ltx:XMRef'
) {
$op
=
$document
->realizeXMNode(
$op
); }
if
(
$op
&& !(
$op
->getAttribute(
'_pvis'
)
&& ((
$op
->getAttribute(
'thickness'
) ||
'<anything>'
) ne
'0pt'
))) {
$sourcenode
=
$op
; }
else
{
$sourcenode
=
$container
; } }
if
(
$$self
{crossreferencing}) {
if
(!
$noxref
&& !
$sourcenode
->getAttribute(
'fragid'
)) {
$document
->generateNodeID(
$sourcenode
,
''
, 1); }
if
(
my
$sourceid
=
$sourcenode
->getAttribute(
'fragid'
)) {
my
$nodeid
=
$currentnode
->getAttribute(
'fragid'
) ||
$sourceid
;
my
$id
=
$document
->uniquifyID(
$nodeid
,
$self
->IDSuffix);
if
(
$isarray
) {
$$node
[1]{
'xml:id'
} =
$id
; }
else
{
$node
->setAttribute(
'xml:id'
=>
$id
); }
push
(@{
$$self
{convertedIDs}{
$sourceid
} },
$id
)
unless
$noxref
; } }
$self
->associateNodeHook(
$node
,
$sourcenode
,
$noxref
);
if
(
$isarray
) {
map
{
$self
->associateNode(
$_
,
$currentnode
,
$noxref
) }
@$node
[2 ..
$#$node
]; }
else
{
map
{
$self
->associateNode(
$_
,
$currentnode
,
$noxref
) } element_nodes(
$node
); }
return
; }
sub
associateNodeHook {
my
(
$self
,
$node
,
$sourcenode
,
$noxref
) =
@_
;
return
; }
sub
shownode {
my
(
$node
,
$level
) =
@_
;
$level
= 0
unless
defined
$level
;
my
$ref
=
ref
$node
;
if
(
$ref
eq
'ARRAY'
) {
my
(
$tag
,
$attr
,
@children
) =
@$node
;
return
"\n"
. (
' '
x
$level
)
.
'['
.
$tag
.
',{'
.
join
(
','
,
map
{
$_
.
'=>'
. (
$$attr
{
$_
} ||
''
) }
sort
keys
%$attr
) .
'},'
.
join
(
','
,
map
{ shownode(
$_
,
$level
+ 1) }
@children
) .
']'
; }
elsif
(
$ref
=~ /^XML/) {
return
$node
->toString; }
else
{
return
"$node"
; } }
sub
addCrossrefs {
my
(
$self
,
$doc
,
$otherprocessor
) =
@_
;
my
$selfs_map
=
$$self
{convertedIDs};
my
$others_map
=
$$otherprocessor
{convertedIDs};
my
$xrefids
=
$$self
{crossreferencing_ids};
my
$backref
= {};
foreach
my
$id
(
keys
%$selfs_map
) {
foreach
my
$t
(@{
$$selfs_map
{
$id
} }) {
$$backref
{
$t
} =
$id
; } }
foreach
my
$xid
(
keys
%$selfs_map
) {
my
$other_ids
=
$$others_map
{
$xid
};
if
(!
$other_ids
) {
if
(
my
$mapped
=
$$selfs_map
{
$xid
}) {
foreach
my
$mid
(
@$mapped
) {
if
(
my
$node
=
$doc
->findNodeByID(
$mid
)) {
my
(
$parent
,
$pid
,
$xpid
) = (
$node
,
undef
,
undef
);
while
((
$parent
=
$parent
->parentNode)
&& (
$parent
->nodeType == XML_ELEMENT_NODE)
&& (!(
$pid
=
$parent
->getAttribute(
'xml:id'
))
|| !(
$xpid
=
$$backref
{
$pid
})
|| !
$$others_map
{
$xpid
})) { }
if
(
$xpid
) {
$other_ids
=
$$others_map
{
$xpid
}; } } } } }
if
(
$other_ids
) {
my
$xref_id
=
$$other_ids
[0];
if
(
scalar
(
@$other_ids
) > 1) {
(
$xref_id
) =
sort
{
$$xrefids
{
$a
} <=>
$$xrefids
{
$b
} }
@$other_ids
; }
foreach
my
$id
(@{
$$selfs_map
{
$xid
} }) {
if
(
my
$node
=
$doc
->findNodeByID(
$id
)) {
$self
->addCrossref(
$node
,
$xref_id
); } } }
else
{
} }
return
; }
sub
mathIsParsed {
my
(
$doc
,
$math
) =
@_
;
return
$math
&& ((
$math
->getAttribute(
'class'
) ||
''
) !~
'ltx_math_unparsed'
); }
our
$XPATH
= LaTeXML::Common::XML::XPath->new(
ltx
=>
$NSURI
);
sub
new {
my
(
$class
,
$xmldoc
,
%options
) =
@_
;
my
$self
=
$class
->new_internal(
$xmldoc
,
%options
);
$self
->setDocument_internal(
$xmldoc
);
return
$self
; }
sub
new_internal {
my
(
$class
,
$xmldoc
,
%options
) =
@_
;
my
%data
= ();
if
(
ref
$class
) {
map
{
$data
{
$_
} =
$$class
{
$_
} }
keys
%$class
;
$class
=
ref
$class
; }
map
{
$data
{
$_
} =
$options
{
$_
} }
keys
%options
;
if
((
defined
$options
{destination}) && (!
defined
$options
{destinationDirectory})) {
my
(
$dir
,
$name
,
$ext
) = pathname_split(
$data
{destination});
$data
{destinationDirectory} =
$dir
||
'.'
; }
if
(
$data
{destinationDirectory}) {
if
(
$data
{siteDirectory}) {
Fatal(
'unexpected'
,
$data
{destinationDirectory},
undef
,
"The destination directory ($data{destinationDirectory})"
.
" must be within the siteDirectory ($data{siteDirectory})"
)
unless
pathname_is_contained(
$data
{destinationDirectory},
$data
{siteDirectory}); }
else
{
$data
{siteDirectory} =
$data
{destinationDirectory}; } }
$data
{namespaces} = {
ltx
=>
$NSURI
}
unless
$data
{namespaces};
$data
{namespaceURIs} = {
$NSURI
=>
'ltx'
}
unless
$data
{namespaceURIs};
$data
{idcache} = {};
$data
{idcache_reusable} = {};
$data
{idcache_reserve} = {};
my
$self
=
bless
{
%data
},
$class
;
return
$self
; }
sub
newFromFile {
my
(
$class
,
$source
,
%options
) =
@_
;
my
$path
= (
ref
$class
? pathname_find(
$source
,
paths
=>
$$class
{searchpaths})
:
$source
);
if
(!
$path
) {
Error(
'missing_file'
,
$source
,
$class
,
"No XML document '$source' found"
,
(
ref
$class
?
"search paths are "
.
join
(
', '
, @{
$$class
{searchpaths} }) : ()));
return
; }
$options
{source} =
$path
;
if
(!
$options
{sourceDirectory}) {
my
(
$dir
,
$name
,
$ext
) = pathname_split(
$path
);
$options
{sourceDirectory} =
$dir
||
'.'
; }
my
$doc
=
$class
->new(LaTeXML::Common::XML::Parser->new()->parseFile(
$path
),
%options
);
$doc
->validate
if
$$doc
{validate};
return
$doc
; }
sub
newFromString {
my
(
$class
,
$string
,
%options
) =
@_
;
$options
{sourceDirectory} =
'.'
unless
$options
{sourceDirectory};
my
$doc
=
$class
->new(LaTeXML::Common::XML::Parser->new()->parseString(
$string
),
%options
);
$doc
->validate
if
$$doc
{validate};
return
$doc
; }
sub
newFromSTDIN {
my
(
$class
,
%options
) =
@_
;
my
$string
;
{
local
$/ =
undef
;
$string
= <>; }
$options
{sourceDirectory} =
'.'
unless
$options
{sourceDirectory};
my
$doc
=
$class
->new(LaTeXML::Common::XML::Parser->new()->parseString(
$string
),
%options
);
$doc
->validate
if
$$doc
{validate};
return
$doc
; }
sub
newDocument {
my
(
$self
,
$root
,
%options
) =
@_
;
my
$clone_suffix
=
$options
{clone_suffix};
delete
$options
{clone_suffix};
my
$doc
=
$self
->new_internal(
undef
,
%options
);
$doc
->setDocument_internal(
$root
,
clone_suffix
=>
$clone_suffix
);
if
(
my
$root_id
=
$self
->getDocumentElement->getAttribute(
'xml:id'
)) {
$$doc
{split_from_id} =
$root_id
; }
foreach
my
$pi
(
$self
->findnodes(
".//processing-instruction('latexml')"
)) {
$doc
->getDocument->appendChild(
$pi
->cloneNode); }
if
(
my
@resources
=
$self
->findnodes(
"descendant::ltx:resource"
)) {
$doc
->addNodes(
$doc
->getDocumentElement,
@resources
); }
$doc
->addDate(
$self
);
if
(
my
$class
=
$self
->getDocumentElement->getAttribute(
'class'
)) {
my
$root
=
$doc
->getDocumentElement;
my
$oclass
=
$root
->getAttribute(
'class'
);
$root
->setAttribute(
class
=> (
$oclass
?
$oclass
.
' '
.
$class
:
$class
)); }
return
$doc
; }
sub
setDocument_internal {
my
(
$self
,
$root
,
%options
) =
@_
;
my
$roottype
=
ref
$root
;
if
(
$roottype
eq
'LaTeXML::Core::Document'
) {
$root
=
$root
->getDocument;
$roottype
=
ref
$root
; }
if
(
my
$clone_suffix
=
$options
{clone_suffix}) {
if
(
$roottype
eq
'XML::LibXML::Document'
) {
Fatal(
'internal'
,
'unimplemented'
,
undef
,
"Have not yet implemented cloning for entire documents"
); }
$root
=
$self
->cloneNode(
$root
,
$clone_suffix
); }
if
(
$roottype
eq
'XML::LibXML::Document'
) {
$$self
{document} =
$root
;
foreach
my
$node
(
$self
->findnodes(
"//*[\@xml:id]"
)) {
$$self
{idcache}{
$node
->getAttribute(
'xml:id'
) } =
$node
; }
if
(
my
$docroot
=
$root
->documentElement) {
foreach
my
$ns
(
$docroot
->getNamespaces) {
my
(
$prefix
,
$uri
) = (
$ns
->getLocalName,
$ns
->getData);
if
(
$prefix
) {
$$self
{namespaces}{
$prefix
} =
$uri
unless
$$self
{namespaces}{
$prefix
};
$$self
{namespaceURIs}{
$uri
} =
$prefix
unless
$$self
{namespaceURIs}{
$uri
}; } } }
$$self
{processingInstructions} =
[
map
{
$_
->textContent }
$XPATH
->findnodes(
'.//processing-instruction("latexml")'
,
$root
)];
my
@paths
= ();
@paths
= @{
$$self
{searchpaths} }
if
$$self
{searchpaths};
foreach
my
$pi
(@{
$$self
{processingInstructions} }) {
if
(
$pi
=~ /^\s
*searchpaths
\s*=\s*([\"\'])(.*?)\1\s*$/) {
push
(
@paths
,
split
(
','
, $2)); } }
$$self
{searchpaths} = [
@paths
,
'.'
]; }
elsif
(
$roottype
eq
'XML::LibXML::Element'
) {
$$self
{document} = XML::LibXML::Document->new(
"1.0"
,
"UTF-8"
);
if
(
my
$parent
=
$self
->findnode(
'ancestor::*[@id][1]'
,
$root
)) {
$$self
{parent_id} =
$parent
->getAttribute(
'xml:id'
); }
$$self
{document}->setDocumentElement(
$$self
{document}->importNode(
$root
));
$root
->setNamespace(
$root
->namespaceURI,
$root
->prefix, 1);
foreach
my
$node
(
$self
->findnodes(
"//*[\@xml:id]"
)) {
$$self
{idcache}{
$node
->getAttribute(
'xml:id'
) } =
$node
; } }
elsif
(
$roottype
eq
'ARRAY'
) {
$$self
{document} = XML::LibXML::Document->new(
"1.0"
,
"UTF-8"
);
my
(
$tag
,
$attributes
,
@children
) =
@$root
;
my
(
$prefix
,
$localname
) =
$tag
=~ /^(.*):(.*)$/;
my
$nsuri
=
$$self
{namespaces}{
$prefix
};
my
$node
=
$$self
{document}->createElementNS(
$nsuri
,
$localname
);
$$self
{document}->setDocumentElement(
$node
);
map
{
$$attributes
{
$_
} &&
$node
->setAttribute(
$_
=>
$$attributes
{
$_
}) }
keys
%$attributes
if
$attributes
;
if
(
my
$id
=
$$attributes
{
'xml:id'
}) {
$self
->recordID(
$id
=>
$node
); }
$self
->addNodes(
$node
,
@children
); }
else
{
Fatal(
'unexpected'
,
$root
,
undef
,
"Dont know how to use '$root' as document element"
); }
$$self
{document}->setURI(URI::file->new(
$self
->getDestination));
return
$self
; }
our
@MonthNames
= (
qw( January February March April May June
July August September October November December)
);
sub
addDate {
my
(
$self
,
$fromdoc
) =
@_
;
if
(!
$self
->findnodes(
'ltx:date'
,
$self
->getDocumentElement)) {
my
@dates
;
if
(
$fromdoc
&& (
@dates
=
$fromdoc
->findnodes(
'ltx:date'
,
$fromdoc
->getDocumentElement))) {
$self
->addNodes(
$self
->getDocumentElement,
@dates
); } }
return
; }
sub
getDocument {
my
(
$self
) =
@_
;
return
$$self
{document}; }
sub
getDocumentElement {
my
(
$self
) =
@_
;
return
$$self
{document}->documentElement; }
sub
getSource {
my
(
$self
) =
@_
;
return
$$self
{source}; }
sub
getSourceDirectory {
my
(
$self
) =
@_
;
return
$$self
{sourceDirectory} ||
'.'
; }
sub
getSearchPaths {
my
(
$self
) =
@_
;
return
@{
$$self
{searchpaths} }; }
sub
getDestination {
my
(
$self
) =
@_
;
return
$$self
{destination}; }
sub
getDestinationDirectory {
my
(
$self
) =
@_
;
return
$$self
{destinationDirectory}; }
sub
getSiteDirectory {
my
(
$self
) =
@_
;
return
$$self
{siteDirectory}; }
sub
siteRelativePathname {
my
(
$self
,
$pathname
) =
@_
;
return
(
defined
$pathname
? pathname_relative(
$pathname
,
$$self
{siteDirectory}) :
undef
); }
sub
siteRelativeDestination {
my
(
$self
) =
@_
;
return
(
defined
$$self
{destination}
? pathname_relative(
$$self
{destination},
$$self
{siteDirectory})
:
undef
); }
sub
getParentDocument {
my
(
$self
) =
@_
;
return
$$self
{parentDocument}; }
sub
getAncestorDocument {
my
(
$self
) =
@_
;
my
(
$doc
,
$d
) =
$self
;
while
(
$d
=
$$doc
{parentDocument}) {
$doc
=
$d
; }
return
$doc
; }
sub
toString {
my
(
$self
) =
@_
;
return
$$self
{document}->toString(1); }
sub
getDestinationExtension {
my
(
$self
) =
@_
;
return
(
$$self
{destination} =~ /\.([^\.\/]*)$/ ? $1 :
undef
); }
sub
checkDestination {
my
(
$self
,
$reldest
) =
@_
;
my
$dest
= pathname_absolute(
$reldest
,
$self
->getDestinationDirectory);
if
(
my
$destdir
= pathname_directory(
$dest
)) {
pathname_mkdir(
$destdir
)
or
return
Fatal(
"I/O"
,
$destdir
,
undef
,
"Could not create directory $destdir for $reldest: $!"
); }
return
$dest
; }
sub
stringify {
my
(
$self
) =
@_
;
return
'Post::Document['
.
$self
->siteRelativeDestination .
']'
; }
sub
getLocator {
my
(
$self
) =
@_
;
return
$$self
{source}; }
sub
validate {
my
(
$self
) =
@_
;
my
$schema
;
foreach
my
$pi
(@{
$$self
{processingInstructions} }) {
if
(
$pi
=~ /^\s
*RelaxNGSchema
\s*=\s*([\"\'])(.*?)\1\s*$/) {
$schema
= $2; } }
if
(
$schema
) {
my
$rng
= LaTeXML::Common::XML::RelaxNG->new(
$schema
,
searchpaths
=> [
$self
->getSearchPaths]);
Error(
'I/O'
,
$schema
,
undef
,
"Failed to load RelaxNG schema $schema"
.
"Response was: $@"
)
unless
$rng
;
my
$v
=
eval
{
local
$LaTeXML::IGNORE_ERRORS
= 1;
$rng
->validate(
$$self
{document}); };
Error(
"malformed"
,
'document'
,
undef
,
"Document fails RelaxNG validation ("
.
$schema
.
")"
,
"Validation reports: "
. $@,
if
$@ || !
defined
$v
; }
elsif
(
my
$decldtd
=
$$self
{document}->internalSubset) {
my
$dtd
= XML::LibXML::Dtd->new(
$decldtd
->publicId,
$decldtd
->systemId);
if
(!
$dtd
) {
Error(
"I/O"
,
$decldtd
->publicId,
undef
,
"Failed to load DTD "
.
$decldtd
->publicId .
" at "
.
$decldtd
->systemId,
"skipping validation"
); }
else
{
my
$v
=
eval
{
local
$LaTeXML::IGNORE_ERRORS
= 1;
$$self
{document}->validate(
$dtd
); };
Error(
"malformed"
,
'document'
,
undef
,
"Document failed DTD validation ("
.
$decldtd
->systemId .
")"
,
"Validation reports: "
. $@)
if
$@ || !
defined
$v
; } }
else
{
Warn(
"expected"
,
'schema'
,
undef
,
"No Schema or DTD found for this document"
); }
return
; }
sub
idcheck {
my
(
$self
) =
@_
;
my
%idcache
= ();
my
%dups
= ();
my
%missing
= ();
foreach
my
$node
(
$self
->findnodes(
"//*[\@xml:id]"
)) {
my
$id
=
$node
->getAttribute(
'xml:id'
);
$dups
{
$id
} = 1
if
$idcache
{
$id
};
$idcache
{
$id
} = 1; }
foreach
my
$id
(
keys
%{
$$self
{idcache} }) {
$missing
{
$id
} = 1
unless
$idcache
{
$id
}; }
Warn(
"unexpected"
,
'ids'
,
undef
,
"IDs were duplicated in cache for "
.
$self
->siteRelativeDestination,
join
(
','
,
keys
%dups
))
if
keys
%dups
;
Warn(
"expected"
,
'ids'
,
undef
,
"IDs were cached for "
.
$self
->siteRelativeDestination
.
" but not in document"
,
join
(
','
,
keys
%missing
))
if
keys
%missing
;
return
; }
sub
findnodes {
my
(
$self
,
$path
,
$node
) =
@_
;
return
$XPATH
->findnodes(
$path
,
$node
||
$$self
{document}); }
sub
findnode {
my
(
$self
,
$path
,
$node
) =
@_
;
my
(
$first
) =
$XPATH
->findnodes(
$path
,
$node
||
$$self
{document});
return
$first
; }
sub
findvalue {
my
(
$self
,
$path
,
$node
) =
@_
;
return
$XPATH
->findvalue(
$path
,
$node
||
$$self
{document}); }
sub
addNamespace {
my
(
$self
,
$nsuri
,
$prefix
) =
@_
;
if
(!
$$self
{namespaces}{
$prefix
} || (
$$self
{namespaces}{
$prefix
} ne
$nsuri
)
|| ((
$self
->getDocumentElement->lookupNamespacePrefix(
$nsuri
) ||
''
) ne
$prefix
)) {
$$self
{namespaces}{
$prefix
} =
$nsuri
;
$$self
{namespaceURIs}{
$nsuri
} =
$prefix
;
$XPATH
->registerNS(
$prefix
=>
$nsuri
);
$self
->getDocumentElement->setNamespace(
$nsuri
,
$prefix
, 0); }
return
; }
sub
getQName {
my
(
$self
,
$node
) =
@_
;
if
(
ref
$node
eq
'ARRAY'
) {
return
$$node
[0]; }
elsif
(
ref
$node
eq
'XML::LibXML::Element'
) {
my
$nsuri
=
$node
->namespaceURI;
if
(!
$nsuri
) {
if
(
$node
->nodeType == XML_ELEMENT_NODE) {
return
$node
->localname; }
else
{
return
; } }
elsif
(
my
$prefix
=
$$self
{namespaceURIs}{
$nsuri
}) {
return
$prefix
.
":"
.
$node
->localname; }
else
{
my
$prefix
=
"_ns"
. (1 +
scalar
(
grep
{ /^_ns\d+$/ }
keys
%{
$$self
{namespaces} }));
$$self
{namespaces}{
$prefix
} =
$nsuri
;
$$self
{namespaceURIs}{
$nsuri
} =
$prefix
;
return
$prefix
.
":"
.
$node
->localname; } }
else
{
return
; } }
sub
addNodes {
no
warnings
'recursion'
;
my
(
$self
,
$node
,
@data
) =
@_
;
foreach
my
$child
(
@data
) {
if
(
ref
$child
eq
'ARRAY'
) {
my
(
$tag
,
$attributes
,
@children
) =
@$child
;
if
(
$tag
eq
'_Fragment_'
) {
my
$indent
;
if
(
my
$pre
=
$node
->previousSibling) {
if
((
$pre
->nodeType == XML_TEXT_NODE) && ((
$pre
=
$pre
->textContent) =~ /^\s*$/)) {
$indent
=
$pre
.
' '
; } }
if
(
$indent
) {
$self
->addNodes(
$node
,
map
{ (
$indent
,
$_
) }
@children
); }
else
{
$self
->addNodes(
$node
,
@children
); } }
else
{
my
(
$prefix
,
$localname
) =
$tag
=~ /^(.*):(.*)$/;
my
$nsuri
=
$prefix
&&
$$self
{namespaces}{
$prefix
};
Warn(
'expected'
,
'namespace'
,
undef
,
"No namespace on '$tag'"
)
unless
$nsuri
;
my
$new
;
if
(
ref
$node
eq
'LibXML::XML::Document'
) {
$new
=
$node
->createElementNS(
$nsuri
,
$localname
);
$node
->setDocumentElement(
$new
); }
else
{
$new
=
$node
->addNewChild(
$nsuri
,
$localname
); }
if
(
$attributes
) {
foreach
my
$key
(
sort
keys
%$attributes
) {
next
unless
defined
$$attributes
{
$key
};
next
if
$key
=~ /^_/;
my
(
$attrprefix
,
$attrname
) =
$key
=~ /^(.*):(.*)$/;
my
$value
=
$$attributes
{
$key
};
if
(
$key
eq
'xml:id'
) {
if
(
defined
$$self
{idcache}{
$value
}) {
my
$newid
=
$self
->uniquifyID(
$value
);
Info(
'unexpected'
,
'duplicate_id'
,
undef
,
"Duplicated id=$value using $newid "
. (
$$self
{destination} ||
''
));
$value
=
$newid
; }
$self
->recordID(
$value
=>
$new
);
$new
->setAttribute(
$key
,
$value
); }
elsif
(
$attrprefix
&& (
$attrprefix
ne
'xml'
)) {
my
$attrnsuri
=
$attrprefix
&&
$$self
{namespaces}{
$attrprefix
};
$new
->setAttributeNS(
$attrnsuri
,
$key
,
$$attributes
{
$key
}); }
else
{
$new
->setAttribute(
$key
,
$$attributes
{
$key
}); } } }
$self
->addNodes(
$new
,
@children
); } }
elsif
((
ref
$child
) =~ /^XML::LibXML::/) {
my
$type
=
$child
->nodeType;
if
(
$type
== XML_ELEMENT_NODE) {
my
$nsuri
=
$child
->namespaceURI;
my
$localname
=
$child
->localname;
my
$new
;
if
(
ref
$node
eq
'LibXML::XML::Document'
) {
$new
=
$node
->createElementNS(
$nsuri
,
$localname
);
$node
->setDocumentElement(
$new
); }
else
{
$new
=
$node
->addNewChild(
$nsuri
,
$localname
); }
foreach
my
$attr
(
$child
->attributes) {
my
$atype
=
$attr
->nodeType;
if
(
$atype
== XML_ATTRIBUTE_NODE) {
my
$key
=
$attr
->nodeName;
if
(
$key
=~ /^_/) { }
elsif
(
$key
eq
'xml:id'
) {
my
$value
=
$attr
->getValue;
my
$old
;
if
((
defined
(
$old
=
$$self
{idcache}{
$value
}))
&& !
$old
->isSameNode(
$child
)) {
my
$newid
=
$self
->uniquifyID(
$value
);
Info(
'unexpected'
,
'duplicate_id'
,
undef
,
"Duplicated id=$value using $newid "
. (
$$self
{destination} ||
''
));
$value
=
$newid
; }
$self
->recordID(
$value
=>
$new
);
$new
->setAttribute(
$key
,
$value
); }
elsif
(
my
$ns
=
$attr
->namespaceURI) {
$new
->setAttributeNS(
$ns
,
$attr
->name,
$attr
->getValue); }
else
{
$new
->setAttribute(
$attr
->localname,
$attr
->getValue); } }
}
$self
->addNodes(
$new
,
$child
->childNodes); }
elsif
(
$type
== XML_DOCUMENT_FRAG_NODE) {
$self
->addNodes(
$node
,
$child
->childNodes); }
elsif
(
$type
== XML_TEXT_NODE) {
$node
->appendTextNode(
$child
->textContent); }
}
elsif
(
ref
$child
) {
Warn(
'misdefined'
,
$child
,
undef
,
"Dont know how to add $child to $node; ignoring"
); }
elsif
(
defined
$child
) {
$node
->appendTextNode(
$child
); } }
return
; }
sub
removeNodes {
my
(
$self
,
@nodes
) =
@_
;
foreach
my
$node
(
@nodes
) {
my
$ref
=
ref
$node
;
if
(!
$ref
) { }
elsif
(
$ref
eq
'ARRAY'
) {
my
(
$t
,
$a
,
@n
) =
@$node
;
if
(
my
$id
=
$$a
{
'xml:id'
}) {
if
(
$$self
{idcache}{
$id
}) {
delete
$$self
{idcache}{
$id
}; } }
$self
->removeNodes(
@n
); }
elsif
(
$ref
=~ /^XML::LibXML::/) {
if
(
$node
->nodeType == XML_ELEMENT_NODE) {
foreach
my
$idd
(
$self
->findnodes(
"descendant-or-self::*[\@xml:id]"
,
$node
)) {
my
$id
=
$idd
->getAttribute(
'xml:id'
);
if
(
$$self
{idcache}{
$id
}) {
delete
$$self
{idcache}{
$id
}; } } }
$node
->unlinkNode; } }
return
; }
sub
preremoveNodes {
my
(
$self
,
@nodes
) =
@_
;
foreach
my
$node
(
@nodes
) {
my
$ref
=
ref
$node
;
if
(!
$ref
) { }
elsif
(
$ref
eq
'ARRAY'
) {
my
(
$t
,
$a
,
@n
) =
@$node
;
if
(
my
$id
=
$$a
{
'xml:id'
}) {
$$self
{idcache_reusable}{
$id
} = 1; }
$self
->preremoveNodes(
@n
); }
elsif
(
$ref
=~ /^XML::LibXML::/) {
if
(
$node
->nodeType == XML_ELEMENT_NODE) {
foreach
my
$idd
(
$self
->findnodes(
"descendant-or-self::*[\@xml:id]"
,
$node
)) {
my
$id
=
$idd
->getAttribute(
'xml:id'
);
$$self
{idcache_reusable}{
$id
} = 1; } } } }
return
; }
sub
removeBlankNodes {
my
(
$self
,
$node
) =
@_
;
my
$n
= 0;
foreach
my
$child
(
$node
->childNodes) {
if
((
$child
->nodeType == XML_TEXT_NODE) && (
$child
->textContent =~ /^\s*$/)) {
$node
->removeChild(
$child
);
$n
++; } }
return
$n
; }
sub
replaceNode {
my
(
$self
,
$node
,
@replacements
) =
@_
;
my
(
$parent
,
$following
) = (
$node
->parentNode,
undef
);
my
@save
= ();
while
((
$following
=
$parent
->lastChild) && (
$$following
!=
$$node
)) {
unshift
(
@save
,
$parent
->removeChild(
$following
)); }
$self
->removeNodes(
$node
);
$self
->addNodes(
$parent
,
@replacements
);
map
{
$parent
->appendChild(
$_
) }
@save
;
return
; }
sub
prependNodes {
my
(
$self
,
$node
,
@nodes
) =
@_
;
my
@save
= ();
while
(
my
$last
=
$node
->lastChild) {
unshift
(
@save
,
$node
->removeChild(
$last
)); }
$self
->addNodes(
$node
,
@nodes
);
map
{
$node
->appendChild(
$_
) }
@save
;
return
; }
sub
cloneNode {
my
(
$self
,
$node
,
$idsuffix
,
%options
) =
@_
;
return
$node
unless
ref
$node
;
return
$node
if
ref
$node
eq
'ARRAY'
;
my
$copy
=
$node
->cloneNode(1);
my
$nocache
=
$options
{nocache};
my
%idmap
= ();
foreach
my
$n
(
$self
->findnodes(
'descendant-or-self::*[@xml:id]'
,
$copy
)) {
my
$id
=
$n
->getAttribute(
'xml:id'
);
my
$newid
=
$self
->uniquifyID(
$id
,
$idsuffix
);
$idmap
{
$id
} =
$newid
;
$self
->recordID(
$newid
=>
$n
)
unless
$nocache
;
$n
->setAttribute(
'xml:id'
=>
$newid
);
if
(
my
$fragid
=
$n
->getAttribute(
'fragid'
)) {
$n
->setAttribute(
fragid
=>
substr
(
$newid
,
length
(
$id
) -
length
(
$fragid
))); } }
foreach
my
$n
(
$self
->findnodes(
'descendant-or-self::*[@idref]'
,
$copy
)) {
if
(
my
$id
=
$idmap
{
$n
->getAttribute(
'idref'
) }) {
$n
->setAttribute(
idref
=>
$id
); } }
foreach
my
$n
(
$self
->findnodes(
'descendant-or-self::*[@labels]'
,
$copy
)) {
$n
->removeAttribute(
'labels'
); }
return
$copy
; }
sub
cloneNodes {
my
(
$self
,
@nodes
) =
@_
;
return
map
{
$self
->cloneNode(
$_
) }
@nodes
; }
sub
addSSValues {
my
(
$self
,
$node
,
$key
,
$values
) =
@_
;
$values
=
$values
->toAttribute
if
ref
$values
;
if
((
defined
$values
) && (
$values
ne
''
)) {
my
@values
=
split
(/\s/,
$values
);
if
(
my
$oldvalues
=
$node
->getAttribute(
$key
)) {
my
@old
=
split
(/\s/,
$oldvalues
);
foreach
my
$new
(
@values
) {
push
(
@old
,
$new
)
unless
grep
{
$_
eq
$new
}
@old
; }
$node
->setAttribute(
$key
=>
join
(
' '
,
sort
@old
)); }
else
{
$node
->setAttribute(
$key
=>
join
(
' '
,
sort
@values
)); } }
return
; }
sub
addClass {
my
(
$self
,
$node
,
$class
) =
@_
;
return
$self
->addSSValues(
$node
,
class
=>
$class
); }
sub
markXMNodeVisibility {
my
(
$self
) =
@_
;
foreach
my
$math
(
$self
->findnodes(
'//ltx:XMath/*'
)) {
$self
->markXMNodeVisibility_aux(
$math
, 1, 1); }
return
; }
sub
markXMNodeVisibility_aux {
no
warnings
'recursion'
;
my
(
$self
,
$node
,
$cvis
,
$pvis
) =
@_
;
return
unless
$node
;
my
$qname
=
$self
->getQName(
$node
);
return
if
(!
$cvis
||
$node
->getAttribute(
'_cvis'
)) && (!
$pvis
||
$node
->getAttribute(
'_pvis'
));
$node
->setAttribute(
'_cvis'
=> 1)
if
$cvis
;
$node
->setAttribute(
'_pvis'
=> 1)
if
$pvis
;
if
(
$qname
eq
'ltx:XMDual'
) {
my
(
$c
,
$p
) = element_nodes(
$node
);
$self
->markXMNodeVisibility_aux(
$c
, 1, 0)
if
$cvis
;
$self
->markXMNodeVisibility_aux(
$p
, 0, 1)
if
$pvis
; }
elsif
(
$qname
eq
'ltx:XMRef'
) {
my
$id
=
$node
->getAttribute(
'idref'
);
$self
->markXMNodeVisibility_aux(
$self
->findNodeByID(
$id
),
$cvis
,
$pvis
); }
else
{
foreach
my
$child
(element_nodes(
$node
)) {
$self
->markXMNodeVisibility_aux(
$child
,
$cvis
,
$pvis
); } }
return
; }
sub
conjoin {
my
(
$self
,
$conjunction
,
@nodes
) =
@_
;
my
(
$comma
,
$and
) = (
$conjunction
,
$conjunction
);
(
$comma
,
$and
) =
@$conjunction
if
ref
$conjunction
;
my
$n
=
scalar
(
@nodes
);
if
(
$n
< 2) {
return
@nodes
; }
else
{
my
@foo
= ();
push
(
@foo
,
shift
(
@nodes
));
while
(
$nodes
[1]) {
push
(
@foo
,
$comma
,
shift
(
@nodes
)); }
push
(
@foo
,
$and
,
shift
(
@nodes
));
return
@foo
; } }
sub
initial {
my
(
$self
,
$string
,
$force
) =
@_
;
$string
= NFD(
$string
);
$string
=~ s/^\s+//gs;
$string
=~ s/^[^a-zA-Z]*//
if
$force
;
return
(
$string
=~ /^([a-zA-Z])/ ?
uc
($1) :
'*'
); }
sub
trimChildNodes {
my
(
$self
,
$node
) =
@_
;
if
(!
$node
) {
return
(); }
elsif
(!
ref
$node
) {
return
(
$node
); }
elsif
(
my
@children
=
$node
->childNodes) {
if
(
$children
[0] &&
$children
[0]->nodeType == XML_TEXT_NODE) {
my
$s
=
$children
[0]->data;
$s
=~ s/^\s+//;
if
(
$s
) {
$children
[0]->setData(
$s
); }
else
{
shift
(
@children
); } }
if
(
$children
[-1] &&
$children
[-1]->nodeType == XML_TEXT_NODE) {
my
$s
=
$children
[-1]->data;
$s
=~ s/\s+$//;
if
(
$s
) {
$children
[-1]->setData(
$s
); }
else
{
pop
(
@children
); } }
return
@children
; }
else
{
return
(); } }
sub
unisort {
my
(
$self
,
@keys
) =
@_
;
my
$lang
=
$self
->getDocumentElement->getAttribute(
'xml:lang'
) ||
'en'
;
return
$LaTeXML::POST
->getsorter(
$lang
)->
sort
(
@keys
); }
sub
addNavigation {
my
(
$self
,
$relation
,
$id
) =
@_
;
return
if
$self
->findnode(
'//ltx:navigation/ltx:ref[@rel="'
.
$relation
.
'"][@idref="'
.
$id
.
'"]'
);
my
$ref
= [
'ltx:ref'
, {
idref
=>
$id
,
rel
=>
$relation
,
show
=>
'toctitle'
}];
if
(
my
$nav
=
$self
->findnode(
'//ltx:navigation'
)) {
$self
->addNodes(
$nav
,
$ref
); }
else
{
$self
->addNodes(
$self
->getDocumentElement, [
'ltx:navigation'
, {},
$ref
]); }
return
; }
sub
recordID {
my
(
$self
,
$id
,
$node
) =
@_
;
$$self
{idcache}{
$id
} =
$node
;
delete
$$self
{idcache_reserve}{
$id
};
delete
$$self
{idcache_reusable}{
$id
};
return
; }
sub
findNodeByID {
my
(
$self
,
$id
) =
@_
;
my
$node
=
$$self
{idcache}{
$id
};
return
$$self
{idcache}{
$id
}; }
sub
realizeXMNode {
my
(
$self
,
$node
,
$branch
) =
@_
;
if
(
$branch
) {
while
(
$node
) {
my
$qname
=
$self
->getQName(
$node
);
if
(
$qname
eq
'ltx:XMRef'
) {
my
$id
=
$node
->getAttribute(
'idref'
);
if
(
my
$realnode
=
$self
->findNodeByID(
$id
)) {
$node
=
$realnode
; }
else
{
Error(
'expected'
,
'id'
,
undef
,
"Cannot find a node with xml:id='$id'"
);
return
; } }
elsif
(
$qname
eq
'ltx:XMDual'
) {
my
(
$content
,
$presentation
) = element_nodes(
$node
);
$node
= (
$branch
eq
'content'
?
$content
:
$presentation
); }
else
{
return
$node
; } } }
elsif
(
$self
->getQName(
$node
) eq
'ltx:XMRef'
) {
my
$id
=
$node
->getAttribute(
'idref'
);
if
(
my
$realnode
=
$self
->findNodeByID(
$id
)) {
return
$realnode
; }
else
{
Error(
'expected'
,
'id'
,
undef
,
"Cannot find a node with xml:id='$id'"
);
return
; } }
return
$node
; }
sub
uniquifyID {
my
(
$self
,
$baseid
,
$suffix
) =
@_
;
my
$id
=
$baseid
;
$id
= (
ref
$suffix
eq
'CODE'
?
&$suffix
(
$id
) :
$id
.
$suffix
)
if
defined
$suffix
;
my
$cachekey
=
$id
;
while
((
$$self
{idcache}{
$id
} ||
$$self
{idcache_reserve}{
$id
}) && !
$$self
{idcache_reusable}{
$id
}) {
$id
=
$baseid
. radix_alpha(++
$$self
{idcache_clashes}{
$cachekey
});
$id
= (
ref
$suffix
eq
'CODE'
?
&$suffix
(
$id
) :
$id
.
$suffix
)
if
defined
$suffix
; }
delete
$$self
{idcache_reusable}{
$id
};
$$self
{idcache_reserve}{
$id
} = 1;
return
$id
; }
sub
generateNodeID {
my
(
$self
,
$node
,
$prefix
,
$reusable
) =
@_
;
my
$id
=
$node
->getAttribute(
'xml:id'
);
return
$id
if
$id
;
my
(
$parent
,
$pid
,
$n
) = (
$node
->parentNode,
undef
,
undef
);
while
(
$parent
&& !(
$pid
=
$parent
->getAttribute(
'xml:id'
))) {
$parent
=
$parent
->parentNode; }
$pid
.=
'.'
if
$pid
;
for
(
$n
= 1 ; (
$id
=
$pid
.
$prefix
.
$n
)
&& (
$$self
{idcache}{
$id
} ||
$$self
{idcache_reserved}{
$id
}) ;
$n
++) { }
$node
->setAttribute(
'xml:id'
=>
$id
);
$$self
{idcache}{
$id
} =
$node
;
$$self
{idcache_reusable}{
$id
} =
$reusable
;
if
(
my
$fragid
=
$parent
&&
$parent
->getAttribute(
'fragid'
)) {
$node
->setAttribute(
fragid
=>
$fragid
.
'.'
.
$prefix
.
$n
); }
return
$id
; }
sub
adjust_latexml_doctype {
my
(
$self
,
@additions
) =
@_
;
my
$doc
=
$$self
{document};
if
(
my
$dtd
=
$doc
->internalSubset) {
if
(
$dtd
->toString
=~ /^<!DOCTYPE\s+(\w+)\s+PUBLIC\s+(\"|\')-\/\/NIST LaTeXML\/\/LaTeXML\s+([^\"]*)\2\s+(\"|\')([^\"]*)\4>$/) {
my
(
$root
,
$parts
,
$system
) = ($1, $3, $5);
my
(
$type
,
@addns
) =
split
(/ \+ /,
$parts
);
my
%addns
= ();
map
{
$addns
{
$_
} = 1 }
@addns
,
@additions
;
@addns
=
sort
keys
%addns
;
my
$publicid
=
join
(
' + '
,
"-//NIST LaTeXML//LaTeXML $type"
,
@addns
);
$doc
->removeInternalSubset;
$doc
->createInternalSubset(
$root
,
$publicid
,
$systemid
); } }
return
; }
sub
cacheLookup {
my
(
$self
,
$key
) =
@_
;
$self
->openCache;
$key
= Encode::encode_utf8(
$key
)
if
$key
;
return
$$self
{cache}{
$key
}; }
sub
cacheStore {
my
(
$self
,
$key
,
$value
) =
@_
;
$self
->openCache;
$key
= Encode::encode_utf8(
$key
)
if
$key
;
if
(
defined
$value
) {
$$self
{cache}{
$key
} =
$value
; }
else
{
delete
$$self
{cache}{
$key
}; }
return
; }
sub
openCache {
my
(
$self
) =
@_
;
if
(!
$$self
{cache}) {
$$self
{cache} = {};
my
$dbfile
=
$self
->checkDestination(
"LaTeXML.cache"
);
tie
%{
$$self
{cache} },
'DB_File'
,
$dbfile
, O_RDWR | O_CREAT
or
return
Fatal(
'internal'
,
'db'
,
undef
,
"Couldn't create DB cache for "
.
$self
->getDestination,
"Message was: "
. $!,
(-f
$dbfile
?
"\n(possibly incompatible db format?)"
:
''
));
}
return
; }
sub
closeCache {
my
(
$self
) =
@_
;
if
(
$$self
{cache}) {
untie
%{
$$self
{cache} };
$$self
{cache} =
undef
; }
return
; }
1;