our
@EXPORT
= (
qw(
&ReadAlignmentTemplate &MatrixTemplate)
);
sub
new {
my
(
$class
,
%data
) =
@_
;
my
$self
=
bless
{
%data
},
$class
;
$$self
{template} = LaTeXML::Core::Alignment::Template->new()
unless
$$self
{template};
$$self
{template} = parseAlignmentTemplate(
$$self
{template})
unless
ref
$$self
{template};
$$self
{rows} = [];
$$self
{current_column} = 0;
$$self
{current_row} =
undef
;
$$self
{properties} = {}
unless
$$self
{properties};
if
(
my
$attributes
=
$$self
{properties}{attributes}) {
$$self
{properties}{width} =
$$attributes
{width}
if
$$attributes
{width};
$$self
{properties}{height} =
$$attributes
{height}
if
$$attributes
{height};
$$self
{properties}{depth} =
$$attributes
{depth}
if
$$attributes
{depth}; }
return
$self
; }
sub
getTemplate {
my
(
$self
,
$template
) =
@_
;
return
$$self
{template}; }
sub
currentRow {
my
(
$self
) =
@_
;
return
$$self
{current_row}; }
sub
newRow {
my
(
$self
) =
@_
;
my
$row
=
$$self
{template}->clone;
$$self
{current_row} =
$row
;
$$self
{current_column} = 0;
push
(@{
$$self
{rows} },
$row
);
return
$row
; }
sub
removeRow {
my
(
$self
) =
@_
;
my
@rows
= @{
$$self
{rows} };
if
(
@rows
) {
my
$row
=
pop
(
@rows
);
$$self
{rows} = [
@rows
];
return
$row
; }
else
{
return
; } }
sub
prependRows {
my
(
$self
,
@rows
) =
@_
;
unshift
(@{
$$self
{rows} },
@rows
);
return
; }
sub
appendRows {
my
(
$self
,
@rows
) =
@_
;
push
(@{
$$self
{rows} },
@rows
);
return
; }
sub
rows {
my
(
$self
) =
@_
;
return
@{
$$self
{rows} }; }
sub
addLine {
my
(
$self
,
$border
,
@cols
) =
@_
;
my
$row
=
$$self
{current_row};
if
(
@cols
) {
foreach
my
$c
(
@cols
) {
my
$colspec
=
$row
->column(
$c
);
$$colspec
{border} .=
$border
; } }
else
{
foreach
my
$colspec
(@{
$$row
{columns} }) {
$$colspec
{border} .=
$border
; } }
return
; }
sub
nextColumn {
my
(
$self
) =
@_
;
return
unless
$$self
{current_row};
my
$colspec
=
$$self
{current_row}->column(++
$$self
{current_column});
if
(!
$colspec
) {
Error(
'unexpected'
,
'&'
,
$STATE
->getStomach->getGullet,
"Extra alignment tab '&'"
);
$$self
{current_row}->addColumn(
align
=>
'center'
);
$colspec
=
$$self
{current_row}->column(
$$self
{current_column}); }
return
$colspec
; }
sub
currentColumnNumber {
my
(
$self
) =
@_
;
return
$$self
{current_column}; }
sub
currentRowNumber {
my
(
$self
) =
@_
;
return
scalar
(@{
$$self
{rows} }); }
sub
currentColumn {
my
(
$self
) =
@_
;
return
$$self
{current_row} &&
$$self
{current_row}->column(
$$self
{current_column}); }
sub
getColumn {
my
(
$self
,
$n
) =
@_
;
return
$$self
{current_row} &&
$$self
{current_row}->column(
$n
); }
sub
addBeforeRow {
my
(
$self
,
@boxes
) =
@_
;
$$self
{current_row}{
before
} = [@{
$$self
{current_row}{
before
} || [] },
@boxes
];
return
; }
sub
addAfterRow {
my
(
$self
,
@boxes
) =
@_
;
$$self
{current_row}{
after
} = [@{
$$self
{current_row}{
after
} || [] },
@boxes
];
return
; }
sub
toString {
my
(
$self
) =
@_
;
return
"Alignment[]"
; }
sub
stringify {
my
(
$self
) =
@_
;
return
"Alignment[]"
; }
sub
revert {
my
(
$self
) =
@_
;
return
$self
->getBody->revert; }
sub
computeSize {
my
(
$self
,
%options
) =
@_
;
$self
->normalizeAlignment;
my
$props
=
$self
->getPropertiesRef;
my
@rowheights
= ();
my
@colwidths
= ();
my
$base
=
$STATE
->lookupDefinition(T_CS(
'\baselineskip'
))->valueOf->valueOf;
foreach
my
$row
(@{
$$self
{rows} }) {
my
@cols
= @{
$$row
{columns} };
my
$ncols
=
scalar
(
@cols
);
if
(
my
$short
=
$ncols
-
scalar
(
@colwidths
)) {
push
(
@colwidths
,
map
{ 0 } 1 ..
$short
); }
my
(
$rowh
,
$rowd
) = (
$base
* 0.7,
$base
* 0.3);
for
(
my
$i
= 0 ;
$i
<
$ncols
;
$i
++) {
my
$cell
=
$cols
[
$i
];
next
if
$$cell
{skipped};
next
unless
$$cell
{boxes};
my
(
$w
,
$h
,
$d
) =
$$cell
{boxes}->getSize(
align
=>
$$cell
{align},
width
=>
$$cell
{width},
vattach
=>
$$cell
{vattach});
if
((
$$cell
{colspan} || 1) == 1) {
$colwidths
[
$i
] = max(
$colwidths
[
$i
],
$w
->valueOf); }
else
{ }
if
((
$$cell
{rowspan} || 1) == 1) {
$rowh
= max(
$rowh
,
$h
->valueOf);
$rowd
= max(
$rowd
,
$d
->valueOf); }
else
{ }
}
push
(
@rowheights
,
$rowh
+
$rowd
+ 0.5 *
$base
); }
my
$ww
= Dimension(sum(
@colwidths
));
my
$hh
= Dimension(sum(
@rowheights
));
my
$dd
= Dimension(0);
$$props
{width} =
$ww
unless
defined
$$props
{width};
$$props
{height} =
$hh
unless
defined
$$props
{height};
$$props
{depth} =
$dd
unless
defined
$$props
{depth};
return
; }
sub
beAbsorbed {
my
(
$self
,
$document
) =
@_
;
my
$attr
=
$self
->getProperty(
'attributes'
);
my
$body
=
$self
->getBody;
my
$ismath
=
$$self
{isMath};
$self
->normalizeAlignment;
&{
$$self
{openContainer} }(
$document
, (
$attr
?
%$attr
: ()));
foreach
my
$row
(@{
$$self
{rows} }) {
&{
$$self
{openRow} }(
$document
,
'xml:id'
=>
$$row
{id},
refnum
=>
$$row
{refnum},
frefnum
=>
$$row
{frefnum},
rrefnum
=>
$$row
{rrefnum});
if
(
my
$before
=
$$row
{
before
}) {
map
{
$document
->absorb(
$_
) }
@$before
; }
foreach
my
$cell
(@{
$$row
{columns} }) {
next
if
$$cell
{skipped};
my
$border
=
join
(
' '
,
sort
(
map
{
split
(/ */,
$_
) }
$$cell
{border} ||
''
));
$border
=~ s/(.) \1/$1$1/g;
my
$empty
= !
$$cell
{boxes} || !
scalar
(
$$cell
{boxes}->unlist);
$$cell
{cell} = &{
$$self
{openColumn} }(
$document
,
align
=>
$$cell
{align},
width
=>
$$cell
{width},
vattach
=>
$$cell
{vattach},
((
$$cell
{colspan} || 1) != 1 ? (
colspan
=>
$$cell
{colspan}) : ()),
((
$$cell
{rowspan} || 1) != 1 ? (
rowspan
=>
$$cell
{rowspan}) : ()),
(
$border
? (
border
=>
$border
) : ()),
(
$$cell
{thead} ? (
thead
=>
join
(
' '
,
sort
keys
%{
$$cell
{thead} })) : ()));
if
(!
$empty
) {
local
$LaTeXML::BOX
=
$$cell
{boxes};
$document
->openElement(
'ltx:XMArg'
,
rule
=>
'Anything,'
)
if
$ismath
;
$document
->absorb(
$$cell
{boxes});
$document
->closeElement(
'ltx:XMArg'
)
if
$ismath
;
}
&{
$$self
{closeColumn} }(
$document
); }
if
(
my
$after
=
$$row
{
after
}) {
map
{
$document
->absorb(
$_
) }
@$after
; }
&{
$$self
{closeRow} }(
$document
); }
my
$node
= &{
$$self
{closeContainer} }(
$document
);
if
(!
$document
->findnodes(
"ancestor::ltx:tabular"
,
$node
)) {
my
$hashead
=
$document
->findnodes(
'descendant::ltx:td[@thead]'
,
$node
);
if
(
$self
->getProperty(
'guess_headers'
) && !
$hashead
) {
guess_alignment_headers(
$document
,
$node
,
$self
); }
elsif
(
$hashead
&& !
$body
->isMath) {
alignment_regroup_rows(
$document
,
$node
); } }
return
$node
; }
sub
normalizeAlignment {
my
(
$self
) =
@_
;
return
if
$$self
{normalized};
my
$ismath
=
$$self
{isMath};
my
$preserve
=
$$self
{isMath} ||
$self
->getProperty(
'preserve_structure'
);
my
@rows
= @{
$$self
{rows} };
for
(
my
$i
= 0 ;
$i
<
scalar
(
@rows
) ;
$i
++) {
my
@row
= @{
$rows
[
$i
]->{columns} };
for
(
my
$j
= 0 ;
$j
<
scalar
(
@row
) ;
$j
++) {
my
$col
=
$row
[
$j
];
my
(
$nc
,
$nr
);
if
((
$nc
=
$$col
{colspan} || 1) > 1) {
foreach
(
my
$jj
=
$j
+ 1 ;
$jj
<
$j
+
$nc
;
$jj
++) {
my
$ccol
=
$row
[
$jj
];
$$ccol
{skipped} = 1;
$$ccol
{colspanned} =
$j
;
if
(
my
$nr
=
$$ccol
{rowspan}) {
$$col
{rowspan} =
$nr
; } } }
if
((
$nr
=
$$col
{rowspan} || 1) > 1) {
my
$nc
=
$$col
{colspan} || 1;
for
(
my
$ii
=
$i
+ 1 ;
$ii
<
$i
+
$nr
;
$ii
++) {
if
(
my
$rrow
=
$rows
[
$ii
]) {
for
(
my
$jj
=
$j
;
$jj
<
$j
+
$nc
;
$jj
++) {
if
(
my
$ccol
=
$$rrow
{columns}[
$jj
]) {
$$ccol
{skipped} = 1;
$$ccol
{rowspanned} =
$i
; } } } }
if
(
my
$rrow
=
$rows
[
$i
+
$nr
- 1]) {
my
$sborder
=
''
;
for
(
my
$jj
=
$j
;
$jj
<
$j
+
$nc
;
$jj
++) {
if
(
my
$ccol
=
$$rrow
{columns}[
$jj
]) {
my
$border
=
$$ccol
{border} ||
''
;
$border
=~ s/[^bB]//g;
$sborder
=
$border
unless
$sborder
; } }
$$col
{border} .=
$sborder
if
$sborder
; }
} } }
my
@filtered
= ();
for
(
my
$i
= 0 ;
$i
<
scalar
(
@rows
) ;
$i
++) {
my
$row
=
$rows
[
$i
];
foreach
my
$col
(@{
$$row
{columns} }) {
$$col
{empty} = 1
unless
$$col
{boxes} &&
$$col
{boxes}->unlist; }
if
(
grep
{ !
$$_
{empty} } @{
$$row
{columns} }) {
push
(
@filtered
,
$row
); }
elsif
(
my
$next
=
$rows
[
$i
+ 1]) {
if
(
$preserve
) {
push
(
@filtered
,
$row
);
next
; }
my
$nc
=
scalar
(@{
$$row
{columns} });
for
(
my
$j
= 0 ;
$j
<
$nc
;
$j
++) {
my
$col
=
$$row
{columns}[
$j
];
if
(
defined
$$col
{rowspanned}) {
$rows
[
$$col
{rowspanned}]{columns}[
$j
]{rowspan}--; }
my
$border
=
$$col
{border} ||
''
;
$border
=~ s/[^tTbB]//g;
$border
=~ s/b/t/g;
$border
=~ s/B/T/g;
$$next
{columns}[
$j
]{border} .=
$border
; } }
else
{
my
$prev
=
$filtered
[-1];
my
$nc
=
scalar
(@{
$$row
{columns} });
for
(
my
$j
= 0 ;
$j
<
$nc
;
$j
++) {
my
$col
=
$$row
{columns}[
$j
];
if
(
defined
$$col
{rowspanned}) {
$rows
[
$$col
{rowspanned}]{columns}[
$j
]{rowspan}--; }
my
$border
=
$$col
{border} ||
''
;
$border
=~ s/[^tT]//g;
$border
=~ s/t/b/g;
$border
=~ s/T/B/g;
my
$ccol
=
$$prev
{columns}[
$j
];
if
(
defined
$$ccol
{rowspanned}) {
$ccol
=
$rows
[
$$ccol
{rowspanned}]{columns}[
$j
]; }
$$ccol
{border} .=
$border
; } }
}
@rows
=
@filtered
;
$$self
{rows} = [
@filtered
];
if
(!
$preserve
) {
my
$nc
= 0;
foreach
my
$row
(
@rows
) {
my
$n
=
scalar
(@{
$$row
{columns} });
$nc
=
$n
if
$n
>
$nc
; }
for
(
my
$j
=
$nc
- 1 ;
$j
>= 0 ;
$j
--) {
if
(!
grep
{ (
defined
$$_
{columns}[
$j
]) && !
$$_
{columns}[
$j
]{empty} }
@rows
) {
foreach
my
$row
(
@rows
) {
if
(
my
$col
=
$$row
{columns}[
$j
]) {
if
(
defined
$$col
{colspanned}) {
$$row
{columns}[
$$col
{colspanned}]{colspan}--; }
my
$border
=
$$col
{border} ||
''
;
if
(
$j
> 0) {
my
$prev
=
$$row
{columns}[
$j
- 1];
if
(
my
$jj
=
$$prev
{colspanned}) {
$prev
=
$$row
{columns}[
$jj
]; }
$border
=~ s/[^rRlL]//g;
$border
=~ s/l/r/g;
$border
=~ s/L/R/g;
$$prev
{border} .=
$border
;
if
(
my
@preserve
= preservedBoxes(
$$col
{boxes})) {
$$prev
{boxes} = LaTeXML::Core::List(
$$prev
{boxes}
? (
$$prev
{boxes}->unlist,
@preserve
) :
@preserve
); }
}
elsif
(
my
$next
=
$$row
{columns}[1]) {
my
$border
=
$$col
{border} ||
''
;
$border
=~ s/[^rRlL]//g;
$border
=~ s/r/l/g;
$border
=~ s/R/L/g;
$$next
{border} .=
$border
;
if
(
my
@preserve
= preservedBoxes(
$$col
{boxes})) {
$$next
{boxes} = LaTeXML::Core::List(
$$col
{boxes}
? (
@preserve
,
$$next
{boxes}->unlist) :
@preserve
); }
}
$$row
{columns} = [
grep
{
$_
ne
$col
} @{
$$row
{columns} }];
} } } }
}
$$self
{normalized} = 1;
return
; }
sub
preservedBoxes {
my
(
$boxes
) =
@_
;
return
(
$boxes
?
grep
{
$_
->getProperty(
'alignmentPreserve'
) }
$boxes
->unlist : ()); }
sub
ReadAlignmentTemplate {
my
(
$gullet
) =
@_
;
$gullet
->skipSpaces;
local
$LaTeXML::BUILD_TEMPLATE
=
LaTeXML::Core::Alignment::Template->new(
columns
=> [],
tokens
=> []);
my
@tokens
= (T_BEGIN);
my
$nopens
= 0;
while
(
my
$open
=
$gullet
->readToken) {
if
(
$open
->equals(T_BEGIN)) {
$nopens
++; }
else
{
$gullet
->unread(
$open
);
last
; } }
my
$defn
;
while
(
my
$op
=
$gullet
->readToken) {
if
(
$op
->equals(T_SPACE)) { }
elsif
(
$op
->equals(T_END)) {
while
(--
$nopens
&& (
$op
=
$gullet
->readToken)->equals(T_END)) { }
last
unless
$nopens
;
$gullet
->unread(
$op
); }
elsif
(
defined
(
$defn
=
$STATE
->lookupDefinition(T_CS(
'\NC@rewrite@'
. ToString(
$op
))))
&&
$defn
->isExpandable) {
my
@args
=
$defn
->readArguments(
$gullet
);
if
(
my
$exp
=
$defn
->doInvocation(
$gullet
,
@args
)) {
$gullet
->unread(@{
$exp
}); }
else
{
push
(
@tokens
,
$op
);
if
(
my
$param
=
$defn
->getParameters) {
push
(
@tokens
,
$param
->revertArguments(
@args
)); } } }
elsif
(
$op
->equals(T_BEGIN)) {
$gullet
->unread(
$gullet
->readBalanced->unlist); }
else
{
Warn(
'unexpected'
,
$op
,
$gullet
,
"Unrecognized tabular template '"
. Stringify(
$op
) .
"'"
); }
last
unless
$nopens
; }
push
(
@tokens
, T_END);
$LaTeXML::BUILD_TEMPLATE
->setReversion(
@tokens
);
return
$LaTeXML::BUILD_TEMPLATE
; }
sub
parseAlignmentTemplate {
my
(
$spec
) =
@_
;
return
$STATE
->getStomach->getGullet->readingFromMouth(LaTeXML::Core::Mouth->new(
"{"
.
$spec
.
"}"
),
sub
{
ReadAlignmentTemplate(
$_
[0]); }); }
sub
MatrixTemplate {
return
LaTeXML::Core::Alignment::Template->new(
repeated
=> [{
before
=> Tokens(T_CS(
'\hfil'
)),
after
=> Tokens(T_CS(
'\hfil'
)) }]); }
sub
guess_alignment_headers {
my
(
$document
,
$table
,
$alignment
) =
@_
;
return
if
$document
->findnodes(
"ancestor::ltx:tabular"
,
$table
);
my
$tag
=
$document
->getModel->getNodeQName(
$table
);
my
$x
;
print
STDERR
"\n"
. (
'='
x 50) .
"\nGuessing alignment headers for "
. ((
$x
=
$document
->findnode(
'ancestor-or-self::*[@xml:id]'
,
$table
)) ?
$x
->getAttribute(
'xml:id'
) :
$tag
) .
"\n"
if
$LaTeXML::Core::Alignment::DEBUG
;
my
$ismath
=
$tag
eq
'ltx:XMArray'
;
local
$LaTeXML::TR
= (
$ismath
?
'ltx:XMRow'
:
'ltx:tr'
);
local
$LaTeXML::TD
= (
$ismath
?
'ltx:XMCell'
:
'ltx:td'
);
my
$reversed
= 0;
my
@rows
= collect_alignment_rows(
$document
,
$table
,
$alignment
);
my
@cols
= ();
return
unless
@rows
;
for
(
my
$c
= 0 ;
$c
<
scalar
(@{
$rows
[0] }) ;
$c
++) {
push
(
@cols
, [
map
{
$$_
[
$c
] }
@rows
]); }
if
(alignment_characterize_lines(
$document
, 0, 0,
@rows
)) { }
alignment_characterize_lines(
$document
, 1, 0,
@cols
);
my
%n
= (
h
=> 0,
d
=> 0);
foreach
my
$r
(
@rows
) {
foreach
my
$c
(
@$r
) {
$n
{
$$c
{cell_type} }++; } }
print
STDERR
"$n{h} header, $n{d} data cells\n"
if
$LaTeXML::Core::Alignment::DEBUG
;
if
(
$n
{d} == 1) {
$n
{h} = 0;
foreach
my
$r
(
@rows
) {
foreach
my
$c
(
@$r
) {
$$c
{cell_type} =
'd'
;
$$c
{cell}->removeAttribute(
'thead'
)
if
$$c
{cell}; } } }
if
(!
$ismath
&& !
$reversed
) {
alignment_regroup_rows(
$document
,
$table
); }
if
(
$n
{h}) {
$document
->addClass(
$table
,
'ltx_guessed_headers'
); }
summarize_alignment([
@rows
], [
@cols
])
if
$LaTeXML::Core::Alignment::DEBUG
;
return
; }
sub
alignment_regroup_rows {
my
(
$document
,
$table
) =
@_
;
my
@rows
=
$document
->findnodes(
"ltx:tr"
,
$table
);
my
@heads
= ();
my
$maxreach
= 0;
while
(
@rows
) {
my
@cells
=
$document
->findnodes(
'ltx:td'
,
$rows
[0]);
last
if
scalar
(
grep
{ (!
$_
->getAttribute(
'thead'
)) }
@cells
);
push
(
@heads
,
shift
(
@rows
));
my
$line
=
scalar
(
@heads
);
$maxreach
= max(
$maxreach
,
map
{ (
$_
->getAttribute(
'rowspan'
) || 0) +
$line
}
@cells
); }
if
(
$maxreach
>
scalar
(
@heads
)) {
unshift
(
@rows
,
@heads
);
@heads
= (); }
my
@foots
= ();
while
(
@rows
) {
my
@cells
=
$document
->findnodes(
'ltx:td'
,
$rows
[-1]);
last
if
scalar
(
grep
{ (!
$_
->getAttribute(
'thead'
)) }
@cells
);
push
(
@foots
,
pop
(
@rows
)); }
$document
->wrapNodes(
'ltx:thead'
,
@heads
)
if
@heads
;
$document
->wrapNodes(
'ltx:tbody'
,
@rows
)
if
@rows
;
$document
->wrapNodes(
'ltx:tfoot'
,
@foots
)
if
@foots
;
return
; }
my
%ALIGNMENT_CODE
= (
right
=>
'r'
,
left
=>
'l'
,
center
=>
'c'
,
justify
=>
'p'
);
sub
collect_alignment_rows {
my
(
$document
,
$table
,
$alignment
) =
@_
;
my
@arows
= @{
$$alignment
{rows} };
my
$nrows
=
scalar
(
@arows
);
my
$ncols
= 0;
foreach
my
$arow
(
@arows
) {
my
$n
=
scalar
(@{
$$arow
{columns} });
$ncols
=
$n
if
$n
>
$ncols
; }
my
@rows
= ();
my
(
$h
,
$v
) = (0, 0);
foreach
my
$arow
(
@arows
) {
push
(
@rows
, []);
my
@cols
= @{
$$arow
{columns} };
foreach
my
$col
(
@cols
) {
push
(@{
$rows
[-1] },
$col
);
$$col
{cell_type} =
'd'
;
$$col
{content_class} = ((
$$col
{align} ||
''
) eq
'justify'
?
'mx'
: (
$$col
{cell} ? classify_alignment_cell(
$document
,
$$col
{cell}) :
'?'
));
$$col
{content_length} = (
$$col
{content_class} eq
'g'
? 1000
: (
$$col
{cell} ?
length
(
$$col
{cell}->textContent) : 0));
my
%border
= (
t
=> 0,
r
=> 0,
b
=> 0,
l
=> 0);
map
{
$border
{
$_
}++ }
split
(/ */,
$$col
{border} ||
''
);
$h
= 1
if
$border
{t} ||
$border
{b};
$v
= 1
if
$border
{r} ||
$border
{l};
map
{
$$col
{
$_
} =
$border
{
$_
} }
keys
%border
; }
for
(
my
$c
=
scalar
(
@cols
) ;
$c
<
$ncols
;
$c
++) {
my
$col
= {};
push
(@{
$rows
[-1] },
$col
);
$$col
{align} =
'c'
;
$$col
{cell_type} =
'd'
;
$$col
{content_class} =
'_'
;
$$col
{content_length} = 0;
map
{
$$col
{
$_
} = 0 }
qw(t r b l)
; }
}
for
(
my
$r
= 0 ;
$r
<
$nrows
;
$r
++) {
for
(
my
$c
= 0 ;
$c
<
$ncols
;
$c
++) {
my
$rs
=
$rows
[
$r
][
$c
]{rowspan} || 1;
my
$cs
=
$rows
[
$r
][
$c
]{colspan} || 1;
my
$ca
=
$rows
[
$r
][
$c
]{align};
my
$cc
=
$rows
[
$r
][
$c
]{content_class};
my
$cl
=
$rows
[
$r
][
$c
]{content_length};
my
$rb
=
$rows
[
$r
][
$c
]{r};
$rows
[
$r
][
$c
]{r} = 0;
my
$bb
=
$rows
[
$r
][
$c
]{b};
$rows
[
$r
][
$c
]{b} = 0;
for
(
my
$sc
= 1 ;
$sc
<
$cs
;
$sc
++) {
$rows
[
$r
][
$c
+
$sc
]{align} =
$ca
;
$rows
[
$r
][
$c
+
$sc
]{content_class} =
$cc
;
$rows
[
$r
][
$c
+
$sc
]{content_length} =
$cl
; }
for
(
my
$sr
= 1 ;
$sr
<
$rs
;
$sr
++) {
for
(
my
$sc
= 0 ;
$sc
<
$cs
;
$sc
++) {
$rows
[
$r
+
$sr
][
$c
+
$sc
]{align} =
$ca
;
$rows
[
$r
+
$sr
][
$c
+
$sc
]{content_class} =
$cc
;
$rows
[
$r
+
$sr
][
$c
+
$sc
]{content_length} =
$cl
; } }
for
(
my
$sr
= 0 ;
$sr
<
$rs
;
$sr
++) {
$rows
[
$r
+
$sr
][
$c
+
$cs
- 1]{r} =
$rb
; }
for
(
my
$sc
= 0 ;
$sc
<
$cs
;
$sc
++) {
$rows
[
$r
+
$rs
- 1][
$c
+
$sc
]{b} =
$bb
; }
} }
for
(
my
$r
= 0 ;
$r
<
$nrows
;
$r
++) {
$rows
[
$r
][0]{l} =
$v
;
$rows
[
$r
][0]{r} =
$rows
[
$r
][1]{l}
if
(
$ncols
> 1) &&
$rows
[
$r
][1]{l};
$rows
[
$r
][
$ncols
- 1]{l} =
$rows
[
$r
][
$ncols
- 2]{r}
if
(
$ncols
> 1) &&
$rows
[
$r
][
$ncols
- 2]{r};
$rows
[
$r
][
$ncols
- 1]{r} =
$v
; }
for
(
my
$c
= 0 ;
$c
<
$ncols
;
$c
++) {
$rows
[0][
$c
]{t} =
$h
;
$rows
[0][
$c
]{b} =
$rows
[1][
$c
]{t}
if
(
$nrows
> 1) &&
$rows
[1][
$c
]{t};
$rows
[
$nrows
- 1][
$c
]{t} =
$rows
[
$nrows
- 2][
$c
]{b}
if
(
$nrows
> 1) &&
$rows
[
$nrows
- 2][
$c
]{b};
$rows
[
$nrows
- 1][
$c
]{b} =
$h
; }
for
(
my
$r
= 1 ;
$r
<
$nrows
- 1 ;
$r
++) {
for
(
my
$c
= 1 ;
$c
<
$ncols
- 1 ;
$c
++) {
$rows
[
$r
][
$c
]{t} =
$rows
[
$r
- 1][
$c
]{b}
if
$rows
[
$r
- 1][
$c
]{b};
$rows
[
$r
][
$c
]{b} =
$rows
[
$r
+ 1][
$c
]{t}
if
$rows
[
$r
+ 1][
$c
]{t};
$rows
[
$r
][
$c
]{l} =
$rows
[
$r
][
$c
- 1]{r}
if
$rows
[
$r
][
$c
- 1]{r};
$rows
[
$r
][
$c
]{r} =
$rows
[
$r
][
$c
+ 1]{l}
if
$rows
[
$r
][
$c
+ 1]{l}; } }
if
(
$LaTeXML::Core::Alignment::DEBUG
) {
print
STDERR
"\nCell characterizations:\n"
;
for
(
my
$r
= 0 ;
$r
<
$nrows
;
$r
++) {
for
(
my
$c
= 0 ;
$c
<
$ncols
;
$c
++) {
my
$col
=
$rows
[
$r
][
$c
];
print
STDERR
"[$r,$c]=>"
. (
$$col
{cell_type} ||
'?'
)
. (
$$col
{align} ?
$ALIGNMENT_CODE
{
$$col
{align} } :
' '
)
. (
$$col
{content_class} ||
'?'
)
.
' '
.
$$col
{content_length}
.
' '
.
$$col
{border} .
"=>"
.
join
(
''
,
grep
{
$$col
{
$_
} }
qw(t r b l)
)
. ((
$$col
{rowspan} || 1) > 1 ?
" rowspan="
.
$$col
{rowspan} :
''
)
. ((
$$col
{colspan} || 1) > 1 ?
" colspan="
.
$$col
{colspan} :
''
)
.
"\n"
; } } }
return
@rows
; }
sub
classify_alignment_cell {
my
(
$document
,
$xcell
) =
@_
;
my
$content
=
$xcell
->textContent;
my
$class
=
''
;
if
(
$content
=~ /^[\s\d]+$/) {
$class
=
'i'
; }
else
{
my
@nodes
=
$xcell
->childNodes;
while
(
@nodes
) {
my
$ch
=
shift
(
@nodes
);
my
$chtype
=
$ch
->nodeType;
if
(
$chtype
== XML_TEXT_NODE) {
my
$text
=
$ch
->textContent;
$class
.=
't'
unless
$text
=~ /^\s*$/ || ((
$class
eq
'm'
) && (
$text
=~ /^\s*[\.,;]\s*$/)); }
elsif
(
$chtype
== XML_ELEMENT_NODE) {
my
$chtag
=
$document
->getModel->getNodeQName(
$ch
);
if
(
$chtag
eq
'ltx:text'
) {
$class
.=
't'
unless
$class
eq
't'
; }
elsif
(
$chtag
eq
'ltx:graphics'
) {
$class
.=
'g'
unless
$class
eq
'g'
; }
elsif
(
$chtag
eq
'ltx:Math'
) {
$class
.=
'm'
unless
$class
eq
'm'
; }
elsif
(
$chtag
eq
'ltx:XMText'
) {
$class
.=
't'
unless
$class
eq
't'
; }
elsif
(
$chtag
eq
'ltx:XMArg'
) {
unshift
(
@nodes
,
$ch
->childNodes); }
elsif
(
$chtag
=~ /^ltx:XM/) {
$class
.=
'm'
unless
$class
eq
'm'
; }
else
{
$class
.=
'?'
unless
$class
; }
} } }
$class
=
'mx'
if
$class
&& ((
$class
=~ /^((m|i)t)+(m|i)?$/) || (
$class
=~ /^(t(m|i))+t?$/));
return
$class
||
'_'
; }
my
$MIN_ALIGNMENT_DATA_LINES
= 1;
my
$MAX_ALIGNMENT_HEADER_LINES
= 4;
my
@axisname
= (
'column'
,
'row'
);
sub
alignment_characterize_lines {
my
(
$document
,
$axis
,
$reversed
,
@lines
) =
@_
;
my
$n
=
scalar
(
@lines
);
return
if
$n
< 2;
local
@::TABLINES =
@lines
;
print
STDERR
"\nCharacterizing $n "
. (
$axis
?
"columns"
:
"rows"
) .
"\n "
if
$LaTeXML::Core::Alignment::DEBUG
;
my
(
$diffhi
,
$difflo
,
$diffavg
) = (0, 99999999, 0);
for
(
my
$l
= 0 ;
$l
<
$n
- 1 ;
$l
++) {
my
$d
= alignment_compare(
$axis
, 1,
$reversed
,
$l
,
$l
+ 1);
$diffavg
+=
$d
;
$diffhi
=
$d
if
$d
>
$diffhi
;
$difflo
=
$d
if
$d
<
$difflo
; }
$diffavg
=
$diffavg
/ (
$n
- 1);
if
(
$diffhi
< 0.05) {
print
STDERR
"Lines are almost identical => Fail\n"
if
$LaTeXML::Core::Alignment::DEBUG
;
return
; }
if
((
$n
> 2) && ((
$diffhi
-
$difflo
) <
$diffhi
* 0.5)) {
print
STDERR
"Differences between lines are almost identical => Fail\n"
if
$LaTeXML::Core::Alignment::DEBUG
;
return
; }
local
$::TAB_THRESHOLD =
$difflo
+ 0.3 * (
$diffhi
-
$difflo
);
local
$::TAB_AXIS =
$axis
;
print
STDERR
"\nDifferences $difflo -- $diffhi => threshold = $::TAB_THRESHOLD\n"
if
$LaTeXML::Core::Alignment::DEBUG
;
print
STDERR
"Scanning for headers\n "
if
$LaTeXML::Core::Alignment::DEBUG
;
my
$diff
;
my
(
$minh
,
$maxh
) = (1, 1);
while
((
$diff
= alignment_compare(
$axis
, 1,
$reversed
,
$maxh
- 1,
$maxh
)) < $::TAB_THRESHOLD) {
$maxh
++; }
return
if
$maxh
>
$MAX_ALIGNMENT_HEADER_LINES
;
while
(alignment_compare(
$axis
, 1,
$reversed
,
$maxh
,
$maxh
+ 1) > $::TAB_THRESHOLD) {
$maxh
++; }
$maxh
=
$MAX_ALIGNMENT_HEADER_LINES
if
$maxh
>
$MAX_ALIGNMENT_HEADER_LINES
;
print
STDERR
"\nFound from $minh--$maxh potential headers\n"
if
$LaTeXML::Core::Alignment::DEBUG
;
my
$nn
=
scalar
(@{
$lines
[0] }) - 1;
for
(
my
$nh
=
$maxh
;
$nh
>=
$minh
;
$nh
--) {
if
(
my
@heads
= alignment_test_headers(
$nh
)) {
foreach
my
$h
(
@heads
) {
my
$i
= 0;
foreach
my
$cell
(@{
$lines
[
$h
] }) {
$$cell
{cell_type} =
'h'
;
if
(
my
$xcell
=
$$cell
{cell}) {
if
((
$$cell
{content_class} eq
'_'
)
&& (((
$i
== 0) && !
$$cell
{ (
$axis
== 0 ?
'l'
:
't'
) })
|| ((
$i
==
$nn
) && !
$$cell
{ (
$axis
== 0 ?
'r'
:
'b'
) }))) { }
else
{
$document
->addSSValues(
$$cell
{cell},
thead
=>
$axisname
[
$axis
]); } }
$i
++; } }
return
1; } }
return
; }
sub
alignment_test_headers {
my
(
$nhead
) =
@_
;
print
STDERR
"Testing $nhead headers\n"
if
$LaTeXML::Core::Alignment::DEBUG
;
my
(
$headlength
,
$datalength
) = (0, 0);
my
@heads
= (0 ..
$nhead
- 1);
$headlength
= alignment_max_content_length(
$headlength
, 0,
$nhead
- 1);
my
$nextline
=
$nhead
;
my
$nrep
=
scalar
(@::TABLINES) /
$nhead
;
if
((
$nhead
> 1) && (
$nrep
==
int
(
$nrep
))) {
print
STDERR
"Check for apparent header repeated $nrep times\n"
if
$LaTeXML::Core::Alignment::DEBUG
;
my
$matched
= 1;
for
(
my
$r
= 1 ;
$r
<
$nrep
;
$r
++) {
$matched
&&= alignment_match_head(0,
$r
*
$nhead
,
$nhead
); }
print
STDERR
"Repeated headers: "
. (
$matched
?
"Matched=> Fail"
:
"Nomatch => Succeed"
) .
"\n"
if
$LaTeXML::Core::Alignment::DEBUG
;
return
if
$matched
; }
my
$ndata
= alignment_skip_data(
$nextline
);
return
if
$ndata
<
$nhead
;
return
if
(
$ndata
<
$nhead
) && (
$ndata
< 2);
$datalength
= alignment_max_content_length(
$datalength
,
$nextline
,
$nextline
+
$ndata
- 1);
$nextline
+=
$ndata
;
my
$nd
;
while
(
$nextline
<
scalar
(@::TABLINES)) {
if
((
$ndata
> 1) && (
$nd
= alignment_match_data(
$nhead
,
$nextline
,
$ndata
))) {
$datalength
= alignment_max_content_length(
$datalength
,
$nextline
,
$nextline
+
$nd
- 1);
$nextline
+=
$nd
; }
elsif
(alignment_match_head(0,
$nextline
,
$nhead
)) {
push
(
@heads
,
$nextline
..
$nextline
+
$nhead
- 1);
$headlength
= alignment_max_content_length(
$headlength
,
$nextline
,
$nextline
+
$nhead
- 1);
$nextline
+=
$nhead
;
return
unless
(
$nd
= alignment_match_data(
$nhead
,
$nextline
,
$ndata
));
$datalength
= alignment_max_content_length(
$datalength
,
$nextline
,
$nextline
+
$nd
- 1);
$nextline
+=
$nd
; }
else
{
return
; } }
print
STDERR
"header content = $headlength; data content = $datalength\n"
if
$LaTeXML::Core::Alignment::DEBUG
;
if
((
$headlength
> 10) && (0.25 *
$headlength
>
$datalength
)) {
print
STDERR
"header content too much longer than data content\n"
if
$LaTeXML::Core::Alignment::DEBUG
;
return
; }
print
STDERR
"Succeeded with $nhead headers\n"
if
$LaTeXML::Core::Alignment::DEBUG
;
return
@heads
; }
sub
alignment_match_head {
my
(
$p1
,
$p2
,
$nhead
) =
@_
;
print
STDERR
"Try match $nhead header lines from $p1 to $p2\n "
if
$LaTeXML::Core::Alignment::DEBUG
;
my
$nh
= alignment_match_lines(
$p1
,
$p2
,
$nhead
);
my
$ok
=
$nhead
==
$nh
;
print
STDERR
"\nMatched $nh header lines => "
. (
$ok
?
"Succeed"
:
"Failed"
) .
"\n"
if
$LaTeXML::Core::Alignment::DEBUG
;
return
(
$ok
?
$nhead
: 0); }
sub
alignment_match_data {
my
(
$p1
,
$p2
,
$ndata
) =
@_
;
print
STDERR
"Try match $ndata data lines from $p1 to $p2\n "
if
$LaTeXML::Core::Alignment::DEBUG
;
my
$nd
= alignment_match_lines(
$p1
,
$p2
,
$ndata
);
my
$ok
= (
$nd
* 1.0) /
$ndata
> 0.66;
print
STDERR
"\nMatched $nd data lines => "
. (
$ok
?
"Succeed"
:
"Failed"
) .
"\n"
if
$LaTeXML::Core::Alignment::DEBUG
;
return
(
$ok
?
$nd
: 0); }
sub
alignment_match_lines {
my
(
$p1
,
$p2
,
$n
) =
@_
;
for
(
my
$i
= 0 ;
$i
<
$n
;
$i
++) {
return
$i
if
(
$p1
+
$i
>=
scalar
(@::TABLINES)) || (
$p2
+
$i
>=
scalar
(@::TABLINES))
|| alignment_compare($::TAB_AXIS, 0, 0,
$p1
+
$i
,
$p2
+
$i
) >= $::TAB_THRESHOLD; }
return
$n
; }
sub
alignment_skip_data {
my
(
$i
) =
@_
;
return
0
if
$i
>=
scalar
(@::TABLINES);
print
STDERR
"Scanning for data\n "
if
$LaTeXML::Core::Alignment::DEBUG
;
my
$n
= 1;
while
(
$i
+
$n
<
scalar
(@::TABLINES)) {
last
if
(alignment_compare($::TAB_AXIS, 1, 0,
$i
+
$n
- 1,
$i
+
$n
) >= $::TAB_THRESHOLD)
&& ((
$n
< 2)
|| (
scalar
(
grep
{
$$_
{content_class} eq
'_'
} @{ $::TABLINES[
$i
+
$n
] }) <= 0.4 *
scalar
($::TABLINES[0])));
$n
++; }
print
STDERR
"\nFound $n data lines at $i\n"
if
$LaTeXML::Core::Alignment::DEBUG
;
return
(
$n
>=
$MIN_ALIGNMENT_DATA_LINES
?
$n
: 0); }
sub
XXXalignment_max_content_length {
my
(
$length
,
$from
,
$to
) =
@_
;
foreach
my
$j
((
$from
..
$to
)) {
foreach
my
$cell
(@{ $::TABLINES[
$j
] }) {
$length
=
$$cell
{content_length}
if
$$cell
{content_length} && (
$$cell
{content_length} >
$length
); } }
return
$length
; }
sub
alignment_max_content_length {
my
(
$length
,
$from
,
$to
) =
@_
;
foreach
my
$j
((
$from
..
$to
)) {
my
$l
= 0;
foreach
my
$cell
(@{ $::TABLINES[
$j
] }) {
$l
+=
$$cell
{content_length}; }
$length
=
$l
if
$l
>
$length
; }
return
$length
; }
my
%cell_class_diff
= (
'_'
=> {
'_'
=> 0.0,
m
=> 0.05,
i
=> 0.05,
t
=> 0.05,
'?'
=> 0.05,
mx
=> 0.05 },
m
=> {
'_'
=> 0.05,
m
=> 0.0,
i
=> 0.1,
mx
=> 0.2 },
i
=> {
'_'
=> 0.05,
m
=> 0.1,
i
=> 0.0,
mx
=> 0.2 },
t
=> {
'_'
=> 0.05,
t
=> 0.0,
mx
=> 0.2 },
'?'
=> {
'_'
=> 0.05,
'?'
=> 0.0,
mx
=> 0.2 },
mx
=> {
'_'
=> 0.05,
m
=> 0.2,
i
=> 0.2,
t
=> 0.2,
'?'
=> 0.2,
mx
=> 0.0 });
sub
alignment_compare {
my
(
$axis
,
$foradjacency
,
$reversed
,
$p1
,
$p2
) =
@_
;
my
$line1
= $::TABLINES[
$p1
];
my
$line2
= $::TABLINES[
$p2
];
return
0
if
!(
$line1
&&
$line2
);
return
999999
if
$line1
xor
$line2
;
my
@cells1
=
@$line1
;
my
@cells2
=
@$line2
;
my
$ncells
=
scalar
(
@cells1
);
my
$diff
= 0.0;
while
(
@cells1
&&
@cells2
) {
my
$cell1
=
shift
(
@cells1
);
my
$cell2
=
shift
(
@cells2
);
$diff
+= 0.75
if
((
$$cell1
{align} ||
''
) ne (
$$cell2
{align} ||
''
))
&& (
$$cell1
{content_class} ne
'_'
) && (
$$cell2
{content_class} ne
'_'
);
if
(
my
$d
=
$cell_class_diff
{
$$cell1
{content_class} }{
$$cell2
{content_class} }) {
$diff
+=
$d
; }
elsif
(
$$cell1
{content_class} ne
$$cell2
{content_class}) {
$diff
+= 0.75; }
if
(
$foradjacency
) {
$diff
+= 0.3 *
scalar
(
grep
{
$$cell1
{
$_
} !=
$$cell2
{
$_
} } (
$axis
== 0 ?
qw(r l)
:
qw(t b)
));
my
$pedge
= (
$axis
== 0 ? (
$reversed
?
't'
:
'b'
) : (
$reversed
?
'l'
:
'r'
));
if
(
$$cell1
{
$pedge
} && (
$$cell1
{
$pedge
} !=
$$cell2
{
$pedge
})) {
$diff
+=
abs
(
$$cell1
{
$pedge
} -
$$cell2
{
$pedge
}) * 1.0; }
}
else
{
$diff
+= 0.3 *
scalar
(
grep
{
$$cell1
{
$_
} !=
$$cell2
{
$_
} }
qw(r l t b)
); }
}
$diff
/=
$ncells
;
print
STDERR
"$p1-$p2 => $diff; "
if
$LaTeXML::Core::Alignment::DEBUG
;
return
$diff
; }
sub
summarize_alignment {
my
(
$rows
,
$cols
) =
@_
;
my
$r
= 0;
my
(
$nrows
,
$ncols
) = (
scalar
(
@$rows
),
scalar
(@{
$$rows
[0] }));
print
STDERR
"\n"
;
foreach
my
$cell
(@{
$$rows
[0] }) {
print
STDERR
' '
. (
$$cell
{t} ? (
'-'
x 6) : (
' '
x 6)); }
print
STDERR
"\n"
;
foreach
my
$row
(
@$rows
) {
my
$maxb
= 0;
print
STDERR (
$$row
[0]{l} ? (
'|'
x
$$row
[0]{l}) :
' '
);
foreach
my
$cell
(
@$row
) {
print
STDERR
sprintf
(
" %4s "
,
(
$$cell
{cell_type} ||
'?'
)
. (
$$cell
{align} ?
$ALIGNMENT_CODE
{
$$cell
{align} } :
' '
)
. (
$$cell
{content_class} ||
'?'
)
. (
$$cell
{r} ? (
'|'
x
$$cell
{r}) :
' '
));
$maxb
=
$$cell
{b}
if
$$cell
{b} >
$maxb
; }
print
STDERR
"\n"
;
for
(
my
$b
= 0 ;
$b
<
$maxb
;
$b
++) {
foreach
my
$cell
(
@$row
) {
print
STDERR
' '
. (
$b
<
$$cell
{b} ? (
'-'
x 6) : (
' '
x 6)); }
print
STDERR
"\n"
; }
$r
++; }
print
STDERR
" "
;
print
STDERR
"\n"
;
return
; }
1;