use v5.18;
use strict;
use warnings qw( FATAL utf8 );
use utf8;
use open qw( :std :utf8 );
use Unicode::Normalize qw( NFC );
use Encode qw( decode );
use English qw( -no_match_vars );
if ( grep /\P{ASCII}/ => @ARGV ) {
@ARGV = map { decode( 'UTF-8', $_ ) } @ARGV;
}
use Carp;
=head1 NAME
Pg::Explain::FromText - Parser for text based explains
=head1 VERSION
Version 2.9
=cut
our $VERSION = '2.9';
=head1 SYNOPSIS
It's internal class to wrap some work. It should be used by Pg::Explain, and not directly.
=head1 FUNCTIONS
=head2 new
Object constructor.
This is not really useful in this particular class, but it's to have the same API for all Pg::Explain::From* classes.
=cut
sub new {
my $class = shift;
my $self = bless {}, $class;
return $self;
}
=head2 explain
Get/Set master explain object.
=cut
sub explain { my $self = shift; $self->{ 'explain' } = $_[ 0 ] if 0 < scalar @_; return $self->{ 'explain' }; }
=head2 split_into_lines
Splits source into lines, while fixing (well, trying to fix) cases where input has been force-wrapped to some length.
=cut
sub split_into_lines {
my $self = shift;
my $source = shift;
my @lines = split /\r?\n/, $source;
my @out = ();
for my $l ( @lines ) {
# Ignore certain lines
next if $l =~ m{\A \s* \( \d+ \s+ rows? \) \s* \z}xms;
next if $l =~ m{\A \s* query \s plan \s* \z}xmsi;
next if $l =~ m{\A \s* (?: -+ | ─+ ) \s* \z}xms;
if ( $l =~ m{ \A Trigger \s+ }xms ) {
push @out, $l;
}
elsif ( $l =~ m{ \A (?: Total \s+ runtime | Planning \s+ time | Execution \s+ time | Time | Filter | Output | JIT | Planning | Settings | Query \s+ Identifier ): }xmsi ) {
push @out, $l;
}
elsif ( $l =~ m{\A\S} ) {
if ( 0 < scalar @out ) {
$out[ -1 ] .= $l;
}
else {
push @out, $l;
}
}
else {
push @out, $l;
}
}
return @out;
}
=head2 parse_source
Function which parses actual plan, and constructs Pg::Explain::Node objects
which represent it.
Returns Top node of query plan.
=cut
sub parse_source {
my $self = shift;
my $source = shift;
# Store jit text info, and flag whether we're in JIT parsing phase
my $jit = undef;
my $in_jit = undef;
# Store information about planning buffers
my $planning_buffers = undef;
my $in_planning = undef;
my $top_node = undef;
my %element_at_depth = (); # element is hashref, contains 2 keys: node (Pg::Explain::Node) and subelement-type, which can be: subnode, initplan or subplan.
my @lines = $self->split_into_lines( $source );
my $costs_re = qr{ \( cost=(?<estimated_startup_cost>\d+\.\d+)\.\.(?<estimated_total_cost>\d+\.\d+) \s+ rows=(?<estimated_rows>\d+) \s+ width=(?<estimated_row_width>\d+) \) }xms;
my $analyze_re = qr{ \(
(?:
actual \s time=(?<actual_time_first>\d+\.\d+)\.\.(?<actual_time_last>\d+\.\d+) \s rows=(?<actual_rows>\d+(?:\.\d+)?) \s loops=(?<actual_loops>\d+)
|
actual \s rows=(?<actual_rows>\d+(?:\.\d+)?) \s loops=(?<actual_loops>\d+)
|
(?<never_executed> never \s+ executed )
)
\) }xms;
my $guc_name = qr{ [a-zA-Z_.]+ }xms;
my $guc_value = qr{ ' (?:[^']+|'' )* ' }xms;
my $single_guc = qr{ ( $guc_name ) \s* = \s* ( $guc_value ) }xms;
my $multiple_gucs = qr{ $single_guc (?: , \s* $single_guc )* }xms;
my $query = '';
my $plan_started = 0;
LINE:
for my $line ( @lines ) {
# Remove trailing whitespace - it makes next line matches MUCH faster.
$line =~ s/\s+\z//;
# There could be stray " at the end. No idea why, but some people paste such explains on explain.depesz.com
$line =~ s/\s*"\z//;
# Replace tabs with 4 spaces
$line =~ s/\t/ /g;
if (
( $line =~ m{\(} )
&& (
$line =~ m{
\A
(?<prefix>\s* -> \s* | \s* )
(?<type>\S.*?)
\s+
(?:
$costs_re \s+ $analyze_re
|
$costs_re
|
$analyze_re
)
\s*
\z
}xms
)
)
{
$plan_started = 1;
my $new_node = Pg::Explain::Node->new( %+ );
$new_node->explain( $self->explain );
if ( defined $+{ 'never_executed' } ) {
$new_node->actual_loops( 0 );
$new_node->never_executed( 1 );
}
my $element = { 'node' => $new_node, 'subelement-type' => 'subnode', };
$in_jit = undef;
my $prefix = $+{ 'prefix' };
$prefix =~ s/->.*//;
my $prefix_length = length $prefix;
if ( 0 == scalar keys %element_at_depth ) {
$element_at_depth{ '0' } = $element;
$top_node = $new_node;
next LINE;
}
my @existing_depths = sort { $a <=> $b } keys %element_at_depth;
for my $key ( grep { $_ >= $prefix_length } @existing_depths ) {
delete $element_at_depth{ $key };
}
my $maximal_depth = ( sort { $b <=> $a } keys %element_at_depth )[ 0 ];
if ( !defined $maximal_depth ) {
croak( "Didn't find current_element by depth - this shouldn't happen - please contact author.\n" );
}
my $previous_element = $element_at_depth{ $maximal_depth };
$element_at_depth{ $prefix_length } = $element;
if ( $previous_element->{ 'subelement-type' } eq 'subnode' ) {
$previous_element->{ 'node' }->add_sub_node( $new_node );
}
elsif ( $previous_element->{ 'subelement-type' } eq 'initplan' ) {
$previous_element->{ 'node' }->add_initplan( $new_node, $previous_element->{ 'metainfo' } );
}
elsif ( $previous_element->{ 'subelement-type' } eq 'subplan' ) {
$previous_element->{ 'node' }->add_subplan( $new_node );
}
elsif ( $previous_element->{ 'subelement-type' } =~ /^cte:(.+)$/ ) {
$previous_element->{ 'node' }->add_cte( $1, $new_node );
delete $element_at_depth{ $maximal_depth };
}
else {
croak( "Bad subelement-type in previous_element - this shouldn't happen - please contact author.\n" );
}
}
elsif ( $line =~ m{ \A (\s*) InitPlan \s* ( \d+ )? \s* (?: \( returns \s+ (.*) \) \s* )? \z }xms ) {
my ( $prefix, $name, $returns ) = ( $1, $2, $3 );
$in_jit = undef;
my @remove_elements = grep { $_ >= length $prefix } keys %element_at_depth;
delete @element_at_depth{ @remove_elements } unless 0 == scalar @remove_elements;
my $maximal_depth = ( sort { $b <=> $a } keys %element_at_depth )[ 0 ];
if ( !defined $maximal_depth ) {
croak( "Didn't find current_element by depth - this shouldn't happen - please contact author (subplan).\n" );
}
my $previous_element = $element_at_depth{ $maximal_depth };
my $metainfo = {};
$metainfo->{ 'name' } = $name if defined $name;
$metainfo->{ 'returns' } = $returns if defined $returns;
$metainfo = undef if 0 == scalar keys %{ $metainfo };
$element_at_depth{ 1 + length $prefix } = {
'node' => $previous_element->{ 'node' },
'subelement-type' => 'initplan',
'metainfo' => $metainfo,
};
next LINE;
}
elsif ( $line =~ m{ \A (\s*) SubPlan \s* (?: \d+ \s* )? \s* (?: \( returns .* \) \s* )? \z }xms ) {
my $prefix = $1;
$in_jit = undef;
my @remove_elements = grep { $_ >= length $prefix } keys %element_at_depth;
delete @element_at_depth{ @remove_elements } unless 0 == scalar @remove_elements;
my $maximal_depth = ( sort { $b <=> $a } keys %element_at_depth )[ 0 ];
if ( !defined $maximal_depth ) {
croak( "Didn't find current_element by depth - this shouldn't happen - please contact author (subplan).\n" );
}
my $previous_element = $element_at_depth{ $maximal_depth };
$element_at_depth{ 1 + length $prefix } = {
'node' => $previous_element->{ 'node' },
'subelement-type' => 'subplan',
};
next LINE;
}
elsif ( $line =~ m{ \A (\s*) CTE \s+ (\S+) \s* \z }xms ) {
my ( $prefix, $cte_name ) = ( $1, $2 );
$in_jit = undef;
my @remove_elements = grep { $_ >= length $prefix } keys %element_at_depth;
delete @element_at_depth{ @remove_elements } unless 0 == scalar @remove_elements;
my $maximal_depth = ( sort { $b <=> $a } keys %element_at_depth )[ 0 ];
if ( !defined $maximal_depth ) {
croak( "Didn't find current_element by depth - this shouldn't happen - please contact author (CTE).\n" );
}
my $previous_element = $element_at_depth{ $maximal_depth };
$element_at_depth{ length $prefix } = {
'node' => $previous_element->{ 'node' },
'subelement-type' => 'cte:' . $cte_name,
};
next LINE;
}
elsif ( $line =~ m{ \A \s* (Planning|Execution) \s+ time: \s+ (\d+\.\d+) \s+ ms \s* \z }xmsi ) {
my ( $type, $time ) = ( $1, $2 );
$in_jit = undef;
$self->explain->planning_time( $time ) if 'planning' eq lc( $type );
$self->explain->execution_time( $time ) if 'execution' eq lc( $type );
}
elsif ( $line =~ m{ \A \s* Total \s+ runtime: \s+ (\d+\.\d+) \s+ ms \s* \z }xmsi ) {
my ( $time ) = ( $1 );
$in_jit = undef;
$self->explain->total_runtime( $time );
}
elsif ( $line =~ m{ \A \s* Settings: \s* ( $multiple_gucs ) \s* \z }xmsi ) {
my $gucs = $1;
my $settings = {};
my @elements = $gucs =~ m{ $single_guc }xmsg;
for ( my $i = 0 ; $i < @elements ; $i += 2 ) {
my $val = $elements[ $i + 1 ];
$val =~ s/\A'|'\z//g;
$val =~ s/''/'/g;
$settings->{ $elements[ $i ] } = $val;
}
$self->explain->settings( $settings ) if 0 < scalar keys %{ $settings };
}
elsif ( $line =~ m{ \A \s* Trigger \s+ (.*) : \s+ time=(\d+\.\d+) \s+ calls=(\d+) \s* \z }xmsi ) {
my ( $name, $time, $calls ) = ( $1, $2, $3 );
$in_jit = undef;
$self->explain->add_trigger_time(
{
'name' => $name,
'time' => $time,
'calls' => $calls,
}
);
}
elsif ( $line =~ m{ \A (\s*) JIT: \s* \z }xmsi ) {
$in_jit = 1;
$jit = [ $line ];
}
elsif ( $line =~ m{ \A (\s*) Planning: \s* \z }xmsi ) {
$in_planning = 1;
}
elsif ( $line =~ m{ \A \s* Query \s+ Text: \s+ ( .* ) \z }xms ) {
$query = $1;
$plan_started = 0;
}
elsif ( $plan_started == 0 ) {
$query = "$query\n$line";
}
elsif ( $line =~ m{ \A (\s*) ( \S .* \S ) \s* \z }xms ) {
my ( $infoprefix, $info ) = ( $1, $2 );
if ( $in_jit ) {
push @{ $jit }, $line;
next LINE;
}
my $maximal_depth = ( sort { $b <=> $a } grep { $_ < length $infoprefix } keys %element_at_depth )[ 0 ];
next LINE unless defined $maximal_depth;
my $previous_element = $element_at_depth{ $maximal_depth };
next LINE unless $previous_element;
my $node = $previous_element->{ 'node' };
if ( $info =~ m{ \A Workers \s+ Launched: \s+ ( \d+ ) \z }xmsi ) {
$node->workers_launched( $1 );
$node->add_extra_info( $info );
}
elsif ( $info =~ m{ \A Buffers: \s }xms ) {
eval {
my $buffers = Pg::Explain::Buffers->new( $info );
if ( $in_planning ) {
$planning_buffers = $buffers;
}
else {
$node->buffers( $buffers );
}
};
$node->add_extra_info( $info ) if $EVAL_ERROR;
}
elsif ( $info =~ m{ \A I/O \s Timings: \s }xms ) {
eval {
if ( $in_planning ) {
$planning_buffers->add_timing( $info ) if $planning_buffers;
}
else {
$node->buffers->add_timing( $info ) if $node->buffers;
}
};
if ( $EVAL_ERROR ) {
print "[[ $EVAL_ERROR ]]\n";
$node->add_extra_info( $info ) if $EVAL_ERROR;
}
}
else {
$node->add_extra_info( $info );
}
}
}
$self->explain->jit( Pg::Explain::JIT->new( 'lines' => $jit ) ) if defined $jit;
$self->explain->query( $query ) if $query;
$self->explain->planning_buffers( $planning_buffers ) if $planning_buffers;
return $top_node;
}
=head1 AUTHOR
hubert depesz lubaczewski, C<< <depesz at depesz.com> >>
=head1 BUGS
Please report any bugs or feature requests to C<depesz at depesz.com>.
=head1 SUPPORT
You can find documentation for this module with the perldoc command.
perldoc Pg::Explain
=head1 COPYRIGHT & LICENSE
Copyright 2008-2023 hubert depesz lubaczewski, all rights reserved.
This program is free software; you can redistribute it and/or modify it
under the same terms as Perl itself.
=cut
1; # End of Pg::Explain::FromText