lib/WWW/Scraper/ISBN/TWKingstone_Driver.pm


            
              1
2
3
4
5
6
7
8
9
10
11
—
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
—
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
—
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
              # ex:ts=8
package WWW::Scraper::ISBN::TWKingstone_Driver;
use strict;
use warnings;
# Package globals: the module version and the inheritance list (which is
# assigned further down in this file).  Declared with "our" instead of the
# obsolete "use vars" pragma; both forms satisfy "use strict".
our ($VERSION, @ISA);
$VERSION = '0.02';
#--------------------------------------------------------------------------
=head1 NAME
WWW::Scraper::ISBN::TWKingstone_Driver - Search driver for TWKingstone's online catalog.
=head1 SYNOPSIS
See parent class documentation (L<WWW::Scraper::ISBN::Driver>)
=head1 DESCRIPTION
Searches for book information from TWKingstone's online catalog.
=cut
#--------------------------------------------------------------------------
###########################################################################
#Library Modules                                                          #
###########################################################################
use WWW::Scraper::ISBN::Driver;
use WWW::Mechanize;
use Template::Extract;
use Text::Iconv;
###########################################################################
#Constants                                                                #
###########################################################################
use constant    QUERY   => 'http://search.kingstone.com.tw/Result.asp?SE_Type=ISBN&k=%s';
#--------------------------------------------------------------------------
###########################################################################
#Inheritance                                                              #
###########################################################################
@ISA = qw(WWW::Scraper::ISBN::Driver);
###########################################################################
#Interface Functions                                                      #
###########################################################################
=head1 METHODS
=over 4
=item C<search()>
Creates a query string, then passes the appropriate form fields to the Kingstone 
server.
The returned page should be the correct catalog page for that ISBN. If not, the
function returns zero and allows the next driver in the chain to have a go. If
a valid page is returned, the following fields are returned via the book hash:
  isbn
  title
  author
  book_link
  image_link
  pubdate
  publisher
  price_list
  price_sell
The book_link and image_link refer back to the Kingstone website. 
=back
=cut
# search($isbn)
#
# Looks up one ISBN on the Kingstone site: fetches the search result page,
# follows the first book link found on it, and scrapes the book page.
#
# Parameters:
#   $isbn - the ISBN to look up; it is substituted verbatim into QUERY.
#
# Returns:
#   On success, the book hash reference (also stored through $self->book)
#   holding isbn, title, author, book_link, image_link, pubdate, publisher,
#   price_list and price_sell; $self->found is set to 1.
#   On any failure, the return value of $self->handler($message); found and
#   book are left in the reset state established at the top of the sub.
sub search {
        my ($self, $isbn) = @_;

        # Reset the state left over from any previous search.
        $self->found(0);
        $self->book(undef);

        # Without an ISBN there is nothing to query (and sprintf would warn).
        return $self->handler("No ISBN supplied to TWKingstone search.")
                unless(defined $isbn && length $isbn);

        # With autocheck enabled (the WWW::Mechanize default) get() dies on an
        # HTTP error, so the success() checks below would never be reached.
        # Turn it off so a failed request is reported through handler().
        my $mechanize = WWW::Mechanize->new(autocheck => 0);
        $mechanize->get(sprintf(QUERY, $isbn));
        return $self->handler("Could not fetch TWKingstone search page.")
                unless($mechanize->success());

        # The Search Results page: pick up the link to the book page.
        # Single-quoted heredoc: the template is passed to Template::Extract
        # verbatim, with no Perl interpolation.
        my $result_template = <<'END';
<form name="form1" [% ... %]
<span class="font09">[% ... %]
<a href="[% book_link %]&
END
        my $extract = Template::Extract->new;
        my $data = $extract->extract($result_template, $mechanize->content());
        return $self->handler("Could not extract data from TWKingstone result page.")
                unless(defined $data);

        # The book page itself.
        my $book_link = $data->{book_link};
        $mechanize->get($book_link);
        return $self->handler("Could not fetch TWKingstone book page.")
                unless($mechanize->success());

        # Keep only the part of the page between the main table and form2.
        # The capture is taken from the match's return list, so a failed match
        # yields undef instead of a stale $1.
        my ($fragment) = $mechanize->content()
                =~ /(table width="980" border="0" align="center" .*form name="form2")/s;
        return $self->handler("Could not locate book details in TWKingstone book page.")
                unless(defined $fragment);

        # Convert the fragment from UTF-8 to Big5 before matching it against
        # the template below.  convert() yields undef when conversion fails.
        my $content = Text::Iconv->new("utf-8", "big5")->convert($fragment);
        return $self->handler("Could not convert TWKingstone book page to Big5.")
                unless(defined $content);

        # NOTE(review): the non-ASCII label text below looks like Big5 bytes
        # and must be kept byte-for-byte -- confirm the file's encoding.  The
        # heredoc is single-quoted so the "@" characters inside it can never
        # be taken for array interpolation.
        my $book_template = <<'END';
<img src="[% image_link %]" [% ... %]
<span class="font01">[% title %]</span>[% ... %]
§@¡@¡@ªÌ¡G[% ... %]>[% author %]</a>[% ... %]
¥Xª©ªÀ¡G[% ... %]>[% publisher %]</a>[% ... %]
ISBN¡G[% isbn %]<br>[% ... %]
¥Xª©¤é¡G[% pubdate %]</td>[% ... %]
©w¡@¡@»ù¡G[% price_list %] ¤¸<br>[% ... %]
¯S¡@¡@»ù¡G<[% ... %] <span class="font01">[% price_sell %]</span>¤¸
END
        $data = $extract->extract($book_template, $content);
        return $self->handler("Could not extract data from TWKingstone result page.")
                unless(defined $data);

        # Strip every space, newline, carriage return and tab from the date.
        $data->{pubdate} =~ tr/ \n\r\t//d;

        my $bk = {
                'isbn'          => $data->{isbn},
                'title'         => $data->{title},
                'author'        => $data->{author},
                'book_link'     => $book_link,
                # The extracted image path is prefixed with the site root.
                'image_link'    => "http://www.kingstone.com.tw".$data->{image_link},
                'pubdate'       => $data->{pubdate},
                'publisher'     => $data->{publisher},
                'price_list'    => $data->{price_list},
                'price_sell'    => $data->{price_sell},
        };
        $self->book($bk);
        $self->found(1);
        return $self->book;
}
1;
__END__
=head1 REQUIRES
Requires the following modules to be installed:
L<WWW::Scraper::ISBN::Driver>,
L<WWW::Mechanize>,
L<Template::Extract>,
L<Text::Iconv>
=head1 SEE ALSO
L<WWW::Scraper::ISBN>,
L<WWW::Scraper::ISBN::Record>,
L<WWW::Scraper::ISBN::Driver>
=head1 AUTHOR
Ying-Chieh Liao E<lt>ijliao@csie.nctu.edu.twE<gt>
=head1 COPYRIGHT
Copyright (C) 2005 Ying-Chieh Liao E<lt>ijliao@csie.nctu.edu.twE<gt>
This program is free software; you can redistribute it and/or modify it
under the same terms as Perl itself.
See L<http://www.perl.com/perl/misc/Artistic.html>
=cut
	Global
`s`	Focus search bar
`?`	Bring up this help dialog
	GitHub
`g` `p`	Go to pull requests
`g` `i`	go to github issues (only if github is preferred repository)
	POD
`g` `a`	Go to author
`g` `c`	Go to changes
`g` `i`	Go to issues
`g` `d`	Go to dist
`g` `r`	Go to repository/SCM
`g` `s`	Go to source
`g` `b`	Go to file browse
	Search terms
module: (e.g. module:Plugin)
distribution: (e.g. distribution:Dancer auth)
author: (e.g. author:SONGMU Redis)
version: (e.g. version:1.00)