package GCPlugins::GCboardgames::GCReservoirJeux;
###################################################
#
# Copyright 2005-2010 Christian Jodar
#
# This file is part of GCstar.
#
# GCstar is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# GCstar is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with GCstar; if not, write to the Free Software
# Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
#
###################################################
use strict;
use GCPlugins::GCboardgames::GCboardgamesCommon;
{
package GCPlugins::GCboardgames::GCPluginReservoirJeux;
use base qw(GCPlugins::GCboardgames::GCboardgamesPluginsBase);
sub start
{
my ($self, $tagname, $attr, $attrseq, $origtext) = @_;
$self->{inside}->{$tagname}++;
if ($self->{parsingEnded})
{
return;
}
if ($self->{parsingList})
{
# Parse the search results here
if (($tagname eq "h3") && ($attr->{class} =~ /^rusearch_result/))
{
$self->{itemIdx}++;
$self->{isBoardgame} = 1;
$self->{insideName} = 1;
}
if ($self->{isBoardgame})
{
if (($tagname eq "a") && ($attr->{href} ne "#") && ($attr->{class} =~ /^lien_item/))
{
$self->{itemsList}[$self->{itemIdx}]->{url} = $attr->{href};
$self->{isBoardgame} = 0;
}
}
}
else
{
# Parse the items page here. Basically we do this by seaching for tags which match certain criteria, then preparing to grab
# the text inside these tags
if (($tagname eq "h1"))
{
$self->{insideName} = 1;
}
elsif (($tagname eq "div"))
{
if ($attr->{id} eq "fiche_technique_image")
{
$self->{insideImage} = 1;
}
elsif ($attr->{id} eq "bloc_centre_extensions")
{
$self->{insideExpansionList} = 1;
}
elsif ($attr->{id} eq "bloc_centre_extensions_bottom")
{
$self->{insideExpansionList} = 0;
}
elsif ($attr->{class} eq "fiche_technique_sep")
{
$self->{insideCategoryRow} = 0;
$self->{insideMechanicRow} = 0;
}
}
elsif ($tagname eq "img")
{
if ($self->{insideImage})
{
$self->{curInfo}->{boxpic} = "http://www.reservoir-jeux.com".$attr->{src} if ! $self->{curInfo}->{boxpic};
$self->{insideImage} = 0;
}
if ($self->{insideExpansionList})
{
$self->{curInfo}->{expandedby} .= $attr->{alt}.','
}
}
elsif ($tagname eq "a")
{
if ($attr->{class} eq "lien_item")
{
if ($self->{nextIsExpands})
{
$self->{insideExpands} = 1;
$self->{nextIsExpands} = 0;
}
if ($attr->{href} =~ /type=editeur/)
{
$self->{insidePublisher} = 1;
}
elsif ($attr->{href} =~ /type=auteur/)
{
$self->{insideDesigner} = 1;
}
elsif ($attr->{href} =~ /type=illustrateur/)
{
$self->{insideIllustrator} = 1;
}
elsif ($attr->{href} =~ /tag_id=/)
{
if ($self->{insideMechanicRow})
{
$self->{insideMechanic} = 1;
}
elsif ($self->{insideCategoryRow})
{
$self->{insideCategory} = 1;
}
}
elsif ($attr->{href} =~ /type=illustrateur/)
{
$self->{insideIllustrator} = 1;
}
}
}
elsif (($tagname eq "span") && ($attr->{class} eq "prod_description"))
{
$self->{insideDescription} = 1;
}
if ($tagname eq "br")
{
if($self->{insideDesignerRow})
{
$self->{curInfo}->{designedby} =~ s/\s\x2d\s$//g;
$self->{insideDesignerRow} = 0;
}
if($self->{insideIllustratorRow})
{
$self->{curInfo}->{illustratedby} =~ s/\s\x2d\s$//g;
$self->{insideIllustratorRow} = 0;
}
}
if ($self->{insideDescription})
{
if (($tagname eq "br") || ($tagname eq "p"))
{
# neatens up the description a little by starting new line on br tags
$self->{curInfo}->{description} .= "\n";
}
elsif ($tagname eq "li")
{
# basic formatting of lists
$self->{curInfo}->{description} .= " - ";
}
}
}
}
sub end
{
my ($self, $tagname) = @_;
$self->{inside}->{$tagname}--;
if ($self->{insideTechnicalDetails} && $tagname eq "div")
{
$self->{insideTechnicalDetails} = 0;
}
}
sub text
{
my ($self, $origtext) = @_;
return if (length($origtext) < 2);
$origtext =~ s/"/"/g;
$origtext =~ s/³/3/g;
$origtext =~ s/\n//g;
$origtext =~ s/^\s{2,//;
#French accents substitution
$origtext =~ s/à/à/;
$origtext =~ s/À/À/;
$origtext =~ s/é/é/;
return if ($self->{parsingEnded});
if ($self->{parsingList})
{
if ($self->{isBoardgame} && $self->{insideName})
{
$self->{itemsList}[$self->{itemIdx}]->{name} = $origtext;
$self->{insideName} = 0;
}
}
else
{
# Parse the text items page here.
if ($self->{insideName})
{
$self->{curInfo}->{name} = $origtext;
$self->{curInfo}->{name} =~ s/^\s+//;
$self->{curInfo}->{name} =~ s/\s+\Z//;
$self->{insideName} = 0;
}
if ($self->{inside}->{h2})
{
if ($origtext =~ /^Fiche technique/)
{
$self->{insideTechnicalDetails} = 1;
}
elsif ($origtext =~ /^M\xe9canismes/)
{
$self->{insideMechanicRow} = 1;
}
elsif ($origtext =~/^Th\xe8mes/)
{
$self->{insideCategoryRow} = 1;
}
}
if ($self->{insideTechnicalDetails})
{
if ($origtext =~ /^Date de sortie/)
{
$self->{curInfo}->{released} = $origtext;
$self->{curInfo}->{released} =~ s/Date de sortie : //g
}
elsif( $origtext =~ /Dur\xe9e : /)
{
$self->{curInfo}->{playingtime} = $origtext;
$self->{curInfo}->{playingtime} =~ s/\s*Dur\xe9e : //g;
}
elsif($origtext =~ /\xc0 partir de\s[0-9]*\sans/)
{
$self->{curInfo}->{suggestedage} = $origtext;
$self->{curInfo}->{suggestedage} =~ s/^\s*//g;
}
elsif ($origtext =~ /De [0-9]* \xe0 [0-9]* joueurs/)
{
$self->{curInfo}->{players} = $origtext;
$self->{curInfo}->{players} =~ s/^\s*De //g;
$self->{curInfo}->{players} =~ s/ joueurs//g;
}
}
if ($self->{insideDesigner})
{
# Append text (and trailing ,) to existing designer field
$self->{curInfo}->{designedby} .= $origtext." - ";
$self->{insideDesigner} = 0;
}
if ($self->{insideIllustrator})
{
# Append text (and trailing ,) to existing illustrator field
$self->{curInfo}->{illustratedby} .= $origtext." - ";
$self->{insideIllustrator} = 0;
}
if ($self->{insidePublisher})
{
$self->{curInfo}->{publishedby} = $origtext;
$self->{insidePublisher} = 0;
}
if ($self->{insideExpands})
{
$self->{curInfo}->{expansionfor} = $origtext;
$self->{insideExpands} = 0;
}
if ($self->{insideMechanic})
{
$self->{curInfo}->{mechanics} .= $self->capWord($origtext).',';
$self->{insideMechanic} = 0;
}
if ($self->{insideCategory})
{
$self->{curInfo}->{category} .= $self->capWord($origtext).',';
$self->{insideCategory} = 0;
}
if ($origtext =~ /^\s*Auteur(s)? : /)
{
$self->{insideDesignerRow} = 1;
}
if ($origtext =~ /^\s*Illustrateur(s)? : /)
{
$self->{insideIllustratorRow} = 1;
}
if ($origtext =~ /^Ce produit est une extension de :/)
{
$self->{nextIsExpands} = 1;
}
if ($self->{insideDescription})
{
$self->{curInfo}->{description} .= $origtext;
}
}
}
sub comment
{
my ($self, $comment) = @_;
if ($self->{parsingList})
{
}
else
{
if ($comment =~ /\/div/)
{
if($self->{insideDescription})
{
$self->{insideDescription} = 0;
# remove spaces from start and end of description
$self->{curInfo}->{description} =~ s/^\s+//;
$self->{curInfo}->{description} =~ s/\s+$//;
}
}
}
}
sub new
{
my $proto = shift;
my $class = ref($proto) || $proto;
my $self = $class->SUPER::new();
bless ($self, $class);
$self->{hasField} = {
name => 1,
};
$self->{isBoardgame} = 0;
$self->{curName} = undef;
$self->{curUrl} = undef;
return $self;
}
sub preProcess
{
my ($self, $html) = @_;
$self->{parsingEnded} = 0;
$html =~ s/""/'"/g;
$html =~ s/""/"'/g;
$html =~ s|
|
|;
return $html;
}
sub getSearchUrl
{
my ($self, $word) = @_;
# Url returned below is the for the search page, where $word is replaced by the search
return ('http://www.reservoir-jeux.com/recherche.php', ['search' => $word, 'secteurid' => '-1', 'dv' => '30']);
}
sub getItemUrl
{
my ($self, $url) = @_;
return $url if $url =~ /^http:/;
if ($url =~ /^\//)
{
return "http://www.reservoir-jeux.com".$url;
}
else
{
return "http://www.reservoir-jeux.com/".$url;
}
}
sub getName
{
return "Reservoir Jeux";
}
sub getAuthor
{
return 'Florent';
}
sub getLang
{
return 'FR';
}
}
1;