#
# More information here: http://wiki.gcstar.org/en/websites_plugins
#
# GCcollection should be replaced with the kind of collection your
# plugin deals with. e.g. GCfilms, GCgames, GCbooks,...

# Replace SiteTemplate with your plugin name.
# The package name must exactly match the file name (.pm)
package GCPlugins::GCcollection::GCStopklatka;

###################################################
#
#  Copyright 2005-2010 Christian Jodar
#
#  This file is part of GCstar.
#
#  GCstar is free software; you can redistribute it and/or modify
#  it under the terms of the GNU General Public License as published by
#  the Free Software Foundation; either version 2 of the License, or
#  (at your option) any later version.
#
#  GCstar is distributed in the hope that it will be useful,
#  but WITHOUT ANY WARRANTY; without even the implied warranty of
#  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
#  GNU General Public License for more details.
#
#  You should have received a copy of the GNU General Public License
#  along with GCstar; if not, write to the Free Software
#  Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
#
###################################################

use strict;
use utf8;

use GCPlugins::GCfilms::GCfilmsCommon;

{
    # Replace SiteTemplate with your exporter name
    # It must be the same name as the one used for file and main package name
    package GCPlugins::GCfilms::GCPluginStopklatka;

    use base qw(GCPlugins::GCfilms::GCfilmsPluginsBase);

    # getSearchUrl
    # Used to get the URL to be used to perform searches.
    # $word is the query
    # Returns the full URL.
    sub getSearchUrl
    {
        my $self = shift;
        my $word = shift;

        # The query is dropped verbatim into the "szukaj" parameter of the
        # film search page; no escaping is performed here.
        return sprintf(
            'http://www.stopklatka.pl/szukaj/szukaj.asp?kategoria=film&szukaj=%s',
            $word
        );
    }

    # getItemUrl
    # Used to get the full URL of an item page.
    # Useful when url on results pages are relative.
    # $url is the URL as found with a search.
    # Returns the absolute URL.
    sub getItemUrl
    {
        my ($self, $url) = @_;

        # An URL that is already absolute must be returned untouched:
        # prefixing the site root would produce
        # "http://www.stopklatka.pl/http://...".
        return $url if $url =~ m{\Ahttps?://}i;

        # Root-relative links start with "/"; strip it so the result does
        # not contain a doubled slash right after the host name.
        (my $path = $url) =~ s{\A/+}{};

        return "http://www.stopklatka.pl/" . $path;
    }

    # getCharset
    # Used to convert charset in web pages.
    # Returns the charset as specified in pages.
    sub getCharset
    {
        my ($self) = @_;

        # Character set reported for the site's pages.
        my $charset = 'ISO-8859-2';
        return $charset;
    }

    # getName
    # Used to display plugin name in GUI.
    # Returns the plugin name.
    sub getName
    {
        # Fixed plugin label; takes no arguments into account.
        my $label = 'Stopklatka';
        return $label;
    }

    # getAuthor
    # Used to display the plugin author in GUI.
    # Returns the plugin author name.
    sub getAuthor
    {
        # Fixed author credit; takes no arguments into account.
        my $author = "Marek Cendrowicz";
        return $author;
    }

    # getLang
    # Used to fill in plugin list with user language plugins
    # Return the language used for this site (2 letters code).
    sub getLang
    {
        # Two-letter code of the site's language.
        my $code = "PL";
        return $code;
    }
    # getExtra
    # Used if the plugin wants an extra column to be displayed in search results
    # Return the column title or empty string to hide the column.
    sub getExtra
    {
        # Empty title: no extra column is requested.
        return q{};
    }

    # changeUrl
    # Can be used to change URL if item URL and the one used to
    # extract information are different.
    # Return the modified URL.
    sub changeUrl
    {
        my $self  = shift;
        my ($url) = @_;

        # Item URL and extraction URL are the same here: pass it through.
        return $url;
    }

    # In processing functions below, self->{parsingList} can be used.
    # If true, we are processing a search results page
    # If false, we are processing an item information page.

    # $self->{inside}->{tagname} (with correct value for tagname) can be used to test
    # if we are in the corresponding tag.

    # You have a counter $self->{itemIdx} that has to be used when processing search results.
    # It is your responsibility to increment it!

    # When processing search results, you have to fill the available fields for results
    #
    #  $self->{itemsList}[$self->{itemIdx}]->{field_name}
    #
    # When processing a movie page, you need to fill the fields (if available)
    # in $self->{curInfo}.
    #
    #  $self->{curInfo}->{field_name}

    # start
    # Called each time a new HTML tag begins.
    # $tagname is the tag name.
    # $attr is reference to an associative array of tag attributes.
    # $attrseq is an array reference containing all the attribute names.
    # $origtext is the tag text as found in source file
    # Returns nothing
    sub start
    {
        my ($self, $tagname, $attr, $attrseq, $origtext) = @_;

        # Count how many elements of this name are currently open.
        $self->{inside}->{$tagname}++;

        if ($self->{parsingList})
        {
            # Search results page: only tags found while a <list_details>
            # element is open are of interest.
            return unless $self->{inside}->{list_details};

            if ($tagname eq 'a')
            {
                # Every link opens a new result entry and supplies its URL.
                my $idx = ++$self->{itemIdx};
                $self->{itemsList}[$idx]->{url} = $attr->{href};
            }

            # The class attribute announces what the next text chunk holds;
            # text() consumes these flags.
            my $listClass = $attr->{class};
            $self->{listTitle} = 1 if $listClass eq 'searchTitle textB';
            $self->{listYear}  = 1 if $listClass eq 'searchTitle';

            return;
        }

        # Item page. The checks below are mutually exclusive and their
        # order matters: the first one that applies wins.
        my $class = $attr->{class};

        if ($class eq 'wydarzenie_tytul')
        {
            $self->{pre_itemTitle} = 1;
            return;
        }

        if ($self->{pre_itemTitle})
        {
            # While in the title area nothing else is examined; the area
            # is left when the next <table> opens.
            if ($tagname eq 'h1')
            {
                $self->{itemTitle} = 1;
            }
            elsif ($tagname eq 'h2')
            {
                $self->{itemOriginalTitle} = 1;
            }
            elsif ($tagname eq 'table')
            {
                $self->{pre_itemTitle} = 0;
            }
            return;
        }

        if ($class eq 'film_pozycja')
        {
            $self->{pre_itemDetails} = 1;
            return;
        }

        if ($class eq 'main_sub_table film')
        {
            $self->{itemMain} = 1;
            return;
        }

        # An image met while the main block flag is still raised is stored
        # as the item picture.
        if ($tagname eq 'img' && $self->{itemMain})
        {
            $self->{curInfo}->{image} = $attr->{src};
        }

        return;
    }

    # end
    # Called each time a HTML tag ends.
    # $tagname is the tag name.
    sub end
    {
        my $self    = shift;
        my $tagname = shift;

        # One element of this name has just been closed.
        $self->{inside}{$tagname}--;
    }

    # text
    # Called each time some plain text (between tags) is processed.
    # $origtext is the read text.
    sub text
    {
        my ($self, $origtext) = @_;

        if ($self->{parsingList})
        {
            # Search results page: a flag raised by start() tells which
            # field of the current entry this chunk belongs to.
            if ($self->{listTitle})
            {
                $self->{listTitle} = 0;
                $self->{itemsList}[ $self->{itemIdx} ]->{title} = $origtext;
            }
            elsif ($self->{listYear})
            {
                $self->{listYear} = 0;

                # Keep what is between the parentheses, drop the parentheses.
                (my $year = $origtext) =~ s/\((.*?)\)/$1/gms;
                $self->{itemsList}[ $self->{itemIdx} ]->{date} = $year;
            }
            return;
        }

        # Item page. Pending flags are honoured in a fixed priority order;
        # each chunk of text is consumed by at most one of them.
        if ($self->{itemTitle})
        {
            $self->{itemTitle} = 0;
            $self->{curInfo}->{title} = $origtext;
            return;
        }

        if ($self->{itemOriginalTitle})
        {
            $self->{itemOriginalTitle} = 0;

            # Remove the surrounding parentheses and the blanks before them.
            (my $original = $origtext) =~ s/\s*\((.*?)\)/$1/gms;
            $self->{curInfo}->{original} = $original;
            return;
        }

        if ($self->{itemDirector})
        {
            $self->{itemDirector}        = 0;
            $self->{pre_itemDetails}     = 0;
            $self->{curInfo}->{director} = $origtext;
            return;
        }

        if ($self->{itemDetails})
        {
            $self->{itemDetails}     = 0;
            $self->{pre_itemDetails} = 0;

            # The chunk is split on ", " into genre, country, date and
            # duration; the duration loses its " min" unit.
            my ($genre, $country, $date, $time) = split(/, /, $origtext);
            $time =~ s/ min//;

            $self->{curInfo}->{genre}   = $genre;
            $self->{curInfo}->{country} = $country;
            $self->{curInfo}->{date}    = $date;
            $self->{curInfo}->{time}    = $time;
            return;
        }

        if ($self->{itemActors})
        {
            $self->{itemActors}        = 0;
            $self->{pre_itemDetails}   = 0;
            $self->{curInfo}->{actors} = $origtext;
            return;
        }

        if ($self->{itemMain})
        {
            # First text met after the main block started is the synopsis.
            $self->{itemMain} = 0;
            $self->{curInfo}->{synopsis} = $origtext;
            return;
        }

        if ($self->{inside}->{item_rank})
        {
            # Rating rounded to the nearest integer.
            $self->{curInfo}->{ratingpress} = int($origtext + 0.5);
            $self->{pre_itemDetails} = 0;
            return;
        }

        return unless $self->{pre_itemDetails};

        # Inside a details row: a known label announces what the next
        # chunk of text will contain.
        my %flagFor = (
            'reżyseria:' => 'itemDirector',
            'szczegóły:' => 'itemDetails',
            'obsada:'    => 'itemActors',
        );
        my $flag = $flagFor{$origtext};
        $self->{$flag} = 1 if defined $flag;

        return;
    }

    # new
    # Constructor.
    # Returns object reference.
    sub new
    {
        my ($proto) = @_;
        my $class = ref($proto) || $proto;
        my $self  = $class->SUPER::new();

        # Fields offered in search results: each key is a result field,
        # with value 1 if this plugin returns it and 0 otherwise. For the
        # list of keys, check the model file (.gcm) and search for tags
        # <field> in /collection/options/fields/results
        my %inResults = (
            title    => 1,
            date     => 1,
            director => 0,
            actors   => 0,
        );
        $self->{hasField} = \%inResults;

        # Start with the counter at zero and a blank title/url in slot 0.
        $self->{itemIdx} = 0;
        @{ $self->{itemsList}[0] }{qw(title url)} = ('', '');

        return bless($self, $class);
    }

    # preProcess
    # Called before each page is processed. You can use it to do some substitutions.
    # $html is the page content.
    # Returns modified version of page content.
    sub preProcess
    {
        my ($self, $html) = @_;

        if ($self->{parsingList})
        {
            # Search results: turn the record marker comments into a
            # <list_details> element so that start() can tell when it is
            # inside a result record.
            $html =~
              s|<!-- record_start -->(.*?)<!-- record_end -->|<list_details>$1</list_details>|gms;
        }
        else
        {
            # Item page: unwrap inline markup so that each value reaches
            # text() as a single chunk.
            $html =~ s|<nobr>(.*?)</nobr>|$1|gms;
            $html =~ s|<span class="bold">(.*?)</span>|$1|gms;
            $html =~ s|<a href="/filmowcy/osoba.*?">(.*?)</a>|$1|gms;

            # The rating is written by a script call; replace the whole
            # <script> element by an <item_rank> element holding the call
            # argument. The pattern must include the opening "<" of the
            # script tag, otherwise a stray "<" is left in front of
            # <item_rank>.
            $html =~
              s|<script type="text/javascript">document.write\(getOcena\((.*?)\)\);</script>|<item_rank>$1</item_rank>|gms;
        }
        return $html;
    }

}

1;