* WebGrab+Plus ini for grabbing EPG data from TvGuide websites
* Site siol.net
* revision 0
* revision 1 added description cleanup
* revision 2 changed index_showsplit to solve problems with overlapping shows > 4 hours
* Willy De Wilde, Oktober 2011, Jan van Straaten 19/02/2012
*
* Site-wide settings: site name, timezone of the listed times, number of days to grab,
* culture, page charset, title match factor, rating system and episode numbering system.
site {url=siol.net|timezone=UTC+01:00|maxdays=4|cultureinfo=sl-SI|charset=UTF-8|titlematchfactor=90|ratingsystem=IMDB|episodesystem=xmltv_ns}
* Index (schedule) page URL: fixed prefix + the channel value + "/datum/" + the formatted date.
url_index{url|http://tv-spored.siol.net/kanal/|channel|/datum/|urldate|}
* Extra request header for the index page: advertise gzip/deflate content encoding.
url_index.headers {customheader=Accept-Encoding=gzip,deflate}
* Format of the date inserted at the urldate position of url_index.
urldate.format {datestring|yyyyMMdd}
*
* Index page scrubs: split the index page into shows, then extract title, category and start.
* NOTE(review): the start/end delimiter strings of the scrubs below appear blank in this copy;
* possibly markup was stripped from them - verify against a known-good copy of this ini.
index_showsplit.scrub {multi||}
*
* Show title (single value).
index_title.scrub {single|
|| |
}
* Category, first definition (single value).
index_category.scrub {single|
|| |
} *index page category
* index_temp_4 is prepended to index_subtitle by the subtitle modifiers further down.
index_temp_4.scrub {single|
|| |
} *index page category
* Category, second definition: comma-separated list of which only the first item is kept.
* NOTE(review): index_category.scrub is defined twice (single above, multi here) - confirm both are intended.
index_category.scrub {multi(separator="," include=first)|
||
|}
* Strip everything up to and including the last "/" from the category (greedy regex).
index_category.modify {remove(type=regex)|".*\/"}
* Start time of the show.
index_start.scrub {single|
||
|
}
*index_description.scrub {single|}
*index_description.modify {addend|\n}
*index_rating.scrub {single| |IMDB:|!??!|}
* Index page scrubs for the show icon and the season / episode fragments.
* NOTE(review): the delimiter strings below appear blank in this copy; possibly markup was
* stripped from them - verify against a known-good copy of this ini.
index_showicon.scrub {single||
|||
}
* From a comma-separated list keep the item(s) containing "sezona"
* ("sezona" is presumably Slovene for "season").
index_subtitle.scrub {single(separator="," include="sezona")|
||
|}
* Same "sezona" selection, kept in index_temp_8 for the xmltv_ns episode calculation.
index_temp_8.scrub {single(separator="," include="sezona")|
||
|}
* From a comma-separated list keep the item(s) containing "del"
* ("del" is presumably Slovene for "part" / episode).
index_episode.scrub {single(separator="," include="del")|
||
|}
* Same "del" selection, kept in index_temp_5 for use in the subtitle.
index_temp_5.scrub {single(separator="," include="del")|
||
|}
************************* detailed page scrub
* URL of the detail page of a show, built on the base http://tv-spored.siol.net.
* The regex on the second line captures a HH:MM time that is followed by "-" and a second HH:MM time.
* NOTE(review): the remaining delimiter strings appear blank in this copy; possibly markup was
* stripped from them - verify against a known-good copy of this ini.
index_urlshow {url|http://tv-spored.siol.net|
|| |[^>]*(\d{2}:\d{2})[^>]*-[^>]*\d{2}:\d{2}[^>]*
||}
* Description: multi-value scrub restricted with include=2.
description.scrub {multi(include=2)|||
|
}
* Director(s): text following "Režija: ", split on ",".
* NOTE(review): include=first2"Ostalo" combines a count and a string - confirm this is the intended selector syntax.
director.scrub {single(separator="," include=first2"Ostalo")|Režija: |||}
* Actors: text following "Igrajo: ", split on ",", limited with include=first5.
actor.scrub {single(separator="," include=first5)|Igrajo: |||}
* Country: last item of a comma-separated list.
country.scrub {single(separator="," include=last)||| | }
* Rating: text between "IMDB:" and the marker "!??!".
rating.scrub {single| |IMDB:|!??!|}
*
*********************** Modifiers
* Description post-processing; the three steps run in this order.
* Step 1: addend with separator "\n\n" and an empty argument
* (presumably joins the multiple scrubbed description parts with blank lines - confirm).
description.modify {addend(separator="\n\n")|}
* Step 2: when the description is empty, use the placeholder "Ni opisa"
* (presumably Slovene for "no description").
description.modify {addstart(null)|Ni opisa}
* Step 3: always append a trailing "." (the placeholder therefore becomes "Ni opisa.").
description.modify {addend|.}
*** xmltv_ns - DVBLINK NEW - regular
*index_temp_8.modify {remove(not "")| sezona }
*index_temp_8.modify {addstart(null)|1}
*index_temp_8.modify {calculate(format=F0)|1 -}
*index_episode.modify {remove(not "")| del}
*index_episode.modify {addstart(null)|1}
*index_episode.modify {calculate(format=F0)|1 -}
*index_episode.modify {addstart|'index_temp_8' . }
*index_episode.modify {addend| . 0/1}
*index_episode.modify {remove(not "")|0 . 0 . 0/1}
*** xmltv_ns - DVBLINK OLD
* Build the episode string "<season> . <episode> . 0/1" from index_temp_8 and index_episode.
* Season part: strip the text " sezona " from a non-empty value, default an empty value to 1,
* then run calculate with format F0 (no decimals).
index_temp_8.modify {remove(not "")| sezona }
index_temp_8.modify {addstart(null)|1}
index_temp_8.modify {calculate(format=F0)|1}
* Episode part: same treatment, stripping the text " del".
index_episode.modify {remove(not "")| del}
index_episode.modify {addstart(null)|1}
index_episode.modify {calculate(format=F0)|1}
* Prefix the season value and append the fixed part-number field " . 0/1".
index_episode.modify {addstart|'index_temp_8' . }
index_episode.modify {addend| . 0/1}
* Remove the all-default result "1 . 1 . 0/1" (what is produced when neither season nor episode was found).
* NOTE(review): a genuine season 1 / episode 1 yields the same string and is removed too - confirm acceptable.
index_episode.modify {remove(not "")|1 . 1 . 0/1}
*** country - there is a bug in the page, so this is not accurate: if the country field does not end correctly, it is assumed to be Slovenija
* Country post-processing; the steps run in this order.
* Abbreviate "Združene države Amerike" to "ZDA". The replace is unconditional: with a (null)
* condition it would only run on an empty value, where there is nothing to replace.
country.modify {replace|Združene države Amerike|ZDA}
* Discard the value when it contains the marker "!??!" (scrub ran past the end of the field).
country.modify {clear('country' ~ "!??!")}
* Default an empty country to Slovenija.
country.modify {addstart(null)|Slovenija}
country.modify {cleanup}
*
* Rating: append "/10" to a non-empty scrubbed rating.
rating.modify {addend(not "")|/10}
* Star rating: copy the rating, strip "/10", run calculate with format F0 (no decimals),
* then put "/10" back.
starrating.modify {addstart|'rating'}
starrating.modify {remove|/10}
starrating.modify {calculate(format=F0)|0}
starrating.modify {addend|/10}
* Drop the placeholder "0/10" produced when there is no rating. The match is anchored to the
* whole value so that "10/10" is not truncated to "1" by a substring match on "0/10".
starrating.modify {remove(type=regex)|"^0\/10$"}
** subtitle (personal preference)
* Assemble the subtitle as "<index_temp_4> <season text>, <episode text>, <country>".
index_temp_5.modify {cleanup}
* When a season text was scrubbed, append ", " plus the episode text from index_temp_5 ...
index_subtitle.modify {addend(not "")|, 'index_temp_5'}
* ... and put a "," in front of it, to separate it from the index_temp_4 prefix added next.
index_subtitle.modify {addstart(not "")|,}
index_subtitle.modify {addstart|'index_temp_4' }
index_subtitle.modify {cleanup}
* Tidy the " ," left between the prefix and the comma.
index_subtitle.modify {replace| ,|,}
* Always append ", " plus the country value.
* NOTE(review): this step is unconditional, so the subtitle is never left empty - confirm intended.
index_subtitle.modify {addend|, 'country'}
*
** _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
** ##### CHANNEL FILE CREATION (only to create the xxx-channel.xml file)
**
** @auto_xml_channel_start
* enable the following lines to create a full channel list file
*url_index{url|http://tv-spored.siol.net/kanali}
*index_site_channel.scrub {multi|| |}
*index_site_id.scrub {multi||">}
*scope.range {(channellist)|end}
*index_site_id.modify {cleanup(removeduplicates=equal,100 link="index_site_channel")}
*end_scope
** @auto_xml_channel_end*
*