Files
epg/siteini.pack/Germany/tvguide.dk.ini
freearhey a597b11307 Init
2021-03-09 22:46:37 +03:00

122 lines
5.9 KiB
INI
Executable File

**------------------------------------------------------------------------------------------------
* @header_start
* WebGrab+Plus ini for grabbing EPG data from TvGuide websites
* @Site: tvguide.dk
* @MinSWversion: 1.1.1/56.26
* none
* @Revision 6 - [27/06/2016] Blackbear199
* adapted for version 56.26 season/episode implementation
* @Revision 5 - [19/06/2016] Blackbear199
* fix only 4 days epg
* @Revision 4 - [13/06/2016] Blackbear199
* rewrite
* @Revision 3 - [25/11/2011] Jan van Straaten
* removed links from description
* @Revision 2 - []
* new showdetail scrubbing, needs 1.0.7
* @Revision 1 - []
* adapted for V1.0.5
* @Remarks:
* WebGrab 56.26 needed for new season/index_episode implementation
* @header_end
**------------------------------------------------------------------------------------------------
* Site-wide settings: source site, timezone of the listed times, number of days to grab,
* culture and charset used to read the pages, title match factor, rating system and episode system.
site {url=tvguide.dk|timezone=UTC+01:00|maxdays=8.1|cultureinfo=da-DK|charset=ISO-8859-1|titlematchfactor=90|ratingsystem=DK|episodesystem=onscreen}
*
* Index page address: fixed base URL followed by the channel placeholder
* (presumably filled with the channel's site_id at run time - confirm against the WebGrab+Plus manual).
url_index{url|http://www.tvguide.dk/kanaler/|channel|}
* Extra request header sent when fetching the index page.
url_index.headers {customheader=Accept-Encoding=gzip,deflate}
urldate.format {datestring|dd-MM-yyyy} *not used
*
* Cut the index page into one element per show; the include argument restricts the result
* to elements that contain an <a title= link.
index_showsplit.scrub {multi(include="<a title=")|<h1 class="program-heading"|<tr>|</tr>|</td><td bgcolor="#cacaca">}
*
* Index scope: start time, title and onscreen season/episode for each show element of the index page.
scope.range{(indexshowdetails)|end}
* Start time: text after class="time" up to the closing cell, with any remaining tags stripped.
index_start.scrub {single|class="time"|>|</td>|</td>}
index_start.modify {remove(type=regex)|<.+?>}
*
* Title: the link text after <a title=", minus a <br> and the text that follows it.
index_title.scrub {single|<a title="|">|</a>|</td>}
index_title.modify {remove(type=regex)|<br>[^<]*}
*
* Order matters: the episode info is read from index_title first, then the same trailing text is stripped from the title.
index_episode.modify {substring(type=regex pattern="'S1' ('E1')""'S1' ('E1':'Et1')""('E1':'Et1')""('E1')")|'index_title' "((?:\s\d{1,3}\s)?\((?:\d+:)?\d+\))$"} *season/index_episode from title Sx (Ex),Sx (Ex:Etx),(Ex:Etx),(Ex)
index_title.modify {remove(type=regex)|\s*\d*\s\(.+?\)$} * remove season/episode info from title
end_scope
*
* Detail page address: site base URL followed by the href value scrubbed from the show's index element.
index_urlshow {url|http://www.tvguide.dk|href="||"|"}
* Extra request header sent when fetching the detail page.
index_urlshow.headers {customheader=Accept-Encoding=gzip,deflate}
*
* Detail scope: title and description from the show detail page, plus the fields carved out of the description.
* Most fields below follow the same three steps:
*   1. copy the labelled fragment out of description,
*   2. remove that fragment from description,
*   3. reduce the field to the value inside the fragment.
scope.range{(showdetails)|end}
title.scrub {single|<h1 class='program-heading'>||</h1>|</h1>}
*
title.modify {remove(type=regex)|\s*\d*\s\(.+?\)$} * remove season/episode info from title
*
* Raw description block, then strip headings, div openers, scripts, images, HTML comments and <br>&nbsp filler.
description.scrub {single|<td colspan="3" valign="top" class="news">||</div></td>|</div></td>}
description.modify {remove(type=regex)|<h2.+?<\/h2>}
description.modify {remove(type=regex)|<div.+?\'>}
description.modify {remove(type=regex)|<script.+?<\/script>}
description.modify {remove(type=regex)|<img.+?\"*>}
description.modify {remove(type=regex)|<!--.+?-->}
description.modify {remove(type=regex)|<br>&nbsp}
*
* Category from the Genre line.
category.modify {substring(type=regex)|'description' "<b>Genre\s:</b>\s.+?<br>"}
description.modify {remove('category' not "")|'category'}
category.modify {substring(type=regex)|"</b>\s(?:\/?([^\/]*))*<br>"}
*
* Writer from the Manuskript line (the last directive needs its closing brace to be a complete statement).
writer.modify {substring(type=regex)|'description' "Manuskript:\s.+?\s*<br>"}
description.modify {remove('writer' not "")|'writer'}
writer.modify {substring(type=regex)|"Manuskript:\s(.+?)\.\s*<br>"}
*
description.modify {remove(type=regex)|<b>Season\s:</b>\s.+?<br>} * remove season from description
description.modify {remove(type=regex)|<b>Episode\s:</b>\s.+?<br>} * remove index_episode from description
*
* Production year from the Year line, reduced to the four digits.
productiondate.modify {substring(type=regex)|'description' "<b>Year\s:</b>\s\d+<br>"}
description.modify {remove('productiondate' not "")|'productiondate'}
productiondate.modify {substring(type=regex)|"\d{4}"}
*
* temp_1 and temp_2 are only used to cut their lines out of the description; their values are not stored anywhere.
temp_1.modify {substring(type=regex)|'description' "Tilrettelæggelse:\s.+?<br>"} *organization?
description.modify {remove('temp_1' not "")|'temp_1'}
*
temp_2.modify {substring(type=regex)|'description' "Instruktion:\s.+?<br>"} *Instruction?
description.modify {remove('temp_2' not "")|'temp_2'}
*
* Teaser line: removed from the description and its text is added at the start of subtitle.
temp_3.modify {substring(type=regex)|'description' "<b>Teaser\s:<\/b>\s.+?<br>"} *Teaser?
description.modify {remove('temp_3' not "")|'temp_3'}
*temp_3.modify {clear(not~ ", ")}
temp_3.modify {substring('temp_3' not "" type=regex)|"<\/b>\s(.+?)<br>"}
*temp_3.modify {replace('temp_3' not "")|,|\|} *make multi
*country.modify {substring('temp_3' not "" type=element)|'temp_3' 0 1}
subtitle.modify {addstart('temp_3' not "")|'temp_3'}
*
description.modify {remove(type=regex)|Sendt\sførste\sgang\s\d{2}\.\d{2}\.\d{2}<br>}
*
* Presenter from the Vært line. At the value step presenter holds the fragment that starts with the label
* and ends with <br>, so the value pattern anchors on the label and captures up to that trailing <br>.
presenter.modify {substring(type=regex)|'description' "Vært:\s.+?<br>"} *actor
description.modify {remove('presenter' not "")|'presenter'}
presenter.modify {substring('presenter' not "" type=regex)|"Vært:\s(.+?)<br>"}
*
* Actors, first attempt: the <strong> block, reduced to the Medvirkende list, split into multiple values, role text in parentheses removed.
actor.modify {substring(type=regex)|'description' "<strong>.+?</strong>"} *actor
description.modify {remove('actor' not "")|'actor'}
actor.modify {substring('actor' not "" type=regex)|"<strong>Medvirkende:\s(.+?),</strong>"}
actor.modify {replace('actor' not "")|,|\|} *make Multi
actor.modify {remove('actor' not "" type=regex)|\s\(.+?\)}
*
* Actors, fallback when the first attempt left actor empty: labelled <br> lines taken from the description.
actor.modify {substring('actor' "" type=regex)|'description' "(<br>.+?:\s.+?\.)*"} *actor
actor.modify {remove('actor' ~ "<br>")|\|}
description.modify {remove('actor' ~ "<br>")|'actor'}
actor.modify {substring('actor' ~ "<br>" type=regex)|"<br>.+?:(.+?)\."}
*
* Final description clean-up: drop remaining tags and the literal markers (t) and ...
description.modify {remove(type=regex)|<.+?>}
description.modify {remove| (t)}
description.modify {remove|...}
description.modify {cleanup}
description.modify {clear('title')}
end_scope
*
*
** _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
** ##### CHANNEL FILE CREATION (only to create the xxx-channel.xml file)
**
** @auto_xml_channel_start
*index_site_channel.scrub {multi|<table id="channels_selectors"><tr><td><select style='width:155px'>|">|</option>|</option></select></td></tr></table>}
*index_site_id.scrub {multi|<table id="channels_selectors"><tr><td><select style='width:155px'>|<option value="|">|</option></select></td></tr></table>}
*index_site_id.modify {cleanup(removeduplicates=equal,100 link="index_site_channel")}
** @auto_xml_channel_end