mirror of
https://github.com/stashapp/CommunityScrapers.git
synced 2025-12-11 11:18:56 -06:00
Add XPath scraper for POVTrain
This commit is contained in:
parent
6cb2f13700
commit
a36daaff54
@ -1251,6 +1251,7 @@ povperverts.net|ThirdRockEnt.yml|:heavy_check_mark:|:x:|:x:|:x:|-|-
|
|||||||
povpornstars.com|hussiemodels.yml|:heavy_check_mark:|:x:|:x:|:x:|-|-
|
povpornstars.com|hussiemodels.yml|:heavy_check_mark:|:x:|:x:|:x:|-|-
|
||||||
povr.com|POVR.yml|:heavy_check_mark:|:x:|:x:|:x:|-|VR
|
povr.com|POVR.yml|:heavy_check_mark:|:x:|:x:|:x:|-|VR
|
||||||
povthis.com|GammaEntertainment.yml|:heavy_check_mark:|:x:|:x:|:x:|-|-
|
povthis.com|GammaEntertainment.yml|:heavy_check_mark:|:x:|:x:|:x:|-|-
|
||||||
|
povtrain.com|POVTrain.yml|:heavy_check_mark:|:x:|:x:|:x:|-|-
|
||||||
prettydirty.com|Algolia_Adultime.yml|:heavy_check_mark:|:heavy_check_mark:|:x:|:x:|Python|-
|
prettydirty.com|Algolia_Adultime.yml|:heavy_check_mark:|:heavy_check_mark:|:x:|:x:|Python|-
|
||||||
prettydirtyteens.com|Deviante/Deviante.yml|:heavy_check_mark:|:heavy_check_mark:|:heavy_check_mark:|:heavy_check_mark:|Python|-
|
prettydirtyteens.com|Deviante/Deviante.yml|:heavy_check_mark:|:heavy_check_mark:|:heavy_check_mark:|:heavy_check_mark:|Python|-
|
||||||
pridestudios.com|Algolia_MenOver30.yml|:heavy_check_mark:|:heavy_check_mark:|:x:|:x:|Python|Gay
|
pridestudios.com|Algolia_MenOver30.yml|:heavy_check_mark:|:heavy_check_mark:|:x:|:x:|Python|Gay
|
||||||
|
|||||||
58
scrapers/POVTrain.yml
Normal file
58
scrapers/POVTrain.yml
Normal file
@ -0,0 +1,58 @@
|
|||||||
|
name: POV Train
|
||||||
|
sceneByURL:
|
||||||
|
- action: scrapeXPath
|
||||||
|
url:
|
||||||
|
- povtrain.com/tour/trailer.php?id=
|
||||||
|
scraper: sceneScraper
|
||||||
|
sceneByName:
|
||||||
|
action: scrapeXPath
|
||||||
|
queryURL: https://www.povtrain.com/tour/search.php?query={}
|
||||||
|
scraper: sceneSearch
|
||||||
|
sceneByQueryFragment:
|
||||||
|
action: scrapeXPath
|
||||||
|
queryURL: "{url}"
|
||||||
|
scraper: sceneScraper
|
||||||
|
xPathScrapers:
|
||||||
|
sceneSearch:
|
||||||
|
scene:
|
||||||
|
Title: //ul[@class="slides"]/li//h3
|
||||||
|
URL: //ul[@class="slides"]/li/a/@href
|
||||||
|
Date:
|
||||||
|
selector: //ul[@class="slides"]/li//comment()[contains(., "Date")]
|
||||||
|
postProcess: &parseDate
|
||||||
|
- replace:
|
||||||
|
- regex: .*</strong>\s*(.*)<.*
|
||||||
|
with: $1
|
||||||
|
- parseDate: January 2, 2006
|
||||||
|
Image:
|
||||||
|
selector: //ul[@class="slides"]/li/a/img/@src
|
||||||
|
postProcess:
|
||||||
|
- replace:
|
||||||
|
- regex: ^
|
||||||
|
with: https://povtrain.com/
|
||||||
|
sceneScraper:
|
||||||
|
scene:
|
||||||
|
Title: //h2
|
||||||
|
Details: //div[@class="desc"]/p
|
||||||
|
Date:
|
||||||
|
selector: //comment()[contains(., "Date Added")]
|
||||||
|
postProcess: *parseDate
|
||||||
|
Image:
|
||||||
|
# Sometimes they put the preview image in a script tag, sometimes it's an actual img
|
||||||
|
selector: //script[contains(., "image:")]/text() | //div[contains(@class, "alpha")]//img[contains(@id, "set-target")]/@src
|
||||||
|
postProcess:
|
||||||
|
- replace:
|
||||||
|
# This regex will only match when we have a script tag
|
||||||
|
# and gives the same result as the img tag, a relative URL
|
||||||
|
- regex: .*image:\s*"([^"]+).*
|
||||||
|
with: $1
|
||||||
|
- regex: ^
|
||||||
|
with: https://povtrain.com
|
||||||
|
Studio:
|
||||||
|
Name:
|
||||||
|
fixed: POV Train
|
||||||
|
Tags:
|
||||||
|
Name: //h5[@class="video_categories"]/a
|
||||||
|
Performers:
|
||||||
|
Name: //h5[@class="featuring_model"]/a
|
||||||
|
# Last Updated March 10, 2024
|
||||||
Loading…
x
Reference in New Issue
Block a user