-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathBaDoink.yml
127 lines (127 loc) · 4.44 KB
/
BaDoink.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
# XPath scraper definition for the BaDoink family of sites.
name: "BaDoink"

# Scene pages on any of the listed domains are handled by sceneScraper.
sceneByURL:
  - action: scrapeXPath
    # Anchored as &urls so performerByURL and movieByURL can alias the same
    # domain list instead of repeating it.
    url: &urls
      - 18vr.com
      - babevr.com
      - badoinkvr.com
      - kinkvr.com
      - realvr.com
      - vrcosplayx.com
    scraper: sceneScraper
# Performer pages on the same domains (alias of the &urls list) are handled
# by performerScraper.
performerByURL:
  - action: scrapeXPath
    url: *urls
    scraper: performerScraper
# Movie lookups on the same domains (alias of the &urls list) are handled
# by movieScraper.
movieByURL:
  - action: scrapeXPath
    url: *urls
    scraper: movieScraper
# Uncomment this section to enable Performer Search on this scraper
# performerByName:
#   action: scrapeXPath
#   queryURL: https://kinkvr.com/bdsm-performers/search/{}?all=1
#   scraper: performerSearch
# XPath scraper definitions referenced by name from the sceneByURL,
# performerByURL and movieByURL entries.
xPathScrapers:
  # Extracts scene metadata from a video page.
  sceneScraper:
    common:
      # Container element for the date, description, tags and performers;
      # anchored so movieScraper can reuse the same selector.
      $details: &detailsAttr //div[@class="video-rating-and-details"]
    scene:
      Title: //h1[@class="heading heading--2 video-title video-actions-title"]/text()
      Date: &dateSel
        selector: $details//p[@class="video-upload-date"]/text()
        postProcess:
          # Remove the "Uploaded: " label so only the date text remains.
          - replace:
              - regex: Uploaded:\s
                with: ""
          # Layout: full month name, two-digit day, four-digit year.
          - parseDate: January 02, 2006
      Details: &detailsSel $details//p[@class="video-description"]/text()
      Tags:
        Name: $details//p[@class="video-tags"]//a/text()
      Performers:
        Name: $details//p[@class="video-actors"]/a/text()
      Studio:
        Name: &studioName
          selector: //meta[@name="dl8-customization-brand-name"]/@content
          postProcess:
            # Rewrite the exact brand string "BaDoink VR" to "BaDoinkVR";
            # any other brand name passes through unchanged.
            - replace:
                - regex: ^BaDoink VR$
                  with: "BaDoinkVR"
        # Alternative without the brand-name rewrite:
        # Name: &studioName //meta[@name="dl8-customization-brand-name"]/@content
      Image: &imageSel
        selector: //img[@class="video-image"]/@src
        postProcess:
          # Strip the query string from the image URL.
          - replace:
              - regex: \?.+
                with: ""
      URL: //link[@rel='canonical']/@href

  # Uncomment this section to use Performer Search on this scraper
  # performerSearch:
  #   common:
  #     $girlA: //div[@class="girl-card-info"]/a
  #   performer:
  #     Name: $girlA/span
  #     URL:
  #       selector: $girlA/@href
  #       postProcess:
  #         - replace:
  #             - regex: .*badoinkvr\.com/girl/redirect/([^\?]+).+
  #               with: https://badoinkvr.com/vr-pornstar/$1
  #             - regex: .*vrcosplayx\.com/girl/redirect/([^\?]+).+
  #               with: https://vrcosplayx.com/cosplaygirl/$1
  #             - regex: .*18vr\.com/girl/redirect/([^\?]+).+
  #               with: https://18vr.com/vrgirl/$1
  #             - regex: .*babesvr\.com/girl/redirect/([^\?]+).+
  #               with: https://babevr.com/vrbabe/$1
  #             - regex: .*realvr\.com/girl/redirect/([^\?]+).+
  #               with: https://realvr.com/pornstar/$1
  #             - regex: ^/
  #               with: https://kinkvr.com/

  # Extracts performer metadata from a performer profile page.
  performerScraper:
    common:
      # Attribute list; each field below picks the <li> whose span contains
      # the label text and reads the span whose class contains "value".
      $stats: //ul[@id='girlOptionDetails']
    performer:
      Name: //div[@class='girl-details-info']/h1/text()
      Gender:
        fixed: female
      URL: //link[@rel='canonical']/@href
      Twitter: //a[contains(@class,'social-media') and contains (@href,'twitter')]/@href
      Instagram: //a[contains(@class,'social-media') and contains (@href,'instagram')]/@href
      Ethnicity:
        selector: $stats/li[span[contains(.,'Ethnicity')]]/span[contains(@class,'value')]/text()
        postProcess:
          # Translate the site's ethnicity labels to lowercase values.
          - map:
              Caucasian: white
              Asian: asian
              Black: black
              Latin: hispanic
      Country: $stats/li[span[contains(.,'Country')]]/span[contains(@class,'value')]/text()
      EyeColor: $stats/li[span[contains(.,'Eyes')]]/span[contains(@class,'value')]/text()
      Height:
        selector: $stats/li[span[contains(.,'Height')]]/span[contains(@class,'value')]/text()
        postProcess:
          # Presumably the page lists height in feet/inches; confirm against
          # a live profile page.
          - feetToCm: true
      Measurements: $stats/li[span[contains(.,'Measure')]]/span[contains(@class,'value')]/text()
      Aliases: $stats/li[span[contains(.,'Aka')]]/span[contains(@class,'value')]/text()
      Image: //img[@id='girlImage']/@src

  # Builds a movie entry from the same video page layout used by
  # sceneScraper, reusing its anchored selectors.
  movieScraper:
    common:
      $details: *detailsAttr
    movie:
      Name:
        # Union of the brand-name meta tag and the details heading; the
        # matched values are joined with " - ".
        selector: //meta[@name="dl8-customization-brand-name"]/@content|$details/h1/text()
        concat: " - "
      Duration:
        selector: $details//p[@class="video-duration"]/text()
        postProcess:
          # Remove the "Duration: " label and turn the trailing " min" into
          # ":00", e.g. "Duration: 45 min" -> "45:00".
          - replace:
              - regex: Duration:\s
                with: ""
              - regex: \smin
                with: ":00"
      Date: *dateSel
      Synopsis: *detailsSel
      Studio:
        Name: *studioName
      FrontImage: *imageSel
# Last Updated October 03, 2021