Skip to content

Commit 1cae0c1

Browse files
authored
Update VirtualRealPorn scraper (#549)
After a website change, only the 20 latest scenes were being scraped.
1 parent 30b5ac0 commit 1cae0c1

File tree

1 file changed

+11
-28
lines changed

1 file changed

+11
-28
lines changed

pkg/scrape/virtualrealporn.go

Lines changed: 11 additions & 28 deletions
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,6 @@ import (
1313
"github.com/thoas/go-funk"
1414
"github.com/tidwall/gjson"
1515
"github.com/xbapps/xbvr/pkg/models"
16-
"gopkg.in/resty.v1"
1716
)
1817

1918
func VirtualRealPornSite(wg *sync.WaitGroup, updateSite bool, knownScenes []string, out chan<- models.ScrapedScene, scraperID string, siteID string, URL string) error {
@@ -186,6 +185,11 @@ func VirtualRealPornSite(wg *sync.WaitGroup, updateSite bool, knownScenes []stri
186185
}
187186
})
188187

188+
siteCollector.OnHTML(`.searchBox option`, func(e *colly.HTMLElement) {
189+
pageURL := e.Request.AbsoluteURL(e.Attr("data-url"))
190+
siteCollector.Visit(pageURL)
191+
})
192+
189193
siteCollector.OnHTML(`a.w-portfolio-item-anchor`, func(e *colly.HTMLElement) {
190194
sceneURL := e.Request.AbsoluteURL(e.Attr("href"))
191195

@@ -195,35 +199,14 @@ func VirtualRealPornSite(wg *sync.WaitGroup, updateSite bool, knownScenes []stri
195199
}
196200
})
197201

198-
// Request scenes via ajax interface
199-
r, err := resty.R().
200-
SetHeader("User-Agent", userAgent).
201-
SetHeader("Accept", "application/json, text/javascript, */*; q=0.01").
202-
SetHeader("Referer", URL).
203-
SetHeader("X-Requested-With", "XMLHttpRequest").
204-
SetHeader("Authority", scraperID+".com").
205-
SetFormData(map[string]string{
206-
"action": "get_videos_list",
207-
"p": "1",
208-
"vpp": "1000",
209-
"sq": "",
210-
"so": "date-DESC",
211-
"pid": "8",
212-
}).
213-
Post("https://" + scraperID + ".com/wp-admin/admin-ajax.php")
214-
215-
if err == nil || r.StatusCode() == 200 {
216-
urls := gjson.Get(r.String(), "data.movies.#.permalink").Array()
217-
for i := range urls {
218-
sceneURL := urls[i].String()
219-
if !funk.ContainsString(knownScenes, sceneURL) {
220-
sceneCollector.Visit(sceneURL)
221-
}
222-
}
202+
if scraperID == "virtualrealamateur" {
203+
siteCollector.Visit(URL)
204+
} else if scraperID == "virtualrealgay" {
205+
siteCollector.Visit(URL + "porn-actor/")
206+
} else {
207+
siteCollector.Visit(URL + "porn-actress/")
223208
}
224209

225-
siteCollector.Visit(URL)
226-
227210
if updateSite {
228211
updateSiteLastUpdate(scraperID)
229212
}

0 commit comments

Comments
 (0)