From cfbbcf4ed2e0229ca5c0a3489a7340e23dd7c48e Mon Sep 17 00:00:00 2001
From: nrg101
Date: Wed, 8 Jan 2025 18:54:58 +0000
Subject: [PATCH] make Code regex work for old video URLs; simplify date parsing in scene scraper

---
Note: line breaks and YAML indentation in this patch were restored from a
whitespace-collapsed copy. If the context lines do not match the target
file, apply with `git apply --ignore-whitespace`.

 scrapers/RealJamVR.yml | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/scrapers/RealJamVR.yml b/scrapers/RealJamVR.yml
index f6a94dfcf..de9f9ca73 100644
--- a/scrapers/RealJamVR.yml
+++ b/scrapers/RealJamVR.yml
@@ -28,10 +28,9 @@ xPathScrapers:
       Date: &date
         selector: //div[@class="specs-icon"]/following-sibling::strong
         postProcess:
-          - replace:
-              - regex: ^([a-zA-Z]{3})\D*(\d{1,2},\s*\d+)$
-                with: $1. $2
+          # both date formats are used interchangeably
           - parseDate: Jan. 2, 2006
+          - parseDate: January 2, 2006
       Performers: &performers
         Name: //div[contains(@class,"scene-view")]/a[contains(@href,"/actor/")]
       Tags: &tags
@@ -59,6 +58,8 @@ xPathScrapers:
           - replace:
               - regex: .*/scenes/(\d+)/.*
                 with: $1
+              - regex: .*/videos_app/\w+/(\d+)_.*
+                with: $1
     gallery:
       Title: *title
       Date: *date