Merge branch 'stashapp:master' into wallhaven-imageByFragtment

spaceyuck · web-flow · commit cc05b012bdbf · 2025-10-26T07:45:39.000Z
diff --git a/scrapers/MadBrosX.yml b/scrapers/MadBrosX.yml
@@ -0,0 +1,32 @@
+# yaml-language-server: $schema=https://raw.githubusercontent.com/stashapp/CommunityScrapers/refs/heads/master/validator/scraper.schema.json
+name: "MadBrosX"
+# scrapes: MadBros
+
+sceneByURL:
+  - action: scrapeXPath
+    url:
+      - madbrosx.com
+    scraper: madbrosx
+
+xPathScrapers:
+  madbrosx:
+    scene:
+      Title: //h3[@class = "page-heading"]/span/@title
+      Date:
+        selector: //div[@class = "video_page-sub-head__DqmKK"]//span[@aria-label = "calendar"]/../text()
+        postProcess:
+        - parseDate: January 2, 2006
+      Details:
+        selector: //div[@id = "rc-tabs-1-panel-description"]/p/text()
+        postProcess:
+        - replace:
+            - regex: "^No description$"
+              with: ""
+      Performers:
+        Name: //h4[@class = "ant-list-item-meta-title"]//a[contains(@href, "model")]/text()
+      Studio:
+        Name:
+          fixed: Madbros
+      Image: //meta[@property = "og:image"]/@content
+      Tags:
+        Name: //span[@class = "ant-tag"]/a/text()
diff --git a/scrapers/MilkyPeru.yml b/scrapers/MilkyPeru.yml
@@ -0,0 +1,26 @@
+# yaml-language-server: $schema=https://raw.githubusercontent.com/stashapp/CommunityScrapers/refs/heads/master/validator/scraper.schema.json
+name: "Milky Peru"
+sceneByURL:
+  - action: scrapeXPath
+    url:
+      - milkyperu.com
+    scraper: milkyperu
+
+xPathScrapers:
+  milkyperu:
+    scene:
+      Title:
+        selector: //meta[@property = "og:title"]/@content
+        postProcess:
+        - replace:
+          - regex: "[. -]+$"
+            with: ""
+      URLs: //meta[@property = "og:url"]/@content
+      Date:
+        selector: //meta[@property = "article:published_time"]/@content
+        postProcess:
+        - parseDate: 2006-01-02T15:04:05-07:00
+      Details: //div[@data-elementor-type="wp-post"]//div[@class="elementor-widget-container"]/h2[contains(@class, "elementor-heading-title")]//text()
+      Studio:
+        Name: //meta[@property = "og:site_name"]/@content
+      Image: //meta[@property = "og:image"]/@content
diff --git a/scrapers/MissAV_en.yml b/scrapers/MissAV_en.yml
@@ -2,7 +2,9 @@ name: MissAV (en)
 sceneByURL:
   - action: scrapeXPath
     url:
-      - missav.com
+      - missav.ai
+      - missav.ws
+      - missav.live
     scraper: sceneScraper
 sceneByName:
   action: scrapeXPath
diff --git a/scrapers/MissAV_jp.yml b/scrapers/MissAV_jp.yml
@@ -2,7 +2,9 @@ name: MissAV (jp)
 sceneByURL:
   - action: scrapeXPath
     url:
-      - missav.com
+      - missav.ai
+      - missav.ws
+      - missav.live
     scraper: sceneScraper
 sceneByName:
   action: scrapeXPath
diff --git a/scrapers/Motherless.yml b/scrapers/Motherless.yml
@@ -36,8 +36,9 @@ xPathScrapers:
   sceneScraper:
     common:
       $meta: //div[@class='media-meta']
+      $error: //div[contains(@class,'error-page view-page')]
     scene:
-      Title: $meta//h1/text()
+      Title: $error/h1 | $meta//h1/text()
       Date:
         selector: $meta//div[@class='media-meta-stats']/span[not(contains(.,'Views')) and not(contains(.,'Favorites'))]/text()
         postProcess:
@@ -66,4 +67,4 @@ xPathScrapers:
             - replace:
                 - regex: \#
                   with:
-# Last Updated April 01, 2025
+# Last Updated October 17, 2025
diff --git a/scrapers/OopsFamily/OopsFamily.yml b/scrapers/OopsFamily/OopsFamily.yml
@@ -12,7 +12,7 @@ xPathScrapers:
         Name:
           fixed: "Oops Family"
       Title:
-        selector: //h1[@class = 'video-detail__title']//text()
+        selector: //div[@class="video-detail__title"]/text()
       Details:
         selector: //div[@data-id="description" and @class="hidden"]//text()
       Tags:
@@ -32,4 +32,4 @@ xPathScrapers:
             - regex: (.*) • (.*)
               with: $2
           - parseDate: "2 January, 2006"
-# Last Updated December 29, 2023
+# Last Updated October 17, 2025
diff --git a/scrapers/Perverformer.yml b/scrapers/Perverformer.yml
@@ -7,7 +7,7 @@ sceneByURL:
 xPathScrapers:
   sceneScraper:
     common:
-      $tags: //main/div[@class="columns"]/div[@class="secondary"]/div[@class="area"]/p/span[@class="nowrap"]
+      $tags: //main/div[@class="columns"]/div[@class="secondary"]/div[@class="area"]/div/div[@class="tag-cloud"]/div
     scene:
       Title:
         selector: //main/div[@class="heading"]/h1
@@ -32,4 +32,4 @@ xPathScrapers:
       Studio:
         Name:
           fixed: Perverformer
-# Last Updated September 21, 2025
+# Last Updated October 04, 2025
diff --git a/scrapers/ScrapeWithURL/ScrapeWithURL.py b/scrapers/ScrapeWithURL/ScrapeWithURL.py
@@ -73,12 +73,20 @@ def scrape_scene(url):
 
 
 FRAGMENT = json.loads(sys.stdin.read())
-url = FRAGMENT.get("url")
+urls = FRAGMENT.get("urls")
 
-if url:
-    result = scrape_scene(url)
-    result = filter_nones(result)
-    log.debug(f"result {result}")
-    print(json.dumps(result))
+for url in urls:
+    if not url.startswith('http'):
+      continue # skip urls that don't start with http
+    else:
+        try:
+            result = scrape_scene(url)
+            result = filter_nones(result)
+            log.debug(f"result {result}")
+            print(json.dumps(result))
+            if result:
+                break
+        except Exception:
+            continue
 else:
     print("null")
diff --git a/scrapers/ScrapeWithURL/ScrapeWithURL.yml b/scrapers/ScrapeWithURL/ScrapeWithURL.yml
@@ -6,4 +6,4 @@ sceneByFragment:
   script:
     - python
     - ScrapeWithURL.py
-# Last Updated December 20, 2024
+# Last Updated October 19, 2025
diff --git a/scrapers/SexLikeReal.yml b/scrapers/SexLikeReal.yml
@@ -7,73 +7,67 @@ sceneByURL:
       - sexlikereal.com
     scraper: sceneScraper
 
-sceneByFragment:
-  action: scrapeXPath
-  # url format: https://www.sexlikereal.com/scenes/{title}-{code}
-  # However, the url:
-  #     https://www.sexlikereal.com/{code}
-  # will redirect to the full url so that is what we will use for scrapping
-  queryURL: https://www.sexlikereal.com/{filename}
-  queryURLReplace:
-    # filename format:
-    #   SLR_{stufio:[^_]+}_{title:[^_]+}_{res:\d+p}_{code:\d+}_{vrtype}.{ext}
-    #     vrtype: stuff we do not care about but could contain '_'
-    filename:
-      - regex: (?i)^SLR_.+(?:_\d+p)?_(\d+)_.*$
-        with: $1
-      - regex: .*\.[^\.]+$ # if no id is found in the filename
-        with: # clear the filename so that it doesn't leak
-  scraper: sceneScraper
+# As of 2025-10-24 the code-only link no longer works, either under /scenes/ or under /, so sceneByFragment is disabled below
+
+# sceneByFragment:
+#   action: scrapeXPath
+#   # url format: https://www.sexlikereal.com/scenes/{title}-{code}
+#   # However, the url:
+#   #     https://www.sexlikereal.com/{code}
+#   # will redirect to the full url so that is what we will use for scraping
+#   queryURL: https://www.sexlikereal.com/{filename}
+#   queryURLReplace:
+#     # filename format:
+#     #   SLR_{studio:[^_]+}_{title:[^_]+}_{res:\d+p}_{code:\d+}_{vrtype}.{ext}
+#     #     vrtype: stuff we do not care about but could contain '_'
+#     filename:
+#       - regex: (?i)^SLR_.+(?:_\d+p)?_(\d+)_.*$
+#         with: $1
+#       - regex: .*\.[^\.]+$ # if no id is found in the filename
+#         with: # clear the filename so that it doesn't leak
+#   scraper: sceneScraper
 
 xPathScrapers:
   sceneScraper:
+    common:
+      $ldjson: //script[@type="application/ld+json"][contains(text(), '"@type":"VideoObject"')]/text()
     scene:
       Title:
-        selector: //script[@type="text/javascript"][contains(.,"videoData:")]/text()
+        selector: //h1
+      Date:
+        selector: //p/time[@datetime][not(@data-hk)]/@datetime
         postProcess:
           - replace:
-              - regex: '.+videoData:\s{[^{]+title":"([^"]+)",.+'
-                with: $1
-              - regex: '\\u2019'
-                with: "’"
-              - regex: '\\u2013'
-                with: "–"
-      Date: //time/@datetime
+            - regex: "T.+"
+              with: ""
+          - parseDate: 2006-01-02
       Details:
-        selector: //div[@data-qa="scene-about-tab-text"]/text()
+        selector: $ldjson
         postProcess:
           - replace:
-              - regex: '^\.\s*'
-                with:
-        concat: "\n"
+              - regex: .*"description":\s?"([^"]+).+
+                with: $1
+              - regex: "^'|'\\r\\n"
+                with: ""
+              - regex: '\\r\\n\\r\\n'
+                with: "\n\n"
+      # fragile but it works
       Tags:
-        Name: >-
-          //meta[@property="video:tag"]/@content
-          |
-          //a[@data-qa="scene-tags-list-item-link"]/text()
+        Name: //div/ul/li/a/span
       Performers:
-        Name: //a[contains(@data-qa, "scene-model-list-item-name")]/text()
+        Name: //a[starts-with(@href,"/pornstars/")]/text()
       Studio:
         Name:
-          selector: //a[contains(@href,"/studios/")]/div[last()]/text()
+          selector: //h3/a[starts-with(@href,"/studios/")]/text()
           postProcess:
             - map:
                 DDFNetworkVR: "DDF Network VR"
                 KinkyGirlsBerlin: "Kinky Girls Berlin"
                 LethalHardcoreVR: "Lethal Hardcore VR"
                 LittleCapriceVR: "Little Caprice Dreams Virtual Reality"
-                LustReality: "LustReality"
                 POVcentralVR: "POV Central"
-                RealHotVR: "RealHotVR"
                 SinsVR: "XSinsVR"
                 VirtualXPorn: "Virtual X Porn"
                 WankitnowVR: "Wank It Now VR"
-      Image: //div[@id="webvr"]//img/@src
-      URL: &sceneUrl //link[@rel="canonical"]/@href
-      Code:
-        selector: *sceneUrl
-        postProcess:
-          - replace:
-              - regex: '^(.+)-(\d+)/?$'
-                with: $2
-# Last Updated May 22, 2025
+      Image: /html/head/meta[@property="og:image"]/@content
+# Last Updated October 24, 2025
diff --git a/scrapers/Teamskeet/Teamskeet.yml b/scrapers/Teamskeet/Teamskeet.yml
@@ -5,14 +5,13 @@ sceneByURL:
   - url:
       - sayuncle.com/movies/
       - teamskeet.com/movies/
-      - app.teamskeet.com/movies/
       - mylf.com/movies/
       - mylf.com/b/movies/
-      - app.mylf.com/movies/
       - swappz.com/movies/
       - freeuse.com/movies/
+      - app.reptyle.com/movies/
     action: script
     script:
       - python
       - TeamskeetAPI.py
-# Last Updated June 23, 2025
+# Last Updated October 24, 2025
diff --git a/scrapers/Teamskeet/TeamskeetAPI.py b/scrapers/Teamskeet/TeamskeetAPI.py
@@ -10,8 +10,7 @@
 
 ### SET MEMBER ACCESS TOKEN HERE
 ### CAN BE access_token OR refresh_token
-TEAMSKEET_ACCESS_TOKEN = ""
-MYLF_ACCESS_TOKEN = ""
+REPTYLE_ACCESS_TOKEN = ""
 ####
 
 scraper = cloudscraper.create_scraper()
@@ -133,17 +132,11 @@ def save_json(api_json, url):
 
 IS_MEMBER = False
 # Check the URL and set the API URL
-if "app.teamskeet.com" in scene_url:
-    ORIGIN = "https://app.teamskeet.com"
-    REFERER = "https://app.teamskeet.com"
-    API_BASE = "https://ma-store.teamskeet.com/ts_index/_doc/movie-"
-    MEMBER_ACCESS_TOKEN = TEAMSKEET_ACCESS_TOKEN
-    IS_MEMBER = True
-elif "app.mylf.com" in scene_url:
-    ORIGIN = "https://app.mylf.com"
-    REFERER = "https://app.mylf.com"
-    API_BASE = "https://ma-store.mylf.com/mylf_movies/_doc/"
-    MEMBER_ACCESS_TOKEN = MYLF_ACCESS_TOKEN
+if "app.reptyle.com" in scene_url:
+    ORIGIN = "https://app.reptyle.com"
+    REFERER = "https://app.reptyle.com"
+    API_BASE = "https://ma-store.reptyle.com/ts_index/_doc/movie-"
+    MEMBER_ACCESS_TOKEN = REPTYLE_ACCESS_TOKEN
     IS_MEMBER = True
 elif "sayuncle.com" in scene_url:
     ORIGIN = "https://www.sayuncle.com"
diff --git a/scrapers/VRPorn.yml b/scrapers/VRPorn.yml
@@ -8,7 +8,7 @@ sceneByURL:
     scraper: sceneScraper
 sceneByName:
   action: scrapeXPath
-  queryURL: https://vrporn.com/?s={}
+  queryURL: https://vrporn.com/search/videos/?query={}
   scraper: sceneSearch
 sceneByQueryFragment:
   action: scrapeXPath
@@ -17,42 +17,28 @@ sceneByQueryFragment:
 
 xPathScrapers:
   sceneScraper:
-    common:
-      $header: //header[@class="entry-header"]
-      $footer: //footer[@class="entry-footer"]
-      $videoarea: //footer[@class="entry-footer"]/div[@class="layout_area_video"]
     scene:
-      Title: $header//h1[contains(@class,"content-title")]
+      Title: //h1
       Date:
-        selector: $footer//span[@class="footer-titles"]/text()
+        selector: //span[contains(@class,"ui-player-title__sub-text")][@data-allow-mismatch]
         postProcess:
-          - replace:
-              - regex: Posted on (?:Premium on )?(.*)
-                with: $1
-          - parseDate: January 02, 2006
+          - parseDate: Jan 02 2006
       Details:
-        selector: //div[contains(@class, "post-video-description")]//p/text()
+        selector: //div[@class="app-comment-item__content-textarea"]/text()
         concat: "\n"
       Tags:
-        Name: $footer//a[@rel="tag"]
+        Name: //div[contains(@class,"tags")]//a/text()
       Performers:
-        Name: $header/following-sibling::*//div[@class="name_pornstar"]
+        Name: //a[@class="ui-card-model__name"]/text()
       Studio:
-        Name: //a[@id="studio-logo"]//span[@class="footer-titles"]
+        Name: //div[contains(@class,"studio")]/a/@title
       Image:
-        selector: //dl8-video/@poster
-        postProcess:
-          - replace:
-              - regex: (.*)(-\d+x\d+)(\.\w+$)
-                with: $1$3
+        selector: //meta[@property="og:image:url"]/@content
       URL: //link[@rel="canonical"]/@href
   sceneSearch:
     common:
-      $videos: //div[@class="entry-footer all_hover box_item_video"]
+      $card: //article
     scene:
-      Title: $videos//div[@class="d_post_meta"]/a
-      URL: $videos//div[@class="d_post_meta"]/a/@href
-      Image: $videos//div[@class="tube-thumbnail-wrapper"]/img/@src
-      Studio:
-        Name: $videos//div[@class="d_post_meta"]//span[@class="left_links"]
-# Last Updated January 10, 2025
+      Title: $card/header/a/@title
+      URL: $card/header/a/@href
+# Last Updated October 17, 2025
diff --git a/scrapers/gelbooru-xpath.yml b/scrapers/gelbooru-xpath.yml