Skip to content

Commit 6fcbf08

Browse files
author
Jorrit Poelen
committed
add test for likely bot detection page; #336 (comment)
1 parent 7b7c1f6 commit 6fcbf08

File tree

2 files changed

+29
-0
lines changed

2 files changed

+29
-0
lines changed

preston-track/src/test/java/bio/guoda/preston/process/SciELOSoftRedirectorTest.java

Lines changed: 28 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -52,6 +52,34 @@ public InputStream get(IRI key) throws IOException {
5252
assertThat(redirectedTo.getPredicate(), is(HAS_VERSION));
5353
assertThat(RefNodeFactory.isBlankOrSkolemizedBlank(redirectedTo.getObject()), is(true));
5454
}
55+
56+
@Test
57+
public void onSoftRedirectChile() {
58+
// see https://github.com/bio-guoda/preston/issues/336#issuecomment-3005353035
59+
// no soft redirect present likely due to cloudflare bot wall
60+
BlobStoreReadOnly blobStore = new BlobStoreReadOnly() {
61+
@Override
62+
public InputStream get(IRI key) throws IOException {
63+
return getClass().getResourceAsStream("scielo-redirect-chile.html");
64+
}
65+
};
66+
ArrayList<Quad> nodes = new ArrayList<>();
67+
SciELOSoftRedirector registryReader = new SciELOSoftRedirector(
68+
blobStore,
69+
TestUtilForProcessor.testListener(nodes)
70+
);
71+
Quad redirectResource = toStatement(
72+
toIRI("https://www.scielo.org.ar/scielo.php?script=sci_pdf&pid=S1667-782X2007000100006"),
73+
HAS_VERSION,
74+
createTestNode()
75+
);
76+
77+
registryReader.on(redirectResource);
78+
79+
assertThat(nodes.size(), is(0));
80+
}
81+
82+
5583
@Test
5684
public void onPDF() {
5785
BlobStoreReadOnly blobStore = new BlobStoreReadOnly() {
Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
<!DOCTYPE html><html lang="en-US"><head><title>Just a moment...</title><meta http-equiv="Content-Type" content="text/html; charset=UTF-8"><meta http-equiv="X-UA-Compatible" content="IE=Edge"><meta name="robots" content="noindex,nofollow"><meta name="viewport" content="width=device-width,initial-scale=1"><style>*{box-sizing:border-box;margin:0;padding:0}html{line-height:1.15;-webkit-text-size-adjust:100%;color:#313131;font-family:system-ui,-apple-system,BlinkMacSystemFont,Segoe UI,Roboto,Helvetica Neue,Arial,Noto Sans,sans-serif,Apple Color Emoji,Segoe UI Emoji,Segoe UI Symbol,Noto Color Emoji}body{display:flex;flex-direction:column;height:100vh;min-height:100vh}.main-content{margin:8rem auto;max-width:60rem;padding-left:1.5rem}@media (width <= 720px){.main-content{margin-top:4rem}}.h2{font-size:1.5rem;font-weight:500;line-height:2.25rem}@media (width <= 720px){.h2{font-size:1.25rem;line-height:1.5rem}}#challenge-error-text{background-image:url(data:image/svg+xml;base64,PHN2ZyB4bWxucz0iaHR0cDovL3d3dy53My5vcmcvMjAwMC9zdmciIHdpZHRoPSIzMiIgaGVpZ2h0PSIzMiIgZmlsbD0ibm9uZSI+PHBhdGggZmlsbD0iI0IyMEYwMyIgZD0iTTE2IDNhMTMgMTMgMCAxIDAgMTMgMTNBMTMuMDE1IDEzLjAxNSAwIDAgMCAxNiAzbTAgMjRhMTEgMTEgMCAxIDEgMTEtMTEgMTEuMDEgMTEuMDEgMCAwIDEtMTEgMTEiLz48cGF0aCBmaWxsPSIjQjIwRjAzIiBkPSJNMTcuMDM4IDE4LjYxNUgxNC44N0wxNC41NjMgOS41aDIuNzgzem0tMS4wODQgMS40MjdxLjY2IDAgMS4wNTcuMzg4LjQwNy4zODkuNDA3Ljk5NCAwIC41OTYtLjQwNy45ODQtLjM5Ny4zOS0xLjA1Ny4zODktLjY1IDAtMS4wNTYtLjM4OS0uMzk4LS4zODktLjM5OC0uOTg0IDAtLjU5Ny4zOTgtLjk4NS40MDYtLjM5NyAxLjA1Ni0uMzk3Ii8+PC9zdmc+);background-repeat:no-repeat;background-size:contain;padding-left:34px}@media (prefers-color-scheme:dark){body{background-color:#222;color:#d9d9d9}}</style><meta http-equiv="refresh" content="360"></head><body><div class="main-wrapper" role="main"><div class="main-content"><noscript><div class="h2"><span id="challenge-error-text">Enable JavaScript and cookies to continue</span></div></noscript></div></div><script>(function(){window._cf_chl_opt={cvId: '3',cZone: "www.scielo.cl",cType: 'managed',cRay: '9555c1ce59dd4ca0',cH: 'hGyr4R5T4m777NbKfUPdExvpthrcWEakq1cfv3EYC1w-1750868057-1.2.1.1-MnWu3_bC8QtP5zeFBo8jZBY0px7KcksH7n_A8Wg7ALvPcgdNYbE9LCX.0dK048eY',cUPMDTk: "\/scielo.php?script=sci_pdf&pid=S0718-19572015000100003&__cf_chl_tk=h8oZ.asLWjEKSyTAZp5S5SuO6sYTnnhctdap2U6IWws-1750868057-1.0.1.1-FYBndL1XNS2wjBYbOPt98LlZVYH3LEau37oEkEA164E",cFPWv: 'b',cITimeS: '1750868057',cTplC: 0,cTplV: 5,cTplB: 'cf',fa: "\/scielo.php?script=sci_pdf&pid=S0718-19572015000100003&__cf_chl_f_tk=h8oZ.asLWjEKSyTAZp5S5SuO6sYTnnhctdap2U6IWws-1750868057-1.0.1.1-FYBndL1XNS2wjBYbOPt98LlZVYH3LEau37oEkEA164E",md: "sZLk7vrErNCc.jTg.tUcOWayjvNhqCI.9nziHhgTWk4-1750868057-1.2.1.1-2yBuBsdT9g6SgfWsixLb6BcbpfHzbT6LoYfhwjv43xdi5v32GizyY099F7emgjbghkXYDvoas1YpTDGFei5LGGWRdHTG3rpKQXxXk9ryKTWJF8vXKiXElYoojej5CNI9FVwZioDhlKjRCpBJ1h1AmhSTyQuCeoFL3pgRW8qjY.VSMSkuWZBO8B6YywJiQujgHpET0z.dVZQ1hrDpaUEVwwK1lP0iGUlwrI8_ogH4MVAy9blzy5Is45ukc7VB9O_SRKOrGFhxHqF22E705PiRg9sD_R0ZBj4NgjYiiDw9K.pS8jDo8LYdVOgoWfzF9_NnqSW71Z3se8kfk7PnAlTIUu3LZJOWrOSx6x2PN5XUtXC_KwbhsRx0gaJEBNSni8oJu5YDwDqDq6fLsTt0IgnaOk.Ue0W0qZ56u4Ym28XDqLx2oroEzx5DYkMn9Z_GQsmeX5eGfhXzf9KVXLRjUHzPMklOOdOTtYdS3MB9YmLYsqjnm3gWnivFfrJa7dhYqi2xIi6yBs9ZpoVI3dToL7SjPhPsmuRO9FFpRBQ4A82Jkw94vnAXnyelvwT.6lcAjDPYDfi_2y.nO6LB55yV1ti0s.qJ9Pf6XFm3DLiTxUuZ9Fxave9Tlmc9c90pjRgvOCsVKj12pMWda85V2kAJPtH.gZaJ7JFebt_3wmHUqGYiXls7WYnpKJ2URMNlSoazH3XwmD4ig5NZaduez1submyA45oEdlp1phMXOO4AVJsBe2MqsAn2P1pLL5f1ThKHMrAHLqiiyP1tia0mnySdtHIiggUjl.DwMUaSt8.w.RTB7pOXnxScT5XR1VLJw5qrpX14L9MvBjHl5umQO.d17JZ6BeUHs44PHvrk38nKrMKPjtCSBNKPcPpLjNVe2nPOcCJNGsvxzyz5V2qMcUxvpoSb.27MuIWL2yvxweHuNnMiO0ndwdPo_KF4CGjywtdtH2x8JhwvUZIw.HQw5nYFGbxsaSw2.jAxjZ745TQCoKVO_6kMQi1xNS4QVzhe5QsV9QplpNnjI8lDpLKo67r5VY5W0nj3UaQ_ZXMWHn.HxNOSn9tfLKqezIjGIC4aRPCI9JE3G8QKri.bPXXNaCuPuSA2MS97r9aV6MBx4huDWT5_yQRa__xfGkOYEehE1I2C5Ao5xWkMMCnFdC4vp.cZGnbGZLkd8TpgKe17u5knHqrXfns",mdrd: "5p3eMGrB2pQXDzq3CFeQ4.ZQMwO5mC6_xUqhxJqISwU-1750868057-1.2.1.1-Loy56cJAao8is6MijHadtP8zYEfzPhBKlG1iVGGSQTqpuKWLCPDEE60lztcADZIMxr4z6bo9PNAkHD.aCA1QBPEs2M9OUv8x2g5mkMbzb9H40Qygmv1L_dBugpTDHjPhsClk9oESEsPePSxWeKpkzXbxl7Mp9.Gr_rlLB8diY7x9UvX9GAkmoIjpPAXcX0ECpWzwVnJiTYOgX_W1VYOCHxPpj_Ef5ULdmW0J76ibAhDKYUgGMshAW8jiMFIOjQB6akF0lbIFYZs1xzqIU2PzeXZ4CjiiRzyLLhzqN0CcGNxj9DwrZVGtkfa4ci.VDTgVBp4XlDzIkX_Qc9cuFcRboOQ7eyh5s4CPl_hbmzxw7D69_WqYVBGnpHeTXezNPFa3T_oLl246kDpJA0m2GhW9jaMdr5i.nZBA.pc6y0MJJ383WD7Uau7gPQ9WrIgi3qpfXhmY07_4YmAMZrVUQFGkHBLoQzin3xznQ4.jrQg60ubcSKxdRr4siG1VVMTseS1t_gypZf87iDV89WrsZjrRKf__50Vumb_vPmbz1824lcnX76xoGBTRDjEcrCkJQdJ3RU9xI_BhNBe62wsNIT0jKTKdfe.zDvsqL5O_Tmg.kyiPqhn1ruaC4kd_UalnKeltg5BeXKXj.0UDRHVpBs7AAYbvPfKArCroRaiAX_4QO6jXlJF06L5pRan51zqP7_ywS_UO6CxyIHRZ_Rwl7AJpUqPHNa0phbOm3kr.uiKqrbNUYD1ingjJ6a4jv.AHx80rLzQYc95eTjffHoYa3RjC2gKT8siWGrm_GlvgS9KTAxJ_q5ACaa3Kvg8DwD5rogrMjF0yZug3pntQyzRIaY.o9JnP2OOXNmMymGaBBP9YdH6zEmB0rROFuwSspc8OG1VtS0_1CsX5L_Hgx0bpf1XFx3Wn8pm5PoS2Cn2ep_24BGpAOM4BuzyN_5fit7XhWuHo755Lole_AH0ClPEctuHenPraj.JgXWBMB_gQ2KmLqtlxB3zc3KXqpzPebbbwfRYEmEjhEDo.1P5gch2zfgnJ10_xOyhNNsoXbCg7lTtSM5_4jO1RYVmX4e4vxg3kwQH8ojnhkKN5I27wKfwkpAu.mAE4R6yLzGWQvx9T.hVcmNAxZFMuFgs2V8roLjMM9vw1iSBFEV4QYDSpN.87CHMmo3qDj_BtzMHaG18kxfJvrGqFkBcluSdKuEqMU3k37MvgFKAIlqWBQ_JjKIjUrJ.Yqx8syJVDwIMueqJaN27U6IQpsJoqQLP_seMdPZX4HjXvMQjSOQAJAFkboWg8wCgAhsfcQvxUomX8_yAWVjn4n4HiiTGuCwN20gznys2aeKrwN3CzE4FegD74iRFMV2ub0i_KxKh5Dgpa7qjlHT99S_PuFvSKFTARc72ZWEYwlnV2CtnmEHHe9UpJ1piEwq7WT9JGq7P8hLQOSeqFnxrhInLcAwsuPLKNMqTBRst7WTppklb6W27nciM2ijCBEbzcUGiFSo3TNYZsge94ZjC3ZfY9LotKEfXnbjoKFDG9Z0COvwIHvaDiIUyXa8w0s3XKBsLdR5MxdzAEco2uK_Mh5BSjlK8Ti8OXXWdsGJnPsdaHxYDHRXkO13792ujDOUlG_NFpW7WA1RjsjNgLSSelcVKO6hOqFqcEbLGUEJHp5yGK25DNvZ1unS4OF5wwgl_cLHpiuvDOblw.KNBQqfbPMq8oVPnPeBsrN.IjBolryPL1BXdPeVcv.ldKAqRegzlLgddgL0KUHcqp.yygdq2SMV0Z73v5APkeFz6h4r3B4YzJU5aUa94bxZPfeQV5o6admHvTIMj0RkH82qZ02AYN.cRbwZW.rUMUorJ5h3GPjUZqcIzptxnFOKU4jjnTKLp5Fh_N1NRcXWv3aDpTunW8KkOK_UvzZGFlcaakpu7qwCXy4DRvy1Tj7IEp3B22FyUoLklJzMPN6N1MF9XxIoQjGKAjH9kY2DYLh_cPOdOZiIxW..GX5cB1HNN0O6HKe1q5QPMfUqzo9E67o4iQNSLOrETt1Rgkyi_iVI63GYQQHvnYEPfHQV9xFT_grvm.Of59vES24g9Bn_ZWo0tEMGU3fupaoAz1KpQsXp88KaYu.HYibDADRPrMrPwGqfjlIab_jVRktPpsLa3hMY1TUs_8ckCNQHhoER9L9PZPfNytmwIq0oeom160WU_JL2OQ01wlioTBNdjc5YQWvjjFL3WRmj3L1I.eptECXVZl0sZ8g_Uzr_4CKquAk0K_fyPfJU0Iv0.KWCJJS8gUYRlBWHd3_MMKGjULywIvUpTBk68b150voX0swHe03Lac0lYUG2QaQetFCP1f4nivY6.27e0khNrvZ2GOt5dl7aGijP96YpweRgB.th49WwIYPTlFcf9HZSUZzn8utI23En0ThI5EajtPUcfvdgiswNL6T9j4pZOV5ongaU0aBgMyt4LSodxK8vM08gzzyHpgZ9TMDOcVue0L05MloAkbgH.JFryKKLTs",};var a = document.createElement('script');a.src = '/cdn-cgi/challenge-platform/h/b/orchestrate/chl_page/v1?ray=9555c1ce59dd4ca0';window._cf_chl_opt.cOgUHash = location.hash === '' && location.href.indexOf('#') !== -1 ? '#' : location.hash;window._cf_chl_opt.cOgUQuery = location.search === '' && location.href.slice(0, location.href.length - window._cf_chl_opt.cOgUHash.length).indexOf('?') !== -1 ? '?' : location.search;if (window.history && window.history.replaceState) {var ogU = location.pathname + window._cf_chl_opt.cOgUQuery + window._cf_chl_opt.cOgUHash;history.replaceState(null, null, "\/scielo.php?script=sci_pdf&pid=S0718-19572015000100003&__cf_chl_rt_tk=h8oZ.asLWjEKSyTAZp5S5SuO6sYTnnhctdap2U6IWws-1750868057-1.0.1.1-FYBndL1XNS2wjBYbOPt98LlZVYH3LEau37oEkEA164E" + window._cf_chl_opt.cOgUHash);a.onload = function() {history.replaceState(null, null, ogU);}}document.getElementsByTagName('head')[0].appendChild(a);}());</script></body></html>

0 commit comments

Comments
 (0)