From 25c6139e81936876c763902498b17957e99a469c Mon Sep 17 00:00:00 2001 From: Norbert Litkowski Date: Wed, 7 Apr 2021 04:07:53 +0200 Subject: [PATCH] comment --- app/ZborBielawa.hs | 1 + 1 file changed, 1 insertion(+) diff --git a/app/ZborBielawa.hs b/app/ZborBielawa.hs index 38a907f..d3485bc 100644 --- a/app/ZborBielawa.hs +++ b/app/ZborBielawa.hs @@ -28,6 +28,7 @@ extractNestedLinksWithText xpathCondition = proc url -> do extractRecords = proc x -> do + -- TODO: use more specific XPath expressions (a, b) <- extractLinksWithText "//aside[@class='widget widget_maxmegamenu']//a[@class='mega-menu-link']" -< x -- pary adres-tytuł podstrony (a', b') <- extractLinksWithText "//aside[@class='widget widget_maxmegamenu']//a[@class='mega-menu-link']" -< a -- pobieramy podstronę i kolejne podstrony z menu a'' <- extractNestedLinksWithText "(//big[a[contains(@href,'.pdf')][img]])[1]" -< a' -- pobieramy stronę z adresu URL i wyciągamy linki z tej strony pasujące do wyrażenia XPathowego