This commit is contained in:
nlitkowski 2021-04-07 03:36:28 +02:00
parent 07b43649a9
commit 10c06c503c

View File

@@ -15,9 +15,10 @@ import Debug.Trace
-- | Arrow that selects trees from the input with 'getXPathTrees' using
-- @xpathCondition@ and returns an @(href, txt)@ pair built from them.
--
-- NOTE(review): both the 'trace' and 'traceShowId' calls print debugging
-- output on every result; they look like leftover diagnostics -- confirm
-- whether they should stay before this ships.
getLinkAndText xpathCondition = proc doc -> do
    -- Trees of the input document matched by the caller-supplied XPath.
    xpathTrees <- getXPathTrees xpathCondition -< doc
    -- Element name of the matched tree; only used in the trace message below.
    name <- getElemName -< xpathTrees
    -- Text obtained by evaluating the relative XPath "../text()" on the match.
    txt <- (getXPathTrees "../text()" >>> getText) -< xpathTrees
    -- Value of the "href" attribute of whatever "//a" selects from the match.
    href <- (getXPathTrees "//a" >>> getAttrValue "href") -< xpathTrees
    returnA -< trace ("AAAAAAAAAAAAAAAA " ++ show name) $ traceShowId (href, txt)
extractNestedLinksWithText xpathCondition = proc url -> do extractNestedLinksWithText xpathCondition = proc url -> do