Some time ago (around v0.3) I used HTTPClient to fetch the page and Gumbo to
parse it:

https://github.com/porterjamesj/Gumbo.jl

I was doing something like the following. It's probably not the most elegant
way of doing it, but it worked fine:

"""
    get_hrefs(body::HTMLElement)

Collect the `href` attribute of every `<a>` element found while walking `body`.

The tree is visited in the order yielded by `preorder(body)`, and the returned
`Vector` of strings preserves that order. An anchor for which
`getattr(elem, "href")` raises a `KeyError` is skipped (presumably this is the
"attribute not present" case -- confirm against the Gumbo version in use).
Any other exception is propagated to the caller rather than silently dropped.
"""
function get_hrefs(body::HTMLElement)
    links = String[]
    for elem in preorder(body)
        # Only anchor elements are of interest; everything else is skipped.
        isa(elem, HTMLElement{:a}) || continue
        try
            push!(links, getattr(elem, "href"))
        catch err
            # Best effort for anchors lacking the attribute only; real
            # failures must not be hidden.
            isa(err, KeyError) || rethrow()
        end
    end
    return links
end

Reply via email to