xidel

Download and extract data from HTML/XML pages as well as JSON APIs. More information: <https://www.videlibri.de/xidel.html>.

xidel "https://www.google.com/search?q=test" --extract "//a/extract(@href, 'url[?]q=([^&]+)&', 1)[. != '']"

xidel "https://www.google.com/search?q=test" --follow "//a/extract(@href, 'url[?]q=([^&]+)&', 1)[. != '']" --extract //title --download '{$host}/'

xidel https://example.org --follow //a --extract //title

xidel https://example.org --follow "css('a')" --css title

xidel https://example.org --follow "<a>{.}</a>*" --extract "<title>{.}</title>"

xidel path/to/example.xml --extract "<x><foo>ood</foo><bar>{.}</bar></x>"

xidel https://stackoverflow.com/feeds --extract "<entry><title>{title:=.}</title><link>{uri:=@href}</link></entry>+"

xidel https://reddit.com --follow "form(css('form.login-form')[1], {'user': '$your_username', 'passwd': '$your_password'})" --extract "css('#mail')/@title"