# NLTK download
# Fetch the XML document served at the NLTK data URL and print the "url"
# attribute of every child of its first top-level element.
import xml.etree.ElementTree as ET

import requests  # third-party; the original one-liner used it without importing it

# requests applies no timeout by default, so set one explicitly to avoid
# hanging forever on an unresponsive server.
resp = requests.get("http://www.nltk.org/nltk_data/", timeout=30)
# Fail loudly on an HTTP error instead of handing an error page to the parser.
resp.raise_for_status()

# Parse the raw bytes so the XML parser determines the encoding itself,
# rather than relying on the charset requests guesses from the headers.
root = ET.fromstring(resp.content)

# root[0] is the first child of the document root.
# NOTE(review): presumably this is the package list of the index — confirm
# against the actual document layout.
for p in root[0]:
    print(p.attrib["url"])