import xml.etree.ElementTree as ET

# Parse the XML file and take its root element.
tree = ET.parse('testi/ldt-1.5.xml')
root = tree.getroot()

# Every <word> element at any depth below the root.
parole = root.findall('.//word')

# Lowercased 'form' attribute of each <word>; a <word> without a 'form'
# attribute raises KeyError.
testo = [word.attrib['form'].lower() for word in parole]

print(testo[:500])  # show the first 500 word units