# You don't need to understand this cell; it just downloads and opens a zip file from a URL.
import requests
import zipfile 
import io
import xmltodict

# Download the daily open-data archive.
# - No `stream=True`: the whole body is read via `.content` right below, so
#   streaming brings nothing.
# - `timeout` keeps the cell from hanging forever if the server stops responding.
# - `raise_for_status()` surfaces HTTP errors (4xx/5xx) here, instead of a
#   confusing zipfile.BadZipFile when the error page is fed to ZipFile.
response = requests.get("https://donnees.roulez-eco.fr/opendata/jour", timeout=30)
response.raise_for_status()

# Open the archive directly from memory and read its first member as raw bytes.
z = zipfile.ZipFile(io.BytesIO(response.content))
xmlfile = z.read(z.namelist()[0])

# Preview the first 1000 bytes of the XML payload.
xmlfile[:1000]

b'<?xml version="1.0" encoding="ISO-8859-1" standalone="yes"?>\n<pdv_liste>\n  <pdv id="1000001" latitude="4620114" longitude="519791" cp="01000" pop="R">\n    <adresse>596 AVENUE DE TREVOUX</adresse>\n    <ville>SAINT-DENIS-L\xe8S-BOURG</ville>\n    <services>\n      <service>Station de gonflage</service>\n      <service>Vente de gaz domestique (Butane, Propane)</service>\n      <service>DAB (Distributeur automatique de billets)</service>\n    </services>\n    <prix nom="Gazole" id="1" maj="2022-02-25T10:32:40" valeur="1710"/>\n    <prix nom="SP95" id="2" maj="2022-02-25T10:08:42" valeur="1809"/>\n    <prix nom="SP98" id="6" maj="2022-02-25T10:08:43" valeur="1842"/>\n    <rupture id="3" nom="E85" debut="2017-09-16T09:50:23" fin=""/>\n    <rupture id="4" nom="GPLc" debut="2017-09-16T09:50:23" fin=""/>\n    <rupture id="5" nom="E10" debut="2018-12-13T09:49:49" fin=""/>\n  </pdv>\n  <pdv id="1000002" latitude="4621842" longitude="522767" cp="01000" pop="R">\n    <adresse>16 Avenue de Marboz</adresse>\n    <vill'

import xml.etree.ElementTree as ET
# Parse the raw XML bytes into an element tree; `root` is the top-level element.
root = ET.fromstring(xmlfile)

# Show the root's tag name and its attribute dictionary.
print(f"{root.tag} {root.attrib}")

pdv_liste {}

# Look at the first child of the root only: printing every child would be too long.
# Slicing an Element yields a list of its children, so `root[:1]` is at most one item.
for element in root[:1]:
    print(element.tag)
    print(element.attrib)
    print(element.find('ville').text)
# Number of direct children of the root element.
len(root)

pdv
{'id': '1000001', 'latitude': '4620114', 'longitude': '519791', 'cp': '01000', 'pop': 'R'}
SAINT-DENIS-LèS-BOURG

13325

# Collect one [adresse, cp, ville, prix] row per matching <prix> entry.
# A station that lists both fuels contributes two rows.
fuel_names = ('SP95', 'E10')
result = []

for element in root:
    # Station-level fields: `cp` is an attribute, the other two are child elements.
    cp = element.attrib['cp']
    adresse = element.find('adresse').text
    ville = element.find('ville').text
    for price_node in element.findall('prix'):
        if price_node.attrib['nom'] not in fuel_names:
            continue
        # 'valeur' is an integer string; dividing by 1000 gives e.g. '1809' -> 1.809.
        prix = int(price_node.attrib['valeur']) / 1000
        result.append([adresse, cp, ville, prix])

# Show the first collected row.
result[0]

['596 AVENUE DE TREVOUX', '01000', 'SAINT-DENIS-LèS-BOURG', 1.809]

# Number of rows collected in `result`.
len(result)

11097

Introduction to XML

Using the `xml` library

More

Introduction to XML

Using the xml library

More

Using the `xml` library