import shapefile

# Open the département shapefile and read its three components:
# the geometries, the attribute records and the field descriptors.
r = shapefile.Reader(r"files/departement_shapes/DEPARTEMENT.shp")
shapes = r.shapes()
records = r.records()
fields = r.fields

import pandas as pd

# Tabulate the attribute records, naming the columns after the shapefile
# fields. The first field descriptor is skipped (presumably pyshp's
# deletion-flag pseudo field, which has no value in the records -- confirm).
column_names = [field[0] for field in fields[1:]]
df = pd.DataFrame(records, columns=column_names)

df.head()

%matplotlib inline
import matplotlib.pyplot as plt
plt.style.use('bmh')
import numpy as np
from matplotlib.collections import LineCollection

def draw_departements(ax, records, shapes):
    """Draw the outline of every département on ``ax``.

    Parameters
    ----------
    ax : matplotlib axes
        Axes that receive one ``LineCollection`` per drawn shape.
    records : sequence
        Attribute records paired with ``shapes``. Their content is not used;
        as before, shapes beyond ``len(records)`` are not drawn.
    shapes : sequence
        Objects exposing ``points`` (a sequence of ``(x, y)`` pairs) and
        ``parts`` (index of the first point of each part).

    Shapes without any point are skipped instead of raising.
    """
    for _, shape in zip(records, shapes):
        if len(shape.points) == 0:
            # Nothing to draw for an empty (null) shape.
            continue

        data = np.asarray(shape.points)
        # Cut the vertex array at the start of every part but the first, so
        # that each part (island, enclave, ...) becomes its own polyline.
        # Assumes parts[0] == 0, as the shapefile format specifies.
        segs = np.split(data, list(shape.parts)[1:])

        lines = LineCollection(segs, antialiaseds=(1,))
        lines.set_edgecolors('k')
        lines.set_linewidth(0.3)
        ax.add_collection(lines)

# Plain outline map of the départements.
plt.figure(figsize=(10, 10))
ax = plt.subplot(111)
draw_departements(ax, records, shapes)

# Frame the map on the extent of the X_CHF_LIEU / Y_CHF_LIEU columns,
# widened by 100000 coordinate units on every side.
x_chf_lieu = df['X_CHF_LIEU']
y_chf_lieu = df['Y_CHF_LIEU']
xmin, xmax = x_chf_lieu.min(), x_chf_lieu.max()
ymin, ymax = y_chf_lieu.min(), y_chf_lieu.max()
ax.set_xlim(xmin - 100000, xmax + 100000)
ax.set_ylim(ymin - 100000, ymax + 100000)
ax.axis('off')

(71326.0, 1328512.0, 6008968.0, 7159443.0)

from bs4 import BeautifulSoup
import requests

# Download the national results page. A timeout keeps the notebook from
# hanging on an unresponsive server, and an HTTP error status is reported
# right away instead of surfacing later as a parsing error.
index_response = requests.get("http://elections.interieur.gouv.fr/presidentielle-2017/index.html", timeout=30)
index_response.raise_for_status()
soup = BeautifulSoup(index_response.text, 'html.parser')

# The page's image map holds one <area> per clickable region.
map_tag = soup.find('map')

area_tags = map_tag.find_all('area')

# Relative links found in the areas (later appended to the site's base URL).
links = [tag.attrs['href'] for tag in area_tags]

# Drop duplicate links so that each page is fetched only once.
unique_links = set(links)

# Sample results page used to try out the scraper.
url = "http://elections.interieur.gouv.fr/presidentielle-2017/024/018/index.html"

def extract_candidate_votes(url, timeout=30):
    """Extract the votes of all candidates from a results page.

    Parameters
    ----------
    url : str
        Address of the results page to scrape.
    timeout : float, optional
        Seconds to wait for the server before giving up (default 30).

    Returns
    -------
    tuple
        ``(dept, results)``: ``dept`` is the text of the last breadcrumb
        link of the page (e.g. ``'Cher (18)'``) and ``results`` maps each
        candidate name to the vote count as an ``int``.

    Raises
    ------
    requests.HTTPError
        If the server answers with an error status.
    """
    r = requests.get(url, timeout=timeout)
    # Fail on the HTTP error itself rather than on a confusing parsing error.
    r.raise_for_status()
    soup = BeautifulSoup(r.text, 'html.parser')
    dept = soup.find(class_='span12 pub-fil-ariane').find_all('a')[-1].text
    table = soup.find('tbody')
    results = {}
    for row in table.find_all('tr'):
        # First cell: candidate name, second cell: number of votes. Picking
        # the cells by position does not depend on the whitespace text nodes
        # that sit between the <td> tags.
        cells = row.find_all('td')
        # Thousands are separated by spaces; split()/join removes every kind
        # of whitespace, including non-breaking spaces.
        results[cells[0].text] = int(''.join(cells[1].text.split()))
    return dept, results

# Try the scraper on the sample results page stored in `url`.
extract_candidate_votes(url)

('Cher (18)',
 {'M. Benoît HAMON': 9157,
  'M. Emmanuel MACRON': 38076,
  'M. François ASSELINEAU': 1479,
  'M. François FILLON': 32967,
  'M. Jacques CHEMINADE': 345,
  'M. Jean LASSALLE': 1925,
  'M. Jean-Luc MÉLENCHON': 33694,
  'M. Nicolas DUPONT-AIGNAN': 9554,
  'M. Philippe POUTOU': 2106,
  'Mme Marine LE PEN': 41753,
  'Mme Nathalie ARTHAUD': 1630})

# Scrape every linked results page, then tabulate the results:
# one row per département, one column per candidate.
scraped = [
    extract_candidate_votes("http://elections.interieur.gouv.fr/presidentielle-2017/" + link)
    for link in unique_links
]
depts = [dept_name for dept_name, _ in scraped]
results = [votes for _, votes in scraped]

df_votes = pd.DataFrame(results, index=depts)

df_votes.tail()

# Total number of votes per département, smallest first.
vote_sum = df_votes.sum(axis=1).sort_values(ascending=True)

fig, ax = plt.subplots(figsize=(7, 12))
vote_sum.plot.barh(ax=ax, fontsize=8, width=1)
plt.tight_layout()

# Reorder the rows of df_votes by total votes: add the totals as a temporary
# column, sort on it, then remove it again.
df_votes['total'] = vote_sum

df_votes = df_votes.sort_values(by='total', ascending=True)

# `axis` is passed by keyword: pandas 2.0 no longer accepts it positionally.
df_votes = df_votes.drop('total', axis=1)

# Same ordering, with each bar split by candidate.
fig, ax = plt.subplots(figsize=(10, 12))
df_votes.plot.barh(ax=ax, stacked=True, fontsize=8, width=1)
plt.tight_layout()

# 20 evenly spaced positions in [0, 1], used to look colours up in `cmap`;
# the candidate in column i of df_votes gets candidate_colors[i].
candidate_colors = np.linspace(0, 1, 20)

# 'tab20_r' is the current name of the 20-colour qualitative map formerly
# called 'Vega20_r'; the 'Vega*' names were removed from Matplotlib.
cmap = plt.get_cmap('tab20_r')

import matplotlib as mpl

# Map of the leading candidate: each département is filled with the colour
# of the candidate who received the most votes there.
fig = plt.figure(figsize=(10, 10))
ax = plt.subplot(111)
idxs = []  # per département: column position (in df_votes) of the winner
for shape, code_dpt in zip(shapes, df['CODE_DEPT']):
    # Cut the vertex array at the start of every part but the first, so that
    # each part becomes its own polyline (assumes parts[0] == 0, as the
    # shapefile format specifies).
    data = np.asarray(shape.points)
    segs = np.split(data, list(shape.parts)[1:])

    lines = LineCollection(segs, antialiaseds=(1,))
    lines.set_edgecolors('k')
    lines.set_linewidth(0.3)
    # Vote counts of the row whose label contains "(<code>)", e.g. "(18)".
    values = df_votes[df_votes.index.str.contains("({})".format(code_dpt), regex=False)].values
    idx = np.argmax(values)
    idxs.append(idx)
    facecolor = cmap(candidate_colors[idx])
    lines.set_facecolor(facecolor)
    ax.add_collection(lines)


xmin, xmax = df['X_CHF_LIEU'].min(), df['X_CHF_LIEU'].max()
ymin, ymax = df['Y_CHF_LIEU'].min(), df['Y_CHF_LIEU'].max()
plt.xlim(xmin - 100000, xmax + 100000)
plt.ylim(ymin - 100000, ymax + 100000)
plt.axis('off')

# Legend: one colour cell per candidate that won at least one département.
# The winners are sorted once so that colours and labels are built in the
# same, well-defined order.
winner_idxs = sorted(set(idxs))
ax_cbar = fig.add_axes([0.05, 0.15, 0.7, 0.05])
cbar_cmap = mpl.colors.ListedColormap(np.array([cmap(candidate_colors[i]) for i in winner_idxs]))
bounds = list(range(len(winner_idxs) + 1))
norm = mpl.colors.BoundaryNorm(bounds, cbar_cmap.N)
# One tick at the centre of each cell. There is one more boundary than there
# are cells, so the last boundary is left out: the number of ticks has to
# match the number of labels set below.
cb = mpl.colorbar.ColorbarBase(ax_cbar, cmap=cbar_cmap,
                                norm=norm,
                                boundaries=bounds,
                                ticks=np.array(bounds[:-1]) + 0.5,
                                spacing='uniform',
                                orientation='horizontal')
cb.ax.set_xticklabels([df_votes.columns[i] for i in winner_idxs]);  # horizontal colorbar

def mapping_func(z):
    """Return ``1 - (1 - z)**2``.

    On [0, 1] this maps 0 to 0 and 1 to 1 while lifting the values in
    between (0.5 becomes 0.75); it is used to turn a ratio into an opacity.
    """
    return 1 - (1 - z)**2

# Map of the leading candidate, shaded by margin: the fill colour is the
# winner's colour and its opacity grows with the winner's lead over the
# runner-up.
fig = plt.figure(figsize=(10, 10))
ax = plt.subplot(111)
idxs = []  # per département: column position (in df_votes) of the winner
for shape, code_dpt in zip(shapes, df['CODE_DEPT']):
    # Cut the vertex array at the start of every part but the first, so that
    # each part becomes its own polyline (assumes parts[0] == 0, as the
    # shapefile format specifies).
    data = np.asarray(shape.points)
    segs = np.split(data, list(shape.parts)[1:])

    lines = LineCollection(segs, antialiaseds=(1,))
    lines.set_edgecolors('k')
    lines.set_linewidth(0.3)
    # Vote counts of the row whose label contains "(<code>)", e.g. "(18)".
    values = df_votes[df_votes.index.str.contains("({})".format(code_dpt), regex=False)].values
    idx = np.argmax(values)
    idxs.append(idx)
    winner_votes = values[0, idx]
    runner_up_votes = np.sort(values.ravel())[-2]
    facecolor = np.array(cmap(candidate_colors[idx]))
    # Alpha channel: lead over the runner-up as a fraction of the winner's
    # votes, passed through mapping_func.
    facecolor[3] = mapping_func((winner_votes - runner_up_votes) / winner_votes)
    lines.set_facecolor(facecolor)
    ax.add_collection(lines)


xmin, xmax = df['X_CHF_LIEU'].min(), df['X_CHF_LIEU'].max()
ymin, ymax = df['Y_CHF_LIEU'].min(), df['Y_CHF_LIEU'].max()
plt.xlim(xmin - 100000, xmax + 100000)
plt.ylim(ymin - 100000, ymax + 100000)
plt.axis('off')

# Legend: one colour cell per candidate that won at least one département.
# The winners are sorted once so that colours and labels are built in the
# same, well-defined order.
winner_idxs = sorted(set(idxs))
ax_cbar = fig.add_axes([0.05, 0.15, 0.7, 0.05])
cbar_cmap = mpl.colors.ListedColormap(np.array([cmap(candidate_colors[i]) for i in winner_idxs]))
bounds = list(range(len(winner_idxs) + 1))
norm = mpl.colors.BoundaryNorm(bounds, cbar_cmap.N)
# One tick at the centre of each cell. There is one more boundary than there
# are cells, so the last boundary is left out: the number of ticks has to
# match the number of labels set below.
cb = mpl.colorbar.ColorbarBase(ax_cbar, cmap=cbar_cmap,
                                norm=norm,
                                boundaries=bounds,
                                ticks=np.array(bounds[:-1]) + 0.5,
                                spacing='uniform',
                                orientation='horizontal')
cb.ax.set_xticklabels([df_votes.columns[i] for i in winner_idxs]);  # horizontal colorbar

# One small map per candidate. Opacity of a département = the candidate's
# votes there divided by the candidate's best département, passed through
# mapping_func.
fig = plt.figure(figsize=(16, 13))

# Everything below is the same for all candidates, so it is computed once
# instead of once per candidate and département.
# Polylines of each département: the vertex array is cut at the start of
# every part but the first (assumes parts[0] == 0, as the shapefile format
# specifies).
dept_segs = [np.split(np.asarray(shape.points), list(shape.parts)[1:])
             for shape in shapes]
# Vote counts of the row whose label contains "(<code>)", e.g. "(18)".
dept_values = [
    df_votes[df_votes.index.str.contains("({})".format(code_dpt), regex=False)].values
    for code_dpt in df['CODE_DEPT']
]
max_votes = df_votes.max(axis=0)  # best score of every candidate
xmin, xmax = df['X_CHF_LIEU'].min(), df['X_CHF_LIEU'].max()
ymin, ymax = df['Y_CHF_LIEU'].min(), df['Y_CHF_LIEU'].max()

for candidate_idx in np.arange(df_votes.columns.size):
    ax = plt.subplot(3, 4, candidate_idx+1)
    candidate = df_votes.columns[candidate_idx]

    for segs, values in zip(dept_segs, dept_values):
        lines = LineCollection(segs, antialiaseds=(1,))
        lines.set_edgecolors('k')
        lines.set_linewidth(0.3)

        facecolor = np.array(cmap(candidate_colors[candidate_idx]))
        facecolor[3] = mapping_func(float(values[0, candidate_idx]) / max_votes[candidate])
        lines.set_facecolor(facecolor)
        ax.add_collection(lines)

    ax.set_xlim(xmin - 100000, xmax + 100000)
    ax.set_ylim(ymin - 100000, ymax + 100000)
    ax.axis('off')

# Legend: one colour cell per candidate, in column order.
ax_cbar = fig.add_axes([0.05, 0.05, 0.9, 0.025])
cbar_colors = np.array([cmap(candidate_colors[i]) for i in np.arange(df_votes.columns.size)])
cbar_cmap = mpl.colors.ListedColormap(cbar_colors)
bounds = np.arange(cbar_colors.shape[0] + 1)
norm = mpl.colors.BoundaryNorm(bounds, cbar_cmap.N)
# One tick at the centre of each cell. There is one more boundary than there
# are cells, so the last boundary is left out: the number of ticks has to
# match the number of labels set below.
cb = mpl.colorbar.ColorbarBase(ax_cbar, cmap=cbar_cmap,
                                norm=norm,
                                boundaries=bounds,
                                ticks=bounds[:-1] + 0.5,
                                spacing='uniform',
                                orientation='horizontal')
cb.ax.tick_params(labelsize=8)
# Labels: candidate names without the leading "M. " / "Mme ".
cb.ax.set_xticklabels(df_votes.columns.str.extract('^(?:M. |Mme )(.*)', expand=False));

# One small map per candidate. Opacity of a département = the candidate's
# votes there divided by the votes of that département's leading candidate.
fig = plt.figure(figsize=(16, 13))

# Everything below is the same for all candidates, so it is computed once
# instead of once per candidate and département.
# Polylines of each département: the vertex array is cut at the start of
# every part but the first (assumes parts[0] == 0, as the shapefile format
# specifies).
dept_segs = [np.split(np.asarray(shape.points), list(shape.parts)[1:])
             for shape in shapes]
# Vote counts of the row whose label contains "(<code>)", e.g. "(18)".
dept_values = [
    df_votes[df_votes.index.str.contains("({})".format(code_dpt), regex=False)].values
    for code_dpt in df['CODE_DEPT']
]
xmin, xmax = df['X_CHF_LIEU'].min(), df['X_CHF_LIEU'].max()
ymin, ymax = df['Y_CHF_LIEU'].min(), df['Y_CHF_LIEU'].max()

for candidate_idx in np.arange(df_votes.columns.size):
    ax = plt.subplot(3, 4, candidate_idx+1)

    for segs, values in zip(dept_segs, dept_values):
        lines = LineCollection(segs, antialiaseds=(1,))
        lines.set_edgecolors('k')
        lines.set_linewidth(0.3)

        facecolor = np.array(cmap(candidate_colors[candidate_idx]))
        facecolor[3] = (float(values[0, candidate_idx]) / values.max())
        lines.set_facecolor(facecolor)
        ax.add_collection(lines)

    ax.set_xlim(xmin - 100000, xmax + 100000)
    ax.set_ylim(ymin - 100000, ymax + 100000)
    ax.axis('off')

# Legend: one colour cell per candidate, in column order.
ax_cbar = fig.add_axes([0.05, 0.05, 0.9, 0.025])
cbar_colors = np.array([cmap(candidate_colors[i]) for i in np.arange(df_votes.columns.size)])
cbar_cmap = mpl.colors.ListedColormap(cbar_colors)
bounds = np.arange(cbar_colors.shape[0] + 1)
norm = mpl.colors.BoundaryNorm(bounds, cbar_cmap.N)
# One tick at the centre of each cell. There is one more boundary than there
# are cells, so the last boundary is left out: the number of ticks has to
# match the number of labels set below.
cb = mpl.colorbar.ColorbarBase(ax_cbar, cmap=cbar_cmap,
                                norm=norm,
                                boundaries=bounds,
                                ticks=bounds[:-1] + 0.5,
                                spacing='uniform',
                                orientation='horizontal')
cb.ax.tick_params(labelsize=8)
# Labels: candidate names without the leading "M. " / "Mme ".
cb.ax.set_xticklabels(df_votes.columns.str.extract('^(?:M. |Mme )(.*)', expand=False));

	ID_GEOFLA	CODE_DEPT	NOM_DEPT	CODE_CHF	NOM_CHF	X_CHF_LIEU	Y_CHF_LIEU	X_CENTROID	Y_CENTROID	CODE_REG	NOM_REG
0	DEPARTEM0000000000000001	39	JURA	300	LONS-LE-SAUNIER	895198	6622537	886172	6641548	27	BOURGOGNE-FRANCHE-COMTE
1	DEPARTEM0000000000000002	42	LOIRE	218	SAINT-ETIENNE	808646	6482549	795655	6521581	84	AUVERGNE-RHONE-ALPES
2	DEPARTEM0000000000000003	76	SEINE-MARITIME	540	ROUEN	562355	6928721	550942	6952842	28	NORMANDIE
3	DEPARTEM0000000000000004	89	YONNE	024	AUXERRE	742447	6744261	748211	6750855	27	BOURGOGNE-FRANCHE-COMTE
4	DEPARTEM0000000000000005	68	HAUT-RHIN	066	COLMAR	1024125	6784581	1016174	6763894	44	ALSACE-CHAMPAGNE-ARDENNE-LORRAINE

	M. Benoît HAMON	M. Emmanuel MACRON	M. François ASSELINEAU	M. François FILLON	M. Jacques CHEMINADE	M. Jean LASSALLE	M. Jean-Luc MÉLENCHON	M. Nicolas DUPONT-AIGNAN	M. Philippe POUTOU	Mme Marine LE PEN	Mme Nathalie ARTHAUD
Lozère (48)	2733	10463	354	10986	93	1764	9483	2197	683	9097	294
Jura (39)	7589	31896	1330	28373	285	1994	30331	8533	1980	36110	1148
Indre (36)	7786	27301	1098	25476	298	1728	24938	7177	1757	31985	1390
Manche (50)	19238	74683	2048	64909	623	2520	51026	17052	4134	61620	2593
Alpes-Maritimes (06)	21067	111953	6067	161036	939	5262	87941	25175	3622	163141	1729

Des cartes du premier tour de l'élection présidentielle 2017

Par département

Par candidat

Conclusions

Comments