import pandas as pd
import json
import numpy as np
from matplotlib import pyplot as plt
import networkx as nx
import shapely.geometry
import sys


with open('FOR_PUBL_FR.json', 'r') as j:
     data = json.loads(j.read())


print("Polygon of the first forest : ")
polygon = np.asarray(data['features'][0]['geometry']['coordinates'][0])
x= polygon[:,0]
y= polygon[:,1]
plt.scatter(x,y)
plt.show()

Polygon of the first forest :


print("Polygon of the second forest : ")
polygon = np.asarray(data['features'][1]['geometry']['coordinates'][0])
x= polygon[:,0]
y= polygon[:,1]
plt.scatter(x,y)
plt.show()

Polygon of the second forest :


polygons = np.asarray(data['features'][11]['geometry']['coordinates'])
polygons = polygons[:,0]

for i in range(len(polygons)):
    polygon = np.asarray(polygons[i], dtype = object)
    x= polygon[:,0]
    y= polygon[:,1]
    plt.scatter(x,y)

plt.show()


centroid = [] #Will contain the positions of the centroids of the forests
areas = [] #Will contain the areas of the forests
for i in range(len(data['features'])):
    if len(data['features'][i]['geometry']['coordinates'][0][0]) > 2 : #When the forest has multiple polygons
        for j in range(len(data['features'][i]['geometry']['coordinates'][0])):
            shapely_pol = shapely.geometry.Polygon(data['features'][i]['geometry']['coordinates'][0][j])
            centroid.append(list(shapely_pol.centroid.coords)[0])
            areas.append(shapely_pol.area) #We add positions and areas of each polygon independently
    else : #If there is only one polygon
        shapely_pol = shapely.geometry.Polygon(data['features'][i]['geometry']['coordinates'][0])
        centroid.append(list(shapely_pol.centroid.coords)[0])
        areas.append(shapely_pol.area)

centroid = np.asarray(centroid)
areas = np.asarray(areas)


fig, ax = plt.subplots(figsize = (20, 20))
for val in centroid :
     ax.add_patch(plt.Circle(val, 10**(-3), facecolor = 'r', edgecolor='black'))
ax.axes.get_xaxis().set_visible(False) 
ax.axes.get_yaxis().set_visible(False) 
ax.axes.set_xlim([min(np.transpose(centroid)[0]) - 1,
               max(np.transpose(centroid)[0]) + 1])
ax.axes.set_ylim([min(np.transpose(centroid)[1]) - 1,
               max(np.transpose(centroid)[1]) + 1])

plt.show()


G = nx.Graph()
count = 0
for (val, a) in zip(centroid, areas) :
    G.add_node(count, lon = val[0], lat = val[1], area = a)
    count += 1


poly = shapely.geometry.Polygon(data['features'][0]['geometry']['coordinates'][0]) # polygon
poly


poly.buffer(0.0005) # extended polygon for d=0.0005


poly.buffer(0.001) # extended polygon for d=0.001


poly.buffer(0.01) # extended polygon for d=0.01


d = 0.01 # the buffer distance = daily foraging distance/2
all_buff_poly = [] #Will contain all the extended polygons
for i in range(len(data['features'])):
    if len(data['features'][i]['geometry']['coordinates'][0][0]) > 2 : #Forest with more than one polygon
        for j in range(len(data['features'][i]['geometry']['coordinates'][0])):
            shapely_pol = shapely.geometry.Polygon(data['features'][i]['geometry']['coordinates'][0][j])
            buff_pol = shapely_pol.buffer(d)
            all_buff_poly.append(buff_pol)
    else : #Forests with only one polygon
        shapely_pol = shapely.geometry.Polygon(data['features'][i]['geometry']['coordinates'][0])
        buff_pol = shapely_pol.buffer(d)
        all_buff_poly.append(buff_pol)


L = 1 # arbitrary diameter of the foraging area, in degree
for i in range(len(centroid) - 1):
    sys.stdout.write("\r{0}%".format(round((i + 1)/(len(centroid) - 1)*100, 2)))
    sys.stdout.flush() #This is to visualize how much of the graph has been treated already
    for j in range(i + 1, len(centroid)):
        if np.linalg.norm(centroid[i] - centroid[j]) < L: #We only consider the polygons that are close enough to the polygon i
            pol1 = all_buff_poly[i]
            pol2 = all_buff_poly[j]
            area = pol1.intersection(pol2).area
            if area > 0: #If there is an intersection, we put an edge, weighted by the area of intersection between the buffered polygons
                G.add_edge(i, j, intersection = area)

100.0%


nx.write_graphml(G, 'graph_d{}_L{}.graphml'.format(d, L)) #Store the graph and the characteristics


G_small = nx.read_graphml('graph_d0.01_L1.graphml')


plt.figure(figsize = (20, 20))
coordinates = {n:(G_small.nodes[n]["lon"], G_small.nodes[n]["lat"]) for n in G_small.nodes}
nx.draw_networkx(G_small, pos = coordinates, with_labels = False, node_size = 1, width = 1)


print("Number of nodes = {}, Number of edges = {}".format(len(G_small.nodes()), len(G_small.edges())))
print("Number of connected components = ", len(list(nx.connected_components(G_small))))

Number of nodes = 18932, Number of edges = 23809
Number of connected components =  7207


G_large = nx.read_graphml('graph_d0.05_L1.graphml')


plt.figure(figsize = (20, 20))
coordinates = {n:(G_large.nodes[n]["lon"], G_large.nodes[n]["lat"]) for n in G_large.nodes}
nx.draw_networkx(G_large, pos = coordinates, with_labels = False, node_size = 1, width = 1)


print("Number of nodes = {}, Number of edges = {}".format(len(G_large.nodes()), len(G_large.edges())))
print("Number of connected components = ", len(list(nx.connected_components(G_large))))

Number of nodes = 18932, Number of edges = 259544
Number of connected components =  398


list_areas = sorted(nx.get_node_attributes(G_small,'area').items(), key = lambda x: x[1])

print("List of 5 highest areas :", list_areas[-5:])
print("List of 5 smallest areas :", list_areas[:5])

List of 5 highest areas : [('12090', 0.008164664789284326), ('7361', 0.008448092891491437), ('7187', 0.01003791573598896), ('3670', 0.010979624359549748), ('7572', 0.011786669568507215)]
List of 5 smallest areas : [('2537', 1.3726108977721857e-16), ('8831', 2.2776345303746083e-14), ('14893', 2.946839434124618e-13), ('757', 4.2343020157101895e-13), ('14362', 4.3484514220810675e-13)]


plt.figure()
plt.hist(np.array(list_areas, dtype = float)[:,1], bins = 100)
plt.show()


degree_list_small = sorted(G_small.degree, key = lambda x: x[1])
print("List of 5 highest degrees for small d:", degree_list_small[-5:])

degree_list_large = sorted(G_large.degree, key = lambda x: x[1])
print("List of 5 highest degrees for large d:", degree_list_large[-5:])

List of 5 highest degrees: [('9898', 27), ('11630', 27), ('12249', 28), ('14495', 29), ('9332', 34)]
List of 5 highest degrees: [('817', 104), ('18090', 104), ('624', 105), ('18019', 105), ('18096', 105)]


plt.figure()
plt.hist(np.array(degree_list_large, dtype = int)[:,1], bins = 100, label = 'large d')
plt.hist(np.array(degree_list_small, dtype = int)[:,1], bins = 100, label = 'small d')
plt.legend()
plt.show()


pagerank_small = nx.algorithms.link_analysis.pagerank_alg.pagerank(G_small, weight = 'area')
pr_list_small = sorted(pagerank_small.items(),
                 key = lambda x: x[1])
print("List of 5 highest pagerank for small d:", pr_list_small[-5:])

pagerank_large = nx.algorithms.link_analysis.pagerank_alg.pagerank(G_large, weight = 'area')
pr_list_large = sorted(pagerank_large.items(),
                 key = lambda x: x[1])
print("List of 5 highest pagerank for large d:", pr_list_large[-5:])

List of 5 highest pagerank: [('9332', 0.00021953185700843112), ('12316', 0.00024068099364861584), ('2833', 0.0002522213854431817), ('9261', 0.00028801024010819293), ('3670', 0.0003155251775955247)]
List of 5 highest pagerank: [('11625', 0.00010736520208220798), ('7304', 0.00011114917959170071), ('14228', 0.00011274537635468298), ('2833', 0.00011349730714741698), ('3670', 0.00014834055883530622)]


biggest_cc_small = G_small.subgraph(sorted(nx.connected_components(G_small), key=len, reverse=True)[0])
print("Biggest connected component :", len(biggest_cc_small.nodes()))

biggest_cc_area_small = sum(list(nx.get_node_attributes(biggest_cc_small,'area').values()))
print("Area of the biggest connected component :", biggest_cc_area_small)

largest_cc_area_small = 0
for i in range(len(list(nx.connected_components(G_small)))):
    sys.stdout.write("\r{0}%".format(round((i + 1)/(len(list(nx.connected_components(G_small))))*100, 2)))
    sys.stdout.flush()
    test_g = G_small.subgraph(list(nx.connected_components(G_small))[i])
    if sum(list(nx.get_node_attributes(test_g,'area').values())) > largest_cc_area_small:
        largest_cc_area_small = sum(list(nx.get_node_attributes(test_g,'area').values()))
        largest_cc_small = test_g

print("\n Largest connected component :", len(largest_cc_small.nodes()))
print("Area of the largest connected component :", largest_cc_area_small)

Biggest connected component : 413
Area of the biggest connected component : 0.009959920536711445
100.0%
 Largest connected component : 51
Area of the largest connected component : 0.021455487619196696


plt.figure(figsize = (20, 20))
coordinates = {n:(G_small.nodes[n]["lon"], G_small.nodes[n]["lat"]) for n in G_small.nodes}
nx.draw_networkx(G_small, pos = coordinates, with_labels = False, node_size = 1, width = 1)

coordinates = {n:(biggest_cc_small.nodes[n]["lon"], biggest_cc_small.nodes[n]["lat"]) for n in biggest_cc_small.nodes}
nx.draw_networkx(biggest_cc_small, pos = coordinates, with_labels = False, node_size = 1, width = 1, node_color = 'r')

coordinates = {n:(largest_cc_small.nodes[n]["lon"], largest_cc_small.nodes[n]["lat"]) for n in largest_cc_small.nodes}
nx.draw_networkx(largest_cc_small, pos = coordinates, with_labels = False, node_size = 1, width = 1, node_color = 'y')


biggest_cc_large = G_large.subgraph(sorted(nx.connected_components(G_large), key=len, reverse=True)[0])
print("Biggest connected component :", len(biggest_cc_large.nodes()))

biggest_cc_area_large = sum(list(nx.get_node_attributes(biggest_cc_large,'area').values()))
print("Area of the biggest connected component :", biggest_cc_area_large)

largest_cc_area_large = 0
for i in range(len(list(nx.connected_components(G_large)))):
    sys.stdout.write("\r{0}%".format(round((i + 1)/(len(list(nx.connected_components(G_large))))*100, 2)))
    sys.stdout.flush()
    test_g = G_large.subgraph(list(nx.connected_components(G_large))[i])
    if sum(list(nx.get_node_attributes(test_g,'area').values())) > largest_cc_area_large:
        largest_cc_area_large = sum(list(nx.get_node_attributes(test_g,'area').values()))
        largest_cc_large = test_g

print("\n Largest connected component :", len(largest_cc_large.nodes()))
print("Area of the largest connected component :", largest_cc_area_large)

Biggest connected component : 16830
Area of the biggest connected component : 0.919316217408412
100.0%
 Largest connected component : 16830
Area of the largest connected component : 0.919316217408412


plt.figure(figsize = (20, 20))
coordinates = {n:(G_large.nodes[n]["lon"], G_large.nodes[n]["lat"]) for n in G_large.nodes}
nx.draw_networkx(G_large, pos = coordinates, with_labels = False, node_size = 1, width = 1)

coordinates = {n:(biggest_cc_large.nodes[n]["lon"], biggest_cc_large.nodes[n]["lat"]) for n in biggest_cc_large.nodes}
nx.draw_networkx(biggest_cc_large, pos = coordinates, with_labels = False, node_size = 1, width = 1, node_color = 'r')


for i in range(len(data['features'])):
    if len(data['features'][i]['geometry']['coordinates'][0][0]) > 2 : #When the forest has multiple polygons
        for j in range(len(data['features'][i]['geometry']['coordinates'][0])):
            for k in range(len(data['features'][i]['geometry']['coordinates'][0][j])):
            data['features'][i]['geometry']['coordinates'][0][j][k][1] *= (long - longmin)*110/80
    else : #If there is only one polygon
        for k in range(len(data['features'][i]['geometry']['coordinates'][0])):
            data['features'][i]['geometry']['coordinates'][0][k][1] *= (long - longmin)*110/80


bc_small = nx.algorithms.centrality.betweenness_centrality(G_small)
bc_list_small = sorted(bc_small.items(),
                key = lambda x: x[1])
print("List of 5 highest betweenness centrality:", bc_list_small[-5:])

bc_large = nx.algorithms.centrality.betweenness_centrality(G_large)
bc_list_large = sorted(bc_large.items(),
                key = lambda x: x[1])
print("List of 5 highest betweenness centrality:", bc_list_large[-5:])

Daily foraging and seasonal migration between forest patches¶

I_Raw data obtention¶

II_Graph construction¶

Centroids representation¶

Weighted nodes construction¶

Edges construction¶

Illustration of the shapely buffer method¶

Computing the buffed polygons¶

Weighting edges¶

Representation of the graph¶

III_Graph analysis¶

Degree¶

Pagerank¶

Components¶

IV_Further analysis¶