import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import networkx as nx


karate = nx.karate_club_graph() #import the Zachary's karate club network data from NetworkX
karate_layout = nx.spring_layout(karate,seed=10) #fix a random layout so we can get a consistent look at the network

nx.draw(karate,karate_layout) #plot the network


network = nx.Graph() #initialize a new graph
network.add_nodes_from(range(1,13)) #add a set of nodes numbered 1 through 12
edgelist = [(1,2), 
            (1,3),
            (2,3),
            (2,4),
            (3,5),
            (4,5),
            (4,6),
            (5,6),
            (6,7),
            (7,8),
            (7,9),
            (8,9),
            (8,10),
            (9,11),
            (10,11),
            (10,12),
            (11,12)]
network.add_edges_from(edgelist) #add a set of links or edges to form a network
positions = nx.spring_layout(network,seed=10) #fix the position again
nx.draw(network,positions,node_color="lightblue",with_labels=True) #plot the network graph


nx.is_directed(network) #check if the network is directed (True) or undirected (False). (We should expect False)

False


deg = network.degree() # retrieve the degree sequence from our network
print(deg)

[(1, 2), (2, 3), (3, 3), (4, 3), (5, 3), (6, 3), (7, 3), (8, 3), (9, 3), (10, 3), (11, 3), (12, 2)]


plt.bar(*np.unique([d for n,d in deg], return_counts=True),width=0.25) # this could also be done using plt.hist([d for n,d in deg]), but this way looks nicer
plt.xticks([0,1,2,3,4]);
plt.xlabel("Degree");
plt.ylabel("Frequency");


deg = karate.degree() # retrieve the degree sequence from the karate club network, and plot its histogram
plt.bar(*np.unique([d for n,d in deg], return_counts=True),width=0.25)
plt.xticks(range(0,21));
plt.yticks(range(0,12));
plt.xlabel("Degree");
plt.ylabel("Frequency");


color_map = ["black","red","red","red","black","red","black","red","red","red","black","red","black","red","red","red","black"]
nx.draw(network,positions,node_color="lightblue",edge_color=color_map,with_labels=True) # highlight our long path


color_map = ["black","red","black","black","red","black","black","red","red","red","black","black","red","black","black","red","black"]
nx.draw(network,positions,node_color="lightblue",edge_color=color_map,with_labels=True) # highlight a shorter path


network.remove_edge(6,7) # delete the edge connecting node 6 to node 7
nx.draw(network,positions,node_color="lightblue",with_labels=True)


network.add_edge(6,7) # add the (6,7) link back to get our original network
A = nx.adjacency_matrix(network).todense() # retrieve the network adjacency matrix, and store it as a dense numpy matrix (this will return a sparse matrix by default, which doesn't look as pretty)
print(A)

[[0 1 1 0 0 0 0 0 0 0 0 0]
 [1 0 1 1 0 0 0 0 0 0 0 0]
 [1 1 0 0 1 0 0 0 0 0 0 0]
 [0 1 0 0 1 1 0 0 0 0 0 0]
 [0 0 1 1 0 1 0 0 0 0 0 0]
 [0 0 0 1 1 0 1 0 0 0 0 0]
 [0 0 0 0 0 1 0 1 1 0 0 0]
 [0 0 0 0 0 0 1 0 1 1 0 0]
 [0 0 0 0 0 0 1 1 0 0 1 0]
 [0 0 0 0 0 0 0 1 0 0 1 1]
 [0 0 0 0 0 0 0 0 1 1 0 1]
 [0 0 0 0 0 0 0 0 0 1 1 0]]


n_paths = np.linalg.matrix_power(A,6)[0,11] # raise the adjacency matrix to the power 6, and print the entry in the first row, 12th column.
print("There are", n_paths, "paths of length 6 from node 1 to node 12")

There are 0 paths of length 6 from node 1 to node 12


n_paths = np.linalg.matrix_power(A,7)[0,11] # raise the adjacency matrix to the power 7
print("There are", n_paths, "paths of length 7 from node 1 to node 12")

There are 4 paths of length 7 from node 1 to node 12


L = nx.laplacian_matrix(network).todense() # retrieve and print the laplacian matrix for our toy network
print(L)

[[ 2 -1 -1  0  0  0  0  0  0  0  0  0]
 [-1  3 -1 -1  0  0  0  0  0  0  0  0]
 [-1 -1  3  0 -1  0  0  0  0  0  0  0]
 [ 0 -1  0  3 -1 -1  0  0  0  0  0  0]
 [ 0  0 -1 -1  3 -1  0  0  0  0  0  0]
 [ 0  0  0 -1 -1  3 -1  0  0  0  0  0]
 [ 0  0  0  0  0 -1  3 -1 -1  0  0  0]
 [ 0  0  0  0  0  0 -1  3 -1 -1  0  0]
 [ 0  0  0  0  0  0 -1 -1  3  0 -1  0]
 [ 0  0  0  0  0  0  0 -1  0  3 -1 -1]
 [ 0  0  0  0  0  0  0  0 -1 -1  3 -1]
 [ 0  0  0  0  0  0  0  0  0 -1 -1  2]]


degrees = network.degree() # retrieve the degree sequence 
degree_colors = [degrees[i] for i in range(1,13)] # turn it into a vector
nx.draw(network,positions,node_color=degree_colors,with_labels=True) # plot the network with colors according to degree


centrality = nx.eigenvector_centrality(network) # compute eigenvector centrality using networkx
print(centrality)

{1: 0.1853442621469683, 2: 0.2679342551926453, 3: 0.2679342551926453, 4: 0.32137618934240997, 5: 0.32137618934240997, 6: 0.33985977126665573, 7: 0.33985977126665573, 8: 0.32137618934241, 9: 0.32137618934241, 10: 0.2679342551926454, 11: 0.2679342551926454, 12: 0.1853442621469684}


cent_colors = [centrality[i] for i in range(1,13)] # build a list of eigenvector centralities
nx.draw(network,positions,node_color=cent_colors,with_labels=True) # plot the graph with colors according to this list


(u,v) = np.linalg.eig(L) # get the eigenvalue decomposition of the laplacian matrix
u_sorted = np.sort(u) # sort the eigenvalues
v_sorted = v[:, u.argsort()] # sort the eigenvectors to match the eigenvalues
plt.scatter(range(1,13),u_sorted) # show a scatterplot of the eigenvalues in increasing order

<matplotlib.collections.PathCollection at 0x2789aece310>


network.remove_edge(1,2) # remove the edge connecting node 1 to node 2, and draw the network
nx.draw(network,positions,node_color="lightblue",with_labels=True)


L = nx.laplacian_matrix(network).todense() # get the laplacian matrix of our new graph, without the (1,2) edge
(u,v) = np.linalg.eig(L) # get the eigenvalue decomposition of the laplacian matrix
u_sorted = np.sort(u) # sort the eigenvalues
v_sorted = v[:, u.argsort()] # sort the eigenvectors to match the eigenvalues
plt.scatter(range(1,13),u_sorted) # show a scatterplot of the eigenvalues in increasing order

<matplotlib.collections.PathCollection at 0x2789afa4190>


network.add_edge(1,2) # return the graph to normal
network.remove_edge(6,7) # delete the link from 6 to 7, and draw the network
nx.draw(network,positions,node_color="lightblue",with_labels=True)


L = nx.laplacian_matrix(network).todense() # get the laplacian matrix of our new graph, without the (6,7) edge
(u,v) = np.linalg.eig(L) # get the eigenvalue decomposition, sort the values and vectors, and plot the resulting sequence
u_sorted = np.sort(u)
v_sorted = v[:, u.argsort()]
plt.scatter(range(1,13),u_sorted)

<matplotlib.collections.PathCollection at 0x2789b066ee0>


network.remove_edges_from([(3,5),(2,4),(8,10),(9,11)]) # remove a set of links, plot the result
nx.draw(network,positions,node_color="lightblue",with_labels=True)


L = nx.laplacian_matrix(network).todense() # get the laplacian matrix of our new "islands" graph
(u,v) = np.linalg.eig(L) # get the eigenvalue decomposition, sort the values and vectors, and plot the resulting sequence
u_sorted = np.sort(u)
v_sorted = v[:, u.argsort()]
plt.scatter(range(1,13),u_sorted)

<matplotlib.collections.PathCollection at 0x2789b09d4f0>


network.add_edges_from([(3,5),(2,4),(8,10),(9,11),(6,7)]) # add back the set of edges that we deleted


L = nx.laplacian_matrix(network).todense() # retrieve the spectrum of our original graph
(u,v) = np.linalg.eig(L)
u_sorted = np.sort(u)
v_sorted = v[:, u.argsort()]
plt.scatter(range(1,13),u_sorted) # remind us what the plot looked like

<matplotlib.collections.PathCollection at 0x2789af60250>


print(v_sorted[:,1])

[[-0.36274292]
 [-0.33412898]
 [-0.33412898]
 [-0.2528014 ]
 [-0.2528014 ]
 [-0.13159078]
 [ 0.13159078]
 [ 0.2528014 ]
 [ 0.2528014 ]
 [ 0.33412898]
 [ 0.33412898]
 [ 0.36274292]]


colors = [ "lightcoral" for i in range(1,13) ] # assign a nice reddish color to all nodes
for i in range(0,12): # for any nodes that have a negative entry, replace this with a nice purplish color
    if (v[i,1] < 0):
        colors[i] = "mediumpurple"
        
nx.draw(network,positions,node_color=colors,with_labels=True) # draw the result


eigen_cent = nx.eigenvector_centrality(karate)
eigen_colors = [eigen_cent[i] for i in range(0,34)]
nx.draw(karate,karate_layout,node_color=eigen_colors)


L = nx.laplacian_matrix(karate).todense() # retrieve and plot the spectrum of Zachary's karate club graph
(u,v) = np.linalg.eig(L)
u_sorted = np.sort(u)
v_sorted = v[:, u.argsort()]
plt.scatter(range(1,35),u_sorted)

<matplotlib.collections.PathCollection at 0x2789b0ac190>


colors = [ "lightcoral" for i in range(0,34) ] # assign colors to the nodes based on the sign of their entry in the Fiedler vector
for i in range(0,34):
    if (v_sorted[i,1] < 0):
        colors[i] = "mediumpurple"
        
nx.draw(karate,karate_layout,node_color=colors) # draw the result


df = pd.read_csv('stocks.csv') # load a dataset of weekly returns for some popular stocks over the past year
df.head(5) # take a peek at the data


returns = df[1:] # remove the dates
corr = returns.corr() # calculate the correlations between the returns of each pair of stocks
corr # display the correlation matrix


def truncate(f): # define a function that "rounds" a number to 0 if it is lower than 0.92, and to 1 if it is higher (or equal).
    if (abs(f) < 0.92):
        return 0.
    else:
        return 1
    
# we already know that every stock is perfectly correlated with itself, so the ones on the diagonal are not really useful information. Let's get rid of them.
adj = corr.applymap(truncate) - np.identity(10)
adj


stocknet = nx.from_numpy_matrix(adj.to_numpy()) # initialize a new graph from our adjacency matrix
stocknet = nx.relabel_nodes(stocknet, dict(enumerate(adj.columns))) # keep the stock tickers as the names of the nodes (instead of integers)
stock_layout = nx.spring_layout(stocknet,seed=10) # fix our layout
nx.draw(stocknet,stock_layout) # plot the graph, without any labels (for now)


L = nx.laplacian_matrix(stocknet).todense()
(u,v) = np.linalg.eig(L)
u_sorted = np.sort(u)
v_sorted = v[:, u.argsort()]
colors = [ "lightcoral" for i in range(0,10) ]
for i in range(0,10):
    if (v_sorted[i,1] < 0):
        colors[i] = "mediumpurple"
        
nx.draw(stocknet,stock_layout,node_color=colors)


nx.draw(stocknet,stock_layout,node_color=colors,with_labels=True)

	Date	AAPL	AMZN	BAC	C	FB	GOOG	MSFT	JPM	V	WFC
0	1/25/2021	0.036374	0.045521	-0.063456	0.047653	0.037820	0.142863	0.044145	0.022682	0.010891	0.113961
1	2/1/2021	-0.008685	-0.022207	0.052859	0.036858	0.008952	0.002912	0.011519	0.030858	0.037142	0.011411
2	2/8/2021	-0.040629	-0.008485	0.043816	0.035116	-0.033050	-0.001412	-0.016409	0.066417	0.031438	0.054223
3	2/15/2021	-0.066297	-0.048300	0.081788	0.058597	-0.015063	-0.030593	-0.033426	0.045614	0.039482	0.038190
4	2/22/2021	0.001319	-0.029897	0.096682	0.090000	0.025852	0.035191	-0.003357	0.093960	0.073817	0.120655

	AAPL	AMZN	BAC	C	FB	GOOG	MSFT	JPM	V	WFC
AAPL	1.000000	0.975844	0.922079	0.938198	0.964855	0.980586	0.986651	0.898194	0.929911	0.923325
AMZN	0.975844	1.000000	0.915539	0.925417	0.973629	0.978831	0.972704	0.889032	0.916407	0.913548
BAC	0.922079	0.915539	1.000000	0.986195	0.918874	0.936426	0.924780	0.959968	0.990712	0.987352
C	0.938198	0.925417	0.986195	1.000000	0.931981	0.947331	0.942960	0.950910	0.981090	0.992604
FB	0.964855	0.973629	0.918874	0.931981	1.000000	0.974683	0.964384	0.892842	0.917335	0.920788
GOOG	0.980586	0.978831	0.936426	0.947331	0.974683	1.000000	0.987984	0.913572	0.934986	0.936900
MSFT	0.986651	0.972704	0.924780	0.942960	0.964384	0.987984	1.000000	0.900485	0.928255	0.928075
JPM	0.898194	0.889032	0.959968	0.950910	0.892842	0.913572	0.900485	1.000000	0.950009	0.954812
V	0.929911	0.916407	0.990712	0.981090	0.917335	0.934986	0.928255	0.950009	1.000000	0.983043
WFC	0.923325	0.913548	0.987352	0.992604	0.920788	0.936900	0.928075	0.954812	0.983043	1.000000

	AAPL	AMZN	BAC	C	FB	GOOG	MSFT	JPM	V	WFC
AAPL	0.0	1.0	1.0	1.0	1.0	1.0	1.0	0.0	1.0	1.0
AMZN	1.0	0.0	0.0	1.0	1.0	1.0	1.0	0.0	0.0	0.0
BAC	1.0	0.0	0.0	1.0	0.0	1.0	1.0	1.0	1.0	1.0
C	1.0	1.0	1.0	0.0	1.0	1.0	1.0	1.0	1.0	1.0
FB	1.0	1.0	0.0	1.0	0.0	1.0	1.0	0.0	0.0	1.0
GOOG	1.0	1.0	1.0	1.0	1.0	0.0	1.0	0.0	1.0	1.0
MSFT	1.0	1.0	1.0	1.0	1.0	1.0	0.0	0.0	1.0	1.0
JPM	0.0	0.0	1.0	1.0	0.0	0.0	0.0	0.0	1.0	1.0
V	1.0	0.0	1.0	1.0	0.0	1.0	1.0	1.0	0.0	1.0
WFC	1.0	0.0	1.0	1.0	1.0	1.0	1.0	1.0	1.0	0.0

Analyzing Economic Networks¶

Philip Solimine ¶

Objectives¶

What is a network?¶

Graph theory and NetworkX¶

Creating a new graph¶

(Un)directedness¶

Degree¶

Connectivity and routing¶

Matrix representations¶

Spectral graph theory¶

Eigenvector centrality¶

Spectral graph clustering¶

Applications¶

Analyzing Economic Networks¶

Philip Solimine¶

Objectives¶

What is a network?¶

Graph theory and NetworkX¶

Creating a new graph¶

(Un)directedness¶

Degree¶

Connectivity and routing¶

Matrix representations¶

Spectral graph theory¶

Eigenvector centrality¶

Spectral graph clustering¶

Applications¶

Philip Solimine ¶