import networkx as nx

def print_info(G, desc):
    """Print a one-line summary of a graph.

    Args:
        G: Graph-like object supporting ``len()`` (node count) and an
            ``edges()`` method whose result supports ``len()``.
        desc: Label placed at the start of the printed line.

    Returns:
        None. The summary is written to standard output.
    """
    node_total = len(G)
    edge_total = len(G.edges())
    summary = "{}, nodes: {}, edges: {}".format(desc, node_total, edge_total)
    print(summary)

# Load each sample network from the local data/ directory and print its
# node and edge counts with print_info(). The resulting module-level names
# (lesmis, collab, powgrid, airline, neural, gloss) are reused further down.
# .gml files are read with nx.read_gml, .paj files with nx.read_pajek.
lesmis = nx.read_gml('data/lesmis.gml')
print_info(lesmis, 'Les Miserables')

collab = nx.read_gml('data/netscience.gml')
print_info(collab, "Collaboration of network scientists")

powgrid = nx.read_gml('data/power.gml')
print_info(powgrid, "Power grid")

# NOTE(review): read_pajek presumably returns a multigraph (later code wraps
# this in nx.Graph before computing statistics) -- confirm.
airline = nx.read_pajek('data/air.paj')
print_info(airline, "Air lines in US")

neural = nx.read_gml('data/celegansneural.gml')
print_info(neural, "C. Elegans neural network")

gloss = nx.read_pajek('data/glossary.paj')
print_info(gloss, "Glossary of Graphs and Digraphs")

Les Miserables, nodes: 77, edges: 254
Collaboration of network scientists, nodes: 1589, edges: 2742
Power grid, nodes: 4941, edges: 6594
Air lines in US, nodes: 332, edges: 2126
C. Elegans neural network, nodes: 297, edges: 1875
Glossary of Graphs and Digraphs, nodes: 72, edges: 118


import matplotlib.pyplot as plt

# Bar-chart demo: integer x values from -10 to 10 inclusive and their squares.
x = range(-10,11)
y = [i**2 for i in x]

# One bar per x value, with height x**2.
plt.bar(x, y)

# Title and axis labels for the current figure.
plt.title("Parabola")
plt.ylabel("y")
plt.xlabel("x")

Text(0.5, 0, 'x')


import collections
import matplotlib.pyplot as plt
import networkx as nx

def draw_deg_distr(G):
    """Draw a bar chart of the degree distribution of ``G``.

    Each bar sits at a degree value and its height is the number of nodes
    having that degree. The chart is drawn on the current matplotlib figure
    with ``plt.draw()``.

    Args:
        G: A networkx graph; ``G.degree()`` must yield ``(node, degree)``
            pairs.

    Returns:
        None.
    """
    # Counter does not need sorted input, so count degrees in a single pass.
    degree_count = collections.Counter(deg for _, deg in G.degree())

    if degree_count:
        # Sort by degree so the x values are passed in ascending order.
        degree, count = zip(*sorted(degree_count.items()))
    else:
        # An empty graph has no degrees; zip(*...) would give nothing to
        # unpack, so plot an empty chart instead of raising ValueError.
        degree, count = (), ()

    plt.bar(degree, count)
    plt.title("Degree distribution")
    plt.ylabel("Frequency")
    plt.xlabel("Degree")
    plt.draw()

# Synthetic example graph from nx.lollipop_graph(8, 10); the calls that would
# draw it and its degree distribution are currently commented out.
lollipop = nx.lollipop_graph(8, 10)
#nx.draw(lollipop)
#draw_deg_distr(lollipop)


# Plot the degree distribution of one dataset at a time; only the
# Les Miserables call is active, the others are commented out.
draw_deg_distr(lesmis)
#draw_deg_distr(collab)
#draw_deg_distr(powgrid)
#draw_deg_distr(airline)
#draw_deg_distr(neural)
#draw_deg_distr(gloss)


import collections
import networkx as nx

def save_fraction_deg(G, filename):
    """Write the fraction of nodes having each degree to a text file.

    The file starts with the header line ``# Degree Fraction`` followed by
    one ``<degree> <fraction>`` line per distinct degree, highest degree
    first. ``fraction`` is the node count for that degree divided by
    ``len(G)``.

    Args:
        G: Graph-like object supporting ``len()``, ``nodes()`` and
            ``degree[node]`` lookups.
        filename: Path of the output file; it is opened in ``'w'`` mode, so
            existing content is overwritten.

    Returns:
        None.
    """
    total_nodes = len(G)

    # Descending order here fixes the order of the Counter's keys, and
    # therefore the order of the lines in the output file.
    degrees_desc = [G.degree[node] for node in G.nodes()]
    degrees_desc.sort(reverse=True)
    tally = collections.Counter(degrees_desc)

    rows = ["# Degree Fraction\n"]
    for degree, occurrences in tally.items():
        rows.append("{} {}\n".format(degree, occurrences/total_nodes))

    with open(filename, 'w') as sink:
        sink.writelines(rows)

# Write a degree-fraction table for a 4-node path graph and for each loaded
# dataset. The file names are relative, so the .dat files are created in the
# current working directory.
# NOTE(review): presumably these files are plotted with Gnuplot afterwards -- confirm.
save_fraction_deg(nx.path_graph(4), 'path4-deg-frac.dat')
save_fraction_deg(lesmis, 'lesmis-deg-frac.dat')
save_fraction_deg(collab, 'collab-deg-frac.dat')
save_fraction_deg(powgrid, 'powgrid-deg-frac.dat')
save_fraction_deg(airline, 'airline-deg-frac.dat')
save_fraction_deg(neural, 'neural-deg-frac.dat')
save_fraction_deg(gloss, 'gloss-deg-frac.dat')


def largest_conn_comp(G):
    """Return a copy of the largest connected component of ``G``.

    Directed graphs are split into weakly connected components; undirected
    graphs into ordinary connected components. The component with the most
    nodes is selected.

    Args:
        G: An ``nx.Graph`` or ``nx.DiGraph`` instance (or a subclass).

    Returns:
        An independent copy of the subgraph of ``G`` induced by the nodes of
        the largest component.

    Raises:
        TypeError: If ``G`` is neither an ``nx.DiGraph`` nor an ``nx.Graph``.
        ValueError: If ``G`` has no nodes, because ``max()`` receives an
            empty sequence of components.
    """
    # The directed case is tested first, as in the original branch order.
    if isinstance(G, nx.DiGraph):
        find_components = nx.weakly_connected_components
    elif isinstance(G, nx.Graph):
        find_components = nx.connected_components
    else:
        raise TypeError(
            "expected a networkx Graph or DiGraph, got {}".format(
                type(G).__name__
            )
        )

    largest_cc = max(find_components(G), key=len)
    # .copy() detaches the result from G; subgraph() alone returns a view.
    return G.subgraph(largest_cc).copy()

def print_stats(G, desc):
    """Print the average shortest path length and average clustering of ``G``.

    Both values are computed by networkx (``nx.average_shortest_path_length``
    and ``nx.average_clustering``) and printed on one line with two decimals.

    Args:
        G: Graph passed unchanged to both networkx functions.
        desc: Label placed at the start of the printed line.

    Returns:
        None. The line is written to standard output.
    """
    template = "{}, average shortest path length: {: 0.2f}, average clustering: {: 0.2f}"
    mean_path_length = nx.average_shortest_path_length(G)
    mean_clustering = nx.average_clustering(G)
    print(template.format(desc, mean_path_length, mean_clustering))

# Print path-length and clustering statistics for every dataset.
# collab, neural and gloss are first reduced to their largest connected
# component; airline and gloss (both read with read_pajek) are converted to
# a plain nx.Graph.
# NOTE(review): presumably the reduction is needed because the average
# shortest path length requires a connected graph, and the nx.Graph
# conversion because clustering is not defined for multigraphs -- confirm.
print_stats(lesmis, "Les Miserables network")
print_stats(largest_conn_comp(collab), "Netscience collaboration")
print_stats(powgrid, "Power grid network")
print_stats(nx.Graph(airline), "Airline connections US")
print_stats(largest_conn_comp(neural), "C. Elegans neural network")
print_stats(largest_conn_comp(nx.Graph(gloss)), "Graph theory glossary")

Les Miserables network, average shortest path length:  2.64, average clustering:  0.57
Netscience collaboration, average shortest path length:  6.04, average clustering:  0.74
Power grid network, average shortest path length:  18.99, average clustering:  0.08
Airline connections US, average shortest path length:  2.74, average clustering:  0.63
C. Elegans neural network, average shortest path length:  2.12, average clustering:  0.19
Graph theory glossary, average shortest path length:  3.10, average clustering:  0.28

Tutorial 5: Analysis of real complex networks¶

Degree distribution¶

Scale-free property¶

Gnuplot¶

Clustering coefficient¶