Mercurial > repos > guerler > springsuite
comparison planemo/lib/python3.7/site-packages/networkx/algorithms/threshold.py @ 1:56ad4e20f292 draft
"planemo upload commit 6eee67778febed82ddd413c3ca40b3183a3898f1"
| author | guerler |
|---|---|
| date | Fri, 31 Jul 2020 00:32:28 -0400 |
| parents | |
| children |
comparison
equal
deleted
inserted
replaced
| 0:d30785e31577 | 1:56ad4e20f292 |
|---|---|
| 1 # Copyright (C) 2004-2019 by | |
| 2 # Aric Hagberg <hagberg@lanl.gov> | |
| 3 # Dan Schult <dschult@colgate.edu> | |
| 4 # Pieter Swart <swart@lanl.gov> | |
| 5 # All rights reserved. | |
| 6 # BSD license. | |
| 7 # | |
| 8 # Authors: Aric Hagberg (hagberg@lanl.gov) | |
| 9 # Pieter Swart (swart@lanl.gov) | |
| 10 # Dan Schult (dschult@colgate.edu) | |
| 11 """ | |
| 12 Threshold Graphs - Creation, manipulation and identification. | |
| 13 """ | |
| 14 from math import sqrt | |
| 15 import networkx as nx | |
| 16 from networkx.utils import py_random_state | |
| 17 | |
| 18 __all__ = ['is_threshold_graph', 'find_threshold_graph'] | |
| 19 | |
| 20 | |
| 21 def is_threshold_graph(G): | |
| 22 """ | |
| 23 Returns True if G is a threshold graph. | |
| 24 """ | |
| 25 return is_threshold_sequence(list(d for n, d in G.degree())) | |
| 26 | |
| 27 | |
| 28 def is_threshold_sequence(degree_sequence): | |
| 29 """ | |
| 30 Returns True if the sequence is a threshold degree seqeunce. | |
| 31 | |
| 32 Uses the property that a threshold graph must be constructed by | |
| 33 adding either dominating or isolated nodes. Thus, it can be | |
| 34 deconstructed iteratively by removing a node of degree zero or a | |
| 35 node that connects to the remaining nodes. If this deconstruction | |
| 36 failes then the sequence is not a threshold sequence. | |
| 37 """ | |
| 38 ds = degree_sequence[:] # get a copy so we don't destroy original | |
| 39 ds.sort() | |
| 40 while ds: | |
| 41 if ds[0] == 0: # if isolated node | |
| 42 ds.pop(0) # remove it | |
| 43 continue | |
| 44 if ds[-1] != len(ds) - 1: # is the largest degree node dominating? | |
| 45 return False # no, not a threshold degree sequence | |
| 46 ds.pop() # yes, largest is the dominating node | |
| 47 ds = [d - 1 for d in ds] # remove it and decrement all degrees | |
| 48 return True | |
| 49 | |
| 50 | |
| 51 def creation_sequence(degree_sequence, with_labels=False, compact=False): | |
| 52 """ | |
| 53 Determines the creation sequence for the given threshold degree sequence. | |
| 54 | |
| 55 The creation sequence is a list of single characters 'd' | |
| 56 or 'i': 'd' for dominating or 'i' for isolated vertices. | |
| 57 Dominating vertices are connected to all vertices present when it | |
| 58 is added. The first node added is by convention 'd'. | |
| 59 This list can be converted to a string if desired using "".join(cs) | |
| 60 | |
| 61 If with_labels==True: | |
| 62 Returns a list of 2-tuples containing the vertex number | |
| 63 and a character 'd' or 'i' which describes the type of vertex. | |
| 64 | |
| 65 If compact==True: | |
| 66 Returns the creation sequence in a compact form that is the number | |
| 67 of 'i's and 'd's alternating. | |
| 68 Examples: | |
| 69 [1,2,2,3] represents d,i,i,d,d,i,i,i | |
| 70 [3,1,2] represents d,d,d,i,d,d | |
| 71 | |
| 72 Notice that the first number is the first vertex to be used for | |
| 73 construction and so is always 'd'. | |
| 74 | |
| 75 with_labels and compact cannot both be True. | |
| 76 | |
| 77 Returns None if the sequence is not a threshold sequence | |
| 78 """ | |
| 79 if with_labels and compact: | |
| 80 raise ValueError("compact sequences cannot be labeled") | |
| 81 | |
| 82 # make an indexed copy | |
| 83 if isinstance(degree_sequence, dict): # labeled degree seqeunce | |
| 84 ds = [[degree, label] for (label, degree) in degree_sequence.items()] | |
| 85 else: | |
| 86 ds = [[d, i] for i, d in enumerate(degree_sequence)] | |
| 87 ds.sort() | |
| 88 cs = [] # creation sequence | |
| 89 while ds: | |
| 90 if ds[0][0] == 0: # isolated node | |
| 91 (d, v) = ds.pop(0) | |
| 92 if len(ds) > 0: # make sure we start with a d | |
| 93 cs.insert(0, (v, 'i')) | |
| 94 else: | |
| 95 cs.insert(0, (v, 'd')) | |
| 96 continue | |
| 97 if ds[-1][0] != len(ds) - 1: # Not dominating node | |
| 98 return None # not a threshold degree sequence | |
| 99 (d, v) = ds.pop() | |
| 100 cs.insert(0, (v, 'd')) | |
| 101 ds = [[d[0] - 1, d[1]] for d in ds] # decrement due to removing node | |
| 102 | |
| 103 if with_labels: | |
| 104 return cs | |
| 105 if compact: | |
| 106 return make_compact(cs) | |
| 107 return [v[1] for v in cs] # not labeled | |
| 108 | |
| 109 | |
| 110 def make_compact(creation_sequence): | |
| 111 """ | |
| 112 Returns the creation sequence in a compact form | |
| 113 that is the number of 'i's and 'd's alternating. | |
| 114 | |
| 115 Examples | |
| 116 -------- | |
| 117 >>> from networkx.algorithms.threshold import make_compact | |
| 118 >>> make_compact(['d', 'i', 'i', 'd', 'd', 'i', 'i', 'i']) | |
| 119 [1, 2, 2, 3] | |
| 120 >>> make_compact(['d', 'd', 'd', 'i', 'd', 'd']) | |
| 121 [3, 1, 2] | |
| 122 | |
| 123 Notice that the first number is the first vertex | |
| 124 to be used for construction and so is always 'd'. | |
| 125 | |
| 126 Labeled creation sequences lose their labels in the | |
| 127 compact representation. | |
| 128 | |
| 129 >>> make_compact([3, 1, 2]) | |
| 130 [3, 1, 2] | |
| 131 """ | |
| 132 first = creation_sequence[0] | |
| 133 if isinstance(first, str): # creation sequence | |
| 134 cs = creation_sequence[:] | |
| 135 elif isinstance(first, tuple): # labeled creation sequence | |
| 136 cs = [s[1] for s in creation_sequence] | |
| 137 elif isinstance(first, int): # compact creation sequence | |
| 138 return creation_sequence | |
| 139 else: | |
| 140 raise TypeError("Not a valid creation sequence type") | |
| 141 | |
| 142 ccs = [] | |
| 143 count = 1 # count the run lengths of d's or i's. | |
| 144 for i in range(1, len(cs)): | |
| 145 if cs[i] == cs[i - 1]: | |
| 146 count += 1 | |
| 147 else: | |
| 148 ccs.append(count) | |
| 149 count = 1 | |
| 150 ccs.append(count) # don't forget the last one | |
| 151 return ccs | |
| 152 | |
| 153 | |
| 154 def uncompact(creation_sequence): | |
| 155 """ | |
| 156 Converts a compact creation sequence for a threshold | |
| 157 graph to a standard creation sequence (unlabeled). | |
| 158 If the creation_sequence is already standard, return it. | |
| 159 See creation_sequence. | |
| 160 """ | |
| 161 first = creation_sequence[0] | |
| 162 if isinstance(first, str): # creation sequence | |
| 163 return creation_sequence | |
| 164 elif isinstance(first, tuple): # labeled creation sequence | |
| 165 return creation_sequence | |
| 166 elif isinstance(first, int): # compact creation sequence | |
| 167 ccscopy = creation_sequence[:] | |
| 168 else: | |
| 169 raise TypeError("Not a valid creation sequence type") | |
| 170 cs = [] | |
| 171 while ccscopy: | |
| 172 cs.extend(ccscopy.pop(0) * ['d']) | |
| 173 if ccscopy: | |
| 174 cs.extend(ccscopy.pop(0) * ['i']) | |
| 175 return cs | |
| 176 | |
| 177 | |
| 178 def creation_sequence_to_weights(creation_sequence): | |
| 179 """ | |
| 180 Returns a list of node weights which create the threshold | |
| 181 graph designated by the creation sequence. The weights | |
| 182 are scaled so that the threshold is 1.0. The order of the | |
| 183 nodes is the same as that in the creation sequence. | |
| 184 """ | |
| 185 # Turn input sequence into a labeled creation sequence | |
| 186 first = creation_sequence[0] | |
| 187 if isinstance(first, str): # creation sequence | |
| 188 if isinstance(creation_sequence, list): | |
| 189 wseq = creation_sequence[:] | |
| 190 else: | |
| 191 wseq = list(creation_sequence) # string like 'ddidid' | |
| 192 elif isinstance(first, tuple): # labeled creation sequence | |
| 193 wseq = [v[1] for v in creation_sequence] | |
| 194 elif isinstance(first, int): # compact creation sequence | |
| 195 wseq = uncompact(creation_sequence) | |
| 196 else: | |
| 197 raise TypeError("Not a valid creation sequence type") | |
| 198 # pass through twice--first backwards | |
| 199 wseq.reverse() | |
| 200 w = 0 | |
| 201 prev = 'i' | |
| 202 for j, s in enumerate(wseq): | |
| 203 if s == 'i': | |
| 204 wseq[j] = w | |
| 205 prev = s | |
| 206 elif prev == 'i': | |
| 207 prev = s | |
| 208 w += 1 | |
| 209 wseq.reverse() # now pass through forwards | |
| 210 for j, s in enumerate(wseq): | |
| 211 if s == 'd': | |
| 212 wseq[j] = w | |
| 213 prev = s | |
| 214 elif prev == 'd': | |
| 215 prev = s | |
| 216 w += 1 | |
| 217 # Now scale weights | |
| 218 if prev == 'd': | |
| 219 w += 1 | |
| 220 wscale = 1. / float(w) | |
| 221 return [ww * wscale for ww in wseq] | |
| 222 # return wseq | |
| 223 | |
| 224 | |
| 225 def weights_to_creation_sequence(weights, threshold=1, with_labels=False, compact=False): | |
| 226 """ | |
| 227 Returns a creation sequence for a threshold graph | |
| 228 determined by the weights and threshold given as input. | |
| 229 If the sum of two node weights is greater than the | |
| 230 threshold value, an edge is created between these nodes. | |
| 231 | |
| 232 The creation sequence is a list of single characters 'd' | |
| 233 or 'i': 'd' for dominating or 'i' for isolated vertices. | |
| 234 Dominating vertices are connected to all vertices present | |
| 235 when it is added. The first node added is by convention 'd'. | |
| 236 | |
| 237 If with_labels==True: | |
| 238 Returns a list of 2-tuples containing the vertex number | |
| 239 and a character 'd' or 'i' which describes the type of vertex. | |
| 240 | |
| 241 If compact==True: | |
| 242 Returns the creation sequence in a compact form that is the number | |
| 243 of 'i's and 'd's alternating. | |
| 244 Examples: | |
| 245 [1,2,2,3] represents d,i,i,d,d,i,i,i | |
| 246 [3,1,2] represents d,d,d,i,d,d | |
| 247 | |
| 248 Notice that the first number is the first vertex to be used for | |
| 249 construction and so is always 'd'. | |
| 250 | |
| 251 with_labels and compact cannot both be True. | |
| 252 """ | |
| 253 if with_labels and compact: | |
| 254 raise ValueError("compact sequences cannot be labeled") | |
| 255 | |
| 256 # make an indexed copy | |
| 257 if isinstance(weights, dict): # labeled weights | |
| 258 wseq = [[w, label] for (label, w) in weights.items()] | |
| 259 else: | |
| 260 wseq = [[w, i] for i, w in enumerate(weights)] | |
| 261 wseq.sort() | |
| 262 cs = [] # creation sequence | |
| 263 cutoff = threshold - wseq[-1][0] | |
| 264 while wseq: | |
| 265 if wseq[0][0] < cutoff: # isolated node | |
| 266 (w, label) = wseq.pop(0) | |
| 267 cs.append((label, 'i')) | |
| 268 else: | |
| 269 (w, label) = wseq.pop() | |
| 270 cs.append((label, 'd')) | |
| 271 cutoff = threshold - wseq[-1][0] | |
| 272 if len(wseq) == 1: # make sure we start with a d | |
| 273 (w, label) = wseq.pop() | |
| 274 cs.append((label, 'd')) | |
| 275 # put in correct order | |
| 276 cs.reverse() | |
| 277 | |
| 278 if with_labels: | |
| 279 return cs | |
| 280 if compact: | |
| 281 return make_compact(cs) | |
| 282 return [v[1] for v in cs] # not labeled | |
| 283 | |
| 284 | |
| 285 # Manipulating NetworkX.Graphs in context of threshold graphs | |
| 286 def threshold_graph(creation_sequence, create_using=None): | |
| 287 """ | |
| 288 Create a threshold graph from the creation sequence or compact | |
| 289 creation_sequence. | |
| 290 | |
| 291 The input sequence can be a | |
| 292 | |
| 293 creation sequence (e.g. ['d','i','d','d','d','i']) | |
| 294 labeled creation sequence (e.g. [(0,'d'),(2,'d'),(1,'i')]) | |
| 295 compact creation sequence (e.g. [2,1,1,2,0]) | |
| 296 | |
| 297 Use cs=creation_sequence(degree_sequence,labeled=True) | |
| 298 to convert a degree sequence to a creation sequence. | |
| 299 | |
| 300 Returns None if the sequence is not valid | |
| 301 """ | |
| 302 # Turn input sequence into a labeled creation sequence | |
| 303 first = creation_sequence[0] | |
| 304 if isinstance(first, str): # creation sequence | |
| 305 ci = list(enumerate(creation_sequence)) | |
| 306 elif isinstance(first, tuple): # labeled creation sequence | |
| 307 ci = creation_sequence[:] | |
| 308 elif isinstance(first, int): # compact creation sequence | |
| 309 cs = uncompact(creation_sequence) | |
| 310 ci = list(enumerate(cs)) | |
| 311 else: | |
| 312 print("not a valid creation sequence type") | |
| 313 return None | |
| 314 | |
| 315 G = nx.empty_graph(0, create_using) | |
| 316 if G.is_directed(): | |
| 317 raise nx.NetworkXError("Directed Graph not supported") | |
| 318 | |
| 319 G.name = "Threshold Graph" | |
| 320 | |
| 321 # add nodes and edges | |
| 322 # if type is 'i' just add nodea | |
| 323 # if type is a d connect to everything previous | |
| 324 while ci: | |
| 325 (v, node_type) = ci.pop(0) | |
| 326 if node_type == 'd': # dominating type, connect to all existing nodes | |
| 327 # We use `for u in list(G):` instead of | |
| 328 # `for u in G:` because we edit the graph `G` in | |
| 329 # the loop. Hence using an iterator will result in | |
| 330 # `RuntimeError: dictionary changed size during iteration` | |
| 331 for u in list(G): | |
| 332 G.add_edge(v, u) | |
| 333 G.add_node(v) | |
| 334 return G | |
| 335 | |
| 336 | |
| 337 def find_alternating_4_cycle(G): | |
| 338 """ | |
| 339 Returns False if there aren't any alternating 4 cycles. | |
| 340 Otherwise returns the cycle as [a,b,c,d] where (a,b) | |
| 341 and (c,d) are edges and (a,c) and (b,d) are not. | |
| 342 """ | |
| 343 for (u, v) in G.edges(): | |
| 344 for w in G.nodes(): | |
| 345 if not G.has_edge(u, w) and u != w: | |
| 346 for x in G.neighbors(w): | |
| 347 if not G.has_edge(v, x) and v != x: | |
| 348 return [u, v, w, x] | |
| 349 return False | |
| 350 | |
| 351 | |
| 352 def find_threshold_graph(G, create_using=None): | |
| 353 """ | |
| 354 Return a threshold subgraph that is close to largest in G. | |
| 355 The threshold graph will contain the largest degree node in G. | |
| 356 | |
| 357 """ | |
| 358 return threshold_graph(find_creation_sequence(G), create_using) | |
| 359 | |
| 360 | |
| 361 def find_creation_sequence(G): | |
| 362 """ | |
| 363 Find a threshold subgraph that is close to largest in G. | |
| 364 Returns the labeled creation sequence of that threshold graph. | |
| 365 """ | |
| 366 cs = [] | |
| 367 # get a local pointer to the working part of the graph | |
| 368 H = G | |
| 369 while H.order() > 0: | |
| 370 # get new degree sequence on subgraph | |
| 371 dsdict = dict(H.degree()) | |
| 372 ds = [(d, v) for v, d in dsdict.items()] | |
| 373 ds.sort() | |
| 374 # Update threshold graph nodes | |
| 375 if ds[-1][0] == 0: # all are isolated | |
| 376 cs.extend(zip(dsdict, ['i'] * (len(ds) - 1) + ['d'])) | |
| 377 break # Done! | |
| 378 # pull off isolated nodes | |
| 379 while ds[0][0] == 0: | |
| 380 (d, iso) = ds.pop(0) | |
| 381 cs.append((iso, 'i')) | |
| 382 # find new biggest node | |
| 383 (d, bigv) = ds.pop() | |
| 384 # add edges of star to t_g | |
| 385 cs.append((bigv, 'd')) | |
| 386 # form subgraph of neighbors of big node | |
| 387 H = H.subgraph(H.neighbors(bigv)) | |
| 388 cs.reverse() | |
| 389 return cs | |
| 390 | |
| 391 | |
| 392 # Properties of Threshold Graphs | |
| 393 def triangles(creation_sequence): | |
| 394 """ | |
| 395 Compute number of triangles in the threshold graph with the | |
| 396 given creation sequence. | |
| 397 """ | |
| 398 # shortcut algorithm that doesn't require computing number | |
| 399 # of triangles at each node. | |
| 400 cs = creation_sequence # alias | |
| 401 dr = cs.count("d") # number of d's in sequence | |
| 402 ntri = dr * (dr - 1) * (dr - 2) / 6 # number of triangles in clique of nd d's | |
| 403 # now add dr choose 2 triangles for every 'i' in sequence where | |
| 404 # dr is the number of d's to the right of the current i | |
| 405 for i, typ in enumerate(cs): | |
| 406 if typ == "i": | |
| 407 ntri += dr * (dr - 1) / 2 | |
| 408 else: | |
| 409 dr -= 1 | |
| 410 return ntri | |
| 411 | |
| 412 | |
| 413 def triangle_sequence(creation_sequence): | |
| 414 """ | |
| 415 Return triangle sequence for the given threshold graph creation sequence. | |
| 416 | |
| 417 """ | |
| 418 cs = creation_sequence | |
| 419 seq = [] | |
| 420 dr = cs.count("d") # number of d's to the right of the current pos | |
| 421 dcur = (dr - 1) * (dr - 2) // 2 # number of triangles through a node of clique dr | |
| 422 irun = 0 # number of i's in the last run | |
| 423 drun = 0 # number of d's in the last run | |
| 424 for i, sym in enumerate(cs): | |
| 425 if sym == "d": | |
| 426 drun += 1 | |
| 427 tri = dcur + (dr - 1) * irun # new triangles at this d | |
| 428 else: # cs[i]="i": | |
| 429 if prevsym == "d": # new string of i's | |
| 430 dcur += (dr - 1) * irun # accumulate shared shortest paths | |
| 431 irun = 0 # reset i run counter | |
| 432 dr -= drun # reduce number of d's to right | |
| 433 drun = 0 # reset d run counter | |
| 434 irun += 1 | |
| 435 tri = dr * (dr - 1) // 2 # new triangles at this i | |
| 436 seq.append(tri) | |
| 437 prevsym = sym | |
| 438 return seq | |
| 439 | |
| 440 | |
| 441 def cluster_sequence(creation_sequence): | |
| 442 """ | |
| 443 Return cluster sequence for the given threshold graph creation sequence. | |
| 444 """ | |
| 445 triseq = triangle_sequence(creation_sequence) | |
| 446 degseq = degree_sequence(creation_sequence) | |
| 447 cseq = [] | |
| 448 for i, deg in enumerate(degseq): | |
| 449 tri = triseq[i] | |
| 450 if deg <= 1: # isolated vertex or single pair gets cc 0 | |
| 451 cseq.append(0) | |
| 452 continue | |
| 453 max_size = (deg * (deg - 1)) // 2 | |
| 454 cseq.append(float(tri) / float(max_size)) | |
| 455 return cseq | |
| 456 | |
| 457 | |
| 458 def degree_sequence(creation_sequence): | |
| 459 """ | |
| 460 Return degree sequence for the threshold graph with the given | |
| 461 creation sequence | |
| 462 """ | |
| 463 cs = creation_sequence # alias | |
| 464 seq = [] | |
| 465 rd = cs.count("d") # number of d to the right | |
| 466 for i, sym in enumerate(cs): | |
| 467 if sym == "d": | |
| 468 rd -= 1 | |
| 469 seq.append(rd + i) | |
| 470 else: | |
| 471 seq.append(rd) | |
| 472 return seq | |
| 473 | |
| 474 | |
| 475 def density(creation_sequence): | |
| 476 """ | |
| 477 Return the density of the graph with this creation_sequence. | |
| 478 The density is the fraction of possible edges present. | |
| 479 """ | |
| 480 N = len(creation_sequence) | |
| 481 two_size = sum(degree_sequence(creation_sequence)) | |
| 482 two_possible = N * (N - 1) | |
| 483 den = two_size / float(two_possible) | |
| 484 return den | |
| 485 | |
| 486 | |
| 487 def degree_correlation(creation_sequence): | |
| 488 """ | |
| 489 Return the degree-degree correlation over all edges. | |
| 490 """ | |
| 491 cs = creation_sequence | |
| 492 s1 = 0 # deg_i*deg_j | |
| 493 s2 = 0 # deg_i^2+deg_j^2 | |
| 494 s3 = 0 # deg_i+deg_j | |
| 495 m = 0 # number of edges | |
| 496 rd = cs.count("d") # number of d nodes to the right | |
| 497 rdi = [i for i, sym in enumerate(cs) if sym == "d"] # index of "d"s | |
| 498 ds = degree_sequence(cs) | |
| 499 for i, sym in enumerate(cs): | |
| 500 if sym == "d": | |
| 501 if i != rdi[0]: | |
| 502 print("Logic error in degree_correlation", i, rdi) | |
| 503 raise ValueError | |
| 504 rdi.pop(0) | |
| 505 degi = ds[i] | |
| 506 for dj in rdi: | |
| 507 degj = ds[dj] | |
| 508 s1 += degj * degi | |
| 509 s2 += degi**2 + degj**2 | |
| 510 s3 += degi + degj | |
| 511 m += 1 | |
| 512 denom = (2 * m * s2 - s3 * s3) | |
| 513 numer = (4 * m * s1 - s3 * s3) | |
| 514 if denom == 0: | |
| 515 if numer == 0: | |
| 516 return 1 | |
| 517 raise ValueError("Zero Denominator but Numerator is %s" % numer) | |
| 518 return numer / float(denom) | |
| 519 | |
| 520 | |
| 521 def shortest_path(creation_sequence, u, v): | |
| 522 """ | |
| 523 Find the shortest path between u and v in a | |
| 524 threshold graph G with the given creation_sequence. | |
| 525 | |
| 526 For an unlabeled creation_sequence, the vertices | |
| 527 u and v must be integers in (0,len(sequence)) referring | |
| 528 to the position of the desired vertices in the sequence. | |
| 529 | |
| 530 For a labeled creation_sequence, u and v are labels of veritices. | |
| 531 | |
| 532 Use cs=creation_sequence(degree_sequence,with_labels=True) | |
| 533 to convert a degree sequence to a creation sequence. | |
| 534 | |
| 535 Returns a list of vertices from u to v. | |
| 536 Example: if they are neighbors, it returns [u,v] | |
| 537 """ | |
| 538 # Turn input sequence into a labeled creation sequence | |
| 539 first = creation_sequence[0] | |
| 540 if isinstance(first, str): # creation sequence | |
| 541 cs = [(i, creation_sequence[i]) for i in range(len(creation_sequence))] | |
| 542 elif isinstance(first, tuple): # labeled creation sequence | |
| 543 cs = creation_sequence[:] | |
| 544 elif isinstance(first, int): # compact creation sequence | |
| 545 ci = uncompact(creation_sequence) | |
| 546 cs = [(i, ci[i]) for i in range(len(ci))] | |
| 547 else: | |
| 548 raise TypeError("Not a valid creation sequence type") | |
| 549 | |
| 550 verts = [s[0] for s in cs] | |
| 551 if v not in verts: | |
| 552 raise ValueError("Vertex %s not in graph from creation_sequence" % v) | |
| 553 if u not in verts: | |
| 554 raise ValueError("Vertex %s not in graph from creation_sequence" % u) | |
| 555 # Done checking | |
| 556 if u == v: | |
| 557 return [u] | |
| 558 | |
| 559 uindex = verts.index(u) | |
| 560 vindex = verts.index(v) | |
| 561 bigind = max(uindex, vindex) | |
| 562 if cs[bigind][1] == 'd': | |
| 563 return [u, v] | |
| 564 # must be that cs[bigind][1]=='i' | |
| 565 cs = cs[bigind:] | |
| 566 while cs: | |
| 567 vert = cs.pop() | |
| 568 if vert[1] == 'd': | |
| 569 return [u, vert[0], v] | |
| 570 # All after u are type 'i' so no connection | |
| 571 return -1 | |
| 572 | |
| 573 | |
| 574 def shortest_path_length(creation_sequence, i): | |
| 575 """ | |
| 576 Return the shortest path length from indicated node to | |
| 577 every other node for the threshold graph with the given | |
| 578 creation sequence. | |
| 579 Node is indicated by index i in creation_sequence unless | |
| 580 creation_sequence is labeled in which case, i is taken to | |
| 581 be the label of the node. | |
| 582 | |
| 583 Paths lengths in threshold graphs are at most 2. | |
| 584 Length to unreachable nodes is set to -1. | |
| 585 """ | |
| 586 # Turn input sequence into a labeled creation sequence | |
| 587 first = creation_sequence[0] | |
| 588 if isinstance(first, str): # creation sequence | |
| 589 if isinstance(creation_sequence, list): | |
| 590 cs = creation_sequence[:] | |
| 591 else: | |
| 592 cs = list(creation_sequence) | |
| 593 elif isinstance(first, tuple): # labeled creation sequence | |
| 594 cs = [v[1] for v in creation_sequence] | |
| 595 i = [v[0] for v in creation_sequence].index(i) | |
| 596 elif isinstance(first, int): # compact creation sequence | |
| 597 cs = uncompact(creation_sequence) | |
| 598 else: | |
| 599 raise TypeError("Not a valid creation sequence type") | |
| 600 | |
| 601 # Compute | |
| 602 N = len(cs) | |
| 603 spl = [2] * N # length 2 to every node | |
| 604 spl[i] = 0 # except self which is 0 | |
| 605 # 1 for all d's to the right | |
| 606 for j in range(i + 1, N): | |
| 607 if cs[j] == "d": | |
| 608 spl[j] = 1 | |
| 609 if cs[i] == 'd': # 1 for all nodes to the left | |
| 610 for j in range(i): | |
| 611 spl[j] = 1 | |
| 612 # and -1 for any trailing i to indicate unreachable | |
| 613 for j in range(N - 1, 0, -1): | |
| 614 if cs[j] == "d": | |
| 615 break | |
| 616 spl[j] = -1 | |
| 617 return spl | |
| 618 | |
| 619 | |
| 620 def betweenness_sequence(creation_sequence, normalized=True): | |
| 621 """ | |
| 622 Return betweenness for the threshold graph with the given creation | |
| 623 sequence. The result is unscaled. To scale the values | |
| 624 to the iterval [0,1] divide by (n-1)*(n-2). | |
| 625 """ | |
| 626 cs = creation_sequence | |
| 627 seq = [] # betweenness | |
| 628 lastchar = 'd' # first node is always a 'd' | |
| 629 dr = float(cs.count("d")) # number of d's to the right of curren pos | |
| 630 irun = 0 # number of i's in the last run | |
| 631 drun = 0 # number of d's in the last run | |
| 632 dlast = 0.0 # betweenness of last d | |
| 633 for i, c in enumerate(cs): | |
| 634 if c == 'd': # cs[i]=="d": | |
| 635 # betweennees = amt shared with eariler d's and i's | |
| 636 # + new isolated nodes covered | |
| 637 # + new paths to all previous nodes | |
| 638 b = dlast + (irun - 1) * irun / dr + 2 * irun * (i - drun - irun) / dr | |
| 639 drun += 1 # update counter | |
| 640 else: # cs[i]="i": | |
| 641 if lastchar == 'd': # if this is a new run of i's | |
| 642 dlast = b # accumulate betweenness | |
| 643 dr -= drun # update number of d's to the right | |
| 644 drun = 0 # reset d counter | |
| 645 irun = 0 # reset i counter | |
| 646 b = 0 # isolated nodes have zero betweenness | |
| 647 irun += 1 # add another i to the run | |
| 648 seq.append(float(b)) | |
| 649 lastchar = c | |
| 650 | |
| 651 # normalize by the number of possible shortest paths | |
| 652 if normalized: | |
| 653 order = len(cs) | |
| 654 scale = 1.0 / ((order - 1) * (order - 2)) | |
| 655 seq = [s * scale for s in seq] | |
| 656 | |
| 657 return seq | |
| 658 | |
| 659 | |
| 660 def eigenvectors(creation_sequence): | |
| 661 """ | |
| 662 Return a 2-tuple of Laplacian eigenvalues and eigenvectors | |
| 663 for the threshold network with creation_sequence. | |
| 664 The first value is a list of eigenvalues. | |
| 665 The second value is a list of eigenvectors. | |
| 666 The lists are in the same order so corresponding eigenvectors | |
| 667 and eigenvalues are in the same position in the two lists. | |
| 668 | |
| 669 Notice that the order of the eigenvalues returned by eigenvalues(cs) | |
| 670 may not correspond to the order of these eigenvectors. | |
| 671 """ | |
| 672 ccs = make_compact(creation_sequence) | |
| 673 N = sum(ccs) | |
| 674 vec = [0] * N | |
| 675 val = vec[:] | |
| 676 # get number of type d nodes to the right (all for first node) | |
| 677 dr = sum(ccs[::2]) | |
| 678 | |
| 679 nn = ccs[0] | |
| 680 vec[0] = [1. / sqrt(N)] * N | |
| 681 val[0] = 0 | |
| 682 e = dr | |
| 683 dr -= nn | |
| 684 type_d = True | |
| 685 i = 1 | |
| 686 dd = 1 | |
| 687 while dd < nn: | |
| 688 scale = 1. / sqrt(dd * dd + i) | |
| 689 vec[i] = i * [-scale] + [dd * scale] + [0] * (N - i - 1) | |
| 690 val[i] = e | |
| 691 i += 1 | |
| 692 dd += 1 | |
| 693 if len(ccs) == 1: | |
| 694 return (val, vec) | |
| 695 for nn in ccs[1:]: | |
| 696 scale = 1. / sqrt(nn * i * (i + nn)) | |
| 697 vec[i] = i * [-nn * scale] + nn * [i * scale] + [0] * (N - i - nn) | |
| 698 # find eigenvalue | |
| 699 type_d = not type_d | |
| 700 if type_d: | |
| 701 e = i + dr | |
| 702 dr -= nn | |
| 703 else: | |
| 704 e = dr | |
| 705 val[i] = e | |
| 706 st = i | |
| 707 i += 1 | |
| 708 dd = 1 | |
| 709 while dd < nn: | |
| 710 scale = 1. / sqrt(i - st + dd * dd) | |
| 711 vec[i] = [0] * st + (i - st) * [-scale] + [dd * scale] + [0] * (N - i - 1) | |
| 712 val[i] = e | |
| 713 i += 1 | |
| 714 dd += 1 | |
| 715 return (val, vec) | |
| 716 | |
| 717 | |
| 718 def spectral_projection(u, eigenpairs): | |
| 719 """ | |
| 720 Returns the coefficients of each eigenvector | |
| 721 in a projection of the vector u onto the normalized | |
| 722 eigenvectors which are contained in eigenpairs. | |
| 723 | |
| 724 eigenpairs should be a list of two objects. The | |
| 725 first is a list of eigenvalues and the second a list | |
| 726 of eigenvectors. The eigenvectors should be lists. | |
| 727 | |
| 728 There's not a lot of error checking on lengths of | |
| 729 arrays, etc. so be careful. | |
| 730 """ | |
| 731 coeff = [] | |
| 732 evect = eigenpairs[1] | |
| 733 for ev in evect: | |
| 734 c = sum([evv * uv for (evv, uv) in zip(ev, u)]) | |
| 735 coeff.append(c) | |
| 736 return coeff | |
| 737 | |
| 738 | |
| 739 def eigenvalues(creation_sequence): | |
| 740 """ | |
| 741 Return sequence of eigenvalues of the Laplacian of the threshold | |
| 742 graph for the given creation_sequence. | |
| 743 | |
| 744 Based on the Ferrer's diagram method. The spectrum is integral | |
| 745 and is the conjugate of the degree sequence. | |
| 746 | |
| 747 See:: | |
| 748 | |
| 749 @Article{degree-merris-1994, | |
| 750 author = {Russel Merris}, | |
| 751 title = {Degree maximal graphs are Laplacian integral}, | |
| 752 journal = {Linear Algebra Appl.}, | |
| 753 year = {1994}, | |
| 754 volume = {199}, | |
| 755 pages = {381--389}, | |
| 756 } | |
| 757 | |
| 758 """ | |
| 759 degseq = degree_sequence(creation_sequence) | |
| 760 degseq.sort() | |
| 761 eiglist = [] # zero is always one eigenvalue | |
| 762 eig = 0 | |
| 763 row = len(degseq) | |
| 764 bigdeg = degseq.pop() | |
| 765 while row: | |
| 766 if bigdeg < row: | |
| 767 eiglist.append(eig) | |
| 768 row -= 1 | |
| 769 else: | |
| 770 eig += 1 | |
| 771 if degseq: | |
| 772 bigdeg = degseq.pop() | |
| 773 else: | |
| 774 bigdeg = 0 | |
| 775 return eiglist | |
| 776 | |
| 777 | |
| 778 # Threshold graph creation routines | |
| 779 | |
| 780 @py_random_state(2) | |
| 781 def random_threshold_sequence(n, p, seed=None): | |
| 782 """ | |
| 783 Create a random threshold sequence of size n. | |
| 784 A creation sequence is built by randomly choosing d's with | |
| 785 probabiliy p and i's with probability 1-p. | |
| 786 | |
| 787 s=nx.random_threshold_sequence(10,0.5) | |
| 788 | |
| 789 returns a threshold sequence of length 10 with equal | |
| 790 probably of an i or a d at each position. | |
| 791 | |
| 792 A "random" threshold graph can be built with | |
| 793 | |
| 794 G=nx.threshold_graph(s) | |
| 795 | |
| 796 seed : integer, random_state, or None (default) | |
| 797 Indicator of random number generation state. | |
| 798 See :ref:`Randomness<randomness>`. | |
| 799 """ | |
| 800 if not (0 <= p <= 1): | |
| 801 raise ValueError("p must be in [0,1]") | |
| 802 | |
| 803 cs = ['d'] # threshold sequences always start with a d | |
| 804 for i in range(1, n): | |
| 805 if seed.random() < p: | |
| 806 cs.append('d') | |
| 807 else: | |
| 808 cs.append('i') | |
| 809 return cs | |
| 810 | |
| 811 | |
| 812 # maybe *_d_threshold_sequence routines should | |
| 813 # be (or be called from) a single routine with a more descriptive name | |
| 814 # and a keyword parameter? | |
| 815 def right_d_threshold_sequence(n, m): | |
| 816 """ | |
| 817 Create a skewed threshold graph with a given number | |
| 818 of vertices (n) and a given number of edges (m). | |
| 819 | |
| 820 The routine returns an unlabeled creation sequence | |
| 821 for the threshold graph. | |
| 822 | |
| 823 FIXME: describe algorithm | |
| 824 | |
| 825 """ | |
| 826 cs = ['d'] + ['i'] * (n - 1) # create sequence with n insolated nodes | |
| 827 | |
| 828 # m <n : not enough edges, make disconnected | |
| 829 if m < n: | |
| 830 cs[m] = 'd' | |
| 831 return cs | |
| 832 | |
| 833 # too many edges | |
| 834 if m > n * (n - 1) / 2: | |
| 835 raise ValueError("Too many edges for this many nodes.") | |
| 836 | |
| 837 # connected case m >n-1 | |
| 838 ind = n - 1 | |
| 839 sum = n - 1 | |
| 840 while sum < m: | |
| 841 cs[ind] = 'd' | |
| 842 ind -= 1 | |
| 843 sum += ind | |
| 844 ind = m - (sum - ind) | |
| 845 cs[ind] = 'd' | |
| 846 return cs | |
| 847 | |
| 848 | |
| 849 def left_d_threshold_sequence(n, m): | |
| 850 """ | |
| 851 Create a skewed threshold graph with a given number | |
| 852 of vertices (n) and a given number of edges (m). | |
| 853 | |
| 854 The routine returns an unlabeled creation sequence | |
| 855 for the threshold graph. | |
| 856 | |
| 857 FIXME: describe algorithm | |
| 858 | |
| 859 """ | |
| 860 cs = ['d'] + ['i'] * (n - 1) # create sequence with n insolated nodes | |
| 861 | |
| 862 # m <n : not enough edges, make disconnected | |
| 863 if m < n: | |
| 864 cs[m] = 'd' | |
| 865 return cs | |
| 866 | |
| 867 # too many edges | |
| 868 if m > n * (n - 1) / 2: | |
| 869 raise ValueError("Too many edges for this many nodes.") | |
| 870 | |
| 871 # Connected case when M>N-1 | |
| 872 cs[n - 1] = 'd' | |
| 873 sum = n - 1 | |
| 874 ind = 1 | |
| 875 while sum < m: | |
| 876 cs[ind] = 'd' | |
| 877 sum += ind | |
| 878 ind += 1 | |
| 879 if sum > m: # be sure not to change the first vertex | |
| 880 cs[sum - m] = 'i' | |
| 881 return cs | |
| 882 | |
| 883 | |
| 884 @py_random_state(3) | |
| 885 def swap_d(cs, p_split=1.0, p_combine=1.0, seed=None): | |
| 886 """ | |
| 887 Perform a "swap" operation on a threshold sequence. | |
| 888 | |
| 889 The swap preserves the number of nodes and edges | |
| 890 in the graph for the given sequence. | |
| 891 The resulting sequence is still a threshold sequence. | |
| 892 | |
| 893 Perform one split and one combine operation on the | |
| 894 'd's of a creation sequence for a threshold graph. | |
| 895 This operation maintains the number of nodes and edges | |
| 896 in the graph, but shifts the edges from node to node | |
| 897 maintaining the threshold quality of the graph. | |
| 898 | |
| 899 seed : integer, random_state, or None (default) | |
| 900 Indicator of random number generation state. | |
| 901 See :ref:`Randomness<randomness>`. | |
| 902 """ | |
| 903 # preprocess the creation sequence | |
| 904 dlist = [i for (i, node_type) in enumerate(cs[1:-1]) if node_type == 'd'] | |
| 905 # split | |
| 906 if seed.random() < p_split: | |
| 907 choice = seed.choice(dlist) | |
| 908 split_to = seed.choice(range(choice)) | |
| 909 flip_side = choice - split_to | |
| 910 if split_to != flip_side and cs[split_to] == 'i' and cs[flip_side] == 'i': | |
| 911 cs[choice] = 'i' | |
| 912 cs[split_to] = 'd' | |
| 913 cs[flip_side] = 'd' | |
| 914 dlist.remove(choice) | |
| 915 # don't add or combine may reverse this action | |
| 916 # dlist.extend([split_to,flip_side]) | |
| 917 # print >>sys.stderr,"split at %s to %s and %s"%(choice,split_to,flip_side) | |
| 918 # combine | |
| 919 if seed.random() < p_combine and dlist: | |
| 920 first_choice = seed.choice(dlist) | |
| 921 second_choice = seed.choice(dlist) | |
| 922 target = first_choice + second_choice | |
| 923 if target >= len(cs) or cs[target] == 'd' or first_choice == second_choice: | |
| 924 return cs | |
| 925 # OK to combine | |
| 926 cs[first_choice] = 'i' | |
| 927 cs[second_choice] = 'i' | |
| 928 cs[target] = 'd' | |
| 929 # print >>sys.stderr,"combine %s and %s to make %s."%(first_choice,second_choice,target) | |
| 930 | |
| 931 return cs |
