diff options
author | KatolaZ <katolaz@yahoo.it> | 2015-10-19 16:23:00 +0100 |
---|---|---|
committer | KatolaZ <katolaz@yahoo.it> | 2015-10-19 16:23:00 +0100 |
commit | df8386f75b0538075d72d52693836bb8878f505b (patch) | |
tree | 704c2a0836f8b9fd9f470c12b6ae05637c431468 /structure/correlations/rank_nodes_thresh.py | |
parent | 363274e79eade464247089c105260bc34940da07 (diff) |
First commit of MAMMULT code
Diffstat (limited to 'structure/correlations/rank_nodes_thresh.py')
-rw-r--r-- | structure/correlations/rank_nodes_thresh.py | 87 |
1 files changed, 87 insertions, 0 deletions
diff --git a/structure/correlations/rank_nodes_thresh.py b/structure/correlations/rank_nodes_thresh.py new file mode 100644 index 0000000..44b565a --- /dev/null +++ b/structure/correlations/rank_nodes_thresh.py @@ -0,0 +1,87 @@ +#### +## +## +## Get a file as input, whose n-th line corresponds to the value of a +## certain property of node n, and rank nodes according to their +## properties, taking into account ranking ties properly. +## +## The output is a file whose n-th line is the "ranking" of the n-th +## node according to the given property. (notice that rankings could +## be fractional, due to the tie removal algorithm) +## +## The rank of a node is set to "0" (ZERO) if the corresponding +## property is smaller than a value given as second parameter +## + + +import sys +import math + + +if len(sys.argv) < 3: + print "Usage: %s <filein> <thresh>" % sys.argv[0] + sys.exit(1) + + +thresh = float(sys.argv[2]) + +lines = open(sys.argv[1], "r").readlines() + +ranking = [] + +n=0 +for l in lines: + if l[0] == "#" or l.strip(" \n").split(" ") == []: + continue + v = [float(x) if "." in x or "e" in x else int(x) for x in l.strip(" \n").split(" ")][0] + if v >= thresh: + ranking.append((v,n)) + else: + ranking.append((0,n)) + n +=1 + +ranking.sort(reverse=True) +#print ranking +new_ranking = {} + +v0, n0 = ranking[0] + + +old_value = v0 +tot_rankings = 1 + +stack = [n0] +l=1.0 +for v,n in ranking[1:]: + l += 1 + ##print stack, tot_rankings + if v != old_value: ### There is a new rank + # We first compute the rank for all the nodes in the stack and then we set it + if old_value == 0: + new_rank_value = 0 + else: + new_rank_value = 1.0 * tot_rankings / len(stack) + ##print new_rank_value + for j in stack: + new_ranking[j] = new_rank_value + old_value = v + tot_rankings = l + stack = [n] + else: # One more value with the same rank, keep it for the future + stack.append(n) + tot_rankings += l + +if v == 0 : + new_rank_value = 0 +else: + new_rank_value = 1.0 * tot_rankings / len(stack) +#print new_rank_value +for j in stack: + new_ranking[j] = new_rank_value + +#print new_ranking + +keys = new_ranking.keys() +keys.sort() +for k in keys: + print new_ranking[k] |