nitaku · December 31, 2015 08:39
diff --git a/README.md b/README.md
diff --git a/generate_random_tree.py b/generate_random_tree.py
 from __future__ import print_function
 from random import random, randint

 # Running count of leaf records appended so far: rand_tree increments it and
 # echoes it as a progress indicator, and generate resets it before each run.
 leaf_count = 0

 def rand_tree(prefixes, d, MAX_D, MAX_N, index, prefix):
    """Recursively grow a random tree, appending one tuple to `prefixes` per leaf.

    A node makes between 1 and MAX_N attempts (chosen with randint). Each
    attempt either spawns a child subtree, with probability
    p = (MAX_D - d) / MAX_D, or records a leaf. p falls linearly with the
    depth d and reaches zero at d == MAX_D.

    Parameters:
        prefixes: list that receives the leaf records (mutated in place).
        d:        depth of the current node.
        MAX_D:    depth at which a node is always recorded as a single leaf.
        MAX_N:    upper bound (inclusive) on the attempts made per node.
        index:    index of the current node; it is appended to `prefix` to
                  form the prefix handed to every child.
        prefix:   tuple received from the parent call. Leaves are recorded as
                  `prefix[1:]`, i.e. without its first element and without
                  this node's own `index`.

    Side effects: increments the module-level `leaf_count` once per recorded
    leaf and prints it followed by a carriage return as a progress indicator.
    """
    global leaf_count

    # Depth limit reached: record this node as one leaf and stop. The early
    # return is what actually bounds the recursion; without it the node would
    # fall through into the loop below and emit extra leaves (or even recurse
    # past MAX_D if random() returned exactly 0.0). Using >= also covers
    # MAX_D <= 0, which would otherwise divide by zero or never terminate.
    if d >= MAX_D:
        prefixes.append(prefix[1:])
        leaf_count += 1
        print(leaf_count, end='\r')
        return

    p = float(MAX_D - d) / MAX_D

    # at least one attempt is made for every internal node
    n = randint(1, MAX_N)

    # children are numbered 1, 2, ... in creation order; leaves do not consume a number
    child_i = 0

    # range (not xrange) so the function runs on both Python 2 and Python 3
    for _ in range(n):
        if p >= random():
            child_i += 1
            rand_tree(prefixes, d + 1, MAX_D, MAX_N, child_i, prefix + (index,))
        else:
            prefixes.append(prefix[1:])
            leaf_count += 1
            print(leaf_count, end='\r')
            
 def generate(filename, max_d, max_n):
    """Generate a random tree and dump its leaf records to `filename`.

    The module-level `leaf_count` is reset, rand_tree is run from depth 1
    with root index 0 and an empty prefix, and the collected tuples are
    written in sorted order, one per line, using their str() form.

    Parameters:
        filename: path of the output file (opened for writing, so an
                  existing file is overwritten).
        max_d:    forwarded to rand_tree as MAX_D.
        max_n:    forwarded to rand_tree as MAX_N.
    """
    global leaf_count

    # restart the progress counter for this run
    leaf_count = 0

    collected = []
    rand_tree(collected, 1, max_d, max_n, 0, ())

    ordered = sorted(collected)

    # one tuple per line, exactly as print() would render it
    with open(filename, 'w') as output:
        output.writelines(str(entry) + '\n' for entry in ordered)
            
diff --git a/thumbnail.png b/thumbnail.png
diff --git a/tree(85).csv b/tree(85).csv
 ()
 ()
 ()
 ()
 ()
 ()
 ()
 (1, 1)
 (1, 1)
 (1, 1)
 (1, 1, 2)
 (1, 1, 2)
 (1, 1, 2)
 (1, 1, 2)
 (1, 1, 2)
 (1, 1, 2)
 (1, 1, 2)
 (1, 1, 2)
 (1, 1, 2)
 (1, 1, 2)
 (1, 1, 2)
 (1, 1, 2)
 (2,)
 (2,)
 (2,)
 (2,)
 (2,)
 (2,)
 (2,)
 (2,)
 (2,)
 (2,)
 (2,)
 (2,)
 (2,)
 (2,)
 (2,)
 (2, 1)
 (2, 1)
 (2, 1)
 (2, 1)
 (2, 1)
 (2, 1)
 (2, 1)
 (2, 1)
 (2, 1)
 (2, 1)
 (2, 1)
 (2, 1)
 (2, 1)
 (2, 1, 2)
 (2, 1, 2)
 (2, 1, 2)
 (2, 2)
 (2, 2)
 (2, 2)
 (2, 2)
 (2, 2)
 (2, 2)
 (2, 2)
 (2, 2)
 (2, 2)
 (2, 2)
 (2, 2)
 (2, 3)
 (2, 3)
 (2, 3)
 (2, 3)
 (2, 3)
 (2, 3)
 (2, 3)
 (2, 3)
 (2, 3)
 (2, 4)
 (2, 4)
 (3,)
 (3, 1)
 (3, 1)
 (3, 2)
 (3, 2)
 (3, 2)
 (3, 2)
 (3, 2)
 (3, 2)
 (3, 2)
	from __future__ import print_function
	from random import random, randint

	# Running count of leaf records appended so far: rand_tree increments it and
	# echoes it as a progress indicator, and generate resets it before each run.
	leaf_count = 0

	def rand_tree(prefixes, d, MAX_D, MAX_N, index, prefix):
	    """Recursively grow a random tree, appending one tuple to `prefixes` per leaf.

	    A node makes between 1 and MAX_N attempts (chosen with randint). Each
	    attempt either spawns a child subtree, with probability
	    p = (MAX_D - d) / MAX_D, or records a leaf. p falls linearly with the
	    depth d and reaches zero at d == MAX_D.

	    Parameters:
	        prefixes: list that receives the leaf records (mutated in place).
	        d:        depth of the current node.
	        MAX_D:    depth at which a node is always recorded as a single leaf.
	        MAX_N:    upper bound (inclusive) on the attempts made per node.
	        index:    index of the current node; it is appended to `prefix` to
	                  form the prefix handed to every child.
	        prefix:   tuple received from the parent call. Leaves are recorded as
	                  `prefix[1:]`, i.e. without its first element and without
	                  this node's own `index`.

	    Side effects: increments the module-level `leaf_count` once per recorded
	    leaf and prints it followed by a carriage return as a progress indicator.
	    """
	    global leaf_count

	    # Depth limit reached: record this node as one leaf and stop. The early
	    # return is what actually bounds the recursion; without it the node would
	    # fall through into the loop below and emit extra leaves (or even recurse
	    # past MAX_D if random() returned exactly 0.0). Using >= also covers
	    # MAX_D <= 0, which would otherwise divide by zero or never terminate.
	    if d >= MAX_D:
	        prefixes.append(prefix[1:])
	        leaf_count += 1
	        print(leaf_count, end='\r')
	        return

	    p = float(MAX_D - d) / MAX_D

	    # at least one attempt is made for every internal node
	    n = randint(1, MAX_N)

	    # children are numbered 1, 2, ... in creation order; leaves do not consume a number
	    child_i = 0

	    # range (not xrange) so the function runs on both Python 2 and Python 3
	    for _ in range(n):
	        if p >= random():
	            child_i += 1
	            rand_tree(prefixes, d + 1, MAX_D, MAX_N, child_i, prefix + (index,))
	        else:
	            prefixes.append(prefix[1:])
	            leaf_count += 1
	            print(leaf_count, end='\r')

	def generate(filename, max_d, max_n):
	    """Generate a random tree and dump its leaf records to `filename`.

	    The module-level `leaf_count` is reset, rand_tree is run from depth 1
	    with root index 0 and an empty prefix, and the collected tuples are
	    sorted and written one per line.

	    Parameters:
	        filename: path of the output file (opened for writing, so an
	                  existing file is overwritten).
	        max_d:    forwarded to rand_tree as MAX_D.
	        max_n:    forwarded to rand_tree as MAX_N.
	    """
	    global leaf_count

	    # restart the progress counter for this run
	    leaf_count = 0

	    prefixes = []

	    rand_tree(prefixes, 1, max_d, max_n, 0, ())
	    prefixes.sort()

	    # write prefix tuples to the output file
	    with open(filename, 'w') as output:
	        for prefix in prefixes:
	            print(prefix, file=output)
	()
	()
	()
	()
	()
	()
	()
	(1, 1)
	(1, 1)
	(1, 1)
	(1, 1, 2)
	(1, 1, 2)
	(1, 1, 2)
	(1, 1, 2)
	(1, 1, 2)
	(1, 1, 2)
	(1, 1, 2)
	(1, 1, 2)
	(1, 1, 2)
	(1, 1, 2)
	(1, 1, 2)
	(1, 1, 2)
	(2,)
	(2,)
	(2,)
	(2,)
	(2,)
	(2,)
	(2,)
	(2,)
	(2,)
	(2,)
	(2,)
	(2,)
	(2,)
	(2,)
	(2,)
	(2, 1)
	(2, 1)
	(2, 1)
	(2, 1)
	(2, 1)
	(2, 1)
	(2, 1)
	(2, 1)
	(2, 1)
	(2, 1)
	(2, 1)
	(2, 1)
	(2, 1)
	(2, 1, 2)
	(2, 1, 2)
	(2, 1, 2)
	(2, 2)
	(2, 2)
	(2, 2)
	(2, 2)
	(2, 2)
	(2, 2)
	(2, 2)
	(2, 2)
	(2, 2)
	(2, 2)
	(2, 2)
	(2, 3)
	(2, 3)
	(2, 3)
	(2, 3)
	(2, 3)
	(2, 3)
	(2, 3)
	(2, 3)
	(2, 3)
	(2, 4)
	(2, 4)
	(3,)
	(3, 1)
	(3, 1)
	(3, 2)
	(3, 2)
	(3, 2)
	(3, 2)
	(3, 2)
	(3, 2)
	(3, 2)