default answer for every share

refactor hypothesis to be 'pytest style' and add another one

get rid of 'shares->set(1 thing)' in generate_mappings return

Add a unittest hypothesis came up with

fix tests since we return peers, not sets-of-1-peer

add more debug

add a unit-test that's like test_problem_layout_ticket_1128

fix bug

add a note

fix utest

unit-test for bigger numbers

re-insert markberger code for testing

results of pairing with david
This commit is contained in:
meejah 2017-01-26 12:14:56 -07:00
parent e68b331bb1
commit b6d9945b95
5 changed files with 613 additions and 51 deletions

View File

@ -120,6 +120,8 @@ We calculate share placement like so:
shares, where an edge exists between an arbitrary readonly server S and an shares, where an edge exists between an arbitrary readonly server S and an
arbitrary share T if and only if S currently holds T. arbitrary share T if and only if S currently holds T.
^--- all passed in to the Happiness_Upload ctor
3. Calculate a maximum matching graph of G1 (a set of S->T edges that has or 3. Calculate a maximum matching graph of G1 (a set of S->T edges that has or
is-tied-for the highest "happiness score"). There is a clever efficient is-tied-for the highest "happiness score"). There is a clever efficient
algorithm for this, named "Ford-Fulkerson". There may be more than one algorithm for this, named "Ford-Fulkerson". There may be more than one
@ -128,6 +130,8 @@ We calculate share placement like so:
maps shares to servers, where each share appears at most once, and each maps shares to servers, where each share appears at most once, and each
server appears at most once. server appears at most once.
^-- is this the "readonly_mappings"
4. Construct a bipartite graph G2 of readwrite servers to pre-existing 4. Construct a bipartite graph G2 of readwrite servers to pre-existing
shares. Then remove any edge (from G2) that uses a server or a share found shares. Then remove any edge (from G2) that uses a server or a share found
in M1. Let an edge exist between server S and share T if and only if S in M1. Let an edge exist between server S and share T if and only if S

View File

@ -6,17 +6,49 @@ from hypothesis.strategies import text, sets
from allmydata.immutable import happiness_upload from allmydata.immutable import happiness_upload
class Happiness(unittest.TestCase): @given(
sets(elements=text(min_size=1), min_size=4, max_size=4),
sets(elements=text(min_size=1), min_size=4),
)
def test_hypothesis_unhappy(peers, shares):
"""
similar to test_unhappy we test that the resulting happiness is always 4 since the size of peers is 4.
"""
# https://hypothesis.readthedocs.io/en/latest/data.html#hypothesis.strategies.sets
# hypothesis.strategies.sets(elements=None, min_size=None, average_size=None, max_size=None)[source]
readonly_peers = set()
peers_to_shares = {}
places = happiness_upload.share_placement(peers, readonly_peers, shares, peers_to_shares)
happiness = happiness_upload.calculate_happiness(places)
assert set(places.keys()) == shares
assert happiness == 4
@given(sets(elements=text(min_size=1), min_size=4, max_size=4), sets(elements=text(min_size=1), min_size=4))
def test_hypothesis_unhappy(self, peers, shares): @given(
""" sets(elements=text(min_size=1), min_size=1, max_size=10),
similar to test_unhappy we test that the resulting happiness is always 4 since the size of peers is 4. # can we make a readonly_peers that's a subset of ^
""" sets(elements=text(min_size=1), min_size=1, max_size=20),
# https://hypothesis.readthedocs.io/en/latest/data.html#hypothesis.strategies.sets )
# hypothesis.strategies.sets(elements=None, min_size=None, average_size=None, max_size=None)[source] def test_more_hypothesis(peers, shares):
readonly_peers = set() """
peers_to_shares = {} similar to test_unhappy we test that the resulting happiness is always 4 since the size of peers is 4.
places = happiness_upload.share_placement(peers, readonly_peers, shares, peers_to_shares) """
happiness = happiness_upload.calculate_happiness(places) # https://hypothesis.readthedocs.io/en/latest/data.html#hypothesis.strategies.sets
self.assertEqual(4, happiness) # hypothesis.strategies.sets(elements=None, min_size=None, average_size=None, max_size=None)[source]
# XXX would be nice to paramaterize these by hypothesis too
readonly_peers = set()
peers_to_shares = {}
places = happiness_upload.share_placement(peers, readonly_peers, shares, peers_to_shares)
happiness = happiness_upload.calculate_happiness(places)
# every share should get placed
assert set(places.keys()) == shares
# we should only use peers that exist
assert set(places.values()).issubset(peers)
# if we have more shares than peers, happiness is at most # of
# peers; if we have fewer shares than peers happiness is capped at
# # of peers.
assert happiness == min(len(peers), len(shares))

View File

@ -108,8 +108,8 @@ def _compute_maximum_graph(graph, shareIndices):
flow_function = [[0 for sh in xrange(dim)] for s in xrange(dim)] flow_function = [[0 for sh in xrange(dim)] for s in xrange(dim)]
residual_graph, residual_function = residual_network(graph, flow_function) residual_graph, residual_function = residual_network(graph, flow_function)
while augmenting_path_for(residual_graph): path = augmenting_path_for(residual_graph)
path = augmenting_path_for(residual_graph) while path:
# Delta is the largest amount that we can increase flow across # Delta is the largest amount that we can increase flow across
# all of the edges in path. Because of the way that the residual # all of the edges in path. Because of the way that the residual
# function is constructed, f[u][v] for a particular edge (u, v) # function is constructed, f[u][v] for a particular edge (u, v)
@ -122,6 +122,8 @@ def _compute_maximum_graph(graph, shareIndices):
flow_function[u][v] += delta flow_function[u][v] += delta
flow_function[v][u] -= delta flow_function[v][u] -= delta
residual_graph, residual_function = residual_network(graph,flow_function) residual_graph, residual_function = residual_network(graph,flow_function)
path = augmenting_path_for(residual_graph)
print('loop', len(residual_graph))
new_mappings = {} new_mappings = {}
for shareIndex in shareIndices: for shareIndex in shareIndices:
@ -242,7 +244,14 @@ def _filter_g3(g3, m1, m2):
if len(sequence) == 0: if len(sequence) == 0:
return g3 return g3
m12_servers = reduce(lambda a, b: a.union(b), sequence) m12_servers = reduce(lambda a, b: a.union(b), sequence)
m12_shares = set(m1.keys() + m2.keys()) # m1 and m2 may contain edges like "peer -> None" but those
# shouldn't be considered "actual mappings" by this removal
# algorithm (i.e. an edge "peer0 -> None" means there's nothing
# placed on peer0)
m12_shares = set(
[k for k, v in m1.items() if v] +
[k for k, v in m2.items() if v]
)
new_g3 = set() new_g3 = set()
for edge in g3: for edge in g3:
if edge[0] not in m12_servers and edge[1] not in m12_shares: if edge[0] not in m12_servers and edge[1] not in m12_shares:
@ -270,7 +279,7 @@ def calculate_happiness(mappings):
""" """
I calculate the happiness of the generated mappings I calculate the happiness of the generated mappings
""" """
unique_peers = {list(v)[0] for k, v in mappings.items()} unique_peers = {v for k, v in mappings.items()}
return len(unique_peers) return len(unique_peers)
@ -278,6 +287,11 @@ def share_placement(peers, readonly_peers, shares, peers_to_shares={}):
""" """
:param servers: ordered list of servers, "Maybe *2N* of them." :param servers: ordered list of servers, "Maybe *2N* of them."
""" """
if False:
print("peers:", peers)
print("readonly:", readonly_peers)
print("shares:", shares)
print("peers_to_shares:", peers_to_shares)
# "2. Construct a bipartite graph G1 of *readonly* servers to pre-existing # "2. Construct a bipartite graph G1 of *readonly* servers to pre-existing
# shares, where an edge exists between an arbitrary readonly server S and an # shares, where an edge exists between an arbitrary readonly server S and an
# arbitrary share T if and only if S currently holds T." # arbitrary share T if and only if S currently holds T."
@ -296,6 +310,9 @@ def share_placement(peers, readonly_peers, shares, peers_to_shares={}):
# server appears at most once. # server appears at most once.
m1 = _maximum_matching_graph(g1, peers_to_shares) m1 = _maximum_matching_graph(g1, peers_to_shares)
if False: if False:
print("G1:")
for k, v in g1:
print(" {}: {}".format(k, v))
print("M1:") print("M1:")
for k, v in m1.items(): for k, v in m1.items():
print(" {}: {}".format(k, v)) print(" {}: {}".format(k, v))
@ -320,6 +337,9 @@ def share_placement(peers, readonly_peers, shares, peers_to_shares={}):
m2 = _maximum_matching_graph(g2, peers_to_shares) m2 = _maximum_matching_graph(g2, peers_to_shares)
if False: if False:
print("G2:")
for k, v in g2:
print(" {}: {}".format(k, v))
print("M2:") print("M2:")
for k, v in m2.items(): for k, v in m2.items():
print(" {}: {}".format(k, v)) print(" {}: {}".format(k, v))
@ -348,7 +368,13 @@ def share_placement(peers, readonly_peers, shares, peers_to_shares={}):
m3 = _maximum_matching_graph(g3, {})#, peers_to_shares) m3 = _maximum_matching_graph(g3, {})#, peers_to_shares)
answer = dict() answer = {
k: None for k in shares
}
if False:
print("m1", m1)
print("m2", m2)
print("m3", m3)
_merge_dicts(answer, m1) _merge_dicts(answer, m1)
_merge_dicts(answer, m2) _merge_dicts(answer, m2)
_merge_dicts(answer, m3) _merge_dicts(answer, m3)
@ -364,16 +390,390 @@ def share_placement(peers, readonly_peers, shares, peers_to_shares={}):
# this case the remaining shares are distributed as evenly as possible across the # this case the remaining shares are distributed as evenly as possible across the
# set of writable servers." # set of writable servers."
def peer_generator(): # if we have any readwrite servers at all, we can place any shares
while True: # that didn't get placed -- otherwise, we can't.
for peer in readwrite: if readwrite:
yield peer def peer_generator():
round_robin_peers = peer_generator() while True:
for k, v in answer.items(): for peer in readwrite:
if v is None: yield peer
answer[k] = {next(round_robin_peers)} round_robin_peers = peer_generator()
for k, v in answer.items():
if v is None:
answer[k] = {next(round_robin_peers)}
# XXX we should probably actually return share->peer instead of new_answer = dict()
# share->set(peer) where the set-size is 1 because sets are a pain for k, v in answer.items():
# to deal with (i.e. no indexing). new_answer[k] = list(v)[0] if v else None
return answer return new_answer
# putting mark-berger code back in to see if it's slow too
from Queue import PriorityQueue
from allmydata.util.happinessutil import augmenting_path_for, residual_network
class Happiness_Upload:
"""
I handle the calculations involved with generating the maximum
spanning graph for a file when given a set of peerids, shareids, and
a servermap of 'peerid' -> [shareids]. Mappings are returned in a
dictionary of 'shareid' -> 'peerid'
"""
def __init__(self, peerids, readonly_peers, shareids, servermap={}):
self.happy = 0
self.homeless_shares = set()
self.peerids = peerids
self.readonly_peers = readonly_peers
self.shareids = shareids
self.servermap = servermap
self.servermap_peerids = set([key for key in servermap])
self.servermap_shareids = set()
for key in servermap:
for share in servermap[key]:
self.servermap_shareids.add(share)
def happiness(self):
return self.happy
def generate_mappings(self):
"""
Generate a flow network of peerids to existing shareids and find
its maximum spanning graph. The leases of these shares should be renewed
by the client.
"""
# 2. Construct a bipartite graph G1 of *readonly* servers to pre-existing
# shares, where an edge exists between an arbitrary readonly server S and an
# arbitrary share T if and only if S currently holds T.
# First find the maximum spanning of the readonly servers.
readonly_peers = self.readonly_peers
readonly_shares = set()
readonly_map = {}
for peer in self.servermap:
if peer in self.readonly_peers:
readonly_map.setdefault(peer, self.servermap[peer])
for share in self.servermap[peer]:
readonly_shares.add(share)
peer_to_index = self._index_peers(readonly_peers, 1)
share_to_index, index_to_share = self._reindex_shares(readonly_shares,
len(readonly_peers) + 1)
# "graph" is G1
graph = self._servermap_flow_graph(readonly_peers, readonly_shares, readonly_map)
shareids = [share_to_index[s] for s in readonly_shares]
max_graph = self._compute_maximum_graph(graph, shareids)
# 3. Calculate a maximum matching graph of G1 (a set of S->T edges that has or
# is-tied-for the highest "happiness score"). There is a clever efficient
# algorithm for this, named "Ford-Fulkerson". There may be more than one
# maximum matching for this graph; we choose one of them arbitrarily, but
# prefer earlier servers. Call this particular placement M1. The placement
# maps shares to servers, where each share appears at most once, and each
# server appears at most once.
# "max_graph" is M1 and is a dict which maps shares -> peer
# (but "one" of the many arbitrary mappings that give us "max
# happiness" of the existing placed shares)
readonly_mappings = self._convert_mappings(peer_to_index,
index_to_share, max_graph)
used_peers, used_shares = self._extract_ids(readonly_mappings)
print("readonly mappings")
for k, v in readonly_mappings.items():
print(" {} -> {}".format(k, v))
# 4. Construct a bipartite graph G2 of readwrite servers to pre-existing
# shares. Then remove any edge (from G2) that uses a server or a share found
# in M1. Let an edge exist between server S and share T if and only if S
# already holds T.
# Now find the maximum matching for the rest of the existing allocations.
# Remove any peers and shares used in readonly_mappings.
peers = self.servermap_peerids - used_peers
shares = self.servermap_shareids - used_shares
servermap = self.servermap.copy()
for peer in self.servermap:
if peer in used_peers:
servermap.pop(peer, None)
else:
servermap[peer] = servermap[peer] - used_shares
if servermap[peer] == set():
servermap.pop(peer, None)
peers.remove(peer)
# 5. Calculate a maximum matching graph of G2, call this M2, again preferring
# earlier servers.
# Reindex and find the maximum matching of the graph.
peer_to_index = self._index_peers(peers, 1)
share_to_index, index_to_share = self._reindex_shares(shares, len(peers) + 1)
graph = self._servermap_flow_graph(peers, shares, servermap)
shareids = [share_to_index[s] for s in shares]
max_server_graph = self._compute_maximum_graph(graph, shareids)
existing_mappings = self._convert_mappings(peer_to_index,
index_to_share, max_server_graph)
# "max_server_graph" is M2
print("existing mappings")
for k, v in existing_mappings.items():
print(" {} -> {}".format(k, v))
# 6. Construct a bipartite graph G3 of (only readwrite) servers to
# shares (some shares may already exist on a server). Then remove
# (from G3) any servers and shares used in M1 or M2 (note that we
# retain servers/shares that were in G1/G2 but *not* in the M1/M2
# subsets)
existing_peers, existing_shares = self._extract_ids(existing_mappings)
peers = self.peerids - existing_peers - used_peers
shares = self.shareids - existing_shares - used_shares
# Generate a flow network of peerids to shareids for all peers
# and shares which cannot be reused from previous file allocations.
# These mappings represent new allocations the uploader must make.
peer_to_index = self._index_peers(peers, 1)
share_to_index, index_to_share = self._reindex_shares(shares, len(peers) + 1)
peerids = [peer_to_index[peer] for peer in peers]
shareids = [share_to_index[share] for share in shares]
graph = self._flow_network(peerids, shareids)
# XXX I think the above is equivalent to step 6, except
# instead of "construct, then remove" the above is just
# "remove all used peers, shares and then construct graph"
# 7. Calculate a maximum matching graph of G3, call this M3, preferring earlier
# servers. The final placement table is the union of M1+M2+M3.
max_graph = self._compute_maximum_graph(graph, shareids)
new_mappings = self._convert_mappings(peer_to_index, index_to_share,
max_graph)
print("new mappings")
for k, v in new_mappings.items():
print(" {} -> {}".format(k, v))
# "the final placement table"
mappings = dict(readonly_mappings.items() + existing_mappings.items()
+ new_mappings.items())
self._calculate_happiness(mappings)
if len(self.homeless_shares) != 0:
self._distribute_homeless_shares(mappings)
return mappings
def _compute_maximum_graph(self, graph, shareids):
"""
This is an implementation of the Ford-Fulkerson method for finding
a maximum flow in a flow network applied to a bipartite graph.
Specifically, it is the Edmonds-Karp algorithm, since it uses a
BFS to find the shortest augmenting path at each iteration, if one
exists.
The implementation here is an adapation of an algorithm described in
"Introduction to Algorithms", Cormen et al, 2nd ed., pp 658-662.
"""
if graph == []:
return {}
dim = len(graph)
flow_function = [[0 for sh in xrange(dim)] for s in xrange(dim)]
residual_graph, residual_function = residual_network(graph, flow_function)
while augmenting_path_for(residual_graph):
path = augmenting_path_for(residual_graph)
# Delta is the largest amount that we can increase flow across
# all of the edges in path. Because of the way that the residual
# function is constructed, f[u][v] for a particular edge (u, v)
# is the amount of unused capacity on that edge. Taking the
# minimum of a list of those values for each edge in the
# augmenting path gives us our delta.
delta = min(map(lambda (u, v), rf=residual_function: rf[u][v],
path))
for (u, v) in path:
flow_function[u][v] += delta
flow_function[v][u] -= delta
residual_graph, residual_function = residual_network(graph,flow_function)
new_mappings = {}
for share in shareids:
peer = residual_graph[share]
if peer == [dim - 1]:
new_mappings.setdefault(share, None)
else:
new_mappings.setdefault(share, peer[0])
return new_mappings
def _extract_ids(self, mappings):
shares = set()
peers = set()
for share in mappings:
if mappings[share] == None:
pass
else:
shares.add(share)
for item in mappings[share]:
peers.add(item)
return (peers, shares)
def _calculate_happiness(self, mappings):
"""
I calculate the happiness of the generated mappings and
create the set self.homeless_shares.
"""
self.happy = 0
self.homeless_shares = set()
for share in mappings:
if mappings[share] is not None:
self.happy += 1
else:
self.homeless_shares.add(share)
def _distribute_homeless_shares(self, mappings):
"""
Shares which are not mapped to a peer in the maximum spanning graph
still need to be placed on a server. This function attempts to
distribute those homeless shares as evenly as possible over the
available peers. If possible a share will be placed on the server it was
originally on, signifying the lease should be renewed instead.
"""
# First check to see if the leases can be renewed.
to_distribute = set()
for share in self.homeless_shares:
if share in self.servermap_shareids:
for peerid in self.servermap:
if share in self.servermap[peerid]:
mappings[share] = set([peerid])
break
else:
to_distribute.add(share)
# This builds a priority queue of peers with the number of shares
# each peer holds as the priority.
priority = {}
pQueue = PriorityQueue()
for peerid in self.peerids:
priority.setdefault(peerid, 0)
for share in mappings:
if mappings[share] is not None:
for peer in mappings[share]:
if peer in self.peerids:
priority[peer] += 1
if priority == {}:
return
for peerid in priority:
pQueue.put((priority[peerid], peerid))
# Distribute the shares to peers with the lowest priority.
for share in to_distribute:
peer = pQueue.get()
mappings[share] = set([peer[1]])
pQueue.put((peer[0]+1, peer[1]))
def _convert_mappings(self, peer_to_index, share_to_index, maximum_graph):
"""
Now that a maximum spanning graph has been found, convert the indexes
back to their original ids so that the client can pass them to the
uploader.
"""
converted_mappings = {}
for share in maximum_graph:
peer = maximum_graph[share]
if peer == None:
converted_mappings.setdefault(share_to_index[share], None)
else:
converted_mappings.setdefault(share_to_index[share],
set([peer_to_index[peer]]))
return converted_mappings
def _servermap_flow_graph(self, peers, shares, servermap):
"""
Generates a flow network of peerids to shareids from a server map
of 'peerids' -> ['shareids']. According to Wikipedia, "a flow network is a
directed graph where each edge has a capacity and each edge receives a flow.
The amount of flow on an edge cannot exceed the capacity of the edge." This
is necessary because in order to find the maximum spanning, the Edmonds-Karp algorithm
converts the problem into a maximum flow problem.
"""
if servermap == {}:
return []
peerids = peers
shareids = shares
peer_to_index = self._index_peers(peerids, 1)
share_to_index, index_to_share = self._reindex_shares(shareids, len(peerids) + 1)
graph = []
sink_num = len(peerids) + len(shareids) + 1
graph.append([peer_to_index[peer] for peer in peerids])
for peerid in peerids:
shares = [share_to_index[s] for s in servermap[peerid]]
graph.insert(peer_to_index[peerid], shares)
for shareid in shareids:
graph.insert(share_to_index[shareid], [sink_num])
graph.append([])
return graph
def _index_peers(self, ids, base):
"""
I create a bidirectional dictionary of indexes to ids with
indexes from base to base + |ids| - 1 inclusively. I am used
in order to create a flow network with vertices 0 through n.
"""
reindex_to_name = {}
for item in ids:
reindex_to_name.setdefault(item, base)
reindex_to_name.setdefault(base, item)
base += 1
return reindex_to_name
def _reindex_shares(self, shares, base):
"""
I create a dictionary of sharenum -> index (where 'index' is as defined
in _index_peers) and a dictionary of index -> sharenum. Since share
numbers use the same name space as the indexes, two dictionaries need
to be created instead of one like in _reindex_peers.
"""
share_to_index = {}
index_to_share = {}
for share in shares:
share_to_index.setdefault(share, base)
index_to_share.setdefault(base, share)
base += 1
return (share_to_index, index_to_share)
def _flow_network(self, peerids, shareids):
"""
Given set of peerids and shareids, I create a flow network
to be used by _compute_maximum_graph.
"""
graph = []
graph.append(peerids)
sink_num = len(peerids + shareids) + 1
for peerid in peerids:
graph.insert(peerid, shareids)
for shareid in shareids:
graph.insert(shareid, [sink_num])
graph.append([])
return graph

View File

@ -521,7 +521,7 @@ class Tahoe2ServerSelector(log.PrefixingLogMixin):
for shnum, tracker_id in servermap.items(): for shnum, tracker_id in servermap.items():
if tracker_id == None: if tracker_id == None:
continue continue
if tracker.get_serverid() in tracker_id: if tracker.get_serverid() == tracker_id:
shares_to_ask.add(shnum) shares_to_ask.add(shnum)
if shnum in self.homeless_shares: if shnum in self.homeless_shares:
self.homeless_shares.remove(shnum) self.homeless_shares.remove(shnum)

View File

@ -47,9 +47,9 @@ class Happiness(unittest.TestCase):
self.assertEqual( self.assertEqual(
places, places,
{ {
'share0': {'peer1'}, 'share0': 'peer1',
'share1': {'peer1'}, 'share1': 'peer1',
'share2': {'peer0'}, 'share2': 'peer0',
} }
) )
@ -88,7 +88,7 @@ class Happiness(unittest.TestCase):
# i.e. this says that share0 should be on peer0, share1 should # i.e. this says that share0 should be on peer0, share1 should
# be on peer1, etc. # be on peer1, etc.
expected = { expected = {
'share{}'.format(i): {'peer{}'.format(i)} 'share{}'.format(i): 'peer{}'.format(i)
for i in range(10) for i in range(10)
} }
self.assertEqual(expected, places) self.assertEqual(expected, places)
@ -106,21 +106,147 @@ class Happiness(unittest.TestCase):
happiness = happiness_upload.calculate_happiness(places) happiness = happiness_upload.calculate_happiness(places)
self.assertEqual(4, happiness) self.assertEqual(4, happiness)
def test_calc_happy(self): def test_hypothesis0(self):
sharemap = { peers={u'0', u'00'}
0: set(["\x0e\xd6\xb3>\xd6\x85\x9d\x94')'\xf03:R\x88\xf1\x04\x1b\xa4", shares={u'0', u'1'}
'\x8de\x1cqM\xba\xc3\x0b\x80\x9aC<5\xfc$\xdc\xd5\xd3\x8b&', readonly_peers = set()
'\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t', peers_to_shares = dict()
'\xc4\x83\x9eJ\x7f\xac| .\xc90\xf4b\xe4\x92\xbe\xaa\xe6\t\x80']),
1: set(['\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t']), places = happiness_upload.share_placement(peers, readonly_peers, shares, peers_to_shares)
2: set(['\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t']), happiness = happiness_upload.calculate_happiness(places)
3: set(['\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t']),
4: set(['\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t']), self.assertEqual(2, happiness)
5: set(['\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t']),
6: set(['\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t']), # process just gets killed with anything like 200 (see
7: set(['\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t']), # test_upload.py)
8: set(['\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t']), def test_50(self):
9: set(['\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t']), peers = set(['peer{}'.format(x) for x in range(50)])
shares = set(['share{}'.format(x) for x in range(50)])
readonly_peers = set()
peers_to_shares = dict()
places = happiness_upload.share_placement(peers, readonly_peers, shares, peers_to_shares)
happiness = happiness_upload.calculate_happiness(places)
self.assertEqual(50, happiness)
def test_50_orig_code(self):
peers = set(['peer{}'.format(x) for x in range(50)])
shares = set(['share{}'.format(x) for x in range(50)])
readonly_peers = set()
peers_to_shares = dict()
h = happiness_upload.Happiness_Upload(peers, readonly_peers, shares, peers_to_shares)
places = h.generate_mappings()
self.assertEqual(50, h.happy)
self.assertEqual(50, len(places))
for share in shares:
self.assertTrue(share in places)
self.assertTrue(places[share].pop() in peers)
def test_redistribute(self):
"""
with existing shares 0, 3 on a single servers we can achieve
higher happiness by moving one of those shares to a new server
"""
peers = {'a', 'b', 'c', 'd'}
shares = {'0', '1', '2', '3'}
readonly_peers = set()
peers_to_shares = {
'a': set(['0']),
'b': set(['1']),
'c': set(['2', '3']),
} }
happy = happiness_upload.calculate_happiness(sharemap) # we can achieve more happiness by moving "2" or "3" to server "d"
places = happiness_upload.share_placement(peers, readonly_peers, shares, peers_to_shares)
happiness = happiness_upload.calculate_happiness(places)
self.assertEqual(4, happiness)
def test_redistribute2(self):
"""
with existing shares 0, 3 on a single servers we can achieve
higher happiness by moving one of those shares to a new server
"""
peers = {'a', 'b', 'c', 'd'}
shares = {'0', '1', '2', '3'}
readonly_peers = set()
peers_to_shares = {
'a': set(['0']),
'b': set(['1']),
'c': set(['2', '3']),
}
# we can achieve more happiness by moving "2" or "3" to server "d"
h = happiness_upload.Happiness_Upload(peers, readonly_peers, shares, peers_to_shares)
places = h.generate_mappings()
self.assertEqual(4, h.happy)
print(places)
def test_calc_happy(self):
# share -> server
share_placements = {
0: "\x0e\xd6\xb3>\xd6\x85\x9d\x94')'\xf03:R\x88\xf1\x04\x1b\xa4",
1: '\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t',
2: '\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t',
3: '\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t',
4: '\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t',
5: '\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t',
6: '\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t',
7: '\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t',
8: '\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t',
9: '\xb9\xa3N\x80u\x9c_\xf7\x97FSS\xa7\xbd\x02\xf9f$:\t',
}
happy = happiness_upload.calculate_happiness(share_placements)
self.assertEqual(2, happy) self.assertEqual(2, happy)
def test_bar(self):
peers = {'peer0', 'peer1', 'peer2', 'peer3'}
shares = {'share0', 'share1', 'share2'}
readonly_peers = {'peer0'}
servermap = {
'peer0': {'share2', 'share0'},
'peer1': {'share1'},
}
h = happiness_upload.Happiness_Upload(peers, readonly_peers, shares, servermap)
maps = h.generate_mappings()
print("maps:")
for k in sorted(maps.keys()):
print("{} -> {}".format(k, maps[k]))
def test_foo(self):
peers = ['peer0', 'peer1']
shares = ['share0', 'share1', 'share2']
h = happiness_upload.Happiness_Upload(peers, [], shares, {})
# servermap must have all peers -> [share, share, share, ...]
graph = h._servermap_flow_graph(
peers,
shares,
{
'peer0': ['share0', 'share1', 'share2'],
'peer1': ['share1'],
},
)
peer_to_index = h._index_peers(peers, 1)
share_to_index, index_to_share = h._reindex_shares(shares, len(peers) + 1)
print("graph:")
for row in graph:
print(row)
shareids = [3, 4, 5]
max_server_graph = h._compute_maximum_graph(graph, shareids)
print("max_server_graph:", max_server_graph)
for k, v in max_server_graph.items():
print("{} -> {}".format(k, v))
mappings = h._convert_mappings(peer_to_index, index_to_share, max_server_graph)
print("mappings:", mappings)
used_peers, used_shares = h._extract_ids(mappings)
print("existing used peers", used_peers)
print("existing used shares", used_shares)
unused_peers = peers - used_peers
unused_shares = shares - used_shares