-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathMain_ChnkSzVar.py
174 lines (125 loc) · 6.16 KB
/
Main_ChnkSzVar.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
# This is the main file to run the simulator for our coded load balancing scheme.
#
# Here we vary the number of chunks a file is partitioned into and simulate the average cost
# of users and the maximum load of servers.
#
#
from __future__ import division
import math
from multiprocessing import Pool
import sys
import numpy as np
import scipy.io as sio
import time
from CodedLoadBalancing.Simulator_MltChnk import *
#--------------------------------------------------------------------
# Simulation parameters:

# Choose the simulator. Only 'Coded' is currently handled by the main section
# of this script (the 'TwoChoices' branch there is commented out).
simulator = 'Coded'

# Base part of the output file name
base_out_filename = 'ChnkSzVar'

# Pool size for parallel processing
pool_size = 2

# Number of runs for computing average values. It is more efficient for
# num_of_runs to be a multiple of pool_size.
num_of_runs = 10

# Number of servers
srv_num = 49

# Cache size of each server (expressed in number of files)
cache_sz = 1

# Total number of files in the system
file_num = 10

# The number of chunks
# If the number of chunks is set to one, we in fact simulate the nearest replica strategy.
# Here, instead of determining the 'number of chunks,' we provide a set of chunk numbers in the
# variable 'chnk_range'.
#chnk_num = 5
chnk_range = [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]

# The maximum number of chunks that can be downloaded from each server.
chnk_max = 10

# The graph structure of the network
# It can be:
# 'Lattice' for square lattice graph. For the lattice the graph size should be a perfect square.
# 'RGG' for random geometric graph. The RGG is generated over a unit square or unit cube.
# 'BarabasiAlbert' for Barabasi Albert random graph. It takes two parameters: # of nodes and # of edges
# to attach from a new node to existing nodes
graph_type = 'Lattice'
#graph_type = 'RGG'
#graph_type = 'BarabasiAlbert'

# The parameters of the selected random graph
# The dictionary graph_param should always be defined. However, for some graphs it may not be used.
# Both parameter sets live in ONE dictionary: assigning graph_param twice would
# silently drop 'rgg_radius', breaking the setup as soon as graph_type is
# switched to 'RGG'.
graph_param = {
    # Connection radius if the graph is a random geometric graph (RGG)
    'rgg_radius': math.sqrt(5 / 4 * math.log(srv_num)) / math.sqrt(srv_num),
    # Number of edges attached from each new node, for Barabasi Albert random graphs
    'num_edges': 1,
}

# The distribution of file placement in nodes' caches
# It can be:
# 'Uniform' for uniform placement.
# 'Zipf' for zipf distribution. We have to determine the parameter 'gamma' for this distribution in 'place_dist_param'.
placement_dist = 'Uniform'
#placement_dist = 'Zipf'

# The parameters of the placement distribution
place_dist_param = {'gamma': 0.0}  # For Zipf distribution where 0 < gamma < infty
#--------------------------------------------------------------------
def main():
    """Run the chunk-number sweep, save the results, and print them.

    For every chunk number in ``chnk_range`` the selected simulator is run
    ``num_of_runs`` times in a process pool, with the number of requests set
    equal to the number of servers. Three result matrices are filled (maximum
    load, average cost, outage), each with one row per chunk number: column 0
    holds the chunk number and columns 1..num_of_runs hold the per-run values
    read from the simulator's result dictionaries (keys 'maxload', 'avgcost',
    'outage').

    The matrices are written to a MATLAB .mat file whose name encodes the
    simulation parameters, and are then printed.

    Raises:
        SystemExit: with status 1 if ``simulator`` is not a known simulator.
    """
    # Map simulator names to their entry points. Additional simulators
    # (e.g. a 'TwoChoices' one) can be registered here.
    simulators = {'Coded': coded_load_balancing_simulator}

    # Fail fast, before any worker process is spawned, and report the failure
    # through a non-zero exit status.
    if simulator not in simulators:
        print('Error: an invalid simulator!')
        sys.exit(1)
    run_simulator = simulators[simulator]

    num_rows = len(chnk_range)
    rslt_maxload = np.zeros((num_rows, 1 + num_of_runs))
    rslt_avgcost = np.zeros((num_rows, 1 + num_of_runs))
    rslt_outage = np.zeros((num_rows, 1 + num_of_runs))

    # Create a number of workers for parallel processing
    pool = Pool(processes=pool_size)
    t_start = time.time()
    try:
        for i, chnk_num in enumerate(chnk_range):
            # One request per server.
            req_num = srv_num
            # Every run of this sweep point uses the same parameter tuple.
            params = [(srv_num, req_num, cache_sz, file_num, chnk_num, chnk_max,
                       graph_type, graph_param, placement_dist, place_dist_param)
                      for _ in range(num_of_runs)]
            print(params)

            rslts = pool.map(run_simulator, params)

            # Column 0 identifies the sweep point; columns 1.. hold the runs.
            rslt_maxload[i, 0] = chnk_num
            rslt_avgcost[i, 0] = chnk_num
            rslt_outage[i, 0] = chnk_num
            for j, rslt in enumerate(rslts):
                rslt_maxload[i, j + 1] = rslt['maxload']
                rslt_avgcost[i, j + 1] = rslt['avgcost']
                rslt_outage[i, j + 1] = rslt['outage']
    finally:
        # Always release the worker processes, even if a run failed.
        pool.close()
        pool.join()
    t_end = time.time()
    print("The runtime is {}".format(t_end - t_start))

    # Write the results to a matlab .mat file
    results = {'maxload': rslt_maxload, 'avgcost': rslt_avgcost, 'outage': rslt_outage}
    if placement_dist == 'Uniform':
        out_filename = base_out_filename + '_{}_{}_{}_sn={}_fn={}_cs={}_chnmax={}_itr={}.mat'.format(
            graph_type, placement_dist, simulator, srv_num, file_num, cache_sz, chnk_max, num_of_runs)
        sio.savemat(out_filename, results)
    elif placement_dist == 'Zipf':
        out_filename = base_out_filename + '_{}_{}_gamma={}_{}_sn={}_fn={}_cs={}_chnmax={}_itr={}.mat'.format(
            graph_type, placement_dist, place_dist_param['gamma'], simulator, srv_num,
            file_num, cache_sz, chnk_max, num_of_runs)
        sio.savemat(out_filename, results)
    else:
        # Do not lose the results silently: tell the user nothing was written.
        print("Warning: unknown placement distribution '{}'; results were not saved.".format(placement_dist))

    print('Outage:')
    print(rslt_outage)
    print('Maxload:')
    print(rslt_maxload)
    print('Communication Cost:')
    print(rslt_avgcost)


if __name__ == '__main__':
    main()