forked from Networks-Learning/strategic-decisions
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmin_cost.py
192 lines (164 loc) · 6.39 KB
/
min_cost.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
import numpy as np
from lib import configuration as Configuration
import time
import json as js
import click
from joblib import Parallel, delayed
def dump_data(m, k, util, seed, runtime, accepted=None, avg_cost=None, best_responses=None, sparsity=None, alpha=None):
out = {"m": m,
"k": k,
"min_cost": util,
"seed": seed,
"time": runtime,
"sparsity": sparsity,
"accepted": accepted,
"avg_cost": avg_cost,
"alpha": alpha,
"best_responses" : best_responses
}
out = {k:v for k,v in out.items() if v is not None}
return out
# Computes the utility given a policy and a set of explanations
def compute_utility(pi, p, C, utility, ex):
m = pi.size
u = 0
br = np.arange(m) # best-responses
for i in range(m):
if pi[i]==1:
u+=p[i]*utility[i]
br[i]=i
else:
min_dist=np.inf
for j in ex:
if C[i,j]<=min_dist:
min_dist=C[i,j]
min_j=j
if 1-min_dist>=pi[i]:
u+=p[i]*utility[min_j]
br[i]=min_j
else:
u+=pi[i]*p[i]*utility[i]
br[i]=i
return u,br
# Computes the marginal difference in utility caused by adding new_ex in the set of explanations
def marginal(matching, pi, p, C, new_ex):
m = pi.size
wght_cost = 0
if matching is None:
new_matching = np.zeros(m, dtype=int)
for i in range(m):
if pi[i]!=1:
new_matching[i] = new_ex
wght_cost += p[i]*C[i,new_ex]
else:
new_matching = matching.copy()
for i in range(m):
if pi[i]!=1 and C[i,new_ex]<=C[i,new_matching[i]]:
new_matching[i] = new_ex
wght_cost += p[i]*C[i,new_ex]
elif pi[i]!=1 and C[i,new_ex]>C[i,new_matching[i]]:
wght_cost += p[i]*C[i,new_matching[i]]
return new_ex, wght_cost, new_matching
# Finds the optimal solution
def optimize(attr, k, m, njobs):
start = time.time()
solution_set=[]
matching = None # Contains the best-response of each feature value at the end each iteration
for iteration in range(k):
print("Iteration "+str(iteration))
marginals = Parallel(n_jobs=njobs)(delayed(marginal)(matching, attr['pi'], attr['p'], attr['C'], i)
for i in range(m) if attr["utility"][i]>=0 and attr["pi"][i]==1 and i not in solution_set)
if marginals!=[]:
min_new_exp, min_cost, min_exps = min(marginals, key=lambda x : x[1])
solution_set.append(min_new_exp)
matching = min_exps
end = time.time()
run_time = end - start
final_util,final_br = compute_utility(attr["pi"], attr["p"], attr["C"], attr["utility"], solution_set)
return final_util, final_br, run_time
@click.command()
@click.option('--output', required=True, help="output directory")
@click.option('--m', default=4, help="Number of states")
@click.option('--k', default=2, help="Number of examples")
@click.option('--seed', default=2, help="random number for seed.")
@click.option('--sparsity', default=2, help="sparsity of the graph")
@click.option('--accepted', default=1, type=float, help="percentage with pi equals one")
@click.option('--njobs', default=1, help="number of parallel threads")
def experiment(output, m, k, seed, sparsity, accepted, njobs):
"""
Runs one experiment on synthetic data using the minimum cost algorithm.
Parameters
----------
output : string
output directory prefix (e.g., outputs/exec1_)
m : int
number of feature values
k : int
maximum number of explanations
seed : int
random seed for reproducibility
sparsity : int
number of unreachable feature values
accepted : float
percentage of feature values with non-negative utility to set pi to 1
njobs : int
number of parallel threads to be used
"""
# Generate a random configuration
attr = Configuration.generate_pi_configuration(
m, seed, accepted_percentage=accepted, degree_of_sparsity=sparsity)
# Find optimal solution
final_util, final_br, run_time = optimize(attr, k, m, njobs)
# Compute average cost incurred by changing features
avg_cost=0
for i in range(m):
if final_br[i]!=i:
avg_cost+=attr["p"][i]*attr["C"][i,final_br[i]]
print("Minimum Cost RunTime = " + str(run_time))
print("Final Utility = " + str(final_util))
# Store execution details and results
with open(output + '_config.json', "w") as fi:
fi.write(js.dumps(dump_data(m=m, k=k, util=final_util, seed=seed, runtime=run_time,
sparsity=sparsity, accepted=accepted, avg_cost=avg_cost)))
def compute_mincos(output, C, U, Px, k, seed, alpha, indexing, njobs=1):
"""
Runs one experiment on real data using the minimum cost algorithm.
Parameters
----------
output : string
output directory prefix (e.g., outputs/exec1_)
C : numpy array
pairwise costs
U : numpy array
utility gained by each feature value
Px : numpy array
initial population in each feature value
k : int
maximum number of explanations
seed : int
random seed for reproducibility
alpha : float
alpha parameter value
indexing : numpy array
real indices of feature values (unsorted)
njobs : int
number of parallel threads to be used
"""
# Generate a configuration based on input data
attr = Configuration.generate_configuration_state(U, C, Px, seed)
m=attr["m"]
# Find optimal solution
final_util, final_br, run_time = optimize(attr, k, m, njobs)
# Fix best responses to fit the real indices
best_responses = {}
for index, real_index in enumerate(indexing):
best_responses[int(real_index)] = int(indexing[final_br[index]])
print("Minimum Cost RunTime = " + str(run_time))
print("Final Utility = " + str(final_util))
# Store execution details and results
with open(output + '_config.json', "w") as fi:
fi.write(js.dumps(dump_data(m=m, k=k, util=final_util, seed=seed, runtime=run_time,
alpha=alpha, best_responses=best_responses)))
return attr
if __name__ == '__main__':
experiment()