Added results

sumonbis · Dec 9, 2022 · 6e23727 · 6e23727
1 parent f70c12d
commit 6e23727
Show file tree

Hide file tree

Showing 93 changed files with 147,669 additions and 0 deletions.
diff --git a/targeted/AC-result.csv b/targeted/AC-result.csv
@@ -0,0 +1,13 @@
+,Partition_ID,SAT_count,UNSAT_count,UNK_count,h_attempt,h_success,ST_compression,H_compression,SV-time,HV-Time,Total-Time
+0,223,55,160,8,11,3,0.77632287,0.006278027,11.92933184,4.392726457,16.4506278
+4,67,16,37,14,14,0,0.88991791,0.006501493,33.89147761,20.90544776,55.22850746
+5,115,75,32,8,11,3,0.817211304,0.003749565,22.90266957,8.281417391,31.38608696
+6,25,7,3,15,16,1,0.874024,0.042984,77.08212,61.2542,150.408
+7,23,8,1,14,19,5,0.846986957,0.037086957,87.10565217,68.89026087,158.7913043
+8,111,52,47,12,14,2,0.684684685,0.011531532,21.30367568,11.15859459,32.60558559
+9,38,0,26,12,19,7,0.729052632,0.042947368,57.15105263,36.46505263,95.23736842
+10,448,179,266,3,4,1,0.324044643,0,7.249845982,0.677446429,8.047321429
+11,6800,1624,5176,0,0,0,0.261818794,0,0.424020882,0,0.529416176
+1,108,23,81,4,17,13,0.400362963,0.006611111,25.53975926,7.688537037,33.36759259
+2,18,0,0,18,18,0,0.140933333,0.032533333,100.1185,100.1684444,200.7522222
+3,68,0,50,18,18,0,0.417833824,0.006705882,28.21379412,26.51486765,54.97485294
diff --git a/targeted/AC/Verify-AC.py b/targeted/AC/Verify-AC.py
@@ -0,0 +1,317 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+import sys
+sys.path.append('../../')
+
+from random import shuffle
+from z3 import *
+from utils.input_partition import *
+from utils.verif_utils import *
+from utils.prune import *
+from importlib import import_module
+
+# In[]
+
+df, X_train, y_train, X_test, y_test = load_adult_ac1()
+X = np.r_[X_train, X_test]
+single_input = X_test[0].reshape(1, 13)
+#print_metadata(df)
+
+# In[]
+model_dir = '../../models/adult/'
+result_dir = './res/race1-'
+PARTITION_THRESHOLD = 6
+
+SOFT_TIMEOUT = 100
+HARD_TIMEOUT = 1*60*60
+HEURISTIC_PRUNE_THRESHOLD = 20
+
+# In[]
+## Domain
+default_range = [0, 1]
+range_dict = {}
+range_dict['age'] = [30, 35]
+range_dict['workclass'] = [0, 6]
+range_dict['education'] = [0, 15]
+range_dict['education-num'] = [1, 16]
+range_dict['marital-status'] = [0, 6]
+range_dict['occupation'] = [0, 13]
+range_dict['relationship'] = [0, 5]
+range_dict['race'] = [0, 4]
+range_dict['sex'] = [0, 1]
+range_dict['capital-gain'] = [0, 19]
+range_dict['capital-loss'] = [0, 19]
+range_dict['hours-per-week'] = [1, 100]
+range_dict['native-country'] = [0, 40]
+
+A = range_dict.keys()
+PA = ['race']
+
+RA = []
+RA_threshold = 5
+
+sim_size = 1 * 1000
+
+p_dict = partition(range_dict, PARTITION_THRESHOLD)
+p_list = partitioned_ranges(A, PA, p_dict, range_dict)
+print('Number of partitions: ', len(p_list))
+shuffle(p_list)
+
+# In[]
+
+model_files = os.listdir(model_dir)
+for model_file in model_files:
+    if not model_file.endswith('.h5'):
+        continue;
+    print('==================  STARTING MODEL ' + model_file)
+    model_name = model_file.split('.')[0]
+    if model_name == '':
+        continue
+
+    model_funcs = 'utils.' + model_name + '-Model-Functions'
+    mod = import_module(model_funcs)
+    layer_net = getattr(mod, 'layer_net')
+    net = getattr(mod, 'net')
+    z3_net = getattr(mod, 'z3_net')
+
+    w = []
+    b = []
+
+    model = load_model(model_dir + model_file)
+
+    for i in range(len(model.layers)):
+        w.append(model.layers[i].get_weights()[0])
+        b.append(model.layers[i].get_weights()[1])
+
+    print('###################')
+    partition_id = 0
+    sat_count = 0
+    unsat_count = 0
+    unk_count = 0
+    cumulative_time = 0
+
+    for p in p_list:
+        heuristic_attempted = 0
+        result = []
+        start_time = time.time()
+
+        partition_id += 1
+        simulation_size = 1*1000
+
+
+        # In[]
+    #    sd = s
+        neuron_bounds, candidates, s_candidates, b_deads, s_deads, st_deads, pos_prob, sim_X_df  = \
+            sound_prune(df, w, b, simulation_size, layer_net, p)
+
+        b_compression = compression_ratio(b_deads)
+        s_compression = compression_ratio(s_deads)
+        st_compression = compression_ratio(st_deads)
+
+        pr_w, pr_b = prune_neurons(w, b, st_deads)
+
+
+        # In[]
+        # Create properties
+        in_props = []
+        out_props = []
+
+        x = np.array([Int('x%s' % i) for i in range(13)]) 
+        x_ = np.array([Int('x_%s' % i) for i in range(13)])
+
+        y = z3_net(x, pr_w, pr_b) # y is an array of size 1
+        y_ = z3_net(x_, pr_w, pr_b)
+
+        # Basic fairness property - must include
+        for attr in A:
+            if(attr in PA):
+                in_props.extend(in_const_adult(df, x, attr, 'neq', x_))
+            elif(attr in RA):
+                in_props.extend(in_const_diff_adult(df, x, x_, attr, RA_threshold))
+            else:
+                in_props.extend(in_const_adult(df, x, attr, 'eq', x_))
+
+        in_props.extend(in_const_domain_adult(df, x, x_, p, PA))
+
+        # In[]
+        s = Solver()
+        #s.reset()
+
+        if(len(sys.argv) > 1):
+            s.set("timeout", int(sys.argv[1]) * 1000) # X seconds
+        else:
+            s.set("timeout", SOFT_TIMEOUT * 1000)
+
+
+        for i in in_props:
+            s.add(i)
+
+        s.add(Or(And(y[0] < 0, y_[0] > 0), And(y[0] > 0, y_[0] < 0)))
+
+        print('Verifying ...')
+        res = s.check()
+
+        print(res)
+        if res == sat:
+            m = s.model()
+            inp1, inp2 = parse_z3Model(m)
+
+        sv_time = s.statistics().time
+        s_end_time = time.time()
+        s_time = compute_time(start_time, s_end_time)
+        hv_time = 0
+        # In[]
+        h_compression = 0
+        t_compression = st_compression
+        h_success = 0
+        if res == unknown:
+            heuristic_attempted = 1
+
+            h_deads, deads = heuristic_prune(neuron_bounds, candidates,
+                s_candidates, st_deads, pos_prob, HEURISTIC_PRUNE_THRESHOLD, w, b)
+
+            del pr_w
+            del pr_b
+
+            pr_w, pr_b = prune_neurons(w, b, deads)
+            h_compression = compression_ratio(h_deads)
+            print(round(h_compression*100, 2), '% HEURISTIC PRUNING')
+            t_compression = compression_ratio(deads)
+            print(round(t_compression*100, 2), '% TOTAL PRUNING')
+
+            y = z3_net(x, pr_w, pr_b) # y is an array of size 1
+            y_ = z3_net(x_, pr_w, pr_b)
+
+            s = Solver()
+
+            if(len(sys.argv) > 1):
+                s.set("timeout", int(sys.argv[1]) * 1000) # X seconds
+            else:
+                s.set("timeout", SOFT_TIMEOUT * 1000)
+
+            for i in in_props:
+                s.add(i)
+
+            s.add(Or(And(y[0] < 0, y_[0] > 0), And(y[0] > 0, y_[0] < 0)))
+            print('Verifying ...')
+            res = s.check()
+
+            print(res)
+            if res == sat:
+                m = s.model()
+                inp1, inp2 = parse_z3Model(m)
+
+            if res != unknown:
+                h_success = 1
+            hv_time = s.statistics().time
+
+        # In[]
+        h_time = compute_time(s_end_time, time.time())
+        total_time = compute_time(start_time, time.time())
+
+        cumulative_time += total_time
+
+        # In[]
+        print('V time: ', s.statistics().time)
+        file = result_dir + model_name + '.csv'
+
+        # In[]
+        c_check_correct = 0
+        accurate = 0
+        d1 = ''
+        d2 = ''
+        if res == sat:
+            sat_count += 1
+            d1 = np.asarray(inp1, dtype=np.float32)
+            d2 = np.asarray(inp2, dtype=np.float32)
+            print(inp1)
+            print(inp2)
+            res1 = net(d1, pr_w, pr_b)
+            res2 = net(d2, pr_w, pr_b)
+            print(res1, res2)
+            pred1 = sigmoid(res1)
+            pred2 = sigmoid(res2)
+            class_1 = pred1 > 0.5
+            class_2 = pred2 > 0.5
+
+            res1_orig = net(d1, w, b)
+            res2_orig = net(d2, w, b)
+            print(res1_orig, res2_orig)
+            pred1_orig = sigmoid(res1_orig)
+            pred2_orig = sigmoid(res2_orig)
+            class_1_orig = pred1_orig > 0.5
+            class_2_orig = pred2_orig > 0.5
+
+            if class_1_orig != class_2_orig:
+                accurate = 1
+            if class_1 == class_1_orig and class_2 == class_2_orig:
+                c_check_correct = 1
+        elif res == unsat:
+            unsat_count += 1
+        else:
+            unk_count +=1
+
+
+        d = X_test[0]
+        res1 = net(d, pr_w, pr_b)
+        pred1 = sigmoid(res1)
+        class_1 = pred1 > 0.5
+
+        res1_orig = net(d, w, b)
+        pred1_orig = sigmoid(res1_orig)
+        class_1_orig = pred1_orig > 0.5
+
+        sim_X = sim_X_df.to_numpy()    
+        sim_y_orig = get_y_pred(net, w, b, sim_X)    
+        sim_y = get_y_pred(net, pr_w, pr_b, sim_X)
+
+
+        orig_acc = accuracy_score(y_test, get_y_pred(net, w, b, X_test))
+        pruned_acc = accuracy_score(sim_y_orig, sim_y)
+
+        # In[]
+        res_cols = ['Partition_ID', 'Verification', 'SAT_count', 'UNSAT_count', 'UNK_count', 'h_attempt', 'h_success', \
+                    'B_compression', 'S_compression', 'ST_compression', 'H_compression', 'T_compression', 'SV-time', 'S-time', 'HV-Time', 'H-Time', 'Total-Time', 'C-check',\
+                    'V-accurate', 'Original-acc', 'Pruned-acc', 'Acc-dec', 'C1', 'C2']
+
+        result.append(partition_id)
+        result.append(str(res))
+        result.append(sat_count)
+        result.append(unsat_count)
+        result.append(unk_count)
+        result.append(heuristic_attempted)
+        result.append(h_success)
+        result.append(round(b_compression, 4))
+        result.append(round(s_compression, 4))
+        result.append(round(st_compression, 4))
+        result.append(round(h_compression, 4))
+        result.append(round(t_compression, 4))
+        result.append(sv_time)
+        result.append(s_time)
+        result.append(hv_time)
+        result.append(h_time)
+        result.append(total_time)
+        result.append(c_check_correct)
+        result.append(accurate)
+        result.append(round(orig_acc, 4))
+        result.append(round(pruned_acc, 4))
+        result.append('-')
+        #result.append(round(orig_acc - pruned_acc, 4))
+        result.append(d1)
+        result.append(d2)
+
+
+        import csv
+        file_exists = os.path.isfile(file)
+        with open(file, "a", newline='') as fp:
+            if not file_exists:
+                wr = csv.writer(fp, dialect='excel')
+                wr.writerow(res_cols)
+
+            wr = csv.writer(fp)
+            wr.writerow(result)
+        print('******************')
+
+        if(cumulative_time > HARD_TIMEOUT):
+            print('==================  COMPLETED MODEL ' + model_file)
+            break