diff --git a/examples/demo_gerryfair.ipynb b/examples/demo_gerryfair.ipynb index efdb5983..daaabbe1 100644 --- a/examples/demo_gerryfair.ipynb +++ b/examples/demo_gerryfair.ipynb @@ -1,884 +1,998 @@ { - "cells": [ - { - "cell_type": "code", - "execution_count": 1, - "metadata": { - "pycharm": { - "is_executing": false - } - }, - "outputs": [], - "source": [ - "%matplotlib inline\n", - "import warnings\n", - "warnings.filterwarnings(\"ignore\")\n", - "import sys\n", - "sys.path.append(\"../\")\n", - "from aif360.algorithms.inprocessing import GerryFairClassifier\n", - "from aif360.algorithms.inprocessing.gerryfair.clean import array_to_tuple\n", - "from aif360.algorithms.inprocessing.gerryfair.auditor import Auditor\n", - "from aif360.algorithms.preprocessing.optim_preproc_helpers.data_preproc_functions import load_preproc_data_adult\n", - "from sklearn import svm\n", - "from sklearn import tree\n", - "from sklearn.kernel_ridge import KernelRidge\n", - "from sklearn import linear_model\n", - "from aif360.metrics import BinaryLabelDatasetMetric\n", - "from IPython.display import Image\n", - "import pickle\n", - "import matplotlib.pyplot as plt\n", - "\n", - "# load data set\n", - "data_set = load_preproc_data_adult(sub_samp=1000, balance=True)\n", - "max_iterations = 500" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "**instantiate, fit, and predict** \n", - "\n", - "\n", - "We first demonstrate how to instantiate a `GerryFairClassifier`, `train` it with respect to rich subgroup fairness, and `predict` the label of a new example. We remark that when we set the `print_flag = True` at each iteration of the algorithm we print the error, fairness violation, and violated group size of most recent model. The error is the classification error of the classifier. 
At each round the Learner tries to find a classifier that minimizes the classification error plus a weighted sum of the fairness disparities on all the groups that the Auditor has found up until that point. By contrast the Auditor tries to find the group at each round with the greatest rich subgroup disparity with respect to the Learner's model. We define `violated group size` as the size (as a fraction of the dataset size) of this group, and the `fairness violation` as the `violated group size` times the difference in the statistical rate (FP or FN rate) on the group vs. the whole population. \n", - "\n", - "In the example below we set `max_iterations=500` which is an order of magnitude less than the time to convergence observed in [the rich subgroup fairness empirical paper](https://arxiv.org/abs/1808.08166), but advise that this can be highly dataset dependent. Our target $\\gamma$-disparity is $\\gamma = .005$, our statistical rate is false positive rate or `FP`, and our cost-sensitive classification oracle is linear regression (more on that below). 
\n" - ] - }, - { - "cell_type": "code", - "execution_count": 2, - "metadata": { - "pycharm": { - "is_executing": true - } - }, - "outputs": [ + "cells": [ { - "name": "stdout", - "output_type": "stream", - "text": [ - "iteration: 1, error: 0.263, fairness violation: 0.028780000000000007, violated group size: 0.217\n", - "iteration: 2, error: 0.3815, fairness violation: 0.014390000000000003, violated group size: 0.217\n", - "iteration: 3, error: 0.42099999999999993, fairness violation: 0.009593333333333339, violated group size: 0.283\n", - "iteration: 4, error: 0.44075, fairness violation: 0.007195000000000002, violated group size: 0.217\n", - "iteration: 5, error: 0.45260000000000006, fairness violation: 0.005756000000000001, violated group size: 0.217\n", - "iteration: 6, error: 0.4605000000000001, fairness violation: 0.004796666666666668, violated group size: 0.283\n", - "iteration: 7, error: 0.4661428571428572, fairness violation: 0.004111428571428572, violated group size: 0.217\n", - "iteration: 8, error: 0.470375, fairness violation: 0.0035975000000000017, violated group size: 0.217\n", - "iteration: 9, error: 0.4691111111111112, fairness violation: 0.0033906666666666677, violated group size: 0.283\n", - "iteration: 10, error: 0.4681, fairness violation: 0.003225200000000001, violated group size: 0.283\n", - "iteration: 11, error: 0.4672727272727271, fairness violation: 0.0030898181818181836, violated group size: 0.283\n", - "iteration: 12, error: 0.4665833333333333, fairness violation: 0.0029769999999999996, violated group size: 0.217\n", - "iteration: 13, error: 0.466, fairness violation: 0.0028815384615384627, violated group size: 0.283\n", - "iteration: 14, error: 0.4655000000000001, fairness violation: 0.0027997142857142865, violated group size: 0.217\n", - "iteration: 15, error: 0.46506666666666674, fairness violation: 0.002728800000000001, violated group size: 0.217\n", - "iteration: 16, error: 0.4646875, fairness violation: 0.0026667500000000007, 
violated group size: 0.217\n", - "iteration: 17, error: 0.4643529411764707, fairness violation: 0.002612000000000001, violated group size: 0.283\n", - "iteration: 18, error: 0.46405555555555567, fairness violation: 0.002563333333333334, violated group size: 0.217\n", - "iteration: 19, error: 0.4637894736842106, fairness violation: 0.0025197894736842096, violated group size: 0.217\n", - "iteration: 20, error: 0.46354999999999996, fairness violation: 0.0024806000000000008, violated group size: 0.283\n", - "iteration: 21, error: 0.4633333333333334, fairness violation: 0.0024451428571428584, violated group size: 0.217\n", - "iteration: 22, error: 0.4631363636363638, fairness violation: 0.0024129090909090914, violated group size: 0.283\n", - "iteration: 23, error: 0.46295652173913054, fairness violation: 0.002383478260869566, violated group size: 0.217\n", - "iteration: 24, error: 0.4627916666666667, fairness violation: 0.002356500000000001, violated group size: 0.283\n", - "iteration: 25, error: 0.4626400000000001, fairness violation: 0.0023316800000000018, violated group size: 0.283\n", - "iteration: 26, error: 0.4625000000000001, fairness violation: 0.0023087692307692314, violated group size: 0.217\n", - "iteration: 27, error: 0.4623703703703705, fairness violation: 0.0022875555555555557, violated group size: 0.217\n", - "iteration: 28, error: 0.46224999999999994, fairness violation: 0.0022678571428571426, violated group size: 0.217\n", - "iteration: 29, error: 0.46213793103448264, fairness violation: 0.0022495172413793106, violated group size: 0.217\n", - "iteration: 30, error: 0.46203333333333335, fairness violation: 0.0022324000000000003, violated group size: 0.217\n", - "iteration: 31, error: 0.46193548387096783, fairness violation: 0.0022163870967741935, violated group size: 0.217\n", - "iteration: 32, error: 0.46184375, fairness violation: 0.0022013749999999993, violated group size: 0.217\n", - "iteration: 33, error: 0.459969696969697, fairness violation: 
0.0023319393939393944, violated group size: 0.283\n", - "iteration: 34, error: 0.4582058823529412, fairness violation: 0.002454823529411765, violated group size: 0.217\n", - "iteration: 35, error: 0.45654285714285714, fairness violation: 0.0025706857142857144, violated group size: 0.217\n", - "iteration: 36, error: 0.4549722222222221, fairness violation: 0.0026801111111111114, violated group size: 0.283\n", - "iteration: 37, error: 0.4534864864864866, fairness violation: 0.0027836216216216214, violated group size: 0.283\n", - "iteration: 38, error: 0.45207894736842097, fairness violation: 0.0028816842105263162, violated group size: 0.283\n", - "iteration: 39, error: 0.4507435897435898, fairness violation: 0.0029747179487179492, violated group size: 0.217\n", - "iteration: 40, error: 0.44947499999999996, fairness violation: 0.0030631000000000005, violated group size: 0.217\n", - "iteration: 41, error: 0.44826829268292684, fairness violation: 0.0031471707317073175, violated group size: 0.283\n", - "iteration: 42, error: 0.4471190476190476, fairness violation: 0.0032272380952380955, violated group size: 0.217\n", - "iteration: 43, error: 0.44602325581395347, fairness violation: 0.0033035813953488386, violated group size: 0.283\n", - "iteration: 44, error: 0.44497727272727267, fairness violation: 0.0033764545454545453, violated group size: 0.283\n", - "iteration: 45, error: 0.4439777777777778, fairness violation: 0.003446088888888888, violated group size: 0.217\n", - "iteration: 46, error: 0.44302173913043474, fairness violation: 0.0035126956521739122, violated group size: 0.217\n", - "iteration: 47, error: 0.44210638297872346, fairness violation: 0.0035764680851063826, violated group size: 0.217\n", - "iteration: 48, error: 0.4412291666666666, fairness violation: 0.003637583333333332, violated group size: 0.217\n", - "iteration: 49, error: 0.4403877551020407, fairness violation: 0.0036962040816326523, violated group size: 0.217\n", - "iteration: 50, error: 
0.4395600000000001, fairness violation: 0.0037524800000000003, violated group size: 0.217\n", - "iteration: 51, error: 0.43876470588235295, fairness violation: 0.0038065490196078425, violated group size: 0.217\n", - "iteration: 52, error: 0.438, fairness violation: 0.003858538461538461, violated group size: 0.283\n", - "iteration: 53, error: 0.4372641509433963, fairness violation: 0.003908566037735848, violated group size: 0.217\n", - "iteration: 54, error: 0.4365555555555556, fairness violation: 0.003956740740740741, violated group size: 0.283\n", - "iteration: 55, error: 0.4358181818181819, fairness violation: 0.004003163636363636, violated group size: 0.217\n", - "iteration: 56, error: 0.4351071428571429, fairness violation: 0.004047928571428571, violated group size: 0.217\n", - "iteration: 57, error: 0.4344736842105262, fairness violation: 0.004091122807017543, violated group size: 0.217\n", - "iteration: 58, error: 0.43381034482758624, fairness violation: 0.004132827586206895, violated group size: 0.217\n", - "iteration: 59, error: 0.4331694915254237, fairness violation: 0.0041731186440677965, violated group size: 0.283\n", - "iteration: 60, error: 0.43254999999999993, fairness violation: 0.004212066666666666, violated group size: 0.217\n", - "iteration: 61, error: 0.4319508196721312, fairness violation: 0.004249737704918031, violated group size: 0.217\n", - "iteration: 62, error: 0.4313709677419356, fairness violation: 0.004286193548387096, violated group size: 0.217\n", - "iteration: 63, error: 0.43080952380952386, fairness violation: 0.004321492063492062, violated group size: 0.283\n", - "iteration: 64, error: 0.430265625, fairness violation: 0.004355687499999999, violated group size: 0.283\n", - "iteration: 65, error: 0.4297384615384615, fairness violation: 0.004388830769230769, violated group size: 0.283\n", - "iteration: 66, error: 0.42922727272727274, fairness violation: 0.004420969696969697, violated group size: 0.217\n", - "iteration: 67, error: 
0.42873134328358203, fairness violation: 0.004452149253731343, violated group size: 0.217\n", - "iteration: 68, error: 0.42824999999999996, fairness violation: 0.0044824117647058815, violated group size: 0.283\n", - "iteration: 69, error: 0.42778260869565227, fairness violation: 0.004511797101449274, violated group size: 0.217\n", - "iteration: 70, error: 0.42732857142857145, fairness violation: 0.004540342857142856, violated group size: 0.283\n", - "iteration: 71, error: 0.42688732394366197, fairness violation: 0.004568084507042252, violated group size: 0.217\n", - "iteration: 72, error: 0.4264583333333332, fairness violation: 0.004595055555555555, violated group size: 0.283\n", - "iteration: 73, error: 0.42604109589041106, fairness violation: 0.004621287671232876, violated group size: 0.217\n", - "iteration: 74, error: 0.4256351351351351, fairness violation: 0.0046468108108108095, violated group size: 0.283\n", - "iteration: 75, error: 0.42524, fairness violation: 0.004671653333333331, violated group size: 0.217\n", - "iteration: 76, error: 0.4248552631578947, fairness violation: 0.004695842105263155, violated group size: 0.217\n", - "iteration: 77, error: 0.42448051948051946, fairness violation: 0.004719402597402596, violated group size: 0.217\n", - "iteration: 78, error: 0.4239871794871795, fairness violation: 0.00475905128205128, violated group size: 0.217\n", - "iteration: 79, error: 0.42363291139240505, fairness violation: 0.004781215189873418, violated group size: 0.283\n", - "iteration: 80, error: 0.42328750000000015, fairness violation: 0.004802824999999999, violated group size: 0.283\n" - ] + "cell_type": "markdown", + "metadata": { + }, + "source": [ + "[![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/Trusted-AI/AIF360/blob/master/examples/demo_gerryfair.ipynb)\n" + ] }, { - "name": "stdout", - "output_type": "stream", - "text": [ - "iteration: 81, error: 0.4229506172839506, fairness 
violation: 0.004823901234567901, violated group size: 0.283\n", - "iteration: 82, error: 0.4226219512195123, fairness violation: 0.004844463414634145, violated group size: 0.217\n", - "iteration: 83, error: 0.4221807228915662, fairness violation: 0.004880216867469879, violated group size: 0.217\n", - "iteration: 84, error: 0.42175, fairness violation: 0.004915119047619047, violated group size: 0.217\n", - "iteration: 85, error: 0.4214470588235294, fairness violation: 0.004933882352941174, violated group size: 0.217\n", - "iteration: 86, error: 0.4210348837209302, fairness violation: 0.004967348837209301, violated group size: 0.217\n", - "iteration: 87, error: 0.420632183908046, fairness violation: 0.005000045977011494, violated group size: 0.283\n", - "iteration: 88, error: 0.42035227272727277, fairness violation: 0.0050172045454545434, violated group size: 0.217\n", - "iteration: 89, error: 0.4200786516853933, fairness violation: 0.005033977528089887, violated group size: 0.217\n", - "iteration: 90, error: 0.4198111111111112, fairness violation: 0.005050377777777776, violated group size: 0.283\n", - "iteration: 91, error: 0.4195824175824176, fairness violation: 0.0050664175824175805, violated group size: 0.217\n", - "iteration: 92, error: 0.4193695652173913, fairness violation: 0.005082108695652173, violated group size: 0.217\n", - "iteration: 93, error: 0.41916129032258065, fairness violation: 0.005097462365591397, violated group size: 0.217\n", - "iteration: 94, error: 0.41895744680851066, fairness violation: 0.005112489361702126, violated group size: 0.217\n", - "iteration: 95, error: 0.41875789473684216, fairness violation: 0.005127199999999998, violated group size: 0.217\n", - "iteration: 96, error: 0.41856250000000006, fairness violation: 0.005141604166666665, violated group size: 0.283\n", - "iteration: 97, error: 0.418979381443299, fairness violation: 0.005106494845360823, violated group size: 0.217\n", - "iteration: 98, error: 0.41938775510204085, 
fairness violation: 0.005072102040816325, violated group size: 0.217\n", - "iteration: 99, error: 0.4197878787878788, fairness violation: 0.0050384040404040376, violated group size: 0.217\n", - "iteration: 100, error: 0.42018000000000005, fairness violation: 0.0050053799999999985, violated group size: 0.217\n", - "iteration: 101, error: 0.42056435643564366, fairness violation: 0.004973009900990098, violated group size: 0.217\n", - "iteration: 102, error: 0.42094117647058826, fairness violation: 0.00494127450980392, violated group size: 0.217\n", - "iteration: 103, error: 0.4213106796116506, fairness violation: 0.004910155339805824, violated group size: 0.217\n", - "iteration: 104, error: 0.4216730769230769, fairness violation: 0.004879634615384614, violated group size: 0.217\n", - "iteration: 105, error: 0.4220285714285715, fairness violation: 0.004849695238095237, violated group size: 0.217\n", - "iteration: 106, error: 0.4223773584905662, fairness violation: 0.004820320754716981, violated group size: 0.283\n", - "iteration: 107, error: 0.42271962616822434, fairness violation: 0.004791495327102803, violated group size: 0.217\n", - "iteration: 108, error: 0.4230555555555556, fairness violation: 0.0047632037037037035, violated group size: 0.217\n", - "iteration: 109, error: 0.4233853211009175, fairness violation: 0.00473543119266055, violated group size: 0.217\n", - "iteration: 110, error: 0.4237090909090908, fairness violation: 0.004708163636363636, violated group size: 0.217\n", - "iteration: 111, error: 0.424027027027027, fairness violation: 0.004681387387387387, violated group size: 0.283\n", - "iteration: 112, error: 0.42433928571428586, fairness violation: 0.004655089285714286, violated group size: 0.283\n", - "iteration: 113, error: 0.4241238938053097, fairness violation: 0.004671504424778761, violated group size: 0.217\n", - "iteration: 114, error: 0.42442982456140343, fairness violation: 0.004645754385964912, violated group size: 0.283\n", - "iteration: 
115, error: 0.42473043478260875, fairness violation: 0.0046204521739130425, violated group size: 0.283\n", - "iteration: 116, error: 0.42502586206896553, fairness violation: 0.0045955862068965524, violated group size: 0.283\n", - "iteration: 117, error: 0.42481196581196584, fairness violation: 0.004611948717948717, violated group size: 0.217\n", - "iteration: 118, error: 0.4251016949152542, fairness violation: 0.004587576271186439, violated group size: 0.217\n", - "iteration: 119, error: 0.42489075630252104, fairness violation: 0.004603731092436974, violated group size: 0.217\n", - "iteration: 120, error: 0.4251750000000001, fairness violation: 0.0045798333333333325, violated group size: 0.217\n", - "iteration: 121, error: 0.4249669421487604, fairness violation: 0.004595785123966942, violated group size: 0.283\n", - "iteration: 122, error: 0.4247622950819671, fairness violation: 0.0046114754098360656, violated group size: 0.217\n", - "iteration: 123, error: 0.42456097560975614, fairness violation: 0.00462691056910569, violated group size: 0.217\n", - "iteration: 124, error: 0.42436290322580644, fairness violation: 0.004642096774193548, violated group size: 0.217\n", - "iteration: 125, error: 0.4241680000000001, fairness violation: 0.00465704, violated group size: 0.217\n", - "iteration: 126, error: 0.4239761904761905, fairness violation: 0.004671746031746031, violated group size: 0.217\n", - "iteration: 127, error: 0.42425196850393704, fairness violation: 0.004648629921259842, violated group size: 0.217\n", - "iteration: 128, error: 0.4240625, fairness violation: 0.004663171874999999, violated group size: 0.217\n", - "iteration: 129, error: 0.4238759689922481, fairness violation: 0.004677488372093024, violated group size: 0.283\n", - "iteration: 130, error: 0.42369230769230776, fairness violation: 0.004691584615384614, violated group size: 0.217\n", - "iteration: 131, error: 0.42351145038167937, fairness violation: 0.004705465648854962, violated group size: 
0.217\n", - "iteration: 132, error: 0.4233333333333333, fairness violation: 0.004719136363636364, violated group size: 0.283\n", - "iteration: 133, error: 0.423157894736842, fairness violation: 0.0047326015037594, violated group size: 0.217\n", - "iteration: 134, error: 0.4229850746268656, fairness violation: 0.004745865671641791, violated group size: 0.217\n", - "iteration: 135, error: 0.42281481481481475, fairness violation: 0.004758933333333335, violated group size: 0.283\n", - "iteration: 136, error: 0.4226470588235294, fairness violation: 0.004771808823529411, violated group size: 0.217\n", - "iteration: 137, error: 0.42248175182481745, fairness violation: 0.004784496350364964, violated group size: 0.283\n", - "iteration: 138, error: 0.42231884057971014, fairness violation: 0.004797000000000002, violated group size: 0.283\n", - "iteration: 139, error: 0.42215827338129497, fairness violation: 0.004809323741007196, violated group size: 0.283\n", - "iteration: 140, error: 0.42200000000000004, fairness violation: 0.004821471428571429, violated group size: 0.217\n", - "iteration: 141, error: 0.4218439716312057, fairness violation: 0.0048334468085106394, violated group size: 0.217\n", - "iteration: 142, error: 0.42169014084507045, fairness violation: 0.004845253521126761, violated group size: 0.283\n", - "iteration: 143, error: 0.4215384615384616, fairness violation: 0.004856895104895106, violated group size: 0.283\n", - "iteration: 144, error: 0.4213888888888888, fairness violation: 0.004868375, violated group size: 0.217\n", - "iteration: 145, error: 0.42124137931034483, fairness violation: 0.004879696551724138, violated group size: 0.217\n", - "iteration: 146, error: 0.4210958904109589, fairness violation: 0.00489086301369863, violated group size: 0.217\n", - "iteration: 147, error: 0.4209523809523809, fairness violation: 0.004901877551020409, violated group size: 0.217\n", - "iteration: 148, error: 0.42081081081081084, fairness violation: 0.004912743243243244, 
violated group size: 0.217\n", - "iteration: 149, error: 0.42067114093959734, fairness violation: 0.004923463087248323, violated group size: 0.283\n", - "iteration: 150, error: 0.4205333333333334, fairness violation: 0.004934040000000001, violated group size: 0.217\n", - "iteration: 151, error: 0.4203973509933776, fairness violation: 0.004944476821192053, violated group size: 0.217\n", - "iteration: 152, error: 0.4202631578947368, fairness violation: 0.0049547763157894754, violated group size: 0.283\n", - "iteration: 153, error: 0.4201307189542483, fairness violation: 0.00496494117647059, violated group size: 0.283\n", - "iteration: 154, error: 0.42, fairness violation: 0.004974974025974027, violated group size: 0.283\n", - "iteration: 155, error: 0.4198709677419355, fairness violation: 0.0049848774193548395, violated group size: 0.217\n", - "iteration: 156, error: 0.4197435897435898, fairness violation: 0.004994653846153847, violated group size: 0.217\n", - "iteration: 157, error: 0.4196178343949045, fairness violation: 0.0050043057324840766, violated group size: 0.217\n" - ] + "cell_type": "code", + "source": [ + "!pip install aif360" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "nTdJbsvOhAeU", + "outputId": "3da8ff56-8a28-47a3-c8e9-b751018039c6" + }, + "execution_count": 2, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "Collecting aif360\n", + " Downloading aif360-0.5.0-py3-none-any.whl (214 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m214.1/214.1 kB\u001b[0m \u001b[31m2.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hRequirement already satisfied: numpy>=1.16 in /usr/local/lib/python3.10/dist-packages (from aif360) (1.23.5)\n", + "Requirement already satisfied: scipy>=1.2.0 in /usr/local/lib/python3.10/dist-packages (from aif360) (1.11.2)\n", + "Requirement already satisfied: pandas>=0.24.0 in 
/usr/local/lib/python3.10/dist-packages (from aif360) (1.5.3)\n", + "Requirement already satisfied: scikit-learn>=1.0 in /usr/local/lib/python3.10/dist-packages (from aif360) (1.2.2)\n", + "Requirement already satisfied: matplotlib in /usr/local/lib/python3.10/dist-packages (from aif360) (3.7.1)\n", + "Requirement already satisfied: python-dateutil>=2.8.1 in /usr/local/lib/python3.10/dist-packages (from pandas>=0.24.0->aif360) (2.8.2)\n", + "Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.10/dist-packages (from pandas>=0.24.0->aif360) (2023.3.post1)\n", + "Requirement already satisfied: joblib>=1.1.1 in /usr/local/lib/python3.10/dist-packages (from scikit-learn>=1.0->aif360) (1.3.2)\n", + "Requirement already satisfied: threadpoolctl>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from scikit-learn>=1.0->aif360) (3.2.0)\n", + "Requirement already satisfied: contourpy>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib->aif360) (1.1.0)\n", + "Requirement already satisfied: cycler>=0.10 in /usr/local/lib/python3.10/dist-packages (from matplotlib->aif360) (0.11.0)\n", + "Requirement already satisfied: fonttools>=4.22.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib->aif360) (4.42.1)\n", + "Requirement already satisfied: kiwisolver>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib->aif360) (1.4.5)\n", + "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib->aif360) (23.1)\n", + "Requirement already satisfied: pillow>=6.2.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib->aif360) (9.4.0)\n", + "Requirement already satisfied: pyparsing>=2.3.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib->aif360) (3.1.1)\n", + "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.10/dist-packages (from python-dateutil>=2.8.1->pandas>=0.24.0->aif360) (1.16.0)\n", + "Installing collected packages: aif360\n", + "Successfully 
installed aif360-0.5.0\n" + ] + } + ] }, { - "name": "stdout", - "output_type": "stream", - "text": [ - "iteration: 158, error: 0.4194936708860761, fairness violation: 0.005013835443037975, violated group size: 0.217\n", - "iteration: 159, error: 0.41937106918239, fairness violation: 0.005023245283018869, violated group size: 0.283\n", - "iteration: 160, error: 0.41925000000000007, fairness violation: 0.0050325375, violated group size: 0.217\n", - "iteration: 161, error: 0.4191304347826087, fairness violation: 0.005041714285714285, violated group size: 0.217\n", - "iteration: 162, error: 0.41901234567901235, fairness violation: 0.005050777777777778, violated group size: 0.283\n", - "iteration: 163, error: 0.41889570552147243, fairness violation: 0.005059730061349694, violated group size: 0.283\n", - "iteration: 164, error: 0.4191402439024391, fairness violation: 0.005039463414634148, violated group size: 0.283\n", - "iteration: 165, error: 0.41938181818181824, fairness violation: 0.005019442424242424, violated group size: 0.217\n", - "iteration: 166, error: 0.4192650602409639, fairness violation: 0.005028421686746988, violated group size: 0.217\n", - "iteration: 167, error: 0.41950299401197605, fairness violation: 0.005008706586826348, violated group size: 0.217\n", - "iteration: 168, error: 0.41973809523809513, fairness violation: 0.004989226190476189, violated group size: 0.217\n", - "iteration: 169, error: 0.41997041420118336, fairness violation: 0.0049699763313609474, violated group size: 0.283\n", - "iteration: 170, error: 0.4202, fairness violation: 0.00495095294117647, violated group size: 0.283\n", - "iteration: 171, error: 0.4204269005847953, fairness violation: 0.004932152046783625, violated group size: 0.217\n", - "iteration: 172, error: 0.42065116279069764, fairness violation: 0.00491356976744186, violated group size: 0.217\n", - "iteration: 173, error: 0.4208728323699421, fairness violation: 0.004895202312138728, violated group size: 0.217\n", - 
"iteration: 174, error: 0.42109195402298855, fairness violation: 0.004877045977011494, violated group size: 0.217\n", - "iteration: 175, error: 0.4213085714285715, fairness violation: 0.004859097142857142, violated group size: 0.217\n", - "iteration: 176, error: 0.42152272727272727, fairness violation: 0.0048413522727272715, violated group size: 0.217\n", - "iteration: 177, error: 0.42173446327683617, fairness violation: 0.00482380790960452, violated group size: 0.217\n", - "iteration: 178, error: 0.42161235955056187, fairness violation: 0.004833280898876404, violated group size: 0.217\n", - "iteration: 179, error: 0.42182122905027924, fairness violation: 0.004815977653631285, violated group size: 0.217\n", - "iteration: 180, error: 0.4220277777777778, fairness violation: 0.004798866666666665, violated group size: 0.217\n", - "iteration: 181, error: 0.42223204419889504, fairness violation: 0.004781944751381214, violated group size: 0.283\n", - "iteration: 182, error: 0.4224340659340659, fairness violation: 0.004765208791208789, violated group size: 0.217\n", - "iteration: 183, error: 0.4226338797814208, fairness violation: 0.004748655737704917, violated group size: 0.217\n", - "iteration: 184, error: 0.4228315217391304, fairness violation: 0.004732282608695651, violated group size: 0.217\n", - "iteration: 185, error: 0.4230270270270271, fairness violation: 0.004716086486486487, violated group size: 0.217\n", - "iteration: 186, error: 0.4229032258064515, fairness violation: 0.0047257311827957, violated group size: 0.283\n", - "iteration: 187, error: 0.4230962566844919, fairness violation: 0.0047097433155080205, violated group size: 0.217\n", - "iteration: 188, error: 0.4229734042553191, fairness violation: 0.00471931914893617, violated group size: 0.283\n", - "iteration: 189, error: 0.4231640211640213, fairness violation: 0.004703534391534391, violated group size: 0.217\n", - "iteration: 190, error: 0.42304210526315794, fairness violation: 0.004713042105263158, 
violated group size: 0.217\n", - "iteration: 191, error: 0.4232303664921467, fairness violation: 0.004697455497382198, violated group size: 0.217\n", - "iteration: 192, error: 0.42310937499999995, fairness violation: 0.004706895833333333, violated group size: 0.217\n", - "iteration: 193, error: 0.42329533678756476, fairness violation: 0.004691502590673575, violated group size: 0.283\n", - "iteration: 194, error: 0.4231752577319588, fairness violation: 0.004700876288659792, violated group size: 0.217\n", - "iteration: 195, error: 0.4230564102564103, fairness violation: 0.004710153846153845, violated group size: 0.217\n", - "iteration: 196, error: 0.4229387755102041, fairness violation: 0.004719336734693878, violated group size: 0.283\n", - "iteration: 197, error: 0.4228223350253807, fairness violation: 0.004728426395939086, violated group size: 0.283\n", - "iteration: 198, error: 0.4227070707070707, fairness violation: 0.004737424242424242, violated group size: 0.217\n", - "iteration: 199, error: 0.4228894472361809, fairness violation: 0.004722341708542713, violated group size: 0.217\n", - "iteration: 200, error: 0.42277499999999996, fairness violation: 0.004731279999999999, violated group size: 0.217\n", - "iteration: 201, error: 0.4226616915422886, fairness violation: 0.004740129353233829, violated group size: 0.217\n", - "iteration: 202, error: 0.4225495049504951, fairness violation: 0.00474889108910891, violated group size: 0.217\n", - "iteration: 203, error: 0.42243842364532025, fairness violation: 0.004757566502463053, violated group size: 0.283\n", - "iteration: 204, error: 0.42232843137254905, fairness violation: 0.004766156862745097, violated group size: 0.283\n", - "iteration: 205, error: 0.422219512195122, fairness violation: 0.004774663414634145, violated group size: 0.217\n", - "iteration: 206, error: 0.422111650485437, fairness violation: 0.004783087378640775, violated group size: 0.217\n", - "iteration: 207, error: 0.4220048309178744, fairness 
violation: 0.00479142995169082, violated group size: 0.217\n", - "iteration: 208, error: 0.4218990384615385, fairness violation: 0.004799692307692306, violated group size: 0.217\n", - "iteration: 209, error: 0.42179425837320567, fairness violation: 0.004807875598086124, violated group size: 0.217\n", - "iteration: 210, error: 0.4216904761904762, fairness violation: 0.004815980952380952, violated group size: 0.217\n", - "iteration: 211, error: 0.42158767772511846, fairness violation: 0.0048240094786729856, violated group size: 0.217\n", - "iteration: 212, error: 0.42148584905660386, fairness violation: 0.004831962264150944, violated group size: 0.217\n", - "iteration: 213, error: 0.4213849765258215, fairness violation: 0.004839840375586855, violated group size: 0.283\n", - "iteration: 214, error: 0.421285046728972, fairness violation: 0.0048476448598130835, violated group size: 0.217\n", - "iteration: 215, error: 0.42118604651162794, fairness violation: 0.004855376744186045, violated group size: 0.217\n", - "iteration: 216, error: 0.4210879629629629, fairness violation: 0.004863037037037037, violated group size: 0.283\n", - "iteration: 217, error: 0.42099078341013824, fairness violation: 0.004870626728110601, violated group size: 0.283\n", - "iteration: 218, error: 0.42089449541284396, fairness violation: 0.004878146788990825, violated group size: 0.217\n", - "iteration: 219, error: 0.42079908675799094, fairness violation: 0.004885598173515983, violated group size: 0.283\n", - "iteration: 220, error: 0.4207045454545455, fairness violation: 0.004892981818181818, violated group size: 0.283\n", - "iteration: 221, error: 0.4206108597285068, fairness violation: 0.004900298642533936, violated group size: 0.283\n", - "iteration: 222, error: 0.4205180180180179, fairness violation: 0.004907549549549549, violated group size: 0.217\n", - "iteration: 223, error: 0.4204260089686098, fairness violation: 0.004914735426008968, violated group size: 0.217\n", - "iteration: 224, 
error: 0.4203348214285714, fairness violation: 0.004921857142857143, violated group size: 0.283\n", - "iteration: 225, error: 0.4202444444444444, fairness violation: 0.004928915555555555, violated group size: 0.217\n", - "iteration: 226, error: 0.42015486725663725, fairness violation: 0.004935911504424777, violated group size: 0.217\n", - "iteration: 227, error: 0.4200660792951542, fairness violation: 0.004942845814977973, violated group size: 0.217\n", - "iteration: 228, error: 0.4199780701754386, fairness violation: 0.004949719298245614, violated group size: 0.217\n", - "iteration: 229, error: 0.4198908296943231, fairness violation: 0.004956532751091703, violated group size: 0.283\n", - "iteration: 230, error: 0.419804347826087, fairness violation: 0.004963286956521739, violated group size: 0.283\n", - "iteration: 231, error: 0.4197186147186147, fairness violation: 0.004969982683982686, violated group size: 0.283\n", - "iteration: 232, error: 0.4196336206896552, fairness violation: 0.004976620689655175, violated group size: 0.283\n", - "iteration: 233, error: 0.419549356223176, fairness violation: 0.004983201716738197, violated group size: 0.283\n", - "iteration: 234, error: 0.419465811965812, fairness violation: 0.0049897264957264945, violated group size: 0.217\n" - ] + "cell_type": "code", + "execution_count": 5, + "metadata": { + "pycharm": { + "is_executing": false + }, + "id": "8MX9m3k_g9Ft" + }, + "outputs": [], + "source": [ + "%matplotlib inline\n", + "import warnings\n", + "warnings.filterwarnings(\"ignore\")\n", + "import sys\n", + "sys.path.append(\"../\")\n", + "from aif360.algorithms.inprocessing import GerryFairClassifier\n", + "from aif360.algorithms.inprocessing.gerryfair.clean import array_to_tuple\n", + "from aif360.algorithms.inprocessing.gerryfair.auditor import Auditor\n", + "from aif360.algorithms.preprocessing.optim_preproc_helpers.data_preproc_functions import load_preproc_data_adult\n", + "from sklearn import svm\n", + "from sklearn 
import tree\n", + "from sklearn.kernel_ridge import KernelRidge\n", + "from sklearn import linear_model\n", + "from aif360.metrics import BinaryLabelDatasetMetric\n", + "from IPython.display import Image\n", + "import pickle\n", + "import matplotlib.pyplot as plt" + ] }, { - "name": "stdout", - "output_type": "stream", - "text": [ - "iteration: 235, error: 0.4193829787234044, fairness violation: 0.00499619574468085, violated group size: 0.217\n", - "iteration: 236, error: 0.41930084745762713, fairness violation: 0.005002610169491525, violated group size: 0.283\n", - "iteration: 237, error: 0.4192194092827004, fairness violation: 0.005008970464135021, violated group size: 0.283\n", - "iteration: 238, error: 0.41913865546218493, fairness violation: 0.00501527731092437, violated group size: 0.283\n", - "iteration: 239, error: 0.4190585774058578, fairness violation: 0.005021531380753138, violated group size: 0.283\n", - "iteration: 240, error: 0.4189791666666667, fairness violation: 0.005027733333333333, violated group size: 0.217\n", - "iteration: 241, error: 0.41890041493775937, fairness violation: 0.005033883817427385, violated group size: 0.217\n", - "iteration: 242, error: 0.4188223140495868, fairness violation: 0.0050399834710743805, violated group size: 0.217\n", - "iteration: 243, error: 0.4187448559670781, fairness violation: 0.005046032921810699, violated group size: 0.217\n", - "iteration: 244, error: 0.41890983606557386, fairness violation: 0.005032467213114753, violated group size: 0.217\n", - "iteration: 245, error: 0.419073469387755, fairness violation: 0.005019012244897959, violated group size: 0.217\n", - "iteration: 246, error: 0.41923577235772364, fairness violation: 0.005005666666666667, violated group size: 0.283\n", - "iteration: 247, error: 0.4191578947368422, fairness violation: 0.005011757085020243, violated group size: 0.217\n", - "iteration: 248, error: 0.41908064516129034, fairness violation: 0.005017798387096774, violated group size: 
0.283\n", - "iteration: 249, error: 0.4192409638554217, fairness violation: 0.005004618473895581, violated group size: 0.217\n", - "iteration: 250, error: 0.4194000000000001, fairness violation: 0.004991544, violated group size: 0.217\n", - "iteration: 251, error: 0.4195577689243028, fairness violation: 0.004978573705179282, violated group size: 0.283\n", - "iteration: 252, error: 0.4197142857142857, fairness violation: 0.004965706349206349, violated group size: 0.217\n", - "iteration: 253, error: 0.4198695652173912, fairness violation: 0.00495294071146245, violated group size: 0.217\n", - "iteration: 254, error: 0.42002362204724414, fairness violation: 0.00494027559055118, violated group size: 0.217\n", - "iteration: 255, error: 0.4201764705882353, fairness violation: 0.004927709803921568, violated group size: 0.217\n", - "iteration: 256, error: 0.420328125, fairness violation: 0.004915242187499999, violated group size: 0.217\n", - "iteration: 257, error: 0.42047859922178993, fairness violation: 0.004902871595330739, violated group size: 0.217\n", - "iteration: 258, error: 0.42062790697674424, fairness violation: 0.004890596899224807, violated group size: 0.217\n", - "iteration: 259, error: 0.4207760617760617, fairness violation: 0.004878416988416988, violated group size: 0.283\n", - "iteration: 260, error: 0.42069615384615383, fairness violation: 0.004884692307692307, violated group size: 0.217\n", - "iteration: 261, error: 0.42061685823754785, fairness violation: 0.004890919540229886, violated group size: 0.283\n", - "iteration: 262, error: 0.42076335877862603, fairness violation: 0.004878877862595419, violated group size: 0.217\n", - "iteration: 263, error: 0.4209087452471483, fairness violation: 0.004866927756653992, violated group size: 0.217\n", - "iteration: 264, error: 0.4208295454545454, fairness violation: 0.004873151515151516, violated group size: 0.283\n", - "iteration: 265, error: 0.4209735849056603, fairness violation: 0.004861313207547171, violated 
group size: 0.283\n", - "iteration: 266, error: 0.4211165413533834, fairness violation: 0.004849563909774436, violated group size: 0.217\n", - "iteration: 267, error: 0.42125842696629223, fairness violation: 0.0048379026217228475, violated group size: 0.217\n", - "iteration: 268, error: 0.42139925373134324, fairness violation: 0.004826328358208956, violated group size: 0.283\n", - "iteration: 269, error: 0.42131970260223045, fairness violation: 0.0048325873605947955, violated group size: 0.217\n", - "iteration: 270, error: 0.42145925925925937, fairness violation: 0.00482111851851852, violated group size: 0.283\n", - "iteration: 271, error: 0.42159778597785963, fairness violation: 0.004809734317343174, violated group size: 0.217\n", - "iteration: 272, error: 0.42173529411764704, fairness violation: 0.004798433823529413, violated group size: 0.283\n", - "iteration: 273, error: 0.4216556776556777, fairness violation: 0.004804703296703296, violated group size: 0.217\n", - "iteration: 274, error: 0.42157664233576647, fairness violation: 0.00481092700729927, violated group size: 0.217\n", - "iteration: 275, error: 0.42171272727272724, fairness violation: 0.004799745454545455, violated group size: 0.217\n", - "iteration: 276, error: 0.42184782608695653, fairness violation: 0.004788644927536233, violated group size: 0.217\n", - "iteration: 277, error: 0.4219819494584837, fairness violation: 0.004777624548736462, violated group size: 0.217\n", - "iteration: 278, error: 0.42190287769784157, fairness violation: 0.004783856115107913, violated group size: 0.217\n", - "iteration: 279, error: 0.42182437275985674, fairness violation: 0.004790043010752689, violated group size: 0.217\n", - "iteration: 280, error: 0.42174642857142863, fairness violation: 0.004796185714285715, violated group size: 0.283\n", - "iteration: 281, error: 0.42166903914590753, fairness violation: 0.0048022846975088965, violated group size: 0.283\n", - "iteration: 282, error: 0.4218014184397163, fairness 
violation: 0.00479141134751773, violated group size: 0.217\n", - "iteration: 283, error: 0.42172438162544174, fairness violation: 0.0047974840989399295, violated group size: 0.217\n", - "iteration: 284, error: 0.4216478873239437, fairness violation: 0.004803514084507042, violated group size: 0.217\n", - "iteration: 285, error: 0.42157192982456126, fairness violation: 0.004809501754385964, violated group size: 0.217\n", - "iteration: 286, error: 0.4217027972027972, fairness violation: 0.004798755244755245, violated group size: 0.217\n", - "iteration: 287, error: 0.4218327526132404, fairness violation: 0.004788083623693379, violated group size: 0.283\n", - "iteration: 288, error: 0.4219618055555556, fairness violation: 0.004777486111111113, violated group size: 0.283\n", - "iteration: 289, error: 0.4218858131487888, fairness violation: 0.004783480968858131, violated group size: 0.217\n", - "iteration: 290, error: 0.4218103448275861, fairness violation: 0.004789434482758621, violated group size: 0.217\n", - "iteration: 291, error: 0.42193814432989696, fairness violation: 0.004778941580756014, violated group size: 0.283\n", - "iteration: 292, error: 0.42186301369863016, fairness violation: 0.0047848698630136985, violated group size: 0.217\n", - "iteration: 293, error: 0.4217883959044368, fairness violation: 0.004790757679180888, violated group size: 0.217\n", - "iteration: 294, error: 0.42171428571428576, fairness violation: 0.004796605442176871, violated group size: 0.217\n", - "iteration: 295, error: 0.4216406779661017, fairness violation: 0.004802413559322035, violated group size: 0.217\n", - "iteration: 296, error: 0.4215675675675675, fairness violation: 0.004808182432432432, violated group size: 0.217\n", - "iteration: 297, error: 0.4214949494949495, fairness violation: 0.00481391245791246, violated group size: 0.283\n", - "iteration: 298, error: 0.4214228187919464, fairness violation: 0.0048196040268456385, violated group size: 0.217\n", - "iteration: 299, error: 
0.42135117056856186, fairness violation: 0.0048252575250836115, violated group size: 0.217\n", - "iteration: 300, error: 0.42128, fairness violation: 0.004830873333333335, violated group size: 0.283\n", - "iteration: 301, error: 0.42120930232558146, fairness violation: 0.004836451827242525, violated group size: 0.217\n", - "iteration: 302, error: 0.42113907284768215, fairness violation: 0.004841993377483444, violated group size: 0.217\n", - "iteration: 303, error: 0.42106930693069305, fairness violation: 0.004847498349834984, violated group size: 0.217\n", - "iteration: 304, error: 0.4211940789473684, fairness violation: 0.004837263157894738, violated group size: 0.283\n", - "iteration: 305, error: 0.4211245901639345, fairness violation: 0.004842747540983607, violated group size: 0.283\n", - "iteration: 306, error: 0.4210555555555555, fairness violation: 0.004848196078431373, violated group size: 0.217\n", - "iteration: 307, error: 0.42098697068403895, fairness violation: 0.004853609120521175, violated group size: 0.283\n", - "iteration: 308, error: 0.4209188311688312, fairness violation: 0.004858987012987015, violated group size: 0.283\n", - "iteration: 309, error: 0.42085113268608415, fairness violation: 0.00486433009708738, violated group size: 0.283\n" - ] + "cell_type": "code", + "source": [ + "import os\n", + "import urllib\n", + "import aif360\n", + "\n", + "# Obtain the location where it is installed\n", + "LIB_PATH = aif360.__file__.rsplit(\"aif360\", 1)[0]\n", + "\n", + "# check if the data got download properly\n", + "def check_data_or_download(destn, files, data_source_directory):\n", + " check = all(item in os.listdir(destn) for item in files)\n", + " if check:\n", + " print(\"Adult dataset is available for us\")\n", + " else:\n", + " print(\"Some files are missing. 
Downloading now.\")\n", + " for data_file in files:\n", + " _ = urllib.request.urlretrieve(data_source_directory + data_file,\n", + " os.path.join(destn, data_file))\n", + "\n", + "# Download adult dataset\n", + "data_source_directory = \"https://archive.ics.uci.edu/ml/machine-learning-databases/adult/\"\n", + "destn = os.path.join(LIB_PATH, \"aif360\", \"data\", \"raw\", \"adult\")\n", + "files = [\"adult.data\", \"adult.test\", \"adult.names\"]\n", + "\n", + "check_data_or_download(destn, files, data_source_directory)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "R7RtdPi0hmfH", + "outputId": "190a4308-9e85-4da3-96cb-ae042eb09453" + }, + "execution_count": 4, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "Some files are missing. Downloading now.\n" + ] + } + ] }, { - "name": "stdout", - "output_type": "stream", - "text": [ - "iteration: 310, error: 0.4207838709677419, fairness violation: 0.00486963870967742, violated group size: 0.283\n", - "iteration: 311, error: 0.420717041800643, fairness violation: 0.004874913183279744, violated group size: 0.217\n", - "iteration: 312, error: 0.42065064102564104, fairness violation: 0.0048801538461538466, violated group size: 0.217\n", - "iteration: 313, error: 0.42058466453674115, fairness violation: 0.0048853610223642185, violated group size: 0.217\n", - "iteration: 314, error: 0.42051910828025474, fairness violation: 0.004890535031847135, violated group size: 0.217\n", - "iteration: 315, error: 0.4204539682539683, fairness violation: 0.004895676190476191, violated group size: 0.217\n", - "iteration: 316, error: 0.4203892405063292, fairness violation: 0.004900784810126583, violated group size: 0.217\n", - "iteration: 317, error: 0.4203249211356468, fairness violation: 0.004905861198738172, violated group size: 0.283\n", - "iteration: 318, error: 0.4202610062893082, fairness violation: 0.00491090566037736, violated group size: 0.217\n", - "iteration: 
319, error: 0.4201974921630094, fairness violation: 0.004915918495297806, violated group size: 0.217\n", - "iteration: 320, error: 0.4201343749999999, fairness violation: 0.004920900000000002, violated group size: 0.217\n", - "iteration: 321, error: 0.4200716510903427, fairness violation: 0.004925850467289721, violated group size: 0.217\n", - "iteration: 322, error: 0.4200093167701862, fairness violation: 0.0049307701863354056, violated group size: 0.283\n", - "iteration: 323, error: 0.4199473684210526, fairness violation: 0.00493565944272446, violated group size: 0.283\n", - "iteration: 324, error: 0.41988580246913576, fairness violation: 0.004940518518518519, violated group size: 0.217\n", - "iteration: 325, error: 0.41982461538461535, fairness violation: 0.004945347692307694, violated group size: 0.217\n", - "iteration: 326, error: 0.4197638036809816, fairness violation: 0.004950147239263805, violated group size: 0.283\n", - "iteration: 327, error: 0.4197033639143731, fairness violation: 0.004954917431192661, violated group size: 0.283\n", - "iteration: 328, error: 0.4196432926829268, fairness violation: 0.004959658536585366, violated group size: 0.217\n", - "iteration: 329, error: 0.41958358662613987, fairness violation: 0.004964370820668694, violated group size: 0.283\n", - "iteration: 330, error: 0.41952424242424236, fairness violation: 0.004969054545454545, violated group size: 0.217\n", - "iteration: 331, error: 0.41946525679758306, fairness violation: 0.00497370996978852, violated group size: 0.217\n", - "iteration: 332, error: 0.41940662650602417, fairness violation: 0.004978337349397591, violated group size: 0.217\n", - "iteration: 333, error: 0.4193483483483482, fairness violation: 0.004982936936936937, violated group size: 0.217\n", - "iteration: 334, error: 0.4192904191616766, fairness violation: 0.004987508982035928, violated group size: 0.217\n", - "iteration: 335, error: 0.4192328358208956, fairness violation: 0.004992053731343284, violated group 
size: 0.283\n", - "iteration: 336, error: 0.4191755952380953, fairness violation: 0.00499657142857143, violated group size: 0.283\n", - "iteration: 337, error: 0.4191186943620178, fairness violation: 0.0050010623145400595, violated group size: 0.217\n", - "iteration: 338, error: 0.41906213017751476, fairness violation: 0.005005526627218935, violated group size: 0.217\n", - "iteration: 339, error: 0.4190058997050148, fairness violation: 0.005009964601769911, violated group size: 0.217\n", - "iteration: 340, error: 0.41894999999999993, fairness violation: 0.005014376470588236, violated group size: 0.283\n", - "iteration: 341, error: 0.41889442815249267, fairness violation: 0.005018762463343108, violated group size: 0.217\n", - "iteration: 342, error: 0.41883918128654973, fairness violation: 0.005023122807017544, violated group size: 0.217\n", - "iteration: 343, error: 0.41878425655976675, fairness violation: 0.0050274577259475225, violated group size: 0.283\n", - "iteration: 344, error: 0.4187296511627907, fairness violation: 0.005031767441860465, violated group size: 0.217\n", - "iteration: 345, error: 0.4186753623188406, fairness violation: 0.005036052173913045, violated group size: 0.283\n", - "iteration: 346, error: 0.4186213872832369, fairness violation: 0.005040312138728323, violated group size: 0.217\n", - "iteration: 347, error: 0.41856772334293946, fairness violation: 0.005044547550432276, violated group size: 0.283\n", - "iteration: 348, error: 0.41851436781609197, fairness violation: 0.005048758620689655, violated group size: 0.217\n", - "iteration: 349, error: 0.418461318051576, fairness violation: 0.005052945558739255, violated group size: 0.283\n", - "iteration: 350, error: 0.4185771428571428, fairness violation: 0.005043468571428572, violated group size: 0.283\n", - "iteration: 351, error: 0.4186923076923077, fairness violation: 0.005034045584045584, violated group size: 0.217\n", - "iteration: 352, error: 0.4188068181818182, fairness violation: 
0.005024676136363637, violated group size: 0.283\n", - "iteration: 353, error: 0.4189206798866855, fairness violation: 0.005015359773371105, violated group size: 0.217\n", - "iteration: 354, error: 0.41903389830508475, fairness violation: 0.005006096045197741, violated group size: 0.283\n", - "iteration: 355, error: 0.41914647887323936, fairness violation: 0.004996884507042254, violated group size: 0.283\n", - "iteration: 356, error: 0.4192584269662922, fairness violation: 0.004987724719101122, violated group size: 0.217\n", - "iteration: 357, error: 0.41936974789915965, fairness violation: 0.0049786162464986, violated group size: 0.217\n", - "iteration: 358, error: 0.41948044692737424, fairness violation: 0.004969558659217878, violated group size: 0.217\n", - "iteration: 359, error: 0.41959052924791085, fairness violation: 0.004960551532033426, violated group size: 0.283\n", - "iteration: 360, error: 0.4195361111111111, fairness violation: 0.004964855555555557, violated group size: 0.283\n", - "iteration: 361, error: 0.4196454293628808, fairness violation: 0.004955911357340723, violated group size: 0.283\n", - "iteration: 362, error: 0.4197541436464089, fairness violation: 0.004947016574585636, violated group size: 0.217\n", - "iteration: 363, error: 0.4198622589531681, fairness violation: 0.004938170798898072, violated group size: 0.283\n", - "iteration: 364, error: 0.41996978021978026, fairness violation: 0.004929373626373626, violated group size: 0.217\n", - "iteration: 365, error: 0.42007671232876714, fairness violation: 0.004920624657534246, violated group size: 0.217\n", - "iteration: 366, error: 0.42018306010928963, fairness violation: 0.004911923497267759, violated group size: 0.217\n", - "iteration: 367, error: 0.4202888283378746, fairness violation: 0.004903269754768393, violated group size: 0.217\n", - "iteration: 368, error: 0.42039402173913043, fairness violation: 0.00489466304347826, violated group size: 0.217\n", - "iteration: 369, error: 
0.4204986449864499, fairness violation: 0.00488610298102981, violated group size: 0.283\n", - "iteration: 370, error: 0.4206027027027027, fairness violation: 0.0048775891891891885, violated group size: 0.217\n", - "iteration: 371, error: 0.4207061994609164, fairness violation: 0.004869121293800538, violated group size: 0.217\n", - "iteration: 372, error: 0.4208091397849463, fairness violation: 0.004860698924731182, violated group size: 0.217\n", - "iteration: 373, error: 0.420911528150134, fairness violation: 0.004852321715817694, violated group size: 0.217\n", - "iteration: 374, error: 0.420855614973262, fairness violation: 0.004856754010695187, violated group size: 0.217\n", - "iteration: 375, error: 0.4209573333333334, fairness violation: 0.004848432, violated group size: 0.217\n", - "iteration: 376, error: 0.42105851063829786, fairness violation: 0.004840154255319148, violated group size: 0.217\n", - "iteration: 377, error: 0.4211591511936339, fairness violation: 0.004831920424403182, violated group size: 0.217\n", - "iteration: 378, error: 0.4211031746031746, fairness violation: 0.004836359788359788, violated group size: 0.217\n", - "iteration: 379, error: 0.42120316622691284, fairness violation: 0.004828179419525066, violated group size: 0.217\n", - "iteration: 380, error: 0.42130263157894726, fairness violation: 0.004820042105263157, violated group size: 0.217\n", - "iteration: 381, error: 0.42124671916010503, fairness violation: 0.004824477690288715, violated group size: 0.283\n", - "iteration: 382, error: 0.42134554973821986, fairness violation: 0.004816392670157068, violated group size: 0.283\n", - "iteration: 383, error: 0.42144386422976504, fairness violation: 0.004808349869451696, violated group size: 0.217\n", - "iteration: 384, error: 0.42154166666666676, fairness violation: 0.004800348958333333, violated group size: 0.283\n" - ] + "cell_type": "code", + "source": [ + "# load data set\n", + "data_set = load_preproc_data_adult(sub_samp=1000, 
balance=True)\n", + "max_iterations = 500" + ], + "metadata": { + "id": "KZhYY9zVhp1i" + }, + "execution_count": 6, + "outputs": [] }, { - "name": "stdout", - "output_type": "stream", - "text": [ - "iteration: 385, error: 0.4214857142857143, fairness violation: 0.00480478961038961, violated group size: 0.217\n", - "iteration: 386, error: 0.4215829015544041, fairness violation: 0.0047968393782383415, violated group size: 0.217\n", - "iteration: 387, error: 0.42152713178294576, fairness violation: 0.004801266149870801, violated group size: 0.283\n", - "iteration: 388, error: 0.4216237113402061, fairness violation: 0.004793365979381444, violated group size: 0.283\n", - "iteration: 389, error: 0.42171979434447304, fairness violation: 0.004785506426735219, violated group size: 0.217\n", - "iteration: 390, error: 0.4218153846153847, fairness violation: 0.00477768717948718, violated group size: 0.217\n", - "iteration: 391, error: 0.4219104859335038, fairness violation: 0.004769907928388747, violated group size: 0.217\n", - "iteration: 392, error: 0.4218545918367348, fairness violation: 0.00477434693877551, violated group size: 0.217\n", - "iteration: 393, error: 0.42194910941475816, fairness violation: 0.004766615776081424, violated group size: 0.217\n", - "iteration: 394, error: 0.42204314720812186, fairness violation: 0.004758923857868021, violated group size: 0.283\n", - "iteration: 395, error: 0.4221367088607595, fairness violation: 0.00475127088607595, violated group size: 0.217\n", - "iteration: 396, error: 0.42208080808080806, fairness violation: 0.004755712121212122, violated group size: 0.283\n", - "iteration: 397, error: 0.42202518891687657, fairness violation: 0.004760130982367758, violated group size: 0.217\n", - "iteration: 398, error: 0.42196984924623115, fairness violation: 0.004764527638190955, violated group size: 0.283\n", - "iteration: 399, error: 0.42191478696741846, fairness violation: 0.004768902255639098, violated group size: 0.217\n", - "iteration: 
400, error: 0.42186, fairness violation: 0.004773255, violated group size: 0.217\n", - "iteration: 401, error: 0.4218054862842893, fairness violation: 0.004777586034912718, violated group size: 0.283\n", - "iteration: 402, error: 0.4217512437810945, fairness violation: 0.00478189552238806, violated group size: 0.217\n", - "iteration: 403, error: 0.4218436724565757, fairness violation: 0.0047743374689826305, violated group size: 0.283\n", - "iteration: 404, error: 0.42178960396039605, fairness violation: 0.004778633663366336, violated group size: 0.217\n", - "iteration: 405, error: 0.4217358024691357, fairness violation: 0.004782908641975308, violated group size: 0.217\n", - "iteration: 406, error: 0.4216822660098523, fairness violation: 0.004787162561576355, violated group size: 0.217\n", - "iteration: 407, error: 0.4216289926289926, fairness violation: 0.004791395577395577, violated group size: 0.283\n", - "iteration: 408, error: 0.421575980392157, fairness violation: 0.004795607843137254, violated group size: 0.217\n", - "iteration: 409, error: 0.4215232273838631, fairness violation: 0.004799799511002444, violated group size: 0.217\n", - "iteration: 410, error: 0.42147073170731714, fairness violation: 0.004803970731707317, violated group size: 0.283\n", - "iteration: 411, error: 0.4214184914841849, fairness violation: 0.0048081216545012165, violated group size: 0.217\n", - "iteration: 412, error: 0.4213665048543689, fairness violation: 0.004812252427184466, violated group size: 0.283\n", - "iteration: 413, error: 0.42131476997578693, fairness violation: 0.004816363196125908, violated group size: 0.217\n", - "iteration: 414, error: 0.42126328502415455, fairness violation: 0.004820454106280194, violated group size: 0.217\n", - "iteration: 415, error: 0.4212120481927711, fairness violation: 0.004824525301204821, violated group size: 0.283\n", - "iteration: 416, error: 0.42116105769230766, fairness violation: 0.004828576923076923, violated group size: 0.217\n", - 
"iteration: 417, error: 0.4211103117505996, fairness violation: 0.004832609112709832, violated group size: 0.283\n", - "iteration: 418, error: 0.42105980861244025, fairness violation: 0.004836622009569378, violated group size: 0.283\n", - "iteration: 419, error: 0.42100954653937933, fairness violation: 0.004840615751789977, violated group size: 0.217\n", - "iteration: 420, error: 0.42110000000000003, fairness violation: 0.0048332238095238084, violated group size: 0.217\n", - "iteration: 421, error: 0.42104988123515436, fairness violation: 0.004837206650831354, violated group size: 0.217\n", - "iteration: 422, error: 0.42100000000000004, fairness violation: 0.004841170616113744, violated group size: 0.217\n", - "iteration: 423, error: 0.420950354609929, fairness violation: 0.004845115839243499, violated group size: 0.217\n", - "iteration: 424, error: 0.42104009433962253, fairness violation: 0.004837783018867924, violated group size: 0.217\n", - "iteration: 425, error: 0.4209905882352941, fairness violation: 0.004841717647058822, violated group size: 0.217\n", - "iteration: 426, error: 0.42094131455399053, fairness violation: 0.004845633802816901, violated group size: 0.217\n", - "iteration: 427, error: 0.42089227166276344, fairness violation: 0.004849531615925057, violated group size: 0.217\n", - "iteration: 428, error: 0.4208434579439252, fairness violation: 0.004853411214953271, violated group size: 0.217\n", - "iteration: 429, error: 0.4207948717948717, fairness violation: 0.0048572727272727274, violated group size: 0.283\n", - "iteration: 430, error: 0.42074651162790694, fairness violation: 0.004861116279069767, violated group size: 0.217\n", - "iteration: 431, error: 0.4206983758700697, fairness violation: 0.004864941995359629, violated group size: 0.283\n", - "iteration: 432, error: 0.420650462962963, fairness violation: 0.00486875, violated group size: 0.217\n", - "iteration: 433, error: 0.42060277136258656, fairness violation: 0.0048725404157043874, violated 
group size: 0.217\n", - "iteration: 434, error: 0.42055529953917054, fairness violation: 0.0048763133640553, violated group size: 0.283\n", - "iteration: 435, error: 0.42050804597701147, fairness violation: 0.004880068965517241, violated group size: 0.217\n", - "iteration: 436, error: 0.4204610091743119, fairness violation: 0.004883807339449542, violated group size: 0.217\n", - "iteration: 437, error: 0.4204141876430207, fairness violation: 0.004887528604118992, violated group size: 0.217\n", - "iteration: 438, error: 0.42036757990867574, fairness violation: 0.004891232876712329, violated group size: 0.217\n", - "iteration: 439, error: 0.4203211845102506, fairness violation: 0.0048949202733485206, violated group size: 0.283\n", - "iteration: 440, error: 0.42027499999999995, fairness violation: 0.00489859090909091, violated group size: 0.283\n", - "iteration: 441, error: 0.42022902494331066, fairness violation: 0.004902244897959184, violated group size: 0.283\n", - "iteration: 442, error: 0.42018325791855204, fairness violation: 0.004905882352941177, violated group size: 0.217\n", - "iteration: 443, error: 0.42013769751693003, fairness violation: 0.004909503386004516, violated group size: 0.283\n", - "iteration: 444, error: 0.42009234234234244, fairness violation: 0.004913108108108108, violated group size: 0.217\n", - "iteration: 445, error: 0.420047191011236, fairness violation: 0.004916696629213483, violated group size: 0.217\n", - "iteration: 446, error: 0.42000224215246645, fairness violation: 0.004920269058295964, violated group size: 0.217\n", - "iteration: 447, error: 0.4199574944071588, fairness violation: 0.004923825503355704, violated group size: 0.217\n", - "iteration: 448, error: 0.41991294642857147, fairness violation: 0.004927366071428571, violated group size: 0.217\n", - "iteration: 449, error: 0.41986859688195993, fairness violation: 0.004930890868596881, violated group size: 0.217\n", - "iteration: 450, error: 0.41982444444444433, fairness 
violation: 0.004934399999999999, violated group size: 0.217\n", - "iteration: 451, error: 0.41978048780487814, fairness violation: 0.004937893569844789, violated group size: 0.217\n", - "iteration: 452, error: 0.41973672566371684, fairness violation: 0.004941371681415928, violated group size: 0.217\n", - "iteration: 453, error: 0.41969315673289187, fairness violation: 0.0049448344370860925, violated group size: 0.217\n", - "iteration: 454, error: 0.41964977973568285, fairness violation: 0.004948281938325991, violated group size: 0.283\n", - "iteration: 455, error: 0.41960659340659345, fairness violation: 0.004951714285714286, violated group size: 0.283\n", - "iteration: 456, error: 0.41956359649122804, fairness violation: 0.004955131578947367, violated group size: 0.217\n", - "iteration: 457, error: 0.41952078774617063, fairness violation: 0.0049585339168490145, violated group size: 0.217\n", - "iteration: 458, error: 0.41947816593886456, fairness violation: 0.004961921397379911, violated group size: 0.217\n", - "iteration: 459, error: 0.4194357298474945, fairness violation: 0.00496529411764706, violated group size: 0.283\n", - "iteration: 460, error: 0.4193934782608696, fairness violation: 0.004968652173913044, violated group size: 0.283\n", - "iteration: 461, error: 0.41935140997830805, fairness violation: 0.004971995661605205, violated group size: 0.283\n", - "iteration: 462, error: 0.41930952380952374, fairness violation: 0.0049753246753246735, violated group size: 0.217\n", - "iteration: 463, error: 0.41926781857451406, fairness violation: 0.004978639308855291, violated group size: 0.217\n" - ] + "cell_type": "markdown", + "metadata": { + "id": "MEge2s2Wg9Fu" + }, + "source": [ + "**instantiate, fit, and predict**\n", + "\n", + "\n", + "We first demonstrate how to instantiate a `GerryFairClassifier`, `train` it with respect to rich subgroup fairness, and `predict` the label of a new example. 
We remark that when we set `print_flag = True`, at each iteration of the algorithm we print the error, fairness violation, and violated group size of the most recent model. The error is the classification error of the classifier. At each round the Learner tries to find a classifier that minimizes the classification error plus a weighted sum of the fairness disparities on all the groups that the Auditor has found up until that point. By contrast, at each round the Auditor tries to find the group with the greatest rich subgroup disparity with respect to the Learner's model. We define `violated group size` as the size (as a fraction of the dataset size) of this group, and the `fairness violation` as the `violated group size` times the difference in the statistical rate (FP or FN rate) on the group vs. the whole population.\n", + "\n", + "In the example below we set `max_iterations=500`, which is an order of magnitude less than the time to convergence observed in [the rich subgroup fairness empirical paper](https://arxiv.org/abs/1808.08166), but we advise that this can be highly dataset dependent. 
Our target $\\gamma$-disparity is $\\gamma = .005$, our statistical rate is false positive rate or `FP`, and our cost-sensitive classification oracle is linear regression (more on that below).\n" + ] }, { - "name": "stdout", - "output_type": "stream", - "text": [ - "iteration: 464, error: 0.41922629310344817, fairness violation: 0.004981939655172413, violated group size: 0.217\n", - "iteration: 465, error: 0.41918494623655916, fairness violation: 0.004985225806451612, violated group size: 0.217\n", - "iteration: 466, error: 0.4191437768240344, fairness violation: 0.004988497854077254, violated group size: 0.283\n", - "iteration: 467, error: 0.41910278372591, fairness violation: 0.004991755888650964, violated group size: 0.283\n", - "iteration: 468, error: 0.4190619658119658, fairness violation: 0.004994999999999998, violated group size: 0.217\n", - "iteration: 469, error: 0.4190213219616205, fairness violation: 0.0049982302771855, violated group size: 0.217\n", - "iteration: 470, error: 0.41898085106382993, fairness violation: 0.005001446808510636, violated group size: 0.283\n", - "iteration: 471, error: 0.41894055201698516, fairness violation: 0.005004649681528661, violated group size: 0.217\n", - "iteration: 472, error: 0.41890042372881364, fairness violation: 0.005007838983050847, violated group size: 0.283\n", - "iteration: 473, error: 0.4188604651162791, fairness violation: 0.005011014799154333, violated group size: 0.217\n", - "iteration: 474, error: 0.41882067510548526, fairness violation: 0.005014177215189871, violated group size: 0.217\n", - "iteration: 475, error: 0.41878105263157905, fairness violation: 0.0050173263157894735, violated group size: 0.283\n", - "iteration: 476, error: 0.41874159663865557, fairness violation: 0.0050204621848739485, violated group size: 0.217\n", - "iteration: 477, error: 0.4188259958071279, fairness violation: 0.005013576519916141, violated group size: 0.217\n", - "iteration: 478, error: 0.41878661087866115, fairness 
violation: 0.005016707112970709, violated group size: 0.217\n", - "iteration: 479, error: 0.4188705636743216, fairness violation: 0.005009858037578285, violated group size: 0.217\n", - "iteration: 480, error: 0.41883125000000004, fairness violation: 0.005012983333333334, violated group size: 0.283\n", - "iteration: 481, error: 0.4187920997920998, fairness violation: 0.005016095634095634, violated group size: 0.283\n", - "iteration: 482, error: 0.4187531120331951, fairness violation: 0.0050191950207468874, violated group size: 0.283\n", - "iteration: 483, error: 0.4188364389233955, fairness violation: 0.00501239751552795, violated group size: 0.217\n", - "iteration: 484, error: 0.41891942148760325, fairness violation: 0.005005628099173555, violated group size: 0.283\n", - "iteration: 485, error: 0.4190020618556701, fairness violation: 0.004998886597938144, violated group size: 0.283\n", - "iteration: 486, error: 0.41896296296296304, fairness violation: 0.005001995884773661, violated group size: 0.217\n", - "iteration: 487, error: 0.4190451745379877, fairness violation: 0.004995289527720739, violated group size: 0.283\n", - "iteration: 488, error: 0.4191270491803279, fairness violation: 0.004988610655737704, violated group size: 0.283\n", - "iteration: 489, error: 0.4192085889570552, fairness violation: 0.004981959100204497, violated group size: 0.217\n", - "iteration: 490, error: 0.41916938775510204, fairness violation: 0.004985077551020407, violated group size: 0.283\n", - "iteration: 491, error: 0.4192505091649695, fairness violation: 0.004978460285132381, violated group size: 0.217\n", - "iteration: 492, error: 0.4192113821138212, fairness violation: 0.004981573170731706, violated group size: 0.217\n", - "iteration: 493, error: 0.41917241379310355, fairness violation: 0.004984673427991887, violated group size: 0.283\n", - "iteration: 494, error: 0.41913360323886634, fairness violation: 0.004987761133603237, violated group size: 0.217\n", - "iteration: 495, error: 
0.4192141414141415, fairness violation: 0.004981191919191918, violated group size: 0.217\n", - "iteration: 496, error: 0.4192943548387097, fairness violation: 0.004974649193548386, violated group size: 0.217\n", - "iteration: 497, error: 0.419374245472837, fairness violation: 0.004968132796780683, violated group size: 0.217\n", - "iteration: 498, error: 0.4194538152610441, fairness violation: 0.004961642570281124, violated group size: 0.217\n", - "iteration: 499, error: 0.41953306613226454, fairness violation: 0.0049551783567134255, violated group size: 0.217\n" - ] - } - ], - "source": [ - "C = 100\n", - "print_flag = True\n", - "gamma = .005\n", - "\n", - "\n", - "fair_model = GerryFairClassifier(C=C, printflag=print_flag, gamma=gamma, fairness_def='FP',\n", - " max_iters=max_iterations, heatmapflag=False)\n", - "\n", - "# fit method\n", - "fair_model.fit(data_set, early_termination=True)\n", - "\n", - "# predict method. If threshold in (0, 1) produces binary predictions\n", - "\n", - "dataset_yhat = fair_model.predict(data_set, threshold=False)\n", - "\n", - "\n" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "**3-d heatmaps**\n", - "\n", - "We now show to generate a 3d-heatmap of unfairness using the `generate_heatmap` method. The $X-Y$ axes in the plot represent the coefficients of the linear threshold function that defines a protected subgroup with respect to the first two sensitive attributes. Which $2$ attributes are considered sensitive can be overwritten with the `col_index` argument. The $Z$-axes is the $\\gamma$-disparity (FP) of the corresponding subgroup defined by the linear threshold function. This is important because it allows us to (1) visualize convergence as the heatmap flattens and (2) brute force check the fairness in low-dimensions without relying on a heuristic auditor. See the [the rich subgroup fairness empirical paper](https://arxiv.org/abs/1808.08166) for a discussion of these plots. 
Note that in the below plot no group has a $\\gamma$-disparity of greater than $.005$, which we would expect since the set of linear threshold functions on two attributes is a subset of the set of linear threshold functions on all protected attributes, and the final model is $\\gamma$-fair. " - ] - }, - { - "cell_type": "code", - "execution_count": 3, - "metadata": { - "pycharm": { - "is_executing": true - } - }, - "outputs": [ + "cell_type": "code", + "execution_count": 7, + "metadata": { + "pycharm": { + "is_executing": true + }, + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "qEigaAI9g9Fv", + "outputId": "5a2852d9-132a-4ed0-a0c3-7eb96686c9e8" + }, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "iteration: 1, error: 0.257, fairness violation: 0.041308000000000004, violated group size: 0.263\n", + "iteration: 2, error: 0.3785, fairness violation: 0.020654000000000002, violated group size: 0.263\n", + "iteration: 3, error: 0.419, fairness violation: 0.013769333333333342, violated group size: 0.263\n", + "iteration: 4, error: 0.43925, fairness violation: 0.010327000000000001, violated group size: 0.263\n", + "iteration: 5, error: 0.4514, fairness violation: 0.008261600000000001, violated group size: 0.237\n", + "iteration: 6, error: 0.4595000000000001, fairness violation: 0.006884666666666671, violated group size: 0.263\n", + "iteration: 7, error: 0.4652857142857143, fairness violation: 0.005901142857142857, violated group size: 0.237\n", + "iteration: 8, error: 0.469625, fairness violation: 0.005163500000000002, violated group size: 0.237\n", + "iteration: 9, error: 0.47300000000000003, fairness violation: 0.00458977777777778, violated group size: 0.237\n", + "iteration: 10, error: 0.4757000000000001, fairness violation: 0.0041308000000000004, violated group size: 0.237\n", + "iteration: 11, error: 0.47790909090909084, fairness violation: 0.0037552727272727273, violated group size: 0.263\n", + "iteration: 12, 
error: 0.47974999999999995, fairness violation: 0.0034423333333333354, violated group size: 0.263\n", + "iteration: 13, error: 0.4813076923076924, fairness violation: 0.0031775384615384643, violated group size: 0.263\n", + "iteration: 14, error: 0.48264285714285726, fairness violation: 0.0029505714285714296, violated group size: 0.237\n", + "iteration: 15, error: 0.48380000000000006, fairness violation: 0.0027538666666666674, violated group size: 0.237\n", + "iteration: 16, error: 0.4848125, fairness violation: 0.002581750000000001, violated group size: 0.237\n", + "iteration: 17, error: 0.4857058823529412, fairness violation: 0.0024298823529411775, violated group size: 0.237\n", + "iteration: 18, error: 0.4865, fairness violation: 0.00229488888888889, violated group size: 0.237\n", + "iteration: 19, error: 0.48721052631578954, fairness violation: 0.002174105263157895, violated group size: 0.237\n", + "iteration: 20, error: 0.4878499999999999, fairness violation: 0.0020654000000000015, violated group size: 0.263\n", + "iteration: 21, error: 0.4884285714285715, fairness violation: 0.001967047619047619, violated group size: 0.237\n", + "iteration: 22, error: 0.48895454545454553, fairness violation: 0.0018776363636363643, violated group size: 0.237\n", + "iteration: 23, error: 0.4894347826086957, fairness violation: 0.0017960000000000012, violated group size: 0.263\n", + "iteration: 24, error: 0.48987500000000006, fairness violation: 0.0017211666666666686, violated group size: 0.263\n", + "iteration: 25, error: 0.49028000000000016, fairness violation: 0.0016523200000000003, violated group size: 0.237\n", + "iteration: 26, error: 0.49065384615384616, fairness violation: 0.0015887692307692321, violated group size: 0.263\n", + "iteration: 27, error: 0.4910000000000001, fairness violation: 0.0015299259259259272, violated group size: 0.263\n", + "iteration: 28, error: 0.49132142857142846, fairness violation: 0.0014752857142857144, violated group size: 0.237\n", + 
"iteration: 29, error: 0.4916206896551723, fairness violation: 0.0014244137931034486, violated group size: 0.237\n", + "iteration: 30, error: 0.49190000000000006, fairness violation: 0.0013769333333333335, violated group size: 0.237\n", + "iteration: 31, error: 0.49216129032258077, fairness violation: 0.0013325161290322588, violated group size: 0.263\n", + "iteration: 32, error: 0.49240625, fairness violation: 0.0012908750000000006, violated group size: 0.237\n", + "iteration: 33, error: 0.4926363636363636, fairness violation: 0.001251757575757576, violated group size: 0.237\n", + "iteration: 34, error: 0.49285294117647066, fairness violation: 0.0012149411764705886, violated group size: 0.237\n", + "iteration: 35, error: 0.49305714285714286, fairness violation: 0.0011802285714285717, violated group size: 0.237\n", + "iteration: 36, error: 0.4932499999999999, fairness violation: 0.001147444444444445, violated group size: 0.237\n", + "iteration: 37, error: 0.49343243243243257, fairness violation: 0.0011164324324324328, violated group size: 0.237\n", + "iteration: 38, error: 0.49360526315789466, fairness violation: 0.0010870526315789476, violated group size: 0.237\n", + "iteration: 39, error: 0.4937692307692308, fairness violation: 0.001059179487179488, violated group size: 0.263\n", + "iteration: 40, error: 0.4939249999999999, fairness violation: 0.0010327000000000008, violated group size: 0.263\n", + "iteration: 41, error: 0.4940731707317074, fairness violation: 0.0010075121951219515, violated group size: 0.237\n", + "iteration: 42, error: 0.4942142857142858, fairness violation: 0.0009835238095238096, violated group size: 0.237\n", + "iteration: 43, error: 0.4943488372093023, fairness violation: 0.0009606511627906982, violated group size: 0.263\n", + "iteration: 44, error: 0.49447727272727265, fairness violation: 0.0009388181818181818, violated group size: 0.263\n", + "iteration: 45, error: 0.49460000000000004, fairness violation: 0.000917955555555556, violated 
group size: 0.263\n", + "iteration: 46, error: 0.4947173913043478, fairness violation: 0.0008980000000000004, violated group size: 0.263\n", + "iteration: 47, error: 0.49482978723404264, fairness violation: 0.0008788936170212767, violated group size: 0.263\n", + "iteration: 48, error: 0.4949374999999999, fairness violation: 0.0008605833333333339, violated group size: 0.263\n", + "iteration: 49, error: 0.49504081632653046, fairness violation: 0.0008430204081632653, violated group size: 0.237\n", + "iteration: 50, error: 0.49514, fairness violation: 0.0008261600000000004, violated group size: 0.263\n", + "iteration: 51, error: 0.49523529411764705, fairness violation: 0.0008099607843137258, violated group size: 0.263\n", + "iteration: 52, error: 0.49532692307692294, fairness violation: 0.0007943846153846153, violated group size: 0.263\n", + "iteration: 53, error: 0.4954150943396228, fairness violation: 0.0007793962264150945, violated group size: 0.263\n", + "iteration: 54, error: 0.4936111111111111, fairness violation: 0.0009580740740740742, violated group size: 0.237\n", + "iteration: 55, error: 0.49372727272727274, fairness violation: 0.0009406545454545454, violated group size: 0.263\n", + "iteration: 56, error: 0.4938392857142857, fairness violation: 0.0009238571428571433, violated group size: 0.263\n", + "iteration: 57, error: 0.49394736842105263, fairness violation: 0.0009076491228070175, violated group size: 0.237\n", + "iteration: 58, error: 0.49405172413793097, fairness violation: 0.0008920000000000001, violated group size: 0.237\n", + "iteration: 59, error: 0.49415254237288136, fairness violation: 0.0008768813559322037, violated group size: 0.263\n", + "iteration: 60, error: 0.4942499999999999, fairness violation: 0.0008622666666666666, violated group size: 0.237\n", + "iteration: 61, error: 0.49434426229508205, fairness violation: 0.0008481311475409838, violated group size: 0.237\n", + "iteration: 62, error: 0.4942741935483872, fairness violation: 
0.000834451612903226, violated group size: 0.237\n", + "iteration: 63, error: 0.4943650793650794, fairness violation: 0.0008212063492063492, violated group size: 0.263\n", + "iteration: 64, error: 0.492859375, fairness violation: 0.0009861250000000002, violated group size: 0.263\n", + "iteration: 65, error: 0.49250769230769237, fairness violation: 0.0010365846153846153, violated group size: 0.237\n", + "iteration: 66, error: 0.4923787878787878, fairness violation: 0.0010352424242424242, violated group size: 0.237\n", + "iteration: 67, error: 0.49249253731343284, fairness violation: 0.0010197910447761196, violated group size: 0.263\n", + "iteration: 68, error: 0.4926029411764706, fairness violation: 0.0010047941176470586, violated group size: 0.237\n", + "iteration: 69, error: 0.49271014492753634, fairness violation: 0.000990231884057971, violated group size: 0.237\n", + "iteration: 70, error: 0.4928142857142858, fairness violation: 0.0009760857142857143, violated group size: 0.237\n", + "iteration: 71, error: 0.491338028169014, fairness violation: 0.0011225633802816905, violated group size: 0.237\n", + "iteration: 72, error: 0.4901249999999999, fairness violation: 0.001251805555555556, violated group size: 0.237\n", + "iteration: 73, error: 0.49004109589041106, fairness violation: 0.0012476438356164388, violated group size: 0.263\n", + "iteration: 74, error: 0.48977027027027026, fairness violation: 0.0012884324324324327, violated group size: 0.237\n", + "iteration: 75, error: 0.4884266666666666, fairness violation: 0.0014166133333333335, violated group size: 0.237\n", + "iteration: 76, error: 0.4879736842105262, fairness violation: 0.0014665789473684216, violated group size: 0.263\n", + "iteration: 77, error: 0.4868831168831168, fairness violation: 0.001582961038961039, violated group size: 0.237\n", + "iteration: 78, error: 0.4856153846153846, fairness violation: 0.001696358974358975, violated group size: 0.263\n", + "iteration: 79, error: 0.484506329113924, 
fairness violation: 0.001806886075949368, violated group size: 0.263\n", + "iteration: 80, error: 0.48330000000000006, fairness violation: 0.0019265000000000005, violated group size: 0.237\n", + "iteration: 81, error: 0.4821234567901235, fairness violation: 0.002043160493827161, violated group size: 0.263\n", + "iteration: 82, error: 0.4811707317073171, fairness violation: 0.0021454146341463418, violated group size: 0.237\n", + "iteration: 83, error: 0.48024096385542164, fairness violation: 0.002245204819277109, violated group size: 0.237\n", + "iteration: 84, error: 0.4791428571428571, fairness violation: 0.002353904761904763, violated group size: 0.237\n", + "iteration: 85, error: 0.4782705882352941, fairness violation: 0.002454470588235295, violated group size: 0.237\n", + "iteration: 86, error: 0.477406976744186, fairness violation: 0.0025471860465116286, violated group size: 0.237\n", + "iteration: 87, error: 0.47637931034482767, fairness violation: 0.0026486666666666677, violated group size: 0.237\n", + "iteration: 88, error: 0.47537499999999994, fairness violation: 0.0027478409090909107, violated group size: 0.263\n", + "iteration: 89, error: 0.4743932584269664, fairness violation: 0.002844786516853933, violated group size: 0.263\n", + "iteration: 90, error: 0.4736222222222222, fairness violation: 0.002934311111111111, violated group size: 0.237\n", + "iteration: 91, error: 0.47268131868131874, fairness violation: 0.0030270769230769236, violated group size: 0.237\n", + "iteration: 92, error: 0.4717608695652174, fairness violation: 0.003117826086956522, violated group size: 0.237\n", + "iteration: 93, error: 0.4708602150537634, fairness violation: 0.0032066236559139794, violated group size: 0.263\n", + "iteration: 94, error: 0.46997872340425534, fairness violation: 0.003293531914893617, violated group size: 0.237\n", + "iteration: 95, error: 0.46911578947368426, fairness violation: 0.003378610526315791, violated group size: 0.263\n", + "iteration: 96, error: 
0.46827083333333336, fairness violation: 0.0034619166666666674, violated group size: 0.263\n", + "iteration: 97, error: 0.46744329896907216, fairness violation: 0.0035435051546391766, violated group size: 0.237\n", + "iteration: 98, error: 0.46663265306122453, fairness violation: 0.003623428571428572, violated group size: 0.237\n", + "iteration: 99, error: 0.46583838383838383, fairness violation: 0.003701737373737375, violated group size: 0.237\n", + "iteration: 100, error: 0.4650599999999999, fairness violation: 0.0037784800000000016, violated group size: 0.237\n", + "iteration: 101, error: 0.4642970297029704, fairness violation: 0.003853702970297031, violated group size: 0.237\n", + "iteration: 102, error: 0.4635490196078431, fairness violation: 0.003927450980392159, violated group size: 0.237\n", + "iteration: 103, error: 0.46281553398058256, fairness violation: 0.003999766990291263, violated group size: 0.237\n", + "iteration: 104, error: 0.4620961538461538, fairness violation: 0.00407069230769231, violated group size: 0.237\n", + "iteration: 105, error: 0.46139047619047613, fairness violation: 0.004140266666666668, violated group size: 0.237\n", + "iteration: 106, error: 0.46069811320754717, fairness violation: 0.004208528301886796, violated group size: 0.263\n", + "iteration: 107, error: 0.4595607476635515, fairness violation: 0.00434639252336449, violated group size: 0.263\n", + "iteration: 108, error: 0.4588981481481481, fairness violation: 0.004411481481481484, violated group size: 0.263\n", + "iteration: 109, error: 0.45780733944954133, fairness violation: 0.004536256880733949, violated group size: 0.263\n", + "iteration: 110, error: 0.4567272727272727, fairness violation: 0.004667381818181821, violated group size: 0.237\n", + "iteration: 111, error: 0.45610810810810815, fairness violation: 0.004727819819819823, violated group size: 0.263\n", + "iteration: 112, error: 0.4550625, fairness violation: 0.004854892857142861, violated group size: 0.237\n", + 
"iteration: 113, error: 0.45446902654867255, fairness violation: 0.004912601769911508, violated group size: 0.237\n", + "iteration: 114, error: 0.45345614035087717, fairness violation: 0.005035824561403512, violated group size: 0.237\n", + "iteration: 115, error: 0.4528869565217391, fairness violation: 0.005090956521739133, violated group size: 0.237\n", + "iteration: 116, error: 0.4523275862068965, fairness violation: 0.005145137931034486, violated group size: 0.237\n", + "iteration: 117, error: 0.45176923076923076, fairness violation: 0.0051943418803418835, violated group size: 0.237\n", + "iteration: 118, error: 0.4516271186440677, fairness violation: 0.005198525423728817, violated group size: 0.237\n", + "iteration: 119, error: 0.45189915966386557, fairness violation: 0.0051628067226890785, violated group size: 0.237\n", + "iteration: 120, error: 0.45144999999999996, fairness violation: 0.005206683333333338, violated group size: 0.237\n", + "iteration: 121, error: 0.4518512396694215, fairness violation: 0.005163652892561989, violated group size: 0.237\n", + "iteration: 122, error: 0.45224590163934414, fairness violation: 0.005121327868852463, violated group size: 0.237\n", + "iteration: 123, error: 0.4526341463414635, fairness violation: 0.005079691056910574, violated group size: 0.263\n", + "iteration: 124, error: 0.453016129032258, fairness violation: 0.005038725806451616, violated group size: 0.237\n", + "iteration: 125, error: 0.4533920000000001, fairness violation: 0.004998416000000004, violated group size: 0.237\n", + "iteration: 126, error: 0.45376190476190476, fairness violation: 0.004958746031746036, violated group size: 0.237\n", + "iteration: 127, error: 0.45412598425196843, fairness violation: 0.004919700787401579, violated group size: 0.237\n", + "iteration: 128, error: 0.454484375, fairness violation: 0.004881265625000004, violated group size: 0.263\n", + "iteration: 129, error: 0.4548372093023255, fairness violation: 0.004843426356589152, 
violated group size: 0.237\n", + "iteration: 130, error: 0.4551846153846153, fairness violation: 0.004806169230769234, violated group size: 0.237\n", + "iteration: 131, error: 0.45552671755725194, fairness violation: 0.004769480916030538, violated group size: 0.237\n", + "iteration: 132, error: 0.45544696969696963, fairness violation: 0.004776439393939399, violated group size: 0.263\n", + "iteration: 133, error: 0.45570676691729317, fairness violation: 0.004740526315789478, violated group size: 0.263\n", + "iteration: 134, error: 0.4560373134328357, fairness violation: 0.004705149253731347, violated group size: 0.263\n", + "iteration: 135, error: 0.4563629629629629, fairness violation: 0.004670296296296301, violated group size: 0.263\n", + "iteration: 136, error: 0.4566838235294117, fairness violation: 0.004635955882352945, violated group size: 0.237\n", + "iteration: 137, error: 0.45699999999999996, fairness violation: 0.004602116788321174, violated group size: 0.263\n", + "iteration: 138, error: 0.45731159420289863, fairness violation: 0.004568768115942034, violated group size: 0.263\n", + "iteration: 139, error: 0.4571007194244604, fairness violation: 0.004580230215827343, violated group size: 0.237\n", + "iteration: 140, error: 0.45740714285714285, fairness violation: 0.00454751428571429, violated group size: 0.263\n", + "iteration: 141, error: 0.4575957446808511, fairness violation: 0.004521985815602841, violated group size: 0.263\n", + "iteration: 142, error: 0.4571056338028169, fairness violation: 0.004570253521126764, violated group size: 0.237\n", + "iteration: 143, error: 0.45681118881118876, fairness violation: 0.004607902097902102, violated group size: 0.263\n", + "iteration: 144, error: 0.45699999999999996, fairness violation: 0.004582486111111115, violated group size: 0.237\n", + "iteration: 145, error: 0.4567103448275862, fairness violation: 0.004619531034482763, violated group size: 0.237\n", + "iteration: 146, error: 0.45700684931506846, fairness 
violation: 0.004587890410958908, violated group size: 0.237\n", + "iteration: 147, error: 0.45697959183673464, fairness violation: 0.0045889251700680315, violated group size: 0.237\n", + "iteration: 148, error: 0.45727027027027034, fairness violation: 0.004557918918918922, violated group size: 0.237\n", + "iteration: 149, error: 0.4575570469798658, fairness violation: 0.004527328859060408, violated group size: 0.263\n", + "iteration: 150, error: 0.45784, fairness violation: 0.004497146666666673, violated group size: 0.263\n", + "iteration: 151, error: 0.4581192052980132, fairness violation: 0.0044673642384106, violated group size: 0.263\n", + "iteration: 152, error: 0.4583947368421052, fairness violation: 0.00443797368421053, violated group size: 0.237\n", + "iteration: 153, error: 0.4585555555555555, fairness violation: 0.0044120653594771275, violated group size: 0.237\n", + "iteration: 154, error: 0.45882467532467525, fairness violation: 0.00438341558441559, violated group size: 0.263\n", + "iteration: 155, error: 0.45909032258064514, fairness violation: 0.0043551354838709715, violated group size: 0.237\n", + "iteration: 156, error: 0.4590897435897436, fairness violation: 0.004357602564102568, violated group size: 0.237\n", + "iteration: 157, error: 0.45869426751592357, fairness violation: 0.004399286624203826, violated group size: 0.263\n", + "iteration: 158, error: 0.458759493670886, fairness violation: 0.004401443037974688, violated group size: 0.263\n", + "iteration: 159, error: 0.4588301886792453, fairness violation: 0.004400591194968558, violated group size: 0.263\n", + "iteration: 160, error: 0.45845, fairness violation: 0.004438262500000003, violated group size: 0.263\n", + "iteration: 161, error: 0.45841614906832295, fairness violation: 0.004440136645962736, violated group size: 0.237\n", + "iteration: 162, error: 0.4586728395061729, fairness violation: 0.004412728395061732, violated group size: 0.263\n", + "iteration: 163, error: 0.45892638036809813, 
fairness violation: 0.004385656441717795, violated group size: 0.263\n", + "iteration: 164, error: 0.4586829268292683, fairness violation: 0.004399378048780492, violated group size: 0.237\n", + "iteration: 165, error: 0.4584969696969697, fairness violation: 0.00441006060606061, violated group size: 0.237\n", + "iteration: 166, error: 0.4584156626506024, fairness violation: 0.004417759036144582, violated group size: 0.263\n", + "iteration: 167, error: 0.4579940119760479, fairness violation: 0.004459425149700603, violated group size: 0.263\n", + "iteration: 168, error: 0.45776190476190465, fairness violation: 0.004472380952380955, violated group size: 0.237\n", + "iteration: 169, error: 0.4574023668639053, fairness violation: 0.004510426035502962, violated group size: 0.237\n", + "iteration: 170, error: 0.4570529411764706, fairness violation: 0.0045452352941176485, violated group size: 0.263\n", + "iteration: 171, error: 0.45670760233918134, fairness violation: 0.004579637426900589, violated group size: 0.263\n", + "iteration: 172, error: 0.45630813953488364, fairness violation: 0.0046191511627907, violated group size: 0.237\n", + "iteration: 173, error: 0.4559132947976877, fairness violation: 0.00465820809248555, violated group size: 0.237\n", + "iteration: 174, error: 0.45567816091954016, fairness violation: 0.004688643678160922, violated group size: 0.263\n", + "iteration: 175, error: 0.45534857142857144, fairness violation: 0.004726857142857145, violated group size: 0.237\n", + "iteration: 176, error: 0.4556022727272728, fairness violation: 0.004700000000000003, violated group size: 0.263\n", + "iteration: 177, error: 0.4552203389830508, fairness violation: 0.004732361581920906, violated group size: 0.237\n", + "iteration: 178, error: 0.45484269662921345, fairness violation: 0.004769685393258429, violated group size: 0.237\n", + "iteration: 179, error: 0.4545307262569832, fairness violation: 0.004803944134078216, violated group size: 0.263\n", + "iteration: 180, 
error: 0.45416111111111107, fairness violation: 0.004840455555555557, violated group size: 0.237\n", + "iteration: 181, error: 0.4537955801104972, fairness violation: 0.004876563535911605, violated group size: 0.263\n", + "iteration: 182, error: 0.4534340659340659, fairness violation: 0.004912274725274727, violated group size: 0.263\n", + "iteration: 183, error: 0.45343169398907107, fairness violation: 0.004916513661202187, violated group size: 0.237\n", + "iteration: 184, error: 0.45307608695652174, fairness violation: 0.004951619565217393, violated group size: 0.263\n", + "iteration: 185, error: 0.4527243243243243, fairness violation: 0.004986345945945949, violated group size: 0.263\n", + "iteration: 186, error: 0.4527311827956989, fairness violation: 0.0049875698924731204, violated group size: 0.263\n", + "iteration: 187, error: 0.4523850267379678, fairness violation: 0.005021732620320858, violated group size: 0.263\n", + "iteration: 188, error: 0.4520425531914894, fairness violation: 0.005055531914893619, violated group size: 0.263\n", + "iteration: 189, error: 0.4517089947089947, fairness violation: 0.00508646560846561, violated group size: 0.237\n", + "iteration: 190, error: 0.4515842105263158, fairness violation: 0.005092126315789474, violated group size: 0.237\n", + "iteration: 191, error: 0.4514607329842931, fairness violation: 0.005097727748691103, violated group size: 0.263\n", + "iteration: 192, error: 0.45163020833333334, fairness violation: 0.005076114583333335, violated group size: 0.263\n", + "iteration: 193, error: 0.4516373056994819, fairness violation: 0.00507437305699482, violated group size: 0.237\n", + "iteration: 194, error: 0.4518865979381443, fairness violation: 0.005048216494845362, violated group size: 0.263\n", + "iteration: 195, error: 0.45213333333333333, fairness violation: 0.005022328205128207, violated group size: 0.263\n", + "iteration: 196, error: 0.45237755102040805, fairness violation: 0.004996704081632655, violated group size: 
0.237\n", + "iteration: 197, error: 0.45261928934010154, fairness violation: 0.004971340101522845, violated group size: 0.237\n", + "iteration: 198, error: 0.4528585858585858, fairness violation: 0.0049462323232323255, violated group size: 0.237\n", + "iteration: 199, error: 0.4530954773869348, fairness violation: 0.004921376884422113, violated group size: 0.263\n", + "iteration: 200, error: 0.45333, fairness violation: 0.004896770000000002, violated group size: 0.263\n", + "iteration: 201, error: 0.4535621890547263, fairness violation: 0.004872407960199008, violated group size: 0.263\n", + "iteration: 202, error: 0.45379207920792075, fairness violation: 0.004848287128712874, violated group size: 0.263\n", + "iteration: 203, error: 0.4540197044334975, fairness violation: 0.004824403940886701, violated group size: 0.263\n", + "iteration: 204, error: 0.4542450980392157, fairness violation: 0.004800754901960786, violated group size: 0.263\n", + "iteration: 205, error: 0.4544682926829269, fairness violation: 0.004777336585365856, violated group size: 0.237\n", + "iteration: 206, error: 0.4546893203883495, fairness violation: 0.004754145631067963, violated group size: 0.263\n", + "iteration: 207, error: 0.4549082125603864, fairness violation: 0.004731178743961353, violated group size: 0.263\n", + "iteration: 208, error: 0.455125, fairness violation: 0.004708432692307694, violated group size: 0.263\n", + "iteration: 209, error: 0.4551961722488037, fairness violation: 0.004706315789473685, violated group size: 0.237\n", + "iteration: 210, error: 0.4554095238095238, fairness violation: 0.004683904761904762, violated group size: 0.237\n", + "iteration: 211, error: 0.4556208530805687, fairness violation: 0.004661706161137443, violated group size: 0.263\n", + "iteration: 212, error: 0.4558301886792453, fairness violation: 0.004639716981132077, violated group size: 0.237\n", + "iteration: 213, error: 0.45603755868544593, fairness violation: 0.004617934272300471, violated group 
size: 0.263\n", + "iteration: 214, error: 0.4557663551401869, fairness violation: 0.004645084112149534, violated group size: 0.237\n", + "iteration: 215, error: 0.45597209302325586, fairness violation: 0.004623479069767443, violated group size: 0.237\n", + "iteration: 216, error: 0.45617592592592593, fairness violation: 0.004602074074074076, violated group size: 0.263\n", + "iteration: 217, error: 0.45630414746543785, fairness violation: 0.004585235023041476, violated group size: 0.237\n", + "iteration: 218, error: 0.4559908256880733, fairness violation: 0.004612036697247707, violated group size: 0.237\n", + "iteration: 219, error: 0.45619178082191786, fairness violation: 0.004590977168949774, violated group size: 0.263\n", + "iteration: 220, error: 0.4563909090909091, fairness violation: 0.004570109090909093, violated group size: 0.237\n", + "iteration: 221, error: 0.45644796380090497, fairness violation: 0.0045708778280543, violated group size: 0.263\n", + "iteration: 222, error: 0.4565675675675675, fairness violation: 0.004552423423423426, violated group size: 0.263\n", + "iteration: 223, error: 0.45644394618834083, fairness violation: 0.004561766816143499, violated group size: 0.237\n", + "iteration: 224, error: 0.4566339285714286, fairness violation: 0.004543517857142857, violated group size: 0.237\n", + "iteration: 225, error: 0.456751111111111, fairness violation: 0.0045254311111111115, violated group size: 0.237\n", + "iteration: 226, error: 0.4569424778761062, fairness violation: 0.004505407079646018, violated group size: 0.237\n", + "iteration: 227, error: 0.45713215859030837, fairness violation: 0.0044855594713656384, violated group size: 0.237\n", + "iteration: 228, error: 0.45682894736842095, fairness violation: 0.004515780701754388, violated group size: 0.263\n", + "iteration: 229, error: 0.45701746724890835, fairness violation: 0.0044960611353711795, violated group size: 0.237\n", + "iteration: 230, error: 0.4567130434782609, fairness violation: 
0.004523913043478262, violated group size: 0.237\n", + "iteration: 231, error: 0.4566969696969697, fairness violation: 0.004528952380952382, violated group size: 0.263\n", + "iteration: 232, error: 0.4568836206896552, fairness violation: 0.004509431034482759, violated group size: 0.263\n", + "iteration: 233, error: 0.45706866952789704, fairness violation: 0.0044900772532188845, violated group size: 0.263\n", + "iteration: 234, error: 0.45705128205128204, fairness violation: 0.0044911452991453, violated group size: 0.263\n", + "iteration: 235, error: 0.4567574468085106, fairness violation: 0.00452044255319149, violated group size: 0.237\n", + "iteration: 236, error: 0.45694067796610166, fairness violation: 0.004501288135593223, violated group size: 0.263\n", + "iteration: 237, error: 0.4568902953586497, fairness violation: 0.004506295358649791, violated group size: 0.263\n", + "iteration: 238, error: 0.4566008403361344, fairness violation: 0.004535159663865547, violated group size: 0.237\n", + "iteration: 239, error: 0.4564435146443515, fairness violation: 0.00454394979079498, violated group size: 0.263\n", + "iteration: 240, error: 0.45620000000000005, fairness violation: 0.004568466666666667, violated group size: 0.237\n", + "iteration: 241, error: 0.45591701244813276, fairness violation: 0.004596713692946059, violated group size: 0.263\n", + "iteration: 242, error: 0.4558057851239669, fairness violation: 0.0046051404958677685, violated group size: 0.263\n", + "iteration: 243, error: 0.4559218106995884, fairness violation: 0.004590090534979424, violated group size: 0.263\n", + "iteration: 244, error: 0.4561024590163935, fairness violation: 0.0045712786885245904, violated group size: 0.237\n", + "iteration: 245, error: 0.455930612244898, fairness violation: 0.00459518367346939, violated group size: 0.263\n", + "iteration: 246, error: 0.4558414634146341, fairness violation: 0.004601552845528456, violated group size: 0.237\n", + "iteration: 247, error: 
0.4555668016194332, fairness violation: 0.00462897975708502, violated group size: 0.237\n", + "iteration: 248, error: 0.45541935483870977, fairness violation: 0.00463707258064516, violated group size: 0.237\n", + "iteration: 249, error: 0.45521285140562245, fairness violation: 0.004660329317269079, violated group size: 0.263\n", + "iteration: 250, error: 0.45498400000000006, fairness violation: 0.004687192, violated group size: 0.237\n", + "iteration: 251, error: 0.4547171314741036, fairness violation: 0.004713840637450199, violated group size: 0.263\n", + "iteration: 252, error: 0.4544563492063492, fairness violation: 0.004738396825396826, violated group size: 0.263\n", + "iteration: 253, error: 0.454189723320158, fairness violation: 0.004762758893280632, violated group size: 0.263\n", + "iteration: 254, error: 0.4540905511811024, fairness violation: 0.004770133858267717, violated group size: 0.263\n", + "iteration: 255, error: 0.45383529411764706, fairness violation: 0.004794180392156863, violated group size: 0.263\n", + "iteration: 256, error: 0.453640625, fairness violation: 0.0048161875, violated group size: 0.237\n", + "iteration: 257, error: 0.45363813229571986, fairness violation: 0.004815891050583657, violated group size: 0.263\n", + "iteration: 258, error: 0.45342248062015506, fairness violation: 0.004841317829457365, violated group size: 0.263\n", + "iteration: 259, error: 0.4531737451737452, fairness violation: 0.004864718146718148, violated group size: 0.263\n", + "iteration: 260, error: 0.4529615384615384, fairness violation: 0.004886115384615385, violated group size: 0.263\n", + "iteration: 261, error: 0.4527164750957854, fairness violation: 0.004909164750957853, violated group size: 0.237\n", + "iteration: 262, error: 0.45253053435114504, fairness violation: 0.004930229007633589, violated group size: 0.263\n", + "iteration: 263, error: 0.45232319391634984, fairness violation: 0.004954737642585551, violated group size: 0.237\n", + "iteration: 264, 
error: 0.45207954545454543, fairness violation: 0.0049790606060606075, violated group size: 0.263\n", + "iteration: 265, error: 0.45195471698113204, fairness violation: 0.00498531320754717, violated group size: 0.263\n", + "iteration: 266, error: 0.451751879699248, fairness violation: 0.005009338345864661, violated group size: 0.237\n", + "iteration: 267, error: 0.4517528089887641, fairness violation: 0.005010104868913857, violated group size: 0.237\n", + "iteration: 268, error: 0.45155223880597023, fairness violation: 0.005030320895522388, violated group size: 0.237\n", + "iteration: 269, error: 0.45142750929368036, fairness violation: 0.005034527881040892, violated group size: 0.237\n", + "iteration: 270, error: 0.45119259259259265, fairness violation: 0.005058014814814815, violated group size: 0.237\n", + "iteration: 271, error: 0.4509630996309963, fairness violation: 0.005079579335793357, violated group size: 0.263\n", + "iteration: 272, error: 0.45114338235294116, fairness violation: 0.005060904411764706, violated group size: 0.263\n", + "iteration: 273, error: 0.4513223443223443, fairness violation: 0.0050423663003663, violated group size: 0.237\n", + "iteration: 274, error: 0.45112773722627747, fairness violation: 0.00506202189781022, violated group size: 0.263\n", + "iteration: 275, error: 0.451069090909091, fairness violation: 0.005064298181818182, violated group size: 0.263\n", + "iteration: 276, error: 0.45124637681159424, fairness violation: 0.00504594927536232, violated group size: 0.263\n", + "iteration: 277, error: 0.45136462093862817, fairness violation: 0.005031155234657041, violated group size: 0.263\n", + "iteration: 278, error: 0.45153956834532366, fairness violation: 0.005013057553956834, violated group size: 0.237\n", + "iteration: 279, error: 0.4517132616487456, fairness violation: 0.0049950896057347665, violated group size: 0.263\n", + "iteration: 280, error: 0.45188571428571433, fairness violation: 0.004977250000000001, violated group size: 
0.263\n", + "iteration: 281, error: 0.4520569395017794, fairness violation: 0.004959537366548043, violated group size: 0.263\n", + "iteration: 282, error: 0.45222695035460997, fairness violation: 0.004941950354609928, violated group size: 0.237\n", + "iteration: 283, error: 0.45239575971731455, fairness violation: 0.0049244876325088335, violated group size: 0.237\n", + "iteration: 284, error: 0.45256338028169013, fairness violation: 0.004907147887323943, violated group size: 0.263\n", + "iteration: 285, error: 0.4527298245614035, fairness violation: 0.004889929824561404, violated group size: 0.263\n", + "iteration: 286, error: 0.45289510489510487, fairness violation: 0.004872832167832167, violated group size: 0.237\n", + "iteration: 287, error: 0.4530592334494773, fairness violation: 0.004855853658536585, violated group size: 0.237\n", + "iteration: 288, error: 0.4532222222222223, fairness violation: 0.004838993055555554, violated group size: 0.237\n", + "iteration: 289, error: 0.45338408304498273, fairness violation: 0.004822249134948096, violated group size: 0.237\n", + "iteration: 290, error: 0.45332413793103443, fairness violation: 0.004826868965517241, violated group size: 0.237\n", + "iteration: 291, error: 0.45348453608247424, fairness violation: 0.00481028178694158, violated group size: 0.263\n", + "iteration: 292, error: 0.45364383561643834, fairness violation: 0.004793808219178081, violated group size: 0.237\n", + "iteration: 293, error: 0.45380204778156996, fairness violation: 0.0047774470989761075, violated group size: 0.263\n", + "iteration: 294, error: 0.45395918367346944, fairness violation: 0.004761197278911563, violated group size: 0.263\n", + "iteration: 295, error: 0.4541152542372881, fairness violation: 0.004745057627118644, violated group size: 0.263\n", + "iteration: 296, error: 0.4542702702702703, fairness violation: 0.0047290270270270275, violated group size: 0.263\n", + "iteration: 297, error: 0.45442424242424245, fairness violation: 
0.004713104377104377, violated group size: 0.263\n", + "iteration: 298, error: 0.4545771812080538, fairness violation: 0.004697288590604027, violated group size: 0.263\n", + "iteration: 299, error: 0.45472909698996655, fairness violation: 0.004681578595317724, violated group size: 0.237\n", + "iteration: 300, error: 0.45488, fairness violation: 0.0046659733333333335, violated group size: 0.263\n", + "iteration: 301, error: 0.45502990033222596, fairness violation: 0.004650471760797341, violated group size: 0.263\n", + "iteration: 302, error: 0.4551788079470199, fairness violation: 0.004635072847682119, violated group size: 0.263\n", + "iteration: 303, error: 0.4553267326732674, fairness violation: 0.004619775577557755, violated group size: 0.263\n", + "iteration: 304, error: 0.45547368421052636, fairness violation: 0.004604578947368419, violated group size: 0.237\n", + "iteration: 305, error: 0.4556196721311475, fairness violation: 0.004589481967213113, violated group size: 0.237\n", + "iteration: 306, error: 0.4556633986928105, fairness violation: 0.004589973856209149, violated group size: 0.237\n", + "iteration: 307, error: 0.4557524429967426, fairness violation: 0.004576566775244298, violated group size: 0.237\n", + "iteration: 308, error: 0.45589610389610397, fairness violation: 0.004561707792207791, violated group size: 0.237\n", + "iteration: 309, error: 0.4559838187702266, fairness violation: 0.004548478964401294, violated group size: 0.263\n", + "iteration: 310, error: 0.45607096774193545, fairness violation: 0.004535335483870968, violated group size: 0.263\n", + "iteration: 311, error: 0.4560353697749196, fairness violation: 0.004539041800643086, violated group size: 0.237\n", + "iteration: 312, error: 0.45617628205128213, fairness violation: 0.004524493589743589, violated group size: 0.263\n", + "iteration: 313, error: 0.45631629392971246, fairness violation: 0.004510038338658147, violated group size: 0.263\n", + "iteration: 314, error: 0.45628025477707, 
fairness violation: 0.004513789808917198, violated group size: 0.263\n", + "iteration: 315, error: 0.4564190476190476, fairness violation: 0.004499460317460317, violated group size: 0.263\n", + "iteration: 316, error: 0.45650632911392414, fairness violation: 0.004488221518987341, violated group size: 0.237\n", + "iteration: 317, error: 0.45664353312302836, fairness violation: 0.004474063091482649, violated group size: 0.237\n", + "iteration: 318, error: 0.4567295597484277, fairness violation: 0.004462974842767294, violated group size: 0.237\n", + "iteration: 319, error: 0.4568652037617556, fairness violation: 0.004448984326018807, violated group size: 0.237\n", + "iteration: 320, error: 0.45699999999999996, fairness violation: 0.00443508125, violated group size: 0.263\n", + "iteration: 321, error: 0.4571339563862929, fairness violation: 0.0044212647975077875, violated group size: 0.263\n", + "iteration: 322, error: 0.4572670807453416, fairness violation: 0.004407534161490681, violated group size: 0.237\n", + "iteration: 323, error: 0.4573993808049535, fairness violation: 0.004393888544891641, violated group size: 0.263\n", + "iteration: 324, error: 0.4575308641975308, fairness violation: 0.004380327160493826, violated group size: 0.237\n", + "iteration: 325, error: 0.45751692307692304, fairness violation: 0.00438435076923077, violated group size: 0.263\n", + "iteration: 326, error: 0.4576472392638037, fairness violation: 0.0043709018404907984, violated group size: 0.263\n", + "iteration: 327, error: 0.45751376146788997, fairness violation: 0.0043894250764525975, violated group size: 0.237\n", + "iteration: 328, error: 0.4576432926829267, fairness violation: 0.004376042682926829, violated group size: 0.237\n", + "iteration: 329, error: 0.4577203647416414, fairness violation: 0.004364182370820668, violated group size: 0.237\n", + "iteration: 330, error: 0.45753939393939397, fairness violation: 0.004382557575757575, violated group size: 0.237\n", + "iteration: 331, 
error: 0.45757401812688814, fairness violation: 0.004383637462235649, violated group size: 0.237\n", + "iteration: 332, error: 0.4575602409638555, fairness violation: 0.004387566265060242, violated group size: 0.263\n", + "iteration: 333, error: 0.4573513513513513, fairness violation: 0.004408552552552551, violated group size: 0.237\n", + "iteration: 334, error: 0.4571766467065869, fairness violation: 0.004427994011976048, violated group size: 0.237\n", + "iteration: 335, error: 0.4570179104477612, fairness violation: 0.00444590447761194, violated group size: 0.263\n", + "iteration: 336, error: 0.4568928571428572, fairness violation: 0.00446229761904762, violated group size: 0.263\n", + "iteration: 337, error: 0.45668842729970327, fairness violation: 0.004482813056379821, violated group size: 0.263\n", + "iteration: 338, error: 0.4568165680473372, fairness violation: 0.004469550295857987, violated group size: 0.237\n", + "iteration: 339, error: 0.4569439528023599, fairness violation: 0.004456365781710914, violated group size: 0.263\n", + "iteration: 340, error: 0.45683235294117647, fairness violation: 0.004462776470588236, violated group size: 0.263\n", + "iteration: 341, error: 0.4569589442815249, fairness violation: 0.0044496891495601175, violated group size: 0.263\n", + "iteration: 342, error: 0.4569970760233918, fairness violation: 0.004449152046783626, violated group size: 0.263\n", + "iteration: 343, error: 0.45712244897959176, fairness violation: 0.004436180758017492, violated group size: 0.263\n", + "iteration: 344, error: 0.45721802325581407, fairness violation: 0.004423284883720929, violated group size: 0.237\n", + "iteration: 345, error: 0.45734202898550724, fairness violation: 0.0044104637681159405, violated group size: 0.237\n", + "iteration: 346, error: 0.4573294797687861, fairness violation: 0.004411416184971097, violated group size: 0.263\n", + "iteration: 347, error: 0.45726512968299704, fairness violation: 0.004415095100864553, violated group 
size: 0.263\n", + "iteration: 348, error: 0.4570948275862069, fairness violation: 0.0044323735632183885, violated group size: 0.237\n", + "iteration: 349, error: 0.45721776504298, fairness violation: 0.004422389684813753, violated group size: 0.263\n", + "iteration: 350, error: 0.4570685714285714, fairness violation: 0.004438194285714283, violated group size: 0.237\n", + "iteration: 351, error: 0.4568717948717949, fairness violation: 0.004457960113960113, violated group size: 0.237\n", + "iteration: 352, error: 0.45676136363636366, fairness violation: 0.004462801136363637, violated group size: 0.263\n", + "iteration: 353, error: 0.4565665722379603, fairness violation: 0.004482385269121813, violated group size: 0.263\n", + "iteration: 354, error: 0.45668926553672323, fairness violation: 0.0044697231638418065, violated group size: 0.263\n", + "iteration: 355, error: 0.45673521126760563, fairness violation: 0.004461138028169011, violated group size: 0.237\n", + "iteration: 356, error: 0.4565421348314607, fairness violation: 0.0044805617977528075, violated group size: 0.237\n", + "iteration: 357, error: 0.45653221288515405, fairness violation: 0.004481288515406163, violated group size: 0.263\n", + "iteration: 358, error: 0.45660893854748597, fairness violation: 0.004471418994413408, violated group size: 0.263\n", + "iteration: 359, error: 0.45641782729805014, fairness violation: 0.004490651810584957, violated group size: 0.237\n", + "iteration: 360, error: 0.45638611111111105, fairness violation: 0.004493977777777778, violated group size: 0.263\n", + "iteration: 361, error: 0.4563102493074792, fairness violation: 0.00449991135734072, violated group size: 0.263\n", + "iteration: 362, error: 0.456232044198895, fairness violation: 0.004504502762430939, violated group size: 0.263\n", + "iteration: 363, error: 0.45615426997245184, fairness violation: 0.004509068870523414, violated group size: 0.263\n", + "iteration: 364, error: 0.455967032967033, fairness violation: 
0.004527934065934064, violated group size: 0.237\n", + "iteration: 365, error: 0.4557808219178083, fairness violation: 0.0045466958904109575, violated group size: 0.263\n", + "iteration: 366, error: 0.45590163934426237, fairness violation: 0.004534273224043714, violated group size: 0.237\n", + "iteration: 367, error: 0.4558937329700272, fairness violation: 0.004534833787465939, violated group size: 0.263\n", + "iteration: 368, error: 0.4557092391304348, fairness violation: 0.004553423913043478, violated group size: 0.263\n", + "iteration: 369, error: 0.4558292682926829, fairness violation: 0.004541084010840108, violated group size: 0.237\n", + "iteration: 370, error: 0.455672972972973, fairness violation: 0.004556994594594594, violated group size: 0.237\n", + "iteration: 371, error: 0.4555202156334232, fairness violation: 0.004574097035040431, violated group size: 0.263\n", + "iteration: 372, error: 0.4553387096774194, fairness violation: 0.0045923817204301075, violated group size: 0.263\n", + "iteration: 373, error: 0.45537801608579087, fairness violation: 0.004591506702412869, violated group size: 0.263\n", + "iteration: 374, error: 0.4553743315508022, fairness violation: 0.004593171122994652, violated group size: 0.237\n", + "iteration: 375, error: 0.45530133333333334, fairness violation: 0.004597354666666665, violated group size: 0.237\n", + "iteration: 376, error: 0.45514893617021285, fairness violation: 0.004615382978723405, violated group size: 0.263\n", + "iteration: 377, error: 0.455, fairness violation: 0.004632058355437666, violated group size: 0.263\n", + "iteration: 378, error: 0.4548492063492063, fairness violation: 0.00464989947089947, violated group size: 0.237\n", + "iteration: 379, error: 0.4546728232189973, fairness violation: 0.004667646437994721, violated group size: 0.263\n", + "iteration: 380, error: 0.4545236842105263, fairness violation: 0.004682805263157895, violated group size: 0.263\n", + "iteration: 381, error: 0.45437270341207353, 
fairness violation: 0.004699128608923883, violated group size: 0.237\n", + "iteration: 382, error: 0.45419895287958123, fairness violation: 0.004716607329842932, violated group size: 0.237\n", + "iteration: 383, error: 0.4540261096605745, fairness violation: 0.004733994778067884, violated group size: 0.237\n", + "iteration: 384, error: 0.45385416666666667, fairness violation: 0.004751291666666666, violated group size: 0.237\n", + "iteration: 385, error: 0.4537116883116883, fairness violation: 0.004767267532467533, violated group size: 0.263\n", + "iteration: 386, error: 0.4535414507772021, fairness violation: 0.00478438860103627, violated group size: 0.263\n", + "iteration: 387, error: 0.45337209302325576, fairness violation: 0.004801421188630492, violated group size: 0.263\n", + "iteration: 388, error: 0.4532036082474227, fairness violation: 0.004818365979381443, violated group size: 0.263\n", + "iteration: 389, error: 0.4530359897172237, fairness violation: 0.004835223650385605, violated group size: 0.237\n", + "iteration: 390, error: 0.45286923076923075, fairness violation: 0.004851994871794871, violated group size: 0.237\n", + "iteration: 391, error: 0.45272890025575446, fairness violation: 0.004868680306905372, violated group size: 0.263\n", + "iteration: 392, error: 0.45266836734693877, fairness violation: 0.0048731887755102034, violated group size: 0.237\n", + "iteration: 393, error: 0.45257251908396945, fairness violation: 0.004886117048346056, violated group size: 0.237\n", + "iteration: 394, error: 0.45240862944162424, fairness violation: 0.004900182741116752, violated group size: 0.263\n", + "iteration: 395, error: 0.45226835443037977, fairness violation: 0.004915377215189875, violated group size: 0.263\n", + "iteration: 396, error: 0.45210606060606057, fairness violation: 0.00493169191919192, violated group size: 0.237\n", + "iteration: 397, error: 0.45194458438287155, fairness violation: 0.004947924433249372, violated group size: 0.263\n", + 
"iteration: 398, error: 0.45178391959799, fairness violation: 0.004964075376884422, violated group size: 0.237\n", + "iteration: 399, error: 0.4517017543859648, fairness violation: 0.0049682656641604015, violated group size: 0.237\n", + "iteration: 400, error: 0.4515699999999999, fairness violation: 0.004983100000000003, violated group size: 0.263\n", + "iteration: 401, error: 0.4514139650872818, fairness violation: 0.004997860349127184, violated group size: 0.263\n", + "iteration: 402, error: 0.45125621890547263, fairness violation: 0.005013726368159207, violated group size: 0.263\n", + "iteration: 403, error: 0.45116377171215877, fairness violation: 0.005027161290322582, violated group size: 0.237\n", + "iteration: 404, error: 0.45108415841584154, fairness violation: 0.0050311435643564375, violated group size: 0.237\n", + "iteration: 405, error: 0.4509283950617283, fairness violation: 0.005046809876543212, violated group size: 0.237\n", + "iteration: 406, error: 0.4507733990147783, fairness violation: 0.005062399014778328, violated group size: 0.263\n", + "iteration: 407, error: 0.4506437346437346, fairness violation: 0.0050755823095823115, violated group size: 0.237\n", + "iteration: 408, error: 0.4504926470588236, fairness violation: 0.005089862745098043, violated group size: 0.263\n", + "iteration: 409, error: 0.45036430317848414, fairness violation: 0.005102914425427874, violated group size: 0.263\n", + "iteration: 410, error: 0.45048536585365856, fairness violation: 0.005090468292682928, violated group size: 0.237\n", + "iteration: 411, error: 0.45036009732360094, fairness violation: 0.0051046082725060855, violated group size: 0.263\n", + "iteration: 412, error: 0.4504805825242718, fairness violation: 0.005092218446601944, violated group size: 0.237\n", + "iteration: 413, error: 0.4504891041162228, fairness violation: 0.005092513317191287, violated group size: 0.263\n", + "iteration: 414, error: 0.4506086956521739, fairness violation: 0.005080212560386476, 
violated group size: 0.237\n", + "iteration: 415, error: 0.450689156626506, fairness violation: 0.005070255421686748, violated group size: 0.237\n", + "iteration: 416, error: 0.4505624999999999, fairness violation: 0.005083134615384617, violated group size: 0.263\n", + "iteration: 417, error: 0.4506091127098321, fairness violation: 0.005081175059952039, violated group size: 0.237\n", + "iteration: 418, error: 0.45072727272727275, fairness violation: 0.005069019138755984, violated group size: 0.237\n", + "iteration: 419, error: 0.4508448687350835, fairness violation: 0.00505692124105012, violated group size: 0.237\n", + "iteration: 420, error: 0.4509619047619047, fairness violation: 0.0050448809523809535, violated group size: 0.263\n", + "iteration: 421, error: 0.45107838479809986, fairness violation: 0.0050328978622327806, violated group size: 0.237\n", + "iteration: 422, error: 0.45119431279620853, fairness violation: 0.005020971563981045, violated group size: 0.263\n", + "iteration: 423, error: 0.4513096926713947, fairness violation: 0.005009101654846337, violated group size: 0.237\n", + "iteration: 424, error: 0.45142452830188673, fairness violation: 0.0049972877358490575, violated group size: 0.237\n", + "iteration: 425, error: 0.45153882352941177, fairness violation: 0.004985529411764709, violated group size: 0.263\n", + "iteration: 426, error: 0.45165258215962434, fairness violation: 0.0049738262910798145, violated group size: 0.263\n", + "iteration: 427, error: 0.45176580796252924, fairness violation: 0.004962177985948481, violated group size: 0.263\n", + "iteration: 428, error: 0.4518785046728972, fairness violation: 0.004950584112149535, violated group size: 0.263\n", + "iteration: 429, error: 0.451990675990676, fairness violation: 0.004939044289044292, violated group size: 0.263\n", + "iteration: 430, error: 0.4521023255813953, fairness violation: 0.004927558139534886, violated group size: 0.263\n", + "iteration: 431, error: 0.4522134570765662, fairness 
violation: 0.004916125290023203, violated group size: 0.237\n", + "iteration: 432, error: 0.45232407407407416, fairness violation: 0.004904745370370373, violated group size: 0.263\n", + "iteration: 433, error: 0.4524341801385681, fairness violation: 0.004893418013856815, violated group size: 0.237\n", + "iteration: 434, error: 0.4525437788018434, fairness violation: 0.004882142857142861, violated group size: 0.263\n", + "iteration: 435, error: 0.4526528735632184, fairness violation: 0.004870919540229886, violated group size: 0.237\n", + "iteration: 436, error: 0.4527614678899081, fairness violation: 0.004859747706422021, violated group size: 0.263\n", + "iteration: 437, error: 0.4528306636155607, fairness violation: 0.0048497116704805535, violated group size: 0.263\n", + "iteration: 438, error: 0.45294063926940636, fairness violation: 0.004839721461187217, violated group size: 0.237\n", + "iteration: 439, error: 0.45304783599088844, fairness violation: 0.004828697038724374, violated group size: 0.237\n", + "iteration: 440, error: 0.4531545454545455, fairness violation: 0.00481772272727273, violated group size: 0.263\n", + "iteration: 441, error: 0.4532607709750567, fairness violation: 0.004806798185941045, violated group size: 0.263\n", + "iteration: 442, error: 0.453366515837104, fairness violation: 0.004795923076923078, violated group size: 0.263\n", + "iteration: 443, error: 0.45347178329571103, fairness violation: 0.004785097065462756, violated group size: 0.263\n", + "iteration: 444, error: 0.4535765765765766, fairness violation: 0.0047743198198198205, violated group size: 0.237\n", + "iteration: 445, error: 0.4536808988764045, fairness violation: 0.004763591011235956, violated group size: 0.237\n", + "iteration: 446, error: 0.4537847533632287, fairness violation: 0.004752910313901348, violated group size: 0.263\n", + "iteration: 447, error: 0.4538881431767337, fairness violation: 0.004742277404921701, violated group size: 0.237\n", + "iteration: 448, error: 
0.4539910714285715, fairness violation: 0.004731691964285714, violated group size: 0.237\n", + "iteration: 449, error: 0.45409354120267265, fairness violation: 0.0047211536748329634, violated group size: 0.237\n", + "iteration: 450, error: 0.4541955555555555, fairness violation: 0.004710662222222223, violated group size: 0.237\n", + "iteration: 451, error: 0.4542971175166297, fairness violation: 0.004700217294900223, violated group size: 0.263\n", + "iteration: 452, error: 0.45439823008849556, fairness violation: 0.004689818584070798, violated group size: 0.263\n", + "iteration: 453, error: 0.45449889624724066, fairness violation: 0.0046794657836644596, violated group size: 0.237\n", + "iteration: 454, error: 0.4545991189427313, fairness violation: 0.00466915859030837, violated group size: 0.237\n", + "iteration: 455, error: 0.4546989010989011, fairness violation: 0.004658896703296704, violated group size: 0.263\n", + "iteration: 456, error: 0.4547982456140351, fairness violation: 0.004648679824561405, violated group size: 0.237\n", + "iteration: 457, error: 0.4548971553610503, fairness violation: 0.004638507658643327, violated group size: 0.263\n", + "iteration: 458, error: 0.45499563318777286, fairness violation: 0.0046283799126637555, violated group size: 0.237\n", + "iteration: 459, error: 0.45505882352941174, fairness violation: 0.0046203616557734225, violated group size: 0.263\n", + "iteration: 460, error: 0.4551565217391304, fairness violation: 0.004610317391304348, violated group size: 0.237\n", + "iteration: 461, error: 0.4551149674620391, fairness violation: 0.004613683297180044, violated group size: 0.237\n", + "iteration: 462, error: 0.45519047619047615, fairness violation: 0.004603696969696971, violated group size: 0.237\n", + "iteration: 463, error: 0.45528725701943845, fairness violation: 0.004593753779697626, violated group size: 0.237\n", + "iteration: 464, error: 0.4553836206896551, fairness violation: 0.004583853448275864, violated group size: 
0.263\n", + "iteration: 465, error: 0.4554795698924731, fairness violation: 0.004573995698924732, violated group size: 0.263\n", + "iteration: 466, error: 0.45553862660944205, fairness violation: 0.004565197424892706, violated group size: 0.263\n", + "iteration: 467, error: 0.4555674518201284, fairness violation: 0.004565571734475376, violated group size: 0.263\n", + "iteration: 468, error: 0.4556623931623932, fairness violation: 0.00455581623931624, violated group size: 0.237\n", + "iteration: 469, error: 0.4557569296375267, fairness violation: 0.004546102345415778, violated group size: 0.237\n", + "iteration: 470, error: 0.4557872340425532, fairness violation: 0.004545506382978723, violated group size: 0.237\n", + "iteration: 471, error: 0.45588110403397036, fairness violation: 0.004535855626326964, violated group size: 0.237\n", + "iteration: 472, error: 0.4559745762711865, fairness violation: 0.004526245762711867, violated group size: 0.263\n", + "iteration: 473, error: 0.45600422832980975, fairness violation: 0.0045256955602537, violated group size: 0.237\n", + "iteration: 474, error: 0.456097046413502, fairness violation: 0.004516147679324895, violated group size: 0.237\n", + "iteration: 475, error: 0.45618947368421053, fairness violation: 0.004506640000000003, violated group size: 0.263\n", + "iteration: 476, error: 0.4562478991596639, fairness violation: 0.0044991638655462185, violated group size: 0.237\n", + "iteration: 477, error: 0.45624109014675046, fairness violation: 0.004501656184486373, violated group size: 0.237\n", + "iteration: 478, error: 0.4563138075313808, fairness violation: 0.004493230125523012, violated group size: 0.263\n", + "iteration: 479, error: 0.45637160751565764, fairness violation: 0.004485828810020879, violated group size: 0.263\n", + "iteration: 480, error: 0.4564625000000001, fairness violation: 0.004476483333333333, violated group size: 0.237\n", + "iteration: 481, error: 0.45641787941787937, fairness violation: 
0.00447900207900208, violated group size: 0.263\n", + "iteration: 482, error: 0.45650829875518667, fairness violation: 0.004469709543568465, violated group size: 0.263\n", + "iteration: 483, error: 0.4565983436853003, fairness violation: 0.004460455486542443, violated group size: 0.263\n", + "iteration: 484, error: 0.4566880165289256, fairness violation: 0.004451239669421488, violated group size: 0.263\n", + "iteration: 485, error: 0.45677731958762885, fairness violation: 0.004442061855670102, violated group size: 0.237\n", + "iteration: 486, error: 0.45680246913580247, fairness violation: 0.004442674897119343, violated group size: 0.263\n", + "iteration: 487, error: 0.45679671457905546, fairness violation: 0.004444258726899385, violated group size: 0.263\n", + "iteration: 488, error: 0.4568852459016393, fairness violation: 0.004435151639344263, violated group size: 0.263\n", + "iteration: 489, error: 0.4569734151329243, fairness violation: 0.004426081799591004, violated group size: 0.263\n", + "iteration: 490, error: 0.4570612244897959, fairness violation: 0.004417048979591837, violated group size: 0.237\n", + "iteration: 491, error: 0.45714867617107935, fairness violation: 0.004408052953156824, violated group size: 0.263\n", + "iteration: 492, error: 0.45723780487804877, fairness violation: 0.004400056910569106, violated group size: 0.237\n", + "iteration: 493, error: 0.45732454361054764, fairness violation: 0.004391131845841786, violated group size: 0.237\n", + "iteration: 494, error: 0.45741093117408893, fairness violation: 0.0043822429149797575, violated group size: 0.237\n", + "iteration: 495, error: 0.45749696969696974, fairness violation: 0.0043733898989899, violated group size: 0.263\n", + "iteration: 496, error: 0.4574536290322581, fairness violation: 0.004376995967741938, violated group size: 0.263\n", + "iteration: 497, error: 0.4575392354124748, fairness violation: 0.004368189134808854, violated group size: 0.263\n", + "iteration: 498, error: 
0.45759036144578313, fairness violation: 0.004360369477911648, violated group size: 0.237\n", + "iteration: 499, error: 0.4575811623246493, fairness violation: 0.004363030060120242, violated group size: 0.263\n" + ] + } + ], + "source": [ + "C = 100\n", + "print_flag = True\n", + "gamma = .005\n", + "\n", + "\n", + "fair_model = GerryFairClassifier(C=C, printflag=print_flag, gamma=gamma, fairness_def='FP',\n", + " max_iters=max_iterations, heatmapflag=False)\n", + "\n", + "# fit method\n", + "fair_model.fit(data_set, early_termination=True)\n", + "\n", + "# predict method. If threshold in (0, 1) produces binary predictions\n", + "\n", + "dataset_yhat = fair_model.predict(data_set, threshold=False)\n", + "\n", + "\n" + ] + }, { - "data": { - "image/png": "\n", - "text/plain": [ - "" + "cell_type": "markdown", + "metadata": { + "id": "LrpRmOpVg9Fv" + }, + "source": [ + "**3-d heatmaps**\n", + "\n", + "We now show how to generate a 3d-heatmap of unfairness using the `generate_heatmap` method. The $X-Y$ axes in the plot represent the coefficients of the linear threshold function that defines a protected subgroup with respect to the first two sensitive attributes. Which $2$ attributes are considered sensitive can be overridden with the `col_index` argument. The $Z$-axis is the $\\gamma$-disparity (FP) of the corresponding subgroup defined by the linear threshold function. This is important because it allows us to (1) visualize convergence as the heatmap flattens and (2) brute-force check the fairness in low dimensions without relying on a heuristic auditor. See [the rich subgroup fairness empirical paper](https://arxiv.org/abs/1808.08166) for a discussion of these plots. Note that in the plot below no group has a $\\gamma$-disparity greater than $.005$, which we would expect since the set of linear threshold functions on two attributes is a subset of the set of linear threshold functions on all protected attributes, and the final model is $\\gamma$-fair." 
] - }, - "execution_count": 3, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "\n", - "# output heatmap (brute force)\n", - "# replace None with the relative path if you want to save the plot\n", - "fair_model.heatmapflag = True\n", - "fair_model.heatmap_path = 'heatmap'\n", - "fair_model.generate_heatmap(data_set, dataset_yhat.labels)\n", - "Image(filename='{}.png'.format(fair_model.heatmap_path)) \n", - "\n", - "\n", - "\n" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "**black-box auditing**\n", - "\n", - "We now show how to audit any black-box classifier with respect to rich subgroup fairness under either FP or FN rate. Note that the auditing procedure below works for any set of (soft) predictions $\\hat{y}$ and makes no assumptions about the structure of the predictor. We note that, as expected, the disparity of the group found is the same as the disparity printed out in the last iteration of the `fit` method.\n", - " " - ] - }, - { - "cell_type": "code", - "execution_count": 4, - "metadata": { - "pycharm": { - "is_executing": true - } - }, - "outputs": [ + }, { - "name": "stdout", - "output_type": "stream", - "text": [ - "0.004955178356713431\n" - ] - } - ], - "source": [ - "\n", - "\n", - "gerry_metric = BinaryLabelDatasetMetric(data_set)\n", - "gamma_disparity = gerry_metric.rich_subgroup(array_to_tuple(dataset_yhat.labels), 'FP')\n", - "print(gamma_disparity)\n" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "**pareto curves**\n", - "\n", - "The `FairFictPlay` algorithm implemented in the `fit` method converges given access to perfect oracles for solving cost-sensitive classification (CSC) problems. 
A cost-sensitive classification problem over a hypothesis class $\\mathcal{H}$ is $$\\min_{h}\\sum_{i = 1}^{n}(1-h(x_i))c_0 + h(x_i)c_1$$\n", - "By default in this package, and in the companion [empirical](https://arxiv.org/abs/1808.08166) and [theory](https://arxiv.org/pdf/1711.05144.pdf) papers, the hypothesis class of the learner and the of the subgroups are hyperplanes. The corresponding heuristic oracle for solving the CSC problem first forms two regression problems $(x_i, c_0)$ and $(x_i, c_1)$. Then in the case of hyperplanes, trains two regressions $r_i: \\mathcal{X} \\to R$ which predict the costs of classifying a given point $x$ $0,1$ respectively. Finally the binary classifier output by the oracle is defined as $\\hat{r}(x) = \\arg\\min_{j \\in \\{0,1\\}}r_j(x)$. But of course if we are interesting in different hypothesis classes for the learner, we simply need different regressors. In this package in addition to linear regression, we've added support for regression trees, kernelized ridge regression, and support vector regression. Below we trace out Pareto curves of $\\gamma$-disparity vs. error for each of these different heuristic oracles. 
" - ] - }, - { - "cell_type": "code", - "execution_count": 5, - "metadata": { - "pycharm": { - "is_executing": true - } - }, - "outputs": [ + "cell_type": "code", + "execution_count": 8, + "metadata": { + "pycharm": { + "is_executing": true + }, + "colab": { + "base_uri": "https://localhost:8080/", + "height": 497 + }, + "id": "4kKzNgmRg9Fw", + "outputId": "f8f0f0a7-babf-4a1c-f92f-d3f46f127e92" + }, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "image/png": "\n", + "text/plain": [ + "" + ] + }, + "metadata": {}, + "execution_count": 8 + } + ], + "source": [ + "\n", + "# output heatmap (brute force)\n", + "# replace None with the relative path if you want to save the plot\n", + "fair_model.heatmapflag = True\n", + "fair_model.heatmap_path = 'heatmap'\n", + "fair_model.generate_heatmap(data_set, dataset_yhat.labels)\n", + "Image(filename='{}.png'.format(fair_model.heatmap_path))\n", + "\n", + "\n", + "\n" + ] + }, { - "name": "stdout", - "output_type": "stream", - "text": [ - "Curr Predictor: Linear\n", - "Curr Predictor: SVR\n", - "Curr Predictor: Tree\n", - "Curr Predictor: Kernel\n" - ] + "cell_type": "markdown", + "metadata": { + "id": "OYsi5G4Pg9Fw" + }, + "source": [ + "**black-box auditing**\n", + "\n", + "We now show how to audit any black box classifier with respect to rich subgroup fairness under either FP or FN rate. Note that the auditing procedure below would work for any set of (soft) predictions $\\hat{y}$, and makes no assumptions about the structure of the predictor. 
We note that as expected the disparity of the group found is the same as the disparity printed out in the last iteration of the `fit` method.\n", + " " + ] }, { - "data": { - "image/png": "\n", - "text/plain": [ - "" + "cell_type": "code", + "execution_count": 9, + "metadata": { + "pycharm": { + "is_executing": true + }, + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "lBcmHN2zg9Fw", + "outputId": "a72d2611-a00a-41b8-d617-04a8aa7a58e7" + }, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "0.004363030060120244\n" + ] + } + ], + "source": [ + "\n", + "\n", + "gerry_metric = BinaryLabelDatasetMetric(data_set)\n", + "gamma_disparity = gerry_metric.rich_subgroup(array_to_tuple(dataset_yhat.labels), 'FP')\n", + "print(gamma_disparity)\n" ] - }, - "execution_count": 5, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "# set to 50 iterations for fast running of notebook - set >= 1000 when running real experiments\n", - "pareto_iters = 50\n", - "def multiple_classifiers_pareto(dataset, gamma_list=[0.002, 0.005, 0.01, 0.02, 0.05, 0.1], save_results=False, iters=pareto_iters):\n", - "\n", - " ln_predictor = linear_model.LinearRegression()\n", - " svm_predictor = svm.LinearSVR()\n", - " tree_predictor = tree.DecisionTreeRegressor(max_depth=3)\n", - " kernel_predictor = KernelRidge(alpha=1.0, gamma=1.0, kernel='rbf')\n", - " predictor_dict = {'Linear': {'predictor': ln_predictor, 'iters': iters},\n", - " 'SVR': {'predictor': svm_predictor, 'iters': iters},\n", - " 'Tree': {'predictor': tree_predictor, 'iters': iters},\n", - " 'Kernel': {'predictor': kernel_predictor, 'iters': iters}}\n", - "\n", - " results_dict = {}\n", - "\n", - " for pred in predictor_dict:\n", - " print('Curr Predictor: {}'.format(pred))\n", - " predictor = predictor_dict[pred]['predictor']\n", - " max_iters = predictor_dict[pred]['iters']\n", - " fair_clf = GerryFairClassifier(C=100, printflag=True, gamma=1, predictor=predictor, 
max_iters=max_iters)\n", - " fair_clf.printflag = False\n", - " fair_clf.max_iters=max_iters\n", - " errors, fp_violations, fn_violations = fair_clf.pareto(dataset, gamma_list)\n", - " results_dict[pred] = {'errors': errors, 'fp_violations': fp_violations, 'fn_violations': fn_violations}\n", - " plt.plot(errors, fp_violations, label=pred)\n", - "\n", - " if save_results:\n", - " pickle.dump(results_dict, open('results_dict_' + str(gamma_list) + '_gammas' + str(gamma_list) + '.pkl', 'wb'))\n", - "\n", - " plt.xlabel('Error')\n", - " plt.ylabel('Unfairness')\n", - " plt.legend()\n", - " plt.title('Error vs. Unfairness\\n(Adult Dataset)')\n", - " plt.savefig('gerryfair_pareto.png')\n", - " plt.close()\n", - "multiple_classifiers_pareto(data_set)\n", - "Image(filename='gerryfair_pareto.png') " - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "A natural question one might ask is, suppose we fix a statistical fairness definition for rich subgroup fairness like equality of false positive rates, `FP`. Does learning a classifier that is fair with respect to `FP` increase or decrease fairness with respect to false negative rates `FN`? One could see this relationship going in either direction - and indeed we submit that it is dataset dependent. In some cases, if enforcing `FP` fairness pushes the classifier towards the constant classifier, then it will also satisify `FN` rate fairness, since the constant classifier is perfectly fair. However, if the hypothesis class is sufficiently rich, then one would expect that ceteris paribus since we are optimizing for error in addition to `FP` rate fairness, the algorithm would increase `FN` rate unfairness in order to decrease error. Below we trace the FN vs. FP rate tradeoff across a range of input $\\gamma$, where the classifier is optimized only for `FP` rate fairness. 
" - ] - }, - { - "cell_type": "code", - "execution_count": 6, - "metadata": { - "pycharm": { - "is_executing": true - } - }, - "outputs": [ + }, + { + "cell_type": "markdown", + "metadata": { + "id": "pHEF-qTag9Fw" + }, + "source": [ + "**pareto curves**\n", + "\n", + "The `FairFictPlay` algorithm implemented in the `fit` method converges given access to perfect oracles for solving cost-sensitive classification (CSC) problems. A cost-sensitive classification problem over a hypothesis class $\\mathcal{H}$ is $$\\min_{h \\in \\mathcal{H}}\\sum_{i = 1}^{n}\\left[(1-h(x_i))c_0 + h(x_i)c_1\\right]$$\n", + "By default in this package, and in the companion [empirical](https://arxiv.org/abs/1808.08166) and [theory](https://arxiv.org/pdf/1711.05144.pdf) papers, the hypothesis classes of the learner and of the subgroups are hyperplanes. The corresponding heuristic oracle for solving the CSC problem first forms two regression problems $(x_i, c_0)$ and $(x_i, c_1)$. Then, in the case of hyperplanes, it trains two regressions $r_0, r_1: \\mathcal{X} \\to \\mathbb{R}$ which predict the costs of classifying a given point $x$ as $0$ or $1$ respectively. Finally, the binary classifier output by the oracle is defined as $\\hat{r}(x) = \\arg\\min_{j \\in \\{0,1\\}}r_j(x)$. But of course if we are interested in different hypothesis classes for the learner, we simply need different regressors. In this package, in addition to linear regression, we've added support for regression trees, kernelized ridge regression, and support vector regression. Below we trace out Pareto curves of $\\gamma$-disparity vs. error for each of these different heuristic oracles." 
+ ] + }, { - "name": "stdout", - "output_type": "stream", - "text": [ - "gamma: 0.001 gamma: 0.002 gamma: 0.003 gamma: 0.004 gamma: 0.005 gamma: 0.0075 gamma: 0.01 gamma: 0.02 gamma: 0.03 gamma: 0.05 " - ] + "cell_type": "code", + "execution_count": 10, + "metadata": { + "pycharm": { + "is_executing": true + }, + "colab": { + "base_uri": "https://localhost:8080/", + "height": 568 + }, + "id": "2KbOJzJfg9Fw", + "outputId": "dbf3a216-2c8e-4711-c601-771810249fd5" + }, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "Curr Predictor: Linear\n", + "Curr Predictor: SVR\n", + "Curr Predictor: Tree\n", + "Curr Predictor: Kernel\n" + ] + }, + { + "output_type": "execute_result", + "data": { + "image/png": "\n", + "text/plain": [ + "" + ] + }, + "metadata": {}, + "execution_count": 10 + } + ], + "source": [ + "# set to 50 iterations for fast running of notebook - set >= 1000 when running real experiments\n", + "pareto_iters = 50\n", + "def multiple_classifiers_pareto(dataset, gamma_list=[0.002, 0.005, 0.01, 0.02, 0.05, 0.1], save_results=False, iters=pareto_iters):\n", + "\n", + " ln_predictor = linear_model.LinearRegression()\n", + " svm_predictor = svm.LinearSVR()\n", + " tree_predictor = tree.DecisionTreeRegressor(max_depth=3)\n", + " kernel_predictor = KernelRidge(alpha=1.0, gamma=1.0, kernel='rbf')\n", + " predictor_dict = {'Linear': {'predictor': ln_predictor, 'iters': iters},\n", + " 'SVR': {'predictor': svm_predictor, 'iters': iters},\n", + " 'Tree': {'predictor': tree_predictor, 'iters': iters},\n", + " 'Kernel': {'predictor': kernel_predictor, 'iters': iters}}\n", + "\n", + " results_dict = {}\n", + "\n", + " for pred in predictor_dict:\n", + " print('Curr Predictor: {}'.format(pred))\n", + " predictor = predictor_dict[pred]['predictor']\n", + " max_iters = predictor_dict[pred]['iters']\n", + " fair_clf = GerryFairClassifier(C=100, printflag=True, gamma=1, predictor=predictor, max_iters=max_iters)\n", + " fair_clf.printflag = 
False\n", + " fair_clf.max_iters=max_iters\n", + " errors, fp_violations, fn_violations = fair_clf.pareto(dataset, gamma_list)\n", + " results_dict[pred] = {'errors': errors, 'fp_violations': fp_violations, 'fn_violations': fn_violations}\n", + " plt.plot(errors, fp_violations, label=pred)\n", + "\n", + " if save_results:\n", + " pickle.dump(results_dict, open('results_dict_' + str(gamma_list) + '_gammas' + str(gamma_list) + '.pkl', 'wb'))\n", + "\n", + " plt.xlabel('Error')\n", + " plt.ylabel('Unfairness')\n", + " plt.legend()\n", + " plt.title('Error vs. Unfairness\\n(Adult Dataset)')\n", + " plt.savefig('gerryfair_pareto.png')\n", + " plt.close()\n", + "multiple_classifiers_pareto(data_set)\n", + "Image(filename='gerryfair_pareto.png')" + ] }, { - "data": { - "image/png": "\n", - "text/plain": [ - "" + "cell_type": "markdown", + "metadata": { + "id": "vuZlaXsgg9Fw" + }, + "source": [ + "A natural question one might ask is the following. Suppose we fix a statistical fairness definition for rich subgroup fairness like equality of false positive rates, `FP`. Does learning a classifier that is fair with respect to `FP` increase or decrease fairness with respect to false negative rates `FN`? One could see this relationship going in either direction - and indeed we submit that it is dataset dependent. In some cases, if enforcing `FP` fairness pushes the classifier towards the constant classifier, then it will also satisfy `FN` rate fairness, since the constant classifier is perfectly fair. However, if the hypothesis class is sufficiently rich, then one would expect that, ceteris paribus, since we are optimizing for error in addition to `FP` rate fairness, the algorithm would increase `FN` rate unfairness in order to decrease error. Below we trace the FN vs. FP rate tradeoff across a range of input $\\gamma$, where the classifier is optimized only for `FP` rate fairness." 
] - }, - "execution_count": 6, - "metadata": {}, - "output_type": "execute_result" + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": { + "pycharm": { + "is_executing": true + }, + "colab": { + "base_uri": "https://localhost:8080/", + "height": 515 + }, + "id": "BmyF8-u9g9Fw", + "outputId": "bd958e75-a38d-43c1-bccd-f14ee0ef9fed" + }, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "gamma: 0.001 gamma: 0.002 gamma: 0.003 gamma: 0.004 gamma: 0.005 gamma: 0.0075 gamma: 0.01 gamma: 0.02 gamma: 0.03 gamma: 0.05 " + ] + }, + { + "output_type": "execute_result", + "data": { + "image/png": "\n", + "text/plain": [ + "" + ] + }, + "metadata": {}, + "execution_count": 11 + } + ], + "source": [ + "def fp_vs_fn(dataset, gamma_list, iters):\n", + " fp_auditor = Auditor(dataset, 'FP')\n", + " fn_auditor = Auditor(dataset, 'FN')\n", + " fp_violations = []\n", + " fn_violations = []\n", + " for g in gamma_list:\n", + " print('gamma: {} '.format(g), end =\" \")\n", + " fair_model = GerryFairClassifier(C=100, printflag=False, gamma=g, max_iters=iters)\n", + " fair_model.gamma=g\n", + " fair_model.fit(dataset)\n", + " predictions = array_to_tuple((fair_model.predict(dataset)).labels)\n", + " _, fp_diff = fp_auditor.audit(predictions)\n", + " _, fn_diff = fn_auditor.audit(predictions)\n", + " fp_violations.append(fp_diff)\n", + " fn_violations.append(fn_diff)\n", + "\n", + " plt.plot(fp_violations, fn_violations, label='adult')\n", + " plt.xlabel('False Positive Disparity')\n", + " plt.ylabel('False Negative Disparity')\n", + " plt.legend()\n", + " plt.title('FP vs FN Unfairness')\n", + " plt.savefig('gerryfair_fp_fn.png')\n", + " plt.close()\n", + "\n", + "gamma_list = [0.001, 0.002, 0.003, 0.004, 0.005, 0.0075, 0.01, 0.02, 0.03, 0.05]\n", + "fp_vs_fn(data_set, gamma_list, pareto_iters)\n", + "Image(filename='gerryfair_fp_fn.png')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "pycharm": { + 
"is_executing": true + }, + "id": "NDHXlmO0g9Fx" + }, + "outputs": [], + "source": [] } - ], - "source": [ - "def fp_vs_fn(dataset, gamma_list, iters):\n", - " fp_auditor = Auditor(dataset, 'FP')\n", - " fn_auditor = Auditor(dataset, 'FN')\n", - " fp_violations = []\n", - " fn_violations = []\n", - " for g in gamma_list:\n", - " print('gamma: {} '.format(g), end =\" \")\n", - " fair_model = GerryFairClassifier(C=100, printflag=False, gamma=g, max_iters=iters)\n", - " fair_model.gamma=g\n", - " fair_model.fit(dataset)\n", - " predictions = array_to_tuple((fair_model.predict(dataset)).labels)\n", - " _, fp_diff = fp_auditor.audit(predictions)\n", - " _, fn_diff = fn_auditor.audit(predictions)\n", - " fp_violations.append(fp_diff)\n", - " fn_violations.append(fn_diff)\n", - "\n", - " plt.plot(fp_violations, fn_violations, label='adult')\n", - " plt.xlabel('False Positive Disparity')\n", - " plt.ylabel('False Negative Disparity')\n", - " plt.legend()\n", - " plt.title('FP vs FN Unfairness')\n", - " plt.savefig('gerryfair_fp_fn.png')\n", - " plt.close()\n", - "\n", - "gamma_list = [0.001, 0.002, 0.003, 0.004, 0.005, 0.0075, 0.01, 0.02, 0.03, 0.05]\n", - "fp_vs_fn(data_set, gamma_list, pareto_iters)\n", - "Image(filename='gerryfair_fp_fn.png')" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": { + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.6.9" + }, "pycharm": { - "is_executing": true + "stem_cell": { + "cell_type": "raw", + "metadata": { + "collapsed": false + }, + "source": [] + } + }, + "colab": { + "provenance": [] } - }, - "outputs": [], - "source": [] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - 
"language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.6.9" }, - "pycharm": { - "stem_cell": { - "cell_type": "raw", - "metadata": { - "collapsed": false - }, - "source": [] - } - } - }, - "nbformat": 4, - "nbformat_minor": 1 + "nbformat": 4, + "nbformat_minor": 0 }