forked from h2oai/xai_guidelines
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathresponsible_xai.bib
352 lines (309 loc) · 15.2 KB
/
responsible_xai.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
% Aivodji et al. (2019): "Fairwashing", cited as arXiv preprint 1901.09749.
@article{fair_washing,
  author  = {A{\"\i}vodji, Ulrich and Arai, Hiromi and Fortineau, Olivier and Gambs, S{\'e}bastien and Hara, Satoshi and Tapp, Alain},
  title   = {Fairwashing: the {R}isk of {R}ationalization},
  journal = {arXiv preprint arXiv:1901.09749},
  year    = {2019},
  note    = {URL: \url{https://arxiv.org/pdf/1901.09749.pdf}}
}
% Amershi et al. (2015): ModelTracker, ACM CHI proceedings paper.
@inproceedings{modeltracker,
  author       = {Amershi, Saleema and Chickering, Max and Drucker, Steven M. and Lee, Bongshin and Simard, Patrice and Suh, Jina},
  title        = {Modeltracker: {R}edesigning {P}erformance {A}nalysis {T}ools for {M}achine {L}earning},
  booktitle    = {Proceedings of the 33rd Annual ACM Conference on Human Factors in Computing Systems},
  pages        = {337--346},
  organization = {ACM},
  year         = {2015},
  note         = {URL: \url{https://www.microsoft.com/en-us/research/wp-content/uploads/2016/02/amershi.CHI2015.ModelTracker.pdf}}
}
% Ancona et al. (2018): gradient-based attribution methods, ICLR 2018.
% The third author's surname carries a diaeresis; it is written as a BibTeX
% special character so sorting and labels treat it as one letter.
@inproceedings{grad_attr,
  author    = {Ancona, Marco and Ceolini, Enea and {\"O}ztireli, Cengiz and Gross, Markus},
  title     = {Towards {B}etter {U}nderstanding of {G}radient-based {A}ttribution {M}ethods for {D}eep {N}eural {N}etworks},
  booktitle = {6th International Conference on Learning Representations (ICLR 2018)},
  year      = {2018},
  note      = {URL: \url{https://www.research-collection.ethz.ch/bitstream/handle/20.500.11850/249929/Flow_ICLR_2018.pdf}}
}
% Angwin et al. (2016): "Machine Bias" article, with ProPublica as the journal.
@article{angwin16,
  author  = {Julia Angwin and Jeff Larson and Surya Mattu and Lauren Kirchner},
  title   = {{M}achine {B}ias: {T}here's {S}oftware {U}sed {A}cross the {C}ountry to {P}redict {F}uture {C}riminals. {A}nd {I}t's {B}iased {A}gainst {B}lacks.},
  journal = {ProPublica},
  year    = {2016},
  note    = {URL: \url{https://www.propublica.org/article/machine-bias-risk-assessments-in-criminal-sentencing}}
}
% Apley (2016): predictor-effect visualization, cited as arXiv preprint 1612.08468.
@article{ale_plot,
  author  = {Apley, Daniel W.},
  title   = {Visualizing the {E}ffects of {P}redictor {V}ariables in {B}lack {B}ox {S}upervised {L}earning {M}odels},
  journal = {arXiv preprint arXiv:1612.08468},
  year    = {2016},
  note    = {URL: \url{https://arxiv.org/pdf/1612.08468.pdf}}
}
% Bastani, Kim and Bastani (2017): model extraction, arXiv preprint 1705.08504.
@article{dt_surrogate2,
  author  = {Osbert Bastani and Carolyn Kim and Hamsa Bastani},
  title   = {Interpreting {B}lackbox {M}odels via {M}odel {E}xtraction},
  journal = {arXiv preprint arXiv:1705.08504},
  year    = {2017},
  note    = {URL: \url{https://arxiv.org/pdf/1705.08504.pdf}}
}
% Bastani, Pu and Solar-Lezama (2018): policy extraction, NeurIPS proceedings.
@inproceedings{viper,
  author    = {Bastani, Osbert and Pu, Yewen and Solar-Lezama, Armando},
  title     = {Verifiable {R}einforcement {L}earning {V}ia {P}olicy {E}xtraction},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {2494--2504},
  year      = {2018},
  note      = {URL: \url{http://papers.nips.cc/paper/7516-verifiable-reinforcement-learning-via-policy-extraction.pdf}}
}
% Craven and Shavlik (1996): tree-structured representations of trained networks.
% Typed as a proceedings paper, with the proceedings name in booktitle, to match
% the other Advances in Neural Information Processing Systems entries in this file.
@inproceedings{dt_surrogate1,
  author    = {Mark W. Craven and Jude W. Shavlik},
  title     = {Extracting {T}ree-{S}tructured {R}epresentations of {T}rained {N}etworks},
  booktitle = {Advances in Neural Information Processing Systems},
  year      = {1996},
  note      = {URL: \url{http://papers.nips.cc/paper/1152-extracting-tree-structured-representations-of-trained-networks.pdf}}
}
% Doshi-Velez and Kim (2017): interpretable ML position paper, arXiv preprint 1702.08608.
@article{been_kim1,
  author  = {Finale Doshi-Velez and Been Kim},
  title   = {Towards a {R}igorous {S}cience of {I}nterpretable {M}achine {L}earning},
  journal = {arXiv preprint arXiv:1702.08608},
  year    = {2017},
  note    = {URL: \url{https://arxiv.org/pdf/1702.08608.pdf}}
}
% Dwork et al. (2012): "Fairness Through Awareness", ITCS proceedings paper.
@inproceedings{dwork2012fairness,
  author       = {Dwork, Cynthia and Hardt, Moritz and Pitassi, Toniann and Reingold, Omer and Zemel, Richard},
  title        = {Fairness {T}hrough {A}wareness},
  booktitle    = {Proceedings of the 3rd Innovations in Theoretical Computer Science Conference},
  pages        = {214--226},
  organization = {ACM},
  year         = {2012},
  note         = {URL: \url{https://arxiv.org/pdf/1104.3913.pdf}}
}
% Feldman et al. (2015): disparate impact, ACM SIGKDD proceedings paper.
% The ordinal in booktitle is plain text, like the other proceedings titles
% in this file; presentation is left to the bibliography style.
@inproceedings{feldman2015certifying,
  author       = {Feldman, Michael and Friedler, Sorelle A. and Moeller, John and Scheidegger, Carlos and Venkatasubramanian, Suresh},
  title        = {Certifying and {R}emoving {D}isparate {I}mpact},
  booktitle    = {Proceedings of the 21st ACM SIGKDD International Conference on Knowledge Discovery and Data Mining},
  pages        = {259--268},
  organization = {ACM},
  year         = {2015},
  note         = {URL: \url{https://arxiv.org/pdf/1412.3756.pdf}}
}
% Flores, Bechtel and Lowenkamp (2016): rejoinder to the "Machine Bias" article.
% The journal name is stored in full rather than abbreviated.
@article{flores2016false,
  author    = {Flores, Anthony W. and Bechtel, Kristin and Lowenkamp, Christopher T.},
  title     = {False {P}ositives, {F}alse {N}egatives, and {F}alse {A}nalyses: {A} {R}ejoinder to {M}achine {B}ias: {T}here's {S}oftware {U}sed across the {C}ountry to {P}redict {F}uture {C}riminals. {A}nd {I}t's {B}iased against {B}lacks},
  journal   = {Federal Probation},
  volume    = {80},
  pages     = {38},
  publisher = {HeinOnline},
  year      = {2016},
  note      = {URL: \url{https://bit.ly/2Gesf9Y}}
}
% The Elements of Statistical Learning (Springer, New York).
% Authors are listed in the book's own order: Hastie, Tibshirani, Friedman.
% The underscore in the URL is left unescaped, as in the other URLs of this file.
% NOTE(review): year says 2001 but the URL filename reads ESLII print12 -- confirm
% which edition is meant.
@book{esl,
  author    = {Trevor Hastie and Robert Tibshirani and Jerome Friedman},
  title     = {\textbf{The Elements of Statistical Learning}},
  booktitle = {\textit{The Elements of Statistical Learning}},
  publisher = {Springer},
  address   = {New York},
  year      = {2001},
  note      = {URL: \url{https://web.stanford.edu/~hastie/ElemStatLearn/printings/ESLII_print12.pdf}}
}
% Gilpin et al. (2018): "Explaining Explanations", arXiv preprint 1806.00069.
@article{gilpin2018explaining,
  author  = {Leilani H. Gilpin and David Bau and Ben Z. Yuan and Ayesha Bajwa and Michael Specter and Lalana Kagal},
  title   = {Explaining {E}xplanations: {A}n {A}pproach to {E}valuating {I}nterpretability of {M}achine {L}earning},
  journal = {arXiv preprint arXiv:1806.00069},
  year    = {2018},
  note    = {URL: \url{https://arxiv.org/pdf/1806.00069.pdf}}
}
% Goldstein et al. (2015): individual conditional expectation plots, JCGS 24(1).
@article{ice_plots,
  author  = {Alex Goldstein and Adam Kapelner and Justin Bleich and Emil Pitkin},
  title   = {Peeking {I}nside the {B}lack {B}ox: {V}isualizing {S}tatistical {L}earning with {P}lots of {I}ndividual {C}onditional {E}xpectation},
  journal = {Journal of Computational and Graphical Statistics},
  volume  = {24},
  number  = {1},
  year    = {2015},
  note    = {URL: \url{https://arxiv.org/pdf/1309.6392.pdf}}
}
% Gopinathan et al. (1998): US Patent 5,819,226 on fraud detection.
% The month field concatenates the oct macro with a tied day number.
@misc{gopinathan1998fraud,
  author    = {Gopinathan, Krishna M. and Biafore, Louis S. and Ferguson, William M. and Lazarus, Michael A. and Pathria, Anu K. and Jost, Allen},
  title     = {Fraud {D}etection using {P}redictive {M}odeling},
  publisher = {Google Patents},
  month     = oct # "~6",
  year      = {1998},
  note      = {US Patent 5,819,226. URL: \url{https://patents.google.com/patent/US5819226A}}
}
% Guidotti et al. (2018): survey of black-box explanation methods, ACM CSUR 51(5).
@article{guidotti2018survey,
  author    = {Guidotti, Riccardo and Monreale, Anna and Ruggieri, Salvatore and Turini, Franco and Giannotti, Fosca and Pedreschi, Dino},
  title     = {{A} {S}urvey of {M}ethods for {E}xplaining {B}lack {B}ox {M}odels},
  journal   = {ACM Computing Surveys (CSUR)},
  volume    = {51},
  number    = {5},
  pages     = {93},
  publisher = {ACM},
  year      = {2018},
  note      = {URL: \url{https://arxiv.org/pdf/1802.01933.pdf}}
}
% Hall (2019): machine learning explanations, KDD '19 XAI workshop paper.
@inproceedings{art_and_sci,
  author    = {Hall, Patrick},
  title     = {On the {A}rt and {S}cience of {M}achine {L}earning {E}xplanations},
  booktitle = {KDD '19 XAI Workshop Proceedings},
  year      = {2019},
  note      = {URL: \url{https://arxiv.org/pdf/1810.02909.pdf}}
}
% Hardt, Price and Srebro (2016): equality of opportunity, NeurIPS proceedings.
% The author list is complete with these three names, so no "and others"
% token is used (it would render a spurious "et al.").
@inproceedings{hardt2016equality,
  author    = {Hardt, Moritz and Price, Eric and Srebro, Nati},
  title     = {Equality of {O}pportunity in {S}upervised {L}earning},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {3315--3323},
  year      = {2016},
  note      = {URL: \url{http://papers.nips.cc/paper/6374-equality-of-opportunity-in-supervised-learning.pdf}}
}
% Hu et al. (2018): LIME-SUP, arXiv preprint 1806.00663.
@article{lime-sup,
  author  = {Linwei Hu and Jie Chen and Vijayan N. Nair and Agus Sudjianto},
  title   = {Locally {I}nterpretable {M}odels and {E}ffects {B}ased on {S}upervised {P}artitioning ({LIME-SUP})},
  journal = {arXiv preprint arXiv:1806.00663},
  year    = {2018},
  note    = {URL: \url{https://arxiv.org/ftp/arxiv/papers/1806/1806.00663.pdf}}
}
% Kamiran and Calders (2012): preprocessing for non-discriminatory classification, KAIS 33(1).
@article{kamiran2012data,
  author    = {Kamiran, Faisal and Calders, Toon},
  title     = {Data {P}reprocessing {T}echniques for {C}lassification {W}ithout {D}iscrimination},
  journal   = {Knowledge and Information Systems},
  volume    = {33},
  number    = {1},
  pages     = {1--33},
  publisher = {Springer},
  year      = {2012},
  note      = {URL: \url{https://bit.ly/2lH95lQ}}
}
% Kang et al. (2019): model assertions for debugging ML models (no venue recorded).
@misc{kangdebugging,
  author = {Kang, Daniel and Raghavan, Deepti and Bailis, Peter and Zaharia, Matei},
  title  = {Debugging {M}achine {L}earning {M}odels via {M}odel {A}ssertions},
  year   = {2019},
  note   = {URL: \url{https://www-cs.stanford.edu/~matei/papers/2018/mlsys_model_assertions.pdf}}
}
% Keinan et al. (2004): fair attribution of functional contribution, Neural Computation 16(9).
@article{keinan2004fair,
  author    = {Keinan, Alon and Sandbank, Ben and Hilgetag, Claus C. and Meilijson, Isaac and Ruppin, Eytan},
  title     = {Fair {A}ttribution of {F}unctional {C}ontribution in {A}rtificial and {B}iological {N}etworks},
  journal   = {Neural Computation},
  volume    = {16},
  number    = {9},
  pages     = {1887--1915},
  publisher = {MIT Press},
  year      = {2004},
  note      = {URL: \url{http://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.436.6801&rep=rep1&type=pdf}}
}
% Lichman (2013): UCI Machine Learning Repository.
% The institution value is plain brace-delimited text with no stray quote
% character at the end.
@misc{uci,
  author      = {M. Lichman},
  title       = {{UCI} {M}achine {L}earning {R}epository},
  institution = {University of California, Irvine, School of Information and Computer Sciences},
  year        = {2013},
  note        = {URL: \url{http://archive.ics.uci.edu/ml}}
}
% Lipovetsky and Conklin (2001): regression analysis via game theory, ASMBI 17(4).
@article{lipovetsky2001analysis,
  author    = {Lipovetsky, Stan and Conklin, Michael},
  title     = {Analysis of {R}egression in {G}ame {T}heory {A}pproach},
  journal   = {Applied Stochastic Models in Business and Industry},
  volume    = {17},
  number    = {4},
  pages     = {319--330},
  publisher = {Wiley Online Library},
  year      = {2001}
}
% Lipton (2016): "The Mythos of Model Interpretability", arXiv preprint 1606.03490.
@article{lipton1,
  author  = {Lipton, Zachary C.},
  title   = {The {M}ythos of {M}odel {I}nterpretability},
  journal = {arXiv preprint arXiv:1606.03490},
  year    = {2016},
  note    = {URL: \url{https://arxiv.org/pdf/1606.03490.pdf}}
}
% Lundberg, Erion and Lee (2017): feature attribution for tree ensembles, ICML WHI 2017 workshop.
@incollection{tree_shap,
  author       = {Lundberg, Scott M. and Erion, Gabriel G. and Lee, Su-In},
  title        = {Consistent {I}ndividualized {F}eature {A}ttribution for {T}ree {E}nsembles},
  booktitle    = {Proceedings of the 2017 ICML Workshop on Human Interpretability in Machine Learning (WHI 2017)},
  editor       = {Been Kim and Dmitry M. Malioutov and Kush R. Varshney and Adrian Weller},
  pages        = {15--21},
  publisher    = {ICML WHI 2017},
  organization = {ICML},
  year         = {2017},
  note         = {URL: \url{https://openreview.net/pdf?id=ByTKSo-m-}}
}
% Lundberg and Lee (2017): unified approach to interpreting predictions, NeurIPS 30.
@incollection{shapley,
  author    = {Lundberg, Scott M. and Lee, Su-In},
  title     = {A {U}nified {A}pproach to {I}nterpreting {M}odel {P}redictions},
  booktitle = {Advances in Neural Information Processing Systems 30},
  editor    = {I. Guyon and U. V. Luxburg and S. Bengio and H. Wallach and R. Fergus and S. Vishwanathan and R. Garnett},
  pages     = {4765--4774},
  publisher = {Curran Associates, Inc.},
  year      = {2017},
  note      = {URL: \url{http://papers.nips.cc/paper/7062-a-unified-approach-to-interpreting-model-predictions.pdf}}
}
% Molnar (2018): "Interpretable Machine Learning", online book.
@book{molnar,
  author    = {Christoph Molnar},
  title     = {\textbf{\textit{{I}nterpretable {M}achine {L}earning}}},
  publisher = {christophm.github.io},
  year      = {2018},
  note      = {URL: \url{https://christophm.github.io/interpretable-ml-book/}}
}
% Murdoch et al. (2019): interpretable ML definitions and methods, arXiv preprint 1901.04592.
@article{murdoch2019interpretable,
  author  = {Murdoch, W. James and Singh, Chandan and Kumbier, Karl and Abbasi-Asl, Reza and Yu, Bin},
  title   = {Interpretable {M}achine {L}earning: {D}efinitions, {M}ethods, and {A}pplications},
  journal = {arXiv preprint arXiv:1901.04592},
  year    = {2019},
  note    = {URL: \url{https://arxiv.org/pdf/1901.04592.pdf}}
}
% Ribeiro, Singh and Guestrin (2016): LIME, ACM SIGKDD proceedings paper.
@inproceedings{lime,
  author       = {Marco Tulio Ribeiro and Sameer Singh and Carlos Guestrin},
  title        = {Why {S}hould {I} {T}rust {Y}ou?: {E}xplaining the {P}redictions of {A}ny {C}lassifier},
  booktitle    = {Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining},
  pages        = {1135--1144},
  organization = {ACM},
  year         = {2016},
  note         = {URL: \url{http://www.kdd.org/kdd2016/papers/files/rfp0573-ribeiroA.pdf}}
}
% Rudin (2018): against explaining black-box models, arXiv preprint 1811.10154.
@article{please_stop,
  author  = {Rudin, Cynthia},
  title   = {Please {S}top {E}xplaining {B}lack {B}ox {M}odels for {H}igh {S}takes {D}ecisions},
  journal = {arXiv preprint arXiv:1811.10154},
  year    = {2018},
  note    = {URL: \url{https://arxiv.org/pdf/1811.10154.pdf}}
}
% "The Shapley value" essay volume (1988), Cambridge University Press.
% NOTE(review): the author list mixes Shapley and Roth with "and others" --
% confirm whether Roth should instead be recorded as editor.
@book{shapley1988shapley,
  author    = {Shapley, Lloyd S. and Roth, Alvin E. and others},
  title     = {\textit{The Shapley value: {E}ssays in honor of {L}loyd {S}. {S}hapley}},
  publisher = {Cambridge University Press},
  year      = {1988},
  note      = {URL: \url{http://www.library.fa.ru/files/Roth2.pdf}}
}
% Shokri, Strobel and Zick (2019): privacy risks of explanations, arXiv preprint 1907.00164.
% The note uses the same "URL: " prefix, with a space, as the other entries
% in this file.
@article{shokri2019privacy,
  author  = {Shokri, Reza and Strobel, Martin and Zick, Yair},
  title   = {Privacy {R}isks of {E}xplaining {M}achine {L}earning {M}odels},
  journal = {arXiv preprint arXiv:1907.00164},
  year    = {2019},
  note    = {URL: \url{https://arxiv.org/pdf/1907.00164.pdf}}
}
% Shokri et al. (2017): membership inference attacks, IEEE S&P proceedings paper.
@inproceedings{membership_inference,
  author       = {Shokri, Reza and Stronati, Marco and Song, Congzheng and Shmatikov, Vitaly},
  title        = {Membership {I}nference {A}ttacks {A}gainst {M}achine {L}earning {M}odels},
  booktitle    = {2017 IEEE Symposium on Security and Privacy (SP)},
  pages        = {3--18},
  organization = {IEEE},
  year         = {2017},
  note         = {URL: \url{https://arxiv.org/pdf/1610.05820.pdf}}
}
% Strumbelj and Kononenko (2010): game-theoretic explanation of classifications, JMLR 11.
% The first author's surname starts with S-caron; it is written as a BibTeX
% special character so sorting and labels treat it as one letter.
@article{kononenko2010efficient,
  author  = {{\v{S}}trumbelj, Erik and Kononenko, Igor},
  title   = {An {E}fficient {E}xplanation of {I}ndividual {C}lassifications using {G}ame {T}heory},
  journal = {Journal of Machine Learning Research},
  volume  = {11},
  number  = {Jan},
  pages   = {1--18},
  year    = {2010},
  note    = {URL: \url{http://www.jmlr.org/papers/volume11/strumbelj10a/strumbelj10a.pdf}}
}
% Tramer et al. (2016): model stealing via prediction APIs, USENIX Security 16.
% Acronyms are protected with ordinary whole-word braces; math-mode escaped
% braces would print literal curly braces around them.
@inproceedings{model_stealing,
  author    = {Tram{\`e}r, Florian and Zhang, Fan and Juels, Ari and Reiter, Michael K. and Ristenpart, Thomas},
  title     = {Stealing {M}achine {L}earning {M}odels via {P}rediction {API}s},
  booktitle = {25th {USENIX} Security Symposium ({USENIX} Security 16)},
  pages     = {601--618},
  year      = {2016},
  note      = {URL: \url{https://www.usenix.org/system/files/conference/usenixsecurity16/sec16_paper_tramer.pdf}}
}
% Ustun and Rudin (2016): supersparse linear integer models, Machine Learning 102(3).
% Only the capitals that must survive style recasing are braced, as in the
% other titles of this file; the title is not wrapped in a second brace pair.
@article{slim,
  author    = {Ustun, Berk and Rudin, Cynthia},
  title     = {Supersparse {L}inear {I}nteger {M}odels for {O}ptimized {M}edical {S}coring {S}ystems},
  journal   = {Machine Learning},
  volume    = {102},
  number    = {3},
  pages     = {349--391},
  publisher = {Springer},
  year      = {2016},
  note      = {URL: \url{https://users.cs.duke.edu/~cynthia/docs/UstunTrRuAAAI13.pdf}}
}
% Vaughan et al. (2018): explainable neural networks, arXiv preprint 1806.01933.
@article{wf_xnn,
  author  = {Vaughan, Joel and Sudjianto, Agus and Brahimi, Erind and Chen, Jie and Nair, Vijayan N.},
  title   = {Explainable {N}eural {N}etworks {B}ased on {A}dditive {I}ndex {M}odels},
  journal = {arXiv preprint arXiv:1806.01933},
  year    = {2018},
  note    = {URL: \url{https://arxiv.org/pdf/1806.01933.pdf}}
}
% Weller (2017): "Challenges for Transparency", arXiv preprint 1708.01870.
@article{weller2017challenges,
  author  = {Weller, Adrian},
  title   = {{C}hallenges for {T}ransparency},
  journal = {arXiv preprint arXiv:1708.01870},
  year    = {2017},
  note    = {URL: \url{https://arxiv.org/pdf/1708.01870.pdf}}
}
% Williams et al. (2017): "Interpretability" report published by Fast Forward Labs.
@book{ff_interpretability,
  author    = {Williams, Mike and others},
  title     = {Interpretability},
  publisher = {Fast Forward Labs},
  year      = {2017},
  note      = {URL: \url{https://www.cloudera.com/products/fast-forward-labs-research.html}}
}
% Yang, Rudin and Seltzer (2017): scalable Bayesian rule lists, ICML proceedings paper.
@inproceedings{sbrl,
  author    = {Hongyu Yang and Cynthia Rudin and Margo Seltzer},
  title     = {Scalable {B}ayesian {R}ule {L}ists},
  booktitle = {Proceedings of the 34th International Conference on Machine Learning {(ICML)}},
  year      = {2017},
  note      = {URL: \url{https://arxiv.org/pdf/1602.08610.pdf}}
}
% Zhang, Lemoine and Mitchell (2018): adversarial bias mitigation, AAAI/ACM AIES proceedings.
@inproceedings{zhang2018mitigating,
  author       = {Zhang, Brian Hu and Lemoine, Blake and Mitchell, Margaret},
  title        = {Mitigating {U}nwanted {B}iases with {A}dversarial {L}earning},
  booktitle    = {Proceedings of the 2018 AAAI/ACM Conference on AI, Ethics, and Society},
  pages        = {335--340},
  organization = {ACM},
  year         = {2018},
  note         = {URL: \url{https://arxiv.org/pdf/1801.07593.pdf}}
}