-
Notifications
You must be signed in to change notification settings - Fork 2
/
copa23.bib
1236 lines (1132 loc) · 61.7 KB
/
copa23.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
@Proceedings{COPA-2023,
booktitle = {Proceedings of the Twelfth Symposium on Conformal
and Probabilistic Prediction with Applications},
name = {Conformal and Probabilistic Prediction with
Applications},
shortname = {COPA 2023},
editor = {Papadopoulos, Harris and Nguyen, Khuong An and
Bostr\"{o}m, Henrik and Carlsson, Lars},
volume = 204,
year = 2023,
start = {2023-09-13},
end = {2023-09-15},
published = {2023-08-17},
url = {https://copa-conference.com},
address = {Limassol, Cyprus}
}
%% PREFACE %%
% 4 pages
@InProceedings{papadopoulos23,
title = {Preface},
author = {Papadopoulos, Harris and Nguyen, Khuong An and
Bostr\"{o}m, Henrik and Carlsson, Lars},
pages = {1--4},
}
%% GROUP 1 Implementations - 2 papers %%
% 1 - 1
%11 pages
@InProceedings{kuijk23,
title = {Conformal Regression in Calorie Prediction for Team
Jumbo-Visma},
author = {van Kuijk, Kristian and Dirksen, Mark and Seiler,
Christof},
pages = {5--15},
abstract = {UCI WorldTour races, the premier men's elite road
cycling tour, are grueling events that put physical
fitness and endurance of riders to the test. The
coaches of Team Jumbo-Visma have long been
responsible for predicting the energy needs of each
rider of the Dutch team for every race on the
calendar. Those must be estimated to ensure riders
have the energy and resources necessary to maintain
a high level of performance throughout a race. This
task, however, is both time-consuming and
challenging, as it requires precise estimates of
race speed and power output. Traditionally, the
approach to predicting energy needs has relied on
judgement and experience of coaches, but this method
has its limitations and often leads to inaccurate
predictions. In this paper, we propose a new, more
effective approach to predicting energy needs for
cycling races. By predicting the speed and power
with regression models, we provide the coaches with
calorie needs estimates for each individual rider
per stage instantly. In addition, we compare methods
to quantify uncertainty using conformal
prediction. The empirical analysis of the
jackknife+, jackknife-minmax,
jackknife-minmax-after-bootstrap, CV+, CV-minmax,
conformalized quantile regression, and inductive
conformal prediction methods in conformal prediction
reveals that all methods achieve valid prediction
intervals. All but minmax-based methods also produce
produce sufficiently narrow prediction intervals for
decision-making. Furthermore, methods computing
prediction intervals of fixed size produce tighter
intervals for low significance values. Among the
methods computing intervals of varying length across
the input space, inductive conformal prediction
computes narrower prediction intervals at larger
significance level.}
}
%1 - 2
%20 pages
@InProceedings{ernez23,
title = {Applying the conformal prediction paradigm for the
uncertainty quantification of an end-to-end
automatic speech recognition model (wav2vec 2.0)},
author = {Ernez, Fares and Arnold, Alexandre and Galametz,
Audrey and Kobus, Catherine and Ould-Amer, Nawal},
pages = {16--35},
abstract = {Uncertainty quantification is critical when using
Automatic Speech Recognition (ASR) in High Risk
Systems where safety is highly important. While
developing ASR models adapted to such context, a
range of techniques are being explored to measure
the uncertainty of their predictions. In this
paper, we present two algorithms: the first one
applies the Conformal Risk Control paradigm to
predict a set of sentences that controls the Word
Error Rate (WER) to an adjustable level of
guarantee. The second algorithm uses Inductive
Conformal Prediction (ICP) to predict uncertain
words in an automatic transcription. We analyze the
performance of the three algorithms using an
open-source ASR model based on Wav2vec 2.0. The CP
algorithms were trained on the “clean test” part of
the LibriSpeech corpus that contains approximately
2,600 sentences. The results show that the three
algorithms provide valid and efficient prediction
sets. We guarantee that the WER is below 2\% with a
confidence level of 80\% and an average set size of
29 sentences and we detect 90\% of the badly
transcripted words.}
}
%% GROUP2 Venn prediction - 3 papers %%
%2 - 1
%20 pages
@InProceedings{andeol23,
title = {Confident Object Detection via Conformal Prediction
and Conformal Risk Control: an Application to
Railway Signaling},
author = {Andeol, Leo and Fel, Thomas and de Grancey, Florence
and Mossina, Luca},
pages = {36--55},
abstract = {Deploying deep learning models in real-world
certied systems requires the ability to provide
condence estimates that accurately reflect their
uncertainty. In this paper, we demonstrate the use
of the conformal prediction framework to construct
reliable and trustworthy predictors for detecting
railway signals. Our approach is based on a novel
dataset that includes images taken from the
perspective of a train operator and state-of-the-art
object detectors. We test several conformal
approaches and introduce a new method based on
conformal risk control. Our findings demonstrate
the potential of the conformal prediction framework
to evaluate model performance and provide practical
guidance for achieving formally guaranteed
uncertainty bounds.}
}
%2 - 2
%18 pages
@InProceedings{vishwakarma23a,
title = {Enterprise Disk Drive Scrubbing Based on Mondrian
Conformal Predictors},
author = {Vishwakarma, Rahul and Hwang, Jinha and Messoudi,
Soundouss and Hedayatipour, Ava},
pages = {56--73},
abstract = {Disk scrubbing is a process aimed at resolving read
errors on disks by reading data from the
disk. However, scrubbing the entire storage array at
once can adversely impact system performance,
particularly during periods of high input/output
operations. Additionally, the continuous reading of
data from disks when scrubbing can result in wear
and tear, especially on larger capacity disks, due
to the significant time and energy consumption
involved. To address these issues, we propose a
selective disk scrubbing method that enhances the
overall reliability and power efficiency in data
centers. Our method employs a Machine Learning model
based on Mondrian Conformal prediction to identify
specific disks for scrubbing, by proactively
predicting the health status of each disk in the
storage pool, forecasting n-days in advance, and
using an open-source dataset. For disks predicted as
non-healthy, we mark them for replacement without
further action. For healthy drives, we create a set
and quantify their relative health across the entire
storage pool based on the predictor’s
confidence. This enables us to prioritize selective
scrubbing for drives with established scrubbing
frequency based on the scrub cycle. The method we
propose provides an efficient and dependable
solution for managing enterprise disk drives. By
scrubbing just 22.7\% of the total storage disks, we
can achieve optimized energy consumption and reduce
the carbon footprint of the data center. }
}
%2 - 3
%15 pages
@InProceedings{garcia23,
title = {An Uncertainty-Aware Sequential Approach for
Predicting Response to Neoadjuvant Therapy in Breast
Cancer},
author = {Garcia-Galindo, Alberto and Lopez-De-Castro, Marcos
and Armananzas, Ruben},
pages = {74--88},
abstract = {Neoadjuvant therapy (NAT) is considered the gold
standard preoperative treatment for reducing tumor
charge in breast cancer. However, the tumor’s
pathological response highly depends on patient
conditions and clinical factors. There is a dire
need to develop modeling tools to predict a patient
response to NAT and thus improve personalized
medical care plans. Recent studies have shown
promising results of machine learning (ML)
methodologies in breast cancer prognosis through the
combination of several modalities, including imaging
and molecular features derived from biopsy
analyses. We here present a ML model to predict
response to NAT through two sequential prediction
stages. First, a pre-treatment dynamic
contrast-enhanced magnetic resonance imaging model
is trained, followed by a second model with
molecular biomarkers-enriched data. We propose the
integration of the Conformal Prediction (CP)
framework in the first non-invasive model to
identify patients whose predicted responses show
large uncertainty and refer them to the second model
that includes data from invasive tests. The major
advantage of this procedure is in the reduction of
unnecessary biopsies. Different alternatives for the
standard ML algorithms and the CP functions are
explored on a publicly available clinical
dataset. Results clearly show the potential of our
uncertainty-aware clinical predictive tool in such
real scenarios.}
}
%% group 3 Real-world applications - 6 papers %%
% 3 - 1
%11 pages
@InProceedings{canete23a,
title = {Market Implied Conformal Volatility Intervals},
author = {Canete, Alejandro},
pages = {89--99},
abstract = {Volatility is a fundamental input for pricing and
risk management of nancial instruments. In the
following work we propose an algorithm to estimate
the market implied uncertainty of future realized
volatility. Our method interprets the market implied
volatility as a point prediction of future realized
volatility and applies online conformal prediction
to estimate the uncertainty of this prediction. We
analyze rolling coverage and width of several
nonconformity scores over 15 years of daily
data. The results suggest that conformal prediction
can be used to infer market implied prediction
intervals for realized volatility. }
}
% 3 - 2
%16 pages
@InProceedings{althoff23,
title = {Evaluation of conformal-based probabilistic
forecasting methods for short-term wind speed
forecasting},
author = {Althoff, Simon and Szabadv'ary, Johan Hallberg and
Anderson, Jonathan and Carlsson, Lars},
pages = {100--115},
abstract = {We apply Conformal Predictive Distribution Systems
(CPDS) and a non-exchangeable version of the
traditional Conformal Prediction (NECP) method to
short-term wind speed forecasting to generate
probabilistic forecasts. These are compared to the
more traditional Quantile Regression Forest (QRF)
method. A short-term forecast is available from a
few hours before the forecasted time period and is
only extended a couple days into the future. The
methods are supplied ensemble forecasts as input and
additionally the Conformal methods are supplied with
post-processed point forecasts for generating the
probability distributions. In the NECP case we
propose a method of producing probability
distributions by creating sequentially larger
prediction intervals. The methods are compared
through a teaching schedule, to mimic a real-world
setting. For each model update in the teaching
schedule a grid-search approach is applied to select
each method’s optimal hyperparameters, respectively.
The methods are tested out of the box with tweaks to
few hyperparameters. We also introduce a normalized
nonconformity score and use it with the conformal
method that handles data that violates the
exchangeability assumption. The resulting
probability distributions are compared to actual
wind measurements through Continuous Ranked
Probability Scores (CRPS) as well as their validity
and efficiency of certain prediction intervals. Our
results suggest that the conformal based methods,
with the pre-trained underlying model, produce
slightly more conservative but more efficient
probability distributions than QRF at a lower
computational cost. We further propose how the
conformal-based methods could be improved for the
application to real-world scenarios. }
}
% 3 - 3
%18 pages
@InProceedings{choudhury23,
title = {Evaluating potential sensitive information leaks on
a smartphone using the magnetometer and Conformal
Prediction},
author = {Choudhury, Robert and Luo, Zhiyuan and Nguyen,
Khuong An},
pages = {116--133},
abstract = {The low powered sensors used in modern Smartphones
do not require permissions when using low sampling
rates i.e. 200Hz and below. This has made them a
target for side channel attacks. In this paper we
perform a series of experiments that harvest raw
data from the low powered sensor known as the
magnetometer. We start by using unsupervised
learning with the cosine metric to provide clear
indications if it is possible to classify the data
into the different security events occurring at the
time of capture. We then build a model, designed to
be robust in terms of the orientation of the device,
to evaluate the risk of sensitive data being
correctly identified from magnetometer data despite
the limited sampling rate. Using a model trained
with LSTM on the whole data set with an 80/20 split,
our results show 100\% accuracy on our reverse
Turing test and 67.5\% on the key press test. We
also show that when analysing the captured
magnetometer responses to playing sound samples from
the loudspeaker it is very difficult to infer the
original sound. We extend the work using Inductive
Conformal Prediction by examining the property of
uncertainty for different confidence levels. We also
show that despite a high degree of uncertainty there
is the potential to infer security properties such
as the layout of a screen. To this end we show that
the number 5 in the center of a keypad occurs a
disproportionately high number of times in the
prediction set (68.3\%).}
}
% 3 - 4
%13 pages
@InProceedings{mekkaoui23,
title = {Neural Networks based Conformal Prediction for
Pipeline Structural Response},
author = {El Mekkaoui, Sara and Ferreira, Carla J and Guevara
G'omez, Juan Camilo and Agrell, Christian and
Vaughan, Nicholas James and Heggen, Hans Olav},
pages = {134--146},
abstract = {The widespread use of machine learning models has
achieved considerable success across various
domains. Nevertheless, their deployment in
safety-critical systems can result in catastrophic
consequences if uncertainties are not handled
properly. This study is concerned with the
simulation of the physical response of a subsea
pipeline when it is hooked by an anchor. Predicting
this response is crucial for risk assessment,
however, it is computationally unfeasible to run a
significant amount of input sets to compute the
probability of failure of the system. Therefore, the
use of a surrogate model becomes essential. In this
context, a surrogate model is a machine learning
model trained on data from a physicsbased
simulation. This is achieved by neural network based
surrogate models, as they are capable of modelling
complex relationships and provide greater accuracy
than other machine learning models in many use
cases. However, to ensure the safe use of these
models, it is important to understand the
uncertainty associated with their
predictions. Therefore, we apply the conformal
prediction framework to provide valid prediction
intervals and improve the uncertainty quantification
of the neural network models. In order to create
adaptive conformal prediction intervals, we employ
multilayer perceptron neural network models that
provide uncertainty estimates through both the Monte
Carlo dropout technique and treating the output as a
Gaussian distribution, with the neural network
providing estimates for both mean and variance. The
conformal prediction procedure improves the
uncertainty estimation of uncalibrated models and
guarantees new test samples are within the predicted
intervals with the corresponding selected confidence
level.}
}
% 3 - 5
%19 pages
@InProceedings{uddin23,
title = {Applications of Conformal Regression on Real-world
Industrial Use Cases using Crepes and MAPIE},
author = {Uddin, Nasir and Lofstrom, Tuwe},
pages = {147--165},
abstract = {Applying conformal prediction in real-world
industrial use cases is rare, and publications are
often limited to popular open-source data sets. This
paper demonstrates two experimental use cases where
the conformal prediction framework was applied to
regression problems at Husqvarna Group with the two
Python-based open-source platforms MAPIE and Crepes.
The paper concludes by discussing lessons learned
for the industry and some challenges for the
conformal prediction community to address.}
}
% 3 - 6
%3 pages
@InProceedings{canete23b,
title = {Online NoVaS Conformal Volatility Prediction},
author = {Canete, Alejandro},
pages = {166--168}
}
% 4 - 1
% 3 pages
@InProceedings{pham23,
title = {Capturing prediction uncertainty in upstream cell
culture models using conformal prediction and
Gaussian processes},
author = {Pham, Tien Dung and Aickelin, Uwe and Bassett,
Robert},
pages = {169--171},
abstract = { }
}
% 4 - 2
%3 pages
@InProceedings{vishwakarma23b,
title = {Variable Sparing of Disk Drives Based on Failure
Analysis},
author = {Vishwakarma, Rahul and Fardadi, Mahshid and Liu,
Bing},
pages = {172--174}
}
% 4 - 3
%19 pages
@InProceedings{angelopoulos23,
title = {Recommendation Systems with Distribution-Free
Reliability Guarantees},
author = {Angelopoulos, Anastasios N and Krauth, Karl and
Bates, Stephen and Wang, Yixin and Jordan, Michael
I},
pages = {175--193},
abstract = {When building recommendation systems, we seek to
output a helpful set of items to the user. Under the
hood, a ranking model predicts which of two
candidate items is better, and we must distill these
pairwise comparisons into the user-facing
output. However, a learned ranking model is never
perfect, so taking its predictions at face value
gives no guarantee that the user-facing output is
reliable. Building from a pre-trained ranking model,
we show how to return a set of items that is
rigorously guaranteed to contain mostly good
items. Our procedure endows any ranking model with
rigorous nite-sample control of the false
discovery rate (FDR), regardless of the (unknown)
data distribution. Moreover, our calibration
algorithm enables the easy and principled
integration of multiple objectives in recommender
systems. As an example, we show how to optimize for
recommendation diversity subject to a user-specied
level of FDR control, circumventing the need to
specify ad hoc weights of a diversity loss against
an accuracy loss. Throughout, we focus on the
problem of learning to rank a set of possible
recommendations, evaluating our methods on the
Yahoo! Learning to Rank and MSMarco datasets.}
}
% 4 - 4
% 20 pages
@InProceedings{tebjou23,
title = {Data-driven Reachability using Christoffel Functions
and Conformal Prediction},
author = {Tebjou, Abdelmouaiz and Frehse, Goran and
Chamroukhi, Fa"{i}cel},
pages = {194--213},
abstract = {An important mathematical tool in the analysis of
dynamical systems is the approximation of the reach
set, i.e., the set of states reachable after a given
time from a given initial state. This set is
difficult to compute for complex systems even if the
system dynamics are known and given by a system of
ordinary differential equations with known
coefficients. In practice, parameters are often
unknown and mathematical models difficult to
obtain. Data-based approaches are promised to avoid
these difficulties by estimating the reach set based
on a sample of states. If a model is available, this
training set can be obtained through numerical
simulation. In the absence of a model, real-life
observations can be used instead. A recently
proposed approach for data-based reach set
approximation uses Christoffel functions to
approximate the reach set. Under certain
assumptions, the approximation is guaranteed to
converge to the true solution. In this paper, we
improve upon these results by notably improving the
sample efficiency and relaxing some of the
assumptions by exploiting statistical guarantees
from conformal prediction with training and
calibration sets. In addition, we exploit an
incremental way to compute the Christoffel function
to avoid the calibration set while maintaining the
statistical convergence guarantees. Furthermore, our
approach is robust to outliers in the training and
calibration set.}
}
% 4 - 5
%20 pages
@InProceedings{lienen23,
title = {Conformal Credal Self-Supervised Learning},
author = {Lienen, Julian and Demir, Caglar and Hullermeier,
Eyke},
pages = {214--233},
abstract = {In semi-supervised learning, the paradigm of
self-training refers to the idea of learning from
pseudo-labels suggested by the learner
itself. Recently, corresponding methods have proven
effective and achieve state-of-the-art performance,
e.g., when applied to image classification
problems. However, pseudo-labels typically stem from
ad-hoc heuristics, relying on the quality of the
predictions though without guaranteeing their
validity. One such method, so-called credal
self-supervised learning, maintains
pseudo-supervision in the form of sets of (instead
of single) probability distributions over labels,
thereby allowing for a flexible yet
uncertainty-aware labeling. Again, however, there is
no justification beyond empirical effectiveness. To
address this deficiency, we make use of conformal
prediction, an approach that comes with guarantees
on the validity of set-valued predictions. As a
result, the construction of credal sets of labels is
supported by a rigorous theoretical foundation,
leading to better calibrated and less error-prone
supervision for unlabeled data. Along with this, we
present effective algorithms for learning from
credal self-supervision. An empirical study
demonstrates excellent calibration properties of the
pseudo-supervision, as well as the competitiveness
of our method on several image classification
benchmark datasets.}
}
% 4 - 6
% 17 pages
@InProceedings{rodriguez23,
title = {Self Learning using Venn-Abers predictors},
author = {Rodriguez, Come and Martin Bordini, Vitor and
Destercke, Sebastien and Quost, Benjamin},
pages = {234--250},
abstract = {In supervised learning problems, it is common to
have a lot of unlabeled data, but little labeled
data. It is then desirable to leverage the unlabeled
data to improve the learning procedure. One way to
do this is to have a model predict “pseudolabels”
for the unlabeled data, so as to use them for
learning. In self-learning, the pseudo-labels are
provided by the very same model to which they are
fed. As these pseudo-labels are by nature uncertain
and only partially reliable, it is then natural to
model this uncertainty and take it into account in
the learning process, if only to robustify the
self-learning procedure. This paper describes such
an approach, where we use Venn-Abers Predictors to
produce calibrated credal labels so as to quantify
the pseudo-labeling uncertainty. These labels are
then included in the learning process by optimizing
an adapted loss. Experiments show that taking into
account pseudo-label uncertainty both robustifies
the self-learning procedure and allows it to
converge faster in general.}
}
%% 5 POSTERS with extended abstracts %%
% 5 - 1
%16 pages
@InProceedings{javanmardi23,
title = {Conformal Prediction with Partially Labeled Data},
author = {Javanmardi, Alireza and Sale, Yusuf and Hofman, Paul
and H"ullermeier, Eyke},
pages = {251--266},
abstract = {While the predictions produced by conformal
prediction are set-valued, the data used for
training and calibration is supposed to be
precise. In the setting of superset learning or
learning from partial labels, a variant of weakly
supervised learning, it is exactly the other way
around: training data is possibly imprecise
(set-valued), but the model induced from this data
yields precise predictions. In this paper, we
combine the two settings by making conformal
prediction amenable to set-valued training data. We
propose a generalization of the conformal prediction
procedure that can be applied to set-valued training
and calibration data. We prove the validity of the
proposed method and present experimental studies in
which it compares favorably to natural baselines.}
}
% 5 - 2
%20 pages
@InProceedings{nouretdinov23a,
title = {Conformal Association Rule Mining (CARM): A novel
technique for data error detection and probabilistic
correction},
author = {Nouretdinov, Ilia and Gammerman, James},
pages = {267--286},
abstract = {Conformal prediction (CP) is a modern framework for
reliable machine learning. It is most commonly used
in the context of supervised learning, where in
combination with an underlying algorithm it
generates predicted labels for new, unlabelled
examples and complements each of them with an
individual measure of confidence. Conversely,
association rule mining (ARM) is an unsupervised
learning technique for discovering interesting
relationships in large datasets in the form of
rules. In this work, we integrate CP and ARM to
develop a novel technique termed Conformal
Association Rule Mining (CARM). The technique
enables the identification of probable errors within
a set of binary labels. Subsequently, these probable
errors are analysed using another modern framework
called Venn-ABERS prediction to correct the value in
a probabilistic way.}
}
% 5 - 3
%24 pages
@InProceedings{luo23,
title = {Anomalous Edge Detection in Edge Exchangeable Social
Network Models},
author = {Luo, Rui and Nettasinghe, Buddhika and
Krishnamurthy, Vikram},
pages = {287--310},
abstract = {This paper studies detecting anomalous edges in
directed graphs that model social networks. We
exploit edge exchangeability as a criterion for
distinguishing anomalous edges from normal
edges. Then we present an anomaly detector based on
conformal prediction theory; this detector has a
guaranteed upper bound for false positive rate. In
numerical experiments, we show that the proposed
algorithm achieves superior performance to baseline
methods.}
}
% 5 - 4
%13 pages
@InProceedings{ennadir23,
title = {Conformalized Adversarial Attack Detection for Graph
Neural Networks},
author = {Ennadir, Sofiane and Alkhatib, Amr and Bostrom,
Henrik and Vazirgiannis, Michalis},
pages = {311--323},
abstract = {Graph Neural Networks (GNNs) have achieved
remarkable performance on diverse graph
representation learning tasks. However, recent
studies have unveiled their susceptibility to
adversarial attacks, leading to the development of
various defense techniques to enhance their
robustness. In this work, instead of improving the
robustness, we propose a framework to detect
adversarial attacks and provide an adversarial
certainty score in the prediction. Our framework
evaluates whether an input graph significantly
deviates from the original data and provides a
well-calibrated p-value based on this score through
the conformal paradigm, therby controlling the false
alarm rate. We demonstrate the effectiveness of our
approach on various benchmark datasets. Although we
focus on graph classification, the proposed
framework can be readily adapted for other
graph-related tasks, such as node classification.}
}
% 5 - 5
%4 pages
@InProceedings{prinster23,
title = {Efficient Approximate Predictive Inference Under
Feedback Covariate Shift with Influence Functions},
author = {Prinster, Drew and Saria, Suchi and Liu, Anqi},
pages = {324--327}
}
%% invited talks
%19 pages
@InProceedings{eliades23,
title = {A Conformal Martingales Ensemble Approach for
addressing Concept Drift},
author = {Eliades, Charalambos and Papadopoulos, Harris},
pages = {328--346},
abstract = {We propose an ensemble learning approach to tackle
the problem of concept drift (CD) in data-stream
classication. Accurately detecting the change
point in the distribution is insufficient to ensure
precise predictions, particularly when the selection
of a representative training set is challenging or
computationally expensive. More specically, we
employ an ensemble of ten classiers that use a
majority voting mechanism to make predictions. To
promote diversity among models, we train each on a
different number of instances, resulting in
different sequences of p-values and construct an
Inductive Conformal Martingale (ICM) for each
one. When the ICM algorithm detects a change point
in the corresponding p-value sequence, we perform a
retraining process of the corresponding
classier. We evaluate the performance of our
proposed methodology on four benchmark datasets and
compare it to existing methods in the
literature. Our experimental results show that the
proposed approach exhibits comparable and in some
cases better accuracy than two state-of-the-art
algorithms.}
}
%20 pages
@InProceedings{vovk23,
title = {The power of forgetting in statistical hypothesis
testing},
author = {Vovk, Vladimir},
pages = {347--366},
abstract = {This paper places conformal testing in a general
framework of statistical hypothesis testing. A
standard approach to testing a composite null
hypothesis H is to test each of its elements and to
reject H when each of its elements is rejected. It
turns out that we can fully cover conformal testing
using this approach only if we allow forgetting some
of the data. However, we will see that the standard
approach covers conformal testing in a weak
asymptotic sense and under restrictive
assumptions. I will also list several possible
directions of further research, including developing
a general scheme of online testing.}
}
%2 pages
@InProceedings{nouretdinov23b,
title = {The Venn-ABERS Testing for Change-Point Detection},
author = {Nouretdinov, Ilia and Gammerman, Alex},
pages = {367--368}
}
%15 pages
@InProceedings{kato23,
title = {A Review of Nonconformity Measures for Conformal
Prediction in Regression},
author = {Kato, Yuko and Tax, David M.J. and Loog, Marco},
pages = {369--383},
abstract = {Conformal prediction provides distribution-free
uncertainty quantification under minimal
assumptions. An important ingredient in conformal
prediction is the so-called nonconformity measure,
which quantifies how the test sample differs from
the rest of the data. In this paper, existing
nonconformity measures from the current literature
are collected and their underlying ideas are
analyzed. Furthermore, the influence of different
factors on the performance of conformal prediction
are pointed out by focusing on the relation between
the influencing factors and the choice of
nonconformity measures. Lastly, we provide
suggestions for future work with regard to currently
existing knowledge gaps and development of new
nonconformity measures.}
}
%15 pages
@InProceedings{colombo23,
title = {On training locally adaptive CP},
author = {Colombo, Nicolo},
pages = {384--398},
abstract = {We address the problem of making Conformal
Prediction (CP) intervals locally adaptive. Most
existing methods focus on approximating the
object-conditional validity of the intervals by
partitioning or re-weighting the calibration
set. Our strategy is new and conceptually
different. Instead of re-weighting the calibration
data, we redefine the conformity measure through a
trainable change of variables, A → $\phi$X(A), that
depends explicitly on the object attributes,
X. Under certain conditions and if $\phi$X is
monotonic in A for any X, the transformations
produce prediction intervals that are guaranteed to
be marginally valid and have X-dependent sizes. We
describe how to parameterize and train $\phi$X to
maximize the interval efficiency. Contrary to other
CP-aware training methods, the objective function is
smooth and can be minimized through standard
gradient methods without approximations.}
}
%14 pages
@InProceedings{bostrom23,
title = {Mondrian Predictive Systems for Censored Data},
author = {Bostrom, Henrik and Linusson, Henrik and Vesterberg,
Anders},
pages = {399--412},
abstract = {Conformal predictive systems output predictions in
the form of well-calibrated cumulative distribution
functions (conformal predictive distributions). In
this paper, we apply conformal predictive systems to
the problem of time-to-event prediction, where the
conformal predictive distribution for a test object
may be used to obtain the expected time until an
event occurs, as well as p-values for an event to
take place earlier (or later) than some specified
time points. Specifically, we target right-censored
time-to-event prediction tasks, i.e., situations in
which the true time-to-event for a particular
training example may be unknown due to observation
of the example ending before any event occurs. By
leveraging the Kaplan-Meier estimator, we develop a
procedure for constructing Mondrian predictive
systems that are able to produce well-calibrated
cumulative distribution functions for right-censored
time-to-event prediction tasks. We show that the
proposed procedure is guaranteed to produce
conservatively valid predictive distributions, and
provide empirical support using simulated censoring
on benchmark data. The proposed approach is
contrasted with established techniques for survival
analysis, including random survival forests and
censored quantile regression forests, using both
synthetic and non-synthetic censoring.}
}
%17 pages
@InProceedings{giovannotti23,
title = {Evaluating Machine Translation Quality with
Conformal Predictive Distributions},
author = {Giovannotti, Patrizio},
pages = {413--429},
abstract = {This paper presents a new approach for assessing
uncertainty in machine translation by simultaneously
evaluating translation quality and providing a
reliable confidence score. Our approach utilizes
conformal predictive distributions to produce
prediction intervals with guaranteed coverage,
meaning that for any given significance level
$\epsilon$, we can expect the true quality score of
a translation to fall out of the interval at a rate
of 1 - $\epsilon$. In this paper, we demonstrate how
our method outperforms a simple, but effective
baseline on six different language pairs in terms of
coverage and sharpness. Furthermore, we validate
that our approach requires the data exchangeability
assumption to hold for optimal performance.}
}
%20 pages
@InProceedings{trunov23,
title = {Online aggregation of conformal predictive systems},
author = {Trunov, Vladimir G. and {V'yugin}, Vladimir V.},
pages = {430--449},
abstract = {The problem of online probabilistic forecasting is
considered. Probabilistic forecasts are obtained as
a result of the application of conformal predictive
systems. The conformal predictive system is a novel
method for obtaining reliable predictions which are
based on point forecasts of the regression
algorithm. The paper considers the case when at each
moment of time several competing conformal
predictive systems (experts) give their predictions
in the form of probability distribution
functions. Probabilistic forecasts of the experts
are combined by an aggregation algorithm into one
probabilistic forecast at each step of the
forecasting process, while expert forecasts can be
used partially. The developed methods are used to
solve the well-known problem of predicting the load
of an electrical network online. Numerical
experiments have shown the agreement of predictions
with real data.}
}
%20 pages
@InProceedings{alkhatib23,
title = {Approximating Score-based Explanation Techniques
Using Conformal Regression},
author = {Alkhatib, Amr and Bostrom, Henrik and Ennadir,
Sofiane and Johansson, Ulf},
pages = {450--469},
abstract = {Score-based explainable machine-learning techniques
are often used to understand the logic behind
black-box models. However, such explanation
techniques are often computationally expensive,
which limits their application in time-critical
contexts. Therefore, we propose and investigate the
use of computationally less costly regression models
for approximating the output of score-based
explanation techniques, such as SHAP. Moreover,
validity guarantees for the approximated values are
provided by the employed inductive conformal
prediction framework. We propose several
non-conformity measures designed to take the
difficulty of approximating the explanations into
account while keeping the computational cost low. We
present results from a large-scale empirical
investigation, in which the approximate explanations
generated by our proposed models are evaluated with
respect to efficiency (interval size). The results
indicate that the proposed method can significantly
improve execution time compared to the fast version
of SHAP, TreeSHAP. The results also suggest that the
proposed method can produce tight intervals, while
providing validity guarantees. Moreover, the
proposed approach allows for comparing explanations
of different approximation methods and selecting a
method based on how informative (tight) are the
predicted intervals.}
}
%15 pages
@InProceedings{gauraha23,
title = {Investigating the Contribution of Privileged
Information in Knowledge Transfer LUPI by
Explainable Machine Learning},
author = {Gauraha, Niharika and Bostrom, Henrik},
pages = {470--484},
abstract = {Learning Under Privileged Information (LUPI) is a
framework that exploits information that is
available during training only, i.e., the privileged
information (PI), to improve the classification of
objects for which this information is not
available. Knowledge transfer LUPI (KT-LUPI) extends
the framework by inferring PI for the test objects
through separate predictive models. Although the
effectiveness of the framework has been thoroughly
demonstrated, current investigations have provided
limited insights only regarding what parts of the
transferred PI contribute to the improved
performance. A better understanding of this could
not only lead to computational savings but
potentially also to novel strategies for exploiting
PI. We approach the problem by exploring the use of
explainable machine learning through the
state-of-the-art technique SHAP, to analyze the
contribution of the transferred privileged
information. We present results from experiments
with five classification and three regression
datasets, in which we compare the Shapley values of
the PI computed in two different settings; one where
the PI is assumed to be available during both
training and testing, hence representing an ideal
scenario, and a second setting, in which the PI is
available during training only but is transferred to
test objects, through KT-LUPI. The results indicate
that explainable machine learning indeed has the
potential as a tool to gain insights regarding the
effectiveness of KT-LUPI.}