-
Notifications
You must be signed in to change notification settings - Fork 0
/
dphil.bib
1985 lines (1742 loc) · 63.6 KB
/
dphil.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
% Encoding: UTF-8
@inproceedings{AhmedEtAl2012,
  author       = {Ahmed, Amr and Aly, Mohamed and Gonzalez, Joseph and Narayanamurthy, Shravan and Smola, Alexander J},
  title        = {Scalable inference in latent variable models},
  booktitle    = {Proceedings of the Fifth {ACM} International Conference on Web Search and Data Mining},
  pages        = {123--132},
  year         = {2012},
  organization = {ACM},
}
@article{AndrychowiczEtAl2016,
  author  = {Andrychowicz, Marcin and Denil, Misha and Gomez, Sergio and Hoffman, Matthew W and Pfau, David and Schaul, Tom and de Freitas, Nando},
  title   = {Learning to learn by gradient descent by gradient descent},
  journal = {arXiv preprint arXiv:1606.04474v1 [cs.NE]},
  year    = {2016},
}
@article{ArcherEtAl2015,
  author  = {Archer, Evan and Park, Il Memming and Buesing, Lars and Cunningham, John and Paninski, Liam},
  title   = {Black box variational inference for state space models},
  journal = {arXiv preprint arXiv:1511.07367v1 [stat.ML]},
  year    = {2015},
}
@article{ArjovskyEtAl2017,
  author  = {Arjovsky, Martin and Chintala, Soumith and Bottou, L{\'e}on},
  title   = {{Wasserstein} {GAN}},
  journal = {arXiv preprint arXiv:1701.07875v2 [cs.LG]},
  year    = {2017},
}
@article{BaEtAl2016,
  author  = {Ba, Jimmy Lei and Kiros, Jamie Ryan and Hinton, Geoffrey E},
  title   = {Layer normalization},
  journal = {arXiv preprint arXiv:1607.06450v1 [stat.ML]},
  year    = {2016},
}
@inproceedings{BartlettEtAl2010,
  author    = {Bartlett, Nicholas and Pfau, David and Wood, Frank},
  title     = {Forgetting counts: Constant memory inference for a dependent hierarchical {Pitman--Yor} process},
  booktitle = {Proceedings of the 27th International Conference on Machine Learning (ICML-10)},
  pages     = {63--70},
  year      = {2010},
}
@article{Bengio2009,
  author    = {Bengio, Yoshua},
  title     = {Learning deep architectures for {AI}},
  journal   = {Foundations and Trends{\textregistered} in Machine Learning},
  volume    = {2},
  number    = {1},
  pages     = {1--127},
  year      = {2009},
  publisher = {Now Publishers Inc.},
}
@inproceedings{BengioBengio1999,
  author    = {Bengio, Yoshua and Bengio, Samy},
  title     = {Modeling High-Dimensional Discrete Data with Multi-Layer Neural Networks},
  booktitle = {Advances in Neural Information Processing Systems},
  volume    = {12},
  pages     = {400--406},
  year      = {1999},
}
@article{BengioEtAl2013,
  author    = {Bengio, Yoshua and Courville, Aaron and Vincent, Pascal},
  title     = {Representation learning: A review and new perspectives},
  journal   = {{IEEE} Transactions on Pattern Analysis and Machine Intelligence},
  volume    = {35},
  number    = {8},
  pages     = {1798--1828},
  year      = {2013},
  publisher = {IEEE},
}
@article{BengioEtAl2015,
  author  = {Bengio, Yoshua and Lee, Dong-Hyun and Bornschein, J{\"o}rg and Lin, Zhouhan},
  title   = {Towards biologically plausible deep learning},
  journal = {arXiv preprint arXiv:1502.04156v2 [cs.LG]},
  year    = {2015},
}
@article{BengioEtAl2016,
  author  = {Bengio, Yoshua and Scellier, Benjamin and Bilaniuk, Olexa and Sacramento, Joao and Senn, Walter},
  title   = {Feedforward Initialization for Fast Inference of Deep Generative Networks is biologically plausible},
  journal = {arXiv preprint arXiv:1606.01651v2 [cs.LG]},
  year    = {2016},
}
@techreport{Bishop1994,
  author      = {Bishop, Christopher M},
  title       = {Mixture density networks},
  institution = {Aston University},
  number      = {NCRG/94/004},
  year        = {1994},
}
@article{BleiEtAl2016,
  author  = {Blei, David M and Kucukelbir, Alp and McAuliffe, Jon D},
  title   = {Variational inference: A review for statisticians},
  journal = {arXiv preprint arXiv:1601.00670v2 [stat.CO]},
  year    = {2016},
}
@article{BornscheinEtAl2014,
  author  = {Bornschein, J{\"o}rg and Bengio, Yoshua},
  title   = {Reweighted wake-sleep},
  journal = {arXiv preprint arXiv:1406.2751v4 [cs.LG]},
  year    = {2015},
}
@article{BornscheinEtAl2016,
  author  = {Bornschein, J{\"o}rg and Shabanian, Samira and Fischer, Asja and Bengio, Yoshua},
  title   = {Bidirectional {Helmholtz} Machines},
  journal = {arXiv preprint arXiv:1506.03877v5 [cs.LG]},
  year    = {2016},
}
@article{Bottou2014,
  author    = {Bottou, L{\'e}on},
  title     = {From machine learning to machine reasoning},
  journal   = {Machine Learning},
  volume    = {94},
  number    = {2},
  pages     = {133--149},
  year      = {2014},
  publisher = {Springer},
}
@article{BoulangerLewandowskiEtAl2012,
  author  = {Boulanger-Lewandowski, Nicolas and Bengio, Yoshua and Vincent, Pascal},
  title   = {Modeling temporal dependencies in high-dimensional sequences: Application to polyphonic music generation and transcription},
  journal = {arXiv preprint arXiv:1206.6392v1 [cs.LG]},
  year    = {2012},
}
@article{BowmanEtAl2015,
  author  = {Bowman, Samuel R and Vilnis, Luke and Vinyals, Oriol and Dai, Andrew M and Jozefowicz, Rafal and Bengio, Samy},
  title   = {Generating sentences from a continuous space},
  journal = {arXiv preprint arXiv:1511.06349v4 [cs.LG]},
  year    = {2015},
}
@article{BurdaEtAl2016,
  author  = {Burda, Yuri and Grosse, Roger and Salakhutdinov, Ruslan},
  title   = {Importance weighted autoencoders},
  journal = {arXiv preprint arXiv:1509.00519v3 [cs.LG]},
  year    = {2016},
}
@inproceedings{ChenEtAl2014,
  author    = {Chen, Tianqi and Fox, Emily and Guestrin, Carlos},
  title     = {Stochastic Gradient {Hamiltonian} {Monte} {Carlo}},
  booktitle = {Proceedings of the 31st International Conference on Machine Learning (ICML-14)},
  pages     = {1683--1691},
  year      = {2014},
}
@article{ChenEtAl2016,
  author  = {Chen, Xi and Kingma, Diederik P. and Salimans, Tim and Duan, Yan and Dhariwal, Prafulla and Schulman, John and Sutskever, Ilya and Abbeel, Pieter},
  title   = {Variational lossy autoencoder},
  journal = {arXiv preprint arXiv:1611.02731 [cs.LG]},
  year    = {2016},
}
@article{ChoEtAl2014,
  author  = {Cho, Kyunghyun and van Merri{\"e}nboer, Bart and Bahdanau, Dzmitry and Bengio, Yoshua},
  title   = {On the properties of neural machine translation: Encoder-decoder approaches},
  journal = {arXiv preprint arXiv:1409.1259v2 [cs.CL]},
  year    = {2014},
}
@article{ChungEtAl2014,
  author  = {Chung, Junyoung and G{\"u}l{\c{c}}ehre, Caglar and Cho, Kyunghyun and Bengio, Yoshua},
  title   = {Empirical evaluation of gated recurrent neural networks on sequence modeling},
  journal = {arXiv preprint arXiv:1412.3555v1 [cs.NE]},
  year    = {2014},
}
@article{ChungEtAl2015,
  author  = {Chung, Junyoung and G{\"u}l{\c{c}}ehre, Caglar and Cho, Kyunghyun and Bengio, Yoshua},
  title   = {Gated feedback recurrent neural networks},
  journal = {arXiv preprint arXiv:1502.02367},
  year    = {2015},
}
@article{ChungEtAl2016,
  author  = {Chung, Junyoung and Ahn, Sungjin and Bengio, Yoshua},
  title   = {Hierarchical Multiscale Recurrent Neural Networks},
  journal = {arXiv preprint arXiv:1609.01704v2 [cs.LG]},
  year    = {2016},
}
@article{Cusumano2018,
  author  = {Cusumano-Towner, Marco F and Mansinghka, Vikash K},
  title   = {Using probabilistic programs as proposals},
  journal = {arXiv preprint arXiv:1801.03612},
  year    = {2018},
}
@inproceedings{DauphinGrangier2016,
  author    = {Dauphin, Yann N and Grangier, David},
  title     = {Predicting distributions with Linearizing Belief Networks},
  booktitle = {4th International Conference on Learning Representations (ICLR)},
  year      = {2016},
}
@inproceedings{DeanEtAl2012,
  author    = {Dean, Jeffrey and Corrado, Greg and Monga, Rajat and Chen, Kai and Devin, Matthieu and Mao, Mark and Senior, Andrew and Tucker, Paul and Yang, Ke and Le, Quoc V and others},
  title     = {Large scale distributed deep networks},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {1223--1231},
  year      = {2012},
}
@article{DuEtAl2016,
  author  = {Du, Chao and Zhu, Jun and Zhang, Bo},
  title   = {Learning Deep Generative Models with Doubly Stochastic {MCMC}},
  journal = {arXiv preprint arXiv:1506.04557v4 [cs.LG]},
  year    = {2016},
}
@book{EricssonPool2016,
  author    = {Ericsson, Anders and Pool, Robert},
  title     = {Peak: Secrets from the New Science of Expertise},
  publisher = {Bodley Head},
  year      = {2016},
}
@article{FishelsonGeiger2004,
  author    = {Fishelson, Ma'ayan and Geiger, Dan},
  title     = {Optimizing exact genetic linkage computations},
  journal   = {Journal of Computational Biology},
  volume    = {11},
  number    = {2--3},
  pages     = {263--275},
  year      = {2004},
  publisher = {Mary Ann Liebert, Inc.},
}
@article{FraccaroEtAl2016,
  author  = {Fraccaro, Marco and S{\o}nderby, S{\o}ren Kaae and Paquet, Ulrich and Winther, Ole},
  title   = {Sequential Neural Models with Stochastic Layers},
  journal = {arXiv preprint arXiv:1605.07571},
  year    = {2016},
}
@inproceedings{GanEtAl2015,
  author    = {Gan, Zhe and Li, Chunyuan and Henao, Ricardo and Carlson, David E and Carin, Lawrence},
  title     = {Deep temporal sigmoid belief networks for sequence modeling},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {2458--2466},
  year      = {2015},
}
@inproceedings{GanEtAl2015b,
  author    = {Gan, Zhe and Henao, Ricardo and Carlson, David E and Carin, Lawrence},
  title     = {Learning Deep Sigmoid Belief Networks with Data Augmentation},
  booktitle = {Proceedings of the Eighteenth International Conference on Artificial Intelligence and Statistics (AISTATS)},
  year      = {2015},
}
@inproceedings{GasthausEtAl2010,
  author       = {Gasthaus, Jan and Wood, Frank and Teh, Yee Whye},
  title        = {Lossless compression based on the sequence memoizer},
  booktitle    = {Data Compression Conference (DCC), 2010},
  pages        = {337--345},
  year         = {2010},
  organization = {IEEE},
}
@inproceedings{GasthausTeh2010,
  author    = {Gasthaus, Jan and Teh, Yee Whye},
  title     = {Improvements to the sequence memoizer},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {685--693},
  year      = {2010},
}
@article{GelmanEtAl2014,
  author  = {Gelman, Andrew and Vehtari, Aki and Jyl{\"a}nki, Pasi and Robert, Christian and Chopin, Nicolas and Cunningham, John P},
  title   = {Expectation propagation as a way of life},
  journal = {arXiv preprint arXiv:1412.4869},
  year    = {2014},
}
@inproceedings{GermainEtAl2015,
  author    = {Germain, Mathieu and Gregor, Karol and Murray, Iain and Larochelle, Hugo},
  title     = {{MADE}: Masked autoencoder for distribution estimation},
  booktitle = {Proceedings of the 32nd International Conference on Machine Learning (ICML-15)},
  pages     = {881--889},
  year      = {2015},
}
@article{GersEtAl2000,
  author    = {Gers, Felix A and Schmidhuber, J{\"u}rgen and Cummins, Fred},
  title     = {Learning to forget: Continual prediction with {LSTM}},
  journal   = {Neural Computation},
  volume    = {12},
  number    = {10},
  pages     = {2451--2471},
  year      = {2000},
  publisher = {MIT Press},
}
@inproceedings{GersSchmidhuber2000,
  author       = {Gers, Felix A and Schmidhuber, J{\"u}rgen},
  title        = {Recurrent nets that time and count},
  booktitle    = {Proceedings of the {IEEE-INNS-ENNS} International Joint Conference on Neural Networks ({IJCNN} 2000)},
  volume       = {3},
  pages        = {189--194},
  year         = {2000},
  organization = {IEEE},
}
@inproceedings{Gershman2014,
  author    = {Gershman, Samuel J and Goodman, Noah D},
  title     = {Amortized inference in probabilistic reasoning},
  booktitle = {Proceedings of the 36th Annual Conference of the Cognitive Science Society},
  year      = {2014},
}
@inproceedings{Ghahramani1996,
  author    = {Ghahramani, Zoubin and Jordan, Michael I},
  title     = {Factorial hidden {Markov} models},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {472--478},
  year      = {1996},
}
@article{Ghahramani2015,
  author    = {Ghahramani, Zoubin},
  title     = {Probabilistic machine learning and artificial intelligence},
  journal   = {Nature},
  volume    = {521},
  number    = {7553},
  pages     = {452--459},
  year      = {2015},
  publisher = {Nature Publishing Group},
}
@article{GibbsSu2002,
  author    = {Gibbs, Alison L. and Su, Francis Edward},
  title     = {On Choosing and Bounding Probability Metrics},
  journal   = {International Statistical Review},
  volume    = {70},
  number    = {3},
  pages     = {419--435},
  year      = {2002},
  publisher = {Blackwell Publishing Ltd},
  issn      = {1751-5823},
  doi       = {10.1111/j.1751-5823.2002.tb00178.x},
  url       = {http://dx.doi.org/10.1111/j.1751-5823.2002.tb00178.x},
  keywords  = {Discrepancy, Hellinger distance, Probability metrics, Prokhorov metric, Relative entropy, Rates of convergence, Wasserstein distance},
}
@inproceedings{GoodfellowEtAl2014,
  author    = {Goodfellow, Ian and Pouget-Abadie, Jean and Mirza, Mehdi and Xu, Bing and Warde-Farley, David and Ozair, Sherjil and Courville, Aaron and Bengio, Yoshua},
  title     = {Generative adversarial nets},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {2672--2680},
  year      = {2014},
}
@book{GoodfellowEtAl2016,
  author    = {Goodfellow, Ian and Bengio, Yoshua and Courville, Aaron},
  title     = {Deep Learning},
  publisher = {MIT Press},
  year      = {2016},
  url       = {http://www.deeplearningbook.org},
}
@inproceedings{Goodman2013,
  author       = {Goodman, Noah D},
  title        = {The principles and practice of probabilistic programming},
  booktitle    = {ACM SIGPLAN Notices},
  volume       = {48},
  number       = {1},
  pages        = {399--402},
  year         = {2013},
  organization = {ACM},
}
@inproceedings{GoodmanEtAl2008,
  author    = {Goodman, Noah D. and Mansinghka, Vikash K. and Roy, Daniel M. and Bonawitz, Keith and Tenenbaum, Joshua B.},
  title     = {{Church}: A language for generative models},
  booktitle = {Proceedings of the 24th Conference on Uncertainty in Artificial Intelligence, {UAI} 2008},
  pages     = {220--229},
  year      = {2008},
}
@article{Graves2016,
  author  = {Graves, Alex},
  title   = {Adaptive Computation Time for Recurrent Neural Networks},
  journal = {arXiv preprint arXiv:1603.08983v4 [cs.NE]},
  year    = {2016},
}
@article{GravesEtAl2014,
  author  = {Graves, Alex and Wayne, Greg and Danihelka, Ivo},
  title   = {Neural {Turing} machines},
  journal = {arXiv preprint arXiv:1410.5401v2 [cs.NE]},
  year    = {2014},
}
@article{GravesSchmidhuber2005,
  author    = {Graves, Alex and Schmidhuber, J{\"u}rgen},
  title     = {Framewise phoneme classification with bidirectional {LSTM} and other neural network architectures},
  journal   = {Neural Networks},
  volume    = {18},
  number    = {5},
  pages     = {602--610},
  year      = {2005},
  publisher = {Elsevier},
}
@article{GreffEtAl2015,
  author  = {Greff, Klaus and Srivastava, Rupesh Kumar and Koutn{\'\i}k, Jan and Steunebrink, Bas R and Schmidhuber, J{\"u}rgen},
  title   = {{LSTM}: A search space odyssey},
  journal = {arXiv preprint arXiv:1503.04069},
  year    = {2015},
}
@article{GregorEtAl2015,
  author  = {Gregor, Karol and Danihelka, Ivo and Graves, Alex and Rezende, Danilo Jimenez and Wierstra, Daan},
  title   = {{DRAW}: A recurrent neural network for image generation},
  journal = {arXiv preprint arXiv:1502.04623v2 [cs.CV]},
  year    = {2015},
}
@article{GrettonEtAl2012,
  author  = {Gretton, Arthur and Borgwardt, Karsten M and Rasch, Malte J and Sch{\"o}lkopf, Bernhard and Smola, Alexander},
  title   = {A kernel two-sample test},
  journal = {Journal of Machine Learning Research},
  volume  = {13},
  number  = {25},
  pages   = {723--773},
  month   = mar,
  year    = {2012},
}
@inproceedings{GuEtAl2015,
  author    = {Gu, Shixiang and Ghahramani, Zoubin and Turner, Richard E},
  title     = {Neural Adaptive Sequential {Monte} {Carlo}},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {2629--2637},
  year      = {2015},
}
@article{GulrajaniEtAl2017,
  author  = {Gulrajani, Ishaan and Ahmed, Faruk and Arjovsky, Martin and Dumoulin, Vincent and Courville, Aaron},
  title   = {Improved Training of {Wasserstein} {GANs}},
  journal = {arXiv preprint arXiv:1704.00028},
  year    = {2017},
}
@article{Harik2010,
  author  = {Harik, Georges and Shazeer, Noam},
  title   = {Variational program inference},
  journal = {arXiv preprint arXiv:1006.0991},
  year    = {2010},
}
@article{HasencleverWebb2016,
  author  = {Hasenclever, Leonard and Webb, Stefan and Lienart, Thibaut and Vollmer, Sebastian and Teh, Yee Whye and Lakshminarayanan, Balaji and Blundell, Charles},
  title   = {Distributed Bayesian Learning with Stochastic Natural-gradient Expectation Propagation and the Posterior Server},
  journal = {(In preparation)},
  year    = {2016},
}
@article{HeEtAl2016,
  author  = {He, Kaiming and Zhang, Xiangyu and Ren, Shaoqing and Sun, Jian},
  title   = {Identity mappings in deep residual networks},
  journal = {arXiv preprint arXiv:1603.05027v2 [cs.CV]},
  year    = {2016},
}
@inproceedings{HenaoEtAl2015,
  author    = {Henao, Ricardo and Gan, Zhe and Lu, James and Carin, Lawrence},
  title     = {Deep {Poisson} factor modeling},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {2800--2808},
  year      = {2015},
}
@article{HintonEtAl2012,
  author    = {Hinton, Geoffrey and Deng, Li and Yu, Dong and Dahl, George E and Mohamed, Abdel-rahman and Jaitly, Navdeep and Senior, Andrew and Vanhoucke, Vincent and Nguyen, Patrick and Sainath, Tara N and others},
  title     = {Deep neural networks for acoustic modeling in speech recognition: The shared views of four research groups},
  journal   = {IEEE Signal Processing Magazine},
  volume    = {29},
  number    = {6},
  pages     = {82--97},
  year      = {2012},
  publisher = {IEEE},
}
@article{HochreiterSchmidhuber1997,
  author    = {Hochreiter, Sepp and Schmidhuber, J{\"u}rgen},
  title     = {Long short-term memory},
  journal   = {Neural Computation},
  volume    = {9},
  number    = {8},
  pages     = {1735--1780},
  year      = {1997},
  publisher = {MIT Press},
}
@article{HoffmanEtAl2013,
  author    = {Hoffman, Matthew D and Blei, David M and Wang, Chong and Paisley, John},
  title     = {Stochastic variational inference},
  journal   = {Journal of Machine Learning Research},
  volume    = {14},
  number    = {1},
  pages     = {1303--1347},
  year      = {2013},
  publisher = {JMLR.org},
}
@article{HoffmanGelman2014,
  author    = {Hoffman, Matthew D and Gelman, Andrew},
  title     = {The {No-U-Turn} sampler: Adaptively setting path lengths in {Hamiltonian} {Monte} {Carlo}},
  journal   = {Journal of Machine Learning Research},
  volume    = {15},
  number    = {1},
  pages     = {1593--1623},
  year      = {2014},
  publisher = {JMLR.org},
}
@article{HuangEtAl2016,
  author  = {Huang, Gao and Sun, Yu and Liu, Zhuang and Sedra, Daniel and Weinberger, Kilian},
  title   = {Deep networks with stochastic depth},
  journal = {arXiv preprint arXiv:1603.09382v2 [cs.LG]},
  year    = {2016},
}
@article{Huet1997,
  author    = {Huet, G{\'e}rard},
  title     = {The zipper},
  journal   = {Journal of Functional Programming},
  volume    = {7},
  number    = {5},
  pages     = {549--554},
  year      = {1997},
  publisher = {Cambridge University Press},
}
@inproceedings{JangEtAl2016,
  author    = {Jang, Eric and Gu, Shixiang and Poole, Ben},
  title     = {Categorical Reparameterization with {Gumbel-Softmax}},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year      = {2017},
}
@article{JohnsonEtAl2016,
  author  = {Johnson, Matthew J and Duvenaud, David and Wiltschko, Alexander B and Datta, Sandeep R and Adams, Ryan P},
  title   = {Composing graphical models with neural networks for structured representations and fast inference},
  journal = {arXiv preprint arXiv:1603.06277v2 [stat.ML]},
  year    = {2016},
}
@unpublished{JordanTeh2014,
  author = {Jordan, Michael I. and Teh, Yee Whye},
  title  = {A gentle introduction to the {Dirichlet} process, the beta process and {Bayesian} nonparametrics [{DRAFT}]},
  note   = {Unpublished},
  year   = {2014},
}
@article{Kahn1962,
  author    = {Kahn, Arthur B},
  title     = {Topological sorting of large networks},
  journal   = {Communications of the ACM},
  volume    = {5},
  number    = {11},
  pages     = {558--562},
  year      = {1962},
  publisher = {ACM},
}
@article{KalchbrennerEtAl2016a,
  author  = {Kalchbrenner, Nal and Danihelka, Ivo and Graves, Alex},
  title   = {Grid long short-term memory},
  journal = {arXiv preprint arXiv:1507.01526v3 [cs.NE]},
  year    = {2015},
}
@article{KalchbrennerEtAl2016b,
  author  = {Kalchbrenner, Nal and van den Oord, A{\"a}ron and Simonyan, Karen and Danihelka, Ivo and Vinyals, Oriol and Graves, Alex and Kavukcuoglu, Koray},
  title   = {Video pixel networks},
  journal = {arXiv preprint arXiv:1610.00527v1 [cs.CV]},
  year    = {2016},
}
@article{Kalchbrenner2016c,
  author  = {Kalchbrenner, Nal and Espeholt, Lasse and Simonyan, Karen and van den Oord, A{\"a}ron and Graves, Alex and Kavukcuoglu, Koray},
  title   = {Neural machine translation in linear time},
  journal = {arXiv preprint arXiv:1610.10099v1 [cs.CL]},
  year    = {2016},
}
@article{KarpathyEtAl2015,
  author  = {Karpathy, Andrej and Johnson, Justin and Fei-Fei, Li},
  title   = {Visualizing and understanding recurrent networks},
  journal = {arXiv preprint arXiv:1506.02078},
  year    = {2015},
}
@article{KingmaBa2014,
  author  = {Kingma, Diederik and Ba, Jimmy},
  title   = {Adam: A Method for Stochastic Optimization},
  journal = {arXiv preprint arXiv:1412.6980},
  year    = {2014},
}
@inproceedings{KingmaEtAl2016,
  author    = {Kingma, Diederik P and Salimans, Tim and Welling, Max},
  title     = {Improving variational inference with inverse autoregressive flow},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {4736--4744},
  year      = {2016},
}
@inproceedings{KingmaWelling2013,
  author        = {Kingma, Diederik P and Welling, Max},
  title         = {Auto-encoding variational {Bayes}},
  booktitle     = {International Conference on Learning Representations (ICLR)},
  year          = {2014},
  eprint        = {1312.6114v10},
  archiveprefix = {arXiv},
  primaryclass  = {stat.ML},
}
@inproceedings{KirosEtAl2015,
  author    = {Kiros, Ryan and Zhu, Yukun and Salakhutdinov, Ruslan R and Zemel, Richard and Urtasun, Raquel and Torralba, Antonio and Fidler, Sanja},
  title     = {Skip-thought vectors},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {3294--3302},
  year      = {2015},
}
@inproceedings{KiselyovShan2009,
  author    = {Kiselyov, Oleg and Shan, Chung-Chieh},
  title     = {Embedded probabilistic programming},
  booktitle = {Domain-Specific Languages},
  pages     = {360--384},
  year      = {2009},
  publisher = {Springer},
}
@book{KollerFriedman2009,
  author    = {Koller, Daphne and Friedman, Nir},
  title     = {Probabilistic Graphical Models},
  publisher = {MIT Press},
  year      = {2009},
  isbn      = {9780262013192},
}
@article{KrishnanEtAl2015,
  author  = {Krishnan, Rahul G and Shalit, Uri and Sontag, David},
  title   = {Deep {Kalman} Filters},
  journal = {arXiv preprint arXiv:1511.05121v1 [stat.ML]},
  year    = {2015},
}
@inproceedings{KrishnanEtAl2017,
  author    = {Krishnan, Rahul G and Shalit, Uri and Sontag, David},
  title     = {Structured Inference Networks for Nonlinear State Space Models},
  booktitle = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence},
  pages     = {2101--2109},
  year      = {2017},
}
@inproceedings{KrizhevskyEtAl2012,
  author    = {Krizhevsky, Alex and Sutskever, Ilya and Hinton, Geoffrey E},
  title     = {{ImageNet} classification with deep convolutional neural networks},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {1097--1105},
  year      = {2012},
}
@article{KruegerEtAl2016,
  author  = {Krueger, David and Maharaj, Tegan and Kram{\'a}r, J{\'a}nos and Pezeshki, Mohammad and Ballas, Nicolas and Ke, Nan Rosemary and Goyal, Anirudh and Bengio, Yoshua and Larochelle, Hugo and Courville, Aaron and others},
  title   = {Zoneout: Regularizing {RNNs} by Randomly Preserving Hidden Activations},
  journal = {arXiv preprint arXiv:1606.01305v2 [cs.NE]},
  year    = {2016},
}
@inproceedings{LakeEtAl2013,
  author    = {Lake, Brenden M and Salakhutdinov, Ruslan R and Tenenbaum, Josh},
  title     = {One-shot learning by inverting a compositional causal process},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {2526--2534},
  year      = {2013},
}
@article{LakeEtAl2016,
  author  = {Lake, Brenden M and Ullman, Tomer D and Tenenbaum, Joshua B and Gershman, Samuel J},
  title   = {Building machines that learn and think like people},
  journal = {arXiv preprint arXiv:1604.00289v2 [cs.AI]},
  year    = {2016},
}
@article{UriaEtAl2016,
  author  = {Uria, Benigno and C{\^o}t{\'e}, Marc-Alexandre and Gregor, Karol and Murray, Iain and Larochelle, Hugo},
  title   = {Neural autoregressive distribution estimation},
  journal = {Journal of Machine Learning Research},
  volume  = {17},
  number  = {205},
  pages   = {1--37},
  year    = {2016},
}
@article{LeCunEtAl1998,
  author    = {LeCun, Yann and Bottou, L{\'e}on and Bengio, Yoshua and Haffner, Patrick},
  title     = {Gradient-based learning applied to document recognition},
  journal   = {Proceedings of the IEEE},
  volume    = {86},
  number    = {11},
  pages     = {2278--2324},
  year      = {1998},
  publisher = {IEEE},
}
@article{LeeSeung1999,
  author    = {Lee, Daniel D and Seung, H Sebastian},
  title     = {Learning the parts of objects by non-negative matrix factorization},
  journal   = {Nature},
  volume    = {401},
  number    = {6755},
  pages     = {788--791},
  year      = {1999},
  publisher = {Nature Publishing Group},
}
@inproceedings{LeEtAl2016,
  author    = {Le, Tuan Anh and Baydin, Atilim Gunes and Wood, Frank},
  title     = {Inference compilation and universal probabilistic programming},
  booktitle = {Proceedings of the 20th International Conference on Artificial Intelligence and Statistics (AISTATS)},
  year      = {2017},
}
@inproceedings{LeEtAl2017,
  author    = {Le, Tuan Anh and Igl, Maximilian and Jin, Tom and Rainforth, Tom and Wood, Frank},
  title     = {Auto-Encoding Sequential {Monte} {Carlo}},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year      = {2018},
}
@inproceedings{LeMikolov2014,
  author    = {Le, Quoc V and Mikolov, Tomas},
  title     = {Distributed Representations of Sentences and Documents},
  booktitle = {Proceedings of the 31st International Conference on Machine Learning (ICML-14)},
  volume    = {32},
  pages     = {1188--1196},
  year      = {2014},
}
@inproceedings{LiEtAl2014,
  author    = {Li, Mu and Andersen, David G and Park, Jun Woo and Smola, Alexander J and Ahmed, Amr and Josifovski, Vanja and Long, James and Shekita, Eugene J and Su, Bor-Yiing},
  title     = {Scaling distributed machine learning with the parameter server},
  booktitle = {Proc. OSDI},
  pages     = {583--598},
  year      = {2014},
}
@inproceedings{LiEtAl2016,
  author    = {Hern{\'a}ndez-Lobato, Jos{\'e} Miguel and Li, Yingzhen and Rowland, Mark and Bui, Thang and Hern{\'a}ndez-Lobato, Daniel and Turner, Richard E.},
  title     = {Black-Box Alpha Divergence Minimization},
  booktitle = {Proceedings of The 33rd International Conference on Machine Learning},
  pages     = {1511--1520},
  year      = {2016},
}
@article{LiTurner2016,
  author  = {Li, Yingzhen and Turner, Richard E.},
  title   = {{R\'enyi} divergence variational inference},
  journal = {arXiv preprint arXiv:1602.02311v3 [stat.ML]},
  year    = {2016},
}
@inproceedings{MaaloeEtAl2016,
  author    = {Maal{\o}e, Lars and S{\o}nderby, Casper Kaae and S{\o}nderby, S{\o}ren Kaae and Winther, Ole},
  title     = {Auxiliary Deep Generative Models},
  booktitle = {Proceedings of The 33rd International Conference on Machine Learning},
  year      = {2016},
}
@book{Mackay2003,
  author    = {MacKay, David JC},
  title     = {Information theory, inference and learning algorithms},
  publisher = {Cambridge University Press},
  year      = {2003},
}
@inproceedings{MaddisonEtAl2016,
  author    = {Maddison, Chris J and Mnih, Andriy and Teh, Yee Whye},
  title     = {The {Concrete} Distribution: A Continuous Relaxation of Discrete Random Variables},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year      = {2017},
}
@inproceedings{MaddisonEtAl2017,
  author    = {Maddison, Chris J and Lawson, John and Tucker, George and Heess, Nicolas and Norouzi, Mohammad and Mnih, Andriy and Doucet, Arnaud and Teh, Yee Whye},
  title     = {Filtering Variational Objectives},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {6576--6586},
  year      = {2017},
}
@inproceedings{MaEtAl2015,
  author    = {Ma, Yi-An and Chen, Tianqi and Fox, Emily},
  title     = {A complete recipe for stochastic gradient {MCMC}},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {2899--2907},
  year      = {2015},
}
@article{MeschederEtAl2017,
  author  = {Mescheder, Lars and Nowozin, Sebastian and Geiger, Andreas},
  title   = {Adversarial Variational {Bayes}: Unifying Variational Autoencoders and Generative Adversarial Networks},
  journal = {arXiv preprint arXiv:1701.04722},
  year    = {2017},
}
@inproceedings{MikolovEtAl2013,
  author    = {Mikolov, Tomas and Sutskever, Ilya and Chen, Kai and Corrado, Greg S and Dean, Jeff},
  title     = {Distributed representations of words and phrases and their compositionality},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {3111--3119},
  year      = {2013},
}
@article{MnihEtAl2015,
  author    = {Mnih, Volodymyr and Kavukcuoglu, Koray and Silver, David and Rusu, Andrei A and Veness, Joel and Bellemare, Marc G and Graves, Alex and Riedmiller, Martin and Fidjeland, Andreas K and Ostrovski, Georg and others},
  title     = {Human-level control through deep reinforcement learning},
  journal   = {Nature},
  volume    = {518},
  number    = {7540},
  pages     = {529--533},
  year      = {2015},
  publisher = {Nature Publishing Group},
}
@inproceedings{MnihGregor2014,
  author    = {Mnih, Andriy and Gregor, Karol},
  title     = {Neural Variational Inference and Learning in Belief Networks},
  booktitle = {Proceedings of the 31st International Conference on Machine Learning (ICML-14)},
  pages     = {1791--1799},
  year      = {2014},
}
@article{MnihRezende2016,
  author  = {Mnih, Andriy and Rezende, Danilo J.},
  title   = {Variational inference for {Monte} {Carlo} objectives},
  journal = {arXiv preprint arXiv:1602.06725v2 [cs.LG]},
  year    = {2016},
}
@inproceedings{NaessethEtAl2017,
  author    = {Naesseth, Christian A and Linderman, Scott W and Ranganath, Rajesh and Blei, David M},
  title     = {Variational Sequential {Monte} {Carlo}},
  booktitle = {Proceedings of the 21st International Conference on Artificial Intelligence and Statistics (AISTATS)},
  year      = {2018},
}
@techreport{Neal1990,
  author      = {Neal, Radford M},
  title       = {Learning stochastic feedforward networks},
  institution = {Department of Computer Science, University of Toronto},
  year        = {1990},
}
@inproceedings{Neal1993,
  author    = {Neal, Radford M},
  title     = {{Bayesian} learning via stochastic dynamics},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {475--482},
  year      = {1993},
}
@techreport{Neal1998,
  author      = {Neal, Radford M},
  title       = {Annealed importance sampling},
  institution = {Department of Statistics, University of Toronto},
  number      = {9805},
  note        = {Revised},
  year        = {1998},
}
@incollection{Neal2011,
  author    = {Neal, Radford M},
  title     = {{MCMC} using {Hamiltonian} dynamics},
  booktitle = {Handbook of {Markov} Chain {Monte} {Carlo}},
  editor    = {Brooks, Steve and Gelman, Andrew and Jones, Galin L. and Meng, Xiao-Li},
  publisher = {Chapman \& Hall/CRC},
  year      = {2011},
}
@book{Neal2012,
  author    = {Neal, Radford M},
  title     = {{Bayesian} learning for neural networks},
  series    = {Lecture Notes in Statistics},
  volume    = {118},
  publisher = {Springer Science \& Business Media},
  year      = {2012},
}
@article{NeiswangerEtAl2013,
  author  = {Neiswanger, Willie and Wang, Chong and Xing, Eric},
  title   = {Asymptotically exact, embarrassingly parallel {MCMC}},
  journal = {arXiv preprint arXiv:1311.4780},
  year    = {2013},
}
@article{Nesterov1983,
  author  = {Nesterov, Yurii},
  title   = {A method for unconstrained convex minimization problem with the rate of convergence {$O(1/k^2)$}},
  journal = {Doklady {AN} {SSSR}},
  volume  = {269},
  pages   = {543--547},
  year    = {1983},
}
@inproceedings{NowozinEtAl2016,
  author    = {Nowozin, Sebastian and Cseke, Botond and Tomioka, Ryota},
  title     = {{f-GAN}: Training generative neural samplers using variational divergence minimization},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {271--279},
  year      = {2016},
}
@unpublished{Orbanz2014,
  author = {Orbanz, Peter},
  title  = {Lecture notes on {Bayesian} nonparametrics [{DRAFT}]},
  note   = {Unpublished},
  year   = {2014},
}
@inproceedings{PaigeWood2014,
  author    = {Paige, Brooks and Wood, Frank},
  title     = {A compilation target for probabilistic programming languages},
  booktitle = {Proceedings of the 31st International Conference on Machine Learning (ICML-14)},
  pages     = {1935--1943},
  year      = {2014},
}
@inproceedings{PaigeWood2016,
  author    = {Paige, Brooks and Wood, Frank},
  title     = {Inference networks for Sequential {Monte} {Carlo} in graphical models},
  booktitle = {Proceedings of the 33rd International Conference on Machine Learning},
  volume    = {48},
  year      = {2016},
}
@inproceedings{PascanuEtAl2013,
  author    = {Pascanu, Razvan and Mikolov, Tomas and Bengio, Yoshua},
  title     = {On the difficulty of training recurrent neural networks},
  booktitle = {Proceedings of The 30th International Conference on Machine Learning},
  pages     = {1310--1318},
  year      = {2013},
}
@article{Pollack1990,
  author    = {Pollack, Jordan B},
  title     = {Recursive distributed representations},
  journal   = {Artificial Intelligence},
  volume    = {46},
  number    = {1},
  pages     = {77--105},
  year      = {1990},
  publisher = {Elsevier},
}
@article{PougetEtAl2013,
  author    = {Pouget, Alexandre and Beck, Jeffrey M and Ma, Wei Ji and Latham, Peter E},
  title     = {Probabilistic brains: knowns and unknowns},
  journal   = {Nature Neuroscience},
  volume    = {16},
  number    = {9},
  pages     = {1170--1178},
  year      = {2013},
  publisher = {Nature Publishing Group},
}
@inproceedings{RanganathetAl2014b,
  author    = {Ranganath, Rajesh and Gerrish, Sean and Blei, David},
  title     = {Black Box Variational Inference},
  booktitle = {Proceedings of the Seventeenth International Conference on Artificial Intelligence and Statistics},
  pages     = {814--822},
  year      = {2014},
}
@inproceedings{RanganathEtAl2014,
  author    = {Ranganath, Rajesh and Tang, Linpeng and Charlin, Laurent and Blei, David M},
  title     = {Deep exponential families},
  booktitle = {Proceedings of the Eighteenth International Conference on Artificial Intelligence and Statistics (AISTATS)},
  year      = {2015},
}
@article{ReedDeFreitas2015,
  author  = {Reed, Scott and de Freitas, Nando},
  title   = {Neural programmer-interpreters},
  journal = {arXiv preprint arXiv:1511.06279v4 [cs.LG]},
  year    = {2015},
}
@article{RenEtAl2016,