-
Notifications
You must be signed in to change notification settings - Fork 2
/
ref.bib
80 lines (71 loc) · 3.21 KB
/
ref.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
@misc{Christoffersen21,
title={Asymptotically Exact and Fast Gaussian Copula Models for Imputation of Mixed Data Types},
author={Benjamin Christoffersen and Mark Clements and Keith Humphreys and Hedvig Kjellström},
year={2021},
eprint={2102.02642},
archivePrefix={arXiv},
primaryClass={stat.ML}
}
@inproceedings{zhao20Mat,
title={Matrix Completion with Quantified Uncertainty through Low Rank {G}aussian Copula},
author={Yuxuan Zhao and Madeleine Udell},
year={2020},
eprint={2006.10829},
archivePrefix={arXiv},
primaryClass={stat.ML},
booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
}
@inproceedings{zhao20,
author = {Zhao, Yuxuan and Udell, Madeleine},
title = {Missing Value Imputation for Mixed Data via {G}aussian Copula},
year = {2020},
isbn = {9781450379984},
publisher = {Association for Computing Machinery},
address = {New York, NY, USA},
doi = {10.1145/3394486.3403106},
abstract = {Missing data imputation forms the first critical step of many data analysis pipelines. The challenge is greatest for mixed data sets, including real, Boolean, and ordinal data, where standard techniques for imputation fail basic sanity checks: for example, the imputed values may not follow the same distributions as the data. This paper proposes a new semiparametric algorithm to impute missing values, with no tuning parameters. The algorithm models mixed data as a Gaussian copula. This model can fit arbitrary marginals for continuous variables and can handle ordinal variables with many levels, including Boolean variables as a special case. We develop an efficient approximate EM algorithm to estimate copula parameters from incomplete mixed data. The resulting model reveals the statistical associations among variables. Experimental results on several synthetic and real datasets show the superiority of our proposed algorithm to state-of-the-art imputation algorithms for mixed data.},
booktitle = {Proceedings of the 26th ACM SIGKDD International Conference on Knowledge Discovery \& Data Mining},
pages = {636–646},
numpages = {11},
keywords = {missing values, mixed data, ordinal data, Gaussian copula, imputation},
location = {Virtual Event, CA, USA},
series = {KDD '20}
}
@article{Kingma15,
title={Adam: A Method for Stochastic Optimization},
author={Diederik P. Kingma and Jimmy Ba},
journal={CoRR},
year={2015},
volume={abs/1412.6980}
}
@article{hoff07,
author = "Hoff, Peter D.",
doi = "10.1214/07-AOAS107",
fjournal = "Annals of Applied Statistics",
journal = "Ann. Appl. Stat.",
month = "06",
number = "1",
pages = "265--283",
publisher = "The Institute of Mathematical Statistics",
title = "Extending the rank likelihood for semiparametric copula estimation",
url = "https://doi.org/10.1214/07-AOAS107",
volume = "1",
year = "2007"
}
@article{Genz02,
author = {Alan Genz and Frank Bretz},
title = {Comparison of Methods for the Computation of Multivariate t Probabilities},
journal = {Journal of Computational and Graphical Statistics},
volume = {11},
number = {4},
pages = {950-971},
year = {2002},
publisher = {Taylor & Francis},
doi = {10.1198/106186002394},
URL = {
https://doi.org/10.1198/106186002394
},
eprint = {
https://doi.org/10.1198/106186002394
}
}