-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathreferences.bib
7921 lines (7537 loc) · 287 KB
/
references.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% This file is automatically generated. Do not modify this
% file directly, or else your changes will be overwritten.
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%"
@article{ferguson73dp,
  author  = {Ferguson, T. S.},
  title   = {A {B}ayesian Analysis of Some Nonparametric Problems},
  journal = {Annals of Statistics},
  volume  = {1},
  pages   = {209--230},
  year    = {1973},
}
@article{ferguson74prior,
  author  = {Ferguson, T. S.},
  title   = {Prior distributions on spaces of probability measures},
  journal = {Annals of Statistics},
  volume  = {2},
  pages   = {615--629},
  year    = {1974},
}
@article{blackwell73urn,
  author  = {Blackwell, D. and MacQueen, J. B.},
  title   = {{F}erguson Distributions via {P}\'olya Urn Schemes},
  journal = {Annals of Statistics},
  volume  = {1},
  pages   = {353--355},
  year    = {1973},
}
% NOTE(review): this is a lecture-notes volume chapter (LNM 1117), not a journal article;
% booktitle/publisher below should be confirmed against the Springer record.
@incollection{aldous85exch,
  author    = {Aldous, D.},
  title     = {Exchangeability and related topics},
  booktitle = {{\'E}cole d'{\'E}t{\'e} de Probabilit{\'e}s de {S}aint-{F}lour {XIII} -- 1983},
  series    = {Lecture Notes in Mathematics},
  volume    = {1117},
  publisher = {Springer},
  pages     = {1--198},
  year      = {1985},
}
@article{antoniak74dpmix,
  author  = {Antoniak, C. E.},
  title   = {Mixtures of {D}irichlet Processes with Applications to {B}ayesian Nonparametric Problems},
  journal = {Annals of Statistics},
  volume  = {2},
  pages   = {1152--1174},
  year    = {1974},
}
@article{sethuraman94stick,
  author  = {Sethuraman, J.},
  title   = {A Constructive Definition of {D}irichlet Priors},
  journal = {Statistica Sinica},
  volume  = {4},
  pages   = {639--650},
  year    = {1994},
}
@article{escobar95mixture,
  author  = {Escobar, M. D. and West, M.},
  title   = {{B}ayesian Density Estimation and Inference Using Mixtures},
  journal = {Journal of the American Statistical Association (JASA)},
  volume  = {90},
  pages   = {577--588},
  year    = {1995},
}
@techreport{west95hyper,
  author      = {West, M.},
  title       = {Hyperparameter estimation in {D}irichlet process mixture models},
  institution = {Department of Statistics, Duke University (Duke University)},
  year        = {1995},
}
@article{pitman97yor,
  author  = {Pitman, J. and Yor, M.},
  title   = {The two-parameter {P}oisson-{D}irichlet distribution derived from a stable subordinator},
  journal = {Annals of Probability},
  volume  = {25},
  pages   = {855--900},
  year    = {1997},
}
% Journal name spelling corrected ("Statististics" -> "Statistics").
@article{ishwaran02exact,
  author  = {Ishwaran, H. and Zarepour, M.},
  title   = {Exact and approximate sum-representations for the {D}irichlet process},
  journal = {Canadian Journal of Statistics},
  volume  = {30},
  pages   = {269--284},
  year    = {2002},
}
@inproceedings{griffiths06ibp,
  author    = {Griffiths, T. and Ghahramani, Z.},
  title     = {Infinite Latent Feature Models and the {I}ndian Buffet Process},
  booktitle = {Advances in Neural Information Processing Systems (NIPS)},
  year      = {2006},
}
@inproceedings{thibaux07hbp,
  author    = {Thibaux, R. and Jordan, M. I.},
  title     = {Hierarchical {B}eta Processes and the {I}ndian Buffet Process},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  year      = {2007},
}
% NOTE(review): first author's surname is "Van Gael" (was parsed as "J. V." + "Gael").
% The key does not match the authors; it is kept unchanged so existing citations still resolve.
@inproceedings{xing08haplotype,
  author    = {Van Gael, J. and Saatci, Y. and Teh, Y. W. and Ghahramani, Z.},
  title     = {Beam Sampling for the Infinite Hidden {M}arkov Model},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {1088--1095},
  year      = {2008},
}
@inproceedings{xing04haplotype,
  author    = {Xing, E. P. and Sharan, R. and Jordan, M. I.},
  title     = {{B}ayesian Haplotype Inference via the {D}irichlet Process},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {111--118},
  year      = {2004},
}
@article{teh06hdp,
  author  = {Teh, Y. W. and Jordan, M. I. and Beal, M. and Blei, D.},
  title   = {Hierarchical {D}irichlet processes},
  journal = {Journal of the American Statistical Association (JASA)},
  volume  = {101},
  pages   = {1566--1581},
  year    = {2006},
}
% NOTE(review): end page changed from 1144 to 1154 and accent restored in "Rodriguez" -- confirm pages against the JASA record.
@article{rodriguez08ndp,
  author  = {Rodr{\'\i}guez, A. and Dunson, D. B. and Gelfand, A. E.},
  title   = {The nested {D}irichlet process},
  journal = {Journal of the American Statistical Association (JASA)},
  volume  = {103},
  pages   = {1131--1154},
  year    = {2008},
}
@inproceedings{beal02ihmm,
  author    = {Beal, M. and Ghahramani, Z. and Rasmussen, C.},
  title     = {The infinite hidden {M}arkov model},
  booktitle = {Advances in Neural Information Processing Systems (NIPS)},
  pages     = {577--584},
  year      = {2002},
}
@inproceedings{sohn07ihmm,
  author    = {Sohn, K. and Xing, E. P.},
  title     = {A Hidden {M}arkov {D}irichlet Process Model for Genetic Recombination in Open Ancestral Space},
  booktitle = {Advances in Neural Information Processing Systems (NIPS)},
  year      = {2007},
}
@inproceedings{teh06pitmanyor,
  author    = {Teh, Y. W.},
  title     = {A Hierarchical {B}ayesian Language Model Based On {P}itman-{Y}or Processes},
  booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)},
  pages     = {985--992},
  year      = {2006},
}
@inproceedings{goldwater06segmentation,
  author    = {Goldwater, S. and Griffiths, T. and Johnson, M.},
  title     = {Contextual Dependencies in Unsupervised Word Segmentation},
  booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)},
  year      = {2006},
}
@inproceedings{sudderth06transformed,
  author    = {Sudderth, E. B. and Torralba, A. B. and Freeman, W. T. and Willsky, A. S.},
  title     = {Describing Visual Scenes using Transformed {D}irichlet Processes},
  booktitle = {Advances in Neural Information Processing Systems (NIPS)},
  pages     = {1297--1304},
  year      = {2006},
}
% NOTE(review): author surname restored to "Daum\'e III"; volume/pages changed from 1 / 1--48
% to the published JMLR version (vol. 6, pp. 1551--1577) -- confirm against jmlr.org.
@article{daume05clustering,
  author  = {{Daum{\'e} III}, H. and Marcu, D.},
  title   = {A {B}ayesian Model for Supervised Clustering with the {D}irichlet Process Prior},
  journal = {Journal of Machine Learning Research (JMLR)},
  volume  = {6},
  pages   = {1551--1577},
  year    = {2005},
}
@article{blei05variational,
  author  = {Blei, D. and Jordan, M. I.},
  title   = {Variational Inference for {D}irichlet Process Mixtures},
  journal = {Bayesian Analysis},
  volume  = {1},
  pages   = {121--144},
  year    = {2005},
}
@inproceedings{teh07collapsed,
  author    = {Teh, Y. W. and Newman, D. and Welling, M.},
  title     = {A Collapsed Variational {B}ayesian Inference Algorithm for {L}atent {D}irichlet {A}llocation},
  booktitle = {Advances in Neural Information Processing Systems (NIPS)},
  pages     = {1353--1360},
  year      = {2007},
}
@inproceedings{kurihara07accelerated,
  author    = {Kurihara, K. and Welling, M. and Vlassis, N.},
  title     = {Accelerated Variational {D}irichlet Mixture Models},
  booktitle = {Advances in Neural Information Processing Systems (NIPS)},
  year      = {2007},
}
@inproceedings{kurihara07collapsed,
  author    = {Kurihara, K. and Welling, M. and Teh, Y. W.},
  title     = {Collapsed Variational {D}irichlet Process Mixture Models},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  year      = {2007},
}
% Author surname restored to "Daum\'e III" (accent and suffix were dropped).
@inproceedings{daume07astar,
  author    = {{Daum{\'e} III}, H.},
  title     = {Fast search for {D}irichlet process mixture models},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  year      = {2007},
}
@inproceedings{heller05hierarchical,
  author    = {Heller, K. A. and Ghahramani, Z.},
  title     = {{B}ayesian Hierarchical Clustering},
  booktitle = {International Conference on Machine Learning (ICML)},
  year      = {2005},
}
@article{ishwaran01gibbs,
  author  = {Ishwaran, H. and James, L. F.},
  title   = {{G}ibbs Sampling Methods for Stick-Breaking Priors},
  journal = {Journal of the American Statistical Association (JASA)},
  volume  = {96},
  pages   = {161--173},
  year    = {2001},
}
@article{papaspiliopoulos08retro,
  author  = {Papaspiliopoulos, O. and Roberts, G. O.},
  title   = {Retrospective {MCMC} for {D}irichlet process hierarchical models},
  journal = {Biometrika},
  volume  = {95},
  pages   = {169--186},
  year    = {2008},
}
% NOTE(review): year changed from 2004 to 2007 to agree with volume 36 of this journal -- confirm.
% The key is kept unchanged so existing citations still resolve.
@article{walker04slice,
  author  = {Walker, S. G.},
  title   = {Sampling the {D}irichlet Mixture Model with Slices},
  journal = {Communications in Statistics - Simulation and Computation},
  volume  = {36},
  pages   = {45--54},
  year    = {2007},
}
@techreport{dahl03splitmerge,
  author      = {Dahl, D. B.},
  title       = {An Improved Merge-Split Sampler for Conjugate {D}irichlet Process Mixture Models},
  institution = {Department of Statistics, University of Wisconsin (U. Wisconsin)},
  year        = {2003},
}
@techreport{dahl03univariate,
  author      = {Dahl, D. B.},
  title       = {Modal Clustering in a Univariate Class of Product Partition Models},
  institution = {Department of Statistics, University of Wisconsin (U. Wisconsin)},
  year        = {2003},
}
@techreport{neal00dp,
  author      = {Neal, R.},
  title       = {{M}arkov Chain Sampling Methods for {D}irichlet Process Mixture Models},
  institution = {Department of Statistics, University of Toronto (U. Toronto)},
  year        = {2000},
}
@techreport{jain00splitmerge,
  author      = {Jain, S. and Neal, R.},
  title       = {A Split-Merge {M}arkov Chain {M}onte {C}arlo Procedure for the {D}irichlet Process Mixture Model},
  institution = {Department of Statistics, University of Toronto (U. Toronto)},
  year        = {2000},
}
@techreport{jain05splitmerge,
  author      = {Jain, S. and Neal, R.},
  title       = {Splitting and merging components of a nonconjugate {D}irichlet process mixture model},
  institution = {Department of Statistics, University of Toronto (U. Toronto)},
  year        = {2005},
}
@article{blei03lda,
  author  = {Blei, D. and Ng, A. and Jordan, M. I.},
  title   = {Latent {D}irichlet Allocation},
  journal = {Journal of Machine Learning Research (JMLR)},
  volume  = {3},
  pages   = {993--1022},
  year    = {2003},
}
% Second author's particle restored: "N. d. Freitas" -> "de Freitas, N.".
@inproceedings{hamze04fields,
  author    = {Hamze, F. and de Freitas, N.},
  title     = {From Fields to Trees},
  booktitle = {Uncertainty in Artificial Intelligence (UAI)},
  year      = {2004},
}
% Year field held a duplicated value ("2006 2006"); reduced to a single four-digit year.
@inproceedings{welling06flexible,
  author    = {Welling, M.},
  title     = {Flexible Priors for Infinite Mixture Models},
  booktitle = {International Conference on Machine Learning Workshop on Nonparametric Bayesian Methods},
  year      = {2006},
}
@article{johnson84randproj,
  author  = {Johnson, W. and Lindenstrauss, J.},
  title   = {Extensions of {L}ipschitz maps into a {H}ilbert space},
  journal = {Contemporary Mathematics},
  volume  = {26},
  pages   = {189--206},
  year    = {1984},
}
@inproceedings{dasgupta99mixgauss,
  author    = {Dasgupta, S.},
  title     = {Learning mixtures of {G}aussians},
  booktitle = {Foundations of Computer Science (FOCS)},
  year      = {1999},
}
% Accent restored in "Lov\'asz"; title and bibliographic data unchanged.
@article{kannan97convex,
  author  = {Kannan, R. and Lov{\'a}sz, L. and Simonovits, M.},
  title   = {Random walks and an ${O}^*(n^5)$ volume algorithm for convex bodies},
  journal = {Random Structures and Algorithms},
  volume  = {11},
  pages   = {1--50},
  year    = {1997},
}
@inproceedings{friedman00bayesian,
  author    = {Friedman, N. and Koller, D.},
  title     = {Being {B}ayesian about {B}ayesian Network Structure: A {B}ayesian Approach to Structure Discovery in {B}ayesian Networks},
  booktitle = {Uncertainty in Artificial Intelligence (UAI)},
  pages     = {201--210},
  year      = {2000},
}
% Journal name corrected ("Physics Review Letters" -> "Physical Review Letters").
% NOTE(review): "MC" in the title expanded to "Monte Carlo" to match the published title -- confirm.
@article{swendsen87,
  author  = {Swendsen, R. H. and Wang, J. S.},
  title   = {Nonuniversal critical dynamics in {M}onte {C}arlo simulations},
  journal = {Physical Review Letters},
  volume  = {58},
  pages   = {86--88},
  year    = {1987},
}
@article{barbu05swendsen,
  author  = {Barbu, A. and Zhu, S. C.},
  title   = {Generalizing {S}wendsen-{W}ang to sampling arbitrary posterior probabilities},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)},
  volume  = {27},
  pages   = {1239--1253},
  year    = {2005},
}
@article{tanner87da,
  author  = {Tanner, M. A. and Wong, W. H.},
  title   = {The calculation of posterior distributions by data augmentation},
  journal = {Journal of the American Statistical Association (JASA)},
  volume  = {82},
  pages   = {528--540},
  year    = {1987},
}
@article{liu98pxem,
  author  = {Liu, C. and Rubin, D. and Wu, Y. N.},
  title   = {Parameter expansion to accelerate {EM}: the {PX-EM} algorithm},
  journal = {Biometrika},
  volume  = {85},
  pages   = {755--770},
  year    = {1998},
}
@article{liu99pxda,
  author  = {Liu, J. and Wu, Y.},
  title   = {Parameter expansion for data augmentation},
  journal = {Journal of the American Statistical Association (JASA)},
  volume  = {94},
  pages   = {1264--1274},
  year    = {1999},
}
@techreport{pitman02process,
  author      = {Pitman, J.},
  title       = {Combinatorial Stochastic Processes},
  institution = {Department of Statistics, University of California at Berkeley (UC Berkeley)},
  number      = {621},
  year        = {2002},
}
@book{bertsekas99nlp,
  author    = {Bertsekas, D.},
  title     = {Nonlinear Programming},
  publisher = {Athena Scientific},
  year      = {1999},
}
@techreport{mackay97hmm,
  author      = {MacKay, D.},
  title       = {Ensemble Learning for Hidden {M}arkov Models},
  institution = {University of Cambridge},
  year        = {1997},
}
@inproceedings{hermjakob01parsing,
  author    = {Hermjakob, U.},
  title     = {Parsing and Question Classification for Question Answering},
  booktitle = {Workshop on Open-domain question answering, ACL},
  pages     = {1--6},
  year      = {2001},
}
@article{gildea02semantic,
  author  = {Gildea, D. and Jurafsky, D.},
  title   = {Automatic Labeling of Semantic Roles},
  journal = {Computational Linguistics},
  volume  = {28},
  pages   = {245--288},
  year    = {2002},
}
@inproceedings{galley04translation,
  author    = {Galley, M. and Hopkins, M. and Knight, K. and Marcu, D.},
  title     = {What's in a translation rule?},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  pages     = {273--280},
  year      = {2004},
}
@inproceedings{melamed04smt,
  author    = {Melamed, I. D.},
  title     = {Statistical Machine Translation by Parsing},
  booktitle = {Association for Computational Linguistics (ACL)},
  year      = {2004},
}
@article{chomsky56models,
  author  = {Chomsky, N.},
  title   = {Three models for the description of language},
  journal = {IRE Transactions on Information Theory},
  volume  = {2},
  pages   = {113--124},
  year    = {1956},
}
% Raw UTF-8 "u-umlaut" replaced with a LaTeX escape so classic 8-bit BibTeX sorts and labels the name correctly.
@book{manning99nlp,
  author    = {Manning, C. and Sch{\"u}tze, H.},
  title     = {Foundations of Statistical Natural Language Processing},
  publisher = {MIT Press},
  year      = {1999},
}
% Author order corrected to the published order (Marcus, Santorini, Marcinkiewicz).
@article{marcus93treebank,
  author  = {Marcus, M. P. and Santorini, B. and Marcinkiewicz, M. A.},
  title   = {Building a large annotated corpus of {E}nglish: the {P}enn {T}reebank},
  journal = {Computational Linguistics},
  volume  = {19},
  pages   = {313--330},
  year    = {1993},
}
@inproceedings{charniak96treebank,
  author    = {Charniak, E.},
  title     = {Tree-bank Grammars},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  pages     = {1031--1036},
  year      = {1996},
}
@inproceedings{kurihara04varpcfg,
  author    = {Kurihara, K. and Sato, T.},
  title     = {An Application of the Variational {B}ayesian Approach to Probabilistic Context-Free Grammars},
  booktitle = {International Joint Conference on Natural Language Processing Workshop Beyond Shallow Analyses},
  year      = {2004},
}
@inproceedings{kurihara06varinduct,
  author    = {Kurihara, K. and Sato, T.},
  title     = {Variational {B}ayesian Grammar Induction for Natural Language},
  booktitle = {International Colloquium on Grammatical Inference},
  year      = {2006},
}
@inproceedings{petrov06latent,
  author    = {Petrov, S. and Barrett, L. and Thibaux, R. and Klein, D.},
  title     = {Learning Accurate, Compact, and Interpretable Tree Annotation},
  booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)},
  pages     = {433--440},
  year      = {2006},
}
@inproceedings{stolcke94merge,
  author    = {Stolcke, A. and Omohundro, S.},
  title     = {Inducing Probabilistic Grammars by {B}ayesian Model Merging},
  booktitle = {International Colloquium on Grammatical Inference and Applications},
  pages     = {106--118},
  year      = {1994},
}
% NOTE(review): this is a chapter in an edited book, not a conference paper, so the type is now incollection.
% Editors and publisher were added from memory -- confirm against the book's front matter.
@incollection{wolff88syntax,
  author    = {Wolff, J. G.},
  title     = {Learning syntax and meanings through optimization and distributional analysis},
  booktitle = {Categories and processes in language acquisition},
  editor    = {Levy, Y. and Schlesinger, I. M. and Braine, M. D. S.},
  publisher = {Lawrence Erlbaum},
  pages     = {179--215},
  year      = {1988},
}
@phdthesis{collins99thesis,
  author = {Collins, M.},
  title  = {Head-Driven Statistical Models for Natural Language Parsing},
  school = {University of Pennsylvania},
  year   = {1999},
}
@inproceedings{eisner96dependency,
  author    = {Eisner, J.},
  title     = {Three New Probabilistic Models for Dependency Parsing: An Exploration},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  pages     = {340--345},
  year      = {1996},
}
@inproceedings{charniak00maxent,
  author    = {Charniak, E.},
  title     = {A maximum-entropy-inspired parser},
  booktitle = {Applied Natural Language Processing and North American Association for Computational Linguistics (ANLP/NAACL)},
  pages     = {132--139},
  year      = {2000},
}
@inproceedings{klein03unlexicalized,
  author    = {Klein, D. and Manning, C.},
  title     = {Accurate Unlexicalized Parsing},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {423--430},
  year      = {2003},
}
@article{johnson98parent,
  author  = {Johnson, M.},
  title   = {{PCFG} Models of Linguistic Tree Representations},
  journal = {Computational Linguistics},
  volume  = {24},
  pages   = {613--632},
  year    = {1998},
}
@inproceedings{matsuzaki05latent,
  author    = {Matsuzaki, T. and Miyao, Y. and Tsujii, J.},
  title     = {Probabilistic {CFG} with Latent Annotations},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {75--82},
  year      = {2005},
}
@inproceedings{johnson06adaptor,
  author    = {Johnson, M. and Griffiths, T. and Goldwater, S.},
  title     = {Adaptor Grammars: A Framework for Specifying Compositional Nonparametric {B}ayesian Models},
  booktitle = {Advances in Neural Information Processing Systems (NIPS)},
  pages     = {641--648},
  year      = {2006},
}
@inproceedings{blei04nested,
  author    = {Blei, D. and Griffiths, T. and Jordan, M. I. and Tenenbaum, J.},
  title     = {Hierarchical topic models and the nested {C}hinese restaurant process},
  booktitle = {Advances in Neural Information Processing Systems (NIPS)},
  year      = {2004},
}
@inproceedings{goldwater05interpolate,
  author    = {Goldwater, S. and Griffiths, T. and Johnson, M.},
  title     = {Interpolating Between Types and Tokens by Estimating Power-Law Generators},
  booktitle = {Advances in Neural Information Processing Systems (NIPS)},
  year      = {2005},
}
@inproceedings{johnson07mcmc,
  author    = {Johnson, M. and Griffiths, T. and Goldwater, S.},
  title     = {{B}ayesian Inference for {PCFG}s via {M}arkov Chain {M}onte {C}arlo},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  pages     = {139--146},
  year      = {2007},
}
@inproceedings{haghighi07coref,
  author    = {Haghighi, A. and Klein, D.},
  title     = {Unsupervised Coreference Resolution in a Nonparametric {B}ayesian Model},
  booktitle = {Association for Computational Linguistics (ACL)},
  year      = {2007},
}
% Author surname restored to "Daum\'e III" (accent and suffix were dropped).
@inproceedings{daume06sum,
  author    = {{Daum{\'e} III}, H. and Marcu, D.},
  title     = {{B}ayesian Query-Focused Summarization},
  booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)},
  year      = {2006},
}
@inproceedings{finkel07inftree,
  author    = {Finkel, J. R. and Grenager, T. and Manning, C.},
  title     = {The Infinite Tree},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {272--279},
  year      = {2007},
}
@inproceedings{petrov07split,
  author    = {Petrov, S. and Klein, D.},
  title     = {Learning and Inference for Hierarchically Split {PCFG}s},
  booktitle = {Human Language Technology and North American Association for Computational Linguistics (HLT/NAACL)},
  pages     = {404--411},
  year      = {2007},
}
@inproceedings{mcclosky06self,
  author    = {McClosky, D. and Charniak, E. and Johnson, M.},
  title     = {Reranking and Self-Training for Parser Adaptation},
  booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)},
  year      = {2006},
}
@article{lari90scfg,
  author  = {Lari, K. and Young, S. J.},
  title   = {The estimation of stochastic context-free grammars using the inside-outside algorithm},
  journal = {Computer Speech and Language},
  volume  = {4},
  pages   = {35--56},
  year    = {1990},
}
% Surnames restored: "S. A. D. Pietra" / "V. J. D. Pietra" are S. A. and V. J. Della Pietra.
@article{brown93mt,
  author  = {Brown, P. F. and {Della Pietra}, S. A. and {Della Pietra}, V. J. and Mercer, R. L.},
  title   = {The Mathematics of Statistical Machine Translation: Parameter Estimation},
  journal = {Computational Linguistics},
  volume  = {19},
  pages   = {263--311},
  year    = {1993},
}
% NOTE(review): "Learning in Graphical Models" is an edited book, so the type is now incollection.
% Editor and publisher were added from memory -- confirm against the book's front matter.
@incollection{neal98gem,
  author    = {Neal, R. M. and Hinton, G. E.},
  title     = {A new view of the {EM} algorithm that justifies incremental, sparse and other variants},
  booktitle = {Learning in Graphical Models},
  editor    = {Jordan, M. I.},
  publisher = {Kluwer Academic Publishers},
  pages     = {355--368},
  year      = {1998},
}
@inproceedings{collins99unsupervised,
  author    = {Collins, M. and Singer, Y.},
  title     = {Unsupervised Models for Named Entity Classification},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  year      = {1999},
}
@inproceedings{chen96smoothing,
  author    = {Chen, S. F. and Goodman, J.},
  title     = {An Empirical Study of Smoothing Techniques for Language Modeling},
  booktitle = {Association for Computational Linguistics (ACL)},
  year      = {1996},
}
@inproceedings{ney96hmm,
  author    = {Ney, H. and Vogel, S.},
  title     = {{HMM}-Based Word Alignment in Statistical Translation},
  booktitle = {International Conference on Computational Linguistics (COLING)},
  pages     = {836--841},
  year      = {1996},
}
@inproceedings{blum98cotraining,
  author    = {Blum, A. and Mitchell, T.},
  title     = {Combining Labeled and Unlabeled Data with Co-training},
  booktitle = {Conference on Learning Theory (COLT)},
  year      = {1998},
}
@inproceedings{carroll92dependency,
  author    = {Carroll, G. and Charniak, E.},
  title     = {Two Experiments on Learning Probabilistic Dependency Grammars from Corpora},
  booktitle = {Workshop Notes for Statistically-Based NLP Techniques, AAAI},
  pages     = {1--13},
  year      = {1992},
}
@inproceedings{haghighi06induction,
  author    = {Haghighi, A. and Klein, D.},
  title     = {Prototype-based Grammar Induction},
  booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)},
  year      = {2006},
}
% Second author's surname corrected ("Shabes" -> "Schabes").
@inproceedings{pereira92bracket,
  author    = {Pereira, F. and Schabes, Y.},
  title     = {Inside-outside reestimation from partially bracketed corpora},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {128--135},
  year      = {1992},
}
@article{merialdo94tagging,
  author  = {Merialdo, B.},
  title   = {Tagging {E}nglish text with a probabilistic model},
  journal = {Computational Linguistics},
  volume  = {20},
  pages   = {155--171},
  year    = {1994},
}
@inproceedings{clark01induction,
  author    = {Clark, A.},
  title     = {Unsupervised induction of stochastic context free grammars with distributional clustering},
  booktitle = {Computational Natural Language Learning (CoNLL)},
  year      = {2001},
}
@inproceedings{paskin02bigrams,
  author    = {Paskin, M. A.},
  title     = {Grammatical Bigrams},
  booktitle = {Advances in Neural Information Processing Systems (NIPS)},
  year      = {2002},
}
@inproceedings{klein04induction,
  author    = {Klein, D. and Manning, C. D.},
  title     = {Corpus-Based Induction of Syntactic Structure: Models of Dependency and Constituency},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {478--485},
  year      = {2004},
}
@inproceedings{smith05contrastive,
  author    = {Smith, N. and Eisner, J.},
  title     = {Contrastive Estimation: Training Log-Linear Models on Unlabeled Data},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {354--362},
  year      = {2005},
}
@inproceedings{smith06anneal,
  author    = {Smith, N. and Eisner, J.},
  title     = {Annealing Structural Bias in Multilingual Weighted Grammar Induction},
  booktitle = {International Conference on Computational Linguistics and Association for Computational Linguistics (COLING/ACL)},
  year      = {2006},
}
@inproceedings{goldwater07pos,
  author    = {Goldwater, S. and Griffiths, T.},
  title     = {A Fully {B}ayesian Approach to Unsupervised Part-of-Speech Tagging},
  booktitle = {Association for Computational Linguistics (ACL)},
  year      = {2007},
}
@inproceedings{johnson08synergy,
  author    = {Johnson, M.},
  title     = {Using Adaptor Grammars to Identify Synergies in the Unsupervised Acquisition of Linguistic Structure},
  booktitle = {Human Language Technology and Association for Computational Linguistics (HLT/ACL)},
  pages     = {398--406},
  year      = {2008},
}
@inproceedings{johnson07pos,
  author    = {Johnson, M.},
  title     = {Why doesn't {EM} find good {HMM} {POS}-taggers?},
  booktitle = {Empirical Methods in Natural Language Processing and Computational Natural Language Learning (EMNLP/CoNLL)},
  year      = {2007},
}
@article{goldwater09segmentation,
  author  = {Goldwater, S. and Griffiths, T. and Johnson, M.},
  title   = {A {B}ayesian Framework for Word Segmentation: Exploring the Effects of Context},
  journal = {Cognition},
  volume  = {112},
  pages   = {21--54},
  year    = {2009},
}
@inproceedings{johnson09segmentation,
  author    = {Johnson, M. and Goldwater, S.},
  title     = {Improving nonparameteric {B}ayesian inference: experiments on unsupervised word segmentation with adaptor grammars},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages     = {317--325},
  year      = {2009},
}
@inproceedings{cohn09ptsg,
  author    = {Cohn, T. and Goldwater, S. and Blunsom, P.},
  title     = {Inducing Compact but Accurate Tree-Substitution Grammars},
  booktitle = {North American Association for Computational Linguistics (NAACL)},
  pages     = {548--556},
  year      = {2009},
}
@inproceedings{post09ptsg,
  author    = {Post, M. and Gildea, D.},
  title     = {{B}ayesian learning of a tree substitution grammar},
  booktitle = {Association for Computational Linguistics and International Joint Conference on Natural Language Processing (ACL-IJCNLP)},
  year      = {2009},
}
@inproceedings{gao08comparison,
  author    = {Gao, J. and Johnson, M.},
  title     = {A comparison of {B}ayesian estimators for unsupervised Hidden {M}arkov Model {POS} taggers},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  pages     = {344--352},
  year      = {2008},
}
@inproceedings{grenager05segmentation,
  author    = {Grenager, T. and Klein, D. and Manning, C. D.},
  title     = {Unsupervised learning of field segmentation models for information extraction},
  booktitle = {Association for Computational Linguistics (ACL)},
  pages     = {371--378},
  year      = {2005},
}
% NOTE(review): page range was missing; added from the JMLR volume 8 listing -- confirm against jmlr.org.
@article{dasgupta07em,
  author  = {Dasgupta, S. and Schulman, L.},
  title   = {A Probabilistic Analysis of {EM} for Mixtures of Separated, Spherical {G}aussians},
  journal = {Journal of Machine Learning Research (JMLR)},
  volume  = {8},
  pages   = {203--226},
  year    = {2007},
}
@article{ron98pfa,
  author  = {Ron, D. and Singer, Y. and Tishby, N.},
  title   = {On the Learnability and Usage of Acyclic Probabilistic Finite Automata},
  journal = {Journal of Computer and System Sciences},
  volume  = {56},
  pages   = {133--152},
  year    = {1998},
}
@inproceedings{srebro06mixture,
  author    = {Srebro, N. and Shakhnarovich, G. and Roweis, S.},
  title     = {An investigation of computational and informational limits in {G}aussian mixture clustering},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {865--872},
  year      = {2006},
}
@inproceedings{feldman05product,
  author    = {Feldman, J. and O'Donnell, R. and Servedio, R. A.},
  title     = {Learning mixtures of product distributions over discrete domains},
  booktitle = {Foundations of Computer Science (FOCS)},
  pages     = {501--510},
  year      = {2005},
}
% NOTE(review): year changed from 2005 to 2004 to agree with JMLR volume 5 -- confirm against jmlr.org.
% The key is kept unchanged so existing citations still resolve.
@article{clark05fsa,
  author  = {Clark, A. and Thollard, F.},
  title   = {{PAC}-learnability of Probabilistic Deterministic Finite State Automata},
  journal = {Journal of Machine Learning Research (JMLR)},
  volume  = {5},
  pages   = {473--497},
  year    = {2004},
}
@article{blackwell57identifiable,
  author  = {Blackwell, D. and Koopmans, L.},
  title   = {On the Identifiability Problem for Functions of Finite {M}arkov Chains},
  journal = {Annals of Mathematical Statistics},
  volume  = {28},
  pages   = {1011--1015},
  year    = {1957},
}
@techreport{adriaans99shallow,
  author      = {Adriaans, P. W.},
  title       = {Learning Shallow Context-Free Languages under Simple Distributions},
  institution = {Stanford University},
  year        = {1999},
}
% Journal name corrected ("Logistic" -> "Logistics").
@article{kuhn55hungarian,
  author  = {Kuhn, H. W.},
  title   = {The {H}ungarian method for the assignment problem},
  journal = {Naval Research Logistics Quarterly},
  volume  = {2},
  pages   = {83--97},
  year    = {1955},
}
@phdthesis{ratnaparkhi98thesis,
  author = {Ratnaparkhi, A.},
  title  = {Maximum entropy models for natural language ambiguity resolution},
  school = {University of Pennsylvania},
  year   = {1998},
}
@inproceedings{mccallum00memm,
  author    = {McCallum, A. and Freitag, D. and Pereira, F.},
  title     = {Maximum Entropy {M}arkov Models for Information Extraction and Segmentation},
  booktitle = {International Conference on Machine Learning (ICML)},
  year      = {2000},
}
@inproceedings{lafferty01crf,
  author    = {Lafferty, J. and McCallum, A. and Pereira, F.},
  title     = {Conditional Random Fields: Probabilistic Models for Segmenting and Labeling Data},
  booktitle = {International Conference on Machine Learning (ICML)},
  pages     = {282--289},
  year      = {2001},
}
@inproceedings{kakade02objective,
  author    = {Kakade, S. and Teh, Y. W. and Roweis, S.},
  title     = {An Alternate Objective Function for {M}arkovian Fields},
  booktitle = {International Conference on Machine Learning (ICML)},
  year      = {2002},
}
@inproceedings{klein02conditional,
  author    = {Klein, D. and Manning, C. D.},
  title     = {Conditional structure versus conditional estimation in {NLP} models},
  booktitle = {Empirical Methods in Natural Language Processing (EMNLP)},
  year      = {2002},
}
@inproceedings{ng02compare,
  author    = {Ng, A. Y. and Jordan, M. I.},
  title     = {On Discriminative vs. Generative classifiers: A comparison of logistic regression and naive {B}ayes},
  booktitle = {Advances in Neural Information Processing Systems (NIPS)},
  year      = {2002},
}
@article{white82mis,
  author  = {White, H.},
  title   = {Maximum likelihood estimation of misspecified models},
  journal = {Econometrica},
  volume  = {50},
  pages   = {1--25},
  year    = {1982},
}
@article{godambe87quasi,
  author  = {Godambe, V. P. and Heyde, C. C.},
  title   = {Quasi-likelihood and Optimal estimation},
  journal = {International Statistical Review},
  volume  = {55},
  pages   = {231--244},
  year    = {1987},
}
@inproceedings{pal06mcl,
  author    = {McCallum, A. and Pal, C. and Druck, G. and Wang, X.},
  title     = {Multi-Conditional Learning: Generative/Discriminative Training for Clustering and Classification},
  booktitle = {Association for the Advancement of Artificial Intelligence (AAAI)},
  year      = {2006},
}
@inproceedings{lasserre06hybrid,
  author    = {Lasserre, J. A. and Bishop, C. M. and Minka, T. P.},
  title     = {Principled Hybrids of Generative and Discriminative Models},
  booktitle = {Computer Vision and Pattern Recognition (CVPR)},
  pages     = {87--94},
  year      = {2006},
}
@inproceedings{raina04hybrid,
  author    = {Raina, R. and Shen, Y. and Ng, A. Y. and McCallum, A.},
  title     = {Classification with hybrid generative/discriminative models},
  booktitle = {Advances in Neural Information Processing Systems (NIPS)},
  year      = {2004},
}
@inproceedings{suzuki07hybrid,
  author    = {Suzuki, J. and Fujino, A. and Isozaki, H.},
  title     = {Semi-Supervised Structured Output Learning based on a Hybrid Generative and Discriminative Approach},
  booktitle = {Empirical Methods in Natural Language Processing and Computational Natural Language Learning (EMNLP/CoNLL)},
  year      = {2007},
}
@inproceedings{bouchard04tradeoff,
  author    = {Bouchard, G. and Triggs, B.},
  title     = {The Trade-Off Between Generative and Discriminative Classifiers},
  booktitle = {International Conference on Computational Statistics},
  pages     = {721--728},
  year      = {2004},
}
@book{vaart98asymptotic,
  author    = {van der Vaart, A. W.},
  title     = {Asymptotic statistics},
  publisher = {Cambridge University Press},
  year      = {1998},
}
@article{besag75pseudo,
  author  = {Besag, J.},
  title   = {Statistical analysis of non-lattice data},
  journal = {The Statistician},
  volume  = {24},
  pages   = {179--195},
  year    = {1975},
}
@article{lindsay88composite,
  author  = {Lindsay, B.},
  title   = {Composite likelihood methods},
  journal = {Contemporary Mathematics},
  volume  = {80},
  pages   = {221--239},
  year    = {1988},
}
@inproceedings{sutton05piecewise,
  author    = {Sutton, C. and McCallum, A.},
  title     = {Piecewise Training of Undirected Models},
  booktitle = {Uncertainty in Artificial Intelligence (UAI)},
  year      = {2005},
}
@inproceedings{sutton07pwpl,
  author    = {Sutton, C. and McCallum, A.},
  title     = {Piecewise Pseudolikelihood for Efficient Training of Conditional Random Fields},
  booktitle = {International Conference on Machine Learning (ICML)},
  year      = {2007},
}
@article{cox04pseudo,
  author  = {Cox, D. R. and Reid, N.},
  title   = {A note on pseudolikelihood constructed from marginal densities},
  journal = {Biometrika},
  volume  = {91},
  pages   = {729--737},
  year    = {2004},
}
@article{varin08composite,
  author  = {Varin, C.},
  title   = {On composite marginal likelihoods},
  journal = {Advances in Statistical Analysis},
  volume  = {92},
  pages   = {1--28},
  year    = {2008},
}
@article{wainwright06wrong,
  author  = {Wainwright, M.},
  title   = {Estimating the ``wrong'' graphical model: Benefits in the computation-limited setting},
  journal = {Journal of Machine Learning Research (JMLR)},
  volume  = {7},
  pages   = {1829--1859},
  year    = {2006},
}
@inproceedings{wainwright03trw,
  author    = {Wainwright, M. and Jaakkola, T. and Willsky, A.},
  title     = {Tree-reweighted belief propagation algorithms and approximate {ML} estimation by pseudo-moment matching},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  year      = {2003},
}
@article{hyvarinen06pseudolikelihood,
  author  = {Hyv{\"a}rinen, A.},
  title   = {Consistency of pseudolikelihood estimation of fully visible {B}oltzmann machines},
  journal = {Neural Computation},
  volume  = {18},
  pages   = {2283--2292},
  year    = {2006},
}
@inproceedings{hinton99poe,
  author    = {Hinton, G.},
  title     = {Products of Experts},
  booktitle = {International Conference on Artificial Neural Networks (ICANN)},
  year      = {1999},
}
@book{robert04mc,
  author    = {Robert, C. P. and Casella, G.},
  title     = {{M}onte {C}arlo Statistical Methods},
  publisher = {Springer},
  year      = {2004},
}
@article{wainwright08varinf,
  author  = {Wainwright, M. and Jordan, M. I.},
  title   = {Graphical models, exponential families, and variational inference},
  journal = {Foundations and Trends in Machine Learning},
  volume  = {1},
  pages   = {1--307},
  year    = {2008},
}
@article{siepel04phylohmm,
  author  = {Siepel, A. and Haussler, D.},
  title   = {Combining phylogenetic and hidden {M}arkov models in biosequence analysis},
  journal = {Journal of Computational Biology},
  volume  = {11},
  pages   = {413--428},
  year    = {2004},
}
@article{felsenstein96phylohmm,
  author  = {Felsenstein, J. and Churchill, G. A.},
  title   = {A hidden {M}arkov model approach to variation among sites in rate of evolution},
  journal = {Molecular Biology and Evolution},
  volume  = {13},
  pages   = {93--104},
  year    = {1996},
}
@article{jojic04phylohmm,
  author  = {Jojic, V. and Jojic, N. and Meek, C. and Geiger, D. and Siepel, A. and Haussler, D. and Heckerman, D.},
  title   = {Efficient approximations for learning phylogenetic {HMM} models from data},
  journal = {Bioinformatics},
  volume  = {20},
  pages   = {161--168},
  year    = {2004},
}
@inproceedings{geiger05structured,
  author    = {Geiger, D. and Meek, C.},
  title     = {Structured Variational Inference Procedures and their Realizations},
  booktitle = {Artificial Intelligence and Statistics (AISTATS)},
  year      = {2005},
}
@inproceedings{shotton06textonboost,
  author    = {Shotton, J. and Winn, J. and Rother, C. and Criminisi, A.},
  title     = {{TextonBoost}: Joint Appearance, Shape and Context Modeling for Multi-Class Object Recognition and Segmentation},
  booktitle = {European Conference on Computer Vision (ECCV)},
  year      = {2006},
}
@article{zhu06grammar,
author = {S. C. Zhu and D. Mumford},
journal = {Foundations and Trends in Computer Graphics and Vision},
pages = {259--362},