-
Notifications
You must be signed in to change notification settings - Fork 0
/
CQAPaper.bib
2414 lines (2216 loc) · 164 KB
/
CQAPaper.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
%% This BibTeX bibliography file was created using BibDesk.
%% http://bibdesk.sourceforge.net/
%% Created for Paul Edlefsen at 2015-10-23 13:42:42 +0200
%% Saved with string encoding Unicode (UTF-8)
@article{Rumelhart:1986,
  Author = {Rumelhart, David E. and Hinton, Geoffrey E. and Williams, Ronald J.},
  Date-Added = {2011-05-01 17:33:41 -0700},
  Date-Modified = {2011-05-01 17:34:07 -0700},
  Issn = {0028-0836},
  Journal = {Nature},
  Number = {6088},
  Pages = {533--536},
  Title = {Learning representations by back-propagating errors},
  Volume = {323},
  Year = {1986}}
@article{Mamitsuka:1998,
  Author = {Mamitsuka, Hiroshi},
  Date-Added = {2011-05-01 17:13:48 -0700},
  Date-Modified = {2011-05-01 17:14:14 -0700},
  Issn = {0887-3585},
  Journal = {Proteins: Structure, Function, and Genetics},
  Number = {4},
  Pages = {460--474},
  Title = {Predicting peptides that bind to {MHC} molecules using supervised learning of hidden {Markov} models},
  Volume = {33},
  Year = {1998}}
@article{Baldi:1994,
  Abstract = {Hidden Markov model (HMM) techniques are used to model families of biological sequences. A smooth and convergent algorithm is introduced to iteratively adapt the transition and emission parameters of the models from the examples in a given family. The HMM approach is applied to three protein families: globins, immunoglobulins, and kinases. In all cases, the models derived capture the important statistical characteristics of the family and can be used for a number of tasks, including multiple alignments, motif detection, and classification. For K sequences of average length N, this approach yields an effective multiple-alignment algorithm which requires $O(KN^2)$ operations, linear in the number of sequences.},
  Author = {Baldi, P and Chauvin, Y and Hunkapiller, T and McClure, M A},
  Date-Added = {2011-05-01 16:52:59 -0700},
  Date-Modified = {2011-05-01 16:53:33 -0700},
  Eprint = {http://www.pnas.org/content/91/3/1059.full.pdf+html},
  Journal = {Proceedings of the National Academy of Sciences},
  Number = {3},
  Pages = {1059--1063},
  Title = {Hidden {Markov} models of biological primary sequence information},
  Volume = {91},
  Year = {1994},
  Bdsk-Url-1 = {http://www.pnas.org/content/91/3/1059.abstract}}
@article{baldi1994smooth,
  Author = {Baldi, Pierre and Chauvin, Yves},
  Journal = {Neural Computation},
  Number = {2},
  Pages = {307--318},
  Title = {Smooth on-line learning algorithms for hidden {Markov} models},
  Volume = {6},
  Year = {1994}}
@article{Hunter:2004,
  Author = {Hunter, David R. and Lange, Kenneth},
  Date-Added = {2011-05-01 16:42:53 -0700},
  Date-Modified = {2011-05-01 16:43:29 -0700},
  Issn = {0003-1305},
  Journal = {The American Statistician},
  Number = {1},
  Pages = {30--37},
  Publisher = {ASA},
  Title = {A tutorial on {MM} algorithms},
  Volume = {58},
  Year = {2004}}
@article{Mamitsuka:1996,
  Author = {Mamitsuka, Hiroshi},
  Date-Added = {2011-05-01 16:38:30 -0700},
  Date-Modified = {2011-05-01 16:39:52 -0700},
  Doi = {10.1089/cmb.1996.3.361},
  Eprint = {http://www.liebertonline.com/doi/pdf/10.1089/cmb.1996.3.361},
  Journal = {Journal of Computational Biology},
  Number = {3},
  Pages = {361--373},
  Title = {A Learning Method of Hidden {Markov} Models for Sequence Discrimination},
  Volume = {3},
  Year = {1996},
  Bdsk-Url-1 = {http://www.liebertonline.com/doi/abs/10.1089/cmb.1996.3.361},
  Bdsk-Url-2 = {http://dx.doi.org/10.1089/cmb.1996.3.361}}
@article{meng:1997aof,
  Author = {Meng, Xiao-Li and van Dyk, David},
  Date-Added = {2009-05-18 20:01:43 -0400},
  Date-Modified = {2009-05-18 20:01:43 -0400},
  Journal = {Journal of the Royal Statistical Society. Series B (Methodological)},
  Number = {3},
  Pages = {511--567},
  Publisher = {Blackwell Publishers},
  Title = {The {EM} algorithm---an old folk-song sung to a fast new tune},
  Volume = {59},
  Year = {1997}}
@unpublished{PreCBW,
  Author = {Edlefsen, Paul T. and Siegel, Andrew F. and Kolker, Eugene},
  Date-Added = {2009-05-18 19:45:42 -0400},
  Date-Modified = {2009-05-18 21:13:45 -0400},
  Note = {unpublished},
  Title = {A conditional maximization procedure for {Profile} hidden {Markov} models},
  Year = {2003}}
@article{ronquist:2003,
  Author = {Ronquist, Fredrik and Huelsenbeck, John P.},
  Date-Added = {2009-05-12 13:17:32 -0400},
  Date-Modified = {2009-05-12 13:17:32 -0400},
  Journal = {Bioinformatics},
  Number = {12},
  Pages = {1572--1574},
  Publisher = {Oxford Univ Press},
  Title = {{MrBayes} 3: {Bayesian} phylogenetic inference under mixed models},
  Volume = {19},
  Year = {2003}}
@article{heinrich-2004,
  Adsnote = {Provided by the Smithsonian/NASA Astrophysics Data System},
  Adsurl = {http://adsabs.harvard.edu/abs/2004physics...9129H},
  Archiveprefix = {arXiv},
  Author = {{Heinrich}, J. and {Blocker}, C. and {Conway}, J. and {Demortier}, L. and {Lyons}, L. and {Punzi}, G. and {Sinervo}, P.~K.},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Eprint = {physics/0409129},
  Journal = {ArXiv Physics e-prints},
  Month = sep,
  Title = {Interval estimation in the presence of nuisance parameters. 1. {Bayesian} approach},
  Year = 2004}
@article{Dempster:IJAR,
  Abstract = {The Dempster-Shafer (DS) theory of probabilistic reasoning is presented in terms of a semantics whereby every meaningful formal assertion is associated with a triple (p, q, r) where p is the probability "for" the assertion, q is the probability "against" the assertion, and r is the probability of "don't know". Arguments are presented for the necessity of "don't know". Elements of the calculus are sketched, including the extension of a DS model from a margin to a full state space, and DS combination of independent DS uncertainty assessments on the full space. The methodology is applied to inference and prediction from Poisson counts, including an introduction to the use of join-tree model structure to simplify and shorten computation. The relation of DS theory to statistical significance testing is elaborated, introducing along the way the new concept of "dull" null hypothesis.},
  Author = {Dempster, A. P.},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-18 21:11:08 -0400},
  Journal = {International Journal of Approximate Reasoning},
  Keywords = {Dempster-Shafer; Belief functions; State space; Poisson model; Join-tree computation; Statistical significance; Dull null hypothesis},
  Pages = {365--377},
  Title = {The {Dempster-Shafer} calculus for statisticians},
  Ty = {JOUR},
  Volume = {48},
  Year = {2008},
  Bdsk-Url-1 = {http://www.sciencedirect.com/science/article/B6V07-4NF7Y50-1/2/93422a4d194c97649d5a67f034772acf}}
@article{Shenoy:1986,
  Author = {Shenoy, Prakash P. and Shafer, Glenn},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Journal = {IEEE Expert},
  Number = {3},
  Pages = {43--52},
  Title = {Propagating belief functions with local computations},
  Volume = {1},
  Year = {1986}}
@article{Dempster:196712,
  Abstract = {This paper provides detailed formulae for upper and lower probability inferences, based on a sample from a finite population with a discrete univariate observable characteristic, and directed towards the unknown parameters of the population or properties of a future sample. The model is set up in $\S2$ and the detailed formulae are given in $\S3$. Section 4 demonstrates a limited relationship with confidence statements and $\S5$ explores some special cases.},
  Author = {Dempster, A. P.},
  Bdsk-Url-1 = {http://links.jstor.org/sici?sici=0006-3444\%5C(196712\%5C)54\%5C:3\%5C/4\%5C\%3C515\%5C:UALPIB\%5C\%3E2.0.CO\%5C;2-A},
  Bdsk-Url-2 = {http://links.jstor.org/sici?sici=0006-3444\%5C\%28196712\%5C\%2954\%5C\%3A3\%5C\%2F4\%5C\%3C515\%5C\%3AUALPIB\%5C\%3E2.0.CO\%5C\%3B2-A},
  Copyright = {Copyright 1967 Biometrika Trust},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Issn = {0006-3444},
  Journal = {Biometrika},
  Jstor_Articletype = {Full Length Article},
  Jstor_Date = {196712},
  Jstor_Formatteddate = {Dec., 1967},
  Month = dec,
  Number = {3/4},
  Pages = {515--528},
  Publisher = {Biometrika Trust},
  Title = {Upper and Lower Probability Inferences Based on a Sample from a Finite Univariate Population},
  Volume = {54},
  Year = {1967}}
@article{Dempster:196704,
  Abstract = {A multivalued mapping from a space $X$ to a space $S$ carries a probability measure defined over subsets of $X$ into a system of upper and lower probabilities over subsets of $S$. Some basic properties of such systems are explored in Sections 1 and 2. Other approaches to upper and lower probabilities are possible and some of these are related to the present approach in Section 3. A distinctive feature of the present approach is a rule for conditioning, or more generally, a rule for combining sources of information, as discussed in Sections 4 and 5. Finally, the context in statistical inference from which the present theory arose is sketched briefly in Section 6.},
  Author = {Dempster, A. P.},
  Bdsk-Url-1 = {http://links.jstor.org/sici?sici=0003-4851\%5C(196704\%5C)38\%5C:2\%5C\%3C325\%5C:UALPIB\%5C\%3E2.0.CO\%5C;2-A},
  Bdsk-Url-2 = {http://links.jstor.org/sici?sici=0003-4851\%5C\%28196704\%5C\%2938\%5C\%3A2\%5C\%3C325\%5C\%3AUALPIB\%5C\%3E2.0.CO\%5C\%3B2-A},
  Copyright = {Copyright 1967 Institute of Mathematical Statistics},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Issn = {0003-4851},
  Journal = {The Annals of Mathematical Statistics},
  Jstor_Articletype = {Full Length Article},
  Jstor_Date = {196704},
  Jstor_Formatteddate = {Apr., 1967},
  Month = apr,
  Number = {2},
  Pages = {325--339},
  Publisher = {Institute of Mathematical Statistics},
  Title = {Upper and Lower Probabilities Induced by a Multivalued Mapping},
  Volume = {38},
  Year = {1967}}
@article{Dempster:196806,
  Abstract = {Within the class of models producing upper and lower probability systems, as discussed in Dempster (1967a), a simple and important subclass may be characterized by random intervals on the line. Detailed expressions are given here for the upper and lower probabilities of a general fixed closed interval determined by a general random closed interval. Such random closed intervals occur in the applications of the general class of models to statistical inference described in Dempster (1966, 1967b, 1968). The illustration given here concerns inference about binomial $p$ and stresses the flexibility allowed in the introduction of prior information.},
  Author = {Dempster, A. P.},
  Bdsk-Url-1 = {http://links.jstor.org/sici?sici=0003-4851\%5C(196806\%5C)39\%5C:3\%5C\%3C957\%5C:UALPGB\%5C\%3E2.0.CO\%5C;2-L},
  Bdsk-Url-2 = {http://links.jstor.org/sici?sici=0003-4851\%5C\%28196806\%5C\%2939\%5C\%3A3\%5C\%3C957\%5C\%3AUALPGB\%5C\%3E2.0.CO\%5C\%3B2-L},
  Copyright = {Copyright 1968 Institute of Mathematical Statistics},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Issn = {0003-4851},
  Journal = {The Annals of Mathematical Statistics},
  Jstor_Articletype = {Full Length Article},
  Jstor_Date = {196806},
  Jstor_Formatteddate = {Jun., 1968},
  Month = jun,
  Number = {3},
  Pages = {957--966},
  Publisher = {Institute of Mathematical Statistics},
  Title = {Upper and Lower Probabilities Generated by a Random Closed Interval},
  Volume = {39},
  Year = {1968}}
@article{Dempster:1968,
  author = {Dempster, A. P.},
  title = {A Generalization of {Bayesian} Inference},
  journal = {Journal of the Royal Statistical Society. Series B (Methodological)},
  volume = {30},
  number = {2},
  pages = {205--247},
  year = {1968},
  publisher = {Royal Statistical Society},
  issn = {0035-9246},
  copyright = {Copyright 1968 Royal Statistical Society},
  abstract = {Procedures of statistical inference are described which generalize Bayesian inference in specific ways. Probability is used in such a way that in general only bounds may be placed on the probabilities of given events, and probability systems of this kind are suggested both for sample information and for prior information. These systems are then combined using a specified rule. Illustrations are given for inferences about trinomial probabilities, and for inferences about a monotone sequence of binomial $p_i$. Finally, some comments are made on the general class of models which produce upper and lower probabilities, and on the specific models which underlie the suggested inference procedures.},
  jstor_articletype = {Full Length Article},
  jstor_date = {1968},
  jstor_formatteddate = {1968},
  date-added = {2009-05-09 14:19:07 -0400},
  date-modified = {2009-05-18 21:09:12 -0400},
  bdsk-url-1 = {http://links.jstor.org/sici?sici=0035-9246\%5C(1968\%5C)30\%5C:2\%5C\%3C205\%5C:AGOBI\%5C\%3E2.0.CO\%5C;2-J},
  bdsk-url-2 = {http://links.jstor.org/sici?sici=0035-9246\%5C\%281968\%5C\%2930\%5C\%3A2\%5C\%3C205\%5C\%3AAGOBI\%5C\%3E2.0.CO\%5C\%3B2-J},
}
@article{Kohlas:1994fk,
  Abstract = {The mathematical theory of evidence has been introduced by Glenn Shafer in 1976 as a new approach to the representation of uncertainty. This theory can be represented under several distinct but more or less equivalent forms. Probabilistic interpretations of evidence theory have their roots in Arthur Dempster's multivalued mappings of probability spaces. This leads to random set and more generally to random filter models of evidence. In this probabilistic view evidence is seen as more or less probable arguments for certain hypotheses and they can be used to support those hypotheses to certain degrees. These degrees of support are in fact the reliabilities with which the hypotheses can be derived from the evidence. Alternatively, the mathematical theory of evidence can be founded axiomatically on the notion of belief functions or on the allocation of belief masses to subsets of a frame of discernment. These approaches aim to present evidence theory as an extension of probability theory. Evidence theory has been used to represent uncertainty in expert systems, especially in the domain of diagnostics. It can be applied to decision analysis and it gives a new perspective for statistical analysis. Among its further applications are image processing, project planning and scheduling and risk analysis. The computational problems of evidence theory are well understood and even though the problem is complex, efficient methods are available.},
  Author = {Kohlas, J{\"u}rg and Monney, Paul-Andr{\'e}},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Doi = {10.1007/BF01440734},
  Journal = {Mathematical Methods of Operations Research},
  M3 = {10.1007/BF01440734},
  Number = {1},
  Pages = {35--68},
  Title = {Theory of evidence: A survey of its mathematical foundations, applications and computational aspects},
  Ty = {JOUR},
  Volume = {39},
  Year = {1994},
  Bdsk-Url-1 = {http://dx.doi.org/10.1007/BF01440734}}
@article{Kennes:1992lr,
  Author = {Kennes, R.},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Issn = {0018-9472},
  Journal = {IEEE Transactions on Systems, Man, and Cybernetics},
  Journal1 = {Systems, Man and Cybernetics, IEEE Transactions on},
  Keywords = {Boolean algebra; directed graphs; Boolean lattice; Dempster's rule; Dempster-Shafer theory; Mobius transformation; general binary relations},
  Number = {2},
  Pages = {201--223},
  Title = {Computational aspects of the {M{\"o}bius} transformation of graphs},
  Title1 = {Systems, Man and Cybernetics, IEEE Transactions on},
  Ty = {JOUR},
  Volume = {22},
  Year = {1992}}
@article{searches_bosons,
  Author = {Igo-Kemenes, P.},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-18 21:23:18 -0400},
  Editor = {Yao, W.-M. and others},
  Journal = {Journal of Physics G},
  Number = {1},
  Series = {The Review of Particle Physics},
  Title = {Searches for {Higgs} bosons},
  Volume = {33},
  Year = {2006},
  Bdsk-Url-1 = {http://pdg.lbl.gov/2006/reviews/higgs_s055.pdf}}
@article{rolke-2005-551,
  Author = {Rolke, Wolfgang A. and Lopez, Angel M. and Conrad, Jan},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Journal = {Nuclear Instruments and Methods in Physics Research Section A: Accelerators, Spectrometers, Detectors and Associated Equipment},
  Pages = {493},
  Title = {Limits and Confidence Intervals in the Presence of Nuisance Parameters},
  Volume = {551},
  Year = {2005},
  Bdsk-Url-1 = {http://www.citebase.org/abstract?id=oai:arXiv.org:physics/0403059}}
@article{Cobb:2006,
  Author = {Cobb, Barry R. and Shenoy, Prakash P.},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Journal = {International Journal of Approximate Reasoning},
  Month = apr,
  Number = {3},
  Pages = {314--330},
  Title = {On the Plausibility Transformation Method for Translating Belief Function Models to Probability Models},
  Volume = {41},
  Year = {2006}}
@book{Almond:1995,
  author = {Almond, Russell G.},
  title = {Graphical belief modeling},
  publisher = {Chapman \& Hall},
  address = {London},
  year = {1995},
  isbn = {0412066610 9780412066610},
  language = {English},
  db = {WorldCat},
  id = {31374056},
  ty = {BOOK},
  date-added = {2009-05-09 14:19:07 -0400},
  date-modified = {2009-05-10 14:45:35 -0400},
  bdsk-url-1 = {http://worldcat.org},
}
@book{Kohlas:uq,
  Author = {Kohlas, J{\"u}rg and Monney, Paul-Andr{\'e}},
  Call-Number = {QA273},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Dewey-Call-Number = {519.5/4},
  Genre = {Probabilities},
  Publisher = {Springer},
  Series = {Lecture Notes in Economics and Mathematical Systems},
  Title = {A mathematical theory of hints: an approach to the {Dempster-Shafer} theory of evidence},
  Volume = {425},
  Year = {1995}}
@book{Shafer:1976qy,
  author = {Shafer, Glenn},
  title = {A mathematical theory of evidence},
  publisher = {Princeton University Press},
  address = {Princeton, N.J.},
  year = {1976},
  genre = {Probabilities},
  date-added = {2009-05-09 14:19:07 -0400},
  date-modified = {2009-05-09 14:19:07 -0400},
}
@incollection{Thoma:1991,
  Address = {Amsterdam},
  Author = {Thoma, H. M.},
  Booktitle = {Conditional Logic in Expert Systems},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Editor = {Goodman, I. R. and Gupta, M. M. and Nguyen, H. T. and Rogers, G. S.},
  Pages = {269--308},
  Publisher = {North-Holland},
  Title = {Belief Function Computations},
  Year = 1991}
@inproceedings{Pearl:1982,
  Author = {{Pearl}, J.},
  Booktitle = {Proceedings American Association of Artificial Intelligence National Conference on AI},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Pages = {133--136},
  Title = {Reverend {Bayes} on inference engines: A distributed hierarchical approach},
  Year = 1982}
@inproceedings{Punzi,
  Adsnote = {Provided by the Smithsonian/NASA Astrophysics Data System},
  Adsurl = {http://adsabs.harvard.edu/abs/2006sppp.conf...88P},
  Author = {{Punzi}, G.},
  Booktitle = {Statistical Problems in Particle Physics, Astrophysics and Cosmology},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Editor = {{Lyons}, L. and {Karag{\"o}z {\"U}nel}, M.},
  Pages = {88},
  Title = {Ordering Algorithms and Confidence Intervals in the Presence of Nuisance Parameters},
  Year = 2006}
@inproceedings{Demortier,
  Adsnote = {Provided by the Smithsonian/NASA Astrophysics Data System},
  Adsurl = {http://adsabs.harvard.edu/abs/2006sppp.conf...11D},
  Author = {{Demortier}, L.},
  Booktitle = {Statistical Problems in Particle Physics, Astrophysics and Cosmology},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Editor = {{Lyons}, L. and {Karag{\"o}z {\"U}nel}, M.},
  Pages = {11},
  Title = {{Bayesian} Reference Analysis},
  Year = 2006}
@inproceedings{Cranmer,
  Adsnote = {Provided by the Smithsonian/NASA Astrophysics Data System},
  Adsurl = {http://adsabs.harvard.edu/abs/2003sppp.conf..261C},
  Author = {{Cranmer}, K.},
  Booktitle = {Statistical Problems in Particle Physics, Astrophysics, and Cosmology},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Editor = {{Lyons}, L. and {Mount}, R. and {Reitmeyer}, R.},
  Pages = {261},
  Title = {Frequentist Hypothesis Testing with Background Uncertainty},
  Year = 2003}
@inproceedings{conrad-2006,
  Adsnote = {Provided by the Smithsonian/NASA Astrophysics Data System},
  Adsurl = {http://adsabs.harvard.edu/abs/2006sppp.conf...93C},
  Author = {{Conrad}, J. and {Tegenfeldt}, F.},
  Booktitle = {Statistical Problems in Particle Physics, Astrophysics and Cosmology},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Editor = {{Lyons}, L. and {Karag{\"o}z {\"U}nel}, M.},
  Pages = {93},
  Title = {Likelihood Ratio Intervals with {Bayesian} Treatment of Uncertainties: Coverage, Power and Combined Experiments},
  Year = 2006}
@inproceedings{Cousins,
  author = {Cousins, Robert D.},
  title = {Treatment of Nuisance Parameters in High Energy Physics, and Possible Justifications and Improvements in the Statistics Literature},
  booktitle = {PHYSTAT 05},
  year = {2005},
  date-added = {2009-05-09 14:19:07 -0400},
  date-modified = {2009-05-09 14:19:07 -0400},
  bdsk-url-1 = {http://www.physics.ox.ac.uk/phystat05/proceedings/files/oxford_cousins_final.pdf},
}
@inproceedings{Reid,
  Author = {Reid, N.},
  Booktitle = {PHYSTAT 05},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Title = {Response (to {Cousins})},
  Year = {2005},
  Bdsk-Url-1 = {http://www.physics.ox.ac.uk/phystat05/proceedings/files/Reid-response.pdf}}
@inproceedings{heinrich-2007,
  Author = {Heinrich, Joel},
  Booktitle = {Proceedings of the 2007 {PHYSTAT} {LHC} Workshop on Statistical Issues for {LHC} Physics},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Editor = {{Prosper}, H. B. and {Lyons}, L. and {De Roeck}, A.},
  Pages = {133--142},
  Title = {Review of the {Banff} Challenge on Upper Limits},
  Year = {2008},
  Bdsk-Url-1 = {http://physics.rockefeller.edu/~luc/proceedings/phystat2007_heinrich.pdf}}
@misc{Atlas,
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-10 14:46:41 -0400},
  Howpublished = {http://atlas.ch/},
  Key = {ATLAS},
  Title = {The {ATLAS} Experiment},
  Bdsk-Url-1 = {http://atlas.ch/}}
@unpublished{a1_project_site,
  Author = {Heinrich, Joel},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-18 21:28:09 -0400},
  Month = jul,
  Note = {http://newton.hep.upenn.edu/\textasciitilde{}heinrich/birs/},
  Title = {{BIRS} {A1} Limits Project},
  Year = {2006},
  Bdsk-Url-1 = {http://newton.hep.upenn.edu/~heinrich/birs/}}
@unpublished{a1,
  Author = {Heinrich, Joel},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-18 21:22:37 -0400},
  Month = jul,
  Note = {http://newton.hep.upenn.edu/\textasciitilde{}heinrich/birs/project.pdf},
  Title = {Limits Comparison Project},
  Year = {2006},
  Bdsk-Url-1 = {http://newton.hep.upenn.edu/~heinrich/birs/project.pdf}}
@phdthesis{Kong:thesis,
  author = {Kong, A.},
  title = {Multivariate Belief Functions and Graphical Models},
  school = {Department of Statistics, Harvard University},
  year = {1986},
  date-added = {2009-05-09 14:19:07 -0400},
  date-modified = {2009-05-09 14:19:07 -0400},
}
@phdthesis{Almond:thesis,
  author = {Almond, Russell G.},
  title = {Fusion and Propagation of Graphical Belief Models: An Implementation and an Example},
  school = {Harvard University},
  year = {1989},
  date-added = {2009-05-09 14:19:07 -0400},
  date-modified = {2009-05-09 14:19:07 -0400},
}
@phdthesis{Thoma:thesis,
  author = {Thoma, H. M.},
  title = {Factorization of belief functions},
  school = {Statistics Department, Harvard University},
  address = {Cambridge, MA},
  year = {1989},
  date-added = {2009-05-09 14:19:07 -0400},
  date-modified = {2009-05-09 14:19:07 -0400},
}
@techreport{Almond:1988,
  Author = {Almond, Russell G.},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Institution = {Statistics Department, Harvard University},
  Month = jun,
  Number = {S-121},
  Title = {Fusion and Propagation in Graphical Belief Models},
  Year = {1988},
  Bdsk-Url-1 = {http://ralmond.net/pubs/captain.pdf}}
@techreport{blimitguide,
  Author = {Heinrich, Joel},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-18 21:10:14 -0400},
  Institution = {The Collider Detector at Fermilab},
  Month = oct,
  Number = {7232},
  Title = {User Guide to {Bayesian-Limit} Software Package},
  Year = {2004},
  Bdsk-Url-1 = {http://www-cdf.fnal.gov/publications/cdf7232_blimitguide.pdf}}
@techreport{genlimit,
  Author = {Heinrich, Joel},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Institution = {The Collider Detector at Fermilab},
  Month = apr,
  Number = {7587},
  Title = {{Bayesian} limit software: multi-channel with correlated backgrounds and efficiencies},
  Year = {2005},
  Bdsk-Url-1 = {http://www-cdf.fnal.gov/publications/cdf7587_genlimit.pdf}}
@unpublished{birs_workshop_objectives,
  author = {Linnemann, James and Lyons, Louis and Reid, Nancy},
  title = {{BIRS} Workshop on Statistical Inference Problems in High Energy Physics and Astronomy Objectives Document},
  note = {http://www.birs.ca/workshops/2006/06w5054/Objectives06w5054.html},
  month = jul,
  year = {2006},
  date-added = {2009-05-09 14:19:07 -0400},
  date-modified = {2009-05-18 21:28:32 -0400},
  bdsk-url-1 = {http://www.birs.ca/workshops/2006/06w5054/Objectives06w5054.html},
}
@article{PaulsPosterAtHIVDynamics2015,
  Author = {Edlefsen, Paul T.},
  Title = {Poster {Abstract}: Identifying within-host {HIV-1} subpopulations by cosegregation of {Profile} {Hidden} {Markov} {Model} update vectors},
  Journal = {{HIV} Dynamics and Evolution},
  Month = may,
  Year = {2015}}
@unpublished{birs_workshop_report,
  Author = {Linnemann, James and Lyons, Louis and Reid, Nancy},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Month = feb,
  Note = {http://www.birs.ca/workshops/2006/06w5054/report06w5054.pdf},
  Title = {Report for Workshop 06w5054: Statistical Inference Problems in High Energy Physics and Astronomy},
  Year = {2007},
  Bdsk-Url-1 = {http://www.birs.ca/workshops/2006/06w5054/report06w5054.pdf}}
@unpublished{a1_slides,
  Author = {Heinrich, Joel},
  Date-Added = {2009-05-09 14:19:07 -0400},
  Date-Modified = {2009-05-09 14:19:07 -0400},
  Month = jul,
  Note = {http://newton.hep.upenn.edu/\textasciitilde{}heinrich/birs/a1.pdf},
  Title = {Setting the Scene for Limits and Nuisance Parameters},
  Year = {2006},
  Bdsk-Url-1 = {http://newton.hep.upenn.edu/~heinrich/birs/a1.pdf}}
@article{Karplus1998,
  Author = {Karplus, K and Barrett, C and Hughey, R},
  Doi = {10.1093/bioinformatics/14.10.846},
  Journal = {Bioinformatics},
  Number = {10},
  Pages = {846--856},
  Pubmedid = {9927713},
  Title = {Hidden {Markov} models for detecting remote protein homologies},
  Volume = {14},
  Year = {1998},
  Bdsk-Url-1 = {http://dx.doi.org/10.1093/bioinformatics/14.10.846}}
@techreport{SAMDocumentation,
  Author = {Hughey, R. and Karplus, K. and Krogh, A.},
  Date-Added = {2009-05-06 06:15:02 -0400},
  Date-Modified = {2009-05-06 06:18:02 -0400},
  Institution = {Baskin School of Engineering, University of California, Santa Cruz},
  Number = {UCSC-CRL-99-11, updated for SAM Version 3.4},
  Title = {{SAM} Sequence Alignment and Modeling Software System},
  Year = {2003}}
@article{KullbackLeibler,
  Author = {Kullback, S. and Leibler, R. A.},
  Doi = {10.1214/aoms/1177729694},
  Journal = {The Annals of Mathematical Statistics},
  Number = {1},
  Pages = {79--86},
  Title = {On information and sufficiency},
  Volume = {22},
  Year = {1951},
  Bdsk-Url-1 = {http://dx.doi.org/10.1214/aoms/1177729694}}
@unpublished{HMMerUsersGuide,
  Author = {Eddy, S. R.},
  Date-Added = {2009-05-06 06:11:52 -0400},
  Date-Modified = {2009-05-06 06:11:52 -0400},
  Note = {St Louis, MO: Washington University School of Medicine},
  Title = {{HMMER} User's Guide: Biological sequence analysis using profile hidden {Markov} models},
  Year = {1998}}
@unpublished{HMMerUsersGuide3.1,
  Author = {Eddy, S. R. and Wheeler, T. J.},
  Note = {http://hmmer.janelia.org/},
  Title = {{HMMER} User's Guide, version 3.1},
  Year = {2013}}
@article{PHMMLogos,
Abstract = {BACKGROUND:Profile Hidden Markov Models (pHMMs) are a widely used tool for protein family research. Up to now, however, there exists no method to visualize all of their central aspects graphically in an intuitively understandable way.RESULTS:We present a visualization method that incorporates both emission and transition probabilities of the pHMM, thus extending sequence logos introduced by Schneider and Stephens. For each emitting state of the pHMM, we display a stack of letters. The stack height is determined by the deviation of the position's letter emission frequencies from the background frequencies. The stack width visualizes both the probability of reaching the state (the hitting probability) and the expected number of letters the state emits during a pass through the model (the state's expected contribution).A web interface offering online creation of HMM Logos and the corresponding source code can be found at the Logos web server of the Max Planck Institute for Molecular Genetics http://logos.molgen.mpg.de.CONCLUSIONS:We demonstrate that HMM Logos can be a useful tool for the biologist: We use them to highlight differences between two homologous subfamilies of GTPases, Rab and Ras, and we show that they are able to indicate structural elements of Ras.},
Author = {Schuster-B{\"o}ckler, Benjamin and Schultz, J{\"o}rg and Rahmann, Sven},
Date-Added = {2009-05-05 12:28:31 -0400},
Date-Modified = {2009-05-18 21:21:51 -0400},
Doi = {10.1186/1471-2105-5-7},
Issn = {1471-2105},
Journal = {BMC Bioinformatics},
Number = {1},
Pages = {7},
Pubmedid = {14736340},
Title = {{HMM Logos} for visualization of protein families},
Volume = {5},
Year = {2004},
Bdsk-Url-1 = {http://www.biomedcentral.com/1471-2105/5/7},
Bdsk-Url-2 = {http://dx.doi.org/10.1186/1471-2105-5-7}}
@article{letunic2006sdc,
Annote = {Uses HMMer},
Author = {Letunic, I. and Copley, R. R. and Pils, B. and Pinkert, S. and Schultz, J. and Bork, P.},
Date-Added = {2009-05-05 07:51:56 -0400},
Date-Modified = {2009-05-05 07:52:08 -0400},
Journal = {Nucleic Acids Research},
Keywords = {HMMer},
Number = {Database Issue},
Pages = {D257--D260},
Publisher = {Oxford Univ Press},
Title = {{SMART} 5: domains in the context of genomes and networks},
Volume = {34},
Year = {2006}}
@article{haft2003tdp,
Annote = {Uses HMMer},
Author = {Haft, D. H. and Selengut, J. D. and White, O.},
Date-Added = {2009-05-05 07:49:57 -0400},
Date-Modified = {2009-05-05 07:50:30 -0400},
Journal = {Nucleic Acids Research},
Keywords = {HMMer},
Number = {1},
Pages = {371--373},
Publisher = {Oxford Univ Press},
Title = {The {TIGRFAMs} database of protein families},
Volume = {31},
Year = {2003}}
@article{madera2002cph,
Author = {Madera, M. and Gough, J.},
Date-Added = {2009-05-05 07:42:02 -0400},
Date-Modified = {2009-05-05 07:42:02 -0400},
Journal = {Nucleic Acids Research},
Number = {19},
Pages = {4321--4328},
Publisher = {Oxford Univ Press},
Title = {A comparison of profile hidden {Markov} model procedures for remote homology detection},
Volume = {30},
Year = {2002}}
@article{coin:2003,
Author = {Coin, L. and Bateman, A. and Durbin, R.},
Date-Added = {2009-05-05 07:40:15 -0400},
Date-Modified = {2009-05-05 07:40:15 -0400},
Journal = {Proceedings of the National Academy of Sciences},
Number = {8},
Pages = {4516--4520},
Publisher = {National Acad Sciences},
Title = {Enhanced protein domain discovery by using language modeling techniques from speech recognition},
Volume = {100},
Year = {2003}}
@article{coin:2004,
Author = {Coin, L. and Bateman, A. and Durbin, R.},
Date-Added = {2009-05-05 07:38:24 -0400},
Date-Modified = {2009-05-05 07:38:24 -0400},
Journal = {BMC Bioinformatics},
Number = {1},
Pages = {56},
Publisher = {BioMed Central Ltd},
Title = {Enhanced protein domain discovery using taxonomy},
Volume = {5},
Year = {2004}}
@article{hargbo:1999,
Address = {New York},
Author = {Hargbo, J. and Elofsson, A.},
Date-Added = {2009-05-05 07:36:05 -0400},
Date-Modified = {2009-05-05 07:36:05 -0400},
Journal = {Proteins: Structure, Function, and Genetics},
Number = {1},
Pages = {68--76},
Publisher = {John Wiley \& Sons, Inc.},
Title = {Hidden {Markov} models that use predicted secondary structures for fold recognition},
Volume = {36},
Year = {1999}}
@article{karchin:2003,
Address = {New York},
Author = {Karchin, R. and Cline, M. and Mandel-Gutfreund, Y. and Karplus, K.},
Date-Added = {2009-05-05 07:34:34 -0400},
Date-Modified = {2009-05-05 07:34:34 -0400},
Journal = {Proteins: Structure, Function, and Genetics},
Number = {4},
Pages = {504--514},
Publisher = {Wiley Subscription Services, Inc., A Wiley Company},
Title = {Hidden {Markov} models that use predicted local structure for fold recognition: alphabets of backbone geometry},
Volume = {51},
Year = {2003}}
@article{qian:2003,
Address = {Hoboken},
Author = {Qian, B. and Goldstein, R. A.},
Date-Added = {2009-05-05 07:31:28 -0400},
Date-Modified = {2009-05-05 07:31:28 -0400},
Journal = {Proteins: Structure, Function, and Genetics},
Number = {3},
Pages = {446--453},
Publisher = {Wiley Subscription Services, Inc., A Wiley Company},
Title = {Detecting distant homologs using phylogenetic tree-based {HMMs}},
Volume = {52},
Year = {2003}}
@article{mitchison:1995,
Author = {Mitchison, G. and Durbin, R.},
Date-Added = {2009-05-05 07:27:41 -0400},
Date-Modified = {2009-05-05 07:27:41 -0400},
Journal = {Journal of Molecular Evolution},
Number = {6},
Pages = {1139--1151},
Publisher = {Springer},
Title = {Tree-based maximal likelihood substitution matrices and hidden {Markov} models},
Volume = {41},
Year = {1995}}
@inproceedings{eddy:1995,
Author = {Eddy, S. R.},
Booktitle = {Proceedings of the Third International Conference on Intelligent Systems for Molecular Biology},
Date-Added = {2009-05-04 16:44:18 -0400},
Date-Modified = {2009-05-04 16:44:18 -0400},
Pages = {114--120},
Title = {Multiple alignment using hidden {Markov} models},
Volume = {3},
Year = {1995}}
@article{scott:2002,
Author = {Scott, S. L.},
Date-Added = {2009-05-02 12:22:56 -0400},
Date-Modified = {2009-05-02 12:22:56 -0400},
Journal = {Journal of the American Statistical Association},
Number = {457},
Pages = {337--352},
Publisher = {ASA},
Title = {{Bayesian} methods for hidden {Markov} models: Recursive computing in the 21st century},
Volume = {97},
Year = {2002}}
@article{edlefsen2010transposon,
Author = {Edlefsen, Paul T. and Liu, Jun S.},
Journal = {BMC Genomics},
Number = {Suppl 1},
Pages = {S10},
Publisher = {BioMed Central Ltd},
Title = {Transposon identification using {Profile HMMs}},
Volume = {11},
Year = {2010}}
@article{sonnhammer:1997,
Address = {Hoboken},
Author = {Sonnhammer, E. L. L. and Eddy, S. R. and Durbin, R.},
Date-Added = {2009-05-01 12:48:45 -0400},
Date-Modified = {2009-05-01 12:48:45 -0400},
Journal = {Proteins: Structure, Function, and Genetics},
Number = {3},
Pages = {405--420},
Publisher = {Wiley Subscription Services, Inc., A Wiley Company},
Title = {{Pfam}: a comprehensive database of protein domain families based on seed alignments},
Volume = {28},
Year = {1997}}
@article{schwartz:2003,
Author = {Schwartz, S. and Kent, W. J. and Smit, A. and Zhang, Z. and Baertsch, R. and Hardison, R. C. and Haussler, D. and Miller, W.},
Date-Added = {2009-04-29 16:27:02 -0400},
Date-Modified = {2009-05-10 14:47:14 -0400},
Journal = {Genome Research},
Number = {1},
Pages = {103--107},
Publisher = {Cold Spring Harbor Laboratory Press},
Title = {Human-mouse alignments with {BLASTZ}},
Volume = {13},
Year = {2003}}
@article{rosenbloom:2008,
Author = {Rosenbloom, K. and Taylor, J. and Schaeffer, S. and Kent, J. and Haussler, D. and Miller, W.},
Date-Added = {2009-04-29 16:25:18 -0400},
Date-Modified = {2009-04-29 16:25:18 -0400},
Journal = {Methods in Molecular Biology},
Pages = {133--144},
Publisher = {Springer},
Title = {Phylogenomic resources at the {UCSC Genome Browser}},
Volume = {422},
Year = {2008}}
@article{kent:2003,
Author = {Kent, W. J. and Baertsch, R. and Hinrichs, A. and Miller, W. and Haussler, D.},
Date-Added = {2009-04-29 16:23:44 -0400},
Date-Modified = {2009-04-29 16:23:44 -0400},
Journal = {Proceedings of the National Academy of Sciences},
Number = {20},
Pages = {11484--11489},
Publisher = {National Acad Sciences},
Title = {Evolution's cauldron: Duplication, deletion, and rearrangement in the mouse and human genomes},
Volume = {100},
Year = {2003}}
@book{eddy:1992,
Annote = {Catalogue export also listed as corporate author: School of Medicine and Dept. of Genetics and National Human Genome Research Institute (US)},
Author = {Eddy, S.},
Date-Added = {2009-04-28 14:47:10 -0400},
Date-Modified = {2009-04-28 14:47:10 -0400},
Publisher = {Washington University School of Medicine},
Title = {{HMMER} profile hidden {Markov} models for biological sequence analysis},
Year = {1992}}
@article{hughey:1996,
Author = {Hughey, R. and Krogh, A.},
Date-Added = {2009-04-28 14:44:54 -0400},
Date-Modified = {2009-04-28 14:44:54 -0400},
Journal = {Bioinformatics},
Number = {2},
Pages = {95--107},
Publisher = {Oxford Univ Press},
Title = {Hidden {Markov} models for sequence analysis: extension and analysis of the basic method},
Volume = {12},
Year = {1996}}
@unpublished{SAM,
Author = {Hughey, R. and Krogh, A.},
Note = {Santa Cruz: University of California},
Title = {{SAM}: Sequence alignment and modeling software system},
Year = {1995}}
@article{Needleman:1970,
Author = {Needleman, S. B. and Wunsch, C. D.},
Date-Added = {2009-04-28 13:17:15 -0400},
Date-Modified = {2009-04-28 14:04:42 -0400},
Journal = {Journal of Molecular Biology},
Number = {3},
Pages = {443--453},
Title = {A general method applicable to the search for similarities in the amino acid sequence of two proteins},
Volume = {48},
Year = {1970}}
@article{altschul:1990,
Author = {Altschul, S. F. and Gish, W. and Miller, W. and Myers, E. W. and Lipman, D. J.},
Date-Added = {2009-04-28 13:16:02 -0400},
Date-Modified = {2009-04-28 13:16:02 -0400},
Journal = {Journal of Molecular Biology},
Number = {3},
Pages = {403--410},
Title = {Basic local alignment search tool},
Volume = {215},
Year = {1990}}
@article{smith:1981,
Author = {Smith, T. F. and Waterman, M. S.},
Date-Added = {2009-04-28 13:06:53 -0400},
Date-Modified = {2009-04-28 13:06:53 -0400},
Journal = {Journal of Molecular Biology},
Number = {1},
Pages = {195--197},
Title = {Identification of common molecular subsequences},
Volume = {147},
Year = {1981}}
@article{Wong:2008wj,
Abstract = {The statistical methods applied to the analysis of genomic data do not account for uncertainty in the sequence alignment. Indeed, the alignment is treated as an observation, and all of the subsequent inferences depend on the alignment being correct. This may not have been too problematic for many phylogenetic studies, in which the gene is carefully chosen for, among other things, ease of alignment. However, in a comparative genomics study, the same statistical methods are applied repeatedly on thousands of genes, many of which will be difficult to align. Using genomic data from seven yeast species, we show that uncertainty in the alignment can lead to several problems, including different alignment methods resulting in different conclusions. },
Author = {Wong, Karen M. and Suchard, Marc A. and Huelsenbeck, John P.},
Date-Added = {2009-04-28 11:57:31 -0400},
Date-Modified = {2009-04-28 11:57:31 -0400},
Doi = {10.1126/science.1151532},
Journal = {Science},
Journal1 = {Science},
Number = {5862},
Pages = {473--476},
Title = {Alignment Uncertainty and Genomic Analysis},
Ty = {JOUR},
Volume = {319},
Year = {2008},
Bdsk-Url-1 = {http://www.sciencemag.org/cgi/content/abstract/319/5862/473}}
@article{thompson:1994,
Author = {Thompson, J. D. and Higgins, D. G. and Gibson, T. J.},
Date-Added = {2009-04-28 11:57:31 -0400},
Date-Modified = {2009-04-28 11:57:31 -0400},
Journal = {Nucleic Acids Research},
Number = {22},
Pages = {4673--4680},
Title = {{CLUSTAL W}: improving the sensitivity of progressive multiple sequence alignment through sequence weighting, position-specific gap penalties and weight matrix choice},
Volume = {22},
Year = {1994}}
@article{katoh:2005,
Author = {Katoh, K. and Kuma, K. and Toh, H. and Miyata, T.},
Date-Added = {2009-04-28 11:57:31 -0400},
Date-Modified = {2009-04-28 11:57:31 -0400},
Journal = {Nucleic Acids Research},
Number = {2},
Pages = {511--518},
Publisher = {Oxford Univ Press},
Title = {{MAFFT} version 5: improvement in accuracy of multiple sequence alignment},
Volume = {33},
Year = {2005}}
@article{Edgar:2004bmc,
Abstract = {BACKGROUND:In a previous paper, we introduced MUSCLE, a new program for creating multiple alignments of protein sequences, giving a brief summary of the algorithm and showing MUSCLE to achieve the highest scores reported to date on four alignment accuracy benchmarks. Here we present a more complete discussion of the algorithm, describing several previously unpublished techniques that improve biological accuracy and / or computational complexity. We introduce a new option, MUSCLE-fast, designed for high-throughput applications. We also describe a new protocol for evaluating objective functions that align two profiles.RESULTS:We compare the speed and accuracy of MUSCLE with CLUSTALW, Progressive POA and the MAFFT script FFTNS1, the fastest previously published program known to the author. Accuracy is measured using four benchmarks: BAliBASE, PREFAB, SABmark and SMART. We test three variants that offer highest accuracy (MUSCLE with default settings), highest speed (MUSCLE-fast), and a carefully chosen compromise between the two (MUSCLE-prog). We find MUSCLE-fast to be the fastest algorithm on all test sets, achieving average alignment accuracy similar to CLUSTALW in times that are typically two to three orders of magnitude less. MUSCLE-fast is able to align 1,000 sequences of average length 282 in 21 seconds on a current desktop computer.CONCLUSIONS:MUSCLE offers a range of options that provide improved speed and / or alignment accuracy compared with currently available programs. MUSCLE is freely available at http://www.drive5.com/muscle.},
Author = {Edgar, Robert C.},
Date-Added = {2009-04-28 11:57:31 -0400},
Date-Modified = {2009-05-18 21:26:28 -0400},
Doi = {10.1186/1471-2105-5-113},
Issn = {1471-2105},
Journal = {BMC Bioinformatics},
Number = {1},
Pages = {113},
Pubmedid = {15318951},
Title = {{MUSCLE}: a multiple sequence alignment method with reduced time and space complexity},
Volume = {5},
Year = {2004},
Bdsk-Url-1 = {http://www.biomedcentral.com/1471-2105/5/113},
Bdsk-Url-2 = {http://dx.doi.org/10.1186/1471-2105-5-113}}
@article{Edgar:2004sf,
Abstract = {We describe MUSCLE, a new computer program for creating multiple alignments of protein sequences. Elements of the algorithm include fast distance estimation using kmer counting, progressive alignment using a new profile function we call the log-expectation score, and refinement using tree-dependent restricted partitioning. The speed and accuracy of MUSCLE are compared with T-Coffee, MAFFT and CLUSTALW on four test sets of reference alignments: BAliBASE, SABmark, SMART and a new benchmark, PREFAB. MUSCLE achieves the highest, or joint highest, rank in accuracy on each of these sets. Without refinement, MUSCLE achieves average accuracy statistically indistinguishable from T-Coffee and MAFFT, and is the fastest of the tested methods for large numbers of sequences, aligning 5000 sequences of average length 350 in 7 min on a current desktop computer. The MUSCLE program, source code and PREFAB test data are freely available at http://www.drive5.com/muscle. },
Author = {Edgar, Robert C.},
Date-Added = {2009-04-28 11:57:31 -0400},
Date-Modified = {2009-05-18 21:26:07 -0400},
Doi = {10.1093/nar/gkh340},
Journal = {Nucleic Acids Research},
Journal1 = {Nucl. Acids Res.},
Number = {5},
Pages = {1792--1797},
Title = {{MUSCLE}: multiple sequence alignment with high accuracy and high throughput},
Ty = {JOUR},
Volume = {32},
Year = {2004},
Bdsk-Url-1 = {http://nar.oxfordjournals.org/cgi/content/abstract/32/5/1792}}
@article{notredame:2000,
Author = {Notredame, C. and Higgins, D. G. and Heringa, J.},
Date-Added = {2009-04-28 11:57:31 -0400},
Date-Modified = {2009-04-28 11:57:31 -0400},
Journal = {Journal of Molecular Biology},
Number = {1},
Pages = {205--217},
Publisher = {Elsevier},
Title = {{T-Coffee}: A novel method for fast and accurate multiple sequence alignment},
Volume = {302},
Year = {2000}}
@article{Lunter:2008fj,
Abstract = {Sequence alignment underpins all of comparative genomics, yet it remains an incompletely solved problem. In particular, the statistical uncertainty within inferred alignments is often disregarded, while parametric or phylogenetic inferences are considered meaningless without confidence estimates. Here, we report on a theoretical and simulation study of pairwise alignments of genomic DNA at human--mouse divergence. We find that >15{\%} of aligned bases are incorrect in existing whole-genome alignments, and we identify three types of alignment error, each leading to systematic biases in all algorithms considered. Careful modeling of the evolutionary process improves alignment quality; however, these improvements are modest compared with the remaining alignment errors, even with exact knowledge of the evolutionary model, emphasizing the need for statistical approaches to account for uncertainty. We develop a new algorithm, Marginalized Posterior Decoding (MPD), which explicitly accounts for uncertainties, is less biased and more accurate than other algorithms we consider, and reduces the proportion of misaligned bases by a third compared with the best existing algorithm. To our knowledge, this is the first nonheuristic algorithm for DNA sequence alignment to show robust improvements over the classic Needleman--Wunsch algorithm. Despite this, considerable uncertainty remains even in the improved alignments. We conclude that a probabilistic treatment is essential, both to improve alignment quality and to quantify the remaining uncertainty. This is becoming increasingly relevant with the growing appreciation of the importance of noncoding DNA, whose study relies heavily on alignments. Alignment errors are inevitable, and should be considered when drawing conclusions from alignments. Software and alignments to assist researchers in doing this are provided at http://genserv.anat.ox.ac.uk/grape/. },
Author = {Lunter, Gerton and Rocco, Andrea and Mimouni, Naila and Heger, Andreas and Caldeira, Alexandre and Hein, Jotun},
Date-Added = {2009-04-28 11:57:31 -0400},
Date-Modified = {2009-04-28 11:57:31 -0400},
Doi = {10.1101/gr.6725608},
Journal = {Genome Research},
Journal1 = {Genome Res.},
Number = {2},
Pages = {298--309},
Title = {Uncertainty in homology inferences: Assessing and improving genomic sequence alignment},
Ty = {JOUR},
Volume = {18},
Year = {2008},
Bdsk-Url-1 = {http://www.genome.org/cgi/content/abstract/18/2/298}}
@article{iupaciub:1983,
Author = {{IUPAC-IUB}},
Date-Added = {2009-04-28 10:29:59 -0400},
Date-Modified = {2009-04-28 10:29:59 -0400},
Journal = {Eur. J. Biochem.},
Pages = {9--15},
Title = {{IUPAC-IUB, Joint Commission on Biochemical Nomenclature}},
Volume = {131},
Year = {1983}}
@article{altschul:1997,
Author = {Altschul, S. F. and Madden, T. L. and Sch{\"a}ffer, A. A. and Zhang, J. and Zhang, Z. and Miller, W. and Lipman, D. J.},
Date-Added = {2009-04-27 17:33:50 -0400},
Date-Modified = {2009-04-27 17:33:50 -0400},
Journal = {Nucleic Acids Research},
Number = {17},
Pages = {3389--3402},
Publisher = {Oxford Univ Press},
Title = {Gapped {BLAST} and {PSI-BLAST}: a new generation of protein database search programs},
Volume = {25},
Year = {1997}}
@unpublished{Crossmatch,
Author = {Green, P.},
Title = {{Crossmatch}},
Note = {At http://bozeman.mbt.washington.edu/phrap.docs/swat.html},
Year = {1994},
Date-Added = {2009-04-27 17:29:19 -0400},
Date-Modified = {2009-05-18 21:30:45 -0400}}
@unpublished{WU-BLAST,
Author = {Gish, W.},
Date-Added = {2009-04-27 17:25:37 -0400},
Date-Modified = {2009-05-18 21:14:27 -0400},
Note = {http://blast.wustl.edu},
Title = {{WU-BLAST}},