-
Notifications
You must be signed in to change notification settings - Fork 0
/
bibtex.bib
714 lines (684 loc) · 31.6 KB
/
bibtex.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
@ARTICLE{Kim2013-vg,
title = {{TopHat2}: accurate alignment of transcriptomes in the
presence of insertions, deletions and gene fusions},
author = "Kim, Daehwan and Pertea, Geo and Trapnell, Cole and Pimentel,
Harold and Kelley, Ryan and Salzberg, Steven L",
affiliation = "Center for Bioinformatics and Computational Biology,
University of Maryland, College Park, MD, 20742, USA.
journal = "Genome Biol.",
volume = 14,
number = 4,
pages = "R36",
month = "25~" # apr,
year = 2013,
url = "http://dx.doi.org/10.1186/gb-2013-14-4-r36",
issn = "1465-6906",
pmid = "23618408",
doi = "10.1186/gb-2013-14-4-r36"
}
@ARTICLE{Langmead2012-bs,
title = {Fast gapped-read alignment with Bowtie 2},
author = "Langmead, Ben and Salzberg, Steven L",
journal = "Nat. Methods",
publisher = "Nature Publishing Group",
volume = 9,
number = 4,
pages = "357--359",
month = apr,
year = 2012,
url = "http://dx.doi.org/10.1038/nmeth.1923",
issn = "1548-7091",
pmid = "22388286",
doi = "10.1038/nmeth.1923"
}
@ARTICLE{Howard2013-fq,
title = {High-throughput {RNA} sequencing of pseudomonas-infected
Arabidopsis reveals hidden transcriptome complexity and novel
splice variants},
author = "Howard, Brian E and Hu, Qiwen and Babaoglu, Ahmet Can and
Chandra, Manan and Borghi, Monica and Tan, Xiaoping and He,
Luyan and Winter-Sederoff, Heike and Gassmann, Walter and
Veronese, Paola and Heber, Steffen",
affiliation = "Department of Computer Science, North Carolina State
University, Raleigh, North Carolina, United States of America.",
journal = "PLoS One",
volume = 8,
number = 10,
pages = "e74183",
month = "1~" # oct,
year = 2013,
url = "http://dx.doi.org/10.1371/journal.pone.0074183",
issn = "1932-6203",
pmid = "24098335",
doi = "10.1371/journal.pone.0074183",
pmc = "PMC3788074"
}
@ARTICLE{Li2009-oc,
title = {Fast and accurate short read alignment with {Burrows-Wheeler}
transform},
author = "Li, H and Durbin, R",
journal = "Bioinformatics",
volume = 25,
number = 14,
pages = "1754--1760",
month = jul,
year = 2009,
url = "http://dx.doi.org/10.1093/bioinformatics/btp324",
issn = "1367-4803",
pmid = "19451168",
doi = "10.1093/bioinformatics/btp324"
}
@ARTICLE{Li2013-oy,
title = "Aligning sequence reads, clone sequences and assembly
contigs with {BWA-MEM}",
author = "Li, Heng",
abstract = "Summary: BWA-MEM is a new alignment algorithm for aligning
sequence reads or long query sequences against a large
reference genome such as human. It automatically chooses
between local and end-to-end alignments, supports paired-end
reads and performs chimeric alignment. The algorithm is
robust to sequencing errors and applicable to a wide range
of sequence lengths from 70bp to a few megabases. For
mapping 100bp sequences, BWA-MEM shows better performance
than several state-of-art read aligners to date.
Availability and implementation: BWA-MEM is implemented as a
component of BWA, which is available at
http://github.com/lh3/bwa. Contact:
journal = "arXiv [q-bio.GN]",
month = mar,
year = 2013,
url = "http://arxiv.org/abs/1303.3997",
archivePrefix = "arXiv",
primaryClass = "q-bio.GN",
eprint = "1303.3997"
}
@ARTICLE{Liao2013-bn,
title = {The Subread aligner: fast, accurate and scalable read mapping
by seed-and-vote},
author = "Liao, Yang and Smyth, Gordon K and Shi, Wei",
affiliation = "Division of Bioinformatics, The Walter and Eliza Hall
Institute of Medical Research, 1G Royal Parade, Parkville,
Victoria 3052, Australia.",
journal = "Nucleic Acids Res.",
volume = 41,
number = 10,
pages = "e108",
month = "4~" # apr,
year = 2013,
url = "http://dx.doi.org/10.1093/nar/gkt214",
issn = "0305-1048",
pmid = "23558742",
doi = "10.1093/nar/gkt214",
pmc = "PMC3664803"
}
@MISC{Girke2014-oy,
title = {{systemPipeR}: {NGS} workflow and report generation
environment},
author = "Girke, Thomas",
institution = "UC Riverside",
month = "28~" # jun,
year = 2014,
url = "https://github.com/tgirke/systemPipeR"
}
@ARTICLE{Lawrence2013-kt,
title = {Software for computing and annotating genomic ranges},
author = "Lawrence, Michael and Huber, Wolfgang and Pag\`{e}s, Herv\'{e}
and Aboyoun, Patrick and Carlson, Marc and Gentleman, Robert
and Morgan, Martin T and Carey, Vincent J",
affiliation = "Bioinformatics and Computational Biology, Genentech, Inc.,
South San Francisco, California, United States of America.
journal = "PLoS Comput. Biol.",
volume = 9,
number = 8,
pages = "e1003118",
month = "8~" # aug,
year = 2013,
url = "http://dx.doi.org/10.1371/journal.pcbi.1003118",
issn = "1553-734X",
pmid = "23950696",
doi = "10.1371/journal.pcbi.1003118",
pmc = "PMC3738458"
}
@ARTICLE{Robinson2010-uk,
title = {edgeR: a Bioconductor package for differential expression analysis
of digital gene expression data},
author = "Robinson, M D and McCarthy, D J and Smyth, G K",
journal = "Bioinformatics",
volume = 26,
number = 1,
pages = "139--140",
month = jan,
year = 2010,
url = "http://dx.doi.org/10.1093/bioinformatics/btp616",
issn = "1367-4803",
pmid = "19910308",
doi = "10.1093/bioinformatics/btp616"
}
@ARTICLE{Love2014-sh,
title = {Moderated estimation of fold change and dispersion for {RNA-seq}
data with {DESeq2}},
author = "Love, Michael and Huber, Wolfgang and Anders, Simon",
journal = "Genome Biol.",
volume = 15,
number = 12,
pages = "550",
year = 2014,
url = "http://genomebiology.com/2014/15/12/550",
issn = "1465-6906",
doi = "10.1186/s13059-014-0550-8"
}
@ARTICLE{McKenna2010-ql,
title = {The Genome Analysis Toolkit: a {MapReduce} framework for
analyzing next-generation {DNA} sequencing data},
author = "McKenna, Aaron and Hanna, Matthew and Banks, Eric and
Sivachenko, Andrey and Cibulskis, Kristian and Kernytsky,
Andrew and Garimella, Kiran and Altshuler, David and Gabriel,
Stacey and Daly, Mark and DePristo, Mark A",
affiliation = "Program in Medical and Population Genetics, The Broad
Institute of Harvard and MIT, Cambridge, Massachusetts 02142,
USA.",
journal = "Genome Res.",
volume = 20,
number = 9,
pages = "1297--1303",
month = "19~" # jul,
year = 2010,
url = "http://dx.doi.org/10.1101/gr.107524.110",
issn = "1088-9051",
pmid = "20644199",
doi = "10.1101/gr.107524.110",
pmc = "PMC2928508"
}
@ARTICLE{Li2011-ll,
title = {A statistical framework for {SNP} calling, mutation discovery,
association mapping and population genetical parameter estimation
from sequencing data},
author = "Li, Heng",
journal = "Bioinformatics",
volume = 27,
number = 21,
pages = "2987--2993",
month = "1~" # nov,
year = 2011,
url = "http://bioinformatics.oxfordjournals.org/content/27/21/2987.abstract",
issn = "1367-4803",
doi = "10.1093/bioinformatics/btr509"
}
@ARTICLE{Wu2010-iq,
title = {Fast and {SNP-tolerant} detection of complex variants and splicing
in short reads},
author = "Wu, T D and Nacu, S",
journal = "Bioinformatics",
volume = 26,
number = 7,
pages = "873--881",
month = apr,
year = 2010,
url = "http://dx.doi.org/10.1093/bioinformatics/btq057",
issn = "1367-4803",
pmid = "20147302",
doi = "10.1093/bioinformatics/btq057"
}
@ARTICLE{Zhang2008-pc,
title = {Model-based analysis of {ChIP-Seq} ({MACS})},
author = "Zhang, Y and Liu, T and Meyer, C A and Eeckhoute, J and Johnson, D
S and Bernstein, B E and Nussbaum, C and Myers, R M and Brown, M
and Li, W and Liu, X S",
journal = "Genome Biol.",
volume = 9,
number = 9,
year = 2008,
url = "http://dx.doi.org/10.1186/gb-2008-9-9-r137",
issn = "1465-6906",
pmid = "18798982",
doi = "10.1186/gb-2008-9-9-r137"
}
@ARTICLE{Yu2015-xu,
title = {{ChIPseeker}: an {R/Bioconductor} package for {ChIP} peak
annotation, comparison and visualization},
author = "Yu, Guangchuang and Wang, Li-Gen and He, Qing-Yu",
affiliation = "Key Laboratory of Functional Protein Research of Guangdong
Higher Education Institutes, College of Life Science and
Technology, Jinan University, Guangzhou 510632, China, State
Key Laboratory of Emerging Infectious Diseases, School of
Public Health, The University of Hong Kong, Hong Kong SAR,
China and. Guangdong Information Center, Guangzhou 510031,
China. Key Laboratory of Functional Protein Research of
Guangdong Higher Education Institutes, College of Life Science
and Technology, Jinan University, Guangzhou 510632, China.",
journal = "Bioinformatics",
volume = 31,
number = 14,
pages = "2382--2383",
month = "15~" # jul,
year = 2015,
url = "http://dx.doi.org/10.1093/bioinformatics/btv145",
issn = "1367-4803, 1367-4811",
pmid = "25765347",
doi = "10.1093/bioinformatics/btv145"
}
@ARTICLE{Zhu2010-zo,
title = {{ChIPpeakAnno}: a Bioconductor package to annotate {ChIP-seq}
and {ChIP-chip} data},
author = "Zhu, Lihua J and Gazin, Claude and Lawson, Nathan D and
Pag\`{e}s, Herv\'{e} and Lin, Simon M and Lapointe, David S
and Green, Michael R",
affiliation = "Program in Gene Function and Expression, University of
Massachusetts Medical School, Worcester, Massachusetts 01605,
USA. [email protected]",
journal = "BMC Bioinformatics",
volume = 11,
pages = "237",
month = "11~" # may,
year = 2010,
url = "http://dx.doi.org/10.1186/1471-2105-11-237",
issn = "1471-2105",
pmid = "20459804",
doi = "10.1186/1471-2105-11-237",
pmc = "PMC3098059"
}
@ARTICLE{Juntawong2014-ny,
title = {Translational dynamics revealed by genome-wide profiling of
ribosome footprints in Arabidopsis},
author = "Juntawong, Piyada and Girke, Thomas and Bazin, J\'{e}r\'{e}mie
and Bailey-Serres, Julia",
affiliation = "Center for Plant Cell Biology and Department of Botany and
Plant Sciences, University of California, Riverside, CA 92521.",
journal = "Proc. Natl. Acad. Sci. U. S. A.",
volume = 111,
number = 1,
pages = "E203--12",
month = "7~" # jan,
year = 2014,
url = "http://dx.doi.org/10.1073/pnas.1317811111",
annote = "PMID: 24367078",
keywords = "alternative splicing; long intergenic noncoding RNA; ribosome
profiling; translational efficiency; uORF",
issn = "0027-8424, 1091-6490",
pmid = "24367078",
doi = "10.1073/pnas.1317811111",
pmc = "PMC3890782"
}
@ARTICLE{Ingolia2009-cb,
title = {Genome-wide analysis in vivo of translation with nucleotide
resolution using ribosome profiling},
author = "Ingolia, N T and Ghaemmaghami, S and Newman, J R and Weissman, J S",
journal = "Science",
volume = 324,
number = 5924,
pages = "218--223",
month = apr,
year = 2009,
url = "http://dx.doi.org/10.1016/j.ymeth.2009.03.016",
issn = "0036-8075",
pmid = "19213877",
doi = "10.1016/j.ymeth.2009.03.016"
}
@ARTICLE{Aspden2014-uu,
title = {Extensive translation of small Open Reading Frames revealed by
{Poly-Ribo-Seq}},
author = "Aspden, Julie L and Eyre-Walker, Ying Chen and Phillips, Rose
J and Amin, Unum and Mumtaz, Muhammad Ali S and Brocard,
Michele and Couso, Juan-Pablo",
affiliation = "School of Life Sciences, University of Sussex, Brighton,
United Kingdom. School of Life Sciences, University of Sussex,
Brighton, United Kingdom. School of Life Sciences, University
of Sussex, Brighton, United Kingdom. School of Life Sciences,
University of Sussex, Brighton, United Kingdom. School of Life
Sciences, University of Sussex, Brighton, United Kingdom.
School of Life Sciences, University of Sussex, Brighton,
United Kingdom. School of Life Sciences, University of Sussex,
Brighton, United Kingdom.",
journal = "Elife",
volume = 3,
pages = "e03528",
month = "21~" # aug,
year = 2014,
url = "http://dx.doi.org/10.7554/eLife.03528",
keywords = "biochemistry; d. melanogaster; evolutionary biology; genomics;
non-coding RNAs; small open reading Frames; transmembrane
peptides",
issn = "2050-084X",
pmid = "25144939",
doi = "10.7554/eLife.03528",
pmc = "PMC4359375"
}
@ARTICLE{Ingolia2011-fc,
title = {Ribosome profiling of mouse embryonic stem cells reveals the
complexity and dynamics of mammalian proteomes},
author = "Ingolia, N T and Lareau, L F and Weissman, J S",
journal = "Cell",
volume = 147,
number = 4,
pages = "789--802",
month = "11~" # nov,
year = 2011,
url = "http://www.ncbi.nlm.nih.gov/pubmed/22056041",
issn = "0092-8674, 1097-4172;0092-8674",
pmid = "22056041",
doi = "10.1016/j.cell.2011.10.002"
}
@ARTICLE{Juntawong2015-ru,
title = {Ribosome profiling: a tool for quantitative evaluation of
dynamics in {mRNA} translation},
author = "Juntawong, Piyada and Hummel, Maureen and Bazin, Jeremie and
Bailey-Serres, Julia",
affiliation = "Center for Plant Cell Biology and Department of Botany and
Plant Sciences, University of California, Riverside, CA,
92521, USA.",
journal = "Methods Mol. Biol.",
volume = 1284,
pages = "139--173",
year = 2015,
url = "http://dx.doi.org/10.1007/978-1-4939-2444-8_7",
issn = "1064-3745, 1940-6029",
pmid = "25757771",
doi = "10.1007/978-1-4939-2444-8\_7"
}
@ARTICLE{H_Backman2016-bt,
title = "{systemPipeR: NGS workflow and report generation environment}",
author = "H Backman, Tyler W and Girke, Thomas",
affiliation = "Institute for Integrative Genome Biology, University of
California, Riverside, 1207F Genomics Building, 3401 Watkins
Drive, Riverside, 92521, CA, USA. Institute for Integrative
Genome Biology, University of California, Riverside, 1207F
Genomics Building, 3401 Watkins Drive, Riverside, 92521, CA,
USA. [email protected].",
journal = "BMC Bioinformatics",
volume = 17,
number = 1,
pages = "388",
month = "20~" # sep,
year = 2016,
url = "http://dx.doi.org/10.1186/s12859-016-1241-0",
keywords = "Analysis workflow; ChIP-Seq; Next Generation Sequencing (NGS);
RNA-Seq; Ribo-Seq; VAR-Seq",
language = "en",
issn = "1471-2105",
pmid = "27650223",
doi = "10.1186/s12859-016-1241-0",
pmc = "PMC5029110"
}
@ARTICLE{Kim2015-ve,
title = "{HISAT}: a fast spliced aligner with low memory requirements",
author = "Kim, Daehwan and Langmead, Ben and Salzberg, Steven L",
abstract = "HISAT (hierarchical indexing for spliced alignment of
transcripts) is a highly efficient system for aligning reads from
RNA sequencing experiments. HISAT uses an indexing scheme based
on the Burrows-Wheeler transform and the Ferragina-Manzini (FM)
index, employing two types of indexes for alignment: a
whole-genome FM index to anchor each alignment and numerous local
FM indexes for very rapid extensions of these alignments. HISAT's
hierarchical index for the human genome contains 48,000 local FM
indexes, each representing a genomic region of ∼64,000 bp. Tests
on real and simulated data sets showed that HISAT is the fastest
system currently available, with equal or better accuracy than
any other method. Despite its large number of indexes, HISAT
requires only 4.3 gigabytes of memory. HISAT supports genomes of
any size, including those larger than 4 billion bases.",
journal = "Nat. Methods",
volume = 12,
number = 4,
pages = "357--360",
month = apr,
year = 2015,
language = "en"
}
@Manual{Rsamtools,
title = {Rsamtools: Binary alignment (BAM), FASTA, variant call (BCF), and tabix
file import},
author = {Martin Morgan and Herv\'e Pag\`es and Valerie Obenchain and Nathaniel Hayden},
year = {2019},
note = {R package version 2.0.0},
url = {http://bioconductor.org/packages/Rsamtools},
}
@ARTICLE{Anders2010-tp,
title = "Differential expression analysis for sequence count data",
author = "Anders, Simon and Huber, Wolfgang",
abstract = "High-throughput sequencing assays such as RNA-Seq, ChIP-Seq or
barcode counting provide quantitative readouts in the form of
count data. To infer differential signal in such data correctly
and with good statistical power, estimation of data variability
throughout the dynamic range and a suitable error model are
required. We propose a method based on the negative binomial
distribution, with variance and mean linked by local regression
and present an implementation, DESeq, as an R/Bioconductor
package.",
journal = "Genome Biol.",
volume = 11,
number = 10,
pages = "R106",
month = oct,
year = 2010,
language = "en"
}
@ARTICLE{Martin2011-bh,
title = "Cutadapt removes adapter sequences from high-throughput
sequencing reads",
author = "Martin, Marcel",
abstract = "When small RNA is sequenced on current sequencing machines, the
resulting reads are usually longer than the RNA and therefore
contain parts of the 3' adapter. That adapter must be found and
removed error-tolerantly from each read before read mapping.
Previous solutions are either hard to use or do not offer
required features, in particular support for color space data. As
an easy to use alternative, we developed the command-line tool
cutadapt, which supports 454, Illumina and SOLiD (color space)
data, offers two adapter trimming algorithms, and has other
useful features. Cutadapt, including its MIT-licensed source
code, is available for download at
http://code.google.com/p/cutadapt/",
journal = "EMBnet.journal",
volume = 17,
number = 1,
pages = "10--12",
month = may,
year = 2011,
keywords = "next generation sequencing; small RNA; microRNA; adapter removal",
language = "en"
}
@ARTICLE{Bolger2014-yr,
title = "Trimmomatic: a flexible trimmer for Illumina sequence data",
author = "Bolger, Anthony M and Lohse, Marc and Usadel, Bjoern",
abstract = "MOTIVATION: Although many next-generation sequencing (NGS) read
preprocessing tools already existed, we could not find any tool
or combination of tools that met our requirements in terms of
flexibility, correct handling of paired-end data and high
performance. We have developed Trimmomatic as a more flexible and
efficient preprocessing tool, which could correctly handle
paired-end data. RESULTS: The value of NGS read preprocessing is
demonstrated for both reference-based and reference-free tasks.
Trimmomatic is shown to produce output that is at least
competitive with, and in many cases superior to, that produced by
other tools, in all scenarios tested. AVAILABILITY AND
IMPLEMENTATION: Trimmomatic is licensed under GPL V3. It is
cross-platform (Java 1.5+ required) and available at
http://www.usadellab.org/cms/index.php?page=trimmomatic CONTACT:
[email protected] SUPPLEMENTARY INFORMATION:
Supplementary data are available at Bioinformatics online.",
journal = "Bioinformatics",
volume = 30,
number = 15,
pages = "2114--2120",
month = aug,
year = 2014,
language = "en"
}
% The entry below contains non-ASCII chars that could not be converted
% to a LaTeX equivalent.
@ARTICLE{Ziemann2016-mp,
title = "Evaluation of {microRNA} alignment techniques",
author = "Ziemann, Mark and Kaspi, Antony and El-Osta, Assam",
abstract = "Genomic alignment of small RNA (smRNA) sequences such as
microRNAs poses considerable challenges due to their short length
(∼21 nucleotides [nt]) as well as the large size and complexity
of plant and animal genomes. While several tools have been
developed for high-throughput mapping of longer mRNA-seq reads
(>30 nt), there are few that are specifically designed for
mapping of smRNA reads including microRNAs. The accuracy of these
mappers has not been systematically determined in the case of
smRNA-seq. In addition, it is unknown whether these aligners
accurately map smRNA reads containing sequence errors and
polymorphisms. By using simulated read sets, we determine the
alignment sensitivity and accuracy of 16 short-read mappers and
quantify their robustness to mismatches, indels, and nontemplated
nucleotide additions. These were explored in the context of a
plant genome (Oryza sativa, ∼500 Mbp) and a mammalian genome
(Homo sapiens, ∼3.1 Gbp). Analysis of simulated and real
smRNA-seq data demonstrates that mapper selection impacts
differential expression results and interpretation. These results
will inform on best practice for smRNA mapping and enable more
accurate smRNA detection and quantification of expression and RNA
editing.",
journal = "RNA",
volume = 22,
number = 8,
pages = "1120--1138",
month = aug,
year = 2016,
keywords = "gene expression; microRNA; next-generation sequencing; short-read
aligners; small RNA sequencing",
language = "en"
}
@ARTICLE{Li2009-ys,
title = "Fast and accurate short read alignment with {Burrows-Wheeler}
transform",
author = "Li, Heng and Durbin, Richard",
abstract = "MOTIVATION: The enormous amount of short reads generated by the
new DNA sequencing technologies call for the development of fast
and accurate read alignment programs. A first generation of hash
table-based methods has been developed, including MAQ, which is
accurate, feature rich and fast enough to align short reads from
a single individual. However, MAQ does not support gapped
alignment for single-end reads, which makes it unsuitable for
alignment of longer reads where indels may occur frequently. The
speed of MAQ is also a concern when the alignment is scaled up to
the resequencing of hundreds of individuals. RESULTS: We
implemented Burrows-Wheeler Alignment tool (BWA), a new read
alignment package that is based on backward search with
Burrows-Wheeler Transform (BWT), to efficiently align short
sequencing reads against a large reference sequence such as the
human genome, allowing mismatches and gaps. BWA supports both
base space reads, e.g. from Illumina sequencing machines, and
color space reads from AB SOLiD machines. Evaluations on both
simulated and real data suggest that BWA is approximately 10-20x
faster than MAQ, while achieving similar accuracy. In addition,
BWA outputs alignment in the new standard SAM (Sequence
Alignment/Map) format. Variant calling and other downstream
analyses after the alignment can be achieved with the open source
SAMtools software package. AVAILABILITY:
http://maq.sourceforge.net.",
journal = "Bioinformatics",
volume = 25,
number = 14,
pages = "1754--1760",
month = jul,
year = 2009,
language = "en"
}
@ARTICLE{Tam2015-gb,
title = "Optimization of {miRNA-seq} data preprocessing",
author = "Tam, Shirley and Tsao, Ming-Sound and McPherson, John D",
abstract = "The past two decades of microRNA (miRNA) research has solidified
the role of these small non-coding RNAs as key regulators of many
biological processes and promising biomarkers for disease. The
concurrent development in high-throughput profiling technology
has further advanced our understanding of the impact of their
dysregulation on a global scale. Currently, next-generation
sequencing is the platform of choice for the discovery and
quantification of miRNAs. Despite this, there is no clear
consensus on how the data should be preprocessed before
conducting downstream analyses. Often overlooked, data
preprocessing is an essential step in data analysis: the presence
of unreliable features and noise can affect the conclusions drawn
from downstream analyses. Using a spike-in dilution study, we
evaluated the effects of several general-purpose aligners (BWA,
Bowtie, Bowtie 2 and Novoalign), and normalization methods
(counts-per-million, total count scaling, upper quartile scaling,
Trimmed Mean of M, DESeq, linear regression, cyclic loess and
quantile) with respect to the final miRNA count data
distribution, variance, bias and accuracy of differential
expression analysis. We make practical recommendations on the
optimal preprocessing methods for the extraction and
interpretation of miRNA count data from small RNA-sequencing
experiments.",
journal = "Brief. Bioinform.",
volume = 16,
number = 6,
pages = "950--963",
month = nov,
year = 2015,
keywords = "data preprocessing; miRNA sequencing; miRNA-seq normalization;
small RNA sequence alignment",
language = "en"
}
@ARTICLE{Aparicio-Puerta2019-fa,
title = "{sRNAbench} and {sRNAtoolbox} 2019: intuitive fast small {RNA}
profiling and differential expression",
author = "Aparicio-Puerta, Ernesto and Lebr{\'o}n, Ricardo and Rueda,
Antonio and G{\'o}mez-Mart{\'\i}n, Cristina and Giannoukakos,
Stavros and Jaspez, David and Medina, Jos{\'e} Mar{\'\i}a and
Zubkovic, Andreja and Jurak, Igor and Fromm, Bastian and Marchal,
Juan Antonio and Oliver, Jos{\'e} and Hackenberg, Michael",
abstract = "Since the original publication of sRNAtoolbox in 2015, small RNA
research experienced notable advances in different directions.
New protocols for small RNA sequencing have become available to
address important issues such as adapter ligation bias, PCR
amplification artefacts or to include internal controls such as
spike-in sequences. New microRNA reference databases were
developed with different foci, either prioritizing accuracy (low
number of false positives) or completeness (low number of false
negatives). Additionally, other small RNA molecules as well as
microRNA sequence and length variants (isomiRs) have continued to
gain importance. Finally, the number of microRNA sequencing
studies deposited in GEO nearly triplicated from 2014 (280) to
2018 (764). These developments imply that fast and easy-to-use
tools for expression profiling and subsequent downstream analysis
of miRNA-seq data are essential to many researchers. Key features
in this sRNAtoolbox release include addition of all major RNA
library preparation protocols to sRNAbench and improvements in
sRNAde, a tool that summarizes several aspects of small RNA
sequencing studies including the detection of consensus
differential expression. A special emphasis was put on the
user-friendliness of the tools, for instance sRNAbench now
supports parallel launching of several jobs to improve
reproducibility and user time efficiency.",
journal = "Nucleic Acids Res.",
volume = 47,
number = "W1",
pages = "W530--W535",
month = jul,
year = 2019,
language = "en"
}
@ARTICLE{Buenrostro2013-ap,
title = "Transposition of native chromatin for fast and sensitive
epigenomic profiling of open chromatin, {DNA-binding} proteins
and nucleosome position",
author = "Buenrostro, Jason D and Giresi, Paul G and Zaba, Lisa C and
Chang, Howard Y and Greenleaf, William J",
abstract = "We describe an assay for transposase-accessible chromatin using
sequencing (ATAC-seq), based on direct in vitro transposition of
sequencing adaptors into native chromatin, as a rapid and
sensitive method for integrative epigenomic analysis. ATAC-seq
captures open chromatin sites using a simple two-step protocol
with 500-50,000 cells and reveals the interplay between genomic
locations of open chromatin, DNA-binding proteins, individual
nucleosomes and chromatin compaction at nucleotide resolution. We
discovered classes of DNA-binding factors that strictly avoided,
could tolerate or tended to overlap with nucleosomes. Using
ATAC-seq maps of human CD4(+) T cells from a proband obtained on
consecutive days, we demonstrated the feasibility of analyzing an
individual's epigenome on a timescale compatible with clinical
decision-making.",
journal = "Nat. Methods",
volume = 10,
number = 12,
pages = "1213--1218",
month = dec,
year = 2013,
language = "en"
}