% data_management_guidance.bib
% Bibliography database using biblatex/Biber field names (date, journaltitle, langid, urldate).
% Zenodo record. The bare DOI is stored in `doi`; `url` is kept for styles that only print URLs.
% NOTE(review): fourth author's given name corrected to "Fantin" -- confirm against the Zenodo record.
@misc{blumerEPFLLibraryResearch2019,
  author    = {Blumer, Eliane Ninfa and Chaptinel, Jérôme Julien and Masson, Antoine and Reichler, Fantin and Samath, Sitthida},
  title     = {{{EPFL Library Research Data Management Fastguides}}},
  date      = {2019},
  publisher = {{Zenodo}},
  doi       = {10.5281/zenodo.3327830},
  url       = {https://doi.org/10.5281/zenodo.3327830},
  langid    = {english},
}
@article{borerSimpleGuidelinesEffective2009,
  author       = {Borer, Elizabeth T. and Seabloom, Eric W. and Jones, Matthew B. and Schildhauer, Mark},
  title        = {Some {{Simple Guidelines}} for {{Effective Data Management}}},
  date         = {2009-04},
  journaltitle = {Bulletin of the Ecological Society of America},
  shortjournal = {Bulletin of the Ecological Society of America},
  volume       = {90},
  number       = {2},
  pages        = {205--214},
  issn         = {0012-9623},
  doi          = {10.1890/0012-9623-90.2.205},
  url          = {http://doi.wiley.com/10.1890/0012-9623-90.2.205},
  urldate      = {2020-08-05},
  langid       = {english},
  file         = {/home/jen/papers/Borer_et_al-2009-The_Bulletin_of_the_Ecological_Society_of_America.pdf},
}
@online{CFConventionsHome2020,
  title   = {{{CF Conventions Home Page}}},
  date    = {2020},
  url     = {http://cfconventions.org/},
  urldate = {2020-10-19},
  file    = {/home/jen/Zotero/storage/UPX3YS6D/cfconventions.org.html},
}
@online{chanS3KeysAre2020,
  author       = {Chan, Alex W. L.},
  title        = {S3 Keys Are Not File Paths},
  date         = {2020},
  organization = {{alexwlchan}},
  url          = {https://alexwlchan.net/2020/08/s3-keys-are-not-file-paths/},
  urldate      = {2020-09-15},
  langid       = {english},
  abstract     = {Although an S3 key looks a lot like a file path, they aren't always the same, and the distinction can trip you up.},
  file         = {/home/jen/Zotero/storage/6TVAZXXV/s3-keys-are-not-file-paths.html},
}
@online{chanS3PrefixesAre2020,
  author       = {Chan, Alex W. L.},
  title        = {S3 Prefixes Are Not Directories},
  date         = {2020},
  organization = {{alexwlchan}},
  url          = {https://alexwlchan.net/2020/08/s3-prefixes-are-not-directories/},
  urldate      = {2020-09-15},
  langid       = {english},
  abstract     = {Although an S3 prefix looks a lot like a directory path, they aren't the same. Whether or not you include a trailing slash can change the behaviour.},
  file         = {/home/jen/Zotero/storage/SPG3UPDX/s3-prefixes-are-not-directories.html},
}
@article{colavizzaCitationAdvantageLinking2020,
  author       = {Colavizza, Giovanni and Hrynaszkiewicz, Iain and Staden, Isla and Whitaker, Kirstie and McGillivray, Barbara},
  editor       = {Wicherts, Jelte M.},
  title        = {The Citation Advantage of Linking Publications to Research Data},
  date         = {2020-04-22},
  journaltitle = {PLOS ONE},
  shortjournal = {PLoS ONE},
  volume       = {15},
  number       = {4},
  pages        = {e0230416},
  issn         = {1932-6203},
  doi          = {10.1371/journal.pone.0230416},
  url          = {https://dx.plos.org/10.1371/journal.pone.0230416},
  urldate      = {2020-08-05},
  langid       = {english},
  abstract     = {Efforts to make research results open and reproducible are increasingly reflected by journal policies encouraging or mandating authors to provide data availability statements. As a consequence of this, there has been a strong uptake of data availability statements in recent literature. Nevertheless, it is still unclear what proportion of these statements actually contain well-formed links to data, for example via a URL or permanent identifier, and if there is an added value in providing such links. We consider 531, 889 journal articles published by PLOS and BMC, develop an automatic system for labelling their data availability statements according to four categories based on their content and the type of data availability they display, and finally analyze the citation advantage of different statement categories via regression. We find that, following mandated publisher policies, data availability statements become very common. In 2018 93.7\% of 21,793 PLOS articles and 88.2\% of 31,956 BMC articles had data availability statements. Data availability statements containing a link to data in a repository—rather than being available on request or included as supporting information files—are a fraction of the total. In 2017 and 2018, 20.8\% of PLOS publications and 12.2\% of BMC publications provided DAS containing a link to data in a repository. We also find an association between articles that include statements that link to data in a repository and up to 25.36\% (± 1.07\%) higher citation impact on average, using a citation prediction model. We discuss the potential implications of these results for authors (researchers) and journal publishers who make the effort of sharing their data in repositories. All our data and code are made available in order to reproduce and extend our results.},
  file         = {/home/jen/papers/journal.pone.0230416.pdf},
}
% NOTE(review): second author's surname corrected from "Olsen" to "Olson" -- confirm against the article byline.
@article{cookBestPracticesPreparing2001,
  author       = {Cook, Robert B. and Olson, Richard J. and Kanciruk, Paul and Hook, Leslie A.},
  title        = {Best {{Practices}} for {{Preparing Ecological Data Sets}} to {{Share}} and {{Archive}}},
  date         = {2001},
  journaltitle = {Bulletin of the Ecological Society of America},
  volume       = {82},
  number       = {2},
  pages        = {138--141},
  doi          = {10.1890/0012-9623(2001)082[0136:C]2.0.CO;2},
  url          = {https://doi.org/10.1890/0012-9623(2001)082[0136:C]2.0.CO;2},
  langid       = {english},
  file         = {/home/jen/papers/20168543.pdf},
}
@article{coppBarcodesAreUseful2014,
  author       = {Copp, Adam J. and Kennedy, Theodore A. and Muehlbauer, Jeffrey D.},
  title        = {Barcodes {{Are}} a {{Useful Tool}} for {{Labeling}} and {{Tracking Ecological Samples}}},
  date         = {2014-07},
  journaltitle = {Bulletin of the Ecological Society of America},
  shortjournal = {Bulletin of the Ecological Society of America},
  volume       = {95},
  number       = {3},
  pages        = {293--300},
  issn         = {0012-9623},
  doi          = {10.1890/0012-9623-95.3.293},
  url          = {http://doi.wiley.com/10.1890/0012-9623-95.3.293},
  urldate      = {2020-08-05},
  langid       = {english},
  file         = {/home/jen/papers/0012-9623-95.3.293.pdf},
}
@online{craig-woodRclone2014,
  author       = {Craig-Wood, Nick},
  title        = {Rclone},
  date         = {2014/2020},
  organization = {{RCLONE}},
  url          = {https://rclone.org/},
  urldate      = {2020-10-19},
  file         = {/home/jen/Zotero/storage/G3ABGRDI/rclone.org.html},
}
@misc{datacitemetadataworkinggroupDataCiteMetadataSchema2019a,
  author      = {{DataCite Metadata Working Group}},
  editora     = {de Smaele, Madeleine and Dasler, Robin and Ashton, Jan and Roy, Sophie and Fenner, Martin and Jacobson, Mark and Bernal Martínez, Isabel and Burger, Marleen and Yahia, Mohamed and Zolly, Lisa and Habermann, Ted and Raugh, Anne and Ilik, Violeta and La Roi, Andreas},
  editoratype = {collaborator},
  options     = {useprefix=true},
  title       = {{{DataCite Metadata Schema Documentation}} for the {{Publication}} and {{Citation}} of {{Research Data}} v4.3},
  version     = {4.3},
  date        = {2019},
  publisher   = {{DataCite}},
  doi         = {10.14454/7XQ3-ZF69},
  url         = {https://schema.datacite.org/meta/kernel-4.3/},
  urldate     = {2020-10-19},
  langid      = {english},
  file        = {/home/jen/papers/DataCite-MetadataKernel_v4.3.pdf},
}
@online{dataoneDocumentStoreData2019,
  author       = {{DataONE}},
  title        = {Document and Store Data Using Stable File Formats | {{DataONE}}},
  date         = {2019-03},
  organization = {{DataONE}},
  url          = {https://old.dataone.org/best-practices/document-and-store-data-using-stable-file-formats},
  urldate      = {2020-07-24},
  file         = {/home/jen/Zotero/storage/WZCRHUDP/document-and-store-data-using-stable-file-formats.html},
}
@online{downieBitesizedRDMReadme2019,
  author       = {Downie, Alastair},
  title        = {Bite-Sized {{RDM}} \#5 - the Readme File},
  date         = {2019-12-02},
  organization = {{IT and Research Data Management at the Gurdon Institute}},
  url          = {https://gurdoncomputing.blog/2019/12/02/bite-sized-research-data-management-5-the-readme-file},
  urldate      = {2020-02-27},
}
@article{fegrausMaximizingValueEcological2005,
  author       = {Fegraus, Eric H. and Andelman, Sandy and Jones, Matthew B. and Schildhauer, Mark},
  title        = {Maximizing the {{Value}} of {{Ecological Data}} with {{Structured Metadata}}: {{An Introduction}} to {{Ecological Metadata Language}} ({{EML}}) and {{Principles}} for {{Metadata Creation}}},
  shorttitle   = {Maximizing the {{Value}} of {{Ecological Data}} with {{Structured Metadata}}},
  date         = {2005-07},
  journaltitle = {Bulletin of the Ecological Society of America},
  shortjournal = {Bulletin of the Ecological Society of America},
  volume       = {86},
  number       = {3},
  pages        = {158--168},
  issn         = {0012-9623},
  doi          = {10.1890/0012-9623(2005)86[158:MTVOED]2.0.CO;2},
  url          = {http://doi.wiley.com/10.1890/0012-9623(2005)86[158:MTVOED]2.0.CO;2},
  urldate      = {2020-10-19},
  langid       = {english},
  file         = {/home/jen/papers/bullecosociamer.86.3.158.pdf},
}
@online{FrictionlessData2020,
  title        = {Frictionless {{Data}}},
  date         = {2020},
  organization = {{Frictionless Data}},
  url          = {https://frictionlessdata.io/},
  urldate      = {2020-10-19},
  langid       = {american},
  abstract     = {Bringing simplicity and gracefulness to the data experience},
  file         = {/home/jen/Zotero/storage/729V9SRA/frictionlessdata.io.html},
}
@online{githubinc.GitHubWhereWorld2020,
  author  = {{GitHub, Inc.}},
  title   = {{{GitHub}}: {{Where}} the World Builds Software · {{GitHub}}},
  date    = {2020},
  url     = {https://github.com/},
  urldate = {2020-10-19},
  file    = {/home/jen/Zotero/storage/LDRNATGD/github.com.html},
}
@article{grayScientificDataManagement2005a,
  author       = {Gray, Jim and Liu, David T. and Nieto-Santisteban, Maria and Szalay, Alex and DeWitt, David J. and Heber, Gerd},
  title        = {Scientific Data Management in the Coming Decade},
  date         = {2005-12},
  journaltitle = {ACM SIGMOD Record},
  shortjournal = {SIGMOD Rec.},
  volume       = {34},
  number       = {4},
  pages        = {34--41},
  issn         = {0163-5808},
  doi          = {10.1145/1107499.1107503},
  url          = {https://dl.acm.org/doi/10.1145/1107499.1107503},
  urldate      = {2020-10-19},
  langid       = {english},
  file         = {/home/jen/papers/1107499.1107503.pdf},
}
% The place of publication ("Greenbelt, MD") is kept in `location` instead of being
% prefixed to the corporate author, so the author sorts and labels under the body's name.
% The citation key is unchanged so existing \cite commands keep working.
@online{greenbeltmd:earthsciencedataandinformationsystemearthscienceprojectsdivisiongoddardspaceflightcentergsfcnationalaeronauticsandspaceadministrationnasaGlobalChangeMaster2020,
  author   = {{Earth Science Data and Information System, Earth Science Projects Division, Goddard Space Flight Center (GSFC) National Aeronautics and Space Administration (NASA)}},
  title    = {Global {{Change Master Directory}} ({{GCMD}}) {{Keywords}} | {{Earthdata}}},
  date     = {2020},
  location = {{Greenbelt, MD}},
  url      = {https://earthdata.nasa.gov/earth-observation-data/find-data/gcmd/gcmd-keywords/},
  urldate  = {2020-10-19},
  langid   = {english},
  abstract = {GCMD Keywords are a hierarchical set of controlled Earth science vocabularies that ensure Earth science data and services are described in a consistent manner.},
  file     = {/home/jen/Zotero/storage/DIDQF6EX/gcmd-keywords.html},
}
@online{macfarlanePandoc2006,
  author       = {MacFarlane, John},
  title        = {Pandoc},
  date         = {2006/2020},
  organization = {{Pandoc}},
  url          = {https://pandoc.org/MANUAL.html},
  urldate      = {2020-11-04},
}
% Conference metadata uses biblatex's event fields: `venue` is where the meeting was held and
% `eventdate` holds its dates; `location` is reserved for the publisher's city.
% NOTE(review): author's given name expanded from the initial "J" to "John" -- confirm against the paper.
@inproceedings{mccarthyMetadataManagementLarge1982,
  author     = {McCarthy, John L.},
  title      = {Metadata Management for Large Statistical Databases},
  booktitle  = {Proceedings of the {{Eighth International Conference}} on {{Very Large Data Bases}}},
  eventtitle = {Eighth {{International Conference}} on {{Very Large Data Bases}}},
  eventdate  = {1982-09-08/1982-09-10},
  venue      = {{Mexico City, Mexico}},
  date       = {1982-09},
  pages      = {234--243},
  url        = {https://escholarship.org/content/qt5cc031cm/qt5cc031cm.pdf},
  langid     = {english},
  abstract   = {Data description or metadata presents a significant database management challenge, particularly for scientific and statistical databases. Ideally, we would like to access and manipulate data and metadata using the same DBMS tools, but there are few systems that even begin to provide such integrated capabilities. This paper outlines a framework for more integrated metadata management by synthesizing ideas from statistical analysis, bibliographic retrieval; data dictionary, and database management systems. Drawing on experience and examples from a large statistical database project, the paper discusses and analyzes: • general types and uses of data about data • special types of metadata for statistical databases • metadata structure and characteristics • principles and requirements for metadata management},
  file       = {/home/jen/papers/qt5cc031cm.pdf},
}
@article{michenerMetainformationConceptsEcological2005,
  author       = {Michener, William K.},
  title        = {Meta-Information Concepts for Ecological Data Management},
  date         = {2005},
  journaltitle = {Ecological Informatics},
  shortjournal = {Ecological Informatics},
  volume       = {1},
  number       = {1},
  pages        = {3--7},
  issn         = {15749541},
  doi          = {10.1016/j.ecoinf.2005.08.004},
  url          = {https://linkinghub.elsevier.com/retrieve/pii/S157495410500004X},
  urldate      = {2020-10-19},
  langid       = {english},
  abstract     = {Ecological databases continue to grow in volume, breadth and complexity. Higher level descriptions of data (i.e., metadata) and information derived from subsequent data processing and analyses (i.e., “meta-information” in the broadest sense) are essential for understanding and using the increasingly complex and voluminous data and information. The concepts of meta-information, in general, and metadata, in particular, have evolved in concert with the increasing needs for functionality by the community. From a scientific perspective, metadata may be characterized as having developed from initially supporting data discovery; to facilitating acquisition, comprehension and utilization of data by humans; and, most recently, to beginning to enable automated data discovery, ingestion, processing and analysis via metadata-enabled scientific workflow systems. The continued conceptual and operational developments in metadata required to support comprehensive automated scientific workflow systems portend many challenges and opportunities. For example, there are significant opportunities for collaboration among ecologists and computer scientists in developing domain-specific controlled vocabularies and ontologies that provide the basis for semantic mediation—the “glue” technologies that enable automated data discovery, ingestion, processing and analysis. Similarly, there are opportunities for computer scientists and engineers to develop new mechanisms that support automated metadata encoding—such as providing the information that would be necessary to understand the end-to-end flow of sensor data from in situ data collection, streaming through quality assurance filtering, aggregation, transformation and additional processing, analysis, and publication of digital products. 
As the technologies mature, we still have many sociological barriers to overcome including the needs for increased attention to software usability testing and engineering to enhance user-friendliness of metadata management software, new capital investments in ecological data archives, and increasing the metadata management benefit–cost ratio for the average scientist via incentives and enabling tools.},
  file         = {/home/jen/papers/1-s2.0-S157495410500004X-main.pdf},
}
% `pages` holds the article's page range (it starts on p. 330, as encoded in the DOI),
% not the number of pages.
@article{michenerNongeospatialMetadataEcological1997,
  author       = {Michener, William K. and Brunt, James W. and Helly, John J. and Kirchner, Thomas B. and Stafford, Susan G.},
  title        = {Nongeospatial Metadata for the Ecological Sciences},
  date         = {1997},
  journaltitle = {Ecological Applications},
  volume       = {7},
  number       = {1},
  pages        = {330--342},
  doi          = {10.1890/1051-0761(1997)007[0330:NMFTES]2.0.CO;2},
  url          = {https://doi.org/10.1890/1051-0761(1997)007[0330:NMFTES]2.0.CO;2},
  langid       = {english},
  abstract     = {Issues related to data preservation and sharing are receiving increased attention from scientific societies, funding agencies, and the broad scientific community. Ecologists, for example, are increasingly using data collected by other scientists to address questions at broader spatial, temporal, and thematic scales (e.g., global change, biodiversity, sustainability). No data set is perfect and self-explanatory. Ecologists must, therefore, rely upon a set of instructions or documentation to acquire a specific data set, determine its suitability for meeting specific research objectives, and accurately interpret results from subsequent processing, analysis, and modeling.},
  file         = {/home/jen/papers/Michener_etal_1997_EcolApplications.pdf},
}
@article{pengReproducibleResearchComputational2011,
  author       = {Peng, Roger D.},
  title        = {Reproducible {{Research}} in {{Computational Science}}},
  date         = {2011-12-02},
  journaltitle = {Science},
  shortjournal = {Science},
  volume       = {334},
  number       = {6060},
  pages        = {1226--1227},
  issn         = {0036-8075, 1095-9203},
  doi          = {10.1126/science.1213847},
  url          = {https://www.sciencemag.org/lookup/doi/10.1126/science.1213847},
  urldate      = {2020-10-19},
  langid       = {english},
  file         = {/home/jen/papers/1226.full.pdf},
}
% `edition` is an integer so the bibliography style can produce the localized ordinal.
@book{recknagelEcologicalInformatics2018a,
  editor    = {Recknagel, Friedrich and Michener, William K.},
  title     = {Ecological {{Informatics}}},
  date      = {2018},
  edition   = {3},
  publisher = {{Springer International Publishing}},
  location  = {{Cham}},
  doi       = {10.1007/978-3-319-59928-1},
  url       = {http://link.springer.com/10.1007/978-3-319-59928-1},
  urldate   = {2020-10-19},
  isbn      = {978-3-319-59926-7},
  langid    = {english},
  pagetotal = {478},
  file      = {/home/jen/papers/2018_Book_EcologicalInformatics.pdf},
}
@online{SchemaOrg2020,
  title   = {Schema.Org},
  date    = {2020-09-07},
  url     = {https://schema.org/},
  urldate = {2020-10-19},
  file    = {/home/jen/Zotero/storage/I4NL4AIT/schema.org.html},
}
@online{SeaDataNet,
  title        = {{{SeaDataNet}}},
  organization = {{SeaDataNet}},
  url          = {https://www.seadatanet.org/},
  urldate      = {2020-10-19},
  langid       = {british},
  abstract     = {SeaDataNet is a pan-European infrastructure to ease the access to marine data measured by the countries bordering the European seas.},
  file         = {/home/jen/Zotero/storage/BDTYMWXX/www.seadatanet.org.html},
}
% Corporate editors are wrapped in an extra brace pair so each is treated as one
% indivisible name (one of them contains a comma, which would otherwise split it).
% `edition` is an integer so the style can produce the localized ordinal.
@book{smithFieldTrialsHealth2015,
  editor     = {Smith, Peter G. and Morrow, R. H. and Ross, David A. and {International Epidemiological Association} and {Wellcome Trust (London, England)}},
  title      = {Field Trials of Health Interventions: A Toolbox},
  shorttitle = {Field Trials of Health Interventions},
  date       = {2015},
  edition    = {3},
  publisher  = {{Oxford University Press}},
  location   = {{Oxford}},
  isbn       = {978-0-19-873286-0},
  langid     = {english},
  pagetotal  = {444},
  abstract   = {Before new interventions can be used in disease control programmes, it is essential that they are carefully evaluated in "field trials", which may be complex and expensive undertakings. Descriptions of the detailed procedures and methods used in trials that have been conducted in the past have generally not been published. As a consequence, those planning such trials have few guidelines available and little access to previously accumulated knowledge. In this book the practical issues of trial design and conduct are discussed fully and in sufficient detail for the text to be used as a "toolbox" by field investigators. The toolbox has now been extensively tested through use of the first two editions and this third edition is a comprehensive revision, incorporating the many developments that have taken place with respect to trials since 1996 and involving more than 30 contributors. Most of the chapters have been extensively revised and 7 new chapters have been added.},
  keywords   = {methods,Randomized Controlled Trials as Topic,Research Methodology,Socioeconomic Factors,Tropical medicine,Tropical Medicine},
  annotation = {OCLC: ocn925532147},
  file       = {/home/jen/papers/Bookshelf_NBK305515.pdf},
}
@online{stanforduniversitylibrariesBestPracticesFile,
  author       = {{Stanford University Libraries}},
  title        = {Best Practices for File Formats},
  organization = {{Stanford Libraries}},
  url          = {https://library.stanford.edu/research/data-management-services/data-best-practices/best-practices-file-formats},
  urldate      = {2020-07-24},
  langid       = {english},
}
@online{swissdatasciencecenterRenku2018,
  author       = {{Swiss Data Science Center}},
  title        = {Renku},
  date         = {2018-05-23},
  organization = {{SDSC}},
  url          = {https://datascience.ch/renku/},
  urldate      = {2020-10-19},
  langid       = {american},
  file         = {/home/jen/Zotero/storage/TWHZLNIA/renku.html},
}
@online{thelibrariesofthemassachusettsinstituteoftechnologyFileFormatsLongterm,
  author       = {{The libraries of the Massachusetts Institute of Technology}},
  title        = {File Formats for Long-Term Access | {{Data}} Management},
  organization = {{Data management}},
  url          = {https://libraries.mit.edu/data-management/store/formats/},
  urldate      = {2020-07-24},
}
% `organization` carries no trailing period; terminal punctuation is supplied by the style.
% NOTE(review): `date` (2021-09) is later than `urldate` (2020-07-31) -- confirm which one is intended.
@online{theuniversityofedinburghDocumentationMetadataCitation2021,
  author       = {{The University of Edinburgh}},
  title        = {Documentation, Metadata, Citation},
  date         = {2021-09},
  organization = {{MANTRA Research Data Management Training}},
  url          = {https://mantra.edina.ac.uk/documentation_metadata_citation/},
  urldate      = {2020-07-31},
  file         = {/home/jen/Zotero/storage/8328D6XP/documentation_metadata_citation.html},
}
% `organization` carries no trailing period; terminal punctuation is supplied by the style.
% NOTE(review): `date` (2021-09) is later than `urldate` (2020-07-28) -- confirm which one is intended.
@online{theuniversityofedinburghStorageSecurity2021,
  author       = {{The University of Edinburgh}},
  title        = {Storage and Security},
  date         = {2021-09},
  organization = {{MANTRA Research Data Management Training}},
  url          = {https://mantra.edina.ac.uk/storageandsecurity/},
  urldate      = {2020-07-28},
}
@online{wholetaleWholeTale2019,
  author  = {{Wholetale}},
  title   = {The {{Whole Tale}}},
  date    = {2019},
  url     = {https://wholetale.org/},
  urldate = {2020-10-19},
  file    = {/home/jen/Zotero/storage/FJPSX67X/wholetale.org.html},
}
@inreference{wikipediacontributorsChecksum2020,
  author     = {{Wikipedia contributors}},
  title      = {Checksum},
  booktitle  = {Wikipedia, {{The Free Encyclopedia}}},
  date       = {2020-06-16},
  publisher  = {{Wikipedia, The Free Encyclopedia}},
  url        = {https://en.wikipedia.org/w/index.php?title=Checksum&oldid=962858813},
  urldate    = {2020-07-28},
  annotation = {Page Version ID: 962858813},
}
% NOTE(review): `urldate` is set to the date of the pinned revision (oldid 984305279, dated 2020-10-19);
% the previously recorded access date, 2020-07-28, precedes that revision -- confirm.
@inreference{wikipediacontributorsComparisonOnlineBackup2020,
  author     = {{Wikipedia contributors}},
  title      = {Comparison of Online Backup Services},
  booktitle  = {Wikipedia, {{The Free Encyclopedia}}},
  date       = {2020-10-19},
  publisher  = {{Wikipedia, The Free Encyclopedia}},
  url        = {https://en.wikipedia.org/w/index.php?title=Comparison_of_online_backup_services&oldid=984305279},
  urldate    = {2020-10-19},
  langid     = {english},
  annotation = {Page Version ID: 984305279},
  file       = {/home/jen/Zotero/storage/UL29P7K9/index.html},
}
@inreference{wikipediacontributorsMd5sum2020,
  author     = {{Wikipedia contributors}},
  title      = {Md5sum},
  booktitle  = {Wikipedia, {{The Free Encyclopedia}}},
  date       = {2020-06-09},
  publisher  = {{Wikipedia, The Free Encyclopedia}},
  url        = {https://en.wikipedia.org/w/index.php?title=Md5sum&oldid=961659444},
  urldate    = {2020-09-15},
  annotation = {Page Version ID: 961659444},
}
@inreference{wikipediacontributorsSha1sum2020,
  author     = {{Wikipedia contributors}},
  title      = {Sha1sum},
  booktitle  = {Wikipedia, {{The Free Encyclopedia}}},
  date       = {2020-06-30},
  publisher  = {{Wikipedia, The Free Encyclopedia}},
  url        = {https://en.wikipedia.org/w/index.php?title=Sha1sum&oldid=965259914},
  urldate    = {2020-09-15},
  annotation = {Page Version ID: 965259914},
}
@online{zenodoZenodoResearchShared,
  author       = {{Zenodo}},
  title        = {Zenodo - {{Research}}. {{Shared}}.},
  organization = {{Zenodo}},
  url          = {https://zenodo.org/},
  urldate      = {2020-09-15},
}
@article{ziemannGeneNameErrors2016,
  author       = {Ziemann, Mark and Eren, Yotam and El-Osta, Assam},
  title        = {Gene Name Errors Are Widespread in the Scientific Literature},
  date         = {2016-12},
  journaltitle = {Genome Biology},
  shortjournal = {Genome Biol},
  volume       = {17},
  number       = {1},
  pages        = {177},
  issn         = {1474-760X},
  doi          = {10.1186/s13059-016-1044-7},
  url          = {http://genomebiology.biomedcentral.com/articles/10.1186/s13059-016-1044-7},
  urldate      = {2020-09-15},
  langid       = {english},
  abstract     = {The spreadsheet software Microsoft Excel, when used with default settings, is known to convert gene names to dates and floating-point numbers. A programmatic scan of leading genomics journals reveals that approximately one-fifth of papers with supplementary Excel gene lists contain erroneous gene name conversions.},
  file         = {/home/jen/papers/s13059-016-1044-7},
}