% references.bib (BibTeX bibliography database)
  % Private, unpublished dataset of long-form child-centered recordings.
  % Only the place name is brace-protected so styles can still apply their casing.
  @unpublished{solomon-data,
    author = {Walker, Sara and Grosjean, Paulina and Cristia, Alejandrina},
    title  = {Long-form, child-centered audio-recordings collected in the {Solomon Islands} in 2019},
    note   = {unpublished private dataset},
    year   = {2019},
  }
  % Journal article; `pages` holds the article number.
  @article{soderstrom2021developing,
    author    = {Soderstrom, Melanie and Casillas, Marisa and Bergelson, Elika and Rosemberg, Celia and Alam, Florencia and Warlaumont, Anne S and Bunce, John},
    title     = {Developing A Cross-Cultural Annotation System and {MetaCorpus} for Studying Infants' Real World Language Experience},
    journal   = {Collabra: Psychology},
    volume    = {7},
    number    = {1},
    pages     = {23445},
    year      = {2021},
    publisher = {University of California Press},
  }
  % Preprint hosted on PsyArXiv. The first word is braced so its capital survives sentence casing.
  @article{soska2021hyper,
    author  = {Soska, Kasey and Xu, Melody and Gonzalez, Sandy and Hertzberg, Orit and Gilmore, Rick O and Tamis-LeMonda, Catherine and Adolph, Karen E},
    title   = {{(Hyper)active} Data Curation: A Video Case Study from Behavioral Science},
    journal = {PsyArXiv},
    year    = {2021},
    url     = {https://psyarxiv.com/89rcb/download?format=pdf},
  }
  % Journal article introducing the Electronically Activated Recorder (EAR).
  @article{ear1,
    author    = {Mehl, Matthias R. and Pennebaker, James W. and Crow, D. Michael and Dabbs, James and Price, John H.},
    title     = {The Electronically Activated Recorder ({EAR}): A device for sampling naturalistic daily activities and conversations},
    journal   = {Behavior Research Methods, Instruments, {\&} Computers},
    volume    = {33},
    number    = {4},
    pages     = {517--523},
    month     = nov,
    year      = {2001},
    publisher = {Springer Science and Business Media {LLC}},
    doi       = {10.3758/bf03195410},
    url       = {https://doi.org/10.3758/bf03195410},
  }
  % Conference paper; the author list is truncated with `and others`.
  @inproceedings{schuller2017interspeech,
    author    = {Schuller, Bj{\"o}rn and Steidl, Stefan and Batliner, Anton and Bergelson, Elika and Krajewski, Jarek and Janott, Christoph and Amatuni, Andrei and Casillas, Marisa and Seidl, Amanda and Soderstrom, Melanie and others},
    title     = {The {Interspeech} 2017 computational paralinguistics challenge: Addressee, cold \& snoring},
    booktitle = {Interspeech},
    year      = {2017},
  }
  % Evaluation of the LENA system.
  % NOTE(review): `publisher` names a preprint server while `journal` names a journal;
  % confirm which version (and year) is meant to be cited.
  @article{lenaeval1,
    author    = {Cristia, Alejandrina and Lavechin, Marvin and Scaff, Camila and Soderstrom, Melanie and Rowland, Caroline and R{\"a}s{\"a}nen, Okko and Bunce, John and Bergelson, Elika},
    title     = {A thorough evaluation of the {Language Environment Analysis} ({LENA}) system},
    journal   = {Behavior Research Methods},
    year      = {2019},
    publisher = {OSF Preprints},
  }
  % Software reference. The home page is given via `howpublished` (as other software
  % entries in this file do) instead of being stored as a journal name.
  @misc{boersma2006praat,
    author       = {Boersma, Paul},
    title        = {{Praat}: doing phonetics by computer},
    howpublished = {\url{http://www.praat.org/}},
    year         = {2006},
  }
  % Workshop paper on child-adult diarization.
  @inproceedings{krishnamachari2021developing,
    author       = {Krishnamachari, Suchitra and Kumar, Manoj and Kim, So Hyun and Lord, Catherine and Narayanan, Shrikanth},
    title        = {Developing Neural Representations for Robust Child-Adult Diarization},
    booktitle    = {2021 IEEE Spoken Language Technology Workshop (SLT)},
    organization = {IEEE},
    pages        = {590--597},
    year         = {2021},
  }
  % Journal article; journal name in its proper casing, publisher and city separated.
  @article{warlaumont2014social,
    author    = {Warlaumont, Anne S and Richards, Jeffrey A and Gilkerson, Jill and Oller, D Kimbrough},
    title     = {A social feedback loop for speech development and its reduction in autism},
    journal   = {Psychological Science},
    volume    = {25},
    number    = {7},
    pages     = {1314--1324},
    year      = {2014},
    publisher = {SAGE Publications},
    address   = {Los Angeles, CA},
  }
  % Interspeech conference paper, so the venue goes in `booktitle`.
  @inproceedings{riad2020vocal,
    author    = {Riad, Rachid and Titeux, Hadrien and Lemoine, Laurie and Montillot, Justine and Bagnou, Jennifer Hamet and Cao, Xuan Nga and Dupoux, Emmanuel and Bachoud-L{\'e}vi, Anne-Catherine},
    title     = {Vocal markers from sustained phonation in {Huntington's Disease}},
    booktitle = {Proc. Interspeech 2020},
    year      = {2020},
  }
  % Journal article. A plain apostrophe avoids needing an extra LaTeX package,
  % and the title carries no final period (styles add their own punctuation).
  @article{ear2,
    author    = {Mehl, Matthias R. and Pennebaker, James W.},
    title     = {The sounds of social life: A psychometric analysis of students' daily social environments and natural conversations},
    journal   = {Journal of Personality and Social Psychology},
    volume    = {84},
    number    = {4},
    pages     = {857--870},
    year      = {2003},
    publisher = {American Psychological Association ({APA})},
    doi       = {10.1037/0022-3514.84.4.857},
    url       = {https://doi.org/10.1037/0022-3514.84.4.857},
  }
  % Book (volume 2); the acronym is brace-protected against sentence casing.
  @book{macwhinney2000childes,
    author    = {MacWhinney, Brian},
    title     = {The {CHILDES} project: The database},
    volume    = {2},
    publisher = {Psychology Press},
    year      = {2000},
  }
  % Journal article (Seminars in Speech and Language is a journal, not a proceedings volume).
  % NOTE(review): `pages` lists a single page - confirm the full page range.
  @article{vandam2016homebank,
    author  = {VanDam, Mark and Warlaumont, Anne S and Bergelson, Elika and Cristia, Alejandrina and Soderstrom, Melanie and De Palma, Paul and MacWhinney, Brian},
    title   = {{HomeBank}: An online repository of daylong child-centered audio recordings},
    journal = {Seminars in Speech and Language},
    volume  = {37},
    pages   = {128},
    year    = {2016},
  }
  % Journal article; the journal name is stored in its proper title casing.
  @article{christakis2009audible,
    author    = {Christakis, Dimitri A and Gilkerson, Jill and Richards, Jeffrey A and Zimmerman, Frederick J and Garrison, Michelle M and Xu, Dongxin and Gray, Sharmistha and Yapanel, Umit},
    title     = {Audible television and decreased adult words, infant vocalizations, and conversational turns: a population-based study},
    journal   = {Archives of Pediatrics \& Adolescent Medicine},
    volume    = {163},
    number    = {6},
    pages     = {554--558},
    year      = {2009},
    publisher = {American Medical Association},
  }
  % Corpus hosted on HomeBank; the title is a proper name, so each word is protected.
  @misc{warl,
    author    = {Warlaumont, Anne},
    title     = {{HomeBank} {Warlaumont} {Corpus}},
    publisher = {TalkBank},
    year      = {2016},
    doi       = {10.21415/T54S3C},
    url       = {http://homebank.talkbank.org/access/Password/Warlaumont.html},
  }
  % Proceedings-journal article on language revitalization workshops.
  @article{Nee2021,
    author    = {Nee, Julia},
    title     = {Understanding the effects of language revitalization workshops using long-format speech environment recordings},
    journal   = {Proceedings of the Linguistic Society of America},
    volume    = {6},
    number    = {1},
    pages     = {213},
    month     = mar,
    year      = {2021},
    publisher = {Linguistic Society of America},
    doi       = {10.3765/plsa.v6i1.4967},
    url       = {https://doi.org/10.3765/plsa.v6i1.4967},
  }
  % Journal article. The article number (24) is stored in `pages`; the publisher PDF
  % link lives in the non-printing `pdf` field rather than in `eprint`.
  @article{casillas2019step,
    author  = {Casillas, Marisa and Cristia, Alejandrina},
    title   = {A step-by-step guide to collecting and analyzing long-format speech environment ({LFSE}) recordings},
    journal = {Collabra: Psychology},
    volume  = {5},
    number  = {1},
    pages   = {24},
    month   = may,
    year    = {2019},
    issn    = {2474-7394},
    doi     = {10.1525/collabra.209},
    url     = {https://doi.org/10.1525/collabra.209},
    pdf     = {https://online.ucpress.edu/collabra/article-pdf/5/1/24/437539/209-3199-1-pb.pdf},
  }
  % Interspeech conference paper; accented letters use LaTeX escapes like the rest of the file.
  @inproceedings{lavechin2020opensource,
    author    = {Lavechin, Marvin and Bousbib, Ruben and Bredin, Herv{\'e} and Dupoux, Emmanuel and Cristia, Alejandrina},
    title     = {An open-source voice type classifier for child-centered daylong recordings},
    booktitle = {Proc. Interspeech 2020},
    year      = {2020},
  }
  % Journal article describing the ALICE tool; the tool name is brace-protected.
  @article{rasanen2020,
    author    = {R{\"a}s{\"a}nen, Okko and Seshadri, Shreyas and Lavechin, Marvin and Cristia, Alejandrina and Casillas, Marisa},
    title     = {{ALICE}: An open-source tool for automatic measurement of phoneme, syllable, and word counts from child-centered daylong recordings},
    journal   = {Behavior Research Methods},
    pages     = {1--18},
    year      = {2020},
    publisher = {Springer},
  }
  % Conference paper. Names use the "Last, First" form so the two-word surname
  % "Al Futaisi" is kept together for sorting and labels.
  @inproceedings{AlFutaisi2019,
    author    = {Al Futaisi, Najla and Zhang, Zixing and Cristia, Alejandrina and Warlaumont, Anne and Schuller, Bj{\"o}rn},
    title     = {{VCMNet}: Weakly Supervised Learning for Automatic Infant Vocalisation Maturity Analysis},
    booktitle = {2019 International Conference on Multimodal Interaction},
    publisher = {{ACM}},
    month     = oct,
    year      = {2019},
    doi       = {10.1145/3340555.3353751},
    url       = {https://doi.org/10.1145/3340555.3353751},
  }
  % Software reference for pympi-ling, version 1.70.
  % NOTE(review): `year` holds a range of years rather than a single year - confirm the
  % bibliography style accepts this.
  @misc{pympi-1.70,
    author       = {Lubbers, Mart and Torreira, Francisco},
    title        = {pympi-ling: a {Python} module for processing {ELAN}s {EAF} and {Praat}s {TextGrid} annotation files},
    howpublished = {\url{https://pypi.python.org/pypi/pympi-ling}},
    year         = {2013--2021},
    note         = {Version 1.70},
  }
  % Conference paper (International Conference on Computational Linguistics).
  @inproceedings{bird2020decolonising,
    author    = {Bird, Steven},
    title     = {Decolonising speech and language technology},
    booktitle = {Proceedings of the 28th International Conference on Computational Linguistics},
    pages     = {3504--3519},
    year      = {2020},
  }
  % Preprint hosted on OSF Preprints.
  @article{cychosz2021using,
    author  = {Cychosz, Meg and Cristia, Alejandrina},
    title   = {Using big data from long-form recordings to study development and optimize societal impact},
    journal = {OSF Preprints},
    year    = {2021},
  }
  % Journal article on ethics for long-form recordings.
  @article{Cychosz2020,
    author    = {Cychosz, Margaret and Romeo, Rachel and Soderstrom, Melanie and Scaff, Camila and Ganek, Hillary and Cristia, Alejandrina and Casillas, Marisa and de Barbaro, Kaya and Bang, Janet Y. and Weisleder, Adriana},
    title     = {Longform recordings of everyday life: Ethics for best practices},
    journal   = {Behavior Research Methods},
    volume    = {52},
    number    = {5},
    pages     = {1951--1969},
    month     = feb,
    year      = {2020},
    publisher = {Springer Science and Business Media {LLC}},
    doi       = {10.3758/s13428-020-01365-9},
    url       = {https://doi.org/10.3758/s13428-020-01365-9},
  }
  % Software repository; the hosting platform goes in `howpublished`, which is the
  % field misc entries use for the medium.
  @misc{eaf-anonymizer-original,
    author       = {MacEwan, Sarah},
    title        = {{HomeBank} {ITS} file anonymizer},
    howpublished = {GitHub},
    url          = {https://github.com/HomeBankCode/ITS_annonymizer},
    year         = {2019},
  }
  % Interspeech 2017 conference paper.
  @inproceedings{Casillas2017,
    author    = {Casillas, Marisa and Bergelson, Elika and Warlaumont, Anne S. and Cristia, Alejandrina and Soderstrom, Melanie and VanDam, Mark and Sloetjes, Han},
    title     = {A New Workflow for Semi-Automatized Annotations: Tests with Long-Form Naturalistic Recordings of Children's Language Environments},
    booktitle = {Proc. Interspeech 2017},
    pages     = {2098--2102},
    year      = {2017},
    doi       = {10.21437/Interspeech.2017-1418},
    url       = {https://doi.org/10.21437/Interspeech.2017-1418},
  }
  % Journal article on data sharing in neuroimaging.
  @article{Poldrack2014,
    author    = {Poldrack, Russell A and Gorgolewski, Krzysztof J},
    title     = {Making big data open: data sharing in neuroimaging},
    journal   = {Nature Neuroscience},
    volume    = {17},
    number    = {11},
    pages     = {1510--1517},
    month     = oct,
    year      = {2014},
    publisher = {Springer Science and Business Media {LLC}},
    doi       = {10.1038/nn.3818},
    url       = {https://doi.org/10.1038/nn.3818},
  }
  % Dataset hosted on Databrary; the dataset name is brace-protected against recasing.
  @misc{starter,
    author    = {Bergelson, Elika and Warlaumont, Anne and Cristia, Alejandrina and Casillas, Marisa and Rosemberg, Celia and Soderstrom, Melanie and Rowland, Caroline and Durrant, Samantha and Bunce, John},
    title     = {{Starter-ACLEW}},
    publisher = {Databrary},
    year      = {2017},
    doi       = {10.17910/B7.390},
    url       = {http://databrary.org/volume/390},
    copyright = {Databrary Access Agreement},
  }
  % Journal article; `month` uses the unquoted three-letter macro so styles can localise it.
  @article{Perkel_2019,
    author    = {Perkel, Jeffrey M.},
    title     = {11 ways to avert a data-storage disaster},
    journal   = {Nature},
    volume    = {568},
    number    = {7750},
    pages     = {131--132},
    month     = apr,
    year      = {2019},
    publisher = {Springer Science and Business Media {LLC}},
    doi       = {10.1038/d41586-019-01040-w},
    url       = {https://doi.org/10.1038/d41586-019-01040-w},
  }
  % Software reference; the group author is braced so it is treated as one indivisible name.
  @misc{ffmpeg,
    author = {{ffmpeg Developers}},
    title  = {ffmpeg tool},
    year   = {2021},
    url    = {http://ffmpeg.org/},
  }
  % Article in the SSRN Electronic Journal.
  @article{Brase2009datacite,
    author    = {Brase, Jan},
    title     = {Datacite - A Global Registration Agency for Research Data},
    journal   = {{SSRN} Electronic Journal},
    year      = {2010},
    publisher = {Elsevier {BV}},
    doi       = {10.2139/ssrn.1639998},
    url       = {https://doi.org/10.2139/ssrn.1639998},
  }
  % Software reference for Pydub.
  @misc{robert2018pydub,
    author    = {Robert, James and Webbie, Marc and others},
    title     = {Pydub},
    publisher = {GitHub},
    url       = {http://pydub.com/},
    year      = {2018},
  }
  % arXiv preprint; the challenge name is written as an acronym and brace-protected,
  % matching the other DIHARD entries in this file.
  @article{ryant2019second,
    author  = {Ryant, Neville and Church, Kenneth and Cieri, Christopher and Cristia, Alejandrina and Du, Jun and Ganapathy, Sriram and Liberman, Mark},
    title   = {The second {DIHARD} diarization challenge: Dataset, task, and baselines},
    journal = {arXiv preprint arXiv:1906.07839},
    year    = {2019},
  }
  % Technical report, not a journal article.
  % NOTE(review): the issuing institution is not recorded; add it (and switch to a
  % techreport entry) once confirmed.
  @misc{ryant2018first,
    author       = {Ryant, Neville and Church, Kenneth and Cieri, Christopher and Cristia, Alejandrina and Du, Jun and Ganapathy, Sriram and Liberman, Mark},
    title        = {First {DIHARD} challenge evaluation plan},
    howpublished = {Technical report},
    year         = {2018},
  }
  % arXiv preprint; the challenge acronym is brace-protected against sentence casing.
  @article{ryant2020third,
    author  = {Ryant, Neville and Church, Kenneth and Cieri, Christopher and Du, Jun and Ganapathy, Sriram and Liberman, Mark},
    title   = {Third {DIHARD} Challenge Evaluation Plan},
    journal = {arXiv preprint arXiv:2006.05815},
    year    = {2020},
  }
  % Journal article stating the FAIR guiding principles.
  @article{Wilkinson2016,
    author    = {Mark D. Wilkinson and Michel Dumontier and IJsbrand Jan Aalbersberg and Gabrielle Appleton and Myles Axton and Arie Baak and Niklas Blomberg and Jan-Willem Boiten and Luiz Bonino da Silva Santos and Philip E. Bourne and Jildau Bouwman and Anthony J. Brookes and Tim Clark and Merc{\`{e}} Crosas and Ingrid Dillo and Olivier Dumon and Scott Edmunds and Chris T. Evelo and Richard Finkers and Alejandra Gonzalez-Beltran and Alasdair J.G. Gray and Paul Groth and Carole Goble and Jeffrey S. Grethe and Jaap Heringa and Peter A.C 't Hoen and Rob Hooft and Tobias Kuhn and Ruben Kok and Joost Kok and Scott J. Lusher and Maryann E. Martone and Albert Mons and Abel L. Packer and Bengt Persson and Philippe Rocca-Serra and Marco Roos and Rene van Schaik and Susanna-Assunta Sansone and Erik Schultes and Thierry Sengstag and Ted Slater and George Strawn and Morris A. Swertz and Mark Thompson and Johan van der Lei and Erik van Mulligen and Jan Velterop and Andra Waagmeester and Peter Wittenburg and Katherine Wolstencroft and Jun Zhao and Barend Mons},
    title     = {The {FAIR} Guiding Principles for scientific data management and stewardship},
    journal   = {Scientific Data},
    volume    = {3},
    number    = {1},
    month     = mar,
    year      = {2016},
    publisher = {Springer Science and Business Media {LLC}},
    doi       = {10.1038/sdata.2016.18},
    url       = {https://doi.org/10.1038/sdata.2016.18},
  }
  % Reference for the Zenodo repository; both authors are organisations and are braced as such.
  @misc{zenodo,
    author    = {{European Organization For Nuclear Research} and {OpenAIRE}},
    title     = {Zenodo},
    publisher = {CERN},
    year      = {2013},
    doi       = {10.25495/7GXK-RD71},
    url       = {https://www.zenodo.org/},
    keywords  = {FOS: Physical sciences, Publication, Dataset},
    language  = {en},
  }
  % Journal article introducing the Dataverse Network; page range uses the `--` convention.
  @article{dataverse,
    author   = {King, Gary},
    title    = {An Introduction to the {Dataverse Network} as an Infrastructure for Data Sharing},
    journal  = {Sociological Methods and Research},
    volume   = {36},
    pages    = {173--199},
    year     = {2007},
    abstract = {We introduce a set of integrated developments in web application software, networking, data citation standards, and statistical methods designed to put some of the universe of data and data sharing practices on somewhat firmer ground. We have focused on social science data, but aspects of what we have developed may apply more widely. The idea is to facilitate the public distribution of persistent, authorized, and verifiable data, with powerful but easy-to-use technology, even when the data are confidential or proprietary. We intend to solve some of the sociological problems of data sharing via technological means, with the result intended to benefit both the scientific community and the sometimes apparently contradictory goals of individual researchers.},
  }
  % Software release archived on Zenodo. The group author is double-braced so it is
  % not split into first and last names.
  @misc{pandas-software,
    author    = {{The Pandas development team}},
    title     = {{pandas-dev/pandas}: {Pandas}},
    publisher = {Zenodo},
    version   = {latest},
    month     = feb,
    year      = {2020},
    doi       = {10.5281/zenodo.3509134},
    url       = {https://doi.org/10.5281/zenodo.3509134},
  }
  % Conference paper. Only the proper noun is protected; casing is left to the style.
  @inproceedings{pandas-paper,
    author    = {McKinney, Wes},
    title     = {Data Structures for Statistical Computing in {Python}},
    booktitle = {Proceedings of the 9th {Python} in Science Conference},
    editor    = {van der Walt, St{\'e}fan and Millman, Jarrod},
    pages     = {56--61},
    year      = {2010},
    doi       = {10.25080/Majora-92bf1922-00a},
  }
  % LENA Foundation technical report; report number, institution and URL each have their own field.
  @techreport{gilkerson2008power,
    author      = {Gilkerson, J. and Richards, J. A.},
    title       = {The power of talk},
    institution = {LENA Foundation},
    number      = {LTR-01-2},
    year        = {2008},
    url         = {https://www.lena.org/wp-content/uploads/2016/07/LTR-01-2_PowerOfTalk.pdf},
  }
  % Manual identified by DOI; the bare DOI is stored in `doi` with the resolver link in `url`.
  @misc{vandam2018vetting,
    author = {VanDam, M. and Warlaumont, A. and MacWhinney, B. and Soderstrom, M. and Bergelson, E.},
    title  = {Vetting Manual: Preparation of Recordings for Unrestricted Publication in {HomeBank} (Version 1.1)},
    year   = {2018},
    doi    = {10.21415/T56H4M},
    url    = {https://doi.org/10.21415/T56H4M},
  }
  % Journal article; the author list is truncated with `and others`.
  @article{broesch2020navigating,
    author    = {Broesch, Tanya and Crittenden, Alyssa N and Beheim, Bret A and Blackwell, Aaron D and Bunce, John A and Colleran, Heidi and Hagel, Kristin and Kline, Michelle and McElreath, Richard and Nelson, Robin G and others},
    title     = {Navigating cross-cultural research: methodological and ethical considerations},
    journal   = {Proceedings of the Royal Society B},
    volume    = {287},
    number    = {1935},
    pages     = {20201245},
    year      = {2020},
    publisher = {The Royal Society},
  }
  % F1000Research article. The version and peer-review status are kept in `note`
  % so the title contains only the title.
  @article{10.12688/f1000research.10783.1,
    author  = {Ghosh, S. S. and Poline, J. B. and Keator, D. B. and Halchenko, Y. O. and Thomas, A. G. and Kessler, D. A. and Kennedy, D. N.},
    title   = {A very simple, re-executable neuroimaging publication},
    journal = {F1000Research},
    volume  = {6},
    number  = {124},
    year    = {2017},
    note    = {Version 1; peer review: 2 approved with reservations},
    doi     = {10.12688/f1000research.10783.1},
  }
  % Journal article on sharing code in neuroscience.
  @article{Eglen2017,
    author   = {Eglen, Stephen J. and Marwick, Ben and Halchenko, Yaroslav O. and Hanke, Michael and Sufi, Shoaib and Gleeson, Padraig and Silver, R. Angus and Davison, Andrew P. and Lanyon, Linda and Abrams, Mathew and Wachtler, Thomas and Willshaw, David J. and Pouzat, Christophe and Poline, Jean-Baptiste},
    title    = {Toward standard practices for sharing computer code and programs in neuroscience},
    journal  = {Nature Neuroscience},
    volume   = {20},
    number   = {6},
    pages    = {770--773},
    month    = jun,
    day      = {01},
    year     = {2017},
    issn     = {1546-1726},
    doi      = {10.1038/nn.4550},
    url      = {https://doi.org/10.1038/nn.4550},
    abstract = {Computational techniques are central in many areas of neuroscience and are relatively easy to share. This paper describes why computer programs underlying scientific publications should be shared and lists simple steps for sharing. Together with ongoing efforts in data sharing, this should aid reproducibility of research.},
  }
  % LENA Research Foundation technical report; acronyms and the trademark sign are
  % written explicitly and protected from recasing.
  @techreport{xu2008lenatm,
    author      = {Xu, D. and Yapanel, U. and Gray, S. and Baer, C. T.},
    title       = {The {LENA}{\texttrademark} language environment analysis system: The interpretive time segments ({ITS}) file},
    institution = {LENA Research Foundation},
    number      = {LTR-04-2},
    year        = {2008},
  }
  % Journal article; `pages` holds the article number.
  @article{levin2021sensing,
    author    = {Levin, Hannah I and Egger, Dominique and Andres, Lara and Johnson, Mckensey and Bearman, Sarah Kate and de Barbaro, Kaya},
    title     = {Sensing everyday activity: Parent perceptions and feasibility},
    journal   = {Infant Behavior and Development},
    volume    = {62},
    pages     = {101511},
    year      = {2021},
    publisher = {Elsevier},
  }
  % Conference paper describing ELAN; the tool name is brace-protected.
  @inproceedings{wittenburg2006elan,
    author    = {Wittenburg, Peter and Brugman, Hennie and Russel, Albert and Klassmann, Alex and Sloetjes, Han},
    title     = {{ELAN}: a professional framework for multimodality research},
    booktitle = {5th International Conference on Language Resources and Evaluation (LREC 2006)},
    pages     = {1556--1559},
    year      = {2006},
  }
  % Entry for the CHILDES Project (third edition) as listed in Computational Linguistics.
  @article{MacWhinney2000,
    author    = {MacWhinney, Brian},
    title     = {The {CHILDES} Project: Tools for Analyzing Talk (third edition): Volume I: Transcription format and programs, Volume {II}: The database},
    journal   = {Computational Linguistics},
    volume    = {26},
    number    = {4},
    pages     = {657},
    month     = dec,
    year      = {2000},
    publisher = {{MIT} Press - Journals},
    doi       = {10.1162/coli.2000.26.4.657},
    url       = {https://doi.org/10.1162/coli.2000.26.4.657},
  }
  % Journal article. The consortium is a group author and is braced as a single name;
  % fields with no value are omitted to avoid empty-field warnings.
  @article{pub.1022076283,
    author  = {Van Essen, David C. and Smith, Stephen M. and Barch, Deanna M. and Behrens, Timothy E. J. and Yacoub, Essa and Ugurbil, Kamil and {WU-Minn HCP Consortium}},
    title   = {The {WU-Minn Human Connectome Project}: An overview},
    journal = {NeuroImage},
    volume  = {80},
    pages   = {62--79},
    year    = {2013},
    doi     = {10.1016/j.neuroimage.2013.05.041},
    url     = {http://europepmc.org/articles/pmc3724347?pdf=render},
  }
  % Corpus hosted on HomeBank; proper names in the title are brace-protected.
  @misc{vandam-day,
    author    = {VanDam, Mark},
    title     = {{HomeBank} {VanDam} {Public} 5-minute {Corpus}},
    publisher = {TalkBank},
    year      = {2015},
    doi       = {10.21415/T5388S},
    url       = {http://homebank.talkbank.org/access/Public/VanDam-5minute.html},
  }
  % Online book on long-form recordings.
  @misc{exelang-book,
    author = {Pisani, Sara and Gautheron, Lucas and Cristia, Alejandrina},
    title  = {Long-form recordings: From A to Z},
    year   = {2021},
    url    = {https://bookdown.org/alecristia/exelang-book/},
  }
  % Conference abstract (AGU Fall Meeting), as provided by the SAO/NASA Astrophysics Data System.
  @inproceedings{zooniverse,
    author    = {{Borne}, K.~D. and {Zooniverse Team}},
    title     = {{The Zooniverse: A Framework for Knowledge Discovery from Citizen Science Data}},
    booktitle = {AGU Fall Meeting Abstracts},
    volume    = {2011},
    eid       = {ED23C-0650},
    month     = dec,
    year      = {2011},
    keywords  = {0800 EDUCATION, 0815 EDUCATION / Informal education, 1914 INFORMATICS / Data mining, 1942 INFORMATICS / Machine learning},
    adsurl    = {https://ui.adsabs.harvard.edu/abs/2011AGUFMED23C0650B},
    adsnote   = {Provided by the SAO/NASA Astrophysics Data System},
  }
  % Preprint with an osf.io DOI; `journal` names the preprint server, as other
  % preprint entries in this file do, instead of being left empty.
  % NOTE(review): confirm "Kelleher" is the surname and "Bridgette Lynne" the given names.
  @article{semenzin2020a,
    author    = {Semenzin, Chiara and Hamrick, Lisa and Seidl, Amanda and Kelleher, Bridgette Lynne and Cristia, Alejandrina},
    title     = {Describing vocalizations in young children: A big data approach through citizen science annotation},
    journal   = {OSF Preprints},
    month     = nov,
    year      = {2020},
    publisher = {Center for Open Science},
    doi       = {10.31219/osf.io/z6exv},
    url       = {https://doi.org/10.31219/osf.io/z6exv},
  }
  % Preprint with an osf.io DOI; `journal` names the preprint server, as other
  % preprint entries in this file do, instead of being left empty.
  % NOTE(review): confirm "Kelleher" is the surname and "Bridgette Lynne" the given names.
  @article{semenzin2020b,
    author    = {Semenzin, Chiara and Hamrick, Lisa and Seidl, Amanda and Kelleher, Bridgette Lynne and Cristia, Alejandrina},
    title     = {Towards Large-Scale Data Annotation of Audio from Wearables: Validating {Zooniverse} Annotations of Infant Vocalization Types},
    journal   = {OSF Preprints},
    month     = nov,
    year      = {2020},
    publisher = {Center for Open Science},
    doi       = {10.31219/osf.io/gpxf5},
    url       = {https://doi.org/10.31219/osf.io/gpxf5},
  }
  % Book archived on Zenodo; the product name is brace-protected against recasing.
  @book{datalad_handbook,
    author    = {Wagner, Adina S. and Waite, Laura K. and Meyer, Kyle and Heckner, Marisa K. and Kadelka, Tobias and Reuter, Niels and Waite, Alexander Q. and Poldrack, Benjamin and Markiewicz, Christopher J. and Halchenko, Yaroslav O. and Vavra, Peter and Chormai, Pattarawat and Poline, Jean-Baptiste and Paas, Lya K. and Herholz, Peer and Mochalski, Lisa N. and Kraljevic, Nevena and Wiersch, Lisa and Hutton, Alexandre and Hanke, Michael},
    title     = {The {DataLad} Handbook},
    publisher = {Zenodo},
    year      = {2020},
    doi       = {10.5281/ZENODO.3608612},
    url       = {https://zenodo.org/record/3608612},
    keywords  = {data management, book, datalad, version control, teaching resource},
    copyright = {Creative Commons Attribution Share Alike 4.0 International},
  }
  % Journal article. Accents are written as brace groups starting with the accent
  % command so BibTeX treats each as a single letter when sorting and labelling.
  @article{datalad_paper,
    author    = {Yaroslav Halchenko and Kyle Meyer and Benjamin Poldrack and Debanjum Solanky and Adina Wagner and Jason Gors and Dave MacFarlane and Dorian Pustina and Vanessa Sochat and Satrajit Ghosh and Christian M{\"o}nch and Christopher Markiewicz and Laura Waite and Ilya Shlyakhter and Alejandro de la Vega and Soichi Hayashi and Christian H{\"a}usler and Jean-Baptiste Poline and Tobias Kadelka and Kusti Skyt{\'{e}}n and Dorota Jarecka and David Kennedy and Ted Strauss and Matt Cieslak and Peter Vavra and Horea-Ioan Ioanas and Robin Schneider and Mika Pfl{\"u}ger and James Haxby and Simon Eickhoff and Michael Hanke},
    title     = {{DataLad}: distributed system for joint management of code, data, and their relationship},
    journal   = {Journal of Open Source Software},
    volume    = {6},
    number    = {63},
    pages     = {3262},
    month     = jul,
    year      = {2021},
    publisher = {The Open Journal},
    doi       = {10.21105/joss.03262},
    url       = {https://doi.org/10.21105/joss.03262},
  }
  % Journal article.
  % NOTE(review): volume, issue and pages are not recorded here; add them from the
  % publisher record.
  @article{decentralization_hanke,
    author    = {Hanke, Michael and Pestilli, Franco and Wagner, Adina S. and Markiewicz, Christopher J. and Poline, Jean-Baptiste and Halchenko, Yaroslav O.},
    title     = {In defense of decentralized research data management},
    journal   = {Neuroforum},
    month     = jan,
    year      = {2021},
    publisher = {Walter de Gruyter {GmbH}},
    doi       = {10.1515/nf-2020-0037},
    url       = {https://doi.org/10.1515/nf-2020-0037},
  }
  % Journal article on the Dat Project.
  @article{decentralization_robinson,
    author    = {Robinson, Danielle C. and Hand, Joe A. and Madsen, Mathias Buus and McKelvey, Karissa R.},
    title     = {The Dat Project, an open and decentralized research data tool},
    journal   = {Scientific Data},
    volume    = {5},
    number    = {1},
    month     = oct,
    year      = {2018},
    publisher = {Springer Science and Business Media {LLC}},
    doi       = {10.1038/sdata.2018.221},
    url       = {https://doi.org/10.1038/sdata.2018.221},
  }
  % Software repository (template for a reproducible paper); tool names are brace-protected.
  @misc{reproducible_paper,
    author       = {Wagner, Adina},
    title        = {datalad-handbook/repro-paper-sketch: A template to create a reproducible paper with {LaTeX}, {Makefiles}, {Python}, and {DataLad}},
    howpublished = {\url{https://github.com/datalad-handbook/repro-paper-sketch/}},
    year         = {2020},
    note         = {(Accessed on 04/30/2021)},
  }
  % Book cited for chapter 12.
  @book{alpha,
    author    = {Krippendorff, Klaus},
    title     = {Content analysis: an introduction to its methodology},
    publisher = {SAGE},
    address   = {Los Angeles London},
    year      = {2013},
    isbn      = {1412983150},
    chapter   = {12},
  }
  % Journal article on nominal-scale agreement among many raters. The title carries
  % no final period; styles add their own punctuation.
  @article{kappa,
    author    = {Fleiss, Joseph L.},
    title     = {Measuring nominal scale agreement among many raters},
    journal   = {Psychological Bulletin},
    volume    = {76},
    number    = {5},
    pages     = {378--382},
    year      = {1971},
    publisher = {American Psychological Association ({APA})},
    doi       = {10.1037/h0031619},
    url       = {https://doi.org/10.1037/h0031619},
  }
  % Book on inter-rater reliability.
  @book{AC1,
    author    = {Gwet, Kilem},
    title     = {Handbook of inter-rater reliability: the definitive guide to measuring the extent of agreement among raters},
    publisher = {Advanced Analytics, LLC},
    address   = {Gaithersburg, MD},
    year      = {2014},
    isbn      = {0970806280},
  }
  % CoRR (arXiv) paper exported from DBLP. The toolkit name and acronym are
  % brace-protected; DBLP bookkeeping fields are kept unchanged.
  @article{nltk,
    author    = {Loper, Edward and Bird, Steven},
    title     = {{NLTK}: The {Natural Language Toolkit}},
    journal   = {CoRR},
    volume    = {cs.CL/0205028},
    year      = {2002},
    url       = {http://dblp.uni-trier.de/db/journals/corr/corr0205.html#cs-CL-0205028},
    ee        = {https://arxiv.org/abs/cs/0205028},
    biburl    = {https://www.bibsonomy.org/bibtex/2eac35636d7e2bb4a0264313ed0791372/dblp},
    keywords  = {dblp},
    added-at  = {2020-01-10T00:00:00.000+0100},
    timestamp = {2020-01-11T11:43:05.000+0100},
    interhash = {1af05e5f1cea0feeea8da5f68707a841},
    intrahash = {eac35636d7e2bb4a0264313ed0791372},
  }
  % Journal article defining the Gamma inter-annotator agreement measure.
  % NOTE(review): \upgamma is not a core LaTeX command - confirm the document loads a
  % package that defines it (e.g. upgreek).
  @article{gamma,
    author    = {Mathet, Yann and Widl{\"o}cher, Antoine and M{\'{e}}tivier, Jean-Philippe},
    title     = {The Unified and Holistic Method {Gamma} ({$\upgamma$}) for Inter-Annotator Agreement Measure and Alignment},
    journal   = {Computational Linguistics},
    volume    = {41},
    number    = {3},
    pages     = {437--479},
    month     = sep,
    year      = {2015},
    publisher = {{MIT} Press - Journals},
    doi       = {10.1162/coli_a_00227},
    url       = {https://doi.org/10.1162/coli_a_00227},
  }
  % Titeux and Riad (2021), pygamma-agreement working paper deposited on HAL.
  % Only the tokens whose case must survive (package name, "Gamma", the math,
  % "Python") are braced, instead of double-bracing the whole title.
  % `note` is required for @unpublished and is kept as exported.
  @unpublished{pygamma_agreement,
    author      = {Titeux, Hadrien and Riad, Rachid},
    title       = {{pygamma-agreement}: {Gamma} {$\gamma$} measure for inter/intra-annotator agreement in {Python}},
    note        = {working paper or preprint},
    year        = {2021},
    month       = feb,
    url         = {https://hal.archives-ouvertes.fr/hal-03144116},
    pdf         = {https://hal.archives-ouvertes.fr/hal-03144116/file/gamma-paper.pdf},
    keywords    = {Annotation de corpus},
    hal_id      = {hal-03144116},
    hal_version = {v1},
  }
  % Bredin (2017), pyannote.metrics, presented at Interspeech 2017.
  % `month` uses the predefined `aug` macro so styles can localise or abbreviate it.
  % The author's accent is written as {\'e} so BibTeX sorts and labels it as one letter.
  % Only the package name is brace-protected in the title.
  @inproceedings{pyannote.metrics,
    author    = {Bredin, Herv{\'e}},
    title     = {{pyannote.metrics}: a toolkit for reproducible evaluation, diagnostic, and error analysis of speaker diarization systems},
    booktitle = {Interspeech 2017, 18th Annual Conference of the International Speech Communication Association},
    address   = {Stockholm, Sweden},
    year      = {2017},
    month     = aug,
    url       = {http://pyannote.github.io/pyannote-metrics},
  }
  % McAuliffe et al. (2017), Montreal Forced Aligner, Interspeech 2017.
  % The booktitle is spelled the same way as the other Interspeech 2017 entry
  % in this file, so both proceedings references render identically.
  % `url` uses the current https://doi.org resolver, and the tool names are
  % braced so they survive sentence-casing.
  @inproceedings{mfa,
    author    = {McAuliffe, Michael and Socolof, Michaela and Mihuc, Sarah and Wagner, Michael and Sonderegger, Morgan},
    title     = {{Montreal Forced Aligner}: Trainable Text-Speech Alignment Using {Kaldi}},
    booktitle = {Interspeech 2017, 18th Annual Conference of the International Speech Communication Association},
    pages     = {498--502},
    year      = {2017},
    doi       = {10.21437/Interspeech.2017-1386},
    url       = {https://doi.org/10.21437/Interspeech.2017-1386}
  }
  % Wu et al. (2018), JMIR mHealth and uHealth 6(6): smartwatch monitoring of
  % patients with chronic obstructive pulmonary disease.
  @article{Wu2018,
    author    = {Robert Wu and Daniyal Liaqat and Eyal de Lara and Tatiana Son and Frank Rudzicz and Hisham Alshaer and Pegah Abed-Esfahani and Andrea S Gershon},
    title     = {Feasibility of Using a Smartwatch to Intensively Monitor Patients With Chronic Obstructive Pulmonary Disease: Prospective Cohort Study},
    journal   = {{JMIR} {mHealth} and {uHealth}},
    volume    = {6},
    number    = {6},
    pages     = {e10046},
    year      = {2018},
    month     = jun,
    publisher = {{JMIR} Publications Inc.},
    doi       = {10.2196/10046},
    url       = {https://doi.org/10.2196/10046}
  }
  % Gorgolewski et al. (2016), Scientific Data 3: the Brain Imaging Data Structure (BIDS).
  % "Ga{\"e}l" is written with a LaTeX escape, like the other accented names in
  % this file, so the entry also works with 8-bit BibTeX.
  % `pages` holds the article number, since the journal does not use page ranges.
  @article{Gorgolewski2016,
    author    = {Krzysztof J. Gorgolewski and Tibor Auer and Vince D. Calhoun and R. Cameron Craddock and Samir Das and Eugene P. Duff and Guillaume Flandin and Satrajit S. Ghosh and Tristan Glatard and Yaroslav O. Halchenko and Daniel A. Handwerker and Michael Hanke and David Keator and Xiangrui Li and Zachary Michael and Camille Maumet and B. Nolan Nichols and Thomas E. Nichols and John Pellman and Jean-Baptiste Poline and Ariel Rokem and Gunnar Schaefer and Vanessa Sochat and William Triplett and Jessica A. Turner and Ga{\"e}l Varoquaux and Russell A. Poldrack},
    title     = {The brain imaging data structure, a format for organizing and describing outputs of neuroimaging experiments},
    journal   = {Scientific Data},
    volume    = {3},
    number    = {1},
    pages     = {160044},
    year      = {2016},
    month     = jun,
    publisher = {Springer Science and Business Media {LLC}},
    doi       = {10.1038/sdata.2016.44},
    url       = {https://doi.org/10.1038/sdata.2016.44}
  }
  % Horien et al., Nature Human Behaviour 5(2), 185--193.
  % The citation key keeps its original "2020" (the online-first year) so
  % existing \cite commands still resolve; `year` and `month` give the date of
  % the printed issue (volume 5, number 2), which the volume and pages refer to.
  @article{Horien2020,
    author    = {Corey Horien and Stephanie Noble and Abigail S. Greene and Kangjoo Lee and Daniel S. Barron and Siyuan Gao and David O'Connor and Mehraveh Salehi and Javid Dadashkarimi and Xilin Shen and Evelyn M. R. Lake and R. Todd Constable and Dustin Scheinost},
    title     = {A hitchhiker's guide to working with large, open-source neuroimaging datasets},
    journal   = {Nature Human Behaviour},
    volume    = {5},
    number    = {2},
    pages     = {185--193},
    year      = {2021},
    month     = feb,
    publisher = {Springer Science and Business Media {LLC}},
    doi       = {10.1038/s41562-020-01005-4},
    url       = {https://doi.org/10.1038/s41562-020-01005-4}
  }
  % Powell (2021), Nature 590(7845): news feature on human genome research.
  @article{Powell2021,
    author    = {Kendall Powell},
    title     = {The broken promise that undermines human genome research},
    journal   = {Nature},
    volume    = {590},
    number    = {7845},
    pages     = {198--201},
    year      = {2021},
    month     = feb,
    publisher = {Springer Science and Business Media {LLC}},
    doi       = {10.1038/d41586-021-00331-5},
    url       = {https://doi.org/10.1038/d41586-021-00331-5}
  }
  % Hanke et al. (2021), Neuroforum: decentralized research data management.
  % The ahead-of-print placeholders (volume 0, number 0, and a page string
  % derived from the DOI) are replaced by the issue data so the reference does
  % not print "0(0):000010151520200037".
  % NOTE(review): volume/number/pages (27, 1, 17--25) should be confirmed
  % against the publisher's record for this DOI.
  @article{hanke_defense_2021,
    author   = {Hanke, Michael and Pestilli, Franco and Wagner, Adina S. and Markiewicz, Christopher J. and Poline, Jean-Baptiste and Halchenko, Yaroslav O.},
    title    = {In defense of decentralized research data management},
    journal  = {Neuroforum},
    volume   = {27},
    number   = {1},
    pages    = {17--25},
    year     = {2021},
    month    = jan,
    issn     = {2363-7013, 0947-0875},
    doi      = {10.1515/nf-2020-0037},
    url      = {https://www.degruyter.com/document/doi/10.1515/nf-2020-0037/html},
    urldate  = {2021-03-22},
    language = {en},
  }
  % Zevin et al. (2017), Classical and Quantum Gravity 34(6): the Gravity Spy project.
  % "Gravity Spy" is braced as a whole so sentence-casing styles do not lower
  % it to "Gravity spy"; {LIGO} was already protected.
  @article{gravityspy,
    author    = {M Zevin and S Coughlin and S Bahaadini and E Besler and N Rohani and S Allen and M Cabero and K Crowston and A K Katsaggelos and S L Larson and T K Lee and C Lintott and T B Littenberg and A Lundgren and C {\O}sterlund and J R Smith and L Trouille and V Kalogera},
    title     = {{Gravity Spy}: integrating advanced {LIGO} detector characterization, machine learning, and citizen science},
    journal   = {Classical and Quantum Gravity},
    volume    = {34},
    number    = {6},
    pages     = {064003},
    year      = {2017},
    month     = feb,
    publisher = {{IOP} Publishing},
    doi       = {10.1088/1361-6382/aa5cea},
    url       = {https://doi.org/10.1088/1361-6382/aa5cea}
  }
  % Code and software references (archived with DOIs)
  % Gautheron (2021), G-Node deposit: example annotation campaign on Zooniverse
  % using ChildProject.
  @misc{zooniverse_example,
    author    = {Gautheron, Lucas},
    title     = {Launching a campaign of annotations on Zooniverse with ChildProject},
    publisher = {G-Node},
    year      = {2021},
    doi       = {10.12751/G-NODE.K2H9AZ},
    url       = {https://doi.gin.g-node.org/10.12751/g-node.k2h9az},
    keywords  = {daylong recordings, crowd-sourcing, speech data management, annotation campaigns},
    language  = {en},
    copyright = {MIT License}
  }
  % Gautheron (2021), DataLad procedures deposited on the Open Science Framework.
  % This is a repository deposit, not a journal paper, so it is typed @misc
  % (like the G-Node deposit in this file) and the empty `journal` field, which
  % makes BibTeX emit an "empty journal" warning, is removed.
  % {DataLad} is braced to keep its capitalisation under sentence-casing styles.
  @misc{datalad_procedures,
    author    = {Gautheron, Lucas},
    title     = {{DataLad} Procedures for the management of long-form recordings},
    publisher = {Open Science Framework},
    year      = {2021},
    doi       = {10.17605/OSF.IO/6VCXK},
    url       = {https://osf.io/6vcxk/}
  }
  % Gautheron (2021), DataLad extension deposited on the Open Science Framework.
  % This is a repository deposit, not a journal paper, so it is typed @misc and
  % the empty `journal` field, which makes BibTeX emit an "empty journal"
  % warning, is removed.
  % {DataLad} is braced to keep its capitalisation under sentence-casing styles.
  @misc{datalad_extension,
    author    = {Gautheron, Lucas},
    title     = {{DataLad} extension for child-centered in-situ recordings},
    publisher = {Open Science Framework},
    year      = {2021},
    doi       = {10.17605/OSF.IO/C2J5A},
    url       = {https://osf.io/c2j5a/},
    copyright = {MIT License}
  }