@inproceedings{fraser-etal-2019-importance,
title = "The importance of sharing patient-generated clinical speech and language data",
author = {Fraser, Kathleen C. and
Linz, Nicklas and
Lindsay, Hali and
K{\"o}nig, Alexandra},
editor = "Niederhoffer, Kate and
Hollingshead, Kristy and
Resnik, Philip and
Resnik, Rebecca and
Loveys, Kate",
booktitle = "Proceedings of the Sixth Workshop on Computational Linguistics and Clinical Psychology",
month = jun,
year = "2019",
address = "Minneapolis, Minnesota",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/W19-3007",
doi = "10.18653/v1/W19-3007",
pages = "55--61",
abstract = "Increased access to large datasets has driven progress in NLP. However, most computational studies of clinically-validated, patient-generated speech and language involve very few datapoints, as such data are difficult (and expensive) to collect. In this position paper, we argue that we must find ways to promote data sharing across research groups, in order to build datasets of a more appropriate size for NLP and machine learning analysis. We review the benefits and challenges of sharing clinical language data, and suggest several concrete actions by both clinical and NLP researchers to encourage multi-site and multi-disciplinary data sharing. We also propose the creation of a collaborative data sharing platform, to allow NLP researchers to take a more active responsibility for data transcription, annotation, and curation.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="fraser-etal-2019-importance">
<titleInfo>
<title>The importance of sharing patient-generated clinical speech and language data</title>
</titleInfo>
<name type="personal">
<namePart type="given">Kathleen</namePart>
<namePart type="given">C</namePart>
<namePart type="family">Fraser</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Nicklas</namePart>
<namePart type="family">Linz</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Hali</namePart>
<namePart type="family">Lindsay</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Alexandra</namePart>
<namePart type="family">König</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2019-06</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Sixth Workshop on Computational Linguistics and Clinical Psychology</title>
</titleInfo>
<name type="personal">
<namePart type="given">Kate</namePart>
<namePart type="family">Niederhoffer</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Kristy</namePart>
<namePart type="family">Hollingshead</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Philip</namePart>
<namePart type="family">Resnik</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Rebecca</namePart>
<namePart type="family">Resnik</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Kate</namePart>
<namePart type="family">Loveys</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Minneapolis, Minnesota</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Increased access to large datasets has driven progress in NLP. However, most computational studies of clinically-validated, patient-generated speech and language involve very few datapoints, as such data are difficult (and expensive) to collect. In this position paper, we argue that we must find ways to promote data sharing across research groups, in order to build datasets of a more appropriate size for NLP and machine learning analysis. We review the benefits and challenges of sharing clinical language data, and suggest several concrete actions by both clinical and NLP researchers to encourage multi-site and multi-disciplinary data sharing. We also propose the creation of a collaborative data sharing platform, to allow NLP researchers to take a more active responsibility for data transcription, annotation, and curation.</abstract>
<identifier type="citekey">fraser-etal-2019-importance</identifier>
<identifier type="doi">10.18653/v1/W19-3007</identifier>
<location>
<url>https://aclanthology.org/W19-3007</url>
</location>
<part>
<date>2019-06</date>
<extent unit="page">
<start>55</start>
<end>61</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T The importance of sharing patient-generated clinical speech and language data
%A Fraser, Kathleen C.
%A Linz, Nicklas
%A Lindsay, Hali
%A König, Alexandra
%Y Niederhoffer, Kate
%Y Hollingshead, Kristy
%Y Resnik, Philip
%Y Resnik, Rebecca
%Y Loveys, Kate
%S Proceedings of the Sixth Workshop on Computational Linguistics and Clinical Psychology
%D 2019
%8 June
%I Association for Computational Linguistics
%C Minneapolis, Minnesota
%F fraser-etal-2019-importance
%X Increased access to large datasets has driven progress in NLP. However, most computational studies of clinically-validated, patient-generated speech and language involve very few datapoints, as such data are difficult (and expensive) to collect. In this position paper, we argue that we must find ways to promote data sharing across research groups, in order to build datasets of a more appropriate size for NLP and machine learning analysis. We review the benefits and challenges of sharing clinical language data, and suggest several concrete actions by both clinical and NLP researchers to encourage multi-site and multi-disciplinary data sharing. We also propose the creation of a collaborative data sharing platform, to allow NLP researchers to take a more active responsibility for data transcription, annotation, and curation.
%R 10.18653/v1/W19-3007
%U https://aclanthology.org/W19-3007
%U https://doi.org/10.18653/v1/W19-3007
%P 55-61
Markdown (Informal)
[The importance of sharing patient-generated clinical speech and language data](https://aclanthology.org/W19-3007) (Fraser et al., CLPsych 2019)
ACL