% Conference paper in the IEEE Big Data 2017 proceedings.
% year/month/day hold 2018-01-12 (presumably the publication date - confirm);
% the conference dates themselves are recorded in the note field.
@inproceedings{7c9f023d25684ddea3a97b40936f2b6f,
title = "Combining pattern matching with word embeddings for the extraction of experimental variables from scientific literature",
abstract = "Scientists frequently use experiments published in other articles or reports by governing entities (e.g. NIH) as templates for reporting on their own experiments. Those templates occasionally change to reflect new discoveries. For creating retrospective studies and meta-analyses, finding the template parameters associated with scientific results can be critical. To aid in the extraction of experimental parameters (e.g. animal housing temperature) in a corpus of ∼8M scientific reports, we used a combination of pattern matching, part of speech tagging, units and measures extraction, and machine learning. We describe a use case where the housing temperature used for experiments involving mice was shown to impact their response to tumor reduction drugs. We show that 1) combining deep learning and pattern matching is a good model to address the problem described and 2) that researcher's behavior and experimental template usage takes a while to change after the publication of an important discovery.",
keywords = "biomedical, machine learning, neural networks, pattern matching, regular expressions, Spark, units and measures",
author = "Deus, {Helena F.} and Harper, Corey and McBeath, Darin and Daniel, Ron",
year = "2018",
month = jan,
day = "12",
doi = "10.1109/BigData.2017.8258456",
language = "English",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "4287--4292",
editor = "Obradovic, Zoran and Baeza-Yates, Ricardo and Kepner, Jeremy and Nambiar, Raghunath and Wang, Chonggang and Toyoda, Masashi and Suzumura, Toyotaro and Hu, Xiaohua and Cuzzocrea, Alfredo and Tang, Jian and Zang, Hui and Nie, Jian-Yun and Ghosh, Rumi",
booktitle = "Proceedings - 2017 IEEE International Conference on Big Data, Big Data 2017",
note = "5th IEEE International Conference on Big Data, Big Data 2017 ; Conference date: 11-12-2017 Through 14-12-2017",
}