% Conference paper from ICADL 2011, published in the Lecture Notes in Computer Science series.
% The citation key is kept unchanged so that existing citations of this entry still resolve.
% Author names use the "Last, First" form; the series name is given without the exporter's
% subseries parenthetical; langid carries the US-English variant for hyphenation.
@inproceedings{304c1dde298e4abe93a15756d0b64fde,
  author    = {Leroy, Gondy and Endicott, James E.},
  title     = {Term familiarity to indicate perceived and actual difficulty of text in medical digital libraries},
  booktitle = {Digital Libraries},
  series    = {Lecture Notes in Computer Science},
  pages     = {307--310},
  year      = {2011},
  doi       = {10.1007/978-3-642-24826-9_38},
  isbn      = {9783642248252},
  language  = {english},
  langid    = {american},
  note      = {13th International Conference on Asia-Pacific Digital Libraries, ICADL 2011, 24--27 October 2011},
  keywords  = {Actual Difficulty, Health Informatics, Lexical Tags, Meta Information, Natural Language Processing, Perceived Difficulty},
  abstract  = {With increasing text digitization, digital libraries can personalize materials for individuals with different education levels and language skills. To this end, documents need meta-information describing their difficulty level. Previous attempts at such labeling used readability formulas but the formulas have not been validated with modern texts and their outcome is seldom associated with actual difficulty. We focus on medical texts and are developing new, evidence-based meta-tags that are associated with perceived and actual text difficulty. This work describes a first tag, 'term familiarity', which is based on term frequency in the Google corpus. We evaluated its feasibility to serve as a tag by looking at a document corpus (N=1,073) and found that terms in blogs or journal articles displayed unexpected but significantly different scores. Term familiarity was then applied to texts and results from a previous user study (N=86) and could better explain differences for perceived and actual difficulty.},
}