Research aimed at correcting words in text has focused on three progressively more difficult problems:(1) nonword error detection; (2) isolated-word error correction; and (3) context-dependent work correction. In response to the first problem, efficient pattern-matching and n-gram analysis techniques have been developed for detecting strings that do not appear in a given word list. In response to the second problem, a variety of general and application-specific spelling correction techniques have been developed. Some of them were based on detailed studies of spelling error patterns. In response to the third problem, a few experiments using natural-language-processing tools or statistical-language models have been carried out. This article surveys documented findings on spelling error patterns, provides descriptions of various nonword detection and isolated-word error correction techniques, reviews the state of the art of context-dependent word correction techniques, and discusses research issues related to all three areas of automatic error correction in text.
Description
Technique for automatically correcting words in text
%0 Journal Article
%1 146380
%A Kukich, Karen
%C New York, NY, USA
%D 1992
%I ACM
%J ACM Comput. Surv.
%K edit repair
%N 4
%P 377--439
%R http://doi.acm.org/10.1145/146370.146380
%T Technique for automatically correcting words in text
%U http://portal.acm.org/citation.cfm?doid=146370.146380#
%V 24
%X Research aimed at correcting words in text has focused on three progressively more difficult problems:(1) nonword error detection; (2) isolated-word error correction; and (3) context-dependent work correction. In response to the first problem, efficient pattern-matching and n-gram analysis techniques have been developed for detecting strings that do not appear in a given word list. In response to the second problem, a variety of general and application-specific spelling correction techniques have been developed. Some of them were based on detailed studies of spelling error patterns. In response to the third problem, a few experiments using natural-language-processing tools or statistical-language models have been carried out. This article surveys documented findings on spelling error patterns, provides descriptions of various nonword detection and isolated-word error correction techniques, reviews the state of the art of context-dependent word correction techniques, and discusses research issues related to all three areas of automatic error correction in text.
@article{146380,
abstract = {Research aimed at correcting words in text has focused on three progressively more difficult problems:(1) nonword error detection; (2) isolated-word error correction; and (3) context-dependent work correction. In response to the first problem, efficient pattern-matching and n-gram analysis techniques have been developed for detecting strings that do not appear in a given word list. In response to the second problem, a variety of general and application-specific spelling correction techniques have been developed. Some of them were based on detailed studies of spelling error patterns. In response to the third problem, a few experiments using natural-language-processing tools or statistical-language models have been carried out. This article surveys documented findings on spelling error patterns, provides descriptions of various nonword detection and isolated-word error correction techniques, reviews the state of the art of context-dependent word correction techniques, and discusses research issues related to all three areas of automatic error correction in text.},
added-at = {2008-09-11T22:19:04.000+0200},
address = {New York, NY, USA},
author = {Kukich, Karen},
biburl = {https://www.bibsonomy.org/bibtex/27ce26ebfd4db241729d82d805134788c/ljiang},
description = {Technique for automatically correcting words in text},
doi = {http://doi.acm.org/10.1145/146370.146380},
interhash = {2df02da545e63d953f0b5d5314245816},
intrahash = {7ce26ebfd4db241729d82d805134788c},
issn = {0360-0300},
journal = {ACM Comput. Surv.},
keywords = {edit repair},
number = 4,
pages = {377--439},
publisher = {ACM},
timestamp = {2008-10-11T21:20:35.000+0200},
title = {Technique for automatically correcting words in text},
url = {http://portal.acm.org/citation.cfm?doid=146370.146380#},
volume = 24,
year = 1992
}