@Book{NAACLHLTDemos:2007, editor = {Bob Carpenter and Amanda Stent and Jason D. Williams}, title ... more @Book{NAACLHLTDemos:2007, editor = {Bob Carpenter and Amanda Stent and Jason D. Williams}, title = {Proceedings of Human Language Technologies: The Annual Conference of the North American Chapter of the Association for Computational Linguistics (NAACL-HLT)}, month = {April}, year = {2007}, address = {Rochester, New York, USA}, publisher = {Association for Computational Linguistics}, url = {http://www.aclweb.org/anthology/N/N07/N07-4} } @InProceedings{allen-EtAl:2007:NAACLHLTDemos, author = {Allen, James and Chambers ...
The main purposes of the current study are to: (a) examine the interactional effects among test-t... more The main purposes of the current study are to: (a) examine the interactional effects among test-takers, tasks, and raters, as well as the main effects of these facets, in an ESL writing test consisting of both integrated and independent writing tasks and (b) thereby identify additional sources of score variability and error in the rating of test-taker responses. A total of 162 test-takers with 29 different L1 backgrounds participated in the study, each of whom took the same six writing tasks, which included 3 Listening-Writing (LW), 2 Reading-Writing (RW), and 1 Independent Writing (IW) tasks. Each of the essays was rated by each of the 6 trained raters to obtain a completely-crossed data matrix for the test-takers, tasks, and raters. A computer program, FACETS (Linacre, 1998), was used to calibrate the test-takers, tasks, and raters and conduct interaction analysis on 970 essays. Results of the analyses revealed that raters seemed to be having slight difficulty in maintaining a con...
Proceedings of Human Language Technologies: The Annual Conference of the North American Chapter of the Association for Computational Linguistics: Demonstrations on XX - NAACL '07, 2007
Abstract: This paper reports the results of generalizability theory (G) analyses done for new wri... more Abstract: This paper reports the results of generalizability theory (G) analyses done for new writing and speaking tasks for the Test of English as a Foreign Language (TOEFL). For writing, a special focus was placed on evaluating the impact on the reliability of the ...
Eighty-three Test of English as a Foreign Language (TOEFL) writing prompts administered via compu... more Eighty-three Test of English as a Foreign Language (TOEFL) writing prompts administered via computer-based testing between July 1998 and August 2000 were examined for differences attributable to the response mode (handwriting or word processing) chosen by examinees. Differences were examined statistically using polytomous logistic regression. A variable measuring English-language ability (ELA) was developed from the multiple-choice components of the TOEFL and used as a matching variable. Although there was little observed difference in mean writing scores, when examinees were matched on ELA, small differences were observed in effect sizes consistently favoring the handwriting response mode. This difference favoring the handwriting response mode occurred for all of the writing prompts analyzed, suggesting a general effect for response mode. Differences for individual writing prompts were small, however.
Diagnostic language assessment (DLA) is gaining a lot of attention from language teachers, tester... more Diagnostic language assessment (DLA) is gaining a lot of attention from language teachers, testers, and applied linguists. With a recent surge of interest in DLA, there seems to be an urgent need to assess where the field of DLA stands at the moment and develop a general sense of where it should be moving in the future. The current article, as the first article in this special issue, aims to provide a general theoretical background for discussion of DLA and address some fundamental issues surrounding DLA. More specifically, the article (a) examines some of the defining characteristics of DLA and its major components, (b) reviews the current state of DLA in conjunction with these components, and (c) identifies some promising areas of future research and development of DLA where important breakthroughs can be made in the future. Some of the major obstacles and challenges facing DLA are identified and discussed, along with some possible solutions to them.
@Book{NAACLHLTDemos:2007, editor = {Bob Carpenter and Amanda Stent and Jason D. Williams}, title ... more @Book{NAACLHLTDemos:2007, editor = {Bob Carpenter and Amanda Stent and Jason D. Williams}, title = {Proceedings of Human Language Technologies: The Annual Conference of the North American Chapter of the Association for Computational Linguistics (NAACL-HLT)}, month = {April}, year = {2007}, address = {Rochester, New York, USA}, publisher = {Association for Computational Linguistics}, url = {http://www.aclweb.org/anthology/N/N07/N07-4} } @InProceedings{allen-EtAl:2007:NAACLHLTDemos, author = {Allen, James and Chambers ...
The main purposes of the current study are to: (a) examine the interactional effects among test-t... more The main purposes of the current study are to: (a) examine the interactional effects among test-takers, tasks, and raters, as well as the main effects of these facets, in an ESL writing test consisting of both integrated and independent writing tasks and (b) thereby identify additional sources of score variability and error in the rating of test-taker responses. A total of 162 test-takers with 29 different L1 backgrounds participated in the study, each of whom took the same six writing tasks, which included 3 Listening-Writing (LW), 2 Reading-Writing (RW), and 1 Independent Writing (IW) tasks. Each of the essays was rated by each of the 6 trained raters to obtain a completely-crossed data matrix for the test-takers, tasks, and raters. A computer program, FACETS (Linacre, 1998), was used to calibrate the test-takers, tasks, and raters and conduct interaction analysis on 970 essays. Results of the analyses revealed that raters seemed to be having slight difficulty in maintaining a con...
Proceedings of Human Language Technologies: The Annual Conference of the North American Chapter of the Association for Computational Linguistics: Demonstrations on XX - NAACL '07, 2007
Abstract: This paper reports the results of generalizability theory (G) analyses done for new wri... more Abstract: This paper reports the results of generalizability theory (G) analyses done for new writing and speaking tasks for the Test of English as a Foreign Language (TOEFL). For writing, a special focus was placed on evaluating the impact on the reliability of the ...
Eighty-three Test of English as a Foreign Language (TOEFL) writing prompts administered via compu... more Eighty-three Test of English as a Foreign Language (TOEFL) writing prompts administered via computer-based testing between July 1998 and August 2000 were examined for differences attributable to the response mode (handwriting or word processing) chosen by examinees. Differences were examined statistically using polytomous logistic regression. A variable measuring English-language ability (ELA) was developed from the multiple-choice components of the TOEFL and used as a matching variable. Although there was little observed difference in mean writing scores, when examinees were matched on ELA, small differences were observed in effect sizes consistently favoring the handwriting response mode. This difference favoring the handwriting response mode occurred for all of the writing prompts analyzed, suggesting a general effect for response mode. Differences for individual writing prompts were small, however.
Diagnostic language assessment (DLA) is gaining a lot of attention from language teachers, tester... more Diagnostic language assessment (DLA) is gaining a lot of attention from language teachers, testers, and applied linguists. With a recent surge of interest in DLA, there seems to be an urgent need to assess where the field of DLA stands at the moment and develop a general sense of where it should be moving in the future. The current article, as the first article in this special issue, aims to provide a general theoretical background for discussion of DLA and address some fundamental issues surrounding DLA. More specifically, the article (a) examines some of the defining characteristics of DLA and its major components, (b) reviews the current state of DLA in conjunction with these components, and (c) identifies some promising areas of future research and development of DLA where important breakthroughs can be made in the future. Some of the major obstacles and challenges facing DLA are identified and discussed, along with some possible solutions to them.
Uploads
Papers by Yong-Won Lee