% Conference paper from EJC 2005 (see the note field), published in 2006 in the
% "Frontiers in Artificial Intelligence and Applications" series.
% The system name in the title is spelled as in the abstract (X-Tec) and is
% brace-protected so that styles applying sentence casing keep its capitals.
% Names use the "Last, First" form so that parsing never depends on word case.
@inproceedings{466f4ff022a04fa18c3fef008fb4edb2,
  author    = {Tokuda, Takehiro and Soyama, Yusuke and Suzuki, Tetsuya},
  title     = {A computer science text corpus/search engine {X-Tec} and its applications},
  booktitle = {Information Modelling and Knowledge Bases XVII},
  editor    = {Kiyoki, Yasushi and Henno, Jaak and Jaakkola, Hannu and Kangassalo, Hannu},
  series    = {Frontiers in Artificial Intelligence and Applications},
  publisher = {IOS Press BV},
  year      = {2006},
  pages     = {253--259},
  language  = {English},
  note      = {Publisher Copyright: {\textcopyright} 2006 The authors. All rights reserved.; 15th European-Japanese Conference on Information Modelling and Knowledge Bases, EJC 2005 ; Conference date: 16-05-2005 Through 20-05-2005},
  abstract  = {We built a computer science text corpus/search engine called X-Tec. We automatically collected 2.98 million sentences (68.9 million words) from carefully chosen English computer science documents on the Web using 678 hours. We also built an interactive sample sentence query system and an automatic expression diagnostic system for graduate students. Our computer science text corpus/search engine can be also used for knowledge search and word co-occurrence frequency retrieval.},
}