# jemdoc: menu{MENU}{pubs_icsc2011.html}, showsource = SBA-term: Sparse Bilingual Association for Terms - *Download:* [Pubs/icsc2011.pdf .pdf] - *Authors:* Xinyu Dai and Jinzhu Jia and Laurent El Ghaoui and Bin Yu. - *Status:* Accepted for publication in /Proc. [http://www.ieee-icsc.org/ICSC2011/ Fifth IEEE International Conference on Semantic Computing]/, September 2011. - *Abstract:* Bilingual semantic term association is very useful in cross-language information retrieval, statistical machine translation, and many other applications in natural language processing. In this paper, we present a method, named SBA-term, which applies sparse linear regression (Lasso, Least Squares with $l_1$ penalty) and $l^{2}$ rescaling for design matrix to the task of bilingual term association. The approach hinges on formulating the task as a feature selection problem within a classification framework. Our experimental results indicate that our novel proposed method is more efficient than co-occurrence at extracting relevant bilingual terms semantic associations. In addition, our approach connects the vibrant area of sparse machine learning to an important problem of natural language processing. #- *Related links:* - *Bibtex reference:* ~~~ {}{} @inproceedings{DJEB:11, Author = {X. Dai and J. Jia and L. {El Ghaoui} and B. Yu}, Title = {{SBA}-term: Sparse Bilingual Association for Terms}, BookTitle = {Fifth IEEE International Conference on Semantic Computing}, Address= {Palo Alto, CA, USA}, Month = sep, Year = {2011} } ~~~