@inproceedings{8fcbdc8b94be4f8c9e99566f06808a10,
title = "Fusing domain-specific data with general data for in-domain applications",
abstract = "This paper analyzes the lexical semantics of domain-specific terms based on various pre-Trained specific domain and general domain word vectors, and addresses the semantic drift between domains. To capture lexical semantics in the specific domain, we propose a bridge mechanism to introduce domain-specific data into general data, and re-Train word vectors. We find that even a small-scale fusion can result in the similar lexical semantics learned by using the large-scale domain-specific dataset. Experiments on sentiment analysis and outlier detection show that application of word embedding by the fusion dataset has the better performance than applications of word embeddings by pure large domain-specific and pure large general datasets. The simple, but effective methodology facilitates the domain adaptation of distributed word representations.",
keywords = "Cross-domain data fusion, Outlier detection, Sentiment analysis",
author = "Yen, {An Zi} and Huang, {Hen Hsen} and Chen, {Hsin Hsi}",
note = "Publisher Copyright: {\textcopyright} 2017 ACM.; 16th IEEE/WIC/ACM International Conference on Web Intelligence, WI 2017 ; Conference date: 23-08-2017 Through 26-08-2017",
year = "2017",
month = aug,
day = "23",
doi = "10.1145/3106426.3106473",
language = "English",
series = "Proceedings - 2017 IEEE/WIC/ACM International Conference on Web Intelligence, WI 2017",
publisher = "Association for Computing Machinery, Inc",
pages = "566--572",
booktitle = "Proceedings - 2017 IEEE/WIC/ACM International Conference on Web Intelligence, WI 2017",
}