2017
Phan, Anh Viet; Nguyen, Minh Le; Bui, Lam Thu
Convolutional neural networks over control flow graphs for software defect prediction Inproceedings
In: 2017 IEEE 29th International Conference on Tools with Artificial Intelligence (ICTAI), pp. 45–52, IEEE 2017.
BibTeX | Tags:
@inproceedings{phan2017convolutional,
title = {Convolutional neural networks over control flow graphs for software defect prediction},
author = {Anh Viet Phan and Minh Le Nguyen and Lam Thu Bui},
year = {2017},
date = {2017-01-01},
booktitle = {2017 IEEE 29th International Conference on Tools with Artificial Intelligence (ICTAI)},
pages = {45--52},
organization = {IEEE},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Carvalho, Danilo S; Nguyen, Minh-Le
WIKTDV: Data extraction and vector representation resource for Wiktionary senses Conference
vol. 2017-January, 2017, (cited By 0).
Abstract | Links | BibTeX | Tags:
@conference{Carvalho2017239,
title = {WIKTDV: Data extraction and vector representation resource for Wiktionary senses},
author = {Danilo S Carvalho and Minh-Le Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85043694499&doi=10.1109%2fKSE.2017.8119465&partnerID=40&md5=b849fb4ebc15878e48f4c65e8039b895},
doi = {10.1109/KSE.2017.8119465},
year = {2017},
date = {2017-01-01},
journal = {Proceedings - 2017 9th International Conference on Knowledge and Systems Engineering, KSE 2017},
volume = {2017-January},
pages = {239-244},
abstract = {Effective use of collaborative web resources, such as Wikipedia and Wiktionary, has been a recurrent topic of research in the Natural Language Processing and Information Retrieval communities. The same can be said about the use of vector-based language representations, e.g., word, sentence, document embeddings. However, there is currently a shortage of resources that offer vector representations that can take advantage of the structural properties of web resources. This paper describes a system for extracting information from Wiktionary to a machine-readable format and using this information to obtain vector representations that can be used for semantic similarity computation and basic word sense disambiguation. The methodology used to build the system is also discussed. Experimental evaluation on the semantic similarity task indicate efficiency close to the reference method applied in this work. A web service and visualization facilities complete the set of contributions. © 2017 IEEE.},
note = {cited By 0},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Vo, Quan-Hoang; Nguyen, Huy-Tien; Le, Bac; Nguyen, Minh-Le
Multi-channel LSTM-CNN model for Vietnamese sentiment analysis Conference
vol. 2017-January, 2017, (cited By 45).
Abstract | Links | BibTeX | Tags:
@conference{Vo201724,
title = {Multi-channel LSTM-CNN model for Vietnamese sentiment analysis},
author = {Quan-Hoang Vo and Huy-Tien Nguyen and Bac Le and Minh-Le Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85042233213&doi=10.1109%2fKSE.2017.8119429&partnerID=40&md5=441295949db139c45e50302879d06804},
doi = {10.1109/KSE.2017.8119429},
year = {2017},
date = {2017-01-01},
journal = {Proceedings - 2017 9th International Conference on Knowledge and Systems Engineering, KSE 2017},
volume = {2017-January},
pages = {24-29},
abstract = {Convolutional neural network (CNN) and Long Short Term Memory (LSTM) have shown the state of the art results for sentiment analysis in English corpus. However, there are not many studies of this approach for Vietnamese corpus. In our work, CNN and LSTM are employed to generate information channels for Vietnamese sentiment analysis. Because each deep learning model (e.g. CNN, LSTM) has a particular advantage, this scenario provides a novel and efficient way for integrating the advantages of CNN and LSTM. In addition, we introduced a Vietnamese corpus, which collected comments/reviews from Vietnamese commercial web pages and was annotated by three human annotators. We evaluated our approach on our corpus and VLSP corpus. According to the experimental results, the proposed model outperforms SVM, LSTM, and CNN on the two datasets. © 2017 IEEE.},
note = {cited By 45},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Nguyen, Minh-Tien; Cuong, Tran Viet; Hoai, Nguyen Xuan; Nguyen, Minh-Le
Utilizing user posts to enrich web document summarization with matrix co-factorization Conference
vol. 2017-December, 2017, (cited By 6).
Abstract | Links | BibTeX | Tags:
@conference{Nguyen201770,
title = {Utilizing user posts to enrich web document summarization with matrix co-factorization},
author = {Minh-Tien Nguyen and Tran Viet Cuong and Nguyen Xuan Hoai and Minh-Le Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85041042396&doi=10.1145%2f3155133.3155196&partnerID=40&md5=96422d5dca8d2451a3690813d7c611cc},
doi = {10.1145/3155133.3155196},
year = {2017},
date = {2017-01-01},
journal = {ÄCM International Conference Proceeding Series"},
volume = {2017-December},
pages = {70-77},
abstract = {In the context of social media, users tend to post relevant information corresponding to an event mentioned in a Web document. This paper presents a model to capture the nature of the relationships between sentences and user posts such as relevant comments in sharing hidden topics for enriching summarization. Unlike the previous methods which usually base on hand-crafted features, our approach ranks sentences and comments based on their importance affecting the topics. The sentence-comment relation is formulated in a share topic matrix, which presents their mutual reinforcement support. Our newly proposed matrix co-factorization algorithm computes the score of each sentence and comment and extracts top m ranked sentences and m comments as the summarization. Experimental results on two datasets in English and Vietnamese of the social context summarization task and DUC 2004 confirm the efficiency of our model in summarizing Web documents. © 2017 Association for Computing Machinery.},
note = {cited By 6},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Tran, Van-Khanh; Nguyen, Van-Tao; Shirai, Kiyoaki; Nguyen, Minh-Le
Towards domain adaptation for neural network language generation in dialogue Conference
vol. 2017-January, 2017, (cited By 1).
Abstract | Links | BibTeX | Tags:
@conference{Tran201719,
title = {Towards domain adaptation for neural network language generation in dialogue},
author = {Van-Khanh Tran and Van-Tao Nguyen and Kiyoaki Shirai and Minh-Le Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85043382754&doi=10.1109%2fNAFOSTED.2017.8108032&partnerID=40&md5=0466b2239fad9fa0e460255ae86b8d28},
doi = {10.1109/NAFOSTED.2017.8108032},
year = {2017},
date = {2017-01-01},
journal = {2017 4th NAFOSTED Conference on Information and Computer Science, NICS 2017 - Proceedings},
volume = {2017-January},
pages = {19-24},
abstract = {Extending from limited domain to a new domain is crucial for Natural Language Generation in Dialogue, especially when there are sufficient annotated data in the source domain, but there is little labeled data in the target domain. This paper studies the performance and domain adaptation of two different Neural Network Language Generators in Spoken Dialogue Systems: a gating-based Recurrent Neural Network Generator and an extension of an Attentional Encoder-Decoder Generator. We found in model fine-tuning scenario that by separating slot and value parameterizations, the attention-based generators, in comparison to the gating-based generators, show ability to not only prevent semantic repetition in generated outputs and obtain better performance across all domains, but also adapt faster to a new, unseen domain by leveraging existing data. The empirical results show that the attention-based generator can adapt to an open domain when only a limited amount of target domain data is available. © 2017 IEEE.},
note = {cited By 1},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Nguyen, Huy Thanh; Nguyen, Minh Le
Sentence modeling with deep neural architecture using lexicon and character attention mechanism for sentiment classification Inproceedings
In: Proceedings of the Eighth International Joint Conference on Natural Language Processing (Volume 1: Long Papers), pp. 536–544, 2017.
BibTeX | Tags:
@inproceedings{nguyen2017sentence,
title = {Sentence modeling with deep neural architecture using lexicon and character attention mechanism for sentiment classification},
author = {Huy Thanh Nguyen and Minh Le Nguyen},
year = {2017},
date = {2017-01-01},
booktitle = {Proceedings of the Eighth International Joint Conference on Natural Language Processing (Volume 1: Long Papers)},
pages = {536--544},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Viet, Lai Dac; Sinh, Vu Trong; Minh, Nguyen Le; Satoh, Ken
ConvAMR: Abstract meaning representation parsing for legal document Journal Article
In: ärXiv preprint arXiv:1711.06141", 2017.
BibTeX | Tags:
@article{viet2017convamr,
title = {ConvAMR: Abstract meaning representation parsing for legal document},
author = {Lai Dac Viet and Vu Trong Sinh and Nguyen Le Minh and Ken Satoh},
year = {2017},
date = {2017-01-01},
journal = {ärXiv preprint arXiv:1711.06141"},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Viet, Tran Hong; Vinh, Nguyen Van; Huyen, Vu Thuong; Minh, Nguyen Le
Dependency-based pre-ordering for English-Vietnamese statistical machine translation Journal Article
In: VNU Journal of Science: Computer Science and Communication Engineering, vol. 33, no. 2, 2017.
BibTeX | Tags:
@article{viet2017dependency,
title = {Dependency-based pre-ordering for English-Vietnamese statistical machine translation},
author = {Tran Hong Viet and Nguyen Van Vinh and Vu Thuong Huyen and Nguyen Le Minh},
year = {2017},
date = {2017-01-01},
journal = {VNU Journal of Science: Computer Science and Communication Engineering},
volume = {33},
number = {2},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Lai, Dac-Viet; Son, Nguyen Truong; Minh, Nguyen Le
Deletion-based sentence compression using Bi-enc-dec LSTM Inproceedings
In: International Conference of the Pacific Association for Computational Linguistics, pp. 249–260, Springer, Singapore 2017.
BibTeX | Tags:
@inproceedings{lai2017deletion,
title = {Deletion-based sentence compression using Bi-enc-dec LSTM},
author = {Dac-Viet Lai and Nguyen Truong Son and Nguyen Le Minh},
year = {2017},
date = {2017-01-01},
booktitle = {International Conference of the Pacific Association for Computational Linguistics},
pages = {249--260},
organization = {Springer, Singapore},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Nguyen, Minh-Tien; Tran, Duc-Vu; Tran, Chien-Xuan; Nguyen, Minh-Le
Exploiting User-Generated Content to Enrich Web Document Summarization Journal Article
In: International Journal on Artificial Intelligence Tools, vol. 26, no. 5, 2017, (cited By 3).
Abstract | Links | BibTeX | Tags:
@article{Nguyen2017,
title = {Exploiting User-Generated Content to Enrich Web Document Summarization},
author = {Minh-Tien Nguyen and Duc-Vu Tran and Chien-Xuan Tran and Minh-Le Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85032872652&doi=10.1142%2fS021821301760017X&partnerID=40&md5=7a2aa5b3d0303ac1009b59b75c7114d2},
doi = {10.1142/S021821301760017X},
year = {2017},
date = {2017-01-01},
journal = {International Journal on Artificial Intelligence Tools},
volume = {26},
number = {5},
abstract = {Üser-generated content such as comments or tweets (also called by social information) following a Web document provides additional information for enriching the content of an event mentioned in sentences. This paper presents a framework named SoSVMRank, which integrates the user-generated content of a Web document to generate a highquality summarization. In order to do that, the summarization was formulated as a learning to rank task, in which comments or tweets are exploited to support sentences in a mutual reinforcement fashion. To model sentence-comment (or tweet) relation, a set of local and social features are proposed. After ranking, top m ranked sentences and comments (or tweets) are selected as the summarization. To validate the efficiency of our framework, sentence and story highlight extraction tasks were taken as a case study on three datasets in two languages, English and Vietnamese. Experimental results indicate that: (i) our new features improve the summary performance of the framework in term of ROUGE-scores compared to state-of-The-Art baselines and (ii) the integration of user-generated content benefits single-document summarization. © 2017 World Scientific Publishing Company."},
note = {cited By 3},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Carvalho, Danilo Silva; Nguyen, Minh-Le
Efficient neural-based patent document segmentation with term order probabilities Conference
2017, (cited By 1).
Abstract | Links | BibTeX | Tags:
@conference{Carvalho2017171,
title = {Efficient neural-based patent document segmentation with term order probabilities},
author = {Danilo Silva Carvalho and Minh-Le Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85070734361&partnerID=40&md5=e4947c5caa74b0f7e4b736e07b4651d1},
year = {2017},
date = {2017-01-01},
journal = {ESANN 2017 - Proceedings, 25th European Symposium on Artificial Neural Networks, Computational Intelligence and Machine Learning},
pages = {171-176},
abstract = {The internationally growing trend of patent applications puts great pressure on the agents involved in managing this kind of information and creates a demand for efficient and effective patent analysis methods. This work presents a computationally efficient approach for patent docu- ment segmentation based on structured ANNs and a simple distributional semantics composition method. The conducted experiments indicate effec- tiveness of the approach, which benefits a wide array of patent processing techniques that work upon structured inputs. © ESANN 2017 - Proceedings, 25th European Symposium on Artificial Neural Networks, Computational Intelligence and Machine Learning. All rights reserved.},
note = {cited By 1},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Trieu, Hai-Long; Pham, Trung-Tin; Nguyen, Le-Minh
The JAIST machine translation systems for WMT 17 Conference
2017, (cited By 2).
Abstract | Links | BibTeX | Tags:
@conference{Trieu2017405,
title = {The JAIST machine translation systems for WMT 17},
author = {Hai-Long Trieu and Trung-Tin Pham and Le-Minh Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85080439079&partnerID=40&md5=da84baff5e105a1af2df160a5b65389e},
year = {2017},
date = {2017-01-01},
journal = {WMT 2017 - 2nd Conference on Machine Translation, Proceedings},
pages = {405-409},
abstract = {We describe the JAIST phrase-based machine translation systems that participated in the news translation shared task of the WMT17. In this work, we participated in the Turkish-English translation, in which only a small amount of bilingual training data is available, so that it is an example of the low-resource setting in machine translation. In order to solve the problem, we focus on two strategies: building a bilingual corpus from comparable data and exploiting existing parallel data based on phrase pivot translation. In order to utilize the strategies to enhance machine translation on the low-resource setting most effectively, we introduce a system combining the extracted corpus, the pivot translation, and the direct training data. Experimental results showed that our combined systems significantly improved the baseline models, which were trained on the small bilingual data. © 2017 Association for Computational Linguistics},
note = {cited By 2},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Phan, Anh Viet; Nguyen, Minh Le; Bui, Lam Thu
Feature weighting and SVM parameters optimization based on genetic algorithms for classification problems Journal Article
In: Äpplied Intelligence", vol. 46, no. 2, pp. 455-469, 2017, (cited By 72).
Abstract | Links | BibTeX | Tags:
@article{Phan2017455,
title = {Feature weighting and SVM parameters optimization based on genetic algorithms for classification problems},
author = {Anh Viet Phan and Minh Le Nguyen and Lam Thu Bui},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-84986269058&doi=10.1007%2fs10489-016-0843-6&partnerID=40&md5=6351588a149d8e56f0f07ec92ada6b31},
doi = {10.1007/s10489-016-0843-6},
year = {2017},
date = {2017-01-01},
journal = {Äpplied Intelligence"},
volume = {46},
number = {2},
pages = {455-469},
abstract = {Support Vector Machines (SVMs) are widely known as an efficient supervised learning model for classification problems. However, the success of an SVM classifier depends on the perfect choice of its parameters as well as the structure of the data. Thus, the aim of this research is to simultaneously optimize the parameters and feature weighting in order to increase the strength of SVMs. We propose a novel hybrid model, the combination of genetic algorithms (GAs) and SVMs, for feature weighting and parameter optimization to solve classification problems efficiently. We call it as the GA-SVM model. Our GA is designed with a special direction-based crossover operator. Experiments were conducted on several real-world datasets using the proposed model and Grid Search, a traditional method of searching optimal parameters. The results show that the GA-SVM model achieves significant improvement in the performance of classification on all the datasets in comparison with Grid Search. In terms of accuracy, out method is competitive with some state-of-the-art techniques for feature selection and feature weighting. © 2016, Springer Science+Business Media New York.},
note = {cited By 72},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Tran, Van-Khanh; Nguyen, Le-Minh
2017, (cited By 17).
Abstract | Links | BibTeX | Tags:
@conference{Tran2017231,
title = {Neural-based natural language generation in dialogue using RNN encoder-decoder with semantic aggregation},
author = {Van-Khanh Tran and Le-Minh Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85073185378&partnerID=40&md5=18f08ac1cc06c4bb48f0ce1b2d956c77},
year = {2017},
date = {2017-01-01},
journal = {SIGDIAL 2017 - 18th Annual Meeting of the Special Interest Group on Discourse and Dialogue, Proceedings of the Conference},
pages = {231-240},
abstract = {Natural language generation (NLG) is an important component in spoken dialogue systems. This paper presents a model called Encoder-Aggregator-Decoder which is an extension of an Recurrent Neural Network based Encoder-Decoder architecture. The proposed Semantic Aggregator consists of two components: an Aligner and a Refiner. The Aligner is a conventional attention calculated over the encoded input information, while the Refiner is another attention or gating mechanism stacked over the attentive Aligner in order to further select and aggregate the semantic elements. The proposed model can be jointly trained both text planning and text realization to produce natural language utterances. The model was extensively assessed on four different NLG domains, in which the results showed that the proposed generator consistently outperforms the previous methods on all the NLG domains. © 2017 Association for Computational Linguistics.},
note = {cited By 17},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Tran, Van-Khanh; Nguyen, Le-Minh
Natural language generation for spoken dialogue system using RNN encoder-decoder networks Conference
2017, (cited By 30).
Abstract | Links | BibTeX | Tags:
@conference{Tran2017442,
title = {Natural language generation for spoken dialogue system using RNN encoder-decoder networks},
author = {Van-Khanh Tran and Le-Minh Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85043390374&doi=10.18653%2fv1%2fk17-1044&partnerID=40&md5=e09901b293db8a8cd6a7a479f6a16b44},
doi = {10.18653/v1/k17-1044},
year = {2017},
date = {2017-01-01},
journal = {CoNLL 2017 - 21st Conference on Computational Natural Language Learning, Proceedings},
pages = {442-451},
abstract = {Natural language generation (NLG) is a critical component in a spoken dialogue system. This paper presents a Recurrent Neural Network based Encoder-Decoder architecture, in which an LSTM-based decoder is introduced to select, aggregate semantic elements produced by an attention mechanism over the input elements, and to produce the required utterances. The proposed generator can be jointly trained both sentence planning and surface realization to produce natural language sentences. The proposed model was extensively evaluated on four different NLG datasets. The experimental results showed that the proposed generators not only consistently outperform the previous methods across all the NLG domains but also show an ability to generalize from a new, unseen domain and learn from multi-domain datasets. © 2017 Association for Computational Linguistics.},
note = {cited By 30},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Nguyen, Minh-Tien; Tran, Duc-Vu; Tran, Chien-Xuan; Nguyen, Minh-Le
Summarizing web documents using sequence labeling with user-generated content and third-party sources Journal Article
In: Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), vol. 10260 LNCS, pp. 454-467, 2017, (cited By 3).
Abstract | Links | BibTeX | Tags:
@article{Nguyen2017454,
title = {Summarizing web documents using sequence labeling with user-generated content and third-party sources},
author = {Minh-Tien Nguyen and Duc-Vu Tran and Chien-Xuan Tran and Minh-Le Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85021713301&doi=10.1007%2f978-3-319-59569-6_54&partnerID=40&md5=04ec44eddd5a4eea42b691a9f7e9cac4},
doi = {10.1007/978-3-319-59569-6_54},
year = {2017},
date = {2017-01-01},
journal = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
volume = {10260 LNCS},
pages = {454-467},
abstract = {This paper presents SoCRFSum, a summary model which integrates user-generated content as comments and third-party sources such as relevant articles of a Web document to generate a high-quality summarization. The summarization was formulated as a sequence labeling problem, which exploits the support of external information to model sentences and comments. After modeling, Conditional Random Fields were adopted for sentence selection. SoCRFSum was validated on a dataset collected from Yahoo News. Promising results indicate that by integrating the user-generated and third-party information, our method obtains improvements of ROUGE-scores over state-of-the-art baselines. © Springer International Publishing AG 2017.},
note = {cited By 3},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Trieu, Hai-Long; Iida, Hiroyuki; Bao, Nhien Pham Hoang; Nguyen, Le-Minh
Towards developing dialogue systems with entertaining conversations Conference
vol. 2, 2017, (cited By 2).
Abstract | Links | BibTeX | Tags:
@conference{Trieu2017511,
title = {Towards developing dialogue systems with entertaining conversations},
author = {Hai-Long Trieu and Hiroyuki Iida and Nhien Pham Hoang Bao and Le-Minh Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85065871212&doi=10.5220%2f0006192105110518&partnerID=40&md5=becabde9da82c188038dbcdc76db0291},
doi = {10.5220/0006192105110518},
year = {2017},
date = {2017-01-01},
journal = {ICAART 2017 - Proceedings of the 9th International Conference on Agents and Artificial Intelligence},
volume = {2},
pages = {511-518},
abstract = {This paper explores a novel approach to developing a dialogue system that is able to make entertaining conversations with users. It proposes a method to improve the current goal-driven dialogue systems which support users for specific tasks while satisfying users' goals with entertaining conversations. It then develops a dialogue system in which a set of features are considered to generate entertaining conversations, while reasonably prolonging the original too short dialogue. The game refinement measure is employed for the assessment of attractiveness since the conversations in dialogue systems can be seen as the process by which a player creates shoots or moves to win a game. The dialogues generated by the proposed method are evaluated by human subjects. The results confirm the effectiveness of the proposed method. The present idea can be a promising way to realize dialogue systems with entertaining conversations although further investigations are needed. © 2017 by SCITEPRESS - Science and Technology Publications, Lda.},
note = {cited By 2},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Do, Phong-Khac; Nguyen, Huy-Tien; Tran, Chien-Xuan; Nguyen, Minh-Tien; Nguyen, Minh-Le
Legal question answering using ranking SVM and deep convolutional neural network Journal Article
In: ärXiv preprint arXiv:1703.05320", 2017.
BibTeX | Tags:
@article{do2017legal,
title = {Legal question answering using ranking SVM and deep convolutional neural network},
author = {Phong-Khac Do and Huy-Tien Nguyen and Chien-Xuan Tran and Minh-Tien Nguyen and Minh-Le Nguyen},
year = {2017},
date = {2017-01-01},
journal = {ärXiv preprint arXiv:1703.05320"},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Nguyen, Minh-Tien; Nguyen, Minh-Le
Intra-relation or inter-relation?: Exploiting social information for Web document summarization Journal Article
In: Expert Systems with Applications, vol. 76, pp. 71-84, 2017, (cited By 7).
Abstract | Links | BibTeX | Tags:
@article{Nguyen201771,
title = {Intra-relation or inter-relation?: Exploiting social information for Web document summarization},
author = {Minh-Tien Nguyen and Minh-Le Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85011636014&doi=10.1016%2fj.eswa.2017.01.023&partnerID=40&md5=a9be4e1df6312d315a0416a0a3074e27},
doi = {10.1016/j.eswa.2017.01.023},
year = {2017},
date = {2017-01-01},
journal = {Expert Systems with Applications},
volume = {76},
pages = {71-84},
abstract = {Traditional summarization methods only use the internal information of a Web document while ignoring its social information such as tweets from Twitter, which can provide a perspective viewpoint for readers towards an event. This paper proposes a framework named SoRTESum to take the advantages of social information such as document content reflection to extract summary sentences and social messages. In order to do that, the summarization was formulated in two steps: scoring and ranking. In the scoring step, the score of a sentence or social message is computed by using intra-relation and inter-relation which integrate the support of local and social information in a mutual reinforcement form. To calculate these relations, 16 features are proposed. After scoring, the summarization is generated by selecting top m ranked sentences and social messages. SoRTESum was extensively evaluated on two datasets. Promising results show that: (i) SoRTESum obtains significant improvements of ROUGE-scores over state-of-the-art baselines and competitive results with the learning to rank approach trained by RankBoost and (ii) combining intra-relation and inter-relation benefits single-document summarization. © 2017 Elsevier Ltd},
note = {cited By 7},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Trieu, Hai-Long; Nguyen, Le-Minh
Applying semantic similarity to phrase pivot translation Conference
2017, (cited By 1).
Abstract | Links | BibTeX | Tags:
@conference{Trieu20171043,
title = {Applying semantic similarity to phrase pivot translation},
author = {Hai-Long Trieu and Le-Minh Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85013629392&doi=10.1109%2fICTAI.2016.0157&partnerID=40&md5=25e81914122837a5d160ac3b0900e7fb},
doi = {10.1109/ICTAI.2016.0157},
year = {2017},
date = {2017-01-01},
journal = {Proceedings - 2016 IEEE 28th International Conference on Tools with Artificial Intelligence, ICTAI 2016},
pages = {1043-1047},
abstract = {Pivot methods have shown to be an effective solution to overcome the problem of unavailable large bilingual corpora in statistical machine translation. The representative approach of pivot methods is the phrase pivot translation which is based on common pivot phrases to produce connections between source-pivot and pivot-Target phrase tables. Nevertheless, this approach produces insufficient connections behind the phrase tables because pivot phrases still contain the same meaning even when they are not matched to each other. In this work, we propose applying semantic similarity between pivot phrases to phrase pivot translation. In order to extract similar pivot phrases, we used string similarity measures for phrase similarity, and WordNet and Word2Vec were used for word similarity. The experiments show that using semantic similarity is able to extract more informative phrases, which can support for phrase pivot translation. © 2016 IEEE.},
note = {cited By 1},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Nguyen, Minh-Tien; Tran, Duc-Vu; Tran, Chien-Xuan; Nguyen, Minh-Le
Learning to Summarize Web Documents using Social Information Conference
2017, (cited By 7).
Abstract | Links | BibTeX | Tags:
@conference{Nguyen2017619,
title = {Learning to Summarize Web Documents using Social Information},
author = {Minh-Tien Nguyen and Duc-Vu Tran and Chien-Xuan Tran and Minh-Le Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85013641514&doi=10.1109%2fICTAI.2016.97&partnerID=40&md5=49b63da3bb54f6f38619d4cf95c1bd61},
doi = {10.1109/ICTAI.2016.97},
year = {2017},
date = {2017-01-01},
journal = {Proceedings - 2016 IEEE 28th International Conference on Tools with Artificial Intelligence, ICTAI 2016},
pages = {619-626},
abstract = {This paper presents a method named SoSVMRank, which integrates the social information of a Web document to generate a high-quality summarization. In order to do that, the summarization was formulated as a learning to rank task, in which the order of a sentence or comment was determined by its informative information. The informative information was measured by a set of local and social features in which the social features were exploited to support the local ones when modeling a sentence or comment. To enrich information, new features were also proposed. After ranking, top m ranked sentences and comments were selected as the summarization. Our method was extensively evaluated on two datasets. Promising results indicate that: (1) by using new features, our method achieves improvements in both ROUGE- 1 and ROUGE-2 of the summarization over state-of-The-Art baselines and (2) integrating social information benefits the summarization. © 2016 IEEE.},
note = {cited By 7},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Carvalho, Danilo S; Nguyen, Minh-Tien; Tran, Chien-Xuan; Nguyen, Minh-Le
Lexical-morphological modeling for legal text analysis Journal Article
In: Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), vol. 10091 LNCS, pp. 295-311, 2017, (cited By 0).
Abstract | Links | BibTeX | Tags:
@article{Carvalho2017295,
title = {Lexical-morphological modeling for legal text analysis},
author = {Danilo S Carvalho and Minh-Tien Nguyen and Chien-Xuan Tran and Minh-Le Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85018438156&doi=10.1007%2f978-3-319-50953-2_21&partnerID=40&md5=c24e3545b9a508190fa1254bd09a3c3d},
doi = {10.1007/978-3-319-50953-2_21},
year = {2017},
date = {2017-01-01},
journal = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
volume = {10091 LNCS},
pages = {295-311},
abstract = {In the context of the Competition on Legal Information Extraction/Entailment (COLIEE), we propose a method comprising the necessary steps for finding relevant documents to a legal question and deciding on textual entailment evidence to provide a correct answer. The proposed method is based on the combination of several lexical and morphological characteristics, to build a language model and a set of features for Machine Learning algorithms. We provide a detailed study on the proposed method performance and failure cases, indicating that it is competitive with state-of-the-art approaches on Legal Information Retrieval and Question Answering, while not needing extensive training data nor depending on expert produced knowledge. The proposed method achieved significant results in the competition, indicating a substantial level of adequacy for the tasks addressed. © Springer International Publishing AG 2017.},
note = {cited By 0},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Carvalho, Danilo S; Nguyen, Minh Le; Iida, Hiroyuki
An analysis of majority voting in homogeneous groups for checkers: understanding group performance through unbalance Journal Article
In: Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), vol. 10664 LNCS, pp. 213-223, 2017, (cited By 0).
Abstract | Links | BibTeX | Tags:
@article{Carvalho2017213,
title = {An analysis of majority voting in homogeneous groups for checkers: understanding group performance through unbalance},
author = {Danilo S Carvalho and Minh Le Nguyen and Hiroyuki Iida},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85039419928&doi=10.1007%2f978-3-319-71649-7_18&partnerID=40&md5=260c08c95a73b3441b1bd1e21ab68da2},
doi = {10.1007/978-3-319-71649-7_18},
year = {2017},
date = {2017-01-01},
journal = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
volume = {10664 LNCS},
pages = {213-223},
abstract = {Experimental evidence and theoretical advances over the years have created an academic consensus regarding majority voting systems, namely that, under certain conditions, the group performs better than its components. However, the underlying reason for such conditions, e.g., stochastic independence of agents, is not often explored and may help to improve performance in known setups by changing agent behavior, or find new ways of combining agents to take better advantage of their characteristics. In this work, an investigation is conducted for homogeneous groups of independent agents playing the game of Checkers. The analysis aims to find the relationship between the change in performance caused by majority voting, the group size, and the underlying decision process of each agent, which is mapped to its source of non-determinism. A characteristic unbalance in Checkers, due to an apparent initiative disadvantage, serves as a pivot for the study, from which decisions can be separated into beneficial or detrimental biases. Experimental results indicate that performance changes caused by majority voting may be beneficial or not, and are linked to the game properties and player skill. Additionally, a way of improving agent performance by manipulating its non-determinism source is briefly explored. © Springer International Publishing AG 2017.},
note = {cited By 0},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Phan, Anh Viet; Nguyen, Minh Le; Bui, Lam Thu
SibStCNN and TBCNN + kNN-TED: New models over tree structures for source code classification Journal Article
In: Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), vol. 10585 LNCS, pp. 120-128, 2017, (cited By 1).
Abstract | Links | BibTeX | Tags:
@article{Phan2017120,
title = {SibStCNN and TBCNN + kNN-TED: New models over tree structures for source code classification},
author = {Anh Viet Phan and Minh Le Nguyen and Lam Thu Bui},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85034260728&doi=10.1007%2f978-3-319-68935-7_14&partnerID=40&md5=2ba471a53fcef42241778ae66a7ccf19},
doi = {10.1007/978-3-319-68935-7_14},
year = {2017},
date = {2017-01-01},
journal = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
volume = {10585 LNCS},
pages = {120-128},
abstract = {This paper aims to solve a software engineering problem by applying several approaches to exploit tree representations of programs. Firstly, we propose a new sibling-subtree convolutional neural network (SibStCNN), and combination models of tree-based neural networks and k-Nearest Neighbors (kNN) for source code classification. Secondly, we present a pruning tree technique to reduce data dimension and strengthen classifiers. The experiments show that the proposed models outperform other methods, and the pruning tree leads to not only a substantial reduction in execution time but also an increase in accuracy. © Springer International Publishing AG 2017.},
note = {cited By 1},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Truong, Son Nguyen; Minh, N Le; Satoh, K; Satoshi, T; Shimazu, A
Single and multiple layer BI-LSTMCRF for recognizing requisite and effectuation parts in legal texts Inproceedings
In: Proc. of the 2nd Workshop on Automated Semantic Analysis of Information in Legal Texts, 2017.
BibTeX | Tags:
@inproceedings{truong2017single,
title = {Single and multiple layer BI-LSTMCRF for recognizing requisite and effectuation parts in legal texts},
author = {Son Nguyen Truong and N Le Minh and K Satoh and T Satoshi and A Shimazu},
year = {2017},
date = {2017-01-01},
booktitle = {Proc. of the 2nd Workshop on Automated Semantic Analysis of Information in Legal Texts},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Phan, Anh Viet; Nguyen, Minh Le
Convolutional neural networks on assembly code for predicting software defects Inproceedings
In: 2017 21st Asia Pacific Symposium on Intelligent and Evolutionary Systems (IES), pp. 37–42, IEEE 2017.
BibTeX | Tags:
@inproceedings{phan2017convolutional_2,
title = {Convolutional neural networks on assembly code for predicting software defects},
author = {Anh Viet Phan and Minh Le Nguyen},
year = {2017},
date = {2017-01-01},
booktitle = {2017 21st Asia Pacific Symposium on Intelligent and Evolutionary Systems (IES)},
pages = {37--42},
organization = {IEEE},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Carvalho, Danilo S; Tran, Vu Duc; Tran, Van-Khanh; Nguyen, Le-Minh
Improving legal information retrieval by distributional composition with term order probabilities. Inproceedings
In: COLIEE@ ICAIL, pp. 43–56, 2017.
BibTeX | Tags:
@inproceedings{carvalho2017improving,
title = {Improving legal information retrieval by distributional composition with term order probabilities.},
author = {Danilo S Carvalho and Vu Duc Tran and Van-Khanh Tran and Le-Minh Nguyen},
year = {2017},
date = {2017-01-01},
booktitle = {COLIEE@ ICAIL},
pages = {43--56},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Viet, Lai Dac; Sinh, Vu Trong; Minh, Nguyen Le; Satoh, Ken
ConvAMR: abstract meaning representation parsing for legal document Journal Article
In: ärXiv e-prints", pp. ärXiv–1711", 2017.
BibTeX | Tags:
@article{dac2017convamr,
title = {ConvAMR: abstract meaning representation parsing for legal document},
author = {Lai Dac Viet and Vu Trong Sinh and Nguyen Le Minh and Ken Satoh},
year = {2017},
date = {2017-01-01},
journal = {ärXiv e-prints"},
pages = {ärXiv--1711"},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
2016
Nguyen-Van, Hao; Nguyen, Thang; Quan, Vu; Nguyen, Minh; Pham-Nguyen, Loan
A topology of charging mode control circuit suitable for long-life Li-Ion battery charger Inproceedings
In: 2016 IEEE Sixth International Conference on Communications and Electronics (ICCE), pp. 167–171, IEEE 2016.
BibTeX | Tags:
@inproceedings{nguyen2016topology,
title = {A topology of charging mode control circuit suitable for long-life Li-Ion battery charger},
author = {Hao Nguyen-Van and Thang Nguyen and Vu Quan and Minh Nguyen and Loan Pham-Nguyen},
year = {2016},
date = {2016-01-01},
booktitle = {2016 IEEE Sixth International Conference on Communications and Electronics (ICCE)},
pages = {167--171},
organization = {IEEE},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Carvalho, Danilo S; Tran, Vu Duc; Tran, Khanh Van; Lai, Viet Dac; Nguyen, Minh-Le
Lexical to discourse-level corpus modeling for legal question answering Inproceedings
In: Tenth International Workshop on Juris-Informatics (JURISIN), 2016.
BibTeX | Tags:
@inproceedings{carvalho2016lexical,
title = {Lexical to discourse-level corpus modeling for legal question answering},
author = {Danilo S Carvalho and Vu Duc Tran and Khanh Van Tran and Viet Dac Lai and Minh-Le Nguyen},
year = {2016},
date = {2016-01-01},
booktitle = {Tenth International Workshop on Juris-Informatics (JURISIN)},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Öng, Hong Xuan; Tojo, Satoshi; others",
Reranking CCG parser for Jazz chord sequences Conference
2016, (cited By 0).
Abstract | Links | BibTeX | Tags:
@conference{Ong2016205,
title = {Reranking CCG parser for Jazz chord sequences},
author = {Hong Xuan Öng and Satoshi Tojo and others"},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85007001618&doi=10.1109%2fKSE.2016.7758054&partnerID=40&md5=15f6b3be33d62300181e33237e8d5c41},
doi = {10.1109/KSE.2016.7758054},
year = {2016},
date = {2016-01-01},
journal = {Proceedings - 2016 8th International Conference on Knowledge and Systems Engineering, KSE 2016},
pages = {205-211},
abstract = {When listen to the music, specifically chord progression, each person can have more than one understanding or feeling about what they heard which we call musical intuitions of listeners or human capacity of musical understanding. To disambiguate the chord progression, Granroth-Wilding et al. have employed Probabilistic Combinatory Categorial Grammar (PCCG), and they acquired the recall value of 88.78%, and the precision value of 90.18%. Because this chord progression parser only outputs the one with the highest probability, the correct solution may still reside in the following candidates. In this paper, we use the reranking model to improve the performance of the parser. By selecting a set of simple n-gram features and configuring perceptron algorithm for finding optimizing parameters, we have improved performance of the system by 2.2%, and even 6.57% when we could perfectly pick up correct candidates from 5000-best results. © 2016 IEEE.},
note = {cited By 0},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Trieu, Hai Long; Nguyen, Minh Le; Nguyen, Phuong-Thai
Dealing with out-of-vocabulary problem in sentence alignment using word similarity Conference
2016, (cited By 4).
Abstract | Links | BibTeX | Tags:
@conference{Trieu2016259,
title = {Dealing with out-of-vocabulary problem in sentence alignment using word similarity},
author = {Hai Long Trieu and Minh Le Nguyen and Phuong-Thai Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85015839847&partnerID=40&md5=2a499d26d847621b06076910c8a571f6},
year = {2016},
date = {2016-01-01},
journal = {Proceedings of the 30th Pacific Asia Conference on Language, Information and Computation, PACLIC 2016},
pages = {259-266},
abstract = {Sentence alignment plays an essential role in building bilingual corpora which are valuable resources for many applications like statistical machine translation. In various approaches of sentence alignment, length-and-word-based methods which are based on sentence length and word correspondences have been shown to be the most effective. Nevertheless a drawback of using bilingual dictionaries trained by IBM Models in length-and-word-based methods is the problem of out-of-vocabulary (OOV). We propose using word similarity learned from monolingual corpora to overcome the problem. Experimental results showed that our method can reduce the OOV ratio and achieve a better performance than some other lengthand- word-based methods. This implies that using word similarity learned from monolingual data may help to deal with OOV problem in sentence alignment.},
note = {cited By 4},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Nguyen, Minh-Tien; Lai, Dac Viet; Do, Phong-Khac; Tran, Duc-Vu; Nguyen, Minh Le
Vsolscsum: Building a vietnamese sentence-comment dataset for social context summarization Inproceedings
In: Proceedings of the 12th Workshop on Asian Language Resources (ALR12), pp. 38–48, 2016.
BibTeX | Tags:
@inproceedings{nguyen2016vsolscsum,
title = {Vsolscsum: Building a vietnamese sentence-comment dataset for social context summarization},
author = {Minh-Tien Nguyen and Dac Viet Lai and Phong-Khac Do and Duc-Vu Tran and Minh Le Nguyen},
year = {2016},
date = {2016-01-01},
booktitle = {Proceedings of the 12th Workshop on Asian Language Resources (ALR12)},
pages = {38--48},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Son, Nguyen Truong; Quoc, Ho Bao; Shimazu, Akira; others,
Recognizing logical parts in legal texts using neural architectures Conference
2016, (cited By 3).
Abstract | Links | BibTeX | Tags:
@conference{Son2016252,
title = {Recognizing logical parts in legal texts using neural architectures},
author = {Nguyen Truong Son and Ho Bao Quoc and Akira Shimazu and others},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85006967216&doi=10.1109%2fKSE.2016.7758062&partnerID=40&md5=d1263aa95fbb64ee235de5b982b05b89},
doi = {10.1109/KSE.2016.7758062},
year = {2016},
date = {2016-01-01},
journal = {Proceedings - 2016 8th International Conference on Knowledge and Systems Engineering, KSE 2016},
pages = {252-257},
abstract = {This paper proposes neural networks approaches to recognize logical parts in Vietnamese legal documents. We utilize four models based on recurrent neural networks including Long Short Term Memory (LSTM), Bidirectional LSTM and their combination with Conditional Random Fields. The experimental results on the Vietnamese Business Law data set shows the promising of this approach. Although, these approaches don't use any engineering features like traditional approaches, they can produce the state-of-the-art performance. © 2016 IEEE.},
note = {cited By 3},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Le, Tung; Nguyen, Le-Minh; Shimazu, Akira; Dien, Dinh
Phrase-based compressive summarization for English-Vietnamese Journal Article
In: Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), vol. 9978 LNAI, pp. 331-342, 2016, (cited By 1).
Abstract | Links | BibTeX | Tags:
@article{Le2016331,
title = {Phrase-based compressive summarization for English-Vietnamese},
author = {Tung Le and Le-Minh Nguyen and Akira Shimazu and Dinh Dien},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85006062708&doi=10.1007%2f978-3-319-49046-5_28&partnerID=40&md5=172c7911cf31fb56783e97cf2374caec},
doi = {10.1007/978-3-319-49046-5_28},
year = {2016},
date = {2016-01-01},
journal = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
volume = {9978 LNAI},
pages = {331-342},
abstract = {Cross-language summarization is the novel topic which is extremely practical and necessary for capturing, tracing, and retrieving the huge data. Especially, for many low-resource languages as Vietnamese, Chinese,…, there are not any previous works to solve this problem as well as datasets. Therefore we propose to apply Phrase based Compressive Summarization for English-Vietnamese. This model takes advantages of the relation between translation and summarization phases to overcome the popular drawback in most antecedent researches. Besides, the bilingual corpus for English-Vietnamese summarization built manually on the dataset is extremely helpful for a lot of later works. In this dataset, our system achieves approximately 37% in ROUGE-1 score which is equivalent to systems on other language pairs. This significant and encouraging result proves the effectiveness of our approach and the quality of our manual datasets in English-Vietnamese. © Springer International Publishing AG 2016.},
note = {cited By 1},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Nguyen, Xuan-Huy; Nguyen, Le-Minh
Linguistic features and learning to rank methods for shopping advice Journal Article
In: Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), vol. 9978 LNAI, pp. 269-279, 2016, (cited By 1).
Abstract | Links | BibTeX | Tags:
@article{Nguyen2016269,
title = {Linguistic features and learning to rank methods for shopping advice},
author = {Xuan-Huy Nguyen and Le-Minh Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85005991814&doi=10.1007%2f978-3-319-49046-5_23&partnerID=40&md5=c7b5ade8d1aea6e215c7b1cfcdd88c53},
doi = {10.1007/978-3-319-49046-5_23},
year = {2016},
date = {2016-01-01},
journal = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
volume = {9978 LNAI},
pages = {269-279},
abstract = {We present a recommendation system (RS) which helps users in buying products based on summarizing all the customer reviews of product attributes. Our recommendation system extracts users’ opinions for products through a decision tree. Each node of the tree is a question to the users. From each node, our RS gives a ranked list of products which is matches the opinions of users. We explain (a) a learning tree structure, for instance, at each node which questions can be asked; and (b) producing a suitably ranked list at each node. Firstly, we use a topdown strategy to build a decision tree in order to select the best user attributes corresponding to a question which is asked at each node. Secondly, we use a learning-to-rank method to learn a ranked list of products for each node of the tree. In experimentation, we use amazon datasets for computer products. We evaluate our RS by using mean reciprocal rank (MRR). Experimental results show that RankBoost achieves better quality than RankSVM. © Springer International Publishing AG 2016.},
note = {cited By 1},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Nguyen, Minh-Tien; Tran, Chien-Xuan; Tran, Duc-Vu; Nguyen, Minh-Le
SoLSCSum: A linked sentence-comment dataset for social context summarization Conference
vol. 24-28-October-2016, 2016, (cited By 14).
Abstract | Links | BibTeX | Tags:
@conference{Nguyen20162409,
title = {SoLSCSum: A linked sentence-comment dataset for social context summarization},
author = {Minh-Tien Nguyen and Chien-Xuan Tran and Duc-Vu Tran and Minh-Le Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-84996537865&doi=10.1145%2f2983323.2983376&partnerID=40&md5=9d85eaee3c9a9f8463c159d767564ef2},
doi = {10.1145/2983323.2983376},
year = {2016},
date = {2016-01-01},
journal = {International Conference on Information and Knowledge Management, Proceedings},
volume = {24-28-October-2016},
pages = {2409-2412},
abstract = {This paper presents a dataset named SoLSCSum for social context summarization. The dataset includes 157 open-domain articles along with their comments collected from Yahoo News. The articles and their comments were manually annotated by two annota-tors to extract standard summaries. The inter-annotator agreement is 74.5% and Cohen's Kappa is 0.5845. To illustrate the potential use of our dataset, a learning to rank model was trained by using a set of local and cross features. Experimental results demonstrate that: (1) our model trained by Ranking SVM obtains significant improvements from 5.5% to 14.8% of ROUGE-1 over state-of-the-art baselines in document summarization and (2) our dataset can be used to train summary methods such as SVM. © 2016 ACM.},
note = {cited By 14},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Nguyen, Minh-Tien; Phan, Viet-Anh; Nguyen, Truong-Son; Nguyen, Minh-Le
Learning to rank questions for community question answering with ranking SVM Journal Article
In: ärXiv preprint arXiv:1608.04185", 2016.
BibTeX | Tags:
@article{nguyen2016learning,
title = {Learning to rank questions for community question answering with ranking SVM},
author = {Minh-Tien Nguyen and Viet-Anh Phan and Truong-Son Nguyen and Minh-Le Nguyen},
year = {2016},
date = {2016-01-01},
journal = {ärXiv preprint arXiv:1608.04185"},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Nguyen, Minh
SDP-JAIST: a shallow discourse parsing system@ CoNLL 2016 shared task Inproceedings
In: Proceedings of the CoNLL-16 shared task, pp. 143–149, 2016.
BibTeX | Tags:
@inproceedings{nguyen2016sdp,
title = {SDP-JAIST: a shallow discourse parsing system@ CoNLL 2016 shared task},
author = {Minh Nguyen},
year = {2016},
date = {2016-01-01},
booktitle = {Proceedings of the CoNLL-16 shared task},
pages = {143--149},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Tung, Vu Xuan; Minh, Nguyen Le; Hoang, Duc Tam
Semantic Parsing for Vietnamese Question Answering System Conference
2016, (cited By 2).
Abstract | Links | BibTeX | Tags:
@conference{Tung2016332,
title = {Semantic Parsing for Vietnamese Question Answering System},
author = {Vu Xuan Tung and Nguyen Le Minh and Duc Tam Hoang},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-84964706599&doi=10.1109%2fKSE.2015.42&partnerID=40&md5=3d3887c3a2df39a82a935095f0c9cac3},
doi = {10.1109/KSE.2015.42},
year = {2016},
date = {2016-01-01},
journal = {Proceedings - 2015 IEEE International Conference on Knowledge and Systems Engineering, KSE 2015},
pages = {332-335},
abstract = {Based on a framework for English, we developed a Vietnamese Question Answering System. The learning paradigm in the framework reduces the burden of providing supervision during semantic parsing. Whilst taking the advantages from this mechanism, we further create our own feature calculation which is suitable for Vietnamese. A method of dynamic learning for feature computation is also presented in this work. © 2015 IEEE.},
note = {cited By 2},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Tran, Hong Viet; Nguyen, Van Vinh; Nguyen, Le Minh
Improving english-vietnamese statistical machine translation using preprocessing dependency syntactic Journal Article
In: 2016.
BibTeX | Tags:
@article{tran2016improving,
title = {Improving english-vietnamese statistical machine translation using preprocessing dependency syntactic},
author = {Hong Viet Tran and Van Vinh Nguyen and Le Minh Nguyen},
year = {2016},
date = {2016-01-01},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Nguyen, Minh-Tien; Nguyen, Minh-Le
SoRTESum: A social context framework for single-document summarization Journal Article
In: Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), vol. 9626, pp. 3-14, 2016, (cited By 15).
Abstract | Links | BibTeX | Tags:
@article{Nguyen20163,
title = {SoRTESum: A social context framework for single-document summarization},
author = {Minh-Tien Nguyen and Minh-Le Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-84962524395&doi=10.1007%2f978-3-319-30671-1_1&partnerID=40&md5=3e61997c6953d21d468f1188e06de8d8},
doi = {10.1007/978-3-319-30671-1_1},
year = {2016},
date = {2016-01-01},
journal = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
volume = {9626},
pages = {3-14},
abstract = {The combination of web document contents, sentences and users’ comments from social networks provides a viewpoint of a web document towards a special event. This paper proposes a framework named SoRTESum to take advantage of information from Twitter viz. Diversity and reflection of document content to generate high-quality summaries by a novel sentence similarity measurement. The framework first formulates sentences and tweets by recognizing textual entailment (RTE) relation to incorporate social information. Next, they are modeled in a Dual Wing Entailment Graph, which captures the entailment relation to calculate the sentence similarity based on mutual reinforcement information. Finally, important sentences and representative tweets are selected by a ranking algorithm. By incorporating social information, SoRTESum obtained improvements over state-of-the-art unsupervised baselines e.g., Random, SentenceLead, LexRank of 0.51 %-8.8% of ROUGE-1 and comparable results with strong supervised methods e.g., L2R and CrossL2R trained by RankBoost for single-document summarization. © Springer International Publishing Switzerland 2016.},
note = {cited By 15},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Ittoo, Ashwin; Nguyen, Le Min; Bosch, Antal
Editorial: Special issue on natural language processing and text analytics in industry Journal Article
In: Computers in Industry, vol. 78, pp. 1-2, 2016, (cited By 1).
@article{Ittoo20161,
title = {Editorial: Special issue on natural language processing and text analytics in industry},
author = {Ashwin Ittoo and Le Min Nguyen and Antal Bosch},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-84957388513&doi=10.1016%2fj.compind.2016.01.001&partnerID=40&md5=a3b63512b641693d67a70d5d611445fe},
doi = {10.1016/j.compind.2016.01.001},
year = {2016},
date = {2016-01-01},
journal = {Computers in Industry},
volume = {78},
pages = {1-2},
note = {cited By 1},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Hoang, Duc Tam; Nguyen, Minh Le; Pham, Son Bao
L2S: Transforming Natural Language Questions into SQL Queries Conference
2016, (cited By 1).
Abstract | Links | BibTeX | Tags:
@conference{Hoang201685,
title = {L2S: Transforming Natural Language Questions into SQL Queries},
author = {Duc Tam Hoang and Minh Le Nguyen and Son Bao Pham},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-84964788492&doi=10.1109%2fKSE.2015.38&partnerID=40&md5=c898c4461dc5e529db8cd2fefe5fd535},
doi = {10.1109/KSE.2015.38},
year = {2016},
date = {2016-01-01},
journal = {Proceedings - 2015 IEEE International Conference on Knowledge and Systems Engineering, KSE 2015},
pages = {85-90},
abstract = {The reliability of a question answering system is bounded by the availability of resources and linguistic tools. In this paper, we introduce a hybrid approach to transforming natural language questions into structured queries. It alleviates the lack of experts in domain observation and the deficient performance of linguistic tools. Specifically, we exploit the semantic information for mapping natural language terminologies to structured query and bipartite graph model for the matching phase. Experimental results on the Vietnam national university entrance exam dataset and the Geoqueries880 dataset achieve accuracies of 91.14% and 87.55%, respectively. © 2015 IEEE.},
note = {cited By 1},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Nguyen, Minh-Tien; Ha, Quang-Thuy; Nguyen, Thi-Dung; Nguyen, Tri-Thanh; Nguyen, Le-Minh
Recognizing Textual Entailment in Vietnamese Text: An Experimental Study Conference
2016, (cited By 7).
Abstract | Links | BibTeX | Tags:
@conference{Nguyen2016108,
title = {Recognizing Textual Entailment in Vietnamese Text: An Experimental Study},
author = {Minh-Tien Nguyen and Quang-Thuy Ha and Thi-Dung Nguyen and Tri-Thanh Nguyen and Le-Minh Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-84964725492&doi=10.1109%2fKSE.2015.23&partnerID=40&md5=d17bf859f8ed15798dcc1304327b343a},
doi = {10.1109/KSE.2015.23},
year = {2016},
date = {2016-01-01},
journal = {Proceedings - 2015 IEEE International Conference on Knowledge and Systems Engineering, KSE 2015},
pages = {108-113},
abstract = {This paper proposes a model which utilizes Support Vector Machines (SVMs) - a machine learning approach for recognizing textual entailment in Vietnamese text, including three steps: (1) feature extraction, (2) training and (3) judgement by voting. In the first step, many features (e.g., Euclidean distance, Cosine, if-idf, etc) were extracted to train three classification models for the second step. The final step judged whether there is an entailment relation between a text and a hypothesis (another text can be plausibly inferred from the original one) or not. To improve the recognition quality, a combination of classifiers was proposed under voting method as human judgement on Vietnamese version of RTE-3. By using voting, our approach obtained significant improvements (from 1.2% to 9.4% of F-score) in comparison with baselines and ensemble methods, e.g. AdaBoost and Bagging. © 2015 IEEE.},
note = {cited By 7},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Gao, K; Knight, J; Le, T; Do, D; James, A; Green, T; Dickinson, A; Nguyen, M; Kangas, L; Tolentino, J; others,
Performance of the Aptimatextregistered HBV Quant assay on the fully automated Panthertextregistered system Journal Article
In: Journal of Clinical Virology, no. 82, pp. S24, 2016.
BibTeX | Tags:
@article{gao2016performance,
title = {Performance of the Aptimatextregistered HBV Quant assay on the fully automated Panthertextregistered system},
author = {K Gao and J Knight and T Le and D Do and A James and T Green and A Dickinson and M Nguyen and L Kangas and J Tolentino and others},
year = {2016},
date = {2016-01-01},
journal = {Journal of Clinical Virology},
number = {82},
pages = {S24},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Vo, Trung Thien; Le, Bac; Nguyen, Minh Le
Scoring explanatoriness of a sentence and ranking for explanatory opinion summary Journal Article
In: Studies in Computational Intelligence, vol. 642, pp. 277-286, 2016, (cited By 0).
Abstract | Links | BibTeX | Tags:
@article{Vo2016277,
title = {Scoring explanatoriness of a sentence and ranking for explanatory opinion summary},
author = {Trung Thien Vo and Bac Le and Minh Le Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-84966549066&doi=10.1007%2f978-3-319-31277-4_24&partnerID=40&md5=559cce9534700f4cb8a6eec6f8536528},
doi = {10.1007/978-3-319-31277-4_24},
year = {2016},
date = {2016-01-01},
journal = {Studies in Computational Intelligence},
volume = {642},
pages = {277-286},
abstract = {Ön the online reviews, one of the important types of information is the sentiment explanation which expresses a content users generated. Sentiment explanation is a sentence that expresses detailed reason of sentiment (i.e., “explanatoriness”) and plays an important role in opinion summarization. In this paper, we propose and study a method for scoring the explanatoriness of a sentence. A first method is to adapt an existing method and a second method based on a probabilistic model. Experimental results show that the proposed methods are effective, presenting a better value for a state of the art sentence ranking method for standard text summarization. © Springer International Publishing Switzerland 2016."},
note = {cited By 0},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Nguyen, TS; Nguyen, LM; Tran, XC
Vietnamese named entity recognition at vlsp 2016 evaluation campaign Inproceedings
In: Proceedings of the fourth international workshop on vietnamese language and speech processing, 2016.
BibTeX | Tags:
@inproceedings{nguyen2016vietnamese,
title = {Vietnamese named entity recognition at vlsp 2016 evaluation campaign},
author = {TS Nguyen and LM Nguyen and XC Tran},
year = {2016},
date = {2016-01-01},
booktitle = {Proceedings of the fourth international workshop on vietnamese language and speech processing},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Phan, Viet Anh; Chau, Ngoc Phuong; Nguyen, Minh Le
Exploiting tree structures for classifying programs by functionalities Conference
2016, (cited By 5).
Abstract | Links | BibTeX | Tags:
@conference{Phan201685,
title = {Exploiting tree structures for classifying programs by functionalities},
author = {Viet Anh Phan and Ngoc Phuong Chau and Minh Le Nguyen},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85006974296&doi=10.1109%2fKSE.2016.7758034&partnerID=40&md5=dccdafb1810db4ea6a2ef5384d0b1d6a},
doi = {10.1109/KSE.2016.7758034},
year = {2016},
date = {2016-01-01},
journal = {Proceedings - 2016 8th International Conference on Knowledge and Systems Engineering, KSE 2016},
pages = {85-90},
abstract = {Änalyzing source code to solve software engineering problems such as fault prediction, cost, and effort estimation always receives attention of researchers as well as companies. The traditional approaches are based on machine learning, and software metrics obtained by computing standard measures of software projects. However, these methods have faced many challenges due to limitations of using software metrics which were not enough to capture the complexity of programs. The aim of this paper is to apply several natural language processing techniques, which deal with software engineering problems by exploring information of programs' abstract syntax trees (ASTs) instead of software metrics. To speed up computational time, we propose a pruning tree technique to eliminate redundant branches of ASTs. In addition, the k-Nearest Neighbor (kNN) algorithm was adopted to compare with other methods whereby the distance between programs is measured by using the tree edit distance (TED) and the Levenshtein distance. These algorithms are evaluated based on the performance of solving 104-label program classification problem. The experiments show that due to the use of appropriate data structures although kNN is a simple machine learning algorithm, the classifiers achieve the promising results. © 2016 IEEE."},
note = {cited By 5},
keywords = {},
pubstate = {published},
tppubtype = {conference}
}
Le, Tho Thi Ngoc; Nguyen, Minh Le; Shimazu, Akira
Unsupervised keyphrase extraction: Introducing new kinds of words to keyphrases Journal Article
In: Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), vol. 9992 LNAI, pp. 665-671, 2016, (cited By 30).
Abstract | Links | BibTeX | Tags:
@article{Le2016665,
title = {Unsupervised keyphrase extraction: Introducing new kinds of words to keyphrases},
author = {Tho Thi Ngoc Le and Minh Le Nguyen and Akira Shimazu},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85007256363&doi=10.1007%2f978-3-319-50127-7_58&partnerID=40&md5=0b43d476c5f8ac83ee7d8a1eaef46fea},
doi = {10.1007/978-3-319-50127-7_58},
year = {2016},
date = {2016-01-01},
journal = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
volume = {9992 LNAI},
pages = {665-671},
abstract = {Current studies often extract keyphrases by collecting adjacent important adjectives and nouns. However, the statistics on four public corpora shows that about 15% of keyphrases contain other kinds of words. Even so, incorporating such kinds of words to the noun phrase patterns is not a solution to improve the extraction performance. In this work, we propose a solution to improve the extraction performance by involving new kinds of words to keyphrases. We have experimented on four public corpora to demonstrate that our proposal improve the performance of keyphrase extraction and new kinds of words are introduced to keyphrases. In addition, our proposal is also superior to the current unsupervised keyphrase extraction approaches. © Springer International Publishing AG 2016.},
note = {cited By 30},
keywords = {},
pubstate = {published},
tppubtype = {article}
}