@inproceedings{292e5a2093944e9a8d8c03ac9cdd2e9e,
title = "Statistical analysis of large sets of models",
abstract = "Many applications in Model-Driven Engineering involve processing multiple models, e.g. for comparing and merging of model variants into a common domain model. Despite many sophisticated techniques for model comparison, little attention has been given to the initial data analysis and filtering activities. These are hard to ignore especially in the case of a large dataset, possibly with outliers and sub-groupings. We would like to develop a generic approach for model comparison and analysis for large datasets; using techniques from information retrieval, natural language processing and machine learning. We are implementing our approach as an open framework and have so far evaluated it on public datasets involving domain analysis, repository management and model searching scenarios.",
keywords = "Clustering, Model comparison, Model-driven engineering, Vector space model",
author = "{\"O}nder Babur",
year = "2016",
month = aug,
day = "25",
doi = "10.1145/2970276.2975938",
language = "English",
series = "ASE 2016 - Proceedings of the 31st IEEE/ACM International Conference on Automated Software Engineering",
publisher = "Association for Computing Machinery, Inc",
pages = "888--891",
editor = "Sarfraz Khurshid and David Lo and Sven Apel",
booktitle = "ASE 2016 - Proceedings of the 31st IEEE/ACM International Conference on Automated Software Engineering",
note = "31st IEEE/ACM International Conference on Automated Software Engineering, ASE 2016 ; Conference date: 03-09-2016 Through 07-09-2016",
}