% Conference paper (ICST 2011 proceedings). Typed as @inproceedings with the
% venue in `booktitle` so that standard styles actually print it; the citation
% key is unchanged.
@inproceedings{8785,
  author    = {Hemmati, Hadi and Arcuri, Andrea and Briand, Lionel},
  title     = {Empirical Investigation of the Effects of Test Suite Properties on Similarity-Based Test Case Selection},
  booktitle = {4th International Conference on Software Testing, Verification and Validation ({ICST2011})},
  year      = {2011},
  pages     = {327--336},
  publisher = {IEEE Computer Society},
  address   = {Berlin},
  isbn      = {978-1-61284-174-8},
  abstract  = {Our experience with applying model-based testing on industrial systems showed that the generated test suites are often too large and costly to execute given project deadlines and the limited resources for system testing on real platforms. In such industrial contexts, it is often the case that only a small subset of test cases can be run. In previous work, we proposed novel test case selection techniques that minimize the similarities among selected test cases and outperforms other selection alternatives. In this paper, our goal is to gain insights into why and under which conditions similarity-based selection techniques, and in particular our approach, can be expected to work. We investigate the properties of test suites with respect to similarities among fault revealing test cases. We thus identify the ideal situation in which a similarity-based selection works best, which is useful for devising more effective similarity functions. We also address the specific situation in which a test suite contains outliers, that is a small group of very different test cases, and show that it decreases the effectiveness of similarity-based selection. We then propose, and successfully evaluate based on two industrial systems, a solution based on rank scaling to alleviate this problem.},
}