@inproceedings{kakarla2024diffy, author = {Kakarla, Siva Kesava Reddy and Yan, Francis Y. and Beckett, Ryan}, title = {Diffy: Data-Driven Bug Finding for Configurations}, booktitle = {ACM SIGPLAN Conference on Programming Language Design and Implementation (PLDI ’24)}, year = {2024}, month = {June}, abstract = {Configuration errors remain a major cause of system failures and service outages. One promising approach to identify configuration errors automatically is to learn common usage patterns (and anti-patterns) using data-driven methods. However, existing data-driven learning approaches analyze only simple configurations (e.g., those with no hierarchical structure), identify only simple types of issues (e.g., type errors), or require extensive domain-specific tuning. In this paper, we present Diffy, the first push-button configuration analyzer that detects likely bugs in structured configurations. From example configurations, Diffy learns a common template, with “holes” that capture their variation. It then applies unsupervised learning to identify anomalous template parameters as likely bugs. We evaluate Diffy on a large cloud provider’s wide-area network, an operational 5G network testbed, and MySQL configurations, demonstrating its versatility, performance, and accuracy. During Diffy’s development, it caught and prevented a bug in a configuration timer value that had previously caused an outage for the cloud provider.}, url = {http://approjects.co.za/?big=en-us/research/publication/diffy-data-driven-bug-finding-for-configurations/}, }