% Workshop paper (USENIX HotOS, May 2011). The url field points at the
% publisher-hosted publication page; no DOI is recorded for this entry.
@inproceedings{ananthanarayanan2011disk-locality,
  author    = {Ananthanarayanan, Ganesh and Ghodsi, Ali and Shenker, Scott and Stoica, Ion},
  title     = {Disk-Locality in Datacenter Computing Considered Irrelevant},
  booktitle = {{USENIX} {HotOS}},
  year      = {2011},
  month     = may,
  url       = {https://www.microsoft.com/en-us/research/publication/disk-locality-datacenter-computing-considered-irrelevant/},
  abstract  = {Data center computing is becoming pervasive in many organizations. Computing frameworks such as MapReduce [17], Hadoop [6] and Dryad [25], split jobs into small tasks that are run on the cluster's compute nodes. Through these frameworks, computation can be performed on large datasets in a fault-tolerant way, while hiding the complexities of the distributed nature of the cluster. For these reasons, a considerable work has been done to improve the efficiency of these frameworks.},
}