% TimeStream conference paper (EuroSys 2013, published by ACM).
% The venue name is recorded in `booktitle`; `month` uses the standard
% three-letter macro so that styles can abbreviate/localize it.
% NOTE(review): the `url` host looks like a rewritten/mirrored address rather
% than the publisher's own site -- confirm the canonical link before relying on it.
@inproceedings{zhou2013timestream,
  author    = {Zhou, Lidong and Yu, Yuan and Zhang, Zheng and Qian, Zhengping},
  title     = {{TimeStream}: Reliable Stream Computation in the Cloud},
  booktitle = {EuroSys 2013},
  year      = {2013},
  month     = apr,
  publisher = {ACM},
  abstract  = {TimeStream is a distributed system designed specifically for low-latency continuous processing of big streaming data on a large cluster of commodity machines. The unique characteristics of this emerging application domain have led to a significantly different design from the popular MapReduce-style batch data processing. In particular, we advocate a powerful new abstraction called resilient substitution that caters to the specific needs in this new computation model to handle failure recovery and dynamic reconfiguration in response to load changes. Several real-world applications running on our prototype have been shown to scale robustly with low latency while at the same time maintaining the simple and concise declarative programming model. TimeStream handles an on-line advertising aggregation pipeline at a rate of 700,000 URLs per second with a 2-second delay, while performing sentiment analysis of Twitter data at a peak rate close to 10,000 tweets per second, with approximately 2-second delay.},
  url       = {http://approjects.co.za/?big=en-us/research/publication/timestream-reliable-stream-computation-in-the-cloud/},
  note      = {Updated version},
}