@inproceedings{3ba91fd08e874fb5a3ebe89ec467c8a8,
title = "Algorithms and estimators for accurate summarization of internet traffic",
abstract = "Statistical summaries of traffic in IP networks are at the heart of network operation and are used to recover information on arbitrary subpopulations of flows. It is therefore of great importance to collect the most accurate and informative summaries given the router's resource constraints. Cisco's sampled NetFlow, based on aggregating a sampled packet stream into flows, is the most widely deployed such system. We observe two sources of inefficiency in current methods. Firstly, a single parameter (the sampling rate) is used to control utilization of both memory and processing/access speed, which means that it has to be set according to the bottleneck resource. Secondly, the unbiased estimators are applicable to summaries that in effect are collected through uneven use of resources during the measurement period (information from the earlier part of the measurement period is either not collected at all and fewer counter are utilized or discarded when performing a sampling rate adaptation). We develop algorithms that collect more informative summaries through an even and more efficient use of available resources. The heart of our approach is a novel derivation of unbiased estimators that use these more informative counts. We show how to efficiently compute these estimators and prove analytically that they are superior (have smaller variance on all packet streams and subpopulations) to previous approaches. Simulations on Pareto distributions and IP flow data show that the new summaries provide significantly more accurate estimates. We provide an implementation design that can be efficiently deployed at routers.",
keywords = "Data streams, IP flows, NetFlow, Network management, Sketches, Subpopulation queries",
author = "Edith Cohen and Nick Duffield and Haim Kaplan and Carsten Lund and Mikkel Thorup",
year = "2007",
doi = "10.1145/1298306.1298344",
language = "אנגלית",
isbn = "9781595939081",
series = "Proceedings of the ACM SIGCOMM Internet Measurement Conference, IMC",
pages = "265--278",
booktitle = "IMC'07",
note = "null ; Conference date: 24-10-2007 Through 26-10-2007",
}