% Conference paper in the NPC 2016 proceedings (Springer, LNCS volume 9966).
% The record carries HAL repository identifiers: HAL_ID, HAL_VERSION and PDF are
% non-standard fields that bibliography styles silently ignore.
% Only acronyms in the titles are brace-protected so styles remain free to recase the rest.
@inproceedings{li:hal-01648006,
  TITLE       = {{DSS}: A Scalable and Efficient Stratified Sampling Algorithm for Large-Scale Datasets},
  AUTHOR      = {Li, Minne and Li, Dongsheng and Shen, Siqi and Zhang, Zhaoning and Lu, Xicheng},
  BOOKTITLE   = {13th {IFIP} International Conference on Network and Parallel Computing ({NPC})},
  EDITOR      = {Gao, Guang R. and Qian, Depei and Gao, Xinbo and Chapman, Barbara and Chen, Wenguang},
  PUBLISHER   = {Springer International Publishing},
  ADDRESS     = {Xi'an, China},
  SERIES      = {Lecture Notes in Computer Science},
  VOLUME      = {9966},
  PAGES       = {133--146},
  YEAR        = {2016},
  MONTH       = oct,
  NOTE        = {Part 5: Data Processing and Big Data},
  DOI         = {10.1007/978-3-319-47099-3_11},
  URL         = {https://inria.hal.science/hal-01648006},
  KEYWORDS    = {Stratified sampling ; Aggregation ; Distributed processing ; Spark},
  PDF         = {https://inria.hal.science/hal-01648006/file/432484_1_En_11_Chapter.pdf},
  HAL_ID      = {hal-01648006},
  HAL_VERSION = {v1},
}