% Qiu et al. (2020), Journal of Beijing University of Posts and
% Telecommunications 43(2): shuffle partitioning under data skew in Spark.
% The citation key is the exported key with its whitespace removed (a key
% may not contain spaces). The url field keeps the journal landing page
% that the export had placed in the doi field.
@article{QIUXue-song:116,
  author   = {Qiu, Xue-song and Wang, Jia-lu and Wang, Zhi-li and Yan, Yi-fei},
  title    = {A Shuffle Partition Optimization Scheme Based on Data Skew Model in {Spark}},
  journal  = {Journal of Beijing University of Posts and Telecommunications},
  year     = {2020},
  volume   = {43},
  number   = {2},
  pages    = {116--121},
  keywords = {data skew, Spark, shuffle, partitioning algorithm, load balancing},
  doi      = {10.13190/j.jbupt.2019-092},
  url      = {https://journal.bupt.edu.cn/EN/10.13190/j.jbupt.2019-092},
}