% Conference paper from the MMSys '24 proceedings (ACM) introducing the SoccerSum dataset.
% Typed as inproceedings with the venue in booktitle so that standard styles print it.
% Braced words in title/booktitle keep their capitalisation under sentence-casing styles.
@inproceedings{17718,
  author    = {Sarkhoosh, Mehdi and Gautam, Sushant and Midoglu, Cise and Sabet, Saeed and Torjusen, Thomas and Halvorsen, P{\r a}l},
  title     = {The {SoccerSum} Dataset for Automated Detection, Segmentation, and Tracking of Objects on the Soccer Pitch},
  booktitle = {{MMSys} '24: Proceedings of the 15th {ACM} Multimedia Systems Conference},
  publisher = {Association for Computing Machinery},
  year      = {2024},
  doi       = {10.1145/3625468.3652180},
  abstract  = {This paper introduces SoccerSum, a novel dataset aimed at enhancing object detection and segmentation in video frames depicting the soccer pitch, using footage from the Norwegian Eliteserien league across 2021-2023. With the goal of detecting elements beyond common entities in existing datasets, such as the soccer ball, players and referees, this dataset includes additional annotations for the goal net, corner flag posts, and the penalty mark. SoccerSum also includes the segmentation of key pitch areas such as the penalty and goal boxes for the same frame sequences. Comprising 750 frames annotated with 10 classes for advanced analysis, SoccerSum offers compatibility with existing frameworks, providing a rich dataset for the development of computer vision algorithms. This dataset not only serves as a resource for improving sports analytics, but also introduces a new application for automatic game summarization, enabling the generation of detailed and engaging content for fans and professionals. The SoccerSum dataset is accessible on Zenodo: https://zenodo.org/records/10612084.},
}