Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
42 changes: 16 additions & 26 deletions joss-paper/paper.bib
Original file line number Diff line number Diff line change
Expand Up @@ -48,7 +48,7 @@ @article{vanArem2025
number={16},
journal={Applied Sciences},
publisher={MDPI AG},
author={van Arem, Koen and Goes-Smit, Floris and Söhl, Jakob},
author={Koen van Arem and Floris Goes-Smit and Jakob Söhl},
year={2025},
month=aug, pages={8916} }

Expand All @@ -72,10 +72,10 @@ @article{Bassek2025

@article{Bauer2023,
abstract = {Choosing the right formation is one of the coach's most important decisions in football. Teams change formation dynamically throughout matches to achieve their immediate objective: to retain possession, progress the ball up-field and create (or prevent) goal-scoring opportunities. In this work we identify the unique formations used by teams in distinct phases of play in a large sample of tracking data. This we achieve in two steps: first, we train a convolutional neural network to decompose each game into non-overlapping segments and classify these segments into phases with an average F 1-score of 0.76. We then measure and contextualize unique formations used in each distinct phase of play. While conventional discussion tends to reduce team formations over an entire match to a single three-digit code (e.g. 4-4-2; 4 defender, 4 midfielder, 2 striker), we provide an objective representation of team formations per phase of play. Using the most frequently occurring phases of play, mid-block, we identify and contextualize six unique formations. A long-term analysis in the German Bundesliga allows us to quantify the efficiency of each formation, and to present a helpful scouting tool to identify how well a coach's preferred playing style is suited to a potential club.},
author = {P Bauer and G Anzer and L Shaw - Journal of sports analytics and undefined 2023},
author = {Pascal Bauer and Gabriel Anzer and Lluke Shaw},
doi = {10.3233/JSA-220620},
issue = {1},
journal = {journals.sagepub.comP Bauer, G Anzer, L ShawJournal of sports analytics, 2023•journals.sagepub.com},
journal = {Journal of sports analytics},
keywords = {Association football,human-in-the-loop machine learning,soccer,sports analytics},
month = {3},
pages = {39-59},
Expand All @@ -99,7 +99,7 @@ @article{Bischofberger2025


@inproceedings{Fernandez2018,
author = {Javier Fernández and F C Barcelona and Javier Fernandez and Luke Bornn},
author = {Javier Fernandez and Luke Bornn},
booktitle = {Sloan Sports Analytics Conference},
title = {Wide Open Spaces: A statistical technique for measuring space creation in professional soccer},
url = {https://www.researchgate.net/publication/324942294_Wide_Open_Spaces_A_statistical_technique_for_measuring_space_creation_in_professional_soccer},
Expand All @@ -124,9 +124,9 @@ @article{Fernandez2021

@article{Forcher2022,
abstract = {Recently, the availability of big amounts of data enables analysts to dive deeper into the constraints of performance in various team sports. While offensive analyses in football have been extensively conducted, the evaluation of defensive performance is underrepresented in this sport. Hence, the aim of this study was to analyze successful defensive playing phases by investigating the space and time characteristics of defensive pressure. Therefore, tracking and event data of 153 games of the German Bundesliga (second half of 2020/21 season) were assessed. Defensive pressure was measured in the last 10 seconds of a defensive playing sequence (time characteristic) and it was distinguished between pressure on the ball-carrier, pressure on the group (5 attackers closest to the ball), and pressure on the whole team (space characteristic). A linear mixed model was applied to evaluate the effect of success of a defensive play (ball gain), space characteristic, and time characteristic on defensive pressure. Defensive pressure is higher in successful defensive plays (14.47 ± 16.82[%]) compared to unsuccessful defensive plays (12.87 ± 15.31[%]). The characteristics show that defensive pressure is higher in areas closer to the ball (space characteristic) and the closer the measurement is to the end of a defensive play (time characteristic), which is especially true for successful defensive plays. Defensive pressure is a valuable key performance indicator for defensive play. Further, this study shows that there is an association between the pressing of the ball-carrier and areas close to the ball with the success of defensive play.},
author = {L Forcher and L Forcher and S Altmann and D Jekauc - Science and Medicine … and undefined 2022},
author = {Leander Forcher and Leon Forcher and Stefan Altmann and Ddarko Jekauc and Matthias Kempe},
doi = {10.1080/24733938.2022.2158213},
journal = {Taylor \& FrancisL Forcher, L Forcher, S Altmann, D Jekauc, M KempeScience and Medicine in Football, 2022•Taylor \& Francis},
journal = {Science and Medicine in Football,},
keywords = {defensive behavior,machine learning,match analysis,performance analysis,team sports},
publisher = {Taylor and Francis Ltd.},
title = {The keys of pressing to gain the ball–Characteristics of defensive pressure in elite soccer using tracking data},
Expand All @@ -135,10 +135,10 @@ @article{Forcher2022
}
@article{Goes2020a,
abstract = {In professional soccer, increasing amounts of data are collected that harness great potential when it comes to analysing tactical behaviour. Unlocking this potential is difficult as big data challenges the data management and analytics methods commonly employed in sports. By joining forces with computer science, solutions to these challenges could be achieved, helping sports science to find new insights, as is happening in other scientific domains. We aim to bring multiple domains together in the context of analysing tactical behaviour in soccer using position tracking data. A systematic literature search for studies employing position tracking data to study tactical behaviour in soccer was conducted in seven electronic databases, resulting in 2338 identified studies and finally the inclusion of 73 papers. Each domain clearly contributes to the analysis of tactical behaviour, albeit in-sometimes radically-different ways. Accordingly, we present a multidisciplinary framework where each domain's contributions to feature construction, modelling and interpretation can be situated. We discuss a set of key challenges concerning the data analytics process, specifically feature construction, spatial and temporal aggregation. Moreover, we discuss how these challenges could be resolved through multidisciplinary collaboration, which is pivotal in unlocking the potential of position tracking data in sports analytics.},
author = {F R Goes and L A Meerhoff and M J O Bueno and D M Rodrigues and F A Moura and M S Brink and M T Elferink-Gemser and A J Knobbe and S A Cunha and R S Torres and K A P M Lemmink},
author = {Floris Goes and L A Meerhoff and M J O Bueno and D M Rodrigues and F A Moura and M S Brink and M T Elferink-Gemser and A J Knobbe and S A Cunha and R S Torres and K A P M Lemmink},
doi = {10.1080/17461391.2020.1747552},
issue = {4},
journal = {Taylor \& FrancisFR Goes, LA Meerhoff, MJO Bueno, DM Rodrigues, FA Moura, MS BrinkEuropean Journal of Sport Science, 2021•Taylor \& Francis},
journal = {European Journal of Sport Science},
keywords = {Football,big data,performance analysis,tactical analysis,team sport},
pages = {481-496},
publisher = {Taylor and Francis Ltd.},
Expand All @@ -149,11 +149,11 @@ @article{Goes2020a
}
@article{Goes2020b,
abstract = {Association football teams can be considered complex dynamical systems of individuals grouped in subgroups (defenders, midfielders and attackers), coordinating their behaviour to achieve a shared g...},
author = {Floris R Goes and Michel S Brink and Marije T Elferink-Gemser and Matthias Kempe and Koen A P M Lemmink},
author = {Floris Goes and Michel Brink and Marije Elferink-Gemser and Matthias Kempe and Koen A P M Lemmink},
doi = {10.1080/02640414.2020.1834689},
issn = {1466447X},
issue = {5},
journal = {https://doi.org/10.1080/02640414.2020.1834689},
journal = {Journal of Sports Sciences},
keywords = {Soccer,Spatiotemporal,machine learning,subgroups,tactics},
pages = {523-532},
pmid = {33106106},
Expand All @@ -168,7 +168,7 @@ @article{Goes2021
author = {Floris Goes and Edgar Schwarz and Marije Elferink-Gemser and Koen Lemmink and Michel Brink},
doi = {10.1080/24733938.2021.1944660},
issue = {3},
journal = {Taylor \& Francis},
journal = {Science and Medicine in Football},
keywords = {football,risk-taking behaviour,spatiotemporal behaviour,tactical behaviour,time-motion analysis},
pages = {372-380},
publisher = {Taylor and Francis Ltd.},
Expand Down Expand Up @@ -199,7 +199,7 @@ @article{Hader2019

@article{Herold2022,
abstract = {This study describes an approach to evaluate the off-ball behaviour of attacking players in association football. The aim was to implement a defensive pressure model to examine an offensive player’s ability to create separation from a defender using 1411 high-intensity off-ball actions including 988 Deep Runs (DRs) DRs and 423 Change of Directions (CODs). Twenty-two official matches (14 competitive matches and 8 friendlies) of the German National Team were included in the research. To validate the effectiveness of the pressure model, each pass (n = 25,418) was evaluated for defensive pressure on the receiver at the moment of the pass and for the pass completion rate (R = −.34, p < .001). Next, after assessing the inter-rater reliability (Fleiss Kappa of 80 for DRs and 78 for CODs), three expert raters annotated all DRs and CODs that met the pre-set criteria. A time-series analysis of each DR and COD was calculated to the nearest 0.1 second, finding a slight increase in pressure from the start to the end of the off-ball actions as defenders re-established proximity to the attacker after separation was created. A linear mixed model using run type (DR or COD) as a fixed effect with the local maximum as a fixed effect on a continuous scale resulted in p < 0.001, d = 4.81, CI = 0.63 to 0.67 for the greatest decrease in pressure, p < 0.001, d = 0.143, CI = 9.18 to 10.61 for length of the longest decrease in pressure, and p < 0.001, d = 1.13, CI = 0.90 to 1.11 for the fastest rate of decrease in pressure. As these values pertain to the local maximum, situations with greater starting pressure on the attacker often led to greater subsequent decreases. Furthermore, there was a significant (p < .0001) difference between offensive and defensive positions and the number of off-ball actions. Results suggest the model can be applied to quantify and visualise the pressure exerted on non-ball-possessing players. This approach can be combined with other methods of match analysis, providing practitioners with new opportunities to measure tactical performance in football.},
author = {Mat Herold and A Hecksteden and D Radke and F Goes and S Nopp and T Meyer and M Kempe},
author = {Mat Herold and Anne Hecksteden and D Radke and F Goes and S Nopp and T Meyer and M Kempe},
doi = {10.1080/02640414.2022.2081405},
issn = {1466447X},
issue = {12},
Expand Down Expand Up @@ -280,7 +280,7 @@ @article{Link2016

@article{Oonk2025a,
abstract = {The field of football (soccer) has seen a recent increase in the utilisation of data, mainly for the analysis of physical and tactical performance. Analysis of tactical performance can be conducted...},
author = {G. A. Oonk and T. J.W. Buurke and K. A.P.M. Lemmink and M. Kempe},
author = {Gerard Alexander Oonk and Tom J.W. Buurke and Koen A.P.M. Lemmink and Matthias Kempe},
doi = {10.1080/02640414.2025.2555117},
issn = {1466447X},
journal = {Journal of Sports Sciences},
Expand All @@ -293,18 +293,8 @@ @article{Oonk2025a
}

@inproceedings{Oonk2025b,
abstract = {Valuable new insights can be obtained by combining tracking and event data in soccer anal-
ysis. However, how to synchronize the two data streams, is rarely discussed. Non systematic
errors in the timestamps, and synchronizing with cost functions result in suboptimal synchro-
nization, which hinders further analysis. Within this proceedings we will introduce a com-
putationally optimized implementation of the Needleman-Wunch algorithm, by using domain
knowledge about the game. The optimized version is over 70 times more efficient in terms of
time constraints and memory usage. On top of that, we show that the properly synchronized
approach translates back to practice with better performing xG models. Taken together, this im-
plementation is a training-free, high-quality synchronization algorithm, with low computational
cost that solves existing issues. On top of that, all data and code used for this proceedings is
fully open-sourced and available in the DataBallPy package.},
author = {G.A. Oonk and D. Grob and M. Kempe},
abstract = {Valuable new insights can be obtained by combining tracking and event data in soccer anal-ysis. However, how to synchronize the two data streams, is rarely discussed. Non systematicerrors in the timestamps, and synchronizing with cost functions result in suboptimal synchronization, which hinders further analysis. Within this proceedings we will introduce a computationally optimized implementation of the Needleman-Wunch algorithm, by using domain knowledge about the game. The optimized version is over 70 times more efficient in terms of time constraints and memory usage. On top of that, we show that the properly synchronized approach translates back to practice with better performing xG models. Taken together, this implementation is a training-free, high-quality synchronization algorithm, with low computationalcost that solves existing issues. On top of that, all data and code used for this proceedings is fully open-sourced and available in the DataBallPy package.},
author = {Gerard Alexander Oonk and Daan Grob and Matthias Kempe},
city = {Luxembourg},
editor = {D. Goossens},
booktitle = {MathSports Conference},
Expand All @@ -322,7 +312,7 @@ @article{Raabe2022
volume = {7},
number = {76},
pages = {4588},
author = {Raabe, Dominik and Biermann, Henrik and Bassek, Manuel and Wohlan, Martin and Komitova, Rumena and Rein, Robert and Groot, Tobias Kuppens and Memmert, Daniel},
author = {Dominik Raabe and Henrik Biermann and Manuel Bassek and Martin Wohlan and Rumena Komitova and Robert Rein and Tobias Kuppens Groot and Daniel Memmert},
title = {floodlight - A high-level, data-driven sports analytics framework},
journal = {Journal of Open Source Software}
}
Expand Down
Loading
Loading