<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.0 20120330//EN" "http://jats.nlm.nih.gov/publishing/1.0/JATS-journalpublishing1.dtd">
<article article-type="research-article" dtd-version="1.0" xml:lang="en" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">JSSM</journal-id>
<journal-title-group>
<journal-title>Journal of Sports Science and Medicine</journal-title>
<abbrev-journal-title>J Sports Sci &#x0026; Med</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">1303-2968</issn>
<publisher>
<publisher-name>Uludag University</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.52082/jssm.2023.475</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Research article</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Predicting Injury and Illness with Machine Learning in Elite Youth Soccer: A Comprehensive Monitoring Approach over 3 Months</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Haller</surname><given-names>Nils</given-names></name>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
<xref ref-type="corresp" rid="cor1">&#x2709;</xref>
<bio>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jssm-22-475-g004.tif" mime-subtype="tif"/>
<p><bold>Nils HALLER</bold></p>
<sec>
<title>Employment</title>
<p>Senior Researcher, Department of Sport and Exercise Science, University of Salzburg; Department of Sports Medicine, Rehabilitation and Disease Prevention, University of Mainz, Mainz, Germany</p>
</sec>
<sec>
<title>Degree</title>
<p>PhD</p>
</sec>
<sec>
<title>Research interests</title>
<p>Exercise physiology, Load monitoring, Sports therapy</p>
<p><bold>E-mail:</bold> <email>nhaller@uni-mainz.de</email></p>
</sec>
</bio>
</contrib>
<contrib contrib-type="author">
<name><surname>Kranzinger</surname><given-names>Stefan</given-names></name>
<xref ref-type="aff" rid="aff003"><sup>3</sup></xref>
<bio>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jssm-22-475-g005.tif" mime-subtype="tif"/>
<p><bold>Stefan KRANZINGER</bold></p>
<sec>
<title>Employment</title>
<p>Researcher, Salzburg Research Forschungsgesellschaft m.b.H</p>
</sec>
<sec>
<title>Degree</title>
<p>Mag., MSc., PhD</p>
</sec>
<sec>
<title>Research interests</title>
<p>Human motion analysis, Machine learning, Statistics</p>
<p><bold>E-mail:</bold> <email>stefan.kranzinger@salzburgresearch.at</email></p>
</sec>
</bio>
</contrib>
<contrib contrib-type="author">
<name><surname>Kranzinger</surname><given-names>Christina</given-names></name>
<xref ref-type="aff" rid="aff003"><sup>3</sup></xref>
<bio>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jssm-22-475-g006.tif" mime-subtype="tif"/>
<p><bold>Christina KRANZINGER</bold></p>
<sec>
<title>Employment</title>
<p>Researcher, Salzburg Research Forschungsgesellschaft m.b.H</p>
</sec>
<sec>
<title>Degree</title>
<p>Mag., MSc.</p>
</sec>
<sec>
<title>Research interests</title>
<p>Human motion analysis, Machine learning, Statistics</p>
<p><bold>E-mail:</bold> <email>christina.kranzinger@salzburgresearch.at</email></p>
</sec>
</bio>
</contrib>
<contrib contrib-type="author">
<name><surname>Blumkaitis</surname><given-names>Julia C.</given-names></name>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<bio>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jssm-22-475-g007.tif" mime-subtype="tif"/>
<p><bold>Julia C. BLUMKAITIS</bold></p>
<sec>
<title>Employment</title>
<p>Research Assistant, Department of Sport and Exercise Science, University of Salzburg</p>
</sec>
<sec>
<title>Degree</title>
<p>M.Sc.</p>
</sec>
<sec>
<title>Research interests</title>
<p>Exercise physiology, Training load monitoring</p>
<p><bold>E-mail:</bold> <email>julia.blumkaitis@plus.ac.at</email></p>
</sec>
</bio>
</contrib>
<contrib contrib-type="author">
<name><surname>Strepp</surname><given-names>Tilmann</given-names></name>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<bio>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jssm-22-475-g008.tif" mime-subtype="tif"/>
<p><bold>Tilmann STREPP</bold></p>
<sec>
<title>Employment</title>
<p>PhD Student, Department of Sport and Exercise Science, University of Salzburg</p>
</sec>
<sec>
<title>Degree</title>
<p>M.Sc.</p>
</sec>
<sec>
<title>Research interests</title>
<p>Sport science, Exercise physiology</p>
<p><bold>E-mail:</bold> <email>tilmann.strepp@plus.ac.at</email></p>
</sec>
</bio>
</contrib>
<contrib contrib-type="author">
<name><surname>Simon</surname><given-names>Perikles</given-names></name>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
<bio>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jssm-22-475-g009.tif" mime-subtype="tif"/>
<p><bold>Perikles SIMON</bold></p>
<sec>
<title>Employment</title>
<p>Department of Sports Medicine, Rehabilitation and Disease Prevention, University of Mainz, Mainz, Germany</p>
</sec>
<sec>
<title>Degree</title>
<p>MD, PhD</p>
</sec>
<sec>
<title>Research interests</title>
<p>Exercise immunology, Molecular exercise physiology, Sports medicine</p>
<p><bold>E-mail:</bold> <email>simonpe@uni-mainz.de</email></p>
</sec>
</bio>
</contrib>
<contrib contrib-type="author">
<name><surname>Tomaskovic</surname><given-names>Aleksandar</given-names></name>
<xref ref-type="aff" rid="aff002"><sup>2</sup></xref>
<bio>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jssm-22-475-g010.tif" mime-subtype="tif"/>
<p><bold>Aleksandar TOMASKOVIC</bold></p>
<sec>
<title>Employment</title>
<p>Department of Sports Medicine, Rehabili-tation and Disease Prevention, University of Mainz, Mainz, Germany</p>
</sec>
<sec>
<title>Degree</title>
<p>M.Sc.</p>
</sec>
<sec>
<title>Research interests</title>
<p>Training load management, Sports physiotherapy</p>
<p><bold>E-mail:</bold> <email>altomask@uni-mainz.de</email></p>
</sec>
</bio>
</contrib>
<contrib contrib-type="author">
<name><surname>O&#x2019;Brien</surname><given-names>James</given-names></name>
<xref ref-type="aff" rid="aff004"><sup>4</sup></xref>
<bio>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jssm-22-475-g011.tif" mime-subtype="tif"/>
<p><bold>James O&#x2019;BRIEN</bold></p>
<sec>
<title>Employment</title>
<p>Red Bull Athlete Performance Center, Salzburg, Austria</p>
</sec>
<sec>
<title>Degree</title>
<p>MSc, PhD</p>
</sec>
<sec>
<title>Research interests</title>
<p>Injury prevention, Sports physiotherapy</p>
<p><bold>E-mail:</bold> <email>james.obrien@redbullperformance.com</email></p>
</sec>
</bio>
</contrib>
<contrib contrib-type="author">
<name><surname>D&#x00FC;ring</surname><given-names>Manfred</given-names></name>
<xref ref-type="aff" rid="aff004"><sup>4</sup></xref>
<bio>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jssm-22-475-g012.tif" mime-subtype="tif"/>
<p><bold>Manfred D&#x00DC;RING</bold></p>
<sec>
<title>Employment</title>
<p>Head of Performance at FC Red Bull Salzburg</p>
</sec>
<sec>
<title>Degree</title>
<p>Dipl., Dr. Sports Science</p>
</sec>
<sec>
<title>Research interests</title>
<p>Monitoring &#x0026; training load management, Exercise physiology, Biomechanics, Performance diagnostics</p>
<p><bold>E-mail:</bold> <email>manfred.duering@redbullsalzburg.at</email></p>
</sec>
</bio>
</contrib>
<contrib contrib-type="author">
<name><surname>St&#x00F6;ggl</surname><given-names>Thomas</given-names></name>
<xref ref-type="aff" rid="aff001"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff004"><sup>4</sup></xref>
<bio>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jssm-22-475-g013.tif" mime-subtype="tif"/>
<p><bold>Thomas ST&#x00D6;GGL</bold></p>
<sec>
<title>Employment</title>
<p>Head of R&#x0026;D and Science at the Red Bull Athlete Performance Center</p>
</sec>
<sec>
<title>Degree</title>
<p>Univ-. Prof. Mag. Dr.</p>
</sec>
<sec>
<title>Research interests</title>
<p>Physiology and biomechanics in sports from sedentary to the elite athlete; training intensity distribution among elite endurance athletes; Exercise physiology and performance diagnostics; Sensor technologies in various settings of sport science</p>
<p><bold>E-mail:</bold> <email>thomas.stoeggl@redbullperformance.com</email></p>
</sec>
</bio>
</contrib>
</contrib-group>
<aff id="aff001"><label>1</label> <institution>Department of Sport and Exercise Science, University of Salzburg</institution>, <addr-line>Salzburg, Austria</addr-line></aff>
<aff id="aff002"><label>2</label> <institution>Department of Sports Medicine, Rehabilitation and Disease Prevention, University of Mainz</institution>, <addr-line>Mainz, Germany</addr-line></aff>
<aff id="aff003"><label>3</label> <institution>Salzburg Research Forschungsgesellschaft m.b.H</institution>, <addr-line>Salzburg, Austria</addr-line></aff>
<aff id="aff004"><label>4</label> <institution>Red Bull Athlete Performance Center</institution>, <addr-line>Salzburg, Austria</addr-line></aff>
<author-notes>
<corresp id="cor1">&#x2709; Department of Sports Medicine, Disease Prevention and Rehabilitation Johannes Gutenberg University Mainz, Germany.</corresp>
</author-notes>
<pub-date pub-type="collection">
<month>09</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="epub">
<day>01</day>
<month>09</month>
<year>2023</year>
</pub-date>
<volume>22</volume>
<issue>3</issue>
<fpage>475</fpage>
<lpage>486</lpage>
<history>
<date date-type="received">
<day>09</day>
<month>05</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>04</day>
<month>08</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>&#x00A9; Journal of Sports Science and Medicine</copyright-statement>
<copyright-year>2023</copyright-year>
</permissions>
<abstract>
<p>The search for monitoring tools that provide early indication of injury and illness could contribute to better player protection. The aim of the present study was to i) determine the feasibility of and adherence to our monitoring approach, and ii) identify variables associated with up-coming illness and injury. We incorporated a comprehensive set of monitoring tools consisting of external load and physical fitness data, questionnaires, blood, neuromuscular-, hamstring, hip abductor and hip adductor performance tests performed over a three-month period in elite under-18 academy soccer players. Twenty-five players (age: 16.6 &#x00B1; 0.9 years, height: 178 &#x00B1; 7 cm, weight: 74 &#x00B1; 7 kg, VO<sub>2max</sub>: 59 &#x00B1; 4 ml/min/kg) took part in the study. In addition to evaluating adherence to the monitoring approach, data were analyzed using a linear support vector machine (SVM) to predict illness and injuries. The approach was feasible, with no injuries or dropouts due to the monitoring process. Questionnaire adherence was high at the beginning and decreased steadily towards the end of the study. An SVM resulted in the best classification results for three classification tasks, i.e., illness prediction, illness determination and injury prediction. For injury prediction, one of four injuries present in the test data set was detected, with 96.3% of all data points (i.e., injuries and non-injuries) correctly detected. For both illness prediction and determination, there was only one illness in the test data set that was detected by the linear SVM. However, the model showed low precision for injury and illness prediction with a considerable number of false-positives. The results demonstrate the feasibility of a holistic monitoring approach with the possibility of predicting illness and injury. Additional data points are needed to improve the prediction models. In practical application, this may lead to overcautious recommendations on when players should be protected from injury and illness.</p>
<p><boxed-text position="float">
<caption><title>Key points</title></caption>
<list list-type="bullet">
<list-item><p>A comprehensive monitoring approach was feasible and did not lead to adverse events, such as injuries.</p></list-item>
<list-item><p>A machine learning approach has shown promise for injury and illness prediction as well as illness detection.</p></list-item>
<list-item><p>The analysis was limited by the low number of injuries and illnesses during the study period.</p></list-item>
<list-item><p>Future studies should include longer study periods to further improve machine learning models.</p></list-item>
</list>
</boxed-text></p>
</abstract>
<kwd-group>
<title>Key words</title>
<kwd>Football</kwd>
<kwd>artificial intelligence</kwd>
<kwd>injury prevention</kwd>
<kwd>load management</kwd>
<kwd>load monitoring</kwd>
</kwd-group>
<counts>
<fig-count count="13"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="45"/>
<page-count count="12"/>
</counts>
</article-meta>
</front>
<body>
<sec id="sec1-1">
<title>Introduction</title>
<p>Load management (i.e., the prescription, monitoring, and adjustment of workload) is intended to objectify the athlete's workload, protect players from injury and illness and maximize their performance (Schwellnus et al., <xref ref-type="bibr" rid="ref34">2016</xref>; Soligard et al., <xref ref-type="bibr" rid="ref36">2016</xref>). An emerging area of research addresses the potential of load monitoring tools, such as tracking devices or questionnaires, to help predicting injuries or other undesirable events to better protect athletes (Van Eetvelde et al., <xref ref-type="bibr" rid="ref41">2021</xref>). In particular, machine learning models have potential application for injury prediction, physical performance prediction, training load and monitoring, players&#x2019; career trajectory, club performance, and match attendance (Nassis et al., <xref ref-type="bibr" rid="ref25">2023</xref>). However, the predictive accuracy of these machine learning models, e.g., in terms of area under the curve, was not adequate in all studies (Nassis et al., <xref ref-type="bibr" rid="ref25">2023</xref>).</p>
<p>In soccer, Rossi et al. (<xref ref-type="bibr" rid="ref30">2018</xref>) conducted a study over a duration of 23 weeks, using global-positioning-system-based training load data to examine the relationship between load and injury occurrence. By generating a training data set and validating their model with a decision tree, the authors demonstrated that certain cut-off values of the exponential weighted moving average (EWMA) of total distance and high-speed running, particularly in players that recently returned to play after injury, were associated with an increased injury risk. Interestingly, other studies in team sports have found that different variables contribute to the prediction of injury. While Rossi et al. (<xref ref-type="bibr" rid="ref30">2018</xref>) used only tracking data and corresponding ratios, such as the acute:chronic workload ratio (ACWR (Gabbett, <xref ref-type="bibr" rid="ref8">2018</xref>)), other author groups added additional variables to their data sets, such as pre-season screening (Ayala et al., <xref ref-type="bibr" rid="ref2">2019</xref>), genetic variables (Rodas et al., <xref ref-type="bibr" rid="ref28">2020</xref>), physical fitness, motor coordination and anthropometric data (Rommers et al., <xref ref-type="bibr" rid="ref29">2020</xref>), age, previous injury, and hamstring strength (Ruddy et al., <xref ref-type="bibr" rid="ref32">2018</xref>) resulting in potentially different outcomes. These differences in study design hamper between-study comparisons. Likewise, some of the studies also evaluated different types of injuries ((Van Eetvelde et al., <xref ref-type="bibr" rid="ref41">2021</xref>) for review). In addition, measurements performed irregularly, or only in the pre-season, may be insufficient to capture the dynamic nature of the measurement variables.</p>
<p>Given the multifactorial nature of non-contact injuries, incorporating additional variables can potentially enhance machine learning models. Such variables include training load data, metrics on physical fitness, objective training/game data, and corresponding physiological responses (e.g., measured via blood-based biomarkers, questionnaires, or neuromuscular performance tests). The inclusion of these different variables may be of importance in view of, i) weak physical fitness is discussed to be a risk factor for illness and injury (Malone et al., <xref ref-type="bibr" rid="ref22">2018</xref>; Watson et al., <xref ref-type="bibr" rid="ref43">2017</xref>), ii) questionnaires (Saw et al., <xref ref-type="bibr" rid="ref33">2016</xref>) and certain vertical jump variables (e.g., counter movement jump (CMJ)) are sensitive to changes in training load, albeit with uncertainty regarding most fatigue-related variables (Claudino et al., <xref ref-type="bibr" rid="ref5">2017</xref>; Gathercole et al., <xref ref-type="bibr" rid="ref9">2015</xref>) and iii) blood biomarkers decipher various physiological domains such as the immune response and inflammatory response to training load (Haller et al., <xref ref-type="bibr" rid="ref12">2023a</xref>; <xref ref-type="bibr" rid="ref14">2023b</xref>).</p>
<p>Based on the approach and experience of a four-week pilot study (Haller et al., <xref ref-type="bibr" rid="ref13">2022</xref>), we aimed to evaluate the feasibility (in terms of injuries and dropouts) of a comprehensive monitoring approach using a variety of monitoring tools, i.e., i) training and game data, ii) blood-based biomarkers covering different physiological domains such as hormonal responses or inflammation, iii) CMJ as surrogate for neuromuscular performance, iv) strength performance tests, i.e. hamstring and hip adductor/abductor strength, and v) questionnaires to assess how well these tools alone or in combination are able to assess and predict injury and illness in a cohort of elite youth soccer players over a three-month period using a linear support vector machine (SVM).</p>
</sec>
<sec id="sec1-2" sec-type="methods">
<title>Methods</title>
<sec id="sec2-1">
<title>Ethical approval</title>
<p>The local human ethics committee in Salzburg (GZ 02/2021) approved the experimental design. All procedures were in accordance with the standards of the Declaration of Helsinki of the World Medical Association. Participants were informed about the study both verbally and in writing and gave their written informed consent.</p>
</sec>
<sec id="sec2-2">
<title>Participants and setting</title>
<p>Twenty-five male players (age: 16.6 &#x00B1; 0.9 years, height: 178 &#x00B1; 7 cm, weight: 74 &#x00B1; 7 kg, VO<sub>2max</sub>: 59 &#x00B1; 4 ml/min/kg) of an elite European youth soccer team (first national league, UEFA Youth League participant) were included in this study. Following one familiarization session in which participants were informed about the objectives of the study, data were collected over a three-month period from September to December during the 2021/2022 regular season. During this process, the researchers had no influence on the training program, and the coaching staff did not receive feedback on the preliminary results before the study was completed. <xref ref-type="fig" rid="fig001">Figure 1</xref> outlines the study design.</p>
<p>A standardized set-up with test stations was used each week to ensure consistency and comparability of measurements. The training focus and number of training sessions per day were also identical across all weeks, with small fluctuations when additional matches were scheduled in midweek. All testing was integrated into the regular training schedule replicating a real-life scenario of an entire soccer team.</p>
<p>Specifically, participants were asked to complete questionnaires each morning (AM) and evening (PM). Strength and conditioning (S&#x0026;C) training was performed two mornings each week, with hamstring and abductor/adductor performance tests as part of the S&#x0026;C training on match day (MD) -4 (days). Twice a week, venous blood was drawn under resting conditions, prior to training, in a fasted state (MD -4, and -2), followed by CMJ testing. Players had previous experience with the procedures used in the study (i.e., hamstring and abductor/adductor, CMJ performance tests, questionnaires, but not venous blood sampling) prior to the start of the study. Team soccer training and matches were consistently monitored with a local positioning system (LPS).</p>
</sec>
<sec id="sec2-3">
<title>Measures<break/>Performance, injury, and illness</title>
<p>Performance data (e.g., distance covered, heart rate, high metabolic power distance (HMPD), training impulse (TRIMP) (Stagno et al., <xref ref-type="bibr" rid="ref37">2007</xref>), total number of sprints, accelerations, decelerations) were recorded using a 100 Hz LPS (Kinexon Precision Technologies, Munich, Germany) during matches and training. Injury statistics, in form of both time-loss and medical attention, were collected daily by the team's medical staff and physiotherapists in accordance with established guidelines (Fuller et al., <xref ref-type="bibr" rid="ref7">2006</xref>). Only non-contact injuries were included in the current analysis. Similarly, illness statistics were collected daily by staff members. Additional measures due to COVID-19 included a daily questionnaire, covering of illness, such as cough, pain in the limbs, breathing difficulties, and loss of taste or sense of smell, along with daily body temperature measurements.</p>
</sec>
<sec id="sec2-4">
<title>Physiological exercise testing prior to season start</title>
<p>Players performed physiological exercise testing prior to the season to determine maximal oxygen uptake (VO<sub>2max</sub>), peak running speed (V<sub>peak</sub>) and lactate threshold using a 2-phase (submaximal step-wise and maximal ramp) test as previously described (St&#x00F6;ggl et al., <xref ref-type="bibr" rid="ref38">2022</xref>).</p>
</sec>
<sec id="sec2-5">
<title>Questionnaires</title>
<p>Using cluster analysis of our pilot study data (Haller et al., <xref ref-type="bibr" rid="ref13">2022</xref>), psychologists designed a questionnaire: specifically, from 23 (AM) and 8 (PM) questions conducted prior to the present study, the number of items (redundancy addressing the same psychological domain) was refined to 5 (AM) and 5 (PM) questions for the present study. Questionnaires were administered via a smartphone app (Trayn, Sunnyvale, CA, United States) and completed by players daily, in both the morning and evening. The AM questionnaire items were related to sleep, muscular fatigue, and energy level. The PM questions were related to perceived fatigue from training/game, stress, satisfaction, and mental strength. Questionnaires were completed on a Likert scale from 0-10, except for sleep and wake times, where the time was to be reported. The complete questionnaire can be found in <xref ref-type="app" rid="A001">Appendix 1</xref>.</p>
</sec>
<sec id="sec2-6">
<title>Nordic hamstring strength</title>
<p>Eccentric hamstring strength was measured with the Nordic hamstring exercise on the Nordbord device (Vald Performance, Albion, Australia) (Opar et al., <xref ref-type="bibr" rid="ref27">2013</xref>) during S&#x0026;C training on MD -4 (<xref ref-type="fig" rid="fig001">Figure 1</xref>). Players knelt on the device with the fixation hooks oriented vertically and positioned just above the ankles (standardized position). Three repetitions were performed at maximal effort, with 5 s of rest in between trials. The experimenter instructed the players to keep their bodies straight and resist falling for as long as possible. Verbal encouragement in the form of "hold, hold, hold" was given. The mean value of the maximum force (F<sub>max</sub>) of the left and right leg of each trial was included in the statistical analysis.</p>
</sec>
<sec id="sec2-7">
<title>Hip abduction, adduction strength</title>
<p>Isometric force of hip abduction and hip adduction was measured using the ForceFrame device (Vald Performance, Albion, Australia) on MD -4. After a general warm-up of 12-15 min, players were barefoot in the supine position, with their arms crossed in front of the chest. The hips were positioned in 0&#x00B0; flexion and neutral rotation. The medial malleoli were centered over the inner load cells for adduction, and the lateral malleoli over the outer load cells to test abduction. A single repetition at 100% was performed in both abduction and adduction. As shown in our pilot study the maximum values for both abduction and adduction occur in the vast majority of cases in the first repetition. Each repetition was held for 5 s, with a 10 s break between repetitions. Verbal encouragement in the form of, &#x201C;3, 2, 1 push, push, push&#x201C; was given (Haller et al., <xref ref-type="bibr" rid="ref13">2022</xref>).</p>
</sec>
<sec id="sec2-8">
<title>Neuromuscular performance</title>
<p>The CMJ as a proxy of neuromuscular performance was performed on a split force plate (Forcedecks, VALD Performance, Albion, Australia), with arms fixed at the hip. To save time, the jumps were integrated into the 15-min team warm-up treadmill running session in which the players rotated to perform the jumps and then continued treadmill running. The order of the players to perform the jumps remained the same throughout the study period. Following two warm-up jumps (while waiting for the jumps on the force plate), two maximal jump attempts were performed in a standardized order (Gathercole et al., <xref ref-type="bibr" rid="ref9">2015</xref>; Twist and Highton, <xref ref-type="bibr" rid="ref40">2013</xref>; Watkins et al., <xref ref-type="bibr" rid="ref42">2017</xref>). Participants were instructed to jump as high as possible in each trial, with the depth of the CMJ chosen by players themselves (Haller et al., <xref ref-type="bibr" rid="ref13">2022</xref>).</p>
</sec>
<sec id="sec2-9">
<title>Blood collection</title>
<p>Venous blood (&#x007E; 3-5 ml) was collected at rest, in a fasted condition, on days MD -4 and -2 by certified medical staff, and analyzed for, i) cell-free DNA (cfDNA) levels, ii) hematological blood count and iii) further established blood parameters. For cfDNA analyses, blood was immediately centrifuged after collection at 1600 x g for 10 min. The plasma was then stored at &#x003C; -20&#x00B0; C. Briefly, plasma was diluted 1:10 in H<sub>2</sub>O and served as a template for qPCR based on amplification of a 90-base pair sequence within the L1PA2 transposon. A CFX384 Touch&#x2122; real-time PCR system (Bio-Rad, Munich, Germany) was used to analyze the blood samples according to the following protocol: Denaturation at 98&#x00B0; C for 2 min, 35 cycles of melting at 95&#x00B0; C for 10 s, annealing at 64&#x00B0; C for 10 s, followed by a melting curve (Neuberger et al., <xref ref-type="bibr" rid="ref26">2021</xref>). Differential blood count and further biochemical variables were determined using whole blood by the Mythic 22 Haematology Analyzer (Orph&#x00E9;e, Geneva, Switzerland). An overview of all blood-based biomarkers is presented in <xref ref-type="app" rid="A002">Appendix 2</xref>.</p>
</sec>
<sec id="sec2-10">
<title>Statistical analysis</title>
<p>Feasibility was determined by the number of adverse events and discontinuations during the study period. Adherence, which was calculated using the following formula: the number of completed tests or questionnaires performed divided by the total number of scheduled tests or questionnaires (i.e., (completed/scheduled) x 100 to express as percentage).</p>
<p>In addition, we targeted three classification tasks: We evaluated the ability to predict a non-contact injury (yes/no), based on data from the most recent monitoring session. Second, we evaluated the ability to predict illness (yes/no) based on the most recent blood data. Third, we evaluated the association between illness (yes/no) with blood data from the same day, to determine whether current illness can be identified via the blood variables.</p>
<p>For all three classification tasks, we excluded two participants due to missing data (one player was injured during the entire study period; for another player, only 2 weeks of data were available due to injury and illness), resulting in a total number of 23 participants. For the analysis, 18 participants were randomly selected as the training data set and 5 participants were selected as the test data set. The allocation of training and test data sets remained the same for all three tasks, to facilitate comparison of the results between tasks.</p>
<p>The training data set for injury prediction included seven data points (indicating the presence or absence of an injury/illness) with and 1078 without an injury, while the test data set has four data points with and 296 without an injury. The training data set for illness prediction consists of 11 data points with and 272 without an illness, while the test data set has one data point with and 59 data points without an illness. For illness determination, the training data set contained 9 data points with and 168 without an illness, while the test data set has one data point with and 41 data points without an illness, which leads to a highly imbalanced data set (<xref ref-type="table" rid="table001">Table 1</xref>).</p>
</sec>
<sec id="sec2-11">
<title>Oversampling</title>
<p>In imbalanced data sets standard classification methods tend to ignore the minority class and may be dominated by the majority class (Guo et al., <xref ref-type="bibr" rid="ref11">2008</xref>). Basically, there are two main methods discussed in the literature to solve the problem of imbalanced data, i.e., Undersampling and Oversampling. Undersampling methods randomly eliminate observations from the majority class, resulting in a loss of data (Kotsiantis et al., <xref ref-type="bibr" rid="ref19">2006</xref>). Oversampling, on the other hand, randomly replicates or generates observations from the minority class, which can lead to overfitting (Weiss and Provost, <xref ref-type="bibr" rid="ref44">2001</xref>). We chose oversampling techniques that circumvent the disadvantage of possible overfitting by generating synthetic copies of minority-class observations rather than exact copies.</p>
<p>In view of the mixed variable types (categorical and numerical variables) in injury prediction, we applied the Synthetic Minority Over-sampling Technique-Nominal Continuous (SMOTE-NC) (Chawla et al., <xref ref-type="bibr" rid="ref4">2002</xref>) algorithm to create a balanced training data set. The number of nearest neighbors (smallest Euclidean distance between feature vectors) used to create the new sample was set to five. The percentage that the minority class (e.g., fewer injuries than non-injuries; therefore, in this case, the injury is the minority class) should have in the new data set compared to the majority class was set at 25%. The training data set thus consists of 1078 data points without injury and 269 with injury.</p>
<p>We have opted for the Adaptive Synthetic Sampling Approach for Imbalanced Learning (ADASYN) algorithm (He et al., <xref ref-type="bibr" rid="ref16">2008</xref>) in view of the numerical data for illness prediction and determination. During the sampling process, we set the number of nearest neighbors to two, to generate the training data. As a result, we included 271 data points with illness and 272 data points without illness in our training data set for illness prediction. For illness determination, we included 169 data points with illness and 168 data points without illness in our training data set.</p>
</sec>
<sec id="sec2-12">
<title>Classification</title>
<p>For the classification purpose, we applied several machine-learning algorithms such as tree-based methods, naive bayes, or neural networks. Ultimately, a simple linear SVM (Hearst et al., <xref ref-type="bibr" rid="ref17">1998</xref>) demonstrated the best results (in terms of accuracy and Cohens Kappa) for all three classification tasks. SVM uses a simple mathematical model and manipulates it in such a way that a linear division of the domain is possible. Basically, SVMs can be distinguished between linear and nonlinear models (Hastie et al., <xref ref-type="bibr" rid="ref15">2009</xref>; Suthaharan, <xref ref-type="bibr" rid="ref39">2016</xref>). In our case, a linear SVM is used, which divides the data domain linearly into individual classes.</p>
<p>To assess the importance of variables for each classification task, we employed the caret package (Kuhn, <xref ref-type="bibr" rid="ref20">2022</xref>) with a Receiver Operating Characteristic (ROC) curve analysis to analyze variable importance for SVMs to identify the most important variables. To calculate the variable importance, the sensitivity and specificity values are calculated for different cut-offs of the predictor data. From this, the ROC is calculated using the trapezoidal rule, where the area under the ROC is used to interpret the variable importance (Kuhn, <xref ref-type="bibr" rid="ref20">2022</xref>). <xref ref-type="table" rid="table001">Table 1</xref> displays an overview of the classification task, model, types, and number of variables, as well as sizes of the training and test data sets.</p>
<p>To train the algorithm, we used a two-fold cross-validation and tried 10 different values per algorithm parameter and chose the parameters that showed the highest area under the ROC curve. The best model was finally used to evaluate the test data. To create the balanced data set, we used the RSBID package (Wu, <xref ref-type="bibr" rid="ref45">2022</xref>) to apply the SMOTE-NC algorithm and the smotefamily package (Siriseriwan, <xref ref-type="bibr" rid="ref35">2019</xref>) for the ADASYN algorithm from the statistical software R (R Foundation for Statistical Computing, Vienna, Austria). The models were trained with the caret package (Kuhn, <xref ref-type="bibr" rid="ref20">2022</xref>), which also was used to calculate variable importance.</p>
</sec>
<sec id="sec2-13">
<title>Performance metrics</title>
<p>As metrics to evaluate the classification tasks we chose accuracy, Cohen&#x2019;s Kappa, precision, and recall. Accuracy is the ratio between the sum of true-positive and true-negative predictions, divided by the sum of positive and negative observations. Precision represents the ratio between the sum of true-positives divided by the sum of predicted-positives, while recall shows the sum of true-positives divided by the sum of positive observations. Cohen&#x2019;s Kappa (Cohen, <xref ref-type="bibr" rid="ref6">1960</xref>) allows comparison between model results and random results. The value is the ratio between the accuracy of the prediction minus the random accuracy divided by one minus random accuracy and can be interpreted as the proportion of the accuracy where random accuracy is excluded. This metric can range from -1 to +1. A perfect classification would give a value of +1, 0 for a result equal to a random classification and -1 for a result worse than a random classification (Cohen, <xref ref-type="bibr" rid="ref6">1960</xref>). As the primary task of our models is to detect injury or illness, we defined the occurrence of an injury or an illness as the positive class.</p>
</sec>
<sec id="sec2-14">
<title>Data pre-processing</title>
<p>For the evaluation of the injury prediction task, we used a total of 65 training load variables (all 65 variables are outlined in <xref ref-type="app" rid="A003">Appendix 3</xref>). To better detect anomalies of the respective participants, we scaled the load variables per participant. We also took the EWMA of the last two training sessions of each participant where the player was not injured. In addition, we calculated the ACWR, i.e., the ratio between the mean value of the respective load variables of the last seven days (<sub>x7</sub>) and the mean value between the eighth and the 28<sup>th</sup> day (<sub>x8-28</sub>) of a respective date. For the evaluation, we also took the values of <sub>x7</sub> and <sub>x8-28</sub> into account. Due to missing data, it was not possible to calculate EWMA, <sub>x7, x8-28</sub> and ACWR (Gabbett, <xref ref-type="bibr" rid="ref8">2018</xref>; Murray et al., <xref ref-type="bibr" rid="ref24">2017</xref>) for all load variables. Thus, in total 237 load variables could be used for the injury prediction task.</p>
<p>In addition, we used two performance parameters (V<sub>peak</sub>, VO<sub>2max</sub>), three items of the questionnaires (sleep quality, sleep duration, and muscle fatigue), two blood variables (CK and cfDNA), two jump variables (jump height impulse max, concentric peak force max) and a dummy whether the participant had a physiotherapist treatment on the respective day. Since these data were collected less frequently than the training load variables covered by LPS, we could not simply merge these data sets. Therefore, we used two different approaches to solve this problem by including these variables via clustering approaches inspired by Rossi et al. (<xref ref-type="bibr" rid="ref31">2023</xref>). For blood, questionnaire and jump data, we applied a longitudinal clustering algorithm that divided the participants into specific groups. We included these groups in our model via factor variables. These factor variables were calculated with the kml algorithm (Genolini et al., <xref ref-type="bibr" rid="ref10">2015</xref>), a k-means algorithm for longitudinal data, where clusters were determined for each variable separately. For the calculation, all values were aggregated using the mean values per week and missing values were imputed using the "CopyMean" function of the kml package. Due to the small number of participants, we choose to set the number of cluster groups to two. However, there was an outlier in the data for the two blood variables and sleep duration, so we decided to have three cluster groups for these variables.</p>
<p>As information on performance parameters was only available for two time points (before and after the study period), a simple k-means algorithm of the R package factoextra (Kassambara and Mundt, <xref ref-type="bibr" rid="ref18">2020</xref>) was used to calculate two cluster groups, for VO<sub>2max</sub> and V<sub>peak</sub> respectively, by taking the mean of pre and post.</p>
</sec>
</sec>
<sec id="sec1-3">
<title>Results</title>
<sec id="sec2-15">
<title>Aspects of feasibility</title>
<p>No adverse events in the form of injury or dropout were noted during the study period, although some players had concerns about repeated blood sampling. <xref ref-type="fig" rid="fig002">Figure 2</xref> shows the sleep quality, as one example of the questionnaire data, for each player as a mean value per week over the study period. The figure illustrates declining adherence to the questionnaire across the study period. It appears that most players accepted the questionnaire until about halfway through the study duration, but thereafter acceptance decreased. We noted a decline in adherence from 95.7% in the first week to 73.9% in the seventh week to 21.7% in the fourteenth week.</p>
</sec>
<sec id="sec2-16">
<title>Results of prediction tasks</title>
<p><xref ref-type="table" rid="table002">Table 2</xref> displays the results for all three classification tasks for the test data set: injury prediction, illness prediction, and illness determination. The linear SVM was able to predict 96.3% of data points (injury yes/no) correctly. The recall score of 25% indicates that one of the four injuries in the test set was detected by the model. A precision of 11.1% shows that one out of nine predicted injuries was actually an injury. In the case of illness prediction, the linear SVM predicted 66.7% of the data points correctly. A recall value of 100% shows that the one illness present in the test set was detected. A precision of 4.8% indicates that out of 21 predicted illnesses, one was actually an illness. The model to determine illness detects all data points in the test set correctly, which resulted in an accuracy, precision, and recall value of 100% each and a Cohens Kappa of 1.</p>
<p>To investigate the most important variables for classification of each task <xref ref-type="fig" rid="fig003">Figure 3</xref> visualizes the ten most important variables according to ROC curve variable importance. Regarding variable importance for injury prediction, four out of the ten most important variables represent factor variables out of the longitudinal cluster approach (sleep quality, jump height, cfDNA, and sleep duration). Sleep quality was detected to be most important, followed by the ACWR of tempo runs (> 19.8 km/h) and CMJ jump height. For illness prediction and determination, five blood variables were in the top ten for both classification tasks (total ferritin, total c-reactive Protein (CRP), percentage and total eosinophils (EOS) and glucose (GLU)), with total CRP and percentage EOS being two variables in the top three most important variables. In general, illness determination task demonstrated the highest ROC curve variable importance values, followed by the injury and illness prediction variables, which would have been expected according to the results of the model evaluation.</p>
</sec>
</sec>
<sec id="sec1-4">
<title>Discussion</title>
<p>The overall goals of this study were to i) demonstrate the feasibility of a comprehensive monitoring approach being fully integrated in the training process, and ii) test the predictive accuracy of a machine learning approach in terms of injury and illness prediction using the combination of external training load data and a variety of objective (neuromuscular performance and strength testing, biomarkers, heart rate) and subjective (questionnaire) internal load and recovery measures in an elite youth soccer team. It has been demonstrated that it is possible to develop machine learning models to predict injuries and to detect and predict illnesses.</p>
<sec id="sec2-17">
<title>Principal findings</title>
<p>In general, the integration of a holistic monitoring approach into the training regime can only succeed if the following factors are present: 1) coach buy-in, 2) cost, time, and logistical prerequisites, 3) team adherence, 4) an interdisciplinary team, and 5) the benefits coaches see in an empirically based measure (Akenhead and Nassis, <xref ref-type="bibr" rid="ref1">2016</xref>). Therefore, it is important to integrate the majority of measures into the regular training routine with the help of an interdisciplinary team of practitioners, researchers, and clinicians to avoid disrupting the training process and causing additional burden to the players. It has been shown that a period of 15 minutes in the morning is sufficient for blood sampling. An additional 15 minutes before regular training was sufficient for measuring CMJ performance, which was integrated into the team warm-up program on the treadmill. Questionnaires as an easy-to-use and established tool were completed within 1-2 minutes in the morning and evening. Measurements of hip adductor, hip abductor, and hamstring strength were categorized as a strength training stimulus and therefore incorporated into S&#x0026;C training on MD -4. The performance tests did not result in any adverse events. However, some of the players showed concerns on repetitive venous blood sampling. Accordingly, future research should focus on identifying key blood variables for monitoring training load and recovery which can be measured via capillary blood or even saliva, ideally via point-of-care testing, similar to the measurement of creatine kinase. Testing various machine learning models showed that the linear SVM resulted in the best classification results for the three different classification tasks of interest.</p>
<p>To develop the best performing model, many variables were taken into account. However, in order to simplify data collection in the future the most relevant parameters were identified by a ROC curve variable importance analysis. For injury prediction, the three most important variables were sleep quality, the ACWR of tempo runs (> 19.8 km/h) and CMJ jump height. For illness prediction, ferritin, CRP and percentage EOS were identified to be most important, for illness determination CRP, creatinine and percentage EOS.</p>
<p>For injury prediction, one of four injuries present in the test data set was detected and 96.3% of all data points were detected correctly. For illness prediction and determination, only one illness was present in the test data set, as the same random split of players into training or test data set for all three classification tasks was used. However, this data point was detected by the linear SVM for both illness prediction and determination. Unfortunately, the model showed quite low precision values for both predictive tasks. Thus, the model tends to predict false-positive injuries and illnesses. Differences in accuracy between illness determination and prediction appear reasonable because in some cases there was some time lag between blood collection and illness onset. Thus, the accuracy is not expected to be perfect for the prediction task. In addition, it should be noted that throughout the study period, COVID illnesses occurred as well as illnesses that may have been specifically related to the high density of training and competition.</p>
<p>In practical terms, applying the present model could lead to over-estimation of players&#x2019; risk of injuries and illnesses. On the other hand, the model works perfectly to detect illness, driven mainly by the CRP variable, which was shown to have the highest importance among blood variables. According to a categorization framework presented by Landis and Koch (Landis and Koch, <xref ref-type="bibr" rid="ref21">1977</xref>), Cohens' Kappa values show slight performance for predicting injury and illness, but perfect performance for detecting illness.</p>
<p>During the study period of three months, there were too few injuries and illnesses from a statistical perspective to develop a better predictive model. Comparable studies covered longer periods of at least about half a year or more and included more injuries in their predictive models (Rommers et al., <xref ref-type="bibr" rid="ref29">2020</xref>; Rossi et al., <xref ref-type="bibr" rid="ref30">2018</xref>). In addition, a higher frequency of data points would have been needed for some variables. For blood collection, two samplings per week were the maximum from an adherence perspective. Switching to capillary samples could help, with the disadvantage that fewer variables can be determined. The main challenge in classifying injuries and illnesses is the limited injury and illness data set, which contrasts with the almost daily data available on players' training load. We have therefore tried to oversample the number of illnesses and injuries in the training data set. Nevertheless, the number of illnesses and injuries in the test data set remains limited. The different time points for data collection also led to challenges in merging the different data sets.</p>
<p>Since many variables (blood, jumps) were collected less frequently and over a shorter period compared to the training load data, this information was included in the machine learning models via clusters leading to factor variables. Therefore, the information on blood, jumps and fitness was aggregated and not included as detailed as would be possible with more frequent measures. When using longitudinal clusters to include the blood, questionnaire and jump data in the injury prediction analysis, we were faced with a decreasing willingness to fill out the questionnaires. Therefore, the number of missing values increased over time, and we could not use these data over the entire survey period. While there was an increase in questionnaire adherence compared to our pilot study (Haller et al., <xref ref-type="bibr" rid="ref13">2022</xref>), further strategies to increase adherence are necessary to minimize missing data. This includes, for example, regular educational talks (McGuigan et al., <xref ref-type="bibr" rid="ref23">2023</xref>), reminders by the coaching staff, and a clear message that the players will benefit enormously from filling out questionnaires on a frequent basis. It is expected that adherence increases if the monitoring results are coupled with consequences in training and recovery planning.</p>
</sec>
<sec id="sec2-18">
<title>Practical applications</title>
<p>The strength of machine learning approaches is to not only seek linear relationships and consider only one or two parameters, but to consider specifically the interaction between many variables, which may be necessary due to the multifactorial nature of injury and illness. In the present study, training load data, questionnaire scores and blood variables were found to be potentially associated with impending injury or illness. Unfortunately, it is not possible to draw conclusions about the specific direction of the variables, which might be possible with other statistical methods. While tracking variables have been associated with impending injury, blood variables could be useful for early detection of illness. Specifically, illness determination showed the best model performance, but the precision was low for prediction tasks. From a practical point of view, this may lead to overcautious reactions from practitioners so far. Hence, it is necessary to test whether the identified important variables persist by feeding the algorithm with additional data points and to observe the evolution of the accuracy measures.</p>
<p>The long-term goal is to capture the critical variables with minimal effort (i.e., omitting unnecessary methods to minimize human effort and avoid large amounts of data) or minimally invasive, e.g., for blood with point-of-care devices in the future. The use of minimally invasive point-of-care methods would also allow for more frequent blood collection than two days per week, and it is not recommended to collect venous blood at this regularity anyway, as this would impose an immense burden on the athletes in the long term (Carling et al., <xref ref-type="bibr" rid="ref3">2018</xref>).</p>
<p>Strategies to further reduce the large amount of redundant data (e.g., tracking, blood and CMJ variables) are recommended and discussed elsewhere. Lastly, it should be noted that the study required a highly professional environment and significant human resources (two physicians for blood collection, two physiotherapists for hip abduction/adduction, two practitioners for the CMJ). The blood collection required staff and sophisticated equipment for the analysis including sophisticated qPCR methods for the determination of cfDNA. Thus, the approach is feasible for financially strong clubs, but not practical and cost-effective for non-elite clubs or professional clubs with limited resources, unless the machine models perform better.</p>
</sec>
</sec>
<sec id="sec1-5">
<title>Conclusion</title>
<p>A holistic approach to monitoring training load and training load response was successfully integrated into regular practice, and many variables indicative of the occurrence of injury and illness were identified. Whereas conventional statistical approaches have the disadvantage of focusing, for example, on factors linearly associated with injury and disease by performing regression analyses, we provide an approach to consider interactions among a large number of variables potentially associated with illness and injury. Future studies can build on our initial results and apply a longer study period with more data points to further train the algorithms and determine if the variables identified are truly critical. Further statistical methods can then be used i) to reveal and interpret the direction of the variables, or ii) the crucial variables can be used in practice over a longer period of time so that changes can be identified on an individual basis allowing early interventions to be made.</p>
</sec>
</body>
<back>
<ack>
<title>Acknowledgements</title>
<p>We would like to thank all the players, practitioners, and club officials who agreed to, planned, participated in, helped with, or conducted the study. The study is a cooperation project between the University of Salzburg, the University of Mainz and the Red Bull Athlete Performance Center. The study receives funding from the Red Bull Athlete Performance Center for the scientific accompaniment of the monitoring concept in the context of which data for the current study were collected. Christina and Stefan Kranzinger acknowledge the financial support by the Austrian Federal Ministry for Climate Action, Environment, Energy, Mobility, Innovation and Technology and Land Salzburg under Contract No. 2021-0.641.557. All experiments comply with the current laws of the country in which they were performed. The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest. The data sets generated and analyzed during the current study are not publicly available but are available from the corresponding author, who was an organizer of the study.</p>
</ack>
<app-group>
<title>&#x00A0;</title>
<app id="A001">
<label>Appendix 1.</label>
<title>Questionnaire items</title>
<p><bold>AM questionnaire (Likert Scale from 0-10, except sleep onset and wakening):</bold></p>
<list list-type="order">
<list-item><p>How was your sleep? (very poor / very good)</p></list-item>
<list-item><p>When did you fall asleep (exact time)</p></list-item>
<list-item><p>When did you wake up? (exact time)</p></list-item>
<list-item><p>I am feeling (powerless / full of energy)</p></list-item>
<list-item><p>My muscular fatigue is (very fatigued / not at all fatigued)</p></list-item>
</list>
<p><bold>PM questionnaire (Likert Scale from 0-10):</bold></p>
<list list-type="order">
<list-item><p>How strenuous was the training / game today? (rest / maximal)</p></list-item>
<list-item><p>How stressful did you find today compared to an average day? (less stressful / more stressful)</p></list-item>
<list-item><p>How stressful did you find today in terms of training/game compared to an average day? (less stressful / more stressful)</p></list-item>
<list-item><p>Today I was satisfied with myself (not at all / very)</p></list-item>
<list-item><p>I am mentally strong (not at all / very strong)</p></list-item>
</list>
</app>
<app id="A002">
<label>Appendix 2.</label>
<title>Blood-based biomarkers measured in our study</title>
<list list-type="order">
<list-item><p>Cell-free DNA</p></list-item>
<list-item><p>Creatine kinase</p></list-item>
<list-item><p>White blood cells</p></list-item>
<list-item><p>%- Lymphocytes</p></list-item>
<list-item><p>%- Monocytes</p></list-item>
<list-item><p>%- Neutrophils</p></list-item>
<list-item><p>%- Eosinophils</p></list-item>
<list-item><p>%- Basophils</p></list-item>
<list-item><p>Lymphocytes</p></list-item>
<list-item><p>Monocytes</p></list-item>
<list-item><p>Neutrophils</p></list-item>
<list-item><p>Eosinophils</p></list-item>
<list-item><p>Basophils</p></list-item>
<list-item><p>Red blood cells</p></list-item>
<list-item><p>Hemoglobin</p></list-item>
<list-item><p>Hematocrit</p></list-item>
<list-item><p>Mean corpuscular volume</p></list-item>
<list-item><p>Mean corpuscular haemoglobin</p></list-item>
<list-item><p>Mean corpuscular hemoglobin concentration</p></list-item>
<list-item><p>Red blood cell distribution width</p></list-item>
<list-item><p>Platelets</p></list-item>
<list-item><p>Glucose</p></list-item>
<list-item><p>C-reactive protein</p></list-item>
<list-item><p>Alkaline phosphatase</p></list-item>
<list-item><p>GOT (glutamic-oxaloacetic transaminase)</p></list-item>
<list-item><p>GPT (Glutamat-Pyruvat-Transaminase)</p></list-item>
<list-item><p>GGT (Gamma-glutamyl Transferase)</p></list-item>
<list-item><p>LDH (Lactate Dehydrogenase)</p></list-item>
<list-item><p>Creatinine</p></list-item>
<list-item><p>Urea</p></list-item>
<list-item><p>Uric acid</p></list-item>
<list-item><p>Iron</p></list-item>
<list-item><p>Transferrin</p></list-item>
<list-item><p>Ferritin</p></list-item>
<list-item><p>Iron-binding capacity</p></list-item>
<list-item><p>Total protein</p></list-item>
<list-item><p>Myoglobin</p></list-item>
<list-item><p>Magnesium</p></list-item>
<list-item><p>Calcium</p></list-item>
<list-item><p>Phosphorus</p></list-item>
</list>
</app>
<app id="A003">
<label>Appendix 3:</label>
<title>Training load variables</title>
<list list-type="order">
<list-item><p>Time</p></list-item>
<list-item><p>Time on Playing Field (s)</p></list-item>
<list-item><p>Distance (m)</p></list-item>
<list-item><p>Distance / min (m)</p></list-item>
<list-item><p>HMPD (m)</p></list-item>
<list-item><p>Metabolic Power per mass (mean) (W/kg)</p></list-item>
<list-item><p>Metabolic Power per mass (max.) (W/kg)</p></list-item>
<list-item><p>Metabolic Work (kcal)</p></list-item>
<list-item><p>Metabolic Work / min (kcal)</p></list-item>
<list-item><p>Explosive Distance (m)</p></list-item>
<list-item><p>TRIMP</p></list-item>
<list-item><p>Speed (max.) (km/h)</p></list-item>
<list-item><p>Speed (% of max.) (%)</p></list-item>
<list-item><p>Speed (mean) (km/h)</p></list-item>
<list-item><p>Sprints</p></list-item>
<list-item><p>DFL Sprints/min</p></list-item>
<list-item><p>Tempo Runs (> 19.8 km/h)</p></list-item>
<list-item><p>Tempo Runs/min</p></list-item>
<list-item><p>Accelerations</p></list-item>
<list-item><p>Accelerations / min</p></list-item>
<list-item><p>Acceleration (max.) (ms2)</p></list-item>
<list-item><p>Accumulated Acceleration Load</p></list-item>
<list-item><p>Accumulated Acceleration Load/min</p></list-item>
<list-item><p>Accelerations (Very high)</p></list-item>
<list-item><p>Accelerations (High)</p></list-item>
<list-item><p>Accelerations (4-5 ms2)</p></list-item>
<list-item><p>Accelerations (> = 5 ms2)</p></list-item>
<list-item><p>Accelerations/min (Very high)</p></list-item>
<list-item><p>Decelerations</p></list-item>
<list-item><p>Decelerations/min</p></list-item>
<list-item><p>Deceleration (max.) (ms2)</p></list-item>
<list-item><p>Decelerations (High)</p></list-item>
<list-item><p>Decelerations (Very high)</p></list-item>
<list-item><p>Decelerations (4-5 ms2)</p></list-item>
<list-item><p>Decelerations (> = 5 ms2)</p></list-item>
<list-item><p>Decelerations/min (Very high)</p></list-item>
<list-item><p>Distance (speed &#x007C; 0-5.4 km/h) (m)</p></list-item>
<list-item><p>Distance (speed &#x007C; 5.4-10.8 km/h) (m)</p></list-item>
<list-item><p>Distance (speed &#x007C; 10.8-14.4 km/h) (m)</p></list-item>
<list-item><p>Distance (speed &#x007C; 14.4-19.8 km/h) (m)</p></list-item>
<list-item><p>Distance (speed &#x007C; 19.8-25.2 km/h) (m)</p></list-item>
<list-item><p>Distance (speed &#x007C; 25.2-28 km/h) (m)</p></list-item>
<list-item><p>Distance (speed &#x007C; > = 28 km/h) (m)</p></list-item>
<list-item><p>Heart Rate (max.) (bpm)</p></list-item>
<list-item><p>Heart Rate (mean) (bpm)</p></list-item>
<list-item><p>Heart Rate (time &#x007C; 0-50%) (s)</p></list-item>
<list-item><p>Heart Rate (time &#x007C; 50-60%) (s)</p></list-item>
<list-item><p>Heart Rate (time &#x007C; 60-70%) (s)</p></list-item>
<list-item><p>Heart Rate (time &#x007C; 70-80%) (s)</p></list-item>
<list-item><p>Heart Rate (time &#x007C; 80-90%) (s)</p></list-item>
<list-item><p>Heart Rate (time &#x007C; >= 90%) (s)</p></list-item>
<list-item><p>Heart Rate Recovery</p></list-item>
<list-item><p>Heart Rate Impulse</p></list-item>
<list-item><p>Changes of Direction/min</p></list-item>
<list-item><p>Changes of Direction</p></list-item>
<list-item><p>Changes of Direction (right)</p></list-item>
<list-item><p>Changes of Direction (left)</p></list-item>
<list-item><p>Step Balance (mean) (%)</p></list-item>
<list-item><p>Jumps</p></list-item>
<list-item><p>Jump Load (J)</p></list-item>
<list-item><p>Distance Sprint (m)</p></list-item>
<list-item><p>Total max sprint distance (25-28km/h) (m)</p></list-item>
<list-item><p>Time S&#x0026;C training time (s)</p></list-item>
<list-item><p>Total exercise time AM+PM+MD (s)</p></list-item>
<list-item><p>Total training time AM+PM (s)</p></list-item>
<list-item><p>Total MD time (s)</p></list-item>
</list>
</app>
</app-group>
<ref-list>
<title>References</title>
<ref id="ref1"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Akenhead</surname><given-names>R.</given-names></name><name><surname>Nassis</surname><given-names>G. P.</given-names></name></person-group> (<year>2016</year>) <article-title>Training Load and Player Monitoring in High-Level Football: Current Practice and Perceptions</article-title>. <source>International Journal of Sports Physiology and Performance</source> <volume>11</volume>(<issue>5</issue>), <fpage>587</fpage>-<lpage>593</lpage>. <comment>https://doi.org/10.1123/ijspp.2015-0331</comment> <pub-id pub-id-type="doi">10.1123/ijspp.2015-0331</pub-id></mixed-citation></ref>
<ref id="ref2"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ayala</surname><given-names>F.</given-names></name><name><surname>Lopez-Valenciano</surname><given-names>A.</given-names></name><name><surname>Martin</surname><given-names>J. A. G.</given-names></name><name><surname>Croix</surname><given-names>M. D.</given-names></name><name><surname>Vera-Garcia</surname><given-names>F. J.</given-names></name><name><surname>Garcia-Vaquero</surname><given-names>M. D.</given-names></name><name><surname>Ruiz-Perez</surname><given-names>I.</given-names></name><name><surname>Myer</surname><given-names>G. D.</given-names></name></person-group> (<year>2019</year>) <article-title>A Preventive Model for Hamstring Injuries in Professional Soccer: Learning Algorithms</article-title>. <source>International Journal of Sports Medicine</source> <volume>40</volume>(<issue>5</issue>), <fpage>344</fpage>-<lpage>353</lpage>. <comment>https://doi.org/10.1055/a-0826-1955</comment> <pub-id pub-id-type="doi">10.1055/a-0826-1955</pub-id></mixed-citation></ref>
<ref id="ref3"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Carling</surname><given-names>C.</given-names></name><name><surname>Lacome</surname><given-names>M.</given-names></name><name><surname>McCall</surname><given-names>A.</given-names></name><name><surname>Dupont</surname><given-names>G.</given-names></name><name><surname>Le Gall</surname><given-names>F.</given-names></name><name><surname>Simpson</surname><given-names>B.</given-names></name><name><surname>Buchheit</surname><given-names>M.</given-names></name></person-group> (<year>2018</year>) <article-title>Monitoring of Post-match Fatigue in Professional Soccer: Welcome to the Real World</article-title>. <source>Sports Medicine</source> <comment>https://doi.org/10.1007/s40279-018-0935-z</comment> <pub-id pub-id-type="doi">10.1007/s40279-018-0935-z</pub-id></mixed-citation></ref>
<ref id="ref4"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chawla</surname><given-names>N. V.</given-names></name><name><surname>Bowyer</surname><given-names>K. W.</given-names></name><name><surname>Hall</surname><given-names>L. O.</given-names></name><name><surname>Kegelmeyer</surname><given-names>W. P.</given-names></name></person-group> (<year>2002</year>) <article-title>SMOTE: Synthetic minority over-sampling technique</article-title>. <source>Journal of Artificial Intelligence Research</source> <volume>16</volume>, <fpage>321</fpage>-<lpage>357</lpage>. <comment>https://doi.org/DOI 10.1613/jair.953</comment> <pub-id pub-id-type="doi">10.1613/jair.953</pub-id></mixed-citation></ref>
<ref id="ref5"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Claudino</surname><given-names>J. G.</given-names></name><name><surname>Cronin</surname><given-names>J.</given-names></name><name><surname>Mezencio</surname><given-names>B.</given-names></name><name><surname>McMaster</surname><given-names>D. T.</given-names></name><name><surname>McGuigan</surname><given-names>M.</given-names></name><name><surname>Tricoli</surname><given-names>V.</given-names></name><name><surname>Amadio</surname><given-names>A. C.</given-names></name><name><surname>Serrao</surname><given-names>J. C.</given-names></name></person-group> (<year>2017</year>) <article-title>The countermovement jump to monitor neuromuscular status: A meta-analysis</article-title>. <source>Journal of Science and Medicine in Sport</source> <volume>20</volume>(<issue>4</issue>), <fpage>397</fpage>-<lpage>402</lpage>. <comment>https://doi.org/10.1016/j.jsams.2016.08.011</comment> <pub-id pub-id-type="doi">10.1016/j.jsams.2016.08.011</pub-id></mixed-citation></ref>
<ref id="ref6"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Cohen</surname><given-names>J.</given-names></name></person-group> (<year>1960</year>) <article-title>A Coefficient of Agreement for Nominal Scales</article-title>. <source>Educational and Psychological Measurement</source> <volume>20</volume>(<issue>1</issue>), <fpage>37</fpage>-<lpage>46</lpage>. <comment>https://doi.org/Doi 10.1177/001316446002000104</comment> <pub-id pub-id-type="doi">10.1177/001316446002000104</pub-id></mixed-citation></ref>
<ref id="ref7"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Fuller</surname><given-names>C. W.</given-names></name><name><surname>Ekstrand</surname><given-names>J.</given-names></name><name><surname>Junge</surname><given-names>A.</given-names></name><name><surname>Andersen</surname><given-names>T. E.</given-names></name><name><surname>Bahr</surname><given-names>R.</given-names></name><name><surname>Dvorak</surname><given-names>J.</given-names></name><name><surname>Hagglund</surname><given-names>M.</given-names></name><name><surname>McCrory</surname><given-names>P.</given-names></name><name><surname>Meeuwisse</surname><given-names>W. H.</given-names></name></person-group> (<year>2006</year>) <article-title>Consensus statement on injury definitions and data collection procedures in studies of football (soccer) injuries</article-title>. <source>Clinical Journal of Sport Medicine</source> <volume>16</volume>(<issue>2</issue>), <fpage>97</fpage>-<lpage>106</lpage>. <comment>https://doi.org/Doi 10.1097/00042752-200603000-00003</comment> <pub-id pub-id-type="doi">10.1097/00042752-200603000-00003</pub-id></mixed-citation></ref>
<ref id="ref8"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gabbett</surname><given-names>T.</given-names></name></person-group> (<year>2018</year>) <article-title>Infographic: The training-injury prevention paradox: should athletes be training smarter and harder? [Editorial]</article-title>. <source>British Journal of Sports Medicine</source> <volume>52</volume>(<issue>3</issue>), <fpage>203</fpage>. <comment>https://doi.org/10.1136/bjsports-2016-097249</comment> <pub-id pub-id-type="doi">10.1136/bjsports-2016-097249</pub-id></mixed-citation></ref>
<ref id="ref9"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gathercole</surname><given-names>R.</given-names></name><name><surname>Sporer</surname><given-names>B.</given-names></name><name><surname>Stellingwerff</surname><given-names>T.</given-names></name><name><surname>Sleivert</surname><given-names>G.</given-names></name></person-group> (<year>2015</year>) <article-title>Alternative countermovement-jump analysis to quantify acute neuromuscular fatigue</article-title>. <source>International Journal of Sports Physiology and Performance</source> <volume>10</volume>(<issue>1</issue>), <fpage>84</fpage>-<lpage>92</lpage>. <comment>https://doi.org/10.1123/ijspp.2013-0413</comment> <pub-id pub-id-type="doi">10.1123/ijspp.2013-0413</pub-id></mixed-citation></ref>
<ref id="ref10"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Genolini</surname><given-names>C.</given-names></name><name><surname>Alacoque</surname><given-names>X.</given-names></name><name><surname>Sentenac</surname><given-names>M.</given-names></name><name><surname>Arnaud</surname><given-names>C.</given-names></name></person-group> (<year>2015</year>) <article-title>kml and kml3d: R packages to cluster longitudinal data</article-title>. <source>Journal of Statistical Software</source> <volume>65</volume>, <fpage>1</fpage>-<lpage>34</lpage>. <comment>https://doi.org/10.18637/jss.v065.i04</comment> <pub-id pub-id-type="doi">10.18637/jss.v065.i04</pub-id></mixed-citation></ref>
<ref id="ref11"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Guo</surname><given-names>X.</given-names></name><name><surname>Yin</surname><given-names>Y.</given-names></name><name><surname>Dong</surname><given-names>C.</given-names></name><name><surname>Yang</surname><given-names>G.</given-names></name><name><surname>Zhou</surname><given-names>G.</given-names></name></person-group> (<year>2008</year>) <article-title>On the class imbalance problem</article-title>. <source>Fourth international conference on natural computation</source>. <comment>https://doi.org/10.1109/ICNC.2008.871</comment> <pub-id pub-id-type="doi">10.1109/ICNC.2008.871</pub-id></mixed-citation></ref>
<ref id="ref12"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Haller</surname><given-names>N.</given-names></name><name><surname>Behringer</surname><given-names>M.</given-names></name><name><surname>Reichel</surname><given-names>T.</given-names></name><name><surname>Wahl</surname><given-names>P.</given-names></name><name><surname>Simon</surname><given-names>P.</given-names></name><name><surname>Kruger</surname><given-names>K.</given-names></name><name><surname>Zimmer</surname><given-names>P.</given-names></name><name><surname>St&#x00F6;ggl</surname><given-names>T.</given-names></name></person-group> (<year>2023a</year>) <article-title>Blood-Based Biomarkers for Managing Workload in Athletes: Considerations and Recommendations for Evidence-Based Use of Established Biomarkers</article-title>. <source>Sports Medicine</source> <volume>53</volume>, <fpage>1315</fpage>-<lpage>1333</lpage>. <comment>https://doi.org/10.1007/s40279-023-01836-x</comment> <pub-id pub-id-type="doi">10.1007/s40279-023-01836-x</pub-id></mixed-citation></ref>
<ref id="ref13"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Haller</surname><given-names>N.</given-names></name><name><surname>Blumkaitis</surname><given-names>J. C.</given-names></name><name><surname>Strepp</surname><given-names>T.</given-names></name><name><surname>Schmuttermair</surname><given-names>A.</given-names></name><name><surname>Aglas</surname><given-names>L.</given-names></name><name><surname>Simon</surname><given-names>P.</given-names></name><name><surname>Neuberger</surname><given-names>E.</given-names></name><name><surname>Kranzinger</surname><given-names>C.</given-names></name><name><surname>Kranzinger</surname><given-names>S.</given-names></name><name><surname>O'Brien</surname><given-names>J.</given-names></name><name><surname>Ergoth</surname><given-names>B.</given-names></name><name><surname>Raffetseder</surname><given-names>S.</given-names></name><name><surname>Fail</surname><given-names>C.</given-names></name><name><surname>During</surname><given-names>M.</given-names></name><name><surname>St&#x00F6;ggl</surname><given-names>T.</given-names></name></person-group> (<year>2022</year>) <article-title>Comprehensive training load monitoring with biomarkers, performance testing, local positioning data, and questionnaires-first results from elite youth soccer</article-title>. <source>Frontiers in Physiology</source> <volume>13</volume>. <comment>https://doi.org/10.3389/fphys.2022.1000898</comment> <pub-id pub-id-type="doi">10.3389/fphys.2022.1000898</pub-id></mixed-citation></ref>
<ref id="ref14"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Haller</surname><given-names>N.</given-names></name><name><surname>Reichel</surname><given-names>T.</given-names></name><name><surname>Zimmer</surname><given-names>P.</given-names></name><name><surname>Behringer</surname><given-names>M.</given-names></name><name><surname>Wahl</surname><given-names>P.</given-names></name><name><surname>Stoggl</surname><given-names>T.</given-names></name><name><surname>Kruger</surname><given-names>K.</given-names></name><name><surname>Simon</surname><given-names>P.</given-names></name></person-group> (<year>2023b</year>) <article-title>Blood-Based Biomarkers for Managing Workload in Athletes: Perspectives for Research on Emerging Biomarkers</article-title>. <source>Sports Medicine</source>. <comment>https://doi.org/10.1007/s40279-023-01866-5</comment> <pub-id pub-id-type="doi">10.1007/s40279-023-01866-5</pub-id></mixed-citation></ref>
<ref id="ref15"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hastie</surname><given-names>T.</given-names></name><name><surname>Tibshirani</surname><given-names>R.</given-names></name><name><surname>Friedman</surname><given-names>J. H.</given-names></name><name><surname>Friedman</surname><given-names>J. H.</given-names></name></person-group> (<year>2009</year>) <source>The elements of statistical learning: data mining, inference, and prediction (Vol. 2) Springer</source>. <comment>https://doi.org/10.1007/978-0-387-84858-7</comment> <pub-id pub-id-type="doi">10.1007/978-0-387-84858-7</pub-id></mixed-citation></ref>
<ref id="ref16"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>He</surname><given-names>H.</given-names></name><name><surname>Bai</surname><given-names>Y.</given-names></name><name><surname>Garcia</surname><given-names>E. A.</given-names></name><name><surname>Li</surname><given-names>S.</given-names></name></person-group> (<year>2008</year>) <source>ADASYN: Adaptive synthetic sampling approach for imbalanced learning. 2008 IEEE international joint conference on neural networks (IEEE world congress on computational intelligence)</source>.</mixed-citation></ref>
<ref id="ref17"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hearst</surname><given-names>M. A.</given-names></name><name><surname>Dumais</surname><given-names>S. T.</given-names></name><name><surname>Osuna</surname><given-names>E.</given-names></name><name><surname>Platt</surname><given-names>J.</given-names></name><name><surname>Scholkopf</surname><given-names>B.</given-names></name></person-group> (<year>1998</year>) <article-title>Support vector machines</article-title>. <source>IEEE Intelligent Systems and their applications</source> <volume>13</volume>(<issue>4</issue>), <fpage>18</fpage>-<lpage>28</lpage>. <comment>https://doi.org/10.1109/5254.708428</comment> <pub-id pub-id-type="doi">10.1109/5254.708428</pub-id></mixed-citation></ref>
<ref id="ref18"><mixed-citation publication-type="web"><person-group person-group-type="author"><name><surname>Kassambara</surname><given-names>A.</given-names></name><name><surname>Mundt</surname><given-names>F.</given-names></name></person-group> (<year>2020</year>) <source>Package &#x2018;factoextra&#x2019;: extract and visualize the results of multivariate data analyses. CRAN-R Package</source>. <comment><ext-link ext-link-type="uri" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="https://CRAN.R-project.org/package=factoextra">https://CRAN.R-project.org/package=factoextra</ext-link></comment></mixed-citation></ref>
<ref id="ref19"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kotsiantis</surname><given-names>S.</given-names></name><name><surname>Kanellopoulos</surname><given-names>D.</given-names></name><name><surname>Pintelas</surname><given-names>P.</given-names></name></person-group> (<year>2006</year>) <article-title>Handling imbalanced datasets: A review</article-title>. <source>GESTS International Transactions on Computer Science and Engineering</source> <volume>30</volume>(<issue>1</issue>), <fpage>25</fpage>-<lpage>36</lpage>.</mixed-citation></ref>
<ref id="ref20"><mixed-citation publication-type="web"><person-group person-group-type="author"><name><surname>Kuhn</surname><given-names>M.</given-names></name></person-group> (<year>2022</year>) <source>Package &#x2018;caret&#x2018;: Classification and Regression Training, Version 6.0-94</source>. <comment><ext-link ext-link-type="uri" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="https://cran.r-project.org/web/packages/caret/caret.pdf">https://cran.r-project.org/web/packages/caret/caret.pdf</ext-link></comment></mixed-citation></ref>
<ref id="ref21"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Landis</surname><given-names>J. R.</given-names></name><name><surname>Koch</surname><given-names>G. G.</given-names></name></person-group> (<year>1977</year>) <article-title>The measurement of observer agreement for categorical data</article-title>. <source>Biometrics</source> <volume>33</volume>(<issue>1</issue>), <fpage>159</fpage>-<lpage>174</lpage>. <comment>https://doi.org/10.2307/2529310</comment> <pub-id pub-id-type="doi">10.2307/2529310</pub-id></mixed-citation></ref>
<ref id="ref22"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Malone</surname><given-names>S.</given-names></name><name><surname>Owen</surname><given-names>A.</given-names></name><name><surname>Mendes</surname><given-names>B.</given-names></name><name><surname>Hughes</surname><given-names>B.</given-names></name><name><surname>Collins</surname><given-names>K.</given-names></name><name><surname>Gabbett</surname><given-names>T. J.</given-names></name></person-group> (<year>2018</year>) <article-title>High-speed running and sprinting as an injury risk factor in soccer: Can well-developed physical qualities reduce the risk?</article-title> <source>Journal of Science and Medicine in Sport</source> <volume>21</volume>(<issue>3</issue>), <fpage>257</fpage>-<lpage>262</lpage>. <comment>https://doi.org/10.1016/j.jsams.2017.05.016</comment> <pub-id pub-id-type="doi">10.1016/j.jsams.2017.05.016</pub-id></mixed-citation></ref>
<ref id="ref23"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>McGuigan</surname><given-names>H. E.</given-names></name><name><surname>Hassmen</surname><given-names>P.</given-names></name><name><surname>Rosic</surname><given-names>N.</given-names></name><name><surname>Thornton</surname><given-names>H. R.</given-names></name><name><surname>Stevens</surname><given-names>C. J.</given-names></name></person-group> (<year>2023</year>) <article-title>Does education improve adherence to a training monitoring program in recreational athletes?</article-title> <source>International Journal of Sports Science &#x0026; Coaching</source> <volume>18</volume>(<issue>1</issue>), <fpage>101</fpage>-<lpage>113</lpage>. <comment>https://doi.org/10.1177/17479541211070789</comment> <pub-id pub-id-type="doi">10.1177/17479541211070789</pub-id></mixed-citation></ref>
<ref id="ref24"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Murray</surname><given-names>N. B.</given-names></name><name><surname>Gabbett</surname><given-names>T. J.</given-names></name><name><surname>Townshend</surname><given-names>A. D.</given-names></name><name><surname>Blanch</surname><given-names>P.</given-names></name></person-group> (<year>2017</year>) <article-title>Calculating acute: chronic workload ratios using exponentially weighted moving averages provides a more sensitive indicator of injury likelihood than rolling averages</article-title>. <source>British Journal of Sports Medicine</source> <volume>51</volume>(<issue>9</issue>), <fpage>749</fpage>-<lpage>754</lpage>. <comment>https://doi.org/10.1136/bjsports-2016-097152</comment> <pub-id pub-id-type="doi">10.1136/bjsports-2016-097152</pub-id></mixed-citation></ref>
<ref id="ref25"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nassis</surname><given-names>G. P.</given-names></name><name><surname>Verhagen</surname><given-names>E.</given-names></name><name><surname>Brito</surname><given-names>J.</given-names></name><name><surname>Figueiredo</surname><given-names>P.</given-names></name><name><surname>Krustrup</surname><given-names>P.</given-names></name></person-group> (<year>2023</year>) <article-title>A review of machine learning applications in soccer with an emphasis on injury risk</article-title>. <source>Biology of Sport</source> <volume>40</volume>(<issue>1</issue>), <fpage>233</fpage>-<lpage>239</lpage>. <comment>https://doi.org/10.5114/biolsport.2023.114283</comment> <pub-id pub-id-type="doi">10.5114/biolsport.2023.114283</pub-id></mixed-citation></ref>
<ref id="ref26"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Neuberger</surname><given-names>E. W. I.</given-names></name><name><surname>Brahmer</surname><given-names>A.</given-names></name><name><surname>Ehlert</surname><given-names>T.</given-names></name><name><surname>Kluge</surname><given-names>K.</given-names></name><name><surname>Philippi</surname><given-names>K. F. A.</given-names></name><name><surname>Boedecker</surname><given-names>S. C.</given-names></name><name><surname>Weinmann-Menke</surname><given-names>J.</given-names></name><name><surname>Simon</surname><given-names>P.</given-names></name></person-group> (<year>2021</year>) <article-title>Validating quantitative PCR assays for cfDNA detection without DNA extraction in exercising SLE patients</article-title>. <source>Scientific Reports</source> <volume>11</volume>(<issue>1</issue>) <comment>https://doi.org/10.1038/s41598-021-92826-4</comment> <pub-id pub-id-type="doi">10.1038/s41598-021-92826-4</pub-id></mixed-citation></ref>
<ref id="ref27"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Opar</surname><given-names>D. A.</given-names></name><name><surname>Piatkowski</surname><given-names>T.</given-names></name><name><surname>Williams</surname><given-names>M. D.</given-names></name><name><surname>Shield</surname><given-names>A. J.</given-names></name></person-group> (<year>2013</year>) <article-title>A Novel Device Using the Nordic Hamstring Exercise to Assess Eccentric Knee Flexor Strength: A Reliability and Retrospective Injury Study</article-title>. <source>Journal of Orthopaedic &#x0026; Sports Physical Therapy</source> <volume>43</volume>(<issue>9</issue>), <fpage>636</fpage>-<lpage>640</lpage>. <comment>https://doi.org/10.2519/jospt.2013.4837</comment> <pub-id pub-id-type="doi">10.2519/jospt.2013.4837</pub-id></mixed-citation></ref>
<ref id="ref28"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rodas</surname><given-names>G.</given-names></name><name><surname>Osaba</surname><given-names>L.</given-names></name><name><surname>Arteta</surname><given-names>D.</given-names></name><name><surname>Pruna</surname><given-names>R.</given-names></name><name><surname>Fernandez</surname><given-names>D.</given-names></name><name><surname>Lucia</surname><given-names>A.</given-names></name></person-group> (<year>2020</year>) <article-title>Genomic Prediction of Tendinopathy Risk in Elite Team Sports</article-title>. <source>International Journal of Sports Physiology and Performance</source> <volume>15</volume>(<issue>4</issue>), <fpage>489</fpage>-<lpage>495</lpage>. <comment>https://doi.org/10.1123/ijspp.2019-0431</comment> <pub-id pub-id-type="doi">10.1123/ijspp.2019-0431</pub-id></mixed-citation></ref>
<ref id="ref29"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rommers</surname><given-names>N.</given-names></name><name><surname>Rossler</surname><given-names>R.</given-names></name><name><surname>Verhagen</surname><given-names>E.</given-names></name><name><surname>Vandecasteele</surname><given-names>F.</given-names></name><name><surname>Verstockt</surname><given-names>S.</given-names></name><name><surname>Vaeyens</surname><given-names>R.</given-names></name><name><surname>Lenoir</surname><given-names>M.</given-names></name><name><surname>D'Hondt</surname><given-names>E.</given-names></name><name><surname>Witvrouw</surname><given-names>E.</given-names></name></person-group> (<year>2020</year>) <article-title>A Machine Learning Approach to Assess Injury Risk in Elite Youth Football Players</article-title>. <source>Medicine &#x0026; Science in Sports &#x0026; Exercise</source> <volume>52</volume>(<issue>8</issue>), <fpage>1745</fpage>-<lpage>1751</lpage>. <comment>https://doi.org/10.1249/Mss.0000000000002305</comment> <pub-id pub-id-type="doi">10.1249/Mss.0000000000002305</pub-id></mixed-citation></ref>
<ref id="ref30"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rossi</surname><given-names>A.</given-names></name><name><surname>Pappalardo</surname><given-names>L.</given-names></name><name><surname>Cintia</surname><given-names>P.</given-names></name><name><surname>Iaia</surname><given-names>F. M.</given-names></name><name><surname>Fernandez</surname><given-names>J.</given-names></name><name><surname>Medina</surname><given-names>D.</given-names></name></person-group> (<year>2018</year>) <article-title>Effective injury forecasting in soccer with GPS training data and machine learning</article-title>. <source>Plos One</source> <volume>13</volume>(<issue>7</issue>) <comment>https://doi.org/10.1371/journal.pone.0201264</comment> <pub-id pub-id-type="doi">10.1371/journal.pone.0201264</pub-id></mixed-citation></ref>
<ref id="ref31"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rossi</surname><given-names>A.</given-names></name><name><surname>Pappalardo</surname><given-names>L.</given-names></name><name><surname>Filetti</surname><given-names>C.</given-names></name><name><surname>Cintia</surname><given-names>P.</given-names></name></person-group> (<year>2023</year>) <article-title>Blood sample profile helps to injury forecasting in elite soccer players</article-title>. <source>Sport Sciences for Health</source> <volume>19</volume>(<issue>1</issue>), <fpage>285</fpage>-<lpage>296</lpage>. <comment>https://doi.org/10.1007/s11332-022-00932-1</comment> <pub-id pub-id-type="doi">10.1007/s11332-022-00932-1</pub-id></mixed-citation></ref>
<ref id="ref32"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ruddy</surname><given-names>J. D.</given-names></name><name><surname>Shield</surname><given-names>A. J.</given-names></name><name><surname>Maniar</surname><given-names>N.</given-names></name><name><surname>Williams</surname><given-names>M. D.</given-names></name><name><surname>Duhig</surname><given-names>S.</given-names></name><name><surname>Timmins</surname><given-names>R. G.</given-names></name><name><surname>Hickey</surname><given-names>J.</given-names></name><name><surname>Bourne</surname><given-names>M. N.</given-names></name><name><surname>Opar</surname><given-names>D. A.</given-names></name></person-group> (<year>2018</year>) <article-title>Predictive Modeling of Hamstring Strain Injuries in Elite Australian Footballers</article-title>. <source>Medicine &#x0026; Science in Sports &#x0026; Exercise</source> <volume>50</volume>(<issue>5</issue>), <fpage>906</fpage>-<lpage>914</lpage>. <comment>https://doi.org/10.1249/MSS.0000000000001527</comment> <pub-id pub-id-type="doi">10.1249/MSS.0000000000001527</pub-id></mixed-citation></ref>
<ref id="ref33"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Saw</surname><given-names>A. E.</given-names></name><name><surname>Main</surname><given-names>L. C.</given-names></name><name><surname>Gastin</surname><given-names>P. B.</given-names></name></person-group> (<year>2016</year>) <article-title>Monitoring the athlete training response: subjective self-reported measures trump commonly used objective measures: a systematic review [Research Support, Non-U.S. Gov't Review]</article-title>. <source>British Journal of Sports Medicine</source> <volume>50</volume>(<issue>5</issue>), <fpage>281</fpage>-<lpage>291</lpage>. <comment>https://doi.org/10.1136/bjsports-2015-094758</comment> <pub-id pub-id-type="doi">10.1136/bjsports-2015-094758</pub-id></mixed-citation></ref>
<ref id="ref34"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Schwellnus</surname><given-names>M.</given-names></name><name><surname>Soligard</surname><given-names>T.</given-names></name><name><surname>Alonso</surname><given-names>J. M.</given-names></name><name><surname>Bahr</surname><given-names>R.</given-names></name><name><surname>Clarsen</surname><given-names>B.</given-names></name><name><surname>Dijkstra</surname><given-names>H. P.</given-names></name><name><surname>Gabbett</surname><given-names>T. J.</given-names></name><name><surname>Gleeson</surname><given-names>M.</given-names></name><name><surname>Hagglund</surname><given-names>M.</given-names></name><name><surname>Hutchinson</surname><given-names>M. R.</given-names></name><name><surname>Janse Van Rensburg</surname><given-names>C.</given-names></name><name><surname>Meeusen</surname><given-names>R.</given-names></name><name><surname>Orchard</surname><given-names>J. W.</given-names></name><name><surname>Pluim</surname><given-names>B. M.</given-names></name><name><surname>Raftery</surname><given-names>M.</given-names></name><name><surname>Budgett</surname><given-names>R.</given-names></name><name><surname>Engebretsen</surname><given-names>L.</given-names></name></person-group> (<year>2016</year>) <article-title>How much is too much? (Part 2) International Olympic Committee consensus statement on load in sport and risk of illness [Consensus Development Conference]</article-title>. <source>British Journal of Sports Medicine</source> <volume>50</volume>(<issue>17</issue>), <fpage>1043</fpage>-<lpage>1052</lpage>. <comment>https://doi.org/10.1136/bjsports-2016-096572</comment> <pub-id pub-id-type="doi">10.1136/bjsports-2016-096572</pub-id></mixed-citation></ref>
<ref id="ref35"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Siriseriwan</surname><given-names>W.</given-names></name></person-group> (<year>2019</year>) <article-title>Smotefamily: A collection of oversampling techniques for class imbalance problem based on SMOTE</article-title>. <source>R Package Version</source>, <volume>1</volume>(<issue>1</issue>)</mixed-citation></ref>
<ref id="ref36"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Soligard</surname><given-names>T.</given-names></name><name><surname>Schwellnus</surname><given-names>M.</given-names></name><name><surname>Alonso</surname><given-names>J. M.</given-names></name><name><surname>Bahr</surname><given-names>R.</given-names></name><name><surname>Clarsen</surname><given-names>B.</given-names></name><name><surname>Dijkstra</surname><given-names>H. P.</given-names></name><name><surname>Gabbett</surname><given-names>T.</given-names></name><name><surname>Gleeson</surname><given-names>M.</given-names></name><name><surname>Hagglund</surname><given-names>M.</given-names></name><name><surname>Hutchinson</surname><given-names>M. R.</given-names></name><name><surname>van Rensburg</surname><given-names>C. J.</given-names></name><name><surname>Khan</surname><given-names>K. M.</given-names></name><name><surname>Meeusen</surname><given-names>R.</given-names></name><name><surname>Orchard</surname><given-names>J. W.</given-names></name><name><surname>Pluim</surname><given-names>B. M.</given-names></name><name><surname>Raftery</surname><given-names>M.</given-names></name><name><surname>Budgett</surname><given-names>R.</given-names></name><name><surname>Engebretsen</surname><given-names>L.</given-names></name></person-group> (<year>2016</year>) <article-title>How much is too much? (Part 1) International Olympic Committee consensus statement on load in sport and risk of injury</article-title>. <source>British Journal of Sports Medicine</source> <volume>50</volume>(<issue>17</issue>), <fpage>1030</fpage>-<lpage>1041</lpage>. <comment>https://doi.org/10.1136/bjsports-2016-096581</comment> <pub-id pub-id-type="doi">10.1136/bjsports-2016-096581</pub-id></mixed-citation></ref>
<ref id="ref37"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Stagno</surname><given-names>K. M.</given-names></name><name><surname>Thatcher</surname><given-names>R.</given-names></name><name><surname>Van Someren</surname><given-names>K. A.</given-names></name></person-group> (<year>2007</year>) <article-title>A modified TRIMP to quantify the in-season training load of team sport players</article-title>. <source>Journal of Sports Sciences</source> <volume>25</volume>(<issue>6</issue>), <fpage>629</fpage>-<lpage>634</lpage>. <comment>https://doi.org/10.1080/02640410600811817</comment> <pub-id pub-id-type="doi">10.1080/02640410600811817</pub-id></mixed-citation></ref>
<ref id="ref38"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>St&#x00F6;ggl</surname><given-names>T. L.</given-names></name><name><surname>Blumkaitis</surname><given-names>J. C.</given-names></name><name><surname>Strepp</surname><given-names>T.</given-names></name><name><surname>Sareban</surname><given-names>M.</given-names></name><name><surname>Simon</surname><given-names>P.</given-names></name><name><surname>Neuberger</surname><given-names>E. W. I.</given-names></name><name><surname>Finkenzeller</surname><given-names>T.</given-names></name><name><surname>Nunes</surname><given-names>N.</given-names></name><name><surname>Aglas</surname><given-names>L.</given-names></name><name><surname>Haller</surname><given-names>N.</given-names></name></person-group> (<year>2022</year>) <article-title>The Salzburg 10/7 HIIT shock cycle study: the effects of a 7-day high-intensity interval training shock microcycle with or without additional low-intensity training on endurance performance, well-being, stress and recovery in endurance trained athletes-study protocol of a randomized controlled trial</article-title>. <source>Bmc Sports Science Medicine and Rehabilitation</source> <volume>14</volume>(<issue>1</issue>) <comment>https://doi.org/10.1186/s13102-022-00456-8</comment> <pub-id pub-id-type="doi">10.1186/s13102-022-00456-8</pub-id></mixed-citation></ref>
<ref id="ref39"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Suthaharan</surname><given-names>S.</given-names></name></person-group> (<year>2016</year>) <article-title>Machine learning models and algorithms for big data classification</article-title>. <source>Integrated Serien in Information Systems</source> <volume>36</volume>, <fpage>1</fpage>-<lpage>12</lpage>. <comment>https://doi.org/10.1007/978-1-4899-7641-3_1</comment> <pub-id pub-id-type="doi">10.1007/978-1-4899-7641-3_1</pub-id></mixed-citation></ref>
<ref id="ref40"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Twist</surname><given-names>C.</given-names></name><name><surname>Highton</surname><given-names>J.</given-names></name></person-group> (<year>2013</year>) <article-title>Monitoring fatigue and recovery in rugby league players</article-title>. <source>International Journal of Sports Physiology and Performance</source> <volume>8</volume>(<issue>5</issue>), <fpage>467</fpage>-<lpage>474</lpage>. <comment>https://doi.org/10.1123/ijspp.8.5.467</comment> <pub-id pub-id-type="doi">10.1123/ijspp.8.5.467</pub-id></mixed-citation></ref>
<ref id="ref41"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Van Eetvelde</surname><given-names>H.</given-names></name><name><surname>Mendonca</surname><given-names>L. D.</given-names></name><name><surname>Ley</surname><given-names>C.</given-names></name><name><surname>Seil</surname><given-names>R.</given-names></name><name><surname>Tischer</surname><given-names>T.</given-names></name></person-group> (<year>2021</year>) <article-title>Machine learning methods in sport injury prediction and prevention: a systematic review</article-title>. <source>Journal of Experimental Orthopaedics</source> <volume>8</volume>(<issue>1</issue>) <comment>https://doi.org/10.1186/s40634-021-00346-x</comment> <pub-id pub-id-type="doi">10.1186/s40634-021-00346-x</pub-id></mixed-citation></ref>
<ref id="ref42"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Watkins</surname><given-names>C. M.</given-names></name><name><surname>Barillas</surname><given-names>S. R.</given-names></name><name><surname>Wong</surname><given-names>M. A.</given-names></name><name><surname>Archer</surname><given-names>D. C.</given-names></name><name><surname>Dobbs</surname><given-names>I. J.</given-names></name><name><surname>Lockie</surname><given-names>R. G.</given-names></name><name><surname>Coburn</surname><given-names>J. W.</given-names></name><name><surname>Tran</surname><given-names>T. T.</given-names></name><name><surname>Brown</surname><given-names>L. E.</given-names></name></person-group> (<year>2017</year>) <article-title>Determination of Vertical Jump as a Measure of Neuromuscular Readiness and Fatigue</article-title>. <source>Journal of Strength and Conditioning Research</source> <volume>31</volume>(<issue>12</issue>), <fpage>3305</fpage>-<lpage>3310</lpage>. <comment>https://doi.org/Doi 10.1519/Jsc.0000000000002231</comment> <pub-id pub-id-type="doi">10.1519/Jsc.0000000000002231</pub-id></mixed-citation></ref>
<ref id="ref43"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Watson</surname><given-names>A.</given-names></name><name><surname>Brickson</surname><given-names>S.</given-names></name><name><surname>Brooks</surname><given-names>M. A.</given-names></name><name><surname>Dunn</surname><given-names>W.</given-names></name></person-group> (<year>2017</year>) <article-title>Preseason Aerobic Fitness Predicts In-Season Injury and Illness in Female Youth Athletes</article-title>. <source>Orthopaedic Journal of Sports Medicine</source> <volume>5</volume>(<issue>9</issue>), <fpage>2325967117726976</fpage>. <comment>https://doi.org/10.1177/2325967117726976</comment> <pub-id pub-id-type="doi">10.1177/2325967117726976</pub-id></mixed-citation></ref>
<ref id="ref44"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Weiss</surname><given-names>G. M.</given-names></name><name><surname>Provost</surname><given-names>F.</given-names></name></person-group> (<year>2001</year>) <source>The effect of class distribution on classifier learning: an empirical study.</source> <publisher-name>Rutgers University</publisher-name>.</mixed-citation></ref>
<ref id="ref45"><mixed-citation publication-type="web"><person-group person-group-type="author"><name><surname>Wu</surname><given-names>D.</given-names></name></person-group> (<year>2022</year>) <article-title>Resampling Strategies for Binary Imbalanced Datasets</article-title>. <source>R package version 0.0.2.0000</source>. <comment><ext-link ext-link-type="uri" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="https://github.com/dongyuanwu/RSBID">https://github.com/dongyuanwu/RSBID</ext-link></comment></mixed-citation></ref>
</ref-list>
</back>
<floats-group>
<fig id="fig001" position="float">
<label>Figure 1.</label>
<caption><p><bold>Outline of the study with a regular week.</bold> The legend on the right shows which measurements were taken on which day. MD = match day with "+"/"-" signs indicate the distance in days to regular season matches, AM = morning, PM = afternoon/evening, Hip ABD = hip abduction strength, Hip ADD = hip adduction strength, CMJ= counter movement jump testing, LPS = Local Positioning System, S&#x0026;C = Strength and Conditioning. The figure is analogous to that used in our pilot study (Haller et al., <xref ref-type="bibr" rid="ref13">2022</xref>).</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jssm-22-475-g001.tif" mime-subtype="tif"/>
</fig>
<fig id="fig002" position="float">
<label>Figure 2.</label>
<caption><p><bold>Average sleep quality per player (Study ID) for each week.</bold> Different colors indicate the sleep quality with lighter colors indicating better sleep quality rating. Weeks with missing values are shown in grey. Weeks in which the questionnaire was not completed on any day are shown in grey.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jssm-22-475-g002.tif" mime-subtype="tif"/>
</fig>
<fig id="fig003" position="float">
<label>Figure 3.</label>
<caption><p><bold>Plot of the ten most important variables according to ROC curve variable importance for each of the three classification tasks.</bold> ACWR: acute:chronic workload ratio, mean x8-x28: mean value over 3 weeks days 8 to 28, HR: heart rate, cfDNA: cell-free DNA, CRP: c-reactive protein, EOS: eosinophile; MCHC: Mean corpuscular hemoglobin concentration, BAS: basophils, TP: total protein, HCT: hematocrit, GLU: glucose, LYMPH: lymphocytes, MG: magnesium, Crea: creatinine, UA: uric acid, -%: percentage.</p></caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="jssm-22-475-g003.tif" mime-subtype="tif"/>
</fig>
<table-wrap id="table001" position="float" orientation="portrait">
<label>Table 1.</label>
<caption><p>Overview of the classification tasks.</p></caption>
<table rules="all" frame="box">
<thead>
<tr>
<th align="left" valign="middle">Classification Task</th>
<th align="center" valign="middle">Model</th>
<th align="center" valign="middle">Types and number of variables included</th>
<th align="center" valign="middle">Training data set data points (before oversampling)</th>
<th align="center" valign="middle">Training data set data points (after oversampling)</th>
<th align="center" valign="middle">Test data set data points</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Injury<break/>prediction</td>
<td align="center" valign="middle">linear SVM</td>
<td align="center" valign="middle">Training load, blood, fitness, questionnaire, jump variables (247)</td>
<td align="center" valign="middle">1.085<break/>(incl. 7 injuries)</td>
<td align="center" valign="middle">1.347<break/>(incl. 269 injuries)</td>
<td align="center" valign="middle">300<break/>(incl. 4 injuries)</td>
</tr>
<tr>
<td align="left" valign="middle">Illness<break/>prediction</td>
<td align="center" valign="middle">linear SVM</td>
<td align="center" valign="middle">Blood variables<break/>(40)</td>
<td align="center" valign="middle">283<break/>(incl. 11 illnesses)</td>
<td align="center" valign="middle">543<break/>(incl. 271 illnesses)</td>
<td align="center" valign="middle">60<break/>(incl. 1 illness)</td>
</tr>
<tr>
<td align="left" valign="middle">Illness<break/>determination</td>
<td align="center" valign="middle">linear SVM</td>
<td align="center" valign="middle">Blood variables<break/>(40)</td>
<td align="center" valign="middle">177<break/>(incl. 9 illnesses)</td>
<td align="center" valign="middle">337<break/>(incl. 169 illnesses)</td>
<td align="center" valign="middle">42<break/>(incl. 1 illness)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn><p>Injury prediction: 11 injuries present in the sample, with 8 different players affected; Illness prediction: 12 illnesses present in the sample, with 10 different players affected; Illness determination: 10 illnesses present in the sample, with 5 different players affected. Differences in the numbers of illness prediction and detection possible due to non-appearance for blood collection, when already ill.</p></fn>
</table-wrap-foot>
</table-wrap>
<table-wrap id="table002" position="float" orientation="portrait">
<label>Table 2.</label>
<caption><p>Classification results of the three classification tasks. Accuracy, Cohens Kappa, F1-Score and Specificity of the test data set.</p></caption>
<table rules="all" frame="box">
<thead>
<tr>
<th align="left" valign="middle">Model</th>
<th align="center" valign="middle">Accuracy,<break/>in %</th>
<th align="center" valign="middle">Precision,<break/>in %</th>
<th align="center" valign="middle">Recall,<break/>in %</th>
<th align="center" valign="middle">Cohens<break/>Kappa</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle"><bold>Injury</bold><break/><bold>prediction</bold></td>
<td align="center" valign="middle">96.3</td>
<td align="center" valign="middle">11.1</td>
<td align="center" valign="middle">25.0</td>
<td align="center" valign="middle">0.138</td>
</tr>
<tr>
<td align="left" valign="middle"><bold>Illness</bold><break/><bold>prediction</bold></td>
<td align="center" valign="middle">66.7</td>
<td align="center" valign="middle">4.8</td>
<td align="center" valign="middle">100.0</td>
<td align="center" valign="middle">0.061</td>
</tr>
<tr>
<td align="left" valign="middle"><bold>Illness</bold><break/><bold>determination</bold></td>
<td align="center" valign="middle">100.0</td>
<td align="center" valign="middle">100.0</td>
<td align="center" valign="middle">100.0</td>
<td align="center" valign="middle">1</td>
</tr>
</tbody>
</table>
</table-wrap>
</floats-group>
</article>