I would like to create an AI that will help me query some football XML files.
I have around 100k XML files that contain events for football matches (example below), and I would like to teach an AI how to read this data and implement a sort of “chat” to interact with it.
Example: “How many passes have been made by Atalanta in Serie A?”
In this case the model should find, among all the XML files, the ones that contain a reference to “Atalanta” and “Serie A” (each XML file contains only the IDs of the competition and the teams, but there are other XML files that map each ID to its team name) and count the tags whose “type” attribute equals “PASS” (here too, there is a separate XML file that maps the name of each event to its code in the XML).
I’m pretty new to the model training / AI world, and I would like to know which model would be best to use and how to get started. I’ve searched a little on the internet and found that for simple tasks like this I could use a rule-based system or a decision tree model.
I’m also not sure whether the model can read the XML directly or whether I need to convert the files into CSV or a Pandas DataFrame, so if you have any tips, please let me know.
For the chat part, I’ve read about Flask and Django, which are available for Python, but I’ve never used them, so I’m new to this part as well.
Please let me know what your suggestions are and whether you have any tips for me.
I haven’t written any code yet because I would first like to know which approach would be the best one to develop.
An example of one of the XML files is the following:
PS: there are around 2,000 events per match in each XML file.
<game repotime="2023-11-20 10:33:48">
<PLAYERS modulo1="343" modulo2="3421" colore1="255x0x0x128" colore2="255x255x255x255" rev="-1" revSics="14">
<PLAYER nome="MUSSO J." id="16872" numero="1" ruolo="P" team="1" posMod="1" pos="1.0;4.0" esp="-1" sos="-1" sub="-1" />
<PLAYER nome="SCALVINI G." id="23599" numero="42" ruolo="D" team="1" posMod="2" pos="3.0;6.0" esp="-1" sos="-1" sub="-1" />
<PLAYER nome="DJIMSITI B." id="10288" numero="19" ruolo="D" team="1" posMod="3" pos="2.7;4.0" esp="-1" sos="-1" sub="-1" />
<PLAYER nome="KOLASINAC S." id="10832" numero="23" ruolo="D" team="1" posMod="4" pos="3.0;2.0" esp="-1" sos="5466235" sub="-1" />
<PLAYER nome="ZAPPACOSTA D." id="6461" numero="77" ruolo="D" team="1" posMod="5" pos="5.3;7.0" esp="-1" sos="4639256" sub="-1" />
<PLAYER nome="DE ROON M." id="8630" numero="15" ruolo="C" team="1" posMod="6" pos="4.7;5.0" esp="-1" sos="-1" sub="-1" />
<PLAYER nome="EDERSON" id="30828" numero="13" ruolo="C" team="1" posMod="7" pos="4.7;3.0" esp="-1" sos="-1" sub="-1" />
<PLAYER nome="RUGGERI M." id="23628" numero="22" ruolo="D" team="1" posMod="8" pos="5.3;1.0" esp="-1" sos="4652630" sub="-1" />
<PLAYER nome="DE KETELAERE C." id="22258" numero="17" ruolo="A" team="1" posMod="9" pos="6.7;6.0" esp="-1" sos="5008198" sub="-1" />
<PLAYER nome="SCAMACCA G." id="14684" numero="90" ruolo="A" team="1" posMod="10" pos="6.5;4.0" esp="-1" sos="5008198" sub="-1" />
<PLAYER nome="KOOPMEINERS T." id="14256" numero="7" ruolo="C" team="1" posMod="11" pos="6.7;2.0" esp="-1" sos="-1" sub="-1" />
<PLAYER nome="HOLM E." id="26709" numero="3" ruolo="D" team="1" posMod="12" pos="5.3;7.0" esp="-1" sos="-1" sub="4639256" />
<PLAYER nome="BAKKER M." id="23529" numero="20" ruolo="D" team="1" posMod="13" pos="5.3;1.0" esp="-1" sos="-1" sub="4652630" />
<PLAYER nome="MURIEL L." id="6333" numero="9" ruolo="A" team="1" posMod="14" pos="6.5;4.0" esp="-1" sos="-1" sub="5008198" />
<PLAYER nome="LOOKMAN A." id="15518" numero="11" ruolo="A" team="1" posMod="15" pos="6.7;6.0" esp="-1" sos="-1" sub="5008198" />
<PLAYER nome="PALOMINO J. L." id="13249" numero="6" ruolo="D" team="1" posMod="16" pos="3.0;2.0" esp="-1" sos="-1" sub="5466235" />
<PLAYER nome="DI GREGORIO M." id="14464" numero="16" ruolo="P" team="2" posMod="1" pos="1.0;4.0" esp="-1" sos="-1" sub="-1" />
<PLAYER nome="IZZO A." id="6516" numero="4" ruolo="D" team="2" posMod="2" pos="3.0;6.0" esp="-1" sos="-1" sub="-1" />
<PLAYER nome="MARI' P." id="25359" numero="22" ruolo="D" team="2" posMod="3" pos="2.7;4.0" esp="-1" sos="4060555" sub="-1" />
<PLAYER nome="CALDIROLA L." id="19128" numero="5" ruolo="D" team="2" posMod="4" pos="2.578947;4.113821" esp="-1" sos="-1" sub="-1" />
<PLAYER nome="BIRINDELLI S." id="12913" numero="19" ruolo="D" team="2" posMod="5" pos="5.3;7.0" esp="-1" sos="-1" sub="-1" />
<PLAYER nome="GAGLIARDINI R." id="5884" numero="6" ruolo="C" team="2" posMod="6" pos="4.7;5.0" esp="-1" sos="4069771" sub="-1" />
<PLAYER nome="PESSINA M." id="12538" numero="32" ruolo="C" team="2" posMod="7" pos="3.9105277;3.9756107" esp="-1" sos="-1" sub="-1" />
<PLAYER nome="CIURRIA P." id="5866" numero="84" ruolo="A" team="2" posMod="8" pos="5.3;1.0" esp="-1" sos="-1" sub="-1" />
<PLAYER nome="COLPANI A." id="20996" numero="28" ruolo="C" team="2" posMod="9" pos="6.1;5.0" esp="-1" sos="4584666" sub="-1" />
<PLAYER nome="CAPRARI G." id="5795" numero="10" ruolo="A" team="2" posMod="10" pos="6.1;3.0" esp="-1" sos="3714549" sub="-1" />
<PLAYER nome="MOTA D." id="11936" numero="47" ruolo="A" team="2" posMod="11" pos="7.1;4.0" esp="-1" sos="3713054" sub="-1" />
<PLAYER nome="VIGNATO S." id="23539" numero="80" ruolo="C" team="2" posMod="12" pos="7.257893;2.9349594" esp="-1" sos="-1" sub="3714549" />
<PLAYER nome="COLOMBO L." id="16068" numero="9" ruolo="A" team="2" posMod="13" pos="7.363157;4.8130074" esp="-1" sos="-1" sub="3713054" />
<PLAYER nome="CARBONI A." id="23486" numero="44" ruolo="D" team="2" posMod="14" pos="2.857895;2.4065056" esp="-1" sos="-1" sub="4060555" />
<PLAYER nome="BONDO W." id="33692" numero="38" ruolo="C" team="2" posMod="15" pos="4.542105;4.869919" esp="-1" sos="-1" sub="4069771" />
<PLAYER nome="MACHIN J." id="11636" numero="7" ruolo="C" team="2" posMod="16" pos="4.6789484;3.0162613" esp="-1" sos="-1" sub="4584666" />
</PLAYERS>
<EVENT idevent="PASS03092023063506" idgroup="PASS03092023063506" type="PASS" start="10000" end="15008" half="1" idteam="2" player="MOTA D." idplayer="11936" playerTo="PESSINA M." idplayerTo="12538" pos="52.41;34.23" pos1="63.00;37.61" note="" esito="-1">
<TAGS>
<TAG cod="PASS-0" />
</TAGS>
</EVENT>
<EVENT idevent="PIF030920231259341" idgroup="PASS03092023063506" type="PIF" start="10000" end="15008" half="1" idteam="2" player="MOTA D." idplayer="11936" playerTo="PESSINA M." idplayerTo="12538" pos="52.41;34.23" pos1="63.00;37.61" note="" esito="2">
<TAGS>
<TAG cod="PIF-6" />
<TAG cod="PIF-10" />
</TAGS>
</EVENT>
<EVENT idevent="PIC030920231259341as" idgroup="PASS03092023063506" type="PIC" start="10000" end="15008" half="1" idteam="1" pos="52.41;34.23" pos1="63.00;37.61" player="" idplayer="" playerTo="" idplayerTo="" note="" esito="-1">
<TAGS>
<TAG cod="PIC-6" />
<TAG cod="PIC-10" />
</TAGS>
</EVENT>
...
</game>
Marco Zen is a new contributor to this site. Take care in asking for clarification, commenting, and answering.
Check out our Code of Conduct.