<?xml version="1.0" encoding="UTF-8"?>
<doi_batch version="4.4.2" xmlns="http://www.crossref.org/schema/4.4.2" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:jats="http://www.ncbi.nlm.nih.gov/JATS1" xsi:schemaLocation="http://www.crossref.org/schema/4.4.2 http://www.crossref.org/schema/deposit/crossref4.4.2.xsd">
<head>
<doi_batch_id>-3bf97310184a13a8c1e-1bd5</doi_batch_id>
<timestamp>20230204051438795</timestamp>
<depositor>
  <depositor_name>beie:beie</depositor_name> 
  <email_address>director@blueeyesintelligence.org</email_address>
</depositor>
<registrant>WEB-FORM</registrant> 
</head>
<body>
<journal>
<journal_metadata>   <full_title>International Journal of Innovative Technology and Exploring Engineering</full_title>   <abbrev_title>IJITEE</abbrev_title>   <issn media_type='electronic'>22783075</issn>   <doi_data>     <doi>10.35940/ijitee</doi>     <resource>https://www.ijitee.org/</resource>   </doi_data> </journal_metadata> <journal_issue>  <publication_date media_type='online'>     <month>02</month>     <day>28</day>     <year>2023</year>   </publication_date>   <journal_volume>     <volume>12</volume>   </journal_volume>   <issue>3</issue> </journal_issue><!-- ============== --> <journal_article publication_type='full_text'>   <titles>     <title>Determine the Undervalued US Major League Baseball Players with Machine Learning</title>   </titles>   <contributors>      <organization sequence='first' contributor_role='author'>Assistant Professor, Department of Mathematical Sciences, Middle Tennessee State University, Murfreesboro, USA</organization>    <person_name sequence='first' contributor_role='author'>      <given_name>Lu</given_name>      <surname>Xiong</surname>      <ORCID>https://orcid.org/0000-0003-2471-1256</ORCID>    </person_name>    <person_name sequence='additional' contributor_role='author'>       <given_name>Kechen</given_name>       <surname>Tian</surname>       <ORCID>https://orcid.org/0000-0002-5481-0012</ORCID>     </person_name>     <organization sequence='additional' contributor_role='author'>Department of Mathematical Sciences, Middle Tennessee State University, Murfreesboro, USA</organization>     <person_name sequence='additional' contributor_role='author'>       <given_name>Yuwen</given_name>       <surname>Qian</surname>       <ORCID>https://orcid.org/0000-0002-3210-5961</ORCID>     </person_name>     <organization sequence='additional' contributor_role='author'>Department of Mathematical Sciences, Middle Tennessee State University, Murfreesboro, USA</organization>     <person_name sequence='additional' contributor_role='author'>       <given_name>Wilson</given_name>       <surname>Musyoka</surname>       <ORCID>https://orcid.org/0000-0002-6102-4597</ORCID>     </person_name>     <organization sequence='additional' contributor_role='author'>Department of Mathematical Sciences, Middle Tennessee State University, Murfreesboro, USA</organization>     <person_name sequence='additional' contributor_role='author'>       <given_name>Xingyu</given_name>       <surname>Chen</surname>       <ORCID>https://orcid.org/0000-0001-5716-2121</ORCID>     </person_name>     <organization sequence='additional' contributor_role='author'>Department of Mathematical Sciences, Middle Tennessee State University, Murfreesboro, USA</organization>   </contributors>    <jats:abstract xml:lang='en'>         <jats:p>Baseball is a sport of statistics. The industry has accumulated detailed offensive and defensive statistical data for over a century. Experience has shown that data analysis can give a competitive advantage compared to teams without using such analysis. In the last two decades, with the development of machine learning and artificial intelligence, we have had more advanced algorithms to analyze data in baseball. In the following research, we will run different ML models using sci-kit-learn and H2O on Colab, and the Caret package on RStudio to examine the datasets (hitting dataset and salary dataset) and determine the undervalued players by predicting the number of runs scored in the next year. We will compare machine learning regression algorithms and ensemble methods and give comprehensive explanations of the result. The suggestion of which model is superior in terms of prediction accuracy will be determined.</jats:p>     </jats:abstract>  <publication_date media_type='online'>     <month>02</month>     <day>28</day>     <year>2023</year>   </publication_date>   <pages>     <first_page>17</first_page>     <last_page>24</last_page>   </pages>   <crossmark>     <crossmark_version>CC BY-NC-ND 4.0</crossmark_version>     <crossmark_policy>10.35940/BEIESP.CrossMarkPolicy</crossmark_policy>     <crossmark_domains>       <crossmark_domain>          <domain>www.ijitee.org</domain>       </crossmark_domain>     </crossmark_domains>     <crossmark_domain_exclusive>true</crossmark_domain_exclusive>     <custom_metadata>       <assertion explanation='Funding' group_label='Funding' group_name='Funding' name='Declaration' order='0'>No, I did not receive.</assertion>       <assertion explanation='Conflicts of Interest' group_label='Conflicts of Interest' group_name='Conflicts-of-Interest' name='Declaration' order='1'>No conflicts of interest to the best of our knowledge.</assertion>       <assertion explanation='Ethical Approval and Consent to Participate' group_label='Ethical Approval and Consent to Participate' group_name='Ethical-Approval-and-Consent-to-Participate' name='Declaration' order='2'>No, the article does not require ethical approval and consent to participate with evidence.</assertion>       <assertion explanation='Availability of Data and Material' group_label='Availability of Data and Material' group_name='Availability-of-Data-and-Material' name='Declaration' order='3'>The datasets used and/or analyzed during the current study are available from the corresponding author upon reasonable request.</assertion>       <assertion explanation='Authors Contributions' group_label='Authors Contributions' group_name='Authors-Contributions' name='Declaration' order='4'>Lu Xiong: the overall research strategy, direction, ideas, team management, and writing.  Kechen Tian: coding and results summary. Yuwen Qian: literature review and citations. Wilson Musyoka: data description and general introduction of SVM. Xingyu Chen: model evaluation and interpretation.</assertion>     </custom_metadata>   </crossmark>   <doi_data>     <doi>10.35940/ijitee.B9406.0212323</doi>     <resource>https://www.ijitee.org/portfolio-item/B94060112223/</resource>   </doi_data> </journal_article>
</journal>
</body>
</doi_batch>
