<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.0 20120330//EN" "JATS-journalpublishing1.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">JDS</journal-id>
<journal-title-group><journal-title>Journal of Data Science</journal-title></journal-title-group>
<issn pub-type="epub">1683-8602</issn><issn pub-type="ppub">1680-743X</issn><issn-l>1680-743X</issn-l>
<publisher>
<publisher-name>School of Statistics, Renmin University of China</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">JDS1200</article-id>
<article-id pub-id-type="doi">10.6339/25-JDS1200</article-id>
<article-categories><subj-group subj-group-type="heading">
<subject>Statistical Data Science</subject></subj-group></article-categories>
<title-group>
<article-title>Q-learning with Compound Outcome and Mixed Misclassification and Measurement Error in Covariates</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-2669-558X</contrib-id>
<name><surname>Khadem Charvadeh</surname><given-names>Yasin</given-names></name><xref ref-type="aff" rid="j_jds1200_aff_001">1</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Yi</surname><given-names>Grace Y.</given-names></name><email xlink:href="mailto:gyi5@uwo.ca">gyi5@uwo.ca</email><xref ref-type="aff" rid="j_jds1200_aff_001">1</xref><xref ref-type="aff" rid="j_jds1200_aff_002">2</xref><xref ref-type="corresp" rid="cor1">∗</xref>
</contrib>
<aff id="j_jds1200_aff_001"><label>1</label>Department of Statistical and Actuarial Sciences, <institution>University of Western Ontario</institution>, London, Ontario, <country>Canada</country></aff>
<aff id="j_jds1200_aff_002"><label>2</label>Department of Computer Science, <institution>University of Western Ontario</institution>, London, Ontario, <country>Canada</country></aff>
</contrib-group>
<author-notes>
<corresp id="cor1"><label>∗</label>Corresponding author. Email: <email xlink:href="mailto:gyi5@uwo.ca">gyi5@uwo.ca</email>.</corresp>
</author-notes>
<pub-date pub-type="ppub"><year>2025</year></pub-date><pub-date pub-type="epub"><day>15</day><month>10</month><year>2025</year></pub-date><volume content-type="ahead-of-print">0</volume><issue>0</issue><fpage>1</fpage><lpage>23</lpage><supplementary-material id="S1" content-type="document" xlink:href="jds1200_s001.pdf" mimetype="application" mime-subtype="pdf">
<caption>
<title>Supplementary Material</title>
<p>
<list>
<list-item id="j_jds1200_li_001">
<label>S1.</label>
<p>An Example of Constructing <inline-formula id="j_jds1200_ineq_001"><alternatives><mml:math>
<mml:msubsup>
<mml:mrow>
<mml:mi mathvariant="italic">S</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">K</mml:mi>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>∗</mml:mo>
</mml:mrow>
</mml:msubsup>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">θ</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">K</mml:mi>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">Y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">K</mml:mi>
<mml:mi mathvariant="italic">j</mml:mi>
<mml:mi mathvariant="italic">i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="false">
<mml:mrow>
<mml:mi mathvariant="italic">A</mml:mi>
</mml:mrow>
<mml:mo accent="true">‾</mml:mo></mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">K</mml:mi>
<mml:mi mathvariant="italic">i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mover accent="false">
<mml:mrow>
<mml:mi mathvariant="italic">X</mml:mi>
</mml:mrow>
<mml:mo accent="true">‾</mml:mo></mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">K</mml:mi>
<mml:mi mathvariant="italic">i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>∗</mml:mo>
</mml:mrow>
</mml:msubsup>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mover accent="false">
<mml:mrow>
<mml:mi mathvariant="italic">C</mml:mi>
</mml:mrow>
<mml:mo accent="true">‾</mml:mo></mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">K</mml:mi>
<mml:mi mathvariant="italic">i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>∗</mml:mo>
</mml:mrow>
</mml:msubsup>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="false">
<mml:mrow>
<mml:mi mathvariant="italic">Z</mml:mi>
</mml:mrow>
<mml:mo accent="true">‾</mml:mo></mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">K</mml:mi>
<mml:mi mathvariant="italic">i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo></mml:math><tex-math><![CDATA[${S_{Kj}^{\ast }}({\theta _{Kj}};{Y_{Kji}},{\overline{A}_{Ki}},{\overline{X}_{Ki}^{\ast }},{\overline{C}_{Ki}^{\ast }},{\overline{Z}_{Ki}})$]]></tex-math></alternatives></inline-formula></p>
</list-item>
<list-item id="j_jds1200_li_002">
<label>S2.</label>
<p>Proportion of Optimally Treated Future Patients</p>
</list-item>
<list-item id="j_jds1200_li_003">
<label>S3.</label>
<p>Simulation Results for Correction Strategies with Reduced Sample Size</p>
</list-item>
<list-item id="j_jds1200_li_004">
<label>S4.</label>
<p>Simulation Results for Correction Strategies with Reduced Validation Subsample Size</p>
</list-item>
<list-item id="j_jds1200_li_005">
<label>S5.</label>
<p>Data Analysis</p>
</list-item>
</list> 
</p>
</caption>
</supplementary-material><history><date date-type="received"><day>30</day><month>8</month><year>2024</year></date><date date-type="accepted"><day>21</day><month>9</month><year>2025</year></date></history>
<permissions><copyright-statement>2025 The Author(s). Published by the School of Statistics and the Center for Applied Statistics, Renmin University of China.</copyright-statement><copyright-year>2025</copyright-year>
<license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
<license-p>Open access article under the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">CC BY</ext-link> license.</license-p></license></permissions>
<abstract>
<p>Precision medicine is an innovative approach that aims to customize medical treatments and interventions to patients based on their individual characteristics. Several estimation techniques, including Q-learning, have been developed to determine optimal treatment rules. However, the applicability of these methods depends on the availability of precisely measured variables. This study extends the scope of Q-learning to incorporate compound outcomes, deviating from the commonly assumed univariate outcomes, and further accommodates data with mismeasurement in both binary and continuous covariates. Two methods are described to mitigate the impact of mismeasurement. Numerical studies reveal that mismeasurement in covariates leads to notable estimation bias in parameters indexing the optimal treatment, yet the methods addressing the mismeasurement effects yield improved results.</p>
</abstract>
<kwd-group>
<label>Keywords</label>
<kwd>compound outcome</kwd>
<kwd>dynamic treatment regimes</kwd>
<kwd>estimating function</kwd>
<kwd>misclassification</kwd>
<kwd>measurement error</kwd>
<kwd>Q-learning</kwd>
<kwd>regression calibration</kwd>
<kwd>regression models</kwd>
</kwd-group>
<funding-group><funding-statement>Yi is the Canada Research Chair in Data Science (Tier 1). Her research is supported by funding from the Natural Sciences and Engineering Research Council of Canada (NSERC) and the Canada Research Chairs Program.</funding-statement></funding-group>
</article-meta>
</front>
<back>
<ref-list id="j_jds1200_reflist_001">
<title>References</title>
<ref id="j_jds1200_ref_001">
<mixed-citation publication-type="journal"> <string-name><surname>Akazawa</surname> <given-names>K</given-names></string-name>, <string-name><surname>Kinukawa</surname> <given-names>N</given-names></string-name>, <string-name><surname>Nakamura</surname> <given-names>T</given-names></string-name> (<year>1998</year>). <article-title>A note on the corrected score function adjusting for misclassification</article-title>. <source><italic>Journal of the Japan Statistical Society</italic></source>, <volume>28</volume>(<issue>1</issue>): <fpage>115</fpage>–<lpage>123</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.14490/jjss1995.28.115" xlink:type="simple">https://doi.org/10.14490/jjss1995.28.115</ext-link></mixed-citation>
</ref>
<ref id="j_jds1200_ref_002">
<mixed-citation publication-type="book"> <string-name><surname>Carroll</surname> <given-names>RJ</given-names></string-name>, <string-name><surname>Ruppert</surname> <given-names>D</given-names></string-name>, <string-name><surname>Stefanski</surname> <given-names>LA</given-names></string-name>, <string-name><surname>Crainiceanu</surname> <given-names>CM</given-names></string-name> (<year>2006</year>). <source><italic>Measurement Error in Nonlinear Models: A Modern Perspective</italic></source>. <publisher-name>CRC Press</publisher-name>.</mixed-citation>
</ref>
<ref id="j_jds1200_ref_003">
<mixed-citation publication-type="book"> <string-name><surname>Chakraborty</surname> <given-names>B</given-names></string-name>, <string-name><surname>Moodie</surname> <given-names>EE</given-names></string-name> (<year>2013</year>). <source><italic>Statistical Methods for Dynamic Treatment Regimes</italic></source>. <publisher-name>Springer</publisher-name>.</mixed-citation>
</ref>
<ref id="j_jds1200_ref_004">
<mixed-citation publication-type="journal"> <string-name><surname>Henmi</surname> <given-names>M</given-names></string-name>, <string-name><surname>Eguchi</surname> <given-names>S</given-names></string-name> (<year>2004</year>). <article-title>A paradox concerning nuisance parameters and projected estimating functions</article-title>. <source><italic>Biometrika</italic></source>, <volume>91</volume>(<issue>4</issue>): <fpage>929</fpage>–<lpage>941</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1093/biomet/91.4.929" xlink:type="simple">https://doi.org/10.1093/biomet/91.4.929</ext-link></mixed-citation>
</ref>
<ref id="j_jds1200_ref_005">
<mixed-citation publication-type="journal"> <string-name><surname>Khadem Charvadeh</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Yi</surname> <given-names>GY</given-names></string-name> (<year>2024</year>a). <article-title>Accommodating misclassification effects on optimizing dynamic treatment regimes with Q-learning</article-title>. <source><italic>Statistics in Medicine</italic></source>, <volume>43</volume>(<issue>3</issue>): <fpage>578</fpage>–<lpage>605</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1002/sim.9973" xlink:type="simple">https://doi.org/10.1002/sim.9973</ext-link></mixed-citation>
</ref>
<ref id="j_jds1200_ref_006">
<mixed-citation publication-type="journal"> <string-name><surname>Khadem Charvadeh</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Yi</surname> <given-names>GY</given-names></string-name> (<year>2024</year>b). <article-title>Understanding effective virus control policies for COVID-19 with the Q-learning method</article-title>. <source><italic>Statistics in Biosciences</italic></source>, <volume>16</volume>(<issue>1</issue>): <fpage>265</fpage>–<lpage>289</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1007/s12561-023-09382-w" xlink:type="simple">https://doi.org/10.1007/s12561-023-09382-w</ext-link></mixed-citation>
</ref>
<ref id="j_jds1200_ref_007">
<mixed-citation publication-type="chapter"> <string-name><surname>Lizotte</surname> <given-names>DJ</given-names></string-name>, <string-name><surname>Bowling</surname> <given-names>MH</given-names></string-name>, <string-name><surname>Murphy</surname> <given-names>SA</given-names></string-name> (<year>2010</year>). <chapter-title>Efficient reinforcement learning with multiple reward functions for randomized controlled trial analysis</chapter-title>. In: <source><italic>Twenty-Seventh International Conference on Machine Learning (ICML)</italic></source>, <fpage>695</fpage>–<lpage>702</lpage>.</mixed-citation>
</ref>
<ref id="j_jds1200_ref_008">
<mixed-citation publication-type="journal"> <string-name><surname>Ning</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Yi</surname> <given-names>GY</given-names></string-name>, <string-name><surname>Reid</surname> <given-names>N</given-names></string-name> (<year>2018</year>). <article-title>A class of weighted estimating equations for semiparametric transformation models with missing covariates</article-title>. <source><italic>Scandinavian Journal of Statistics</italic></source>, <volume>45</volume>(<issue>1</issue>): <fpage>87</fpage>–<lpage>109</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1111/sjos.12289" xlink:type="simple">https://doi.org/10.1111/sjos.12289</ext-link></mixed-citation>
</ref>
<ref id="j_jds1200_ref_009">
<mixed-citation publication-type="chapter"> <string-name><surname>Robins</surname> <given-names>JM</given-names></string-name> (<year>2004</year>). <chapter-title>Optimal structural nested models for optimal sequential decisions</chapter-title>. In: <string-name><surname>Lin</surname> <given-names>DY</given-names></string-name>, <string-name><surname>Heagerty</surname> <given-names>PJ</given-names></string-name> (eds.), <source><italic>Proceedings of the Second Seattle Symposium in Biostatistics</italic></source>. <series>Lecture Notes in Statistics</series>, vol. <volume>179</volume>. <publisher-name>Springer</publisher-name>. <publisher-loc>New York, NY</publisher-loc>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1007/978-1-4419-9076-1_11" xlink:type="simple">https://doi.org/10.1007/978-1-4419-9076-1_11</ext-link></mixed-citation>
</ref>
<ref id="j_jds1200_ref_010">
<mixed-citation publication-type="journal"> <string-name><surname>Robins</surname> <given-names>JM</given-names></string-name>, <string-name><surname>Rotnitzky</surname> <given-names>A</given-names></string-name>, <string-name><surname>Zhao</surname> <given-names>LP</given-names></string-name> (<year>1994</year>). <article-title>Estimation of regression coefficients when some regressors are not always observed</article-title>. <source><italic>Journal of the American Statistical Association</italic></source>, <volume>89</volume>(<issue>427</issue>): <fpage>846</fpage>–<lpage>866</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1080/01621459.1994.10476818" xlink:type="simple">https://doi.org/10.1080/01621459.1994.10476818</ext-link></mixed-citation>
</ref>
<ref id="j_jds1200_ref_011">
<mixed-citation publication-type="journal"> <string-name><surname>Spicker</surname> <given-names>D</given-names></string-name>, <string-name><surname>Wallace</surname> <given-names>MP</given-names></string-name> (<year>2020</year>). <article-title>Measurement error and precision medicine: Error-prone tailoring covariates in dynamic treatment regimes</article-title>. <source><italic>Statistics in Medicine</italic></source>, <volume>39</volume>(<issue>26</issue>): <fpage>3732</fpage>–<lpage>3755</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1002/sim.8690" xlink:type="simple">https://doi.org/10.1002/sim.8690</ext-link></mixed-citation>
</ref>
<ref id="j_jds1200_ref_012">
<mixed-citation publication-type="journal"> <string-name><surname>Wang</surname> <given-names>L</given-names></string-name>, <string-name><surname>Rotnitzky</surname> <given-names>A</given-names></string-name>, <string-name><surname>Lin</surname> <given-names>X</given-names></string-name>, <string-name><surname>Millikan</surname> <given-names>RE</given-names></string-name>, <string-name><surname>Thall</surname> <given-names>PF</given-names></string-name> (<year>2012</year>). <article-title>Evaluation of viable dynamic treatment regimes in a sequentially randomized trial of advanced prostate cancer</article-title>. <source><italic>Journal of the American Statistical Association</italic></source>, <volume>107</volume>(<issue>498</issue>): <fpage>493</fpage>–<lpage>508</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1080/01621459.2011.641416" xlink:type="simple">https://doi.org/10.1080/01621459.2011.641416</ext-link></mixed-citation>
</ref>
<ref id="j_jds1200_ref_013">
<mixed-citation publication-type="book"> <string-name><surname>Yi</surname> <given-names>GY</given-names></string-name> (<year>2017</year>). <source><italic>Statistical Analysis with Measurement Error or Misclassification: Strategy, Method and Application</italic></source>. <publisher-name>Springer Science+Business Media LLC</publisher-name>, <publisher-loc>New York</publisher-loc>.</mixed-citation>
</ref>
<ref id="j_jds1200_ref_014">
<mixed-citation publication-type="book"> <string-name><surname>Yi</surname> <given-names>GY</given-names></string-name>, <string-name><surname>Delaigle</surname> <given-names>A</given-names></string-name>, <string-name><surname>Gustafson</surname> <given-names>P</given-names></string-name> (<year>2021</year>). <source><italic>Handbook of Measurement Error Models</italic></source>. <publisher-name>CRC Press</publisher-name>.</mixed-citation>
</ref>
</ref-list>
</back>
</article>
