array(41) {
["project_status"]=>
string(7) "ongoing"
["project_assoc_trials"]=>
array(2) {
[0]=>
object(WP_Post)#5130 (24) {
["ID"]=>
int(8018)
["post_author"]=>
string(4) "1363"
["post_date"]=>
string(19) "2023-08-05 04:44:39"
["post_date_gmt"]=>
string(19) "2023-08-05 04:44:39"
["post_content"]=>
string(0) ""
["post_title"]=>
string(251) "NCT03464136 - A Phase 3b, Multicenter, Randomized, Blinded, Active-Controlled Study to Compare the Efficacy and Safety of Ustekinumab to That of Adalimumab in the Treatment of Biologic Naïve Subjects With Moderately-to-Severely Active Crohn's Disease"
["post_excerpt"]=>
string(0) ""
["post_status"]=>
string(7) "publish"
["comment_status"]=>
string(6) "closed"
["ping_status"]=>
string(6) "closed"
["post_password"]=>
string(0) ""
["post_name"]=>
string(193) "nct03464136-a-phase-3b-multicenter-randomized-blinded-active-controlled-study-to-compare-the-efficacy-and-safety-of-ustekinumab-to-that-of-adalimumab-in-the-treatment-of-biologic-naive-subjects"
["to_ping"]=>
string(0) ""
["pinged"]=>
string(0) ""
["post_modified"]=>
string(19) "2025-07-15 14:28:36"
["post_modified_gmt"]=>
string(19) "2025-07-15 18:28:36"
["post_content_filtered"]=>
string(0) ""
["post_parent"]=>
int(0)
["guid"]=>
string(242) "https://dev-yoda.pantheonsite.io/clinical-trial/nct03464136-a-phase-3b-multicenter-randomized-blinded-active-controlled-study-to-compare-the-efficacy-and-safety-of-ustekinumab-to-that-of-adalimumab-in-the-treatment-of-biologic-naive-subjects/"
["menu_order"]=>
int(0)
["post_type"]=>
string(14) "clinical_trial"
["post_mime_type"]=>
string(0) ""
["comment_count"]=>
string(1) "0"
["filter"]=>
string(3) "raw"
}
[1]=>
object(WP_Post)#5131 (24) {
["ID"]=>
int(1588)
["post_author"]=>
string(4) "1363"
["post_date"]=>
string(19) "2017-02-08 13:24:00"
["post_date_gmt"]=>
string(19) "2017-02-08 13:24:00"
["post_content"]=>
string(0) ""
["post_title"]=>
string(238) "NCT01369355 - A Phase 3, Randomized, Double-blind, Placebo-controlled, Parallel-group, Multicenter Study to Evaluate the Safety and Efficacy of Ustekinumab Maintenance Therapy in Subjects With Moderately to Severely Active Crohn's Disease"
["post_excerpt"]=>
string(0) ""
["post_status"]=>
string(7) "publish"
["comment_status"]=>
string(6) "closed"
["ping_status"]=>
string(6) "closed"
["post_password"]=>
string(0) ""
["post_name"]=>
string(193) "nct01369355-a-phase-3-randomized-double-blind-placebo-controlled-parallel-group-multicenter-study-to-evaluate-the-safety-and-efficacy-of-ustekinumab-maintenance-therapy-in-subjects-with-moderat"
["to_ping"]=>
string(0) ""
["pinged"]=>
string(0) ""
["post_modified"]=>
string(19) "2025-07-15 15:06:16"
["post_modified_gmt"]=>
string(19) "2025-07-15 19:06:16"
["post_content_filtered"]=>
string(0) ""
["post_parent"]=>
int(0)
["guid"]=>
string(242) "https://dev-yoda.pantheonsite.io/clinical-trial/nct01369355-a-phase-3-randomized-double-blind-placebo-controlled-parallel-group-multicenter-study-to-evaluate-the-safety-and-efficacy-of-ustekinumab-maintenance-therapy-in-subjects-with-moderat/"
["menu_order"]=>
int(0)
["post_type"]=>
string(14) "clinical_trial"
["post_mime_type"]=>
string(0) ""
["comment_count"]=>
string(1) "0"
["filter"]=>
string(3) "raw"
}
}
["project_title"]=>
string(129) "Validation of a hybrid mechanistic-ML model of Crohn's Disease to predict clinical and endoscopic outcomes in individual patients"
["project_narrative_summary"]=>
string(702) "Crohn’s disease (CD) is a chronic, relapsing inflammatory disease of the gastrointestinal (GI) tract with a prevalence of about 320 cases in 100,000 people in Europe and North America. Even though there are multiple approved therapies, long-term remission rates are low in Crohn's Disease patients with about 50% of patients requiring surgery within 10 years. Quantitative systems pharmacology models that provide mechanistic understanding of a disease are increasingly being used at various stages of drug development, for gaining insights into both safety and efficacy of a treatment. For efficacy predictions, QSP models that predict clinical scores, in addition to biomarkers, have applicability."
["project_learn_source"]=>
string(10) "web_search"
["project_learn_source_exp"]=>
string(14) "Vivli Platform"
["principal_investigator"]=>
array(7) {
["first_name"]=>
string(13) "Sai Phanindra"
["last_name"]=>
string(13) "Venkatapurapu"
["degree"]=>
string(3) "PhD"
["primary_affiliation"]=>
string(11) "AstraZeneca"
["email"]=>
string(42) "saiphanindra.venkatapurapu@astrazeneca.com"
["state_or_province"]=>
string(2) "MD"
["country"]=>
string(13) "United States"
}
["project_key_personnel"]=>
bool(false)
["project_ext_grants"]=>
array(2) {
["value"]=>
string(2) "no"
["label"]=>
string(68) "No external grants or funds are being used to support this research."
}
["project_date_type"]=>
string(18) "full_crs_supp_docs"
["property_scientific_abstract"]=>
string(1683) "Background:
In Crohn’s Disease, SES-CD (Simple Endoscopic Score for Crohn’s Disease) is used to measure the endoscopic activity in patients by evaluating endoscopy images. However, due to the invasive nature of endoscopic evaluations, objective assessments of gut damage is infrequent. Non-invasive tools to predict changes in gut mucosal condition with treatment are needed.
Objective:
The study aims to create an algorithm to predict patient-specific clinical and endoscopic outcomes from a mathematical/QSP model of Crohn's disease using de-identified patient data.
Study Design:
This is a retrospective study where the deidentified patient data from the requested studies will be used to develop and validate a mechanistic-ML model of Crohn's disease. The primary outcome measures include SES-CD and CDAI scores over time. Secondary outcome measures include endoscopic and clinical response measures along with changes in biomarkers over time.
Participants:
Patients from the requested studies who have the primary predictor variables, SES-CD and/or CDAI score data along with the component scores will be included in the study.
Statistical Analysis:
Descriptive statistics will be used to summarize baseline characteristics as well as clinical/endoscopic outcomes. Dichotomous variables will be presented as percentages along with 95% CI. Continuous variables will be reported as means with SD or medians with interquartile ranges. The machine learning algorithm's accuracy to predict the clinical scores such as SES-CD and CDAI using the QSP model outputs will be assessed."
["project_brief_bg"]=>
string(2608) "Crohn’s disease (CD) is a chronic, relapsing inflammatory disease of the gastrointestinal (GI) tract with a prevalence of about 320 cases in 100,000 people in Europe and North America. Even though there are multiple approved therapies, long-term remission rates are low in Crohn's Disease patients with about 50% of patients requiring surgery within 10 years. Quantitative systems pharmacology models that provide mechanistic understanding of a disease are increasingly being used at various stages of drug development, for gaining insights into both safety and efficacy of a treatment. For efficacy predictions, QSP models that predict clinical scores, in addition to biomarkers, have applicability in late-stage drug development [1, 2].
Typically clinical scores constitute subjective assessments either by patients or physicians which make it challenging to predict using a mechanistic approach [3]. In Crohn’s Disease, for example, SES-CD (Simple Endoscopic Score for Crohn’s Disease) is used to measure the endoscopic activity in patients by evaluating endoscopy images. In addition to being an endpoint in clinical trials, endoscopic healing is one of the primary treatment goals in IBD as recommended by STRIDE consensus. However, given the invasive nature of endoscopic evaluations, physicians are often required to make treatment decisions based on limited objective information about the state of the patient's gastrointestinal tissue while aiming to achieve mucosal healing. Non-invasive tools to predict changes in gut mucosal condition with treatment are needed.
We developed a computational platform for simulating mucosal health and the level of inflammation in patients with CD under different treatment scenarios [1]. The platform estimates changes in mucosal health and inflammatory activity over a continuous timeline of weeks to years. In order to estimate outcomes such as SES-CD and CDAI (Crohn's Disease Activity Index) at a patient level from the immunological model outputs, we would need de-identified individual patient data. Patient data from the following studies will be analyzed to create machine learning models to connect the immunological outputs from the Crohn's disease model to clinical scores [3]. The data will also be used to validate the model response to different therapies.
Impact for patients: Besides their application in drug development, computational tools that can predict endoscopic outcomes can be a promising form of decision support that can predict outcomes and patient progress in Crohn’s disease."
["project_specific_aims"]=>
string(1245) "This is a retrospective study where the deidentified patient data from the requested studies will be used to develop and validate a mechanistic-ML model of Crohn's disease. The primary objectives of this study are to
A) Create a machine learning algorithm to connect the immunological outputs from a model of Crohn's Disease to the clinical scores, and
B) Validate the model predictions
We will be using demographic and lifestyle data, disease history, baseline disease information, treatment history, lab results and symptoms to inform the model and predict the time course clinical scores and biomarkers. To validate the model, we would need time course SES-CD and CDAI score data split by their components for each gut segment, subject to availability. Please see the sections below for more information on data requirements.
Patients with Crohn’s disease may benefit from this study in two ways: 1) the validated and published model will help researchers in drug development, 2) computational tools, developed using the validated model as the basis, that can predict endoscopic outcomes can be a promising form of decision support to predict outcomes and progress in Crohn’s disease patients."
["project_study_design"]=>
array(2) {
["value"]=>
string(7) "meta_an"
["label"]=>
string(52) "Meta-analysis (analysis of multiple trials together)"
}
["project_purposes"]=>
array(4) {
[0]=>
array(2) {
["value"]=>
string(22) "participant_level_data"
["label"]=>
string(36) "Participant-level data meta-analysis"
}
[1]=>
array(2) {
["value"]=>
string(37) "participant_level_data_only_from_yoda"
["label"]=>
string(51) "Meta-analysis using only data from the YODA Project"
}
[2]=>
array(2) {
["value"]=>
string(37) "develop_or_refine_statistical_methods"
["label"]=>
string(37) "Develop or refine statistical methods"
}
[3]=>
array(2) {
["value"]=>
string(50) "research_on_clinical_prediction_or_risk_prediction"
["label"]=>
string(50) "Research on clinical prediction or risk prediction"
}
}
["project_research_methods"]=>
string(230) "Inclusion criteria: Patients from the requested studies who have the primary predictor variables, SES-CD and/or CDAI score data along with the component scores will be included in the study.
Exclusion criteria: None"
["project_main_outcome_measure"]=>
string(1308) "Our study will focus on predicting SES-CD endoscopic score along with its components over time in individual patients post-treatment using the mechanistic-ML model of Crohn's Disease. All available time points for each individual will be used to prepare the training and validation datasets. Regarding SES-CD data, we request the components - size of ulcers, ulcerated surface, affected surface area and narrowing for each gut segment along with the total SES-CD for each patient at available time points. Similar component data for CDAI would be helpful, subject to availability.
Primary outcome measures:
1. Endoscopic outcomes:
A. SES-CD score over time
B. Individual time course SES-CD score data split by its components for each gut segment
2. Endoscopic response (percentage, 95% CI)
3. Endoscopic remission (percentage, 95% CI)
Secondary outcome measures:
1.Clinical outcomes:
A. CDAI over time
B. Individual time course CDAI score data split by its components
2. Clinical response (percentage, 95% CI)
3. Clinical remission (percentage, 95% CI)
4. Change in Fecal calprotectin over time (continuous variable, mg/L)
5. Change in CRP over time (continuous variable, ug/g)"
["project_main_predictor_indep"]=>
string(581) "Primary predictor/independent variables for the analysis include:
1. Demographic and lifestyle data: Age, Gender, Body weight, Smoking status
2. Disease history: Duration of Crohn's disease, Disease location classification, History of surgery
3. Baseline clinical data: SES-CD, CDAI, FCP (ug/g), CRP (mg/L)
4. Treatment history: Previous exposure to biologics, steroids and other SoC
5. Lab tests: Immune cell counts (if available), cytokine levels (if available)
6. Symptoms: Diarrhea, Abdominal pain reported during visits (if available)"
["project_other_variables_interest"]=>
string(181) "Gender, age and ethnicity would also be of interest to run responder analysis and understand the characteristics of patients that are associated with response to specific biologics."
["project_stat_analysis_plan"]=>
string(1351) "Descriptive statistics will be used to summarize baseline characteristics (e.g. disease activity and patient demographics) as well as clinical and endoscopic outcomes. Dichotomous variables will be presented as proportions or percentages along with 95% CI. Continuous variables will be reported as means with standard deviations or medians with interquartile ranges. Linear imputation will be performed on continuous variables with missing data. Data will be analyzed using Python.
The processed data will then be used to create datasets for the study by combining all the features listed in the proposal. Each row in the final dataset will represent an individual patient and the columns would be the independent variables and outcomes. The final dataset will be randomly split into a training, validation and test sets in the ratio of 70/20/10. These datasets will be used to develop the machine learning algorithm (decision trees/regression models similar to the approach used in Shim et al.) for linking immunology outcomes to clinical scores and to validate the overall performance of the hybrid mechanistic-ML model, The ML algorithm will be developed on the training set and the hyper parameters are tuned on the validation set. Finally, the overall performance of the mechanistic-ML model will be evaluated on the Test dataset."
["project_software_used"]=>
array(1) {
[0]=>
array(2) {
["value"]=>
string(6) "python"
["label"]=>
string(6) "Python"
}
}
["project_timeline"]=>
string(92) "Target Analysis Start Date: 09/02/2025
Estimated Analysis Completion Date: 04/30/2026"
["project_dissemination_plan"]=>
string(235) "We aim to present results of the work at Digestive Disease Week (DDW) or Crohn's & Colitis Congress or American Conference on Pharmacometrics (ACoP) and publish in Nature Systems Biology or Clinical Pharmacology and Therapeutics. "
["project_bibliography"]=>
string(1096) "
- Venkatapurapu, S. P., Iwakiri, R., Udagawa, E., Patidar, N., Qi, Z., Takayama, R., Kumar, K., Sato, Y., Behar, M., Offner, P., Dwivedi, G., Miyasaka, H., Suzuki, R. K., Hamada, A. L., D’Alessandro, P. M., & Fernandez, J. (2022). A computational platform integrating a mechanistic model of Crohn’s disease for predicting temporal progression of mucosal damage and healing. Advances in Therapy, 39(7), 3225–3247. https://doi.org/10.1007/s12325-022-02144-y
- Rogers, K. V., Martin, S. W., Bhattacharya, I., Singh, R. S. P., & Nayak, S. (2021). A dynamic quantitative systems pharmacology model of inflammatory bowel disease: Part 1 – Model framework. Clinical and Translational Science, 14(1), 239–248. https://doi.org/10.1111/cts.12849
- Shim, J. V., Rehberg, M., Wagenhuber, B., van der Graaf, P. H., & Chung, D. W. (2025). Combining mechanistic modeling with machine learning as a strategy to predict inflammatory bowel disease clinical scores. Frontiers in Pharmacology, 16, 1479666. https://doi.org/10.3389/fphar.2025.1479666
"
["project_suppl_material"]=>
bool(false)
["project_coi"]=>
array(1) {
[0]=>
array(1) {
["file_coi"]=>
array(21) {
["ID"]=>
int(17124)
["id"]=>
int(17124)
["title"]=>
string(16) "YODA_COI_SPV.pdf"
["filename"]=>
string(16) "YODA_COI_SPV.pdf"
["filesize"]=>
int(20388)
["url"]=>
string(65) "https://yoda.yale.edu/wp-content/uploads/2025/04/YODA_COI_SPV.pdf"
["link"]=>
string(62) "https://yoda.yale.edu/data-request/2025-0276/yoda_coi_spv-pdf/"
["alt"]=>
string(0) ""
["author"]=>
string(4) "1809"
["description"]=>
string(0) ""
["caption"]=>
string(0) ""
["name"]=>
string(16) "yoda_coi_spv-pdf"
["status"]=>
string(7) "inherit"
["uploaded_to"]=>
int(17123)
["date"]=>
string(19) "2025-04-25 19:33:33"
["modified"]=>
string(19) "2025-04-25 19:33:34"
["menu_order"]=>
int(0)
["mime_type"]=>
string(15) "application/pdf"
["type"]=>
string(11) "application"
["subtype"]=>
string(3) "pdf"
["icon"]=>
string(62) "https://yoda.yale.edu/wp/wp-includes/images/media/document.png"
}
}
}
["data_use_agreement_training"]=>
bool(true)
["human_research_protection_training"]=>
bool(true)
["certification"]=>
bool(true)
["search_order"]=>
string(1) "0"
["project_send_email_updates"]=>
bool(false)
["project_publ_available"]=>
bool(true)
["project_year_access"]=>
string(4) "2025"
["project_rep_publ"]=>
bool(false)
["project_assoc_data"]=>
array(0) {
}
["project_due_dil_assessment"]=>
array(21) {
["ID"]=>
int(17855)
["id"]=>
int(17855)
["title"]=>
string(47) "YODA Project Due Diligence Assessment 2025-0276"
["filename"]=>
string(51) "YODA-Project-Due-Diligence-Assessment-2025-0276.pdf"
["filesize"]=>
int(126318)
["url"]=>
string(100) "https://yoda.yale.edu/wp-content/uploads/2025/04/YODA-Project-Due-Diligence-Assessment-2025-0276.pdf"
["link"]=>
string(93) "https://yoda.yale.edu/data-request/2025-0276/yoda-project-due-diligence-assessment-2025-0276/"
["alt"]=>
string(0) ""
["author"]=>
string(4) "1885"
["description"]=>
string(0) ""
["caption"]=>
string(0) ""
["name"]=>
string(47) "yoda-project-due-diligence-assessment-2025-0276"
["status"]=>
string(7) "inherit"
["uploaded_to"]=>
int(17123)
["date"]=>
string(19) "2025-09-03 14:22:43"
["modified"]=>
string(19) "2025-09-03 14:22:43"
["menu_order"]=>
int(0)
["mime_type"]=>
string(15) "application/pdf"
["type"]=>
string(11) "application"
["subtype"]=>
string(3) "pdf"
["icon"]=>
string(62) "https://yoda.yale.edu/wp/wp-includes/images/media/document.png"
}
["project_title_link"]=>
array(21) {
["ID"]=>
int(17856)
["id"]=>
int(17856)
["title"]=>
string(46) "YODA Project Protocol - 2025-0276 - 2025-08-26"
["filename"]=>
string(46) "YODA-Project-Protocol-2025-0276-2025-08-26.pdf"
["filesize"]=>
int(125455)
["url"]=>
string(95) "https://yoda.yale.edu/wp-content/uploads/2025/04/YODA-Project-Protocol-2025-0276-2025-08-26.pdf"
["link"]=>
string(88) "https://yoda.yale.edu/data-request/2025-0276/yoda-project-protocol-2025-0276-2025-08-26/"
["alt"]=>
string(0) ""
["author"]=>
string(4) "1885"
["description"]=>
string(0) ""
["caption"]=>
string(0) ""
["name"]=>
string(42) "yoda-project-protocol-2025-0276-2025-08-26"
["status"]=>
string(7) "inherit"
["uploaded_to"]=>
int(17123)
["date"]=>
string(19) "2025-09-03 14:23:03"
["modified"]=>
string(19) "2025-09-03 14:23:03"
["menu_order"]=>
int(0)
["mime_type"]=>
string(15) "application/pdf"
["type"]=>
string(11) "application"
["subtype"]=>
string(3) "pdf"
["icon"]=>
string(62) "https://yoda.yale.edu/wp/wp-includes/images/media/document.png"
}
["project_review_link"]=>
array(21) {
["ID"]=>
int(17857)
["id"]=>
int(17857)
["title"]=>
string(36) "YODA Project Review - 2025-0276_site"
["filename"]=>
string(38) "YODA-Project-Review-2025-0276_site.pdf"
["filesize"]=>
int(1315640)
["url"]=>
string(87) "https://yoda.yale.edu/wp-content/uploads/2025/04/YODA-Project-Review-2025-0276_site.pdf"
["link"]=>
string(80) "https://yoda.yale.edu/data-request/2025-0276/yoda-project-review-2025-0276_site/"
["alt"]=>
string(0) ""
["author"]=>
string(4) "1885"
["description"]=>
string(0) ""
["caption"]=>
string(0) ""
["name"]=>
string(34) "yoda-project-review-2025-0276_site"
["status"]=>
string(7) "inherit"
["uploaded_to"]=>
int(17123)
["date"]=>
string(19) "2025-09-03 14:23:25"
["modified"]=>
string(19) "2025-09-03 14:23:25"
["menu_order"]=>
int(0)
["mime_type"]=>
string(15) "application/pdf"
["type"]=>
string(11) "application"
["subtype"]=>
string(3) "pdf"
["icon"]=>
string(62) "https://yoda.yale.edu/wp/wp-includes/images/media/document.png"
}
["project_highlight_button"]=>
string(0) ""
["request_data_partner"]=>
string(15) "johnson-johnson"
["request_overridden_res"]=>
string(1) "3"
}
data partner
array(1) {
[0]=>
string(15) "johnson-johnson"
}
pi country
array(0) {
}
pi affil
array(0) {
}
products
array(1) {
[0]=>
string(7) "stelara"
}
num of trials
array(1) {
[0]=>
string(1) "2"
}
res
array(1) {
[0]=>
string(1) "3"
}
General Information
How did you learn about the YODA Project?:
Internet Search
Conflict of Interest
Request Clinical Trials
Associated Trial(s):
- NCT03464136 - A Phase 3b, Multicenter, Randomized, Blinded, Active-Controlled Study to Compare the Efficacy and Safety of Ustekinumab to That of Adalimumab in the Treatment of Biologic Naïve Subjects With Moderately-to-Severely Active Crohn's Disease
- NCT01369355 - A Phase 3, Randomized, Double-blind, Placebo-controlled, Parallel-group, Multicenter Study to Evaluate the Safety and Efficacy of Ustekinumab Maintenance Therapy in Subjects With Moderately to Severely Active Crohn's Disease
What type of data are you looking for?:
Individual Participant-Level Data, which includes Full CSR and all supporting documentation
Request Clinical Trials
Data Request Status
Status:
Ongoing
Research Proposal
Project Title:
Validation of a hybrid mechanistic-ML model of Crohn's Disease to predict clinical and endoscopic outcomes in individual patients
Scientific Abstract:
Background:
In Crohn's Disease, SES-CD (Simple Endoscopic Score for Crohn's Disease) is used to measure the endoscopic activity in patients by evaluating endoscopy images. However, due to the invasive nature of endoscopic evaluations, objective assessments of gut damage is infrequent. Non-invasive tools to predict changes in gut mucosal condition with treatment are needed.
Objective:
The study aims to create an algorithm to predict patient-specific clinical and endoscopic outcomes from a mathematical/QSP model of Crohn's disease using de-identified patient data.
Study Design:
This is a retrospective study where the deidentified patient data from the requested studies will be used to develop and validate a mechanistic-ML model of Crohn's disease. The primary outcome measures include SES-CD and CDAI scores over time. Secondary outcome measures include endoscopic and clinical response measures along with changes in biomarkers over time.
Participants:
Patients from the requested studies who have the primary predictor variables, SES-CD and/or CDAI score data along with the component scores will be included in the study.
Statistical Analysis:
Descriptive statistics will be used to summarize baseline characteristics as well as clinical/endoscopic outcomes. Dichotomous variables will be presented as percentages along with 95% CI. Continuous variables will be reported as means with SD or medians with interquartile ranges. The machine learning algorithm's accuracy to predict the clinical scores such as SES-CD and CDAI using the QSP model outputs will be assessed.
Brief Project Background and Statement of Project Significance:
Crohn's disease (CD) is a chronic, relapsing inflammatory disease of the gastrointestinal (GI) tract with a prevalence of about 320 cases in 100,000 people in Europe and North America. Even though there are multiple approved therapies, long-term remission rates are low in Crohn's Disease patients with about 50% of patients requiring surgery within 10 years. Quantitative systems pharmacology models that provide mechanistic understanding of a disease are increasingly being used at various stages of drug development, for gaining insights into both safety and efficacy of a treatment. For efficacy predictions, QSP models that predict clinical scores, in addition to biomarkers, have applicability in late-stage drug development [1, 2].
Typically clinical scores constitute subjective assessments either by patients or physicians which make it challenging to predict using a mechanistic approach [3]. In Crohn's Disease, for example, SES-CD (Simple Endoscopic Score for Crohn's Disease) is used to measure the endoscopic activity in patients by evaluating endoscopy images. In addition to being an endpoint in clinical trials, endoscopic healing is one of the primary treatment goals in IBD as recommended by STRIDE consensus. However, given the invasive nature of endoscopic evaluations, physicians are often required to make treatment decisions based on limited objective information about the state of the patient's gastrointestinal tissue while aiming to achieve mucosal healing. Non-invasive tools to predict changes in gut mucosal condition with treatment are needed.
We developed a computational platform for simulating mucosal health and the level of inflammation in patients with CD under different treatment scenarios [1]. The platform estimates changes in mucosal health and inflammatory activity over a continuous timeline of weeks to years. In order to estimate outcomes such as SES-CD and CDAI (Crohn's Disease Activity Index) at a patient level from the immunological model outputs, we would need de-identified individual patient data. Patient data from the following studies will be analyzed to create machine learning models to connect the immunological outputs from the Crohn's disease model to clinical scores [3]. The data will also be used to validate the model response to different therapies.
Impact for patients: Besides their application in drug development, computational tools that can predict endoscopic outcomes can be a promising form of decision support that can predict outcomes and patient progress in Crohn's disease.
Specific Aims of the Project:
This is a retrospective study where the deidentified patient data from the requested studies will be used to develop and validate a mechanistic-ML model of Crohn's disease. The primary objectives of this study are to
A) Create a machine learning algorithm to connect the immunological outputs from a model of Crohn's Disease to the clinical scores, and
B) Validate the model predictions
We will be using demographic and lifestyle data, disease history, baseline disease information, treatment history, lab results and symptoms to inform the model and predict the time course clinical scores and biomarkers. To validate the model, we would need time course SES-CD and CDAI score data split by their components for each gut segment, subject to availability. Please see the sections below for more information on data requirements.
Patients with Crohn's disease may benefit from this study in two ways: 1) the validated and published model will help researchers in drug development, 2) computational tools, developed using the validated model as the basis, that can predict endoscopic outcomes can be a promising form of decision support to predict outcomes and progress in Crohn's disease patients.
Study Design:
Meta-analysis (analysis of multiple trials together)
What is the purpose of the analysis being proposed? Please select all that apply.:
Participant-level data meta-analysis
Meta-analysis using only data from the YODA Project
Develop or refine statistical methods
Research on clinical prediction or risk prediction
Software Used:
Python
Data Source and Inclusion/Exclusion Criteria to be used to define the patient sample for your study:
Inclusion criteria: Patients from the requested studies who have the primary predictor variables, SES-CD and/or CDAI score data along with the component scores will be included in the study.
Exclusion criteria: None
Primary and Secondary Outcome Measure(s) and how they will be categorized/defined for your study:
Our study will focus on predicting SES-CD endoscopic score along with its components over time in individual patients post-treatment using the mechanistic-ML model of Crohn's Disease. All available time points for each individual will be used to prepare the training and validation datasets. Regarding SES-CD data, we request the components - size of ulcers, ulcerated surface, affected surface area and narrowing for each gut segment along with the total SES-CD for each patient at available time points. Similar component data for CDAI would be helpful, subject to availability.
Primary outcome measures:
1. Endoscopic outcomes:
A. SES-CD score over time
B. Individual time course SES-CD score data split by its components for each gut segment
2. Endoscopic response (percentage, 95% CI)
3. Endoscopic remission (percentage, 95% CI)
Secondary outcome measures:
1.Clinical outcomes:
A. CDAI over time
B. Individual time course CDAI score data split by its components
2. Clinical response (percentage, 95% CI)
3. Clinical remission (percentage, 95% CI)
4. Change in Fecal calprotectin over time (continuous variable, mg/L)
5. Change in CRP over time (continuous variable, ug/g)
Main Predictor/Independent Variable and how it will be categorized/defined for your study:
Primary predictor/independent variables for the analysis include:
1. Demographic and lifestyle data: Age, Gender, Body weight, Smoking status
2. Disease history: Duration of Crohn's disease, Disease location classification, History of surgery
3. Baseline clinical data: SES-CD, CDAI, FCP (ug/g), CRP (mg/L)
4. Treatment history: Previous exposure to biologics, steroids and other SoC
5. Lab tests: Immune cell counts (if available), cytokine levels (if available)
6. Symptoms: Diarrhea, Abdominal pain reported during visits (if available)
Other Variables of Interest that will be used in your analysis and how they will be categorized/defined for your study:
Gender, age and ethnicity would also be of interest to run responder analysis and understand the characteristics of patients that are associated with response to specific biologics.
Statistical Analysis Plan:
Descriptive statistics will be used to summarize baseline characteristics (e.g. disease activity and patient demographics) as well as clinical and endoscopic outcomes. Dichotomous variables will be presented as proportions or percentages along with 95% CI. Continuous variables will be reported as means with standard deviations or medians with interquartile ranges. Linear imputation will be performed on continuous variables with missing data. Data will be analyzed using Python.
The processed data will then be used to create datasets for the study by combining all the features listed in the proposal. Each row in the final dataset will represent an individual patient and the columns would be the independent variables and outcomes. The final dataset will be randomly split into a training, validation and test sets in the ratio of 70/20/10. These datasets will be used to develop the machine learning algorithm (decision trees/regression models similar to the approach used in Shim et al.) for linking immunology outcomes to clinical scores and to validate the overall performance of the hybrid mechanistic-ML model, The ML algorithm will be developed on the training set and the hyper parameters are tuned on the validation set. Finally, the overall performance of the mechanistic-ML model will be evaluated on the Test dataset.
Narrative Summary:
Crohn's disease (CD) is a chronic, relapsing inflammatory disease of the gastrointestinal (GI) tract with a prevalence of about 320 cases in 100,000 people in Europe and North America. Even though there are multiple approved therapies, long-term remission rates are low in Crohn's Disease patients with about 50% of patients requiring surgery within 10 years. Quantitative systems pharmacology models that provide mechanistic understanding of a disease are increasingly being used at various stages of drug development, for gaining insights into both safety and efficacy of a treatment. For efficacy predictions, QSP models that predict clinical scores, in addition to biomarkers, have applicability.
Project Timeline:
Target Analysis Start Date: 09/02/2025
Estimated Analysis Completion Date: 04/30/2026
Dissemination Plan:
We aim to present results of the work at Digestive Disease Week (DDW) or Crohn's & Colitis Congress or American Conference on Pharmacometrics (ACoP) and publish in Nature Systems Biology or Clinical Pharmacology and Therapeutics.
Bibliography:
- Venkatapurapu, S. P., Iwakiri, R., Udagawa, E., Patidar, N., Qi, Z., Takayama, R., Kumar, K., Sato, Y., Behar, M., Offner, P., Dwivedi, G., Miyasaka, H., Suzuki, R. K., Hamada, A. L., D’Alessandro, P. M., & Fernandez, J. (2022). A computational platform integrating a mechanistic model of Crohn’s disease for predicting temporal progression of mucosal damage and healing. Advances in Therapy, 39(7), 3225--3247. https://doi.org/10.1007/s12325-022-02144-y
- Rogers, K. V., Martin, S. W., Bhattacharya, I., Singh, R. S. P., & Nayak, S. (2021). A dynamic quantitative systems pharmacology model of inflammatory bowel disease: Part 1 – Model framework. Clinical and Translational Science, 14(1), 239--248. https://doi.org/10.1111/cts.12849
- Shim, J. V., Rehberg, M., Wagenhuber, B., van der Graaf, P. H., & Chung, D. W. (2025). Combining mechanistic modeling with machine learning as a strategy to predict inflammatory bowel disease clinical scores. Frontiers in Pharmacology, 16, 1479666. https://doi.org/10.3389/fphar.2025.1479666