Skip to content

Commit

Permalink
Added combine_discovery_validation() (#1)
Browse files Browse the repository at this point in the history
  • Loading branch information
wleoncio committed Jan 14, 2025
1 parent 9d4f420 commit 0061c99
Showing 1 changed file with 19 additions and 0 deletions.
19 changes: 19 additions & 0 deletions src/pCRscore/pipeline.py
Original file line number Diff line number Diff line change
Expand Up @@ -41,3 +41,22 @@ def fit_line(data):
ci = model.conf_int(alpha=0.001).loc['Fraction']
result.append({'Feature': name, 'Coef': coef, 'CI': ci[0] * ci[1]})
return pandas.DataFrame(result)


def combine_discovery_validation(data_disc, data_valid, fit_disc, fit_valid):
    """Pool both cohorts, keeping only features supported by both fits.

    The two fit tables are inner-joined on ``Feature``. A feature survives
    when its coefficients have the same sign in both tables and its ``CI``
    value is strictly positive in both.

    Parameters
    ----------
    data_disc, data_valid
        Discovery and validation data; each needs a ``Feature`` column.
    fit_disc, fit_valid
        Fit summaries with ``Feature``, ``Coef`` and ``CI`` columns.
        NOTE(review): presumably produced by ``fit_line``, where ``CI`` is
        the product of the confidence-interval bounds (positive when the
        interval excludes zero) -- confirm against callers.

    Returns
    -------
    pandas.DataFrame
        Rows of ``data_disc`` followed by rows of ``data_valid`` whose
        ``Feature`` passed the filter. Original index labels are kept, so
        they may repeat across the two cohorts.
    """
    # Side-by-side view of both fits; only features present in both remain.
    merged_fits = pandas.merge(
        left=fit_valid,
        right=fit_disc,
        on="Feature",
        suffixes=("_Valid", "_Discv"),
    )

    # A positive product means both coefficients point in the same direction.
    same_direction = merged_fits['Coef_Discv'] * merged_fits['Coef_Valid'] > 0
    clear_in_valid = merged_fits['CI_Valid'] > 0
    clear_in_discv = merged_fits['CI_Discv'] > 0
    passing_features = merged_fits.loc[
        same_direction & clear_in_valid & clear_in_discv, 'Feature'
    ]

    # Stack the cohorts row-wise, then drop features that failed validation.
    pooled = pandas.concat([data_disc, data_valid], axis=0)
    keep_rows = pooled['Feature'].isin(passing_features)
    return pooled[keep_rows]

0 comments on commit 0061c99

Please sign in to comment.