Skip to content

Commit

Permalink
issue 22 fix
Browse files Browse the repository at this point in the history
- adding code to address issue 22
- T is now restricted to first occurrence with a requirement of minPriorObservation days (a new input with default of 0)
- Includes characterization for T with O during and not during TAR plus T with O for the first time during and not during TAR
- added cohort_counts to the database and exported csvs that tell you how many patients are in allT, T, O, firstO, TnO, TnfirstO, TnOc and TnfirstOc
  • Loading branch information
jreps committed Mar 15, 2023
1 parent e848a05 commit 9d97421
Show file tree
Hide file tree
Showing 9 changed files with 390 additions and 103 deletions.
23 changes: 19 additions & 4 deletions R/AggregateCovariates.R
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,7 @@
#'
#' @param targetIds A list of cohortIds for the target cohorts
#' @param outcomeIds A list of cohortIds for the outcome cohorts
#' @param minPriorObservation The minimum time in the database a patient in the target cohorts must be observed prior to index
#' @template timeAtRisk
#' @param covariateSettings An object created using \code{FeatureExtraction::createCovariateSettings}
#'
Expand All @@ -28,6 +29,7 @@
createAggregateCovariateSettings <- function(
targetIds,
outcomeIds,
minPriorObservation = 0,
riskWindowStart = 1,
startAnchor = 'cohort start',
riskWindowEnd = 365,
Expand Down Expand Up @@ -57,19 +59,26 @@ createAggregateCovariateSettings <- function(
endAnchor = endAnchor,
errorMessages = errorMessages
)

# check covariateSettings
.checkCovariateSettings(
covariateSettings = covariateSettings,
errorMessages = errorMessages
)

# check minPriorObservation
.checkMinPriorObservation(
minPriorObservation = minPriorObservation,
errorMessages = errorMessages
)

checkmate::reportAssertions(errorMessages)

# create list
result <- list(
targetIds = targetIds,
outcomeIds = outcomeIds,
minPriorObservation = minPriorObservation,
riskWindowStart = riskWindowStart,
startAnchor = startAnchor,
riskWindowEnd = riskWindowEnd ,
Expand Down Expand Up @@ -126,6 +135,7 @@ computeAggregateCovariateAnalyses <- function(
createCohortsOfInterest(
connection = connection,
dbms = connectionDetails$dbms,
cdmDatabaseSchema = cdmDatabaseSchema,
aggregateCovariateSettings,
targetDatabaseSchema,
targetTable,
Expand All @@ -135,16 +145,16 @@ computeAggregateCovariateAnalyses <- function(
)

## get counts
sql <- 'select cohort_definition_id, count(*) N from #agg_cohorts group by cohort_definition_id;'
sql <- 'select cohort_definition_id, count(*) row_count, count(distinct subject_id) person_count from #agg_cohorts group by cohort_definition_id;'
sql <- SqlRender::translate(
sql = sql,
targetDialect = connectionDetails$dbms
)
counts <- DatabaseConnector::querySql(
connection = connection,
sql = sql
sql = sql,
snakeCaseToCamelCase = T,
)
#print(counts) # testing

message("Computing aggregate covariate results")

Expand All @@ -159,6 +169,8 @@ computeAggregateCovariateAnalyses <- function(
cdmVersion = cdmVersion,
aggregated = T
)
# adding counts as a new table
result$cohortCounts <- counts

# add databaseId and runId to each table in results
# could add settings table with this and just have setting id
Expand Down Expand Up @@ -234,6 +246,7 @@ computeAggregateCovariateAnalyses <- function(

createCohortsOfInterest <- function(
connection,
cdmDatabaseSchema,
dbms,
aggregateCovariateSettings,
targetDatabaseSchema,
Expand All @@ -247,13 +260,15 @@ createCohortsOfInterest <- function(
sqlFilename = "createTargetOutcomeCombinations.sql",
packageName = "Characterization",
dbms = dbms,
cdm_database_schema = cdmDatabaseSchema,
tempEmulationSchema = tempEmulationSchema,
target_database_schema = targetDatabaseSchema,
target_table = targetTable,
outcome_database_schema = outcomeDatabaseSchema,
outcome_table = outcomeTable,
target_ids = paste(aggregateCovariateSettings$targetIds, collapse = ',', sep = ','),
outcome_ids = paste(aggregateCovariateSettings$outcomeIds, collapse = ',', sep = ','),
min_prior_observation = aggregateCovariateSettings$minPriorObservation,
tar_start = aggregateCovariateSettings$riskWindowStart,
tar_start_anchor = ifelse(
aggregateCovariateSettings$startAnchor == 'cohort start',
Expand Down
12 changes: 12 additions & 0 deletions R/HelperFunctions.R
Original file line number Diff line number Diff line change
Expand Up @@ -241,3 +241,15 @@
add = errorMessages
)
}

.checkMinPriorObservation <- function(
minPriorObservation,
errorMessages
) {
checkmate::assertCount(
x = minPriorObservation,
null.ok = F,
.var.name = 'minPriorObservation',
add = errorMessages
)
}
35 changes: 34 additions & 1 deletion R/SaveLoad.R
Original file line number Diff line number Diff line change
Expand Up @@ -404,6 +404,38 @@ exportAggregateCovariateToCsv <- function(

}
)
# cohort details
Andromeda::batchApply(
tbl = result$cohortCounts,
fun = function(x) {

append <- file.exists(
file.path(
saveDirectory,
"cohort_counts.csv"
)
)

dat <- as.data.frame(
x %>%
dplyr::collect()
)

colnames(dat) <- SqlRender::camelCaseToSnakeCase(
string = colnames(dat)
)

readr::write_csv(
x = dat,
file = file.path(
saveDirectory,
"cohort_counts.csv"
),
append = append
)

}
)

# cohort details
Andromeda::batchApply(
Expand Down Expand Up @@ -577,7 +609,8 @@ exportAggregateCovariateToCsv <- function(
"analysis_ref.csv",
"covariate_ref.csv",
"covariates.csv",
"covariates_continuous.csv"
"covariates_continuous.csv",
"cohort_counts.csv"
)
)
)
Expand Down
Loading

0 comments on commit 9d97421

Please sign in to comment.