tlverse
diff --git a/.Rbuildignore b/.Rbuildignore
+32-8
diff --git a/.gitignore b/.gitignore
+6-2
diff --git a/DESCRIPTION b/DESCRIPTION
+18-13
diff --git a/R/LF_rule.R b/R/LF_rule.R
+2-2
diff --git a/R/Optimal_Rule_Q_learning.R b/R/Optimal_Rule_Q_learning.R
+6-6
diff --git a/R/Optimal_Rule_Revere.R b/R/Optimal_Rule_Revere.R
+70-73
@@ -1,10 +1,34 @@
+^\.git
+^\.git/*
+^\.gitignore$
 ^.*\.Rproj$
 ^\.Rproj\.user$
-^README-refs.bib
-^README.Rmd
-^README.knit.md
-^README.utf8.md
-^Simulations/
-^sandbox/
-^vignette/
-^Makefile
+^README\.md
+
+# Automated testing files.
+^travis\.yml$
+^appveyor\.yml$
+^codecov\.yml$
+# Files from building the Guide-to-SuperLearner.rmd vignette.
+^SuperLearner.png$
+^vignettes/[^/]*_cache
+# other miscellaneous non-CRAN files
+xgboost.model
+deploy.sh
+^sandbox$
+^Simulations$
+^vignette$
+^docs$
+^README\.Rmd$
+^README\.utf8.md$
+^README\.knit.md$
+^README-.*\.Rmd$
+^README\.html$
+^README-.*\.png$
+^README-refs.bib$
+^cran-comments.md$
+^CONTRIBUTING\.md$
+^Makefile$
+^LICENSE$
+man-roxygen
+^_pkgdown\.yml$
@@ -2,6 +2,10 @@
 .Rhistory
 .RData
 .Ruserdata
+.future
+README.html
+vignettes/*.html
+
+# macOS files
 .DS_Store
-tmle3mopttx.Rproj
-.DS_Store
+inst/doc
@@ -1,5 +1,6 @@
 Package: tmle3mopttx
-Title: Targeted Maximum Likelihood Estimation of the Mean under Optimal Individualized Treatment
+Title: Targeted Maximum Likelihood Estimation of the Mean under Optimal
+    Individualized Treatment
 Version: 0.1.0
 Authors@R: c(
     person("Ivana", "Malenica", email = "[email protected]",
@@ -10,32 +11,36 @@ Authors@R: c(
            comment = c(ORCID = "0000-0002-9874-6649")),
     person("Mark", "van der Laan", email = "[email protected]",
            role = c("aut", "ths")))
-Description: This package estimates the optimal individualized treatment rule for the categorical treatment
-  using Super Learner (sl3). In order to avoid nesting cross-validation, it uses split-specific estimates 
-  of Q and g to estimate the rule as described by Coyle et al. In addition it provides the Targeted Maximum
-  Likelihood estimates of the mean performance using CV-TMLE under such estimated rules. This is an 
-  adapter package for use with the tmle3 framework and the tlverse software ecosystem for Targeted Learning.
-Depends: R (>= 3.5.0)
+Description: This package estimates the optimal individualized treatment rule
+    for a categorical treatment using Super Learner (sl3). In order to avoid
+    nested cross-validation, it uses split-specific estimates of Q and g to
+    estimate the rule, as described by Coyle et al. In addition, it provides
+    Targeted Maximum Likelihood estimates of the mean performance using CV-TMLE
+    under such estimated rules. This is an adapter package for use with the
+    tmle3 framework and the tlverse software ecosystem for Targeted Learning.
+Depends: R (>= 3.4.0)
 License: GPL-3
 Encoding: UTF-8
 LazyData: true
 LazyLoad: yes
 Imports:
-    data.table,
-    assertthat,
     R6,
     uuid,
+    stats,
     methods,
-    stats
+    data.table,
+    assertthat,
+    sl3,
+    tmle3
 Suggests:
     testthat,
     knitr,
     rmarkdown
 Remotes:
-    github::tlverse/tmle3,
-    github::tlverse/sl3,
+    github::tlverse/delayed,
     github::tlverse/origami,
-    github::tlverse/delayed
+    github::tlverse/sl3,
+    github::tlverse/tmle3
 BugReports: https://github.com/tlverse/tmle3mopttx/issues
 VignetteBuilder: knitr
 RoxygenNote: 6.1.1
@@ -14,9 +14,9 @@
 #'   \code{define_lf(LF_static, name, type, value, ...)}
 #'
 #'   \describe{
-#'     \item{\code{name}}{character, the name of the factor. Should match a node name 
+#'     \item{\code{name}}{character, the name of the factor. Should match a node name
 #'     in the nodes specified by tmle3_Task.}
-#'     
+#'
 #'     \item{\code{type}}{character, either 'density' for conditional density, or 'mean' for conditional mean
 #'     }
 #'     \item{\code{value}}{the static value
 
@@ -24,14 +24,14 @@ Optimal_Rule_Q_learning <- R6Class(
       # todo: function
       A_vals <- tmle_task$npsem$A$variable_type$levels
       A_vals <- factor(A_vals, A_vals)
-      
+
       # Generate counterfactual tasks for each value of A:
       cf_tasks <- lapply(A_vals, function(A_val) {
-        #if(is.character(A_val)){
+        # if(is.character(A_val)){
         #  A_val<-as.numeric(A_val)
-          #A_val<-as.factor(A_val)
-        #}
-        A_val<-as.numeric(A_val)
+        # A_val<-as.factor(A_val)
+        # }
+        A_val <- as.numeric(A_val)
         newdata <- data.table(A = A_val)
         cf_task <- tmle_task$generate_counterfactual_task(UUIDgenerate(), new_data = newdata)
         return(cf_task)
@@ -40,7 +40,7 @@ Optimal_Rule_Q_learning <- R6Class(
       private$.cf_tasks <- cf_tasks
     },
 
-    rule = function(tmle_task, fold_number="full") {
+    rule = function(tmle_task, fold_number = "full") {
       # Get Q(a,W) for each level of A, all folds
       blip_fin <- sapply(private$.cf_tasks, private$.likelihood$get_likelihood, "Y", fold_number)
 
 
@@ -1,6 +1,6 @@
 #' Learns the Optimal Rule given a tmle_task and likelihood, using the Revere framework.
 #' Complements 'tmle3_Spec_mopttx_blip_revere'.
-#' 
+#'
 #'
 #' @importFrom R6 R6Class
 #' @importFrom data.table data.table
@@ -14,16 +14,16 @@ Optimal_Rule_Revere <- R6Class(
   inherit = tmle3_Spec,
   lock_objects = FALSE,
   public = list(
-    initialize = function(tmle_task, likelihood, fold_number = "split-specific", V = NULL, 
-                          blip_type = "blip2", learners, maximize = TRUE, realistic=FALSE) {
+    initialize = function(tmle_task, likelihood, fold_number = "split-specific", V = NULL,
+                              blip_type = "blip2", learners, maximize = TRUE, realistic = FALSE) {
       private$.tmle_task <- tmle_task
       private$.likelihood <- likelihood
       private$.fold_number <- fold_number
       private$.blip_type <- blip_type
       private$.learners <- learners
       private$.maximize <- maximize
       private$.realistic <- realistic
-      
+
       if (missing(V)) {
         V <- tmle_task$npsem$W$variables
       }
@@ -47,64 +47,63 @@ Optimal_Rule_Revere <- R6Class(
       DR <- data.frame(private$.DR_full[[v]])
       return(data.frame(DR[indx, ]))
     },
-    
-    blip_revere_function = function(tmle_task, fold_number){
-      
+
+    blip_revere_function = function(tmle_task, fold_number) {
       likelihood <- self$likelihood
       A_vals <- tmle_task$npsem$A$variable_type$levels
       V <- self$V
-      
+
       # Generate counterfactual tasks for each value of A:
       cf_tasks <- lapply(A_vals, function(A_val) {
-        if(is.character(A_val)){
-          A_val<-as.numeric(A_val)
-          #A_val<-as.factor(A_val)
+        if (is.character(A_val)) {
+          A_val <- as.numeric(A_val)
+          # A_val<-as.factor(A_val)
         }
         newdata <- data.table(A = A_val)
         cf_task <- tmle_task$generate_counterfactual_task(UUIDgenerate(), new_data = newdata)
         return(cf_task)
       })
-      
+
       # DR A-IPW mapping of blip
       A <- tmle_task$get_tmle_node("A")
       Y <- tmle_task$get_tmle_node("Y")
       A_vals <- tmle_task$npsem$A$variable_type$levels
-      A_ind <- self$factor_to_indicators(A,A_vals)
+      A_ind <- self$factor_to_indicators(A, A_vals)
       Y_mat <- replicate(length(A_vals), Y)
-      
-      #Use fold_number fits for Q and g:
+
+      # Use fold_number fits for Q and g:
       Q_vals <- sapply(cf_tasks, likelihood$get_likelihood, "Y", fold_number)
       g_vals <- sapply(cf_tasks, likelihood$get_likelihood, "A", fold_number)
       DR <- (A_ind / g_vals) * (Y_mat - Q_vals) + Q_vals
 
       # Type of pseudo-blip:
       blip_type <- self$blip_type
-      
-      if(blip_type=="blip1"){
-        blip <- DR[,2] - DR[,1]
-      }else if(blip_type=="blip2"){
+
+      if (blip_type == "blip1") {
+        blip <- DR[, 2] - DR[, 1]
+      } else if (blip_type == "blip2") {
         blip <- DR - rowMeans(DR)
-      }else if(blip_type=="blip3"){
+      } else if (blip_type == "blip3") {
         blip <- DR - (rowMeans(DR) * g_vals)
       }
-      
-      #TO DO: Nicer solutions. Do it one by one, for now
-      if(is.null(V)){
-        data <- data.table(V=blip,blip=blip)
+
+      # TO DO: Nicer solutions. Do it one by one, for now
+      if (is.null(V)) {
+        data <- data.table(V = blip, blip = blip)
         outcomes <- grep("blip", names(data), value = TRUE)
         V <- grep("V", names(data), value = TRUE)
-        revere_task <- make_sl3_Task(data, outcome=outcomes, covariates=V, folds=tmle_task$folds)
-      }else{
-        V <- tmle_task$data[,self$V,with=FALSE]
-        data <- data.table(V,blip=blip)
+        revere_task <- make_sl3_Task(data, outcome = outcomes, covariates = V, folds = tmle_task$folds)
+      } else {
+        V <- tmle_task$data[, self$V, with = FALSE]
+        data <- data.table(V, blip = blip)
         outcomes <- grep("blip", names(data), value = TRUE)
-        revere_task <- make_sl3_Task(data, outcome=outcomes, covariates=self$V, folds=tmle_task$folds)
+        revere_task <- make_sl3_Task(data, outcome = outcomes, covariates = self$V, folds = tmle_task$folds)
       }
-      
+
 
       return(revere_task)
     },
-    
+
     bound = function(cv_g) {
       cv_g[cv_g < 0.01] <- 0.01
       cv_g[cv_g > 0.99] <- 0.99
@@ -123,81 +122,79 @@ Optimal_Rule_Revere <- R6Class(
       private$.blip_fit <- blip_fit
     },
 
-    rule = function(tmle_task, fold_number="full") {
-      
+    rule = function(tmle_task, fold_number = "full") {
       realistic <- private$.realistic
       likelihood <- self$likelihood
-      
+
       # TODO: when applying the rule, we actually only need the covariates
       blip_task <- self$blip_revere_function(tmle_task, fold_number)
       blip_preds <- self$blip_fit$predict_fold(blip_task, fold_number)
-      
+
       # Type of pseudo-blip:
       blip_type <- self$blip_type
-      
-      if(is.list(blip_preds)){
+
+      if (is.list(blip_preds)) {
         blip_preds <- unpack_predictions(blip_preds)
       }
-      
+
       rule_preds <- NULL
-      
-      if(realistic){
-        
-        #Need to grab the propensity score:
+
+      if (realistic) {
+
+        # Need to grab the propensity score:
         g_learner <- likelihood$factor_list[["A"]]$learner
         g_task <- tmle_task$get_regression_task("A")
         g_fits <- unpack_predictions(g_learner$predict(g_task))
-        
+
         if (!private$.maximize) {
           blip_preds <- blip_preds * -1
         }
-        
-        if(blip_type == "blip1"){
+
+        if (blip_type == "blip1") {
           rule_preds <- as.numeric(blip_preds > 0)
-        
-          for(i in 1:length(rule_preds)){
-            rule_preds_prob<-g_fits[i,]
-            #TO DO: What is a realistic cutoff here?
-            if(rule_preds_prob<0.05){
-              #Switch- assumes options are 0 and 1.
+
+          for (i in 1:length(rule_preds)) {
+            rule_preds_prob <- g_fits[i, ]
+            # TO DO: What is a realistic cutoff here?
+            if (rule_preds_prob < 0.05) {
+              # Switch- assumes options are 0 and 1.
               rule_preds[i] <- abs(rule_preds[i] - 1)
             }
           }
-          
-        }else{
-          if(dim(blip_preds)[2]<3){
+        } else {
+          if (dim(blip_preds)[2] < 3) {
             rule_preds <- max.col(blip_preds) - 1
-            for(i in 1:length(rule_preds)){
-              rule_preds_prob<-g_fits[i,rule_preds[i]]
-              #TO DO: What is a realistic cutoff here?
-              if(rule_preds_prob<0.05){
-                #Pick the next largest blip
-                rule_preds[i] <- max.col(blip_preds[i,order(blip_preds[i,], decreasing = TRUE)[2]])
+            for (i in 1:length(rule_preds)) {
+              rule_preds_prob <- g_fits[i, rule_preds[i]]
+              # TO DO: What is a realistic cutoff here?
+              if (rule_preds_prob < 0.05) {
+                # Pick the next largest blip
+                rule_preds[i] <- max.col(blip_preds[i, order(blip_preds[i, ], decreasing = TRUE)[2]])
               }
             }
-          }else{
+          } else {
             rule_preds <- max.col(blip_preds)
-            for(i in 1:length(rule_preds)){
-              rule_preds_prob<-g_fits[i,rule_preds[i]]
-              #TO DO: What is a realistic cutoff here?
-              if(rule_preds_prob<0.07){
-                #Pick the next largest blip
-                rule_preds[i] <- order(blip_preds[i,], decreasing = TRUE)[2] 
+            for (i in 1:length(rule_preds)) {
+              rule_preds_prob <- g_fits[i, rule_preds[i]]
+              # TO DO: What is a realistic cutoff here?
+              if (rule_preds_prob < 0.07) {
+                # Pick the next largest blip
+                rule_preds[i] <- order(blip_preds[i, ], decreasing = TRUE)[2]
               }
             }
           }
         }
-      }else{
+      } else {
         if (!private$.maximize) {
           blip_preds <- blip_preds * -1
         }
-        
-        if(blip_type == "blip1"){
+
+        if (blip_type == "blip1") {
           rule_preds <- as.numeric(blip_preds > 0)
-        }else{
-          if(dim(blip_preds)[2]<3){
+        } else {
+          if (dim(blip_preds)[2] < 3) {
             rule_preds <- max.col(blip_preds) - 1
-          }else{
+          } else {
             rule_preds <- max.col(blip_preds)
           }
         }