From 0757b6bf8be93ce2859a4adde10b4f78c5901aeb Mon Sep 17 00:00:00 2001 From: Erik de Vries Date: Thu, 2 May 2019 13:15:56 +0200 Subject: [PATCH] dfm_gen: re-added codes variable --- R/dfm_gen.R | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/R/dfm_gen.R b/R/dfm_gen.R index d079a58..fde93a2 100644 --- a/R/dfm_gen.R +++ b/R/dfm_gen.R @@ -31,14 +31,15 @@ dfm_gen <- function(out, words = '999', text = "lemmas", clean, cores = detectCo } if ('_source.codes.majorTopic' %in% colnames(out)) { out <- out %>% + mutate(codes = .$`_source.codes.majorTopic`) %>% mutate(junk = case_when( - .$`_source.codes.majorTopic` == 92 ~ 1, - .$`_source.codes.majorTopic` == 91 ~ 1, - .$`_source.codes.majorTopic` == 93 ~ 1, + .$codes == 92 ~ 1, + .$codes == 91 ~ 1, + .$codes == 93 ~ 1, TRUE ~ 0 ) ) %>% - mutate(aggregate = .$`_source.codes.majorTopic` %>% + mutate(aggregate = .$codes %>% str_pad(4, side="right", pad="a") %>% str_match("([0-9]{1,2})?[0|a][1-9|a]") %>% .[,2] %>%