|
|
@ -16,7 +16,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
# filter(`_source.codes.timeSpent` != -1) %>% ### Exclude Norwegian summer sample hack
|
|
|
|
# filter(`_source.codes.timeSpent` != -1) %>% ### Exclude Norwegian summer sample hack
|
|
|
|
|
|
|
|
|
|
|
|
dfm_gen <- function(out,words = '999', text = c("lemmas","full")) {
|
|
|
|
dfm_gen <- function(out,words = '999', text = "lemmas") {
|
|
|
|
# Create subset with just ids, codes and text
|
|
|
|
# Create subset with just ids, codes and text
|
|
|
|
out <- out %>%
|
|
|
|
out <- out %>%
|
|
|
|
select(`_id`, matches("_source.*")) ### Keep only the id and anything belonging to the source field
|
|
|
|
select(`_id`, matches("_source.*")) ### Keep only the id and anything belonging to the source field
|
|
|
|