From a11d7728eac7ab0c0cfdd842c5d735777e66fa74 Mon Sep 17 00:00:00 2001 From: Erik de Vries Date: Mon, 13 May 2019 11:43:15 +0200 Subject: [PATCH] actor_aggregation: only aggregate scores on non-junk articles --- R/actor_aggregation.R | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/R/actor_aggregation.R b/R/actor_aggregation.R index cdea013..1d73b28 100644 --- a/R/actor_aggregation.R +++ b/R/actor_aggregation.R @@ -60,9 +60,9 @@ actor_aggregation <- function(row, actors, es_pwd, localhost, default_operator = ) } if (year > 0) { - query <- paste0('computerCodes.actors:(',paste(actorids, collapse = ' '),') && publication_date:[',year,'-01-01 TO ',year,'-12-31]') + query <- paste0('computerCodes.actors:(',paste(actorids, collapse = ' '),') && publication_date:[',year,'-01-01 TO ',year,'-12-31] && computerCodes.junk:0') } else { - query <- paste0('computerCodes.actors:(',paste(actorids, collapse = ' '),') && publication_date:[',actor$`_source.startDate`,' TO ',actor$`_source.endDate`,']') + query <- paste0('computerCodes.actors:(',paste(actorids, collapse = ' '),') && publication_date:[',actor$`_source.startDate`,' TO ',actor$`_source.endDate`,'] && computerCodes.junk:0') } out <- elasticizer(query_string(paste0('country:',actor$`_source.country`,' && ',query), fields = c('computerCodes.actorsDetail', 'doctype', 'publication_date'), default_operator = default_operator),