NOTE(review): this patch was recovered from a copy whose newlines had been
collapsed. Line breaks, blank context lines and the indentation of the
continued mutate() call were reconstructed to satisfy the hunk counts
(-40,12 +40,9); confirm against global.R before applying.

Summary of the change: raises the Jaro-Winkler max_dist of the fuzzy join
against `annuaire` from 0.25 to 0.265 and removes the leftover
`df` / `datatable()` inspection statements.

diff --git a/global.R b/global.R
index 915c8d77c76a932cf8da66080bfeeea5d985b441..1637e9ae4b0f25bcf067784252265bf3829375ce 100644
--- a/global.R
+++ b/global.R
@@ -40,12 +40,9 @@ all_data <- bind_rows(all_data_gitlab, all_data_forge, combined_data)
 all_data$updated_at <- as.POSIXct(all_data$updated_at, format = ("%Y-%m-%dT%H:%M:%S"))
 all_data <- all_data %>% mutate(message = paste0(type,sep = " : ",message),
                                 email_clean = str_remove(author, "@.*"))
-
-all_data <- all_data %>% stringdist_left_join(annuaire,by = c("email_clean" = "mail_clean"), method = "jw", max_dist = 0.25) # ajout de auteur des membre du SCTE via l'annuaire
+all_data <- all_data %>% stringdist_left_join(annuaire,by = c("email_clean" = "mail_clean"), method = "jw", max_dist = 0.265) # ajout de auteur des membre du SCTE via l'annuaire, 75% des auteurs sont du csd
 all_data <- all_data %>% dplyr::mutate(etiquette = paste(groupe,topics,sep = ","))
 
-df <- all_data %>% filter(!is.na(auteur)) %>% select(author,auteur)
-distinct(df)%>% datatable()
 
 # transformation re_code ----
 traduction <- c(