.RData deleted 100644 → 0
File deleted
.Rhistory deleted 100644 → 0
facet_wrap( ~ group, scales="free",
labeller=names
#labeller(group = label_facet(df$group, "grouping"))
)+
theme_bw()
p
}
# Call figure() on the NED element of new_lst; at top level the returned plot is printed.
figure(new_lst$NED)
# Build a horizontal bar chart of Num_id per Years value, one panel per group.
#
# df: data frame providing the Years, Num_id and group columns referenced by
#     the aesthetics and the facet formula below.
# Returns the ggplot object.
#
# NOTE(review): labeller = names hands base::names to facet_wrap() -- confirm
# the strip labels come out as intended.
figure <- function(df) {
  # Axis labels are wrapped at 32 characters (earlier runs: 20 for most sheets, 35 for NED).
  wrap_labels <- function(x) str_wrap(x, width = 32)

  ggplot(df, aes(x = Years, y = Num_id)) +
    geom_bar(
      stat = "identity",
      position = position_dodge(width = 0.8),
      width = 0.5,
      fill = "limegreen"
    ) +
    coord_flip() +
    labs(
      title = "Number of common ID",
      fill = "Years",
      x = "Years",
      y = "Number of common ID"
    ) +
    geom_text(aes(label = Num_id), vjust = 0.5, colour = "black", size = 3.5) +
    theme(
      axis.text.x = element_text(
        color = "black", size = 6, angle = 0, vjust = .8, hjust = 0.8
      )
    ) +
    scale_x_discrete(labels = wrap_labels) +
    facet_wrap(~ group, scales = "free", labeller = names) +
    # theme_bw() stays last, exactly as before.
    theme_bw()
}
# Re-draw the NED plot with the figure() definition entered just above.
figure(new_lst$NED)
# Horizontal bar chart of Num_id by Years with one free-scaled panel per group.
# df must provide the Years, Num_id and group columns used below.
# Returns the assembled ggplot object.
figure <- function(df) {
  bars <- geom_bar(
    stat = "identity",
    position = position_dodge(width = 0.8),
    width = 0.5,
    fill = "limegreen"
  )
  value_labels <- geom_text(
    aes(label = Num_id),
    vjust = 0.5, colour = "black", size = 3.5
  )
  tick_text <- theme(
    axis.text.x = element_text(color = "black", size = 6, angle = 0, vjust = .8, hjust = 0.8)
  )
  # Wrap width 35 is the NED setting; the other sheets were drawn with 20.
  wrapped_axis <- scale_x_discrete(labels = function(x) str_wrap(x, width = 35))
  panels <- facet_wrap(~ group, scales = "free", labeller = names)

  # Components are added in the same order as before, theme_bw() last.
  ggplot(df, aes(x = Years, y = Num_id)) +
    bars +
    coord_flip() +
    labs(title = "Number of common ID", fill = "Years") +
    xlab("Years") +
    ylab("Number of common ID") +
    value_labels +
    tick_text +
    wrapped_axis +
    panels +
    theme_bw()
}
# Show the NED plot, then write one PNG per sheet (indices 1 to 28) below
# get.data.dir()/plots, named after the matching sheetsnames entry.
figure(new_lst$NED)
for (i in seq_len(28)) {
  p <- figure(new_lst[[i]])
  ggsave(
    filename = paste0(get.data.dir(), "/plots/", sheetsnames[i], "_plot.png"),
    plot = p,
    width = 12,
    height = 8
  )
}
# Draw Num_id against Years as flipped (horizontal) bars, faceted by group.
#
# df: data frame with the Years, Num_id and group columns.
# Returns the ggplot object.
figure <- function(df) {
  # Wrap axis labels at 20 characters (NED was drawn with 35 in other runs).
  wrap20 <- function(x) str_wrap(x, width = 20)

  chart <- ggplot(data = df, mapping = aes(x = Years, y = Num_id)) +
    geom_bar(
      stat = "identity",
      position = position_dodge(width = 0.8),
      width = 0.5,
      fill = "limegreen"
    ) +
    coord_flip() +
    labs(title = "Number of common ID", fill = "Years") +
    labs(x = "Years", y = "Number of common ID") +
    geom_text(aes(label = Num_id), vjust = 0.5, colour = "black", size = 3.5) +
    theme(axis.text.x = element_text(color = "black", size = 6, angle = 0, vjust = .8, hjust = 0.8)) +
    scale_x_discrete(labels = wrap20) +
    facet_wrap(~ group, scales = "free", labeller = names) +
    theme_bw()
  chart
}
# Inspect the first element of new_lst and list its names.
new_lst[[1]]
names(new_lst[[1]])
# Build a horizontal bar chart of Num_id per Years value, one panel per group.
#
# df: data frame with the Years, Num_id and group columns.
# n:  width passed to str_wrap() for the Years axis labels
#     (callers use 20 for most sheets and 35 for NED).
# Returns the ggplot object.
figure <- function(df, n) {
  ggplot(df, aes(x = Years, y = Num_id)) +
    geom_bar(
      stat = "identity",
      position = position_dodge(width = 0.8),
      width = 0.5,
      fill = "limegreen"
    ) +
    coord_flip() +
    labs(
      title = "Number of common ID",
      fill = "Years",
      x = "Years",
      y = "Number of common ID"
    ) +
    geom_text(aes(label = Num_id), vjust = 0.5, colour = "black", size = 3.5) +
    theme(
      axis.text.x = element_text(
        color = "black", size = 6, angle = 0, vjust = .8, hjust = 0.8
      )
    ) +
    scale_x_discrete(labels = function(x) str_wrap(x, width = n)) +
    facet_wrap(~ group, scales = "free", labeller = names) +
    theme_bw()
}
# Write one 12 x 8 PNG per sheet (indices 1 to 28) under get.data.dir()/plots.
# The NED sheet gets a label wrap width of 35, every other sheet 20.
for (i in seq_len(28)) {
  p <- if (sheetsnames[i] == "NED") {
    figure(new_lst[[i]], 35)
  } else {
    figure(new_lst[[i]], 20)
  }
  ggsave(
    filename = paste0(get.data.dir(), "/plots/", sheetsnames[i], "_plot.png"),
    plot = p,
    width = 12,
    height = 8
  )
}
# Build the NED figure once, display it, and save it at its final size.
# The earlier commands built the identical plot twice and wrote the same file
# three times (widths 12, 15 and 18); each write replaced the previous one, so
# only the last save is kept.
NED <- figure(new_lst$NED, 35)
NED
# NOTE(review): the name pieces concatenate to ".../plots/NED__plot.png"
# (two underscores), unlike the "NED_plot.png" written by the loops -- confirm
# that the separate file name is intended.
ggsave(
  plot = NED,
  filename = paste0(get.data.dir(), "/plots/", "NED_", "_plot.png"),
  width = 18,
  height = 8
)
# Write one 18 x 8 PNG per sheet (indices 1 to 28) under get.data.dir()/plots;
# label wrap width is 35 for NED and 20 for all other sheets.
for (i in seq_len(28)) {
  p <- figure(new_lst[[i]], if (sheetsnames[i] == "NED") 35 else 20)
  ggsave(
    filename = paste0(get.data.dir(), "/plots/", sheetsnames[i], "_plot.png"),
    plot = p,
    width = 18,
    height = 8
  )
}
# Horizontal bar chart of Num_id by Years, faceted by group, titled per country.
#
# country: text appended to the plot title.
# df:      data frame with the Years, Num_id and group columns.
# n:       width passed to str_wrap() for the Years axis labels.
# Returns the ggplot object.
figure <- function(country, df, n) {
  plot_title <- paste0("Plot of the Number of common ID for country:", country)

  bars <- geom_bar(
    stat = "identity",
    position = position_dodge(width = 0.8),
    width = 0.5,
    fill = "limegreen"
  )
  value_labels <- geom_text(
    aes(label = Num_id),
    vjust = 0.5, colour = "black", size = 3.5
  )
  tick_text <- theme(
    axis.text.x = element_text(color = "black", size = 6, angle = 0, vjust = .8, hjust = 0.8)
  )
  wrapped_axis <- scale_x_discrete(labels = function(x) str_wrap(x, width = n))
  panels <- facet_wrap(~ group, scales = "free", labeller = names)

  # Same component order as before, with theme_bw() applied last.
  ggplot(df, aes(x = Years, y = Num_id)) +
    bars +
    coord_flip() +
    labs(title = plot_title, fill = "Years") +
    xlab("Years") +
    ylab("Number of common ID") +
    value_labels +
    tick_text +
    wrapped_axis +
    panels +
    theme_bw()
}
# Write one 18 x 8 PNG per sheet (indices 1 to 28) under get.data.dir()/plots.
# The sheet name doubles as the country shown in the title; NED labels wrap at
# 35 characters, all others at 20.
for (i in seq_len(28)) {
  p <- if (sheetsnames[i] == "NED") {
    figure(sheetsnames[i], new_lst[[i]], 35)
  } else {
    figure(sheetsnames[i], new_lst[[i]], 20)
  }
  ggsave(
    filename = paste0(get.data.dir(), "/plots/", sheetsnames[i], "_plot.png"),
    plot = p,
    width = 18,
    height = 8
  )
}
# Horizontal bar chart of Num_id by Years, faceted by group, with a centered
# per-country title.
#
# country: text appended to the plot title.
# df:      data frame with the Years, Num_id and group columns.
# n:       width passed to str_wrap() for the Years axis labels.
# Returns the ggplot object.
figure <- function(country, df, n) {
  p <- ggplot(df, aes(x = Years, y = Num_id)) +
    geom_bar(
      stat = "identity",
      position = position_dodge(width = 0.8),
      width = 0.5,
      fill = "limegreen"
    ) +
    coord_flip() +
    xlab("Years") +
    ylab("Number of common ID") +
    geom_text(aes(label = Num_id), vjust = 0.5, colour = "black", size = 3.5) +
    # NOTE(review): this axis.text.x setting is still replaced by theme_bw()
    # below; it is left in place so the tick labels look as they did before.
    # Move it after theme_bw() if the size-6 tick text is actually wanted.
    theme(axis.text.x = element_text(color = "black", size = 6, angle = 0, vjust = .8, hjust = 0.8)) +
    scale_x_discrete(labels = function(x) str_wrap(x, width = n)) +
    facet_wrap(~ group, scales = "free", labeller = names) +
    ggtitle(paste0("Plot of the number of common ID for country: ", country)) +
    # theme_bw() is a complete theme and replaces every theme setting added
    # before it, so the title centering has to come afterwards to take effect.
    theme_bw() +
    ggeasy::easy_center_title()
  p
}
# Regenerate the 28 per-sheet PNGs (18 x 8) under get.data.dir()/plots with the
# current figure() definition; wrap width 35 for NED, 20 otherwise.
for (i in seq_len(28)) {
  p <- figure(
    sheetsnames[i],
    new_lst[[i]],
    if (sheetsnames[i] == "NED") 35 else 20
  )
  ggsave(
    filename = paste0(get.data.dir(), "/plots/", sheetsnames[i], "_plot.png"),
    plot = p,
    width = 18,
    height = 8
  )
}
# Horizontal bar chart of Num_id by Years, faceted by group, with a centered
# per-country title.
#
# country: text appended to the plot title.
# df:      data frame with the Years, Num_id and group columns.
# n:       width passed to str_wrap() for the Years axis labels.
# Returns the ggplot object.
figure <- function(country, df, n) {
  p <- ggplot(df, aes(x = Years, y = Num_id)) +
    geom_bar(
      stat = "identity",
      position = position_dodge(width = 0.8),
      width = 0.5,
      fill = "limegreen"
    ) +
    coord_flip() +
    xlab("Years") +
    ylab("Number of common ID") +
    geom_text(aes(label = Num_id), vjust = 0.5, colour = "black", size = 3.5) +
    # NOTE(review): this axis.text.x setting is still replaced by theme_bw()
    # below; it is left in place so the tick labels look as they did before.
    theme(axis.text.x = element_text(color = "black", size = 6, angle = 0, vjust = .8, hjust = 0.8)) +
    scale_x_discrete(labels = function(x) str_wrap(x, width = n)) +
    facet_wrap(~ group, scales = "free", labeller = names) +
    ggtitle(paste0("Plot of the number of common ID for country: ", country)) +
    # Previously theme_update() was added here. That function changes the
    # session-wide default theme and returns the old theme, so it neither
    # centered this plot's title nor stayed local to the plot. A plain theme()
    # call placed after the complete theme_bw() does what was intended.
    theme_bw() +
    theme(plot.title = element_text(hjust = 0.5))
  p
}
# Save the 28 per-sheet plots again as 18 x 8 PNGs under get.data.dir()/plots.
# NED uses a label wrap width of 35, the remaining sheets 20.
for (i in seq_len(28)) {
  p <- if (sheetsnames[i] == "NED") {
    figure(sheetsnames[i], new_lst[[i]], 35)
  } else {
    figure(sheetsnames[i], new_lst[[i]], 20)
  }
  ggsave(
    plot = p,
    width = 18,
    height = 8,
    filename = paste0(get.data.dir(), "/plots/", sheetsnames[i], "_plot.png")
  )
}
# Horizontal bar chart of Num_id by Years, faceted by group, with a centered
# per-country title.
#
# country: text appended to the plot title.
# df:      data frame with the Years, Num_id and group columns.
# n:       width passed to str_wrap() for the Years axis labels.
# Returns the ggplot object.
figure <- function(country, df, n) {
  p <- ggplot(df, aes(x = Years, y = Num_id)) +
    geom_bar(
      stat = "identity",
      position = position_dodge(width = 0.8),
      width = 0.5,
      fill = "limegreen"
    ) +
    coord_flip() +
    xlab("Years") +
    ylab("Number of common ID") +
    geom_text(aes(label = Num_id), vjust = 0.5, colour = "black", size = 3.5) +
    # NOTE(review): this axis.text.x setting is still replaced by theme_bw()
    # below; it is left in place so the tick labels look as they did before.
    theme(axis.text.x = element_text(color = "black", size = 6, angle = 0, vjust = .8, hjust = 0.8)) +
    scale_x_discrete(labels = function(x) str_wrap(x, width = n)) +
    facet_wrap(~ group, scales = "free", labeller = names) +
    ggtitle(paste0("Plot of the number of common ID for country: ", country)) +
    # The complete theme goes first: when theme_bw() came last it replaced the
    # plot.title setting and the title stayed left-aligned.
    theme_bw() +
    theme(plot.title = element_text(hjust = 0.5))
  p
}
# Write the 28 per-sheet plots as 18 x 8 PNGs under get.data.dir()/plots;
# wrap width 35 for NED, 20 for every other sheet.
for (i in seq_len(28)) {
  p <- figure(sheetsnames[i], new_lst[[i]], if (sheetsnames[i] == "NED") 35 else 20)
  ggsave(
    filename = paste0(get.data.dir(), "/plots/", sheetsnames[i], "_plot.png"),
    plot = p,
    width = 18,
    height = 8
  )
}
# Show the working directory, then write the 28 per-sheet plots (18 x 8 PNG)
# into the "plots" sub-folder of the hard-coded common_id_plots directory.
getwd()
for (i in seq_len(28)) {
  p <- if (sheetsnames[i] == "NED") {
    figure(sheetsnames[i], new_lst[[i]], 35)
  } else {
    figure(sheetsnames[i], new_lst[[i]], 20)
  }
  ggsave(
    filename = paste0(
      "D:/public/data/fadn/lieferung_20210414/common_id_plots",
      "/plots/",
      sheetsnames[i],
      "_plot.png"
    ),
    plot = p,
    width = 18,
    height = 8
  )
}
# Write the 28 per-sheet plots (18 x 8 PNG) into the common_id_plots directory.
# NED labels wrap at 35 characters, all other sheets at 20.
for (i in 1:28) {
  p <- if (sheetsnames[i] == "NED") {
    figure(sheetsnames[i], new_lst[[i]], 35)
  } else {
    figure(sheetsnames[i], new_lst[[i]], 20)
  }
  # The directory needs its trailing "/": without it the sheet name was glued
  # onto the folder name and the files were written next to the folder
  # (e.g. ".../common_id_plots<sheet>_plot.png") instead of inside it.
  ggsave(
    plot = p,
    filename = paste0("D:/public/data/fadn/lieferung_20210414/common_id_plots/", sheetsnames[i], "_plot.png"),
    width = 18,
    height = 8
  )
}
# Write the 28 per-sheet plots as 18 x 8 PNGs directly into the hard-coded
# common_id_plots directory; wrap width 35 for NED, 20 otherwise.
for (i in seq_len(28)) {
  p <- figure(
    sheetsnames[i],
    new_lst[[i]],
    if (sheetsnames[i] == "NED") 35 else 20
  )
  ggsave(
    filename = paste0("D:/public/data/fadn/lieferung_20210414/common_id_plots/", sheetsnames[i], "_plot.png"),
    plot = p,
    width = 18,
    height = 8
  )
}
# Horizontal bar chart of Num_id by Years, faceted by group, with a centered
# per-country title and no fill legend.
#
# country: text appended to the plot title.
# df:      data frame with the Years, Num_id and group columns.
# n:       width passed to str_wrap() for the Years axis labels.
# Returns the ggplot object.
figure <- function(country, df, n) {
  p <- ggplot(df, aes(x = Years, y = Num_id)) +
    geom_bar(
      stat = "identity",
      position = position_dodge(width = 0.8),
      width = 0.5,
      fill = "limegreen"
    ) +
    coord_flip() +
    xlab("Years") +
    ylab("Number of common ID") +
    geom_text(aes(label = Num_id), vjust = 0.5, colour = "black", size = 3.5) +
    # NOTE(review): this axis.text.x setting is still replaced by theme_bw()
    # below; it is left in place so the tick labels look as they did before.
    theme(axis.text.x = element_text(color = "black", size = 6, angle = 0, vjust = .8, hjust = 0.8)) +
    scale_x_discrete(labels = function(x) str_wrap(x, width = n)) +
    facet_wrap(~ group, scales = "free", labeller = names) +
    # "none" is the supported way to switch a guide off; passing FALSE is
    # deprecated in current ggplot2.
    guides(fill = "none") +
    ggtitle(paste0("Plot of the number of common ID for country: ", country)) +
    # The complete theme goes first: when theme_bw() came last it replaced the
    # plot.title setting and the title stayed left-aligned.
    theme_bw() +
    theme(plot.title = element_text(hjust = 0.5))
  p
}
# Write the 28 per-sheet plots as 18 x 8 PNGs into the common_id_plots
# directory (wrap width 35 for NED, 20 otherwise), then look at the BEL data
# and draw its plot with a wrap width of 35.
for (i in seq_len(28)) {
  p <- if (sheetsnames[i] == "NED") {
    figure(sheetsnames[i], new_lst[[i]], 35)
  } else {
    figure(sheetsnames[i], new_lst[[i]], 20)
  }
  ggsave(
    filename = paste0("D:/public/data/fadn/lieferung_20210414/common_id_plots/", sheetsnames[i], "_plot.png"),
    plot = p,
    width = 18,
    height = 8
  )
}
new_lst$BEL
figure("BEL", new_lst$BEL, 35)
# Horizontal bar chart of Num_id by Years, faceted by group, with one rainbow
# colour per row of df and a centered per-country title.
#
# country: text appended to the plot title.
# df:      data frame with the Years, Num_id and group columns.
# n:       width passed to str_wrap() for the Years axis labels.
# Returns the ggplot object.
figure <- function(country, df, n) {
  # One fill colour per value of Num_id, i.e. per row of df.
  bar_fill <- rainbow(n = length(df$Num_id))

  p <- ggplot(df, aes(x = Years, y = Num_id)) +
    geom_bar(
      stat = "identity",
      position = position_dodge(width = 0.8),
      width = 0.5,
      fill = bar_fill
    ) +
    coord_flip() +
    xlab("Years") +
    ylab("Number of common ID") +
    geom_text(aes(label = Num_id), vjust = 0.5, colour = "black", size = 3.5) +
    # NOTE(review): this axis.text.x setting is still replaced by theme_bw()
    # below; it is left in place so the tick labels look as they did before.
    theme(axis.text.x = element_text(color = "black", size = 6, angle = 0, vjust = .8, hjust = 0.8)) +
    scale_x_discrete(labels = function(x) str_wrap(x, width = n)) +
    facet_wrap(~ group, scales = "free", labeller = names) +
    ggtitle(paste0("Plot of the number of common ID for country: ", country)) +
    # The complete theme goes first: when theme_bw() came last it replaced the
    # plot.title setting and the title stayed left-aligned.
    theme_bw() +
    theme(plot.title = element_text(hjust = 0.5))
  p
}
# Draw the BEL plot with the figure() definition entered just above (wrap width 35).
figure("BEL",new_lst$BEL, 35)
# Horizontal bar chart of Num_id by Years, faceted by group, with one rainbow
# colour per row of df and a centered per-country title.
#
# country: text appended to the plot title.
# df:      data frame with the Years, Num_id and group columns.
# n:       width passed to str_wrap() for the Years axis labels.
# Returns the ggplot object.
figure <- function(country, df, n) {
  p <- ggplot(df, aes(x = Years, y = Num_id)) +
    geom_bar(
      stat = "identity",
      position = position_dodge(width = 0.8),
      width = 0.5,
      fill = rainbow(n = length(df$Num_id))
    ) +
    coord_flip() +
    labs(x = "Years", y = "Number of common ID") +
    geom_text(aes(label = Num_id), vjust = 0.5, colour = "black", size = 3.5) +
    # NOTE(review): this axis.text.x setting is still replaced by theme_bw()
    # below; it is left in place so the tick labels look as they did before.
    theme(axis.text.x = element_text(color = "black", size = 6, angle = 0, vjust = .8, hjust = 0.8)) +
    scale_x_discrete(labels = function(x) str_wrap(x, width = n)) +
    facet_wrap(~ group, scales = "free", labeller = names) +
    ggtitle(paste0("Number of common ID for country: ", country)) +
    # theme_bw() must precede the title tweak: as the last component it
    # replaced the plot.title setting, leaving the title left-aligned.
    theme_bw() +
    theme(plot.title = element_text(hjust = 0.5))
  p
}
# Re-export the 28 per-sheet plots (18 x 8 PNG) into the common_id_plots
# directory; the wrap width is 35 for NED and 20 for every other sheet.
for (i in seq_len(28)) {
  p <- figure(sheetsnames[i], new_lst[[i]], if (sheetsnames[i] == "NED") 35 else 20)
  ggsave(
    plot = p,
    width = 18,
    height = 8,
    filename = paste0("D:/public/data/fadn/lieferung_20210414/common_id_plots/", sheetsnames[i], "_plot.png")
  )
}
# Horizontal bar chart of Num_id by Years, faceted by group, with one rainbow
# colour per row of df and a centered per-country title.
#
# country: text appended to the plot title.
# df:      data frame with the Years, Num_id and group columns.
# n:       width passed to str_wrap() for the Years axis labels.
# Returns the ggplot object.
figure <- function(country, df, n) {
  ggplot(df, aes(x = Years, y = Num_id)) +
    geom_bar(
      stat = "identity",
      position = position_dodge(width = 0.8),
      width = 0.5,
      fill = rainbow(n = length(df$Num_id))
    ) +
    coord_flip() +
    labs(x = "Years", y = "Number of common ID") +
    geom_text(aes(label = Num_id), vjust = 0.5, colour = "black", size = 3.5) +
    # NOTE(review): theme_bw() further down is a complete theme, so this
    # axis.text.x setting presumably has no visible effect -- confirm.
    theme(
      axis.text.x = element_text(
        color = "black", size = 6, angle = 0, vjust = .8, hjust = 0.8
      )
    ) +
    scale_x_discrete(labels = function(x) str_wrap(x, width = n)) +
    facet_wrap(~ group, scales = "free", labeller = names) +
    ggtitle(paste0("Number of common ID for country: ", country)) +
    # The title centering follows theme_bw() so that it is applied on top of it.
    theme_bw() +
    theme(plot.title = element_text(hjust = 0.5))
}
# Draw the BEL plot again with the updated figure() (wrap width 35).
figure("BEL",new_lst$BEL, 35)
# Per-country plot: flipped bars of Num_id by Years, one panel per group,
# rainbow-coloured bars, centered title.
#
# country: text appended to the plot title.
# df:      data frame with the Years, Num_id and group columns.
# n:       width passed to str_wrap() for the Years axis labels.
# Returns the ggplot object.
figure <- function(country, df, n) {
  bars <- geom_bar(
    stat = "identity",
    position = position_dodge(width = 0.8),
    width = 0.5,
    fill = rainbow(n = length(df$Num_id))
  )
  value_labels <- geom_text(
    aes(label = Num_id),
    vjust = 0.5, colour = "black", size = 3.5
  )
  tick_text <- theme(
    axis.text.x = element_text(color = "black", size = 6, angle = 0, vjust = .8, hjust = 0.8)
  )
  wrapped_axis <- scale_x_discrete(labels = function(x) str_wrap(x, width = n))
  panels <- facet_wrap(~ group, scales = "free", labeller = names)
  centered_title <- theme(plot.title = element_text(hjust = 0.5))

  # Components are added in the original order; the title centering comes
  # after theme_bw().
  ggplot(df, aes(x = Years, y = Num_id)) +
    bars +
    coord_flip() +
    xlab("Years") +
    ylab("Number of common ID") +
    value_labels +
    tick_text +
    wrapped_axis +
    panels +
    ggtitle(paste0("Number of common ID for country: ", country)) +
    theme_bw() +
    centered_title
}
# Final export: one 18 x 8 PNG per sheet (indices 1 to 28) into the
# common_id_plots directory. NED labels wrap at 35 characters, others at 20.
for (i in seq_len(28)) {
  p <- if (sheetsnames[i] == "NED") {
    figure(sheetsnames[i], new_lst[[i]], 35)
  } else {
    figure(sheetsnames[i], new_lst[[i]], 20)
  }
  ggsave(
    filename = paste0("D:/public/data/fadn/lieferung_20210414/common_id_plots/", sheetsnames[i], "_plot.png"),
    plot = p,
    width = 18,
    height = 8
  )
}
# Make knitr echo the code of every chunk by default.
knitr::opts_chunk$set(echo = TRUE)
# Summarise the built-in cars dataset, plot the built-in pressure dataset and
# open pressure in the data viewer.
# NOTE(review): these look like the stock R Markdown template chunks -- confirm.
summary(cars)
plot(pressure)
View(pressure)
# Compare the country/year files found in the delivery folder with the
# country/year combinations marked "y" in the data request form.
knitr::opts_chunk$set(echo = TRUE)

# Attach every package before its first use. read_xlsx() comes from readxl,
# which used to be attached only after the first read_xlsx() call.
library(tidyverse)
library(readxl)
library(data.table)

file_names <- list.files("D:/public/data/fadn/lieferung_20210414/csv", include.dirs = TRUE)

# fixed = TRUE matches the literal text ".gpg"; as a regular expression the
# dot would match any character.
file_names_gpg <- file_names[grepl(".gpg", file_names, fixed = TRUE)]
length(file_names_gpg)
file_names <- file_names[!grepl(".gpg", file_names, fixed = TRUE)]

# Characters 1-3 of a file name are taken as the country, 4-7 as the year.
file_names <- tibble(name = file_names) %>%
  mutate(country = str_sub(name, 1, 3), year = str_sub(name, 4, 7))
file_names %>% print(n = 30)
file_names %>% group_by(year) %>% count()
file_names %>% filter(country == "POL")
file_names <- file_names %>% mutate(provided = "y")

# Request form: first column holds the country, the remaining columns are
# pivoted into one row per country and column name (used as the year).
data_requested_general <- read_xlsx(
  path = "D:/public/data/fadn/lieferung_20210414/FADN data request forms_March2021_MM210326.xlsx",
  sheet = 2,
  range = "A365:P393"
)
colnames(data_requested_general)[1] <- "country"
data_requested_general <- data_requested_general %>%
  mutate(country = str_sub(country, 2, 4))
data_requested_general_long <- data_requested_general %>% pivot_longer(-country)
data_requested_general_long <- data_requested_general_long %>%
  filter(value == "y") %>%
  rename(year = name, requested = value)

# Keep only the combinations that are on one side but not the other.
requested_and_provided <- data_requested_general_long %>%
  full_join(file_names %>% select(-name), by = c("country", "year")) %>%
  filter(is.na(requested) | is.na(provided))
## if empty, then everything is fine
requested_and_provided
# writexl::write_xlsx(x=requested_and_provided,path="D:/public/data/fadn/lieferung_20210414/missing_countries_years.xlsx")
# Read every delivered csv file with fread() and stack them into one table.
files_list <- list()
folder_csv <- "D:/public/data/fadn/lieferung_20210414/csv/"
system.time({
  files_list <- lapply(
    unique(pull(file_names, name)),
    function(csv_name) fread(input = paste0(folder_csv, csv_name))
  )
}) ## 41.16 ~ 76 sec
files <- rbindlist(files_list)
files %>%
  select(YEAR, COUNTRY, countryyear)
## Number of rows (sample farm observations, not unique) per country
files %>%
  select(YEAR, COUNTRY) %>%
  group_by(COUNTRY) %>%
  count() %>%
  print(n = 28)
## Distinct combinations of country and year in the data set
files %>%
  select(YEAR, COUNTRY) %>%
  group_by(COUNTRY) %>%
  distinct()
# Attach fadnUtils once; the six identical library() calls were redundant
# because attaching an already attached package does nothing further.
library(fadnUtils)
# Load the package source found in the current working directory.
# NOTE(review): presumably the fadnUtils development checkout -- confirm.
devtools::load_all(".")
# Compare the country/year files found in the delivery folder with the
# country/year combinations marked "y" in the data request form.
knitr::opts_chunk$set(echo = TRUE)
library(tidyverse)
library(readxl)
library(data.table)
library(skimr)

file_names <- list.files("D:/public/data/fadn/lieferung_20210414/csv", include.dirs = TRUE)

# fixed = TRUE matches the literal text ".gpg"; as a regular expression the
# dot would match any character.
is_gpg <- grepl(".gpg", file_names, fixed = TRUE)
file_names_gpg <- file_names[is_gpg]
length(file_names_gpg)
file_names <- file_names[!is_gpg]

# Characters 1-3 of a file name are taken as the country, 4-7 as the year.
# (The second library(tidyverse) call that stood here was redundant.)
file_names <- tibble(name = file_names) %>%
  mutate(country = str_sub(name, 1, 3), year = str_sub(name, 4, 7))
file_names %>% print(n = 30)
file_names %>% group_by(year) %>% count()
file_names %>% filter(country == "POL")
file_names <- file_names %>% mutate(provided = "y")

# Request form: first column holds the country, the remaining columns are
# pivoted into one row per country and column name (used as the year).
data_requested_general <- read_xlsx(
  path = "D:/public/data/fadn/lieferung_20210414/FADN data request forms_March2021_MM210326.xlsx",
  sheet = 2,
  range = "A365:P393"
)
colnames(data_requested_general)[1] <- "country"
data_requested_general <- data_requested_general %>%
  mutate(country = str_sub(country, 2, 4))
data_requested_general_long <- data_requested_general %>% pivot_longer(-country)
data_requested_general_long <- data_requested_general_long %>%
  filter(value == "y") %>%
  rename(year = name, requested = value)

# Keep only the combinations that are on one side but not the other.
requested_and_provided <- data_requested_general_long %>%
  full_join(file_names %>% select(-name), by = c("country", "year")) %>%
  filter(is.na(requested) | is.na(provided))
## if empty, then everything is fine
requested_and_provided
# writexl::write_xlsx(x=requested_and_provided,path="D:/public/data/fadn/lieferung_20210414/missing_countries_years.xlsx")