Lentil Diversity Panel
A population representing global genetic diversity in cultivated lentil varieties
Prepare Data
# devtools::install_github("derekmichaelwright/agData")
library(agData)
library(plotly) # plot_ly()
library(leaflet) # leaflet()
library(htmlwidgets) # saveWidget()
# Prep data
myCaption <- "www.dblogr.com/ or derekmichaelwright.github.io/dblogr/ | Data: AGILE"
rColors <- c("darkred", "darkgreen", "darkorange3", "steelblue", "grey")
cColors <- c("darkred", "darkorange3", "darkgoldenrod2", "deeppink3",
"steelblue", "darkorchid4", "cornsilk4", "darkgreen")
sColors <- c("deeppink3", "darkblue", "darkorchid4", "darkorange3", "steelblue",
"darkgoldenrod2", "darkred", "darkgreen", "cornsilk4")
#
dd <- read.csv("data_ldp.csv") %>%
mutate(DTF_Cluster = factor(DTF_Cluster))
Origins
Countries
# Prep data
xx <- dd %>%
group_by(Origin, Region) %>%
summarise(Count = n()) %>%
arrange(Count) %>%
mutate(Origin = factor(Origin, levels = .$Origin))
# Plot
mp <- ggplot(xx, aes(x = Origin, y = Count, fill = Region)) +
geom_col(color = "black", alpha = 0.7) +
facet_grid(. ~ Region, scales = "free", space = "free") +
scale_fill_manual(values = rColors) +
theme_agData(legend.position = "none",
panel.grid.major.x = element_blank(),
axis.text.x = element_text(angle = 45, hjust = 1)) +
labs(title = "Lentil Diversity Panel Origins", x = NULL,
caption = myCaption)
ggsave("lentil_diversity_panel_1_01.png", mp, width = 8, height = 4)
Map
# Prep data
xx <- dd %>%
mutate(Lat = ifelse(is.na(Lat), Country_Lat, Lat),
Lon = ifelse(is.na(Lon), Country_Lon, Lon),
Lat = ifelse(duplicated(Lat), jitter(Lat, 1, 1), Lat),
Lon = ifelse(duplicated(Lon), jitter(Lon, 1, 1), Lon),
Size = 1)
# Plot png
png("lentil_diversity_panel_1_02.png", width = 3600, height = 2055, res = 600)
par(mai = c(0.2,0,0.25,0), xaxs = "i", yaxs = "i")
mapBubbles2(dF = xx, nameX = "Lon", nameY = "Lat",
nameZColour = alpha("darkred",0.8),
nameZFill = alpha("darkgoldenrod2",0.8),
nameZSize = "Size", symbolSize = 0.2, addLegend = F,
#xlim = c(-140,110), ylim = c(5,20),
lwd = 1, oceanCol = "grey90", landCol = "white", borderCol = "black")
title(main = "Lentil Diversity Panel Origins", line = 0.25, cex = 3)
title(sub = myCaption, line = 0, cex.sub = 0.75, adj = 1)
dev.off()
Country Map
# Prep data
xx <- dd %>%
filter(Origin != "Unknown") %>%
mutate(Origin = recode(Origin, "ICARDA"="Syria", "USDA"="USA")) %>%
group_by(Origin, Country_Lat, Country_Lon) %>%
summarise(Count = n()) %>%
as.data.frame()
# Plot
png("lentil_diversity_panel_1_03.png", width = 3600, height = 2055, res = 600)
par(mai = c(0.2,0,0.25,0), xaxs = "i",yaxs = "i")
mapBubbles2(dF = xx, nameX = "Country_Lon", nameY = "Country_Lat",
nameZColour = alpha("darkgoldenrod2",0.8),
nameZFill = alpha("darkgreen",0.8),
nameZSize = "Count", legendPos = "bottomleft",
lwd = 1, oceanCol = "grey90", landCol = "white", borderCol = "black")
title(main = "Lentil Diversity Panel Origins", line = 0.25, cex = 3)
title(sub = myCaption, line = 0, cex.sub = 0.75, adj = 1)
dev.off()
Genotype PCA By Region
mp <- plot_ly(dd, x = ~myG_PC1, y = ~myG_PC3, z = ~myG_PC2,
color = ~Region, colors = rColors, hoverinfo = "text",
text = ~paste(Name,
"\nOrigin:", Origin,
"\nSource:", Source,
"\nCollDate:", CollDate,
"\nSTR_Group:", STR_Group,
"\nDTF_Cluster:", DTF_Cluster)) %>%
add_markers()
saveWidget(as_widget(mp), "lentil_diversity_panel_1_04.html")
Genetic Structure Analyis
Genotype Composition
# Prep data
xx <- dd %>%
select(Name, Origin, Region, G1, G2, G3, G4, G5, G6, G7, G8) %>%
arrange(G1, G2, G3, G4, G5, G6, G7, G8) %>%
gather(Group, Value, G1, G2, G3, G4, G5, G6, G7, G8) %>%
mutate(Name = factor(Name, unique(Name)))
# Plot
mp <- ggplot(xx, aes(x = Name, y = Value, fill = Group)) +
geom_col(position = "stack") +
scale_fill_manual(name = NULL, values = sColors) +
guides(fill = guide_legend(nrow = 1)) +
theme_agData(legend.position = "bottom",
axis.ticks.x = element_blank(),
axis.text.x = element_blank()) +
labs(title = "Lentil Diversity Panel", y = NULL, x = NULL,
caption = myCaption)
ggsave("lentil_diversity_panel_2_01.png", mp, width = 10, height = 4)
Genotype Composition By Region
# Prep data
xx <- dd %>%
select(Name, Origin, Region, G1, G2, G3, G4, G5, G6, G7, G8) %>%
arrange(G1, G2, G3, G4, G5, G6, G7, G8) %>%
gather(Group, Value, G1, G2, G3, G4, G5, G6, G7, G8) %>%
mutate(Name = factor(Name, unique(Name)))
# Plot
mp <- ggplot(xx, aes(x = Name, y = Value, fill = Group)) +
geom_col(position = "stack") +
facet_grid(. ~ Region, scales = "free_x", space = "free_x") +
scale_fill_manual(name = NULL, values = sColors) +
guides(fill = guide_legend(nrow = 1)) +
theme_agData(legend.position = "bottom",
axis.ticks.x = element_blank(),
axis.text.x = element_blank()) +
labs(title = "Lentil Diversity Panel", y = NULL, x = NULL,
caption = myCaption)
ggsave("lentil_diversity_panel_2_02.png", mp, width = 10, height = 4)
Genetic Structure Pie Map
# Prep data
myG <- c("G1","G2","G3","G4","G5","G6","G7","G8", "Mix")
xx <- dd %>%
filter(!Origin %in% c("ICARDA","USDA","Unknown")) %>%
group_by(Origin, STR_Group, Country_Lat, Country_Lon) %>%
summarise(Count = n()) %>%
spread(STR_Group, Count) %>%
as.data.frame()
# Plot
png("lentil_diversity_panel_2_03.png", width = 3600, height = 2055, res = 600)
par(mai = c(0.2,0,0.25,0), xaxs = "i", yaxs = "i")
mapPies(dF = xx, nameX = "Country_Lon", nameY = "Country_Lat",
zColours = sColors, nameZs = myG, addCatLegend = F, lwd = 1,
oceanCol = "grey90", landCol = "white", borderCol = "black")
legend(-170, 20, title = "STR Group", legend = myG, col = sColors,
pch = 16, cex = 0.8, pt.cex = 1.25, box.lwd = 2)
title(main = "Lentil Diversity Panel Origins", line = 0.25, cex = 3)
title(sub = myCaption, line = 0, cex.sub = 0.75, adj = 1)
dev.off()
Genetic Structure Map
# Prep data
myG <- c("G1","G2","G3","G4","G5","G6","G7","G8", "Mix")
xx <- dd %>%
mutate(Lat = ifelse(is.na(Lat), Country_Lat, Lat),
Lon = ifelse(is.na(Lon), Country_Lon, Lon),
Lat = ifelse(duplicated(Lat), jitter(Lat, 1, 1), Lat),
Lon = ifelse(duplicated(Lon), jitter(Lon, 1, 1), Lon),
Size = 1)
# Plot png
png("lentil_diversity_panel_2_04.png", width = 3600, height = 2055, res = 600)
par(mai = c(0.2,0,0.25,0), xaxs = "i", yaxs = "i")
mapBubbles2(dF = xx, nameX = "Lon", nameY = "Lat",
nameZFill = "STR_Group",
fillPalette = alpha(sColors,0.8),
nameZSize = "Size", symbolSize = 0.2,
xlim = c(-140,110), ylim = c(5,20), lwd = 1, lwdSymbols = 0.4,
addColourLegend = F, addLegend = F,
oceanCol = "grey90", landCol = "white", borderCol = "black")
legend(-170, 20, title = "STR Group", legend = myG, col = sColors,
pch = 16, cex = 0.8, pt.cex = 1.5, box.lwd = 2)
title(main = "Lentil Diversity Panel Origins", line = 0.25, cex = 3)
title(sub = myCaption, line = 0, cex.sub = 0.75, adj = 1)
dev.off()
# Plot html
pal <- colorFactor(sColors, domain = myG)
mp <- leaflet() %>%
addProviderTiles(providers$CartoDB.Positron) %>%
addCircles(lng = xx$Lon, lat = xx$Lat, weight = 10,
color = pal(xx$STR_Group), opacity = 1, fillOpacity = 1,
popup = paste(xx$Entry,"|",xx$Name)) %>%
addLegend("bottomleft", pal = pal, values = xx$STR_Group,
title = "STR Group", opacity = 1)
saveWidget(mp, file="lentil_diversity_panel_2_04.html")
Genetic Structure Origin Pies
# Prep data
myLevels <- c("South America", "Central America", "Northern America",
"Western Europe", "Eastern Europe", "Southern Europe",
"Western Asia", "Central Asia",
"Northern Africa", "Eastern Africa", "Southern Asia", "Other")
x1 <- dd %>%
group_by(STR_Group, SubRegion) %>%
summarise(Count = n())
x2 <- dd %>%
group_by(SubRegion) %>%
summarise(Total = n())
xx <- left_join(x1, x2, by = "SubRegion") %>%
mutate(Percent = 100 * Count / Total) %>%
mutate(SubRegion = factor(SubRegion, levels = myLevels))
# Plot
mp <- ggplot(xx, aes(x = "", y = Percent, fill = STR_Group)) +
geom_col(color = "black", alpha = 0.7) +
coord_polar("y", start = 0) +
facet_wrap(. ~ SubRegion + paste("n =", Total), ncol = 6) +
scale_fill_manual(values = sColors) +
theme_agData_pie(legend.position = "bottom") +
guides(fill = guide_legend(nrow = 1)) +
labs(title = "Lentil Diversity Panel Origins", x = NULL,
caption = myCaption)
ggsave("lentil_diversity_panel_2_05.png", mp, width = 12, height = 6)
Genotype PCA By Structure Group
mp <- plot_ly(dd, x = ~myG_PC1, y = ~myG_PC2, z = ~myG_PC3, hoverinfo = "text",
color = ~STR_Group, colors = sColors[c(9,1:8)],
text = ~paste(Name,
"\nOrigin:", Origin,
"\nSource:", Source,
"\nCollDate:", CollDate,
"\nSTR_Group:", STR_Group,
"\nDTF_Cluster:", DTF_Cluster)) %>%
add_markers()
saveWidget(as_widget(mp), "lentil_diversity_panel_2_06.html")
DTF
DTF Cluster Pie Map
# Prep data
xx <- dd %>%
filter(!Origin %in% c("ICARDA","USDA","Unknown")) %>%
group_by(Origin, DTF_Cluster, Country_Lat, Country_Lon) %>%
summarise(Count = n()) %>%
spread(DTF_Cluster, Count) %>%
as.data.frame()
# Plot
png("lentil_diversity_panel_3_01.png", width = 3600, height = 2055, res = 600)
par(mai = c(0.2,0,0.25,0), xaxs = "i", yaxs = "i")
mapPies(dF = xx, nameX = "Country_Lon", nameY = "Country_Lat",
zColours = cColors, nameZs = c("1","2","3","4","5","6","7","8"),
xlim = c(-140,110), ylim = c(5,20), addCatLegend = F, lwd = 1,
oceanCol = "grey90", landCol = "white", borderCol = "black")
legend(-138.5, 13, title = "DTF Cluster", legend = 1:8, col = cColors,
pch = 16, cex = 0.8, pt.cex = 1.5, box.lwd = 2)
title(main = "Lentil Diversity Panel Origins", line = 0.25, cex = 3)
title(sub = myCaption, line = 0, cex.sub = 0.75, adj = 1)
dev.off()
DTF Cluster Map
# Prep data
xx <- dd %>%
mutate(Lat = ifelse(is.na(Lat), Country_Lat, Lat),
Lon = ifelse(is.na(Lon), Country_Lon, Lon),
Lat = ifelse(duplicated(Lat), jitter(Lat, 1, 1), Lat),
Lon = ifelse(duplicated(Lon), jitter(Lon, 1, 1), Lon),
Size = 1)
# Plot png
png("lentil_diversity_panel_3_02.png", width = 3600, height = 2055, res = 600)
par(mai = c(0.2,0,0.25,0), xaxs = "i", yaxs = "i")
mapBubbles2(dF = xx, nameX = "Lon", nameY = "Lat",
nameZFill = "DTF_Cluster",
fillPalette = alpha(cColors,0.8),
nameZSize = "Size", symbolSize = 0.2,
xlim = c(-140,110), ylim = c(5,20), lwd = 1, lwdSymbols = 0.4,
addColourLegend = F, addLegend = F,
oceanCol = "grey90", landCol = "white", borderCol = "black")
legend(-138.5, 13, title = "DTF Cluster", legend = 1:8, col = cColors,
pch = 16, cex = 0.8, pt.cex = 1.5, box.lwd = 2)
title(main = "Lentil Diversity Panel Origins", line = 0.25, cex = 3)
title(sub = myCaption, line = 0, cex.sub = 0.75, adj = 1)
dev.off()
# Plot html
pal <- colorFactor(cColors, domain = 1:8)
mp <- leaflet() %>%
addProviderTiles(providers$CartoDB.Positron) %>%
addCircles(lng = xx$Lon, lat = xx$Lat, weight = 10,
color = pal(xx$DTF_Cluster), opacity = 1, fillOpacity = 1,
popup = paste(xx$Entry,"|",xx$Name)) %>%
addLegend("bottomleft", pal = pal, values = xx$DTF_Cluster,
title = "DTF Cluster", opacity = 1)
saveWidget(mp, file="lentil_diversity_panel_3_02.html")
DTF PCA Clusters
From phenology paper
mp <- plot_ly(dd, x = ~DTF_PC1, y = ~DTF_PC2*2.5, z = ~DTF_PC3*2.5,
color = ~DTF_Cluster, colors = cColors, hoverinfo = "text",
text = ~paste(Name,
"\nOrigin:", Origin,
"\nSource:", Source,
"\nCollDate:", CollDate,
"\nSTR_Group:", STR_Group,
"\nDTF_Cluster:", DTF_Cluster)) %>%
add_markers()
saveWidget(as_widget(mp), "lentil_diversity_panel_3_03.html")
xx <- dd %>%
mutate(DTF_PC1 = scales::rescale(DTF_PC1),
DTF_PC2 = scales::rescale(DTF_PC2),
DTF_PC3 = scales::rescale(DTF_PC3))
mp <- plot_ly(dd, x = ~DTF_PC1, y = ~DTF_PC2, z = ~DTF_PC3,
color = ~STR_Group, colors = sColors, hoverinfo = "text",
text = ~paste(Name,
"\nOrigin:", Origin,
"\nSource:", Source,
"\nCollDate:", CollDate,
"\nSTR_Group:", STR_Group,
"\nDTF_Cluster:", DTF_Cluster)) %>%
add_markers()
saveWidget(as_widget(mp), "lentil_diversity_panel_3_04.html")
DTF Cluster Origin Pies
# Prep data
myLevels <- c("South America", "Central America", "Northern America",
"Western Europe", "Eastern Europe", "Southern Europe",
"Western Asia", "Central Asia",
"Northern Africa", "Eastern Africa", "Southern Asia", "Other")
x1 <- dd %>%
group_by(DTF_Cluster, SubRegion) %>%
summarise(Count = n())
x2 <- dd %>%
group_by(SubRegion) %>%
summarise(Total = n())
xx <- left_join(x1, x2, by = "SubRegion") %>%
mutate(Percent = 100 * Count / Total) %>%
mutate(SubRegion = factor(SubRegion, levels = myLevels))
# Plot
mp <- ggplot(xx, aes(x = "", y = Percent, fill = DTF_Cluster)) +
geom_col(color = "black", alpha = 0.7) +
coord_polar("y", start = 0) +
facet_wrap(. ~ SubRegion + paste("n =", Total), ncol = 6) +
scale_fill_manual(values = cColors) +
theme_agData_pie(legend.position = "bottom") +
guides(fill = guide_legend(nrow = 1)) +
labs(title = "Lentil Diversity Panel Origins", x = NULL,
caption = myCaption)
ggsave("lentil_diversity_panel_3_04.png", width = 12, height = 6)
Genotype PCA By DTF Clusters
From phenology paper
mp <- plot_ly(dd, x = ~myG_PC1, y = ~myG_PC2, z = ~myG_PC3,
color = ~DTF_Cluster, colors = cColors, hoverinfo = "text",
text = ~paste(Name,
"\nOrigin:", Origin,
"\nSource:", Source,
"\nCollDate:", CollDate,
"\nSTR_Group:", STR_Group,
"\nDTF_Cluster:", DTF_Cluster)) %>%
add_markers()
saveWidget(as_widget(mp), "lentil_diversity_panel_3_05.html")
Cotyledon Color
Eurasia Map
# Prep data
myColors <- alpha(c("darkred", "darkgoldenrod2"), 0.7)
xx <- dd %>%
filter(CotyledonColor %in% c("Red", "Yellow"),
Region %in% c("Asia","Europe","Africa")) %>%
mutate(Lat = ifelse(is.na(Lat), Country_Lat, Lat),
Lon = ifelse(is.na(Lon), Country_Lon, Lon),
Lat = ifelse(duplicated(Lat), jitter(Lat, 1, 1), Lat),
Lon = ifelse(duplicated(Lon), jitter(Lon, 1, 1), Lon),
Size = 1)
# Plot png
png("lentil_diversity_panel_4_01.png", width = 3600, height = 2055, res = 600)
par(mai = c(0.2,0,0.25,0), xaxs = "i", yaxs = "i")
mapBubbles2(dF = xx, nameX = "Lon", nameY = "Lat",
nameZFill = "CotyledonColor",
fillPalette = myColors,
nameZSize = "SeedMass1000",
symbolSize = 0.5, lwd = 1, lwdSymbols = 0.5,
addColourLegend = F, addLegend = F,
xlim = c(-25,110), ylim = c(15,35),
oceanCol = "grey90", landCol = "white", borderCol = "black")
legend(55, 3, title = "Cotyledon Color",
legend = c("Red", "Yellow"), col = myColors,
pch = 16, cex = 0.8, pt.cex = 1.5, box.lwd = 2)
title(main = "Lentil Diversity Panel Origins", line = 0.25, cex = 3)
title(sub = myCaption, line = 0, cex.sub = 0.75, adj = 1)
dev.off()
Mass of 1000 Seeds
# Prep data
myColors <- c("darkred", "darkgoldenrod2")
xx <- dd %>% filter(CotyledonColor %in% c("Red", "Yellow"))
# Plot
mp <- ggplot(xx, aes(x = CotyledonColor, y = SeedMass1000,
fill = CotyledonColor, size = SeedMass1000)) +
geom_quasirandom(alpha = 0.7, pch = 21, color = "black") +
scale_fill_manual(values = myColors) +
theme_agData(legend.position = "none") +
labs(title = "Lentil Diversity Panel",
y = "Mass of 1000 Seeds (g)",
x = "Cotyledon Color",
caption = myCaption)
ggsave("lentil_diversity_panel_4_02.png", mp, width = 6, height = 4)
Str Group
# Plot
mp <- ggplot(xx, aes(x = CotyledonColor, y = SeedMass1000,
fill = STR_Group, size = SeedMass1000)) +
geom_quasirandom(alpha = 0.7, pch = 21, color = "black") +
facet_grid(. ~ Region) +
scale_fill_manual(values = sColors) +
guides(size = "none") +
theme_agData() +
labs(caption = myCaption)
ggsave("lentil_diversity_panel_4_03.png", mp, width = 10, height = 4)
DTF Cluster
# Plot
mp <- ggplot(xx, aes(x = CotyledonColor, y = SeedMass1000,
fill = DTF_Cluster, size = SeedMass1000)) +
geom_quasirandom(alpha = 0.7, pch = 21, color = "black") +
facet_grid(. ~ Region) +
scale_fill_manual(values = cColors) +
guides(size = "none") +
theme_agData() +
labs(caption = myCaption)
ggsave("lentil_diversity_panel_4_04.png", mp, width = 10, height = 4)