rbind 添加一个包含日期值的行
rbind adding a row with a date value in it
我正在尝试向该数据框添加新行,我可以使用 rbind() 添加数据,但日期被替换为 NA 我哪里出错了?
library(httr)
library(dplyr)
library(ggplot2)
library(gghighlight)
library(zoo)
library(lubridate)
GET("https://opendata.ecdc.europa.eu/covid19/casedistribution/csv", authenticate(":", ":", type="ntlm"), write_disk(tf <- tempfile(fileext = ".csv")))
data <- read.csv(tf)
lab_notes <- paste0("Data as provided by European Centre for Disease Prevention and Control", "and Engineering (JHU CSSE) and obtained daily.")
#data.today<- c(NaN,06,06,2020,0,357,"United_Kingdom", "UK", "GBR",0,"Europe")
#data <- rbind(data, data.today)
#data$dateRep[c(21548)] <- as.factor(c("06/06/2020"))
#data$dateRep[is.na(data$dateRep)] <- as.factor("06/06/2020")
data$geoId <- as.character(data$geoId)
data$dateRep <- as.character(data$dateRep)
data$dateRep <- as.Date(data$dateRep, "%d/%m/%Y")
#data$dateRep[c(21548)] <- today() + days(1)
# Countries you are interested in plotting
geo_ids <- c("UK")
# selecting data after peak, April the 8th
data.uk <- subset(data, geoId == "UK") %>% arrange(dateRep) ```
问题是您的数据列不是日期格式,而是内部为整数的 factor
,这种解释为日期会导致问题。要在读取数据时获得 character
列而不是 factor
,请在 read.csv
中设置 stringsAsFactors = FALSE
。然后你可以将 dateRep
转换为日期格式并添加一行。我将额外的行格式化为 data.frame,因此您已经拥有正确的列类型。
library(httr)
library(lubridate)
GET("https://opendata.ecdc.europa.eu/covid19/casedistribution/csv", authenticate(":", ":", type="ntlm"), write_disk(tf <- tempfile(fileext = ".csv")))
data <- read.csv(tf, stringsAsFactors = FALSE)
data$dateRep <- as.Date(data$dateRep, format = "%d/%m/%Y")
data.today<- data.frame(today(),06,06,2020,0,357,"United_Kingdom", "UK", "GBR",0,"Europe")
colnames(data.today) <- colnames(data)
rbind(data[1, ], data.today)
dateRep day month year cases deaths countriesAndTerritories geoId countryterritoryCode popData2018 continentExp
1 2020-06-05 5 6 2020 787 6 Afghanistan AF AFG 37172386 Asia
2 2020-06-05 6 6 2020 0 357 United_Kingdom UK GBR 0 Europe
我正在尝试向该数据框添加新行,我可以使用 rbind() 添加数据,但日期被替换为 NA 我哪里出错了?
library(httr)
library(dplyr)
library(ggplot2)
library(gghighlight)
library(zoo)
library(lubridate)
GET("https://opendata.ecdc.europa.eu/covid19/casedistribution/csv", authenticate(":", ":", type="ntlm"), write_disk(tf <- tempfile(fileext = ".csv")))
data <- read.csv(tf)
lab_notes <- paste0("Data as provided by European Centre for Disease Prevention and Control", "and Engineering (JHU CSSE) and obtained daily.")
#data.today<- c(NaN,06,06,2020,0,357,"United_Kingdom", "UK", "GBR",0,"Europe")
#data <- rbind(data, data.today)
#data$dateRep[c(21548)] <- as.factor(c("06/06/2020"))
#data$dateRep[is.na(data$dateRep)] <- as.factor("06/06/2020")
data$geoId <- as.character(data$geoId)
data$dateRep <- as.character(data$dateRep)
data$dateRep <- as.Date(data$dateRep, "%d/%m/%Y")
#data$dateRep[c(21548)] <- today() + days(1)
# Countries you are interested in plotting
geo_ids <- c("UK")
# selecting data after peak, April the 8th
data.uk <- subset(data, geoId == "UK") %>% arrange(dateRep) ```
问题是您的数据列不是日期格式,而是内部为整数的 factor
,这种解释为日期会导致问题。要在读取数据时获得 character
列而不是 factor
,请在 read.csv
中设置 stringsAsFactors = FALSE
。然后你可以将 dateRep
转换为日期格式并添加一行。我将额外的行格式化为 data.frame,因此您已经拥有正确的列类型。
library(httr)
library(lubridate)
GET("https://opendata.ecdc.europa.eu/covid19/casedistribution/csv", authenticate(":", ":", type="ntlm"), write_disk(tf <- tempfile(fileext = ".csv")))
data <- read.csv(tf, stringsAsFactors = FALSE)
data$dateRep <- as.Date(data$dateRep, format = "%d/%m/%Y")
data.today<- data.frame(today(),06,06,2020,0,357,"United_Kingdom", "UK", "GBR",0,"Europe")
colnames(data.today) <- colnames(data)
rbind(data[1, ], data.today)
dateRep day month year cases deaths countriesAndTerritories geoId countryterritoryCode popData2018 continentExp
1 2020-06-05 5 6 2020 787 6 Afghanistan AF AFG 37172386 Asia
2 2020-06-05 6 6 2020 0 357 United_Kingdom UK GBR 0 Europe