Don't remove duplicate rows from ARRL scraper.
Something is going on here: the numbers change, but the date on the page doesn't.
This commit is contained in:
		@@ -40,11 +40,11 @@ write.table(tab, file = "out/arrl-fcc-licenses-scraped.csv", sep = ",",
 | 
			
		||||
            na = "") 
 | 
			
		||||
 | 
			
		||||
# Clean up table to remove any duplicates (sometimes the page isn't updated regularly)
 | 
			
		||||
db <- read.csv("out/arrl-fcc-licenses-scraped.csv")
 | 
			
		||||
db2 <- db %>% distinct(.keep_all = TRUE) %>% 
 | 
			
		||||
        filter(Date != "Date")
 | 
			
		||||
write.csv(db2, "out/arrl-fcc-licenses-scraped.csv",
 | 
			
		||||
          quote = F,
 | 
			
		||||
          row.names = F,
 | 
			
		||||
          na = "")
 | 
			
		||||
# db <- read.csv("out/arrl-fcc-licenses-scraped.csv")
 | 
			
		||||
# db2 <- db %>% distinct(.keep_all = TRUE) %>% 
 | 
			
		||||
#         filter(Date != "Date")
 | 
			
		||||
# write.csv(db2, "out/arrl-fcc-licenses-scraped.csv",
 | 
			
		||||
#           quote = F,
 | 
			
		||||
#           row.names = F,
 | 
			
		||||
#           na = "")
 | 
			
		||||
 | 
			
		||||
 
 | 
			
		||||
		Reference in New Issue
	
	Block a user