0

我正在为 R 中的一个特定的 for 循环而苦苦挣扎。我有一个包含 52 行和大约 30 列的数据框。我正在编写 for 循环以从每一行中提取数据(或值)并将它们插入到长文本中 --- 在本例中为 javascript/geojson 代码。目前,length() 不接受我放入其中的任何参数。

我是 R 新手,所以很多代码可能是多余的。

下面的代码:

# start of 'for loop' 
for(row in 1:nrow(intro_df)) { # trying to iterate through each row of the df
  lines <- vector(length()) # trying to deal with getting an error for "replacement has length zero" 
  # start of long text (notice placeholders in sprintf) --- javascript/geojson to be used in VS code later
  lines[row] <- sprintf(" 
{
            \"type\": \"Feature\",
            \"properties\": {
                \"huc8\": %s,
                \"Year\": %i,
                \"Total Water Use\": %f,
                \"Aquaculture\": %f,
                \"Commercial\": %f,
                \"Self-Supplied Domestic\": %f,
                \"Hydroelectric Power\": %f,
                \"Self-Supplied Industrial\": %f,
                \"Irrigation\": %f,
                \"Livestock\": %f,
                \"Mining\": %f,
                \"Public Supply\": %f,
                \"Thermoelectric\": %f,
                \"Total Groundwater\": %f,
                \"Total Surface Water\": %f
            },
            \"geometry\": {
                \"type\": \"Point\",
                \"coordinates\": [%f, %f]
            }
        }, \n", 
  intro_df$huc8[row], # column names where data/values from intro_df should be inserted into sprintf
  intro_df$Year[row], 
  intro_df$Total_WaterUse[row], 
  intro_df$Aquaculture[row], 
  intro_df$Commercial[row], 
  intro_df$Domestic[row], 
  intro_df$Hydroelectric_power[row], 
  intro_df$Industrial[row], 
  intro_df$Irrigation[row], 
  intro_df$Livestock[row], 
  intro_df$Mining[row], 
  intro_df$Public_Supply[row], 
  intro_df$Thermoelectric[row], 
  intro_df$Total_Groundwater[row], 
  intro_df$Total_Surface_Water[row], 
  intro_df$lat[row], 
  intro_df$long[row])

}
all_lines <- paste(lines, collapse = "\n") # store lines to variable all_lines

file_js_points <- file("js_points.txt") # write all_lines to a text file 
writeLines(all_lines, file_js_points)
close(file_js_points)

编辑我更正了我的代码以摆脱'for循环'。以下是最终为我工作的代码:

# Input data from each row of intro_df into placeholders in sprintf()
lines <- sprintf(" 
{ 
            \"type\": \"Feature\",
            \"properties\": {
                \"huc8\": %s, 
                \"Year\": %s,
                \"Total Water Use\": %s,
                \"Aquaculture\": %s,
                \"Commercial\": %s, 
                \"Self-Supplied Domestic\": %s,
                \"Hydroelectric Power\": %s,
                \"Self-Supplied Industrial\": %s,
                \"Irrigation\": %s, 
                \"Livestock\": %s, 
                \"Mining\": %s, 
                \"Public Supply\": %s, 
                \"Thermoelectric\": %s, 
                \"Total Groundwater\": %s, 
                \"Total Surface Water\": %s 
            }, 
            \"geometry\": { 
                \"type\": \"Point\", 
                \"coordinates\": [%s, %s] 
            } 
        }, \n", 
                      intro_df$huc8, # column names where data/values from intro_df should be inserted into sprintf
                      intro_df$Year, 
                      intro_df$Total_WaterUse, 
                      intro_df$Aquaculture, 
                      intro_df$Commercial, 
                      intro_df$Domestic, 
                      intro_df$Hydroelectric_power, 
                      intro_df$Industrial, 
                      intro_df$Irrigation, 
                      intro_df$Livestock, 
                      intro_df$Mining, 
                      intro_df$Public_Supply, 
                      intro_df$Thermoelectric, 
                      intro_df$Total_Groundwater, 
                      intro_df$Total_Surface_Water, 
                      intro_df$lat, 
                      intro_df$long)

# Collapse all rows into one variable separated by new line 
js_points <- paste(lines, collapse = "\n") 

# Create js_point text file for all js_points
sink(file = "js_points.txt")
cat(js_points)
sink()
4

1 回答 1

1

问题是您lines在每次循环迭代开始时都将其重置为空。您应该在循环之前初始化它(最好是正确的长度,而不是 0 长度) 。你需要使用参数 length =而不是函数length()。(我也使用character它,所以它是正确的矢量类型。)

lines = character(length = nrow(intro_df))
for(row in 1:nrow(intro_df)) { 
  lines[row] <- ...
}

但是,sprintf是矢量化的,因此您根本不需要for循环。我with()用来避免多次输入数据框名称。

lines <- with(intro_df, sprintf("
  {...

  }",
  huc8,
  Year,
  Total_WaterUse, ...
))

all_lines <- paste(lines, collapse = "\n") # store lines to variable all_lines

file_js_points <- file("js_points.txt") # write all_lines to a text file 
writeLines(all_lines, file_js_points)
close(file_js_points)
于 2020-04-14T19:15:35.180 回答