如何在dplyr中使用bind_rows处理大小不兼容的列表?

icomxhvb  于 2023-05-15  发布在  其他
关注(0)|答案(2)|浏览(191)

我有一个数据如下

  1. $ECe
  2. .type .value .borders .feature
  3. 1 ale -0.866 0.490 ECe
  4. 2 ale -0.811 2.680 ECe
  5. 3 ale -0.749 4.990 ECe
  6. 4 ale -0.501 7.994 ECe
  7. 5 ale -0.472 8.801 ECe
  8. 6 ale -0.364 11.140 ECe
  9. 7 ale -0.351 14.090 ECe
  10. 8 ale -0.172 15.900 ECe
  11. 9 ale -0.068 17.810 ECe
  12. 10 ale 0.069 18.750 ECe
  13. 11 ale 0.132 20.190 ECe
  14. 12 ale 0.176 21.020 ECe
  15. 13 ale 0.227 22.950 ECe
  16. 14 ale 0.295 24.520 ECe
  17. 15 ale 0.458 28.290 ECe
  18. 16 ale 0.534 31.640 ECe
  19. 17 ale 0.265 37.990 ECe
  20. 18 ale 0.330 40.700 ECe
  21. 19 ale 0.793 45.117 ECe
  22. 20 ale 0.393 53.090 ECe
  23. 21 ale 0.752 59.719 ECe
  24. $BD
  25. .type .value .borders .feature
  26. 1 ale 2.88401670 0.957 BD
  27. 2 ale 2.89757908 1.138 BD
  28. 3 ale 2.06229728 1.185 BD
  29. 4 ale 1.86256683 1.220 BD
  30. 5 ale 1.22004089 1.299 BD
  31. 6 ale 0.47244692 1.339 BD
  32. 7 ale 0.28531498 1.401 BD
  33. 8 ale 0.21050138 1.486 BD
  34. 9 ale 0.06942624 1.500 BD
  35. 10 ale -0.01446751 1.524 BD
  36. 11 ale -0.92647637 1.637 BD
  37. 12 ale -0.99773176 1.651 BD
  38. 13 ale -1.62164363 1.704 BD
  39. 14 ale -2.12120182 1.800 BD
  40. 15 ale -1.87179280 1.983 BD
  41. 16 ale -1.64798056 2.075 BD
  42. 17 ale -1.55269957 2.170 BD
  43. 18 ale -1.64049346 2.220 BD

我想创建一个数据框,如

  1. # A tibble: 120 × 2
  2. name Borders
  3. <chr> <dbl>
  4. 1 ECe 0.491
  5. 2 SOC 0.261
  6. 3 BD 0.958
  7. 4 Sand 4.00
  8. 5 Silt 0
  9. 6 Clay 0
  10. 7 ECe 3.61
  11. 8 SOC 0.387
  12. 9 BD 1.02
  13. 10 Sand 8.42
  14. # ℹ 110 more rows

我正在使用以下代码

  1. library(tidyverse)
  2. df %>%
  3. purrr::transpose() %>%
  4. `$`(.borders) %>%
  5. bind_rows() %>%
  6. pivot_longer(everything(), values_to = "Borders")

但它返回以下错误
recycle_columns()中的错误:!Tibble列必须具有兼容的大小。·大小18:列xlmlnlx和xlm 2nlx。·大小20:列xlm 3 nlx和xlm 4 nlx。·大小21:列xlm 5 nlx和xlm 6 nlx。仅回收大小为1的值。
如何在R中实现这一点?以下是dput的数据

  1. df <- list(ECe = structure(list(.type = c("ale", "ale", "ale", "ale",
  2. "ale", "ale", "ale", "ale", "ale", "ale", "ale", "ale", "ale",
  3. "ale", "ale", "ale", "ale", "ale", "ale", "ale", "ale"), .value = c(-0.866449860261058,
  4. -0.811874082709701, -0.749993003099365, -0.501212768536108, -0.47268510237864,
  5. -0.364538974363897, -0.351930853130633, -0.172990179989361, -0.0684651440322241,
  6. 0.0692627161333526, 0.132807737313057, 0.176914094922519, 0.227473041741352,
  7. 0.295586935903242, 0.458768756260148, 0.534728976733407, 0.265760631807008,
  8. 0.330347944699875, 0.793585231260766, 0.393724931630266, 0.752824545868792
  9. ), .borders = c(0.490806, 2.68, 4.99, 7.994, 8.801, 11.14, 14.09,
  10. 15.9, 17.81, 18.75, 20.19, 21.02, 22.95, 24.52, 28.29, 31.64,
  11. 37.99, 40.7, 45.1172, 53.09, 59.7192), .feature = c("ECe", "ECe",
  12. "ECe", "ECe", "ECe", "ECe", "ECe", "ECe", "ECe", "ECe", "ECe",
  13. "ECe", "ECe", "ECe", "ECe", "ECe", "ECe", "ECe", "ECe", "ECe",
  14. "ECe")), row.names = c(NA, -21L), class = "data.frame"), SOC = structure(list(
  15. .type = c("ale", "ale", "ale", "ale", "ale", "ale", "ale",
  16. "ale", "ale", "ale", "ale", "ale", "ale", "ale", "ale", "ale",
  17. "ale", "ale", "ale", "ale", "ale"), .value = c(-1.12668195657973,
  18. -1.14070505975704, -1.12096557264514, -1.0364427676548, -0.905420835797799,
  19. -0.683789433176536, -0.53425868958447, -0.483272349572241,
  20. -0.360467057150275, -0.0571214846376487, 0.0130773857269451,
  21. 0.164166766380452, 0.233741319768938, 0.174784707378661,
  22. 0.188264622491949, 0.150568432447101, 0.532302724503294,
  23. 0.733931793684184, 1.1531117354405, 2.58573209158873, 2.75830864578748
  24. ), .borders = c(0.260869565217391, 0.330143540669856, 0.422727272727273,
  25. 0.545454545454545, 0.631578947368421, 0.686915887850467,
  26. 0.763636363636364, 0.802631578947368, 0.828571428571429,
  27. 0.889952153110048, 0.967289719626168, 1.02272727272727, 1.09090909090909,
  28. 1.23684210526316, 1.40520446096654, 1.52727272727273, 1.80861244019139,
  29. 1.90909090909091, 2.20093457943925, 2.49767441860465, 2.66511627906977
  30. ), .feature = c("SOC", "SOC", "SOC", "SOC", "SOC", "SOC",
  31. "SOC", "SOC", "SOC", "SOC", "SOC", "SOC", "SOC", "SOC", "SOC",
  32. "SOC", "SOC", "SOC", "SOC", "SOC", "SOC")), row.names = c(NA,
  33. -21L), class = "data.frame"), BD = structure(list(.type = c("ale",
  34. "ale", "ale", "ale", "ale", "ale", "ale", "ale", "ale", "ale",
  35. "ale", "ale", "ale", "ale", "ale", "ale", "ale", "ale"), .value = c(2.88401670431712,
  36. 2.89757908472024, 2.06229728227612, 1.8625668296819, 1.22004089065561,
  37. 0.472446924052171, 0.285314983167609, 0.210501378242261, 0.0694262373804251,
  38. -0.0144675088601809, -0.926476372785716, -0.997731763217841,
  39. -1.62164362525624, -2.12120181627754, -1.87179280480865, -1.64798056454827,
  40. -1.5526995652836, -1.64049345720051), .borders = c(0.957710151765353,
  41. 1.13854777070064, 1.18522292993631, 1.22058598726115, 1.29930014940631,
  42. 1.33971974522293, 1.40121097743178, 1.48638829912715, 1.5, 1.52428025477707,
  43. 1.6371974522293, 1.65183612487222, 1.70405095541401, 1.80025477707006,
  44. 1.98361248722183, 2.07583549579303, 2.17044900526854, 2.22039789258473
  45. ), .feature = c("BD", "BD", "BD", "BD", "BD", "BD", "BD", "BD",
  46. "BD", "BD", "BD", "BD", "BD", "BD", "BD", "BD", "BD", "BD")), row.names = c(NA,
  47. -18L), class = "data.frame"), Sand = structure(list(.type = c("ale",
  48. "ale", "ale", "ale", "ale", "ale", "ale", "ale", "ale", "ale",
  49. "ale", "ale", "ale", "ale", "ale", "ale", "ale", "ale", "ale",
  50. "ale"), .value = c(5.72243888922004, 5.04938965197184, 4.7017193997508,
  51. 4.38186986390524, 3.55049136618825, 3.79907192663079, 3.65192607277815,
  52. 2.69221076986002, 2.08417035244566, 0.508134498143654, -0.760157331236183,
  53. -2.22196153094718, -2.60183427497522, -2.6090089814882, -4.29829842975557,
  54. -4.89113681989785, -6.17719615317024, -6.51041335854504, -6.70721878970499,
  55. -6.69985492661679), .borders = c(3.9999999999992, 7.99999999999983,
  56. 12.0000000000005, 20.0000000000003, 23.9999999999995, 27.9999999999987,
  57. 31.9999999999993, 39.9999999999991, 43.9999999999998, 48.0000000000004,
  58. 52.000000000001, 59.9999999999994, 63.9999999999986, 64.0000000000001,
  59. 68.0000000000007, 71.9999999999999, 76.0000000000005, 79.9999999999997,
  60. 84.0000000000003, 88.000000000001), .feature = c("Sand", "Sand",
  61. "Sand", "Sand", "Sand", "Sand", "Sand", "Sand", "Sand", "Sand",
  62. "Sand", "Sand", "Sand", "Sand", "Sand", "Sand", "Sand", "Sand",
  63. "Sand", "Sand")), row.names = c(NA, -20L), class = "data.frame"),
  64. Silt = structure(list(.type = c("ale", "ale", "ale", "ale",
  65. "ale", "ale", "ale", "ale", "ale", "ale", "ale", "ale", "ale",
  66. "ale", "ale", "ale", "ale", "ale", "ale", "ale"), .value = c(-1.81467365524819,
  67. -1.80595765781436, -1.44252832794551, -1.40678289959526,
  68. -1.3809409627197, -1.27631650711468, -0.918535212874314,
  69. -0.891479949841867, -0.130663280250859, 0.054226944600215,
  70. 0.0371390649359506, 0.547567627523539, 0.540716330465325,
  71. 1.14691203242341, 1.45243650519454, 1.51824963792443, 1.76292774269082,
  72. 1.85725359158924, 2.48581029669555, 0.388409658807059), .borders = c(0,
  73. 3.99999999999921, 7.99999999999841, 7.99999999999983, 8.00000000000125,
  74. 11.999999999999, 15.9999999999997, 16.0000000000011, 20.0000000000003,
  75. 23.9999999999995, 24.0000000000009, 27.9999999999987, 28.0000000000001,
  76. 31.9999999999993, 35.9999999999985, 40.0000000000006, 43.9999999999998,
  77. 47.999999999999, 64.0000000000015, 79.9999999999997), .feature = c("Silt",
  78. "Silt", "Silt", "Silt", "Silt", "Silt", "Silt", "Silt", "Silt",
  79. "Silt", "Silt", "Silt", "Silt", "Silt", "Silt", "Silt", "Silt",
  80. "Silt", "Silt", "Silt")), row.names = c(NA, -20L), class = "data.frame"),
  81. Clay = structure(list(.type = c("ale", "ale", "ale", "ale",
  82. "ale", "ale", "ale", "ale", "ale", "ale", "ale", "ale", "ale",
  83. "ale", "ale", "ale", "ale", "ale"), .value = c(-1.02199413478959,
  84. -0.826304780697195, -0.942406575344331, -0.971009582383038,
  85. -1.24981505440423, -1.24219672780758, -0.443954661148336,
  86. -0.344646636267013, -0.344646636267013, 0.0190677799370838,
  87. 0.509523035852588, 0.805292224788913, 0.990611614682741,
  88. 0.998147256094054, 1.16179870265779, 2.06234942853985, 2.8900928986798,
  89. 3.82397972588229), .borders = c(0, 7.99999999999983, 11.999999999999,
  90. 12.0000000000005, 15.9999999999997, 16.0000000000011, 20.0000000000003,
  91. 23.9999999999995, 24.0000000000009, 28.0000000000001, 31.9999999999993,
  92. 35.9999999999999, 39.9999999999991, 40.0000000000006, 47.999999999999,
  93. 51.9999999999996, 56.0000000000002, 67.9999999999993), .feature = c("Clay",
  94. "Clay", "Clay", "Clay", "Clay", "Clay", "Clay", "Clay", "Clay",
  95. "Clay", "Clay", "Clay", "Clay", "Clay", "Clay", "Clay", "Clay",
  96. "Clay")), row.names = c(NA, -18L), class = "data.frame"))
5cnsuln7

5cnsuln71#

UdpateOP请求见备注:

添加.value列:

  1. imap_dfr(df, ~ data.frame(name = .y, Borders = .x$.borders, value = .x$.value))
  2. name Borders value
  3. <chr> <dbl> <dbl>
  4. 1 ECe 0.491 -0.866
  5. 2 ECe 2.68 -0.812
  6. 3 ECe 4.99 -0.750
  7. 4 ECe 7.99 -0.501
  8. 5 ECe 8.80 -0.473
  9. 6 ECe 11.1 -0.365
  10. 7 ECe 14.1 -0.352
  11. 8 ECe 15.9 -0.173
  12. 9 ECe 17.8 -0.0685
  13. 10 ECe 18.8 0.0693
  14. # … with 108 more rows

**第一个答案:**要解决您得到的错误:

1.使用purrr::transpose() %>% $(.borders)可以创建6个不同长度的向量列表。然后尝试用bind_rows将它们按列组合成一个tibble。错误是

  1. Size 18: Columns `BD` and `Clay`.
  2. Size 20: Columns `Sand` and `Silt`.
  3. Size 21: Columns `ECe` and `SOC`.
  4. Only values of size one are recycled.```

要实现你想要的功能,你可以使用purrr::map_df()或者它的变体purrr::imap_dfr()
以下是使用map_df的版本:

  1. library(purrr)
  2. library(dplyr)
  3. map(df, ~(.x %>% select(c(.feature, .borders)))) %>%
  4. map_df(., ~ .x %>% select(.borders), .id = "name")

  1. library(purrr)
  2. library(dplyr)
  3. imap_dfr(df, ~ data.frame(name = .y, Borders = .x$.borders))
  1. name .borders
  2. 1 ECe 0.4908060
  3. 2 ECe 2.6800000
  4. 3 ECe 4.9900000
  5. 4 ECe 7.9940000
  6. 5 ECe 8.8010000
  7. 6 ECe 11.1400000
  8. 7 ECe 14.0900000
  9. 8 ECe 15.9000000
  10. 9 ECe 17.8100000
  11. 10 ECe 18.7500000
  12. 11 ECe 20.1900000
  13. 12 ECe 21.0200000
  14. 13 ECe 22.9500000
  15. 14 ECe 24.5200000
  16. 15 ECe 28.2900000
  17. 16 ECe 31.6400000
  18. 17 ECe 37.9900000
  19. 18 ECe 40.7000000
  20. 19 ECe 45.1172000
  21. 20 ECe 53.0900000
  22. 21 ECe 59.7192000
  23. 22 SOC 0.2608696
  24. 23 SOC 0.3301435
  25. 24 SOC 0.4227273
  26. 25 SOC 0.5454545
  27. 26 SOC 0.6315789
  28. 27 SOC 0.6869159
  29. 28 SOC 0.7636364
  30. 29 SOC 0.8026316
  31. 30 SOC 0.8285714
  32. 31 SOC 0.8899522
  33. 32 SOC 0.9672897
  34. 33 SOC 1.0227273
  35. 34 SOC 1.0909091
  36. 35 SOC 1.2368421
  37. 36 SOC 1.4052045
  38. 37 SOC 1.5272727
  39. 38 SOC 1.8086124
  40. 39 SOC 1.9090909
  41. 40 SOC 2.2009346
  42. 41 SOC 2.4976744
  43. 42 SOC 2.6651163
  44. 43 BD 0.9577102
  45. 44 BD 1.1385478
  46. 45 BD 1.1852229
  47. 46 BD 1.2205860
  48. 47 BD 1.2993001
  49. 48 BD 1.3397197
  50. 49 BD 1.4012110
  51. 50 BD 1.4863883
  52. 51 BD 1.5000000
  53. 52 BD 1.5242803
  54. 53 BD 1.6371975
  55. 54 BD 1.6518361
  56. 55 BD 1.7040510
  57. 56 BD 1.8002548
  58. 57 BD 1.9836125
  59. 58 BD 2.0758355
  60. 59 BD 2.1704490
  61. 60 BD 2.2203979
  62. 61 Sand 4.0000000
  63. 62 Sand 8.0000000
  64. 63 Sand 12.0000000
  65. 64 Sand 20.0000000
  66. 65 Sand 24.0000000
  67. 66 Sand 28.0000000
  68. 67 Sand 32.0000000
  69. 68 Sand 40.0000000
  70. 69 Sand 44.0000000
  71. 70 Sand 48.0000000
  72. 71 Sand 52.0000000
  73. 72 Sand 60.0000000
  74. 73 Sand 64.0000000
  75. 74 Sand 64.0000000
  76. 75 Sand 68.0000000
  77. 76 Sand 72.0000000
  78. 77 Sand 76.0000000
  79. 78 Sand 80.0000000
  80. 79 Sand 84.0000000
  81. 80 Sand 88.0000000
  82. 81 Silt 0.0000000
  83. 82 Silt 4.0000000
  84. 83 Silt 8.0000000
  85. 84 Silt 8.0000000
  86. 85 Silt 8.0000000
  87. 86 Silt 12.0000000
  88. 87 Silt 16.0000000
  89. 88 Silt 16.0000000
  90. 89 Silt 20.0000000
  91. 90 Silt 24.0000000
  92. 91 Silt 24.0000000
  93. 92 Silt 28.0000000
  94. 93 Silt 28.0000000
  95. 94 Silt 32.0000000
  96. 95 Silt 36.0000000
  97. 96 Silt 40.0000000
  98. 97 Silt 44.0000000
  99. 98 Silt 48.0000000
  100. 99 Silt 64.0000000
  101. 100 Silt 80.0000000
  102. 101 Clay 0.0000000
  103. 102 Clay 8.0000000
  104. 103 Clay 12.0000000
  105. 104 Clay 12.0000000
  106. 105 Clay 16.0000000
  107. 106 Clay 16.0000000
  108. 107 Clay 20.0000000
  109. 108 Clay 24.0000000
  110. 109 Clay 24.0000000
  111. 110 Clay 28.0000000
  112. 111 Clay 32.0000000
  113. 112 Clay 36.0000000
  114. 113 Clay 40.0000000
  115. 114 Clay 40.0000000
  116. 115 Clay 48.0000000
  117. 116 Clay 52.0000000
  118. 117 Clay 56.0000000
  119. 118 Clay 68.0000000
展开查看全部
r1wp621o

r1wp621o2#

使用map()list_rbind()

  1. library(tidyverse)
  2. map(df, ~ select(.x, Name = .feature, Borders = .borders, Value = .value)) |>
  3. list_rbind() |>
  4. group_by(Name) |>
  5. mutate(row_order = 1:n()) |>
  6. ungroup() |>
  7. arrange(row_order) |>
  8. select(-row_order)
  1. # A tibble: 118 × 3
  2. Name Borders Value
  3. <chr> <dbl> <dbl>
  4. 1 ECe 0.491 -0.866
  5. 2 SOC 0.261 -1.13
  6. 3 BD 0.958 2.88
  7. 4 Sand 4.00 5.72
  8. 5 Silt 0 -1.81
  9. 6 Clay 0 -1.02
  10. 7 ECe 2.68 -0.812
  11. 8 SOC 0.330 -1.14
  12. 9 BD 1.14 2.90
  13. 10 Sand 8.00 5.05
  14. # … with 108 more rows

如果顺序不重要,您可以直接使用:

  1. map(df, ~ select(.x, Name = .feature, Borders = .borders, Value = .value)) |>
  2. list_rbind()
展开查看全部

相关问题