这些是我的数据集的前50行:
structure(list(price_used = c("comtrade_price_mult", NA, NA,
"comtrade_price_mult", "comtrade_price_mult", "comtrade_price_mult",
"comtrade_price_mult", "comtrade_price_mult", "comtrade_price_mult",
"comtrade_price_mult", "comtrade_price_mult", "comtrade_price_mult",
"comtrade_price_mult", "comtrade_price_mult", "comtrade_price_mult",
"comtrade_price_mult", "comtrade_price_mult", "comtrade_price_mult",
"comtrade_price_mult", "comtrade_price_mult", "comtrade_price_mult",
"comtrade_price_mult", "comtrade_price_mult", "comtrade_price_mult",
"comtrade_price_mult", "comtrade_price_mult", "comtrade_price_mult",
"comtrade_price_mult", "comtrade_price_mult", "comtrade_price_mult",
NA, "comtrade_price_mult", "comtrade_price_mult", NA, "comtrade_price_mult",
NA, "comtrade_price_mult", "comtrade_price_mult", "comtrade_price_mult",
NA, "comtrade_price_mult", "comtrade_price_mult", "comtrade_price_mult",
NA, "comtrade_price_mult", NA, "comtrade_price_mult", "comtrade_price_mult",
"comtrade_price_mult", NA), year = c(2003, 2013, 2014, 2005,
2005, 2005, 2005, 2006, 2006, 2006, 2006, 2007, 2007, 2007, 2007,
2008, 2008, 2009, 2009, 2010, 2010, 2011, 2011, 2012, 2012, 2012,
2012, 1994, 1995, 1996, 1996, 1996, 1997, 1997, 1997, 1998, 1998,
1998, 1999, 1999, 1999, 2004, 2004, 2004, 2005, 2005, 2005, 2006,
2006, 2006), country = c("cameroon", "cape verde", "cape verde",
"cote d'ivoire", "cote d'ivoire", "cote d'ivoire", "cote d'ivoire",
"cote d'ivoire", "cote d'ivoire", "cote d'ivoire", "cote d'ivoire",
"cote d'ivoire", "cote d'ivoire", "cote d'ivoire", "cote d'ivoire",
"cote d'ivoire", "cote d'ivoire", "cote d'ivoire", "cote d'ivoire",
"cote d'ivoire", "cote d'ivoire", "cote d'ivoire", "cote d'ivoire",
"cote d'ivoire", "cote d'ivoire", "cote d'ivoire", "cote d'ivoire",
"egypt", "egypt", "egypt", "egypt", "egypt", "egypt", "egypt",
"egypt", "egypt", "egypt", "egypt", "egypt", "egypt", "egypt",
"egypt", "egypt", "egypt", "egypt", "egypt", "egypt", "egypt",
"egypt", "egypt"), standardmeasure = c("42-gallon barrels per day",
"", "", "thousand 42-gallon barrels", "thousand 42-gallon barrels",
"thousand 42-gallon barrels", "thousand 42-gallon barrels", "thousand 42-gallon barrels",
"thousand 42-gallon barrels", "thousand 42-gallon barrels", "thousand 42-gallon barrels",
"thousand 42-gallon barrels", "thousand 42-gallon barrels", "thousand 42-gallon barrels",
"thousand 42-gallon barrels", "thousand 42-gallon barrels", "thousand 42-gallon barrels",
"thousand 42-gallon barrels", "thousand 42-gallon barrels", "thousand 42-gallon barrels",
"thousand 42-gallon barrels", "thousand 42-gallon barrels", "thousand 42-gallon barrels",
"thousand 42-gallon barrels", "thousand 42-gallon barrels", "thousand 42-gallon barrels",
"thousand 42-gallon barrels", "million 42-gallon barrels", "million 42-gallon barrels",
"million 42-gallon barrels", "million cubic meters", "million 42-gallon barrels",
"million 42-gallon barrels", "million cubic meters", "million 42-gallon barrels",
"million cubic meters", "million 42-gallon barrels", "million 42-gallon barrels",
"million 42-gallon barrels", "million cubic meters", "million 42-gallon barrels",
"million 42-gallon barrels", "million 42-gallon barrels", "million cubic meters",
"million 42-gallon barrels", "million cubic meters", "million 42-gallon barrels",
"million 42-gallon barrels", "million 42-gallon barrels", "million cubic meters"
), annuallocationcapacity = c(5250, NA, NA, 1000, 1000, 17520,
6700, 1000, 17520, 6700, 1000, 1000, 6700, 17520, 1000, 17520,
6700, 6700, 17520, 6700, 17520, 6700, 17520, 6700, NA, NA, 17520,
42, 42, 15, 3800, 27, 20, 5000, 12, 3800, 15, 27, 27, 3800, 15,
27, 15, 3800, 15, 3800, 27, 27, 15, 3800), minetype = c("extraction site",
"mine", "mine", "extraction site", "extraction site", "extraction site",
"extraction site", "extraction site", "extraction site", "extraction site",
"extraction site", "extraction site", "extraction site", "extraction site",
"extraction site", "extraction site", "extraction site", "extraction site",
"extraction site", "extraction site", "extraction site", "extraction site",
"extraction site", "extraction site", "extraction site", "extraction site",
"extraction site", "extraction site", "extraction site", "extraction site",
"extraction site", "extraction site", "extraction site", "extraction site",
"extraction site", "extraction site", "extraction site", "extraction site",
"extraction site", "extraction site", "extraction site", "extraction site",
"extraction site", "extraction site", "extraction site", "extraction site",
"extraction site", "extraction site", "extraction site", "extraction site"
), mineownership = c("industrial", "artisanal", "artisanal",
"industrial", "industrial", "industrial", "industrial", "industrial",
"industrial", "industrial", "industrial", "industrial", "industrial",
"industrial", "industrial", "industrial", "industrial", "industrial",
"industrial", "industrial", "industrial", "industrial", "industrial",
"industrial", "industrial", "industrial", "industrial", "government",
"government", "government", "government", "government", "government",
"government", "government", "government", "government", "government",
"industrial", "government", "industrial", "government", "government",
"government", "government", "government", "government", "government",
"government", "government"), locationname = c("moudi field",
"salinas de porto ingles, maio", "salinas de porto ingles, maio",
"panther oilfield", "lion oilfield", "baobab oilfield", "east espoir oilfield",
"panther oilfield", "baobab oilfield", "east espoir oilfield",
"lion oilfield", "lion oilfield", "east espoir oilfield", "baobab oilfield",
"panther oilfield", "baobab oilfield", "east espoir oilfield",
"east espoir oilfield", "baobab oilfield", "east espoir oilfield",
"baobab oilfield", "east espoir oilfield", "baobab oilfield",
"east espoir oilfield", "block cl-401", "block cl-103", "baobab oilfield",
"el morgan, suez gulf", "el morgan, suez gulf", "ras budran, suez gulf",
"abu madi", "el morgan, suez gulf", "el morgan, suez gulf", "abu madi",
"ras budran, suez gulf", "abu madi", "ras budran, suez gulf",
"el morgan, suez gulf", "el morgan, suez gulf", "abu madi", "ras budran, suez gulf",
"el morgan, suez gulf", "ras budran, suez gulf", "abu madi",
"ras budran, suez gulf", "abu madi", "el morgan, suez gulf",
"el morgan, suez gulf", "ras budran, suez gulf", "abu madi"),
admin1 = c("", "maio", "maio", "gulf of guinea", "gulf of guinea",
"gulf of guinea", "gulf of guinea", "gulf of guinea", "gulf of guinea",
"gulf of guinea", "gulf of guinea", "gulf of guinea", "gulf of guinea",
"gulf of guinea", "gulf of guinea", "gulf of guinea", "gulf of guinea",
"gulf of guinea", "gulf of guinea", "gulf of guinea", "gulf of guinea",
"gulf of guinea", "gulf of guinea", "gulf of guinea", "gulf of guinea",
"gulf of guinea", "gulf of guinea", "south sinai", "south sinai",
"south sinai", "matruh", "south sinai", "south sinai", "matruh",
"south sinai", "matruh", "south sinai", "south sinai", "south sinai",
"matruh", "south sinai", "south sinai", "south sinai", "matruh",
"south sinai", "matruh", "south sinai", "south sinai", "south sinai",
"matruh"), admin2 = c("", "porto ingles", "porto ingles",
"", "", "", "", "", "", "", "", "", "", "", "", "", "", "",
"", "", "", "", "", "", "", "", "", "", "", "", "", "", "",
"", "", "", "", "", "", "", "", "", "", "", "", "", "", "",
"", ""), world_val_withmc = c(64626612, NA, NA, 58750496,
58750496, 1029308672, 393628320, 68633024, 1202450560, 459841248,
68633024, 73954616, 495495904, 1295684864, 73954616, 1733089280,
662768192, 418824960, 1095196032, 529573184, 1384794368,
682766400, 1785383168, 676864192, NA, NA, 1769949312, 915343488,
969826176, 404228960, NA, 727612096, 497491968, NA, 298495168,
NA, 251538608, 452769472, 616853568, NA, 342696416, 1157142272,
642856832, NA, 881257408, NA, 1586263424, 1853091584, 1029495296,
NA), lootable = c(0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0), orig_deflator = c(NA,
105.639106949701, 107.374395983726, NA, NA, NA, NA, NA, NA,
NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,
NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,
NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA), resource = c("oil",
"salt", "salt", "oil", "oil", "oil", "oil", "oil", "oil",
"oil", "oil", "oil", "oil", "oil", "oil", "oil", "oil", "oil",
"oil", "oil", "oil", "oil", "oil", "oil", "oil", "oil", "oil",
"oil", "oil", "oil", "natural gas", "oil", "oil", "natural gas",
"oil", "natural gas", "oil", "oil", "oil", "natural gas",
"oil", "oil", "oil", "natural gas", "oil", "natural gas",
"oil", "oil", "oil", "natural gas"), exp_annual_value_location1 = c(76133440,
NA, NA, 62305808, 62305808, 1091597824, 417448928, 66877492,
1171693696, 448079200, 66877492, 76446016, 512188320, 1339334144,
76446016, 1643753728, 628604480, 418313280, 1093857920, 529067712,
1383472512, 717797248, 1876986112, 748939840, NA, NA, 1958421888,
877859392, 847055424, 365471232, NA, 657848192, 426205312,
NA, 255723200, NA, 168767872, 303782144, 536430400, NA, 298016896,
912430656, 506905920, NA, 593088704, NA, 1067559680, 1312398336,
729110144, NA), offshore = c(1, 0, 0, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1), NAME_0 = c("Cameroon", "Cabo Verde", "Cabo Verde",
"Côte d'Ivoire", "Côte d'Ivoire", "Côte d'Ivoire", "Côte d'Ivoire",
"Côte d'Ivoire", "Côte d'Ivoire", "Côte d'Ivoire", "Côte d'Ivoire",
"Côte d'Ivoire", "Côte d'Ivoire", "Côte d'Ivoire", "Côte d'Ivoire",
"Côte d'Ivoire", "Côte d'Ivoire", "Côte d'Ivoire", "Côte d'Ivoire",
"Côte d'Ivoire", "Côte d'Ivoire", "Côte d'Ivoire", "Côte d'Ivoire",
"Côte d'Ivoire", "Côte d'Ivoire", "Côte d'Ivoire", "Côte d'Ivoire",
"Egypt", "Egypt", "Egypt", "Egypt", "Egypt", "Egypt", "Egypt",
"Egypt", "Egypt", "Egypt", "Egypt", "Egypt", "Egypt", "Egypt",
"Egypt", "Egypt", "Egypt", "Egypt", "Egypt", "Egypt", "Egypt",
"Egypt", "Egypt"), NAME_1 = c("Sud-Ouest", "Maio", "Maio",
"Lagunes", "Lagunes", "Lagunes", "Lagunes", "Lagunes", "Lagunes",
"Lagunes", "Lagunes", "Lagunes", "Lagunes", "Lagunes", "Lagunes",
"Lagunes", "Lagunes", "Lagunes", "Lagunes", "Lagunes", "Lagunes",
"Lagunes", "Lagunes", "Lagunes", "Comoe", "Abidjan", "Lagunes",
"Janub Sina", "Janub Sina", "Janub Sina", "Al Iskandariyah",
"Janub Sina", "Janub Sina", "Al Iskandariyah", "Janub Sina",
"Al Iskandariyah", "Janub Sina", "Janub Sina", "Janub Sina",
"Al Iskandariyah", "Janub Sina", "Janub Sina", "Janub Sina",
"Al Iskandariyah", "Janub Sina", "Al Iskandariyah", "Janub Sina",
"Janub Sina", "Janub Sina", "Al Iskandariyah"), comtrade_price_mult = c(14501.607421875,
NA, NA, 62305.80859375, 62305.80859375, 62305.80859375, 62305.80859375,
66877.4921875, 66877.4921875, 66877.4921875, 66877.4921875,
76446.015625, 76446.015625, 76446.015625, 76446.015625, 93821.5625,
93821.5625, 62434.81640625, 62434.81640625, 78965.328125,
78965.328125, 107133.9140625, 107133.9140625, 111782.0703125,
111782.0703125, 111782.0703125, 111782.0703125, 20901414,
20167986, 24364748, NA, 24364748, 21310266, NA, 21310266,
NA, 11251191, 11251191, 19867792, NA, 19867792, 33793728,
33793728, NA, 39539248, NA, 39539248, 48607344, 48607344,
NA), wb_price_mult = c(12309.830078125, NA, NA, 58750.49609375,
58750.49609375, 58750.49609375, 58750.49609375, 68633.0234375,
68633.0234375, 68633.0234375, 68633.0234375, 73954.6171875,
73954.6171875, 73954.6171875, 73954.6171875, 98920.625, 98920.625,
62511.19140625, 62511.19140625, 79040.7734375, 79040.7734375,
101905.4296875, 101905.4296875, 101024.5078125, 101024.5078125,
101024.5078125, 101024.5078125, 21793892, 23091100, 26948596,
NA, 26948596, 24874598, NA, 24874598, NA, 16769240, 16769240,
22846428, NA, 22846428, 42857120, 42857120, NA, 58750496,
NA, 58750496, 68633024, 68633024, NA), usgs_price_mult = c(NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_), multicolour_price_mult = c(NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_
), comtrade_unit = c("kilograms", "", "", "kilograms", "kilograms",
"kilograms", "kilograms", "kilograms", "kilograms", "kilograms",
"kilograms", "kilograms", "kilograms", "kilograms", "kilograms",
"kilograms", "kilograms", "kilograms", "kilograms", "kilograms",
"kilograms", "kilograms", "kilograms", "kilograms", "kilograms",
"kilograms", "kilograms", "kilograms", "kilograms", "kilograms",
"", "kilograms", "kilograms", "", "kilograms", "", "kilograms",
"kilograms", "kilograms", "", "kilograms", "kilograms", "kilograms",
"", "kilograms", "", "kilograms", "kilograms", "kilograms",
""), wb_unit = c("42-gallon barrels", "", "", "42-gallon barrels",
"42-gallon barrels", "42-gallon barrels", "42-gallon barrels",
"42-gallon barrels", "42-gallon barrels", "42-gallon barrels",
"42-gallon barrels", "42-gallon barrels", "42-gallon barrels",
"42-gallon barrels", "42-gallon barrels", "42-gallon barrels",
"42-gallon barrels", "42-gallon barrels", "42-gallon barrels",
"42-gallon barrels", "42-gallon barrels", "42-gallon barrels",
"42-gallon barrels", "42-gallon barrels", "42-gallon barrels",
"42-gallon barrels", "42-gallon barrels", "42-gallon barrels",
"42-gallon barrels", "42-gallon barrels", "", "42-gallon barrels",
"42-gallon barrels", "", "42-gallon barrels", "", "42-gallon barrels",
"42-gallon barrels", "42-gallon barrels", "", "42-gallon barrels",
"42-gallon barrels", "42-gallon barrels", "", "42-gallon barrels",
"", "42-gallon barrels", "42-gallon barrels", "42-gallon barrels",
""), usgs_unit = c("", "metric tons", "metric tons", "",
"", "", "", "", "", "", "", "", "", "", "", "", "", "", "",
"", "", "", "", "", "", "", "", "", "", "", "", "", "", "",
"", "", "", "", "", "", "", "", "", "", "", "", "", "", "",
""), multicolour_unit = c("", "", "", "", "", "", "", "",
"", "", "", "", "", "", "", "", "", "", "", "", "", "", "",
"", "", "", "", "", "", "", "", "", "", "", "", "", "", "",
"", "", "", "", "", "", "", "", "", "", "", ""), comtrade_price = c(0.288748025894165,
NA, NA, 0.461126893758774, 0.461126893758774, 0.461126893758774,
0.461126893758774, 0.494962066411972, 0.494962066411972,
0.494962066411972, 0.494962066411972, 0.565778911113739,
0.565778911113739, 0.565778911113739, 0.565778911113739,
0.694375813007355, 0.694375813007355, 0.462081670761108,
0.462081670761108, 0.584424436092377, 0.584424436092377,
0.792900860309601, 0.792900860309601, 0.827301979064941,
0.827301979064941, 0.827301979064941, 0.827301979064941,
0.150046527385712, 0.144781410694122, 0.174909025430679,
NA, 0.174909025430679, 0.152981579303741, NA, 0.152981579303741,
NA, 0.0807697549462318, 0.0807697549462318, 0.142626389861107,
NA, 0.142626389861107, 0.242597535252571, 0.242597535252571,
NA, 0.283843338489532, NA, 0.283843338489532, 0.348941147327423,
0.348941147327423, NA), wb_price = c(33.7255630927967, NA,
NA, 58.7504956668303, 58.7504956668303, 58.7504956668303,
58.7504956668303, 68.6330215319166, 68.6330215319166, 68.6330215319166,
68.6330215319166, 73.954614038387, 73.954614038387, 73.954614038387,
73.954614038387, 98.9206215110437, 98.9206215110437, 62.5111900128862,
62.5111900128862, 79.0407717847173, 79.0407717847173, 101.905430027248,
101.905430027248, 101.024504690732, 101.024504690732, 101.024504690732,
101.024504690732, 21.7938920399316, 23.0910996292376, 26.9485969327739,
NA, 26.9485969327739, 24.8745986032634, NA, 24.8745986032634,
NA, 16.7692401486971, 16.7692401486971, 22.8464274960424,
NA, 22.8464274960424, 42.8571212084921, 42.8571212084921,
NA, 58.7504956668303, NA, 58.7504956668303, 68.6330215319166,
68.6330215319166, NA), usgs_price = c(NA, 45.5323791503906,
44.8896598815918, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,
NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,
NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA,
NA, NA, NA, NA, NA, NA, NA), multicolour_price = c(NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_), comtrade_value = c(76133440, NA, NA, 62305808,
62305808, 1091597824, 417448928, 66877496, 1171693696, 448079232,
66877496, 76446016, 512188288, 1339334144, 76446016, 1643753856,
628604480, 418313248, 1093857920, 529067712, 1383472512,
717797248, 1876986240, 748939840, NA, NA, 1958421888, 877859392,
847055424, 365471232, NA, 657848192, 426205312, NA, 255723184,
NA, 168767856, 303782144, 536430400, NA, 298016896, 912430656,
506905920, NA, 593088768, NA, 1067559744, 1312398336, 729110208,
NA), wb_value = c(64626612, NA, NA, 58750496, 58750496, 1029308672,
393628320, 68633024, 1202450560, 459841248, 68633024, 73954616,
495495904, 1295684864, 73954616, 1733089280, 662768192, 418824960,
1095196032, 529573184, 1384794368, 682766400, 1785383168,
676864192, NA, NA, 1769949312, 915343488, 969826176, 404228960,
NA, 727612096, 497491968, NA, 298495168, NA, 251538608, 452769472,
616853568, NA, 342696416, 1157142272, 642856832, NA, 881257408,
NA, 1586263424, 1853091584, 1029495296, NA), usgs_value = c(NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_), multicolour_value = c(NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_, NA_real_,
NA_real_, NA_real_, NA_real_, NA_real_, NA_real_), yearvalue = c(76133438.9648438,
NA, NA, 62305808.59375, 62305808.59375, 1091597766.5625,
417448917.578125, 66877492.1875, 1171693663.125, 448079197.65625,
66877492.1875, 76446015.625, 512188304.6875, 1339334193.75,
76446015.625, 1643753775, 628604468.75, 418313269.921875,
1093857983.4375, 529067698.4375, 1383472548.75, 717797224.21875,
1876986174.375, 748939871.09375, NA, NA, 1958421871.875,
877859388, 847055412, 365471220, NA, 657848196, 426205320,
NA, 255723192, NA, 168767865, 303782157, 536430384, NA, 298016880,
912430656, 506905920, NA, 593088720, NA, 1067559696, 1312398288,
729110160, NA), price_mult = c(14501.607421875, NA, NA, 62305.80859375,
62305.80859375, 62305.80859375, 62305.80859375, 66877.4921875,
66877.4921875, 66877.4921875, 66877.4921875, 76446.015625,
76446.015625, 76446.015625, 76446.015625, 93821.5625, 93821.5625,
62434.81640625, 62434.81640625, 78965.328125, 78965.328125,
107133.9140625, 107133.9140625, 111782.0703125, 111782.0703125,
111782.0703125, 111782.0703125, 20901414, 20167986, 24364748,
NA, 24364748, 21310266, NA, 21310266, NA, 11251191, 11251191,
19867792, NA, 19867792, 33793728, 33793728, NA, 39539248,
NA, 39539248, 48607344, 48607344, NA), oil_gas = c(1, 0,
0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1), gold = c(0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0), artisanal = c(0, 1, 1, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0)), row.names = c(NA, 50L), class = "data.frame")
我想知道对于NAME_0, year, standardmeasure, resource
的每个唯一组合,变量comtrade_price_mult, wb_price_mult, usgs_price_mult
和multicolour_price_mult
有多少个不同的值。
结果应该看起来像:
year NAME_0 standardmeasure resource n_comtrade n_wb n_usgs n_multicolour
2004 Ghana kilogram gold 3 1 1 NA
2005 Namibia metric tons diamonds 2 1 NA 1
带NA表示只有NA值。
可能通过使用管道将n_distinct()和group_by()组合在一起?
使用group_by
,summarise
,…你可以这样做:
注意:如果只有NA
值,我使用if
来返回NA
。还请注意,如果不想计算NAs,则必须将na.rm = TRUE
添加到n_distinct
。
library(dplyr)
df |>
group_by(year, NAME_0, standardmeasure, resource) |>
summarise(across(c(comtrade_price_mult, wb_price_mult, usgs_price_mult, multicolour_price_mult), ~ if (all(is.na(.x))) NA_integer_ else n_distinct(.x)), .groups = "drop") |>
rename_with(~ gsub("^(.*?)_price_mult$", "n_\1", .x), .cols = ends_with("price_mult"))
#> # A tibble: 27 × 8
#> year NAME_0 standardmeasure resource n_comtrade n_wb n_usgs n_multicolour
#> <dbl> <chr> <chr> <chr> <int> <int> <int> <int>
#> 1 1994 Egypt million 42-gallo… oil 1 1 NA NA
#> 2 1995 Egypt million 42-gallo… oil 1 1 NA NA
#> 3 1996 Egypt million 42-gallo… oil 1 1 NA NA
#> 4 1996 Egypt million cubic me… natural… NA NA NA NA
#> 5 1997 Egypt million 42-gallo… oil 1 1 NA NA
#> 6 1997 Egypt million cubic me… natural… NA NA NA NA
#> 7 1998 Egypt million 42-gallo… oil 1 1 NA NA
#> 8 1998 Egypt million cubic me… natural… NA NA NA NA
#> 9 1999 Egypt million 42-gallo… oil 1 1 NA NA
#> 10 1999 Egypt million cubic me… natural… NA NA NA NA
#> # … with 17 more rows