# data-known-name-variations.R
# Known country-name variations.
#
# `variations` is a named list. Each element name is a country name and each
# element is an unnamed character vector of alternative spellings,
# abbreviations, or historical names for that country.
#
# NOTE(review): presumably consumed by code that checks every variation
# resolves to the list name it is filed under -- confirm against the caller.
#
# Every vector is deliberately built WITHOUT element names so that all entries
# have the same shape (a plain character vector) and nothing unexpected shows
# up in `names()` / `unlist()` output.
variations <- list(
  # NOTE(review): the Aland entry below was already disabled in the original;
  # presumably because of the accented-character limitation mentioned under
  # "Congo - Kinshasa" -- confirm before re-enabling.
  # "Åland Islands" = c(
  #   "Aland Islands",
  #   "aland islands",
  #   "Åland Islands",
  #   "åland islands"
  # ),
  "Suriname" = c(
    "Dutch Guyana",
    "Dutch Guiana"
  ),
  "French Guiana" = c(
    "French Guiana",
    "French Guyana"
  ),
  "Guyana" = c(
    "British Guiana",
    "British Guyana"
  ),
  "Congo - Brazzaville" = c(
    "republic of congo",
    "republic of the congo",
    "congo, republic of the",
    "congo, republic",
    "congo, rep.",
    "congo-brazzaville",
    "french congo"
  ),
  "Congo - Kinshasa" = c(
    "democratic republic of the congo",
    "congo, democratic republic of the",
    "dem rep of the congo",
    "the democratic republic of congo",
    "congo, dem. rep.",
    "dr congo",
    "drc",
    "droc",
    "rdc",
    "congo-kinshasa",
    "congo-zaire",
    "zaire",
    "belgian congo",
    "congo free state",
    "D.R. Congo",
    "DR Congo",
    "Democratic Republic of Congo"
    # Accented regexes do not work on Windows. They are not officially
    # supported anyway, so the following variants stay disabled:
    # "republic of the congo-léopoldville",
    # "rép. démocratique du congo",
  ),
  "China" = c(
    "People's Republic of China",
    "China, People's Republic",
    "China"
  ),
  "Hong Kong SAR China" = c(
    "Hong Kong, China",
    "Hong Kong"
  ),
  "Macao SAR China" = c(
    "Macau, China",
    "Macao, China",
    "Macau",
    "Macao"
  ),
  # Plain unnamed vector, like every other entry (the original tagged each
  # element with a stray `x =` name).
  "Taiwan" = c(
    "Republic of China",
    "Taiwan, Province of China",
    "Taiwan"
  ),
  "Ireland" = c(
    "Republic of Ireland",
    "Ireland"
  ),
  "Martinique" = c(
    "France, Martinique",
    "Martinique, France"
  ),
  "North Korea" = c(
    "Democratic People's Republic of Korea",
    "DPRK",
    "Korea, Dem. Rep.",
    "DPR Korea",
    "D.P.R. Korea",
    "D.P.R Korea",
    "Korea DPR",
    "Korea D.P.R.",
    "Korea, DPR",
    "Korea, D.P.R.",
    "Korea, North",
    "Korea North",
    "Korea, Democratic People's Republic",
    "Korea (the Democratic People's Republic of)",
    "North Korea"
  ),
  "North Macedonia" = c(
    "fyrom"
  ),
  "South Africa" = c(
    "South Africa",
    "South-Africa"
  ),
  "South Korea" = c(
    "Korea, Republic of",
    "Korea, Rep. of",
    "Korea, South",
    "Korea South",
    "Republic of Korea",
    "Rep. of Korea",
    "South Korea"
  ),
  "Turkey" = c(
    "Turkey",
    "Türkiye"
  ),
  "United Arab Emirates" = c(
    "emirates",
    "united arab em.",
    "uae",
    "u.a.e."
  ),
  "United Kingdom" = c(
    "u.k.",
    "United Kingdom",
    "The United Kingdom",
    "United Kingdom of Great Britain",
    "United Kingdom of Great Britain and Northern Ireland"
  ),
  "United States" = c(
    "u.s.",
    "U.S.A.",
    "United States",
    "USA"
  ),
  "United States Minor Outlying Islands (the)" = c(
    "United States Minor Outlying Islands",
    "US Minor Outlying Islands",
    "U.S. Minor Outlying Islands",
    "Minor Outlying Islands US",
    "Minor Outlying Islands U.S.",
    "Minor Outlying Islands, US",
    "Minor Outlying Islands, U.S."
  ),
  "U.S. Virgin Islands" = c(
    "United States Virgin Islands",
    "US Virgin Islands",
    "U.S. Virgin Islands",
    "Virgin Islands, US",
    "Virgin Islands, U.S.",
    "Virgin Islands, (U.S.)",
    "Virgin Islands, (US)",
    "Virgin Islands US",
    "Virgin Islands U.S.",
    "Virgin Islands (U.S.)",
    "Virgin Islands (US)"
  ),
  "Yemen" = c(
    "yemen",
    "republic of yemen"
  ),
  "Yemen Arab Republic" = c(
    "yemen arab republic",
    "north yemen",
    "yemen (sana'a)"
  ),
  "Yemen People's Republic" = c(
    "yemen people's republic",
    "people's democratic republic of yemen",
    "south yemen",
    "democratic yemen",
    "yemen (aden)"
  )
)