Changes
On April 12, 2022 at 2:03:01 AM UTC, seanh:
- Added the following fields to ARCTIC INFRASTRUCTURE INVENTORY:
  - Database Level with value Project
  - FIAR with value No
  - Source of Data Policy with value Own
  - Region with value Arctic
  - Opening Degree with value Restricted Open
  - Theme with value Infrastructure
  - Host Institute with value Wilson Center’s Polar Institute
  - Organizer with value Wilson Center’s Polar Institute
f | 1 | { | f | 1 | { |
2 | "author": "", | 2 | "author": "", | ||
3 | "author_email": "", | 3 | "author_email": "", | ||
4 | "creator_user_id": "2e9fa41b-0394-4070-98d0-205f79d5738b", | 4 | "creator_user_id": "2e9fa41b-0394-4070-98d0-205f79d5738b", | ||
5 | "extras": [ | 5 | "extras": [ | ||
6 | { | 6 | { | ||
7 | "key": "Country", | 7 | "key": "Country", | ||
8 | "value": "USA" | 8 | "value": "USA" | ||
9 | }, | 9 | }, | ||
10 | { | 10 | { | ||
11 | "key": "Data Management ", | 11 | "key": "Data Management ", | ||
12 | "value": "\"Data in its raw form may contain errors or be | 12 | "value": "\"Data in its raw form may contain errors or be | ||
13 | incompatible with the structure of AII, so it must be processed before | 13 | incompatible with the structure of AII, so it must be processed before | ||
14 | integration. AII data is processed in 3 interconnected stages: | 14 | integration. AII data is processed in 3 interconnected stages: | ||
15 | cleaning, transformation, and validation. Cleaning and Transformation | 15 | cleaning, transformation, and validation. Cleaning and Transformation | ||
16 | Though they are two distinct stages, cleaning and transformation often | 16 | Though they are two distinct stages, cleaning and transformation often | ||
17 | occur at the same time. Cleaning refers to dealing with erroneous | 17 | occur at the same time. Cleaning refers to dealing with erroneous | ||
18 | records (those that are incomplete, inaccurate, irrelevant, or | 18 | records (those that are incomplete, inaccurate, irrelevant, or | ||
19 | duplicated). Transformation, in contrast, converts raw data into a | 19 | duplicated). Transformation, in contrast, converts raw data into a | ||
20 | desired format. Because AII is ultimately intended for public use, | 20 | desired format. Because AII is ultimately intended for public use, | ||
21 | Wilson Center staff aim to convert raw data into formats more easily | 21 | Wilson Center staff aim to convert raw data into formats more easily | ||
22 | understood by human users. Given that each AII data source contains | 22 | understood by human users. Given that each AII data source contains | ||
23 | unique records and encoding methods, cleaning and transformation was | 23 | unique records and encoding methods, cleaning and transformation was | ||
24 | tailored to each source. Validation Data validation ensures the | 24 | tailored to each source. Validation Data validation ensures the | ||
25 | quality of records that have undergone cleaning and transformation. | 25 | quality of records that have undergone cleaning and transformation. | ||
26 | Whenever possible, AII records were cross-referenced with data from | 26 | Whenever possible, AII records were cross-referenced with data from | ||
27 | multiple sources to confirm their validity.\"" | 27 | multiple sources to confirm their validity.\"" | ||
28 | }, | 28 | }, | ||
29 | { | 29 | { | ||
30 | "key": "Data Policy", | 30 | "key": "Data Policy", | ||
31 | "value": "\"The Wilson Center developed a list of potential data | 31 | "value": "\"The Wilson Center developed a list of potential data | ||
32 | sources and prioritized the inclusion of web pages that maximize the | 32 | sources and prioritized the inclusion of web pages that maximize the | ||
33 | volume, relevance, and accuracy of records. Priority was given to the | 33 | volume, relevance, and accuracy of records. Priority was given to the | ||
34 | datasets of government bodies, independent research organizations, and | 34 | datasets of government bodies, independent research organizations, and | ||
35 | NGOs, due to their role as aggregators of publicly available data and | 35 | NGOs, due to their role as aggregators of publicly available data and | ||
36 | transparency in methods. Additionally, as the owners of public | 36 | transparency in methods. Additionally, as the owners of public | ||
37 | infrastructure, governments can be assumed to have the most | 37 | infrastructure, governments can be assumed to have the most | ||
38 | authoritative dataset on public projects. For the current release of | 38 | authoritative dataset on public projects. For the current release of | ||
39 | AII (December 2020), the largest sources of data were: the United | 39 | AII (December 2020), the largest sources of data were: the United | ||
40 | Nations Code for Trade and Transport Locations the Global Power Plant | 40 | Nations Code for Trade and Transport Locations the Global Power Plant | ||
41 | Database (World Resources Institute) the Arctic Marine and Aviation | 41 | Database (World Resources Institute) the Arctic Marine and Aviation | ||
42 | Transportation Infrastructure Initiative (Arctic Council, under an | 42 | Transportation Infrastructure Initiative (Arctic Council, under an | ||
43 | initiative of the Governments of the United States and Iceland) the | 43 | initiative of the Governments of the United States and Iceland) the | ||
44 | Interagency Electronic Reporting System for Commercial Fishery | 44 | Interagency Electronic Reporting System for Commercial Fishery | ||
45 | Landings (State of Alaska) the Federal Agency of Sea and River | 45 | Landings (State of Alaska) the Federal Agency of Sea and River | ||
46 | Transport (Government of the Russian Federation) Because coverage is | 46 | Transport (Government of the Russian Federation) Because coverage is | ||
47 | currently limited to publicly available data, this list is not | 47 | currently limited to publicly available data, this list is not | ||
48 | exhaustive. When possible, the websites of private owners of | 48 | exhaustive. When possible, the websites of private owners of | ||
49 | infrastructure were also consulted as the most authoritative | 49 | infrastructure were also consulted as the most authoritative | ||
50 | source.\"" | 50 | source.\"" | ||
51 | }, | 51 | }, | ||
52 | { | 52 | { | ||
53 | "key": "Data Sharing Principle", | 53 | "key": "Data Sharing Principle", | ||
54 | "value": "\"Extracting Data Once a data source has been | 54 | "value": "\"Extracting Data Once a data source has been | ||
55 | earmarked for inclusion in AII, its data must be extracted. The method | 55 | earmarked for inclusion in AII, its data must be extracted. The method | ||
56 | chosen for data extraction depends on the format in which a web page | 56 | chosen for data extraction depends on the format in which a web page | ||
57 | stores data. Data used to build AII is stored in a variety of formats, | 57 | stores data. Data used to build AII is stored in a variety of formats, | ||
58 | ranging from .csv and .doc files to raw html. Where files are publicly | 58 | ranging from .csv and .doc files to raw html. Where files are publicly | ||
59 | available, they are downloaded in their raw form for further | 59 | available, they are downloaded in their raw form for further | ||
60 | processing. Where data is stored in html, web scraping is employed. | 60 | processing. Where data is stored in html, web scraping is employed. | ||
61 | Web scraping, a normal part of internet operations, allows users to | 61 | Web scraping, a normal part of internet operations, allows users to | ||
62 | grab the portions of a web page\u2019s html that contain the raw form | 62 | grab the portions of a web page\u2019s html that contain the raw form | ||
63 | of desired data. Web scraping can be performed in multiple coding | 63 | of desired data. Web scraping can be performed in multiple coding | ||
64 | languages, but for the purposes of AII, scraping was performed in | 64 | languages, but for the purposes of AII, scraping was performed in | ||
65 | Python. In accordance with industry standards, all data extraction | 65 | Python. In accordance with industry standards, all data extraction | ||
66 | and web scraping followed hypertext transfer protocol (HTTP) and | 66 | and web scraping followed hypertext transfer protocol (HTTP) and | ||
67 | proceeded with scraping only when issued a status code of 200 by the | 67 | proceeded with scraping only when issued a status code of 200 by the | ||
68 | requested server of the data source. Users also followed the scraping | 68 | requested server of the data source. Users also followed the scraping | ||
69 | protocols outlined by a server\u2019s Robots.txt file, being careful | 69 | protocols outlined by a server\u2019s Robots.txt file, being careful | ||
70 | not to exceed a server\u2019s request limits. There are several | 70 | not to exceed a server\u2019s request limits. There are several | ||
71 | limitations to using the methodology described in this document. It is | 71 | limitations to using the methodology described in this document. It is | ||
72 | unlikely that all data will be captured by this methodology due to the | 72 | unlikely that all data will be captured by this methodology due to the | ||
73 | following factors: not all infrastructure data is publicly available | 73 | following factors: not all infrastructure data is publicly available | ||
74 | search engines may return incomplete data due to deficiencies and | 74 | search engines may return incomplete data due to deficiencies and | ||
75 | biases in algorithms, indices, and/or queries data collected from | 75 | biases in algorithms, indices, and/or queries data collected from | ||
76 | third-parties may be erroneous The Wilson Center will make efforts to | 76 | third-parties may be erroneous The Wilson Center will make efforts to | ||
77 | counter these limitations by: consulting governmental and | 77 | counter these limitations by: consulting governmental and | ||
78 | nongovernmental entities directly to gain access to data that may not | 78 | nongovernmental entities directly to gain access to data that may not | ||
79 | have appeared in search results or public web pages using multiple | 79 | have appeared in search results or public web pages using multiple | ||
80 | data sources to \u201cplug\u201d each other\u2019s gaps cleaning and | 80 | data sources to \u201cplug\u201d each other\u2019s gaps cleaning and | ||
81 | validating third-party data\"" | 81 | validating third-party data\"" | ||
n | n | 82 | }, | ||
83 | { | ||||
84 | "key": "Database Level", | ||||
85 | "value": "Project" | ||||
86 | }, | ||||
87 | { | ||||
88 | "key": "FIAR", | ||||
89 | "value": "No" | ||||
90 | }, | ||||
91 | { | ||||
92 | "key": "Host Institute", | ||||
93 | "value": "Wilson Center\u2019s Polar Institute" | ||||
94 | }, | ||||
95 | { | ||||
96 | "key": "Opening Degree", | ||||
97 | "value": "Restricted Open" | ||||
98 | }, | ||||
99 | { | ||||
100 | "key": "Organizer", | ||||
101 | "value": "Wilson Center\u2019s Polar Institute" | ||||
102 | }, | ||||
103 | { | ||||
104 | "key": "Region", | ||||
105 | "value": "Arctic" | ||||
106 | }, | ||||
107 | { | ||||
108 | "key": "Source of Data Policy", | ||||
109 | "value": "Own" | ||||
110 | }, | ||||
111 | { | ||||
112 | "key": "Theme", | ||||
113 | "value": "Infrastructure" | ||||
82 | } | 114 | } | ||
83 | ], | 115 | ], | ||
84 | "groups": [ | 116 | "groups": [ | ||
85 | { | 117 | { | ||
86 | "description": "Inventory of Database for Earth Three Poles", | 118 | "description": "Inventory of Database for Earth Three Poles", | ||
87 | "display_name": "An Inventory of Database for Earth Three | 119 | "display_name": "An Inventory of Database for Earth Three | ||
88 | Poles", | 120 | Poles", | ||
89 | "id": "543d60c4-2ba5-4474-b3d2-47a5cd109ce8", | 121 | "id": "543d60c4-2ba5-4474-b3d2-47a5cd109ce8", | ||
90 | "image_display_url": | 122 | "image_display_url": | ||
91 | .142.79/uploads/group/2021-05-18-053212.318529inventurydatabase1.jpg", | 123 | .142.79/uploads/group/2021-05-18-053212.318529inventurydatabase1.jpg", | ||
92 | "name": "inventury-of-database-for-earth-three-poles", | 124 | "name": "inventury-of-database-for-earth-three-poles", | ||
93 | "title": "An Inventory of Database for Earth Three Poles" | 125 | "title": "An Inventory of Database for Earth Three Poles" | ||
94 | } | 126 | } | ||
95 | ], | 127 | ], | ||
96 | "id": "2f2eb6a0-6683-4de5-99e9-7311ab55b7d5", | 128 | "id": "2f2eb6a0-6683-4de5-99e9-7311ab55b7d5", | ||
97 | "isopen": false, | 129 | "isopen": false, | ||
98 | "license_id": "", | 130 | "license_id": "", | ||
99 | "license_title": "", | 131 | "license_title": "", | ||
100 | "maintainer": "", | 132 | "maintainer": "", | ||
101 | "maintainer_email": "", | 133 | "maintainer_email": "", | ||
102 | "metadata_created": "2022-04-05T07:50:27.000177", | 134 | "metadata_created": "2022-04-05T07:50:27.000177", | ||
t | 103 | "metadata_modified": "2022-04-10T08:53:19.568331", | t | 135 | "metadata_modified": "2022-04-12T02:03:01.533605", |
104 | "name": "arctic-infrastructure-inventory", | 136 | "name": "arctic-infrastructure-inventory", | ||
105 | "notes": "The Arctic Infrastructure Inventory (AII) | 137 | "notes": "The Arctic Infrastructure Inventory (AII) | ||
106 | tracks\u00a0infrastructure projects in the Arctic. With nearly 8,000 | 138 | tracks\u00a0infrastructure projects in the Arctic. With nearly 8,000 | ||
107 | projects listed, and thousands more that will be added as it grows, | 139 | projects listed, and thousands more that will be added as it grows, | ||
108 | AII\u00a0aims to be a tool and resource for all stakeholders in Arctic | 140 | AII\u00a0aims to be a tool and resource for all stakeholders in Arctic | ||
109 | infrastructure\u2014including policymakers, industry, researchers, | 141 | infrastructure\u2014including policymakers, industry, researchers, | ||
110 | community leaders, and more.\u00a0\r\n", | 142 | community leaders, and more.\u00a0\r\n", | ||
111 | "num_resources": 1, | 143 | "num_resources": 1, | ||
112 | "num_tags": 0, | 144 | "num_tags": 0, | ||
113 | "organization": { | 145 | "organization": { | ||
114 | "approval_status": "approved", | 146 | "approval_status": "approved", | ||
115 | "created": "2020-04-30T11:11:08.802657", | 147 | "created": "2020-04-30T11:11:08.802657", | ||
116 | "description": "Aerospace Information Research Institute (AIR) | 148 | "description": "Aerospace Information Research Institute (AIR) | ||
117 | under the Chinese Academy of Sciences (CAS) was established in July | 149 | under the Chinese Academy of Sciences (CAS) was established in July | ||
118 | 2017, following the approval for consolidation of three CAS | 150 | 2017, following the approval for consolidation of three CAS | ||
119 | institutes: the Institute of Electronics (IECAS), the Institute of | 151 | institutes: the Institute of Electronics (IECAS), the Institute of | ||
120 | Remote Sensing and Digital Earth (RADI), and the Academy of | 152 | Remote Sensing and Digital Earth (RADI), and the Academy of | ||
121 | Opto-Electronics (AOE) at CAS President Board Meeting. The merger is | 153 | Opto-Electronics (AOE) at CAS President Board Meeting. The merger is | ||
122 | the outcome of CAS efforts towards reformation of its R&D system to | 154 | the outcome of CAS efforts towards reformation of its R&D system to | ||
123 | meet future R&D challenges and to better meet the national demands.", | 155 | meet future R&D challenges and to better meet the national demands.", | ||
124 | "id": "c25dce84-97be-4153-8b90-d38f9ab73e5f", | 156 | "id": "c25dce84-97be-4153-8b90-d38f9ab73e5f", | ||
125 | "image_url": "2021-05-18-080509.992585AIRlogo.png", | 157 | "image_url": "2021-05-18-080509.992585AIRlogo.png", | ||
126 | "is_organization": true, | 158 | "is_organization": true, | ||
127 | "name": "air", | 159 | "name": "air", | ||
128 | "state": "active", | 160 | "state": "active", | ||
129 | "title": "Aerospace Information Research Institute, CAS", | 161 | "title": "Aerospace Information Research Institute, CAS", | ||
130 | "type": "organization" | 162 | "type": "organization" | ||
131 | }, | 163 | }, | ||
132 | "owner_org": "c25dce84-97be-4153-8b90-d38f9ab73e5f", | 164 | "owner_org": "c25dce84-97be-4153-8b90-d38f9ab73e5f", | ||
133 | "private": false, | 165 | "private": false, | ||
134 | "relationships_as_object": [], | 166 | "relationships_as_object": [], | ||
135 | "relationships_as_subject": [], | 167 | "relationships_as_subject": [], | ||
136 | "resources": [ | 168 | "resources": [ | ||
137 | { | 169 | { | ||
138 | "cache_last_updated": null, | 170 | "cache_last_updated": null, | ||
139 | "cache_url": null, | 171 | "cache_url": null, | ||
140 | "created": "2022-04-05T07:52:00.484037", | 172 | "created": "2022-04-05T07:52:00.484037", | ||
141 | "datastore_active": false, | 173 | "datastore_active": false, | ||
142 | "description": "The Arctic Infrastructure Inventory (AII) | 174 | "description": "The Arctic Infrastructure Inventory (AII) | ||
143 | tracks\u00a0infrastructure projects in the Arctic. With nearly 8,000 | 175 | tracks\u00a0infrastructure projects in the Arctic. With nearly 8,000 | ||
144 | projects listed, and thousands more that will be added as it grows, | 176 | projects listed, and thousands more that will be added as it grows, | ||
145 | AII\u00a0aims to be a tool and resource for all stakeholders in Arctic | 177 | AII\u00a0aims to be a tool and resource for all stakeholders in Arctic | ||
146 | infrastructure\u2014including policymakers, industry, researchers, | 178 | infrastructure\u2014including policymakers, industry, researchers, | ||
147 | community leaders, and more.\u00a0\r\n", | 179 | community leaders, and more.\u00a0\r\n", | ||
148 | "format": "", | 180 | "format": "", | ||
149 | "hash": "", | 181 | "hash": "", | ||
150 | "id": "647cd873-0a16-46ae-82b0-447ff00df001", | 182 | "id": "647cd873-0a16-46ae-82b0-447ff00df001", | ||
151 | "last_modified": null, | 183 | "last_modified": null, | ||
152 | "metadata_modified": "2022-04-05T07:52:00.721424", | 184 | "metadata_modified": "2022-04-05T07:52:00.721424", | ||
153 | "mimetype": null, | 185 | "mimetype": null, | ||
154 | "mimetype_inner": null, | 186 | "mimetype_inner": null, | ||
155 | "name": "ARCTIC INFRASTRUCTURE INVENTORY", | 187 | "name": "ARCTIC INFRASTRUCTURE INVENTORY", | ||
156 | "package_id": "2f2eb6a0-6683-4de5-99e9-7311ab55b7d5", | 188 | "package_id": "2f2eb6a0-6683-4de5-99e9-7311ab55b7d5", | ||
157 | "position": 0, | 189 | "position": 0, | ||
158 | "resource_type": null, | 190 | "resource_type": null, | ||
159 | "size": null, | 191 | "size": null, | ||
160 | "state": "active", | 192 | "state": "active", | ||
161 | "url": "https://arcticinfrastructure.wilsoncenter.org/", | 193 | "url": "https://arcticinfrastructure.wilsoncenter.org/", | ||
162 | "url_type": null | 194 | "url_type": null | ||
163 | } | 195 | } | ||
164 | ], | 196 | ], | ||
165 | "state": "active", | 197 | "state": "active", | ||
166 | "tags": [], | 198 | "tags": [], | ||
167 | "title": "ARCTIC INFRASTRUCTURE INVENTORY", | 199 | "title": "ARCTIC INFRASTRUCTURE INVENTORY", | ||
168 | "type": "dataset", | 200 | "type": "dataset", | ||
169 | "url": "https://arcticinfrastructure.wilsoncenter.org/", | 201 | "url": "https://arcticinfrastructure.wilsoncenter.org/", | ||
170 | "version": "" | 202 | "version": "" | ||
171 | } | 203 | } |