forked from uataq/co2usa_data_synthesis
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathco2usa_load_netCDF_script.m
185 lines (155 loc) · 7.2 KB
/
co2usa_load_netCDF_script.m
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
% Load the CO2-USA Data Synthesis files from netCDF
%
% USAGE:
%
% The CO2-USA synthesis data is available to download from the ORNL DAAC:
% https://doi.org/10.3334/ORNLDAAC/1743
%
% To download the data, first sign into your account (or create one if you don't have one).
% Next, click on "Download Data" to download the entire data set in a zip file.
% Extract the netCDF files to a folder on your computer.
%
% The CO2-USA synthesis data files should be all saved in a single directory:
% /synthesis_output/[netCDF_files.nc]
%
% For example, for the CO2 data file for Boston it would be:
% /synthesis_output/boston_all_sites_co2_1_hour_R0_2019-07-09.nc
%
% In the code below, choose the cities you want to extract, the species, and if you want to save plots.
% After running the script, the CO2_USA greenhouse gas data will all be contained within the
% 'co2_usa' variable.
%
% For more information, visit the CO2-USA GitHub repository:
% https://github.com/loganemitchell/co2usa_data_synthesis
%
% Written by Logan Mitchell ([email protected])
% University of Utah
% Last updated: 2019-10-30
%clear all
%close all
% set(0,'DefaultFigureWindowStyle','docked')
t_overall = tic;
if ~exist('cities','var')
cities = {
%'boston'
%'indianapolis'
%'los_angeles'
%'northeast_corridor'
%'portland'
'salt_lake_city'
%'san_francisco_baaqmd'
%'san_francisco_beacon'
%'toronto'
};
end
if ~exist('species_to_load','var')
species_to_load = {
'co2'
'ch4'
%'co'
};
end
if ~exist('readFolder','var')
currentFolder = pwd;
readFolder = fullfile(currentFolder(1:regexp(currentFolder,'gcloud.utah.edu')+14),'data','co2-usa','synthesis_output','netCDF_formatted_files');
end
% Do you want to save the summary figures?
plt.save_overview_image = 'n'; % options: 'y' or 'n'
for species_index = 1:length(species_to_load)
species = species_to_load{species_index};
fprintf('Loading the %s city data...\n',species)
for ii = 1:size(cities,1)
city = cities{ii,1};
t_city = tic;
fprintf('------Working on %s: ------\n',city)
%all_files = dir(fullfile(readFolder,city,'netCDF_formatted_files',[city,'*',species,'_','*.nc']));
all_files = dir(fullfile(readFolder,[city,'*',species,'_','*.nc']));
if isempty(all_files); fprintf('\n*** Data files for %s were not found! Check the path name and try again.***\nTime elapsed: %4.0f seconds.\n',city,toc(t_city)); continue; end % Skip it if the file doesn't exist.
for fni = 1:length(all_files)
fn = all_files(fni);
fprintf('Working on %s.\n',fn.name)
%ncdisp(fullfile(fn.folder,fn.name))
info = ncinfo(fullfile(fn.folder,fn.name));
fn_parts = strsplit(fn.name,{'_','.'});
site_code = fn.name(length(city)+2:regexp(fn.name,'_1_hour')-1);
% Loading Attributes:
for jj = 1:length(info.Attributes)
attribute_name = info.Attributes(jj).Name;
if strcmp(attribute_name(1),'_'); attribute_name = attribute_name(2:end); end
co2_usa.(city).(site_code).global_attributes.(attribute_name) = info.Attributes(jj).Value;
end
% Loading Variables
for var = 1:length(info.Variables)
variable_name = info.Variables(var).Name;
for jj = 1:length(info.Variables(var).Attributes)
attribute_name = info.Variables(var).Attributes(jj).Name;
% names can't start with an underscore
if strcmp(attribute_name(1),'_'); attribute_name = attribute_name(2:end); end
co2_usa.(city).(site_code).attributes.(variable_name).(attribute_name) = info.Variables(var).Attributes(jj).Value;
end
co2_usa.(city).(site_code).(variable_name) = ncread(fullfile(fn.folder,fn.name),[info.Name,info.Variables(var).Name]);
if strcmp('time',variable_name)
co2_usa.(city).(site_code).(variable_name) = datetime(co2_usa.(city).(site_code).(variable_name),'ConvertFrom','posixtime');
end
end
end
%co2_usa.(city).site_codes = fieldnames(co2_usa.(city)); co2_usa.(city).site_codes = co2_usa.(city).site_codes(~strcmp(co2_usa.(city).site_codes,'site_codes'));
clear info
fprintf('Done. Time elapsed: %4.0f seconds.\n',toc(t_city))
end
fprintf('Done loading city %s data. Overall time elapsed: %4.0f seconds.\n',species,toc(t_overall))
% city = 'indianapolis';
% %site = 'SITE02_co2_136M';
% %site = 'SITE10_co2_40M';
% site = 'SITE09_co2_130M';
%
% foo = co2_usa.(city).(site).time(cursor_info.DataIndex)
% days(duration(foo-datetime(year(foo),1,1)))
% If there are duplicate times, this finds the index of the duplicate times:
%[ia,ib,ic] = unique(co2_usa.(city).(site).time);
%id = setdiff(ic,ib);
%% Plot of the city data:
clear('t1','t2')
for ii = 1:size(cities,1)
%%
city = cities{ii,1}; %if ~isfield(co2_usa,city); continue; end
site_codes = fieldnames(co2_usa.(city)); site_codes = site_codes(contains(site_codes,[species,'_']));
%if isempty(site_codes); continue; end
% Uppercase city name:
city_long_name = replace(city,'_',' '); city_long_name([1,regexp(city_long_name,' ')+1]) = upper(city_long_name([1,regexp(city_long_name,' ')+1]));
fx(ii+species_index*100) = figure(ii+species_index*100); fx(ii+species_index*100).Color = [1 1 1]; clf; hold on
title([city_long_name,' ',upper(species),' - All sites'],'FontSize',35,'FontWeight','Bold')
for jj = 1:length(site_codes)
site = site_codes{jj,1};
if ~isempty(regexp(site,'background','once'))
plot(co2_usa.(city).(site).time,co2_usa.(city).(site).(species),'k-','LineWidth',2)
else
plot(co2_usa.(city).(site).time,co2_usa.(city).(site).(species))
end
end
units_label_abbr = '';
units_label = co2_usa.(city).(site_codes{1}).attributes.(species).units;
if strcmp(units_label,'nanomol mol-1'); units_label_abbr = 'ppb'; end
if strcmp(units_label,'micromol mol-1'); units_label_abbr = 'ppm'; end
ylabel([upper(species),' (',units_label_abbr,')'],'FontWeight','Bold')
%ylim([350,750])
hold off; grid on;
legend(replace(site_codes,'_',' '),'Location','NorthWest')
xl = get(gca,'XLabel'); xlFontSize = get(xl,'FontSize'); xAX = get(gca,'XAxis'); yl = get(gca,'YLabel'); ylFontSize = get(yl,'FontSize'); yAX = get(gca,'YAxis');
xAX.FontSize = 25; yAX.FontSize = 25; yl.FontSize = 30; yl.FontWeight = 'Bold';
% Plot of 2 years of data:
%t1 = datetime(2014,1,1); % SLC, Boston, Indy
%t1 = datetime(2015,1,1); % LA
%t1 = datetime(2010,1,1); % Portland
%t2 = t1+calyears(2);
%ax = gca; ax.XLim = [t1,t2]; ax.XTick = t1:calmonths(6):t2; datetick('x','yyyy-mm','keepticks')
% Plot all of the data:
%ax = gca; t1 = ax.XLim(1); t2 = ax.XLim(2); datetick('x','yyyy')
if strcmp(plt.save_overview_image,'y')
writeFolder = fullfile(currentFolder(1:regexp(currentFolder,'gcloud.utah.edu')+14),'data','co2-usa','synthesis_output');
export_fig(fullfile(writeFolder,city,[city,'_img_all_sites_',species,'.jpg']),'-r300','-p0.01',fx(ii+species_index*100))
% export_fig(fullfile(readFolder,city,[city,'_img_all_sites_',species,'_',[datestr(t1,'yyyymmdd'),'-',datestr(t2,'yyyymmdd')],'.jpg']),'-r300','-p0.01',fx(ii))
end
%%
end % end of cities loop
end % end of species_to_load