126 lines
5.1 KiB
Matlab
126 lines
5.1 KiB
Matlab
function asosstations = readASOS(filename, startRow, endRow)
%READASOS Import a fixed-width ASOS station listing as a table.
%   ASOSSTATIONS = READASOS(FILENAME) reads text file FILENAME from row 3
%   through the end of the file.
%
%   ASOSSTATIONS = READASOS(FILENAME, STARTROW) reads from row STARTROW
%   through the end of the file.
%
%   ASOSSTATIONS = READASOS(FILENAME, STARTROW, ENDROW) reads rows STARTROW
%   through ENDROW. STARTROW and ENDROW may be vectors; each
%   (STARTROW(k), ENDROW(k)) pair selects one block of rows and the blocks
%   are concatenated in order. ENDROW must have at least as many elements
%   as STARTROW.
%
%   The returned table has these variables, in this order:
%     NCDCID, WBAN, COOPID        double (NaN where the text is not numeric)
%     CALL, LOCATION, ALT_NAME    string
%     COUNTRY, ST, COUNTY         categorical
%     LAT, LON                    double
%     ELEV                        categorical
%     UTC                         double
%     STNTYPEBEGDT                string
%     GHCND                       double
%     VarName16                   categorical
%
%   Errors:
%     readASOS:rowRangeMismatch   ENDROW has fewer elements than STARTROW.
%     readASOS:cannotOpenFile     FILENAME could not be opened for reading.
%
%   Example:
%      asosstations = readASOS('asos-stations.txt', 3, 920);
%
%   See also TEXTSCAN, ONCLEANUP.

% Derived from code auto-generated by MATLAB on 2019/11/25 13:24:05

%% Initialize variables.
% Each default is applied independently so that a lone STARTROW is honored
% instead of being overwritten when ENDROW is omitted.
if nargin < 2 || isempty(startRow)
    startRow = 3;
end
if nargin < 3 || isempty(endRow)
    endRow = inf;
end
% Validate before touching the file so a bad row range cannot leave an
% open file handle behind.
if numel(endRow) < numel(startRow)
    error('readASOS:rowRangeMismatch', ...
        'ENDROW must supply an end row for every element of STARTROW.');
end

%% Column layout.
% Fixed-width field specification: 16 text fields plus a trailing
% "rest of line" field that is read but not used.
formatSpec = '%9s%5s%7s%6s%31s%31s%21s%2s%32s%10s%11s%7s%6s%59s%12s%s%[^\n\r]';
numericColumns = [1,2,3,10,11,13,15];
stringColumns = [4,5,6,7,8,9,12,14,16];

%% Open the text file.
[fileID, openMessage] = fopen(filename, 'r');
if fileID == -1
    error('readASOS:cannotOpenFile', 'Unable to open "%s" for reading: %s', ...
        char(filename), openMessage);
end
% Guarantees fclose runs even if textscan throws ('ReturnOnError' is false).
closeGuard = onCleanup(@() fclose(fileID));

%% Read columns of data as text.
% This call is based on the structure of the file used to generate this
% code. If an error occurs for a different file, try regenerating the code
% from the Import Tool.
scanOptions = {'Delimiter', '', 'WhiteSpace', '', 'TextType', 'string', ...
    'ReturnOnError', false, 'EndOfLine', '\r\n'};
dataArray = textscan(fileID, formatSpec, endRow(1)-startRow(1)+1, ...
    scanOptions{:}, 'HeaderLines', startRow(1)-1);
for block = 2:numel(startRow)
    % Every block is addressed by absolute row number, so restart from the
    % top of the file each time.
    frewind(fileID);
    blockData = textscan(fileID, formatSpec, endRow(block)-startRow(block)+1, ...
        scanOptions{:}, 'HeaderLines', startRow(block)-1);
    for col = 1:length(dataArray)
        dataArray{col} = [dataArray{col}; blockData{col}];
    end
end

%% Close the text file.
clear closeGuard

%% Remove white space around selected text columns.
for col = [4,5,6,14]
    dataArray{col} = strtrim(dataArray{col});
end

%% Convert the contents of columns containing numeric text to numbers.
% Cells that cannot be interpreted as a single number stay NaN.
rowCount = size(dataArray{1}, 1);

% Splits a field into a non-numeric prefix, the numeric text, and a suffix.
numberPattern = '(?<prefix>.*?)(?<numbers>([-]*(\d+[\,]*)+[\.]{0,1}\d*[eEdD]{0,1}[-+]*\d*[i]{0,1})|([-]*(\d+[\,]*)*[\.]{1,1}\d+[eEdD]{0,1}[-+]*\d*[i]{0,1}))(?<suffix>.*)';
% Commas are accepted only as thousands separators.
thousandsPattern = '^[-/+]*\d+?(\,\d{3})*\.{0,1}\d*$';

numericData = NaN(rowCount, numel(numericColumns));
for k = 1:numel(numericColumns)
    columnText = dataArray{numericColumns(k)};
    for row = 1:size(columnText, 1)
        try
            match = regexp(columnText(row), numberPattern, 'names');
            if isempty(match)
                continue  % no numeric text in this field
            end
            numberText = match.numbers;

            % Reject commas in non-thousands positions.
            if contains(numberText, ',') && ...
                    isempty(regexp(numberText, thousandsPattern, 'once'))
                continue
            end

            % Convert numeric text to a number; accept only a single value.
            parsed = textscan(char(strrep(numberText, ',', '')), '%f');
            if isscalar(parsed{1})
                numericData(row, k) = parsed{1};
            end
        catch
            % Best effort: any conversion failure leaves the cell as NaN.
        end
    end
end

%% Collect the text columns.
% Rows missing from a short column are left as "".
textData = strings(rowCount, numel(stringColumns));
for k = 1:numel(stringColumns)
    columnText = dataArray{stringColumns(k)};
    textData(1:numel(columnText), k) = columnText;
end

%% Make sure any text containing <undefined> is properly converted to an <undefined> categorical
% Indices refer to columns of textData that become categorical variables
% (COUNTRY, ST, COUNTY, ELEV, VarName16).
for catIdx = [4,5,6,7,9]
    isUndefined = (textData(:, catIdx) == "<undefined>");
    textData(isUndefined, catIdx) = "";
end

%% Create output variable
asosstations = table;
asosstations.NCDCID = numericData(:, 1);
asosstations.WBAN = numericData(:, 2);
asosstations.COOPID = numericData(:, 3);
asosstations.CALL = textData(:, 1);
asosstations.LOCATION = textData(:, 2);
asosstations.ALT_NAME = textData(:, 3);
asosstations.COUNTRY = categorical(textData(:, 4));
asosstations.ST = categorical(textData(:, 5));
asosstations.COUNTY = categorical(textData(:, 6));
asosstations.LAT = numericData(:, 4);
asosstations.LON = numericData(:, 5);
% NOTE(review): ELEV is kept as categorical text to preserve the existing
% output type; confirm whether callers would prefer a numeric column.
asosstations.ELEV = categorical(textData(:, 7));
asosstations.UTC = numericData(:, 6);
asosstations.STNTYPEBEGDT = textData(:, 8);
asosstations.GHCND = numericData(:, 7);
asosstations.VarName16 = categorical(textData(:, 9));