-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathGCNET_ArgosMain_16032020.py
299 lines (276 loc) · 16.1 KB
/
GCNET_ArgosMain_16032020.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
#!/usr/bin/python
import numpy as np
import os
import datetime
import warnings
def WriteCFile(fid,DatasetN):
if len(DatasetN)!=0:
formstr = '%i,%4i,%.4f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f,%.2f'
try:
np.savetxt(fid,DatasetN,fmt=formstr)
print "Successfully saved "+str(len(DatasetN[:,1]))+" entries to file: "+str(fid.name)
except:
print "Error writing CSV: WriteCFile in ArgosMain"
else:
np.savetxt(fid,DatasetN)
print "Successfully wrote empty CSV to file: "+str(fid.name)
#check for reset bool in reset file
try:
f = open("ARGOSRESET.txt","r")
flagval = f.read()
flag = int(flagval)
if flag==1:
newloadflag = 1
else:
newloadflag = 0
except IOError:
newloadflag = 1
#load temp file
try:
ftemp = open("argostemp.dat","r")
with warnings.catch_warnings():
warnings.simplefilter("ignore") #ignores warnings about lines with incorrect columns (some columns are corrupt and missing values)
tempraw = np.genfromtxt(ftemp,missing_values=("*******","******","*****","****","***","**","*"),filling_values=999,invalid_raise=False)
gmat=np.array(tempraw)
except:
print "Error Loading argostemp.txt, check fortran exe or timing"
#define limits for filtering for all stations
swmax = 1300 #W/m2 the full strength of the sun
swmin = 0
hmpmin = -40 #this is the measurement range of the HMP temp sensor
hmpmax = 50 #this is hottest hopefully ever
tcmax = 50
tcmin = -100
wmax = 50# wind max m/s
wmin = 0 #wind min m/s
wdmax = 360
wdmin = 0
pmin = 500 #this is low pressure
pmax = 1200 #this is high pressure
rhmax = 130 #no more than 130# humidity sensors can have noise above 100%
rhmin = 0
shmin = -10 #this is conservative
shmax = 10 #max height above snow - sonic sensor, usually have really
#high values when bad
battmin = 8 #loggers & instruments unlikely to work
battmax = 24 #hopefully the highest ever would be 16 or else there
#are serious problems
#% Argos Station IDs and names
#%(04) 107282 gits - GITS
#%(05) 107283 hum - Humboldt Glacier
#%(07) 107285 tunu - Tunu N Glacier
#%(22) 107284 Pet - Petermann Glacier
#%(31) 135797 PE_gun - Princess Elizabeth Station Antarctica
#%(32) 135798 PE_blu - Princess Elizabeth Station ice runway
#%(33) 135796 PE_air - Princess Elizabeth Station Antarctica
AStation_numbers = np.array([4,5,7,22,31,32,33])
AStation_ID = np.array([107282,107283,107285,107284,135797,135798,135796])
#contains the (c-level) standard station number in the order in which we will process
#these data.
# Define ARGOS Station calibration constants
swincal = 200*np.ones((len(AStation_numbers),1))
swoutcal = 200*np.ones((len(AStation_numbers),1))
# The calibration coefficients are extracted from the
# QC->Ancillary->Defaults->CalibrationDefault.cal files in the QC software
# 4 5 7 22 31 32 33
swnetcal_pos=np.array([9.35, 9.29, 9.43, 9.51, 9.32927, 8.98, 9]) # no cal file for 22 or 33, used 21 for 22
swnetcal_neg=np.array([11.66, 11.62, 11.66, 11.88, 11.5745, 11.31, 11.5])
poffset = 400*np.ones((len(AStation_numbers),1))
swincal[5]=74.6 # %LAR2
swoutcal[5]=69.3 # %LAR2
swincal[6]=197.75 # %LAR3
swoutcal[6]=205.85 # %LAR3
for i in range(len(AStation_numbers)):
sid = AStation_ID[i]
snum = AStation_numbers[i]
print "Processing Station #"+str(snum)+"..."
if gmat.size!=0:
usdata=np.array(gmat[gmat[:,7]==sid,:]) #find data associated with each
if len(usdata)!=0:
u,IA = np.unique(usdata[:,8:],axis=0,return_index=True) #find rows with unique data
# % after column 8 because data may repeat with different time signature
usdata=usdata[np.sort(IA),:]
inds = np.argwhere((usdata[:,0]==usdata[:,9]) & (np.ceil(usdata[:,10])==np.floor(usdata[:,10])) & (usdata[:,10]>0) & (usdata[:,10]<367)) #find lines that are first
#part of the two piece table and have integer Julian day (records with
# decimal julian day are erroneous) and have realistic (positive and
# less than 367 day, leap year will have 366 days)
lastp2v = np.argwhere((usdata[:,0]!=usdata[:,9]) & (usdata[:,9]<=360)) #second parts of table
#column 10 of 2nd table is wind direction, realistic values will be
#less than 360 deg
lastp2 = lastp2v[-1:] #last second part
inds = inds[inds<lastp2] #make sure last record
# has a second piece of the table
numrecs = len(inds) #number of total records
adata = np.ones((numrecs,43))*999;
#indexes (columns) to be assigned in data vector
aind = np.concatenate((np.arange(0,20),np.arange(30,33),np.arange(34,38),np.array([38]),np.array([39])))
#indexes (columns) in table 1 raw
usind1 = np.concatenate((np.array([0]),np.array([10]),np.array([3]),np.arange(12,23)))
#indexes (columns) in table 2 raw
usind2 = np.concatenate((np.arange(9,14),np.array([22]),np.arange(14,22)))
for j in range(numrecs): #loop through records
ind2v=np.argwhere(usdata[inds[j]+1:,0] != usdata[inds[j]+1:,9]) #find second
#table parts occuring after assocaited first part
ind1 = inds[j]
ind2 = inds[j]+ind2v[0] #take the closest 2nd table line
#adata(j,[0:20,30:33,34:38,38,39])=np.column_stack(AStation_numbers(i),usdata(ind1,[0,10,3,12:23]),usdata(ind2,[9:14,22,14,15,16,17,18,19,20,21]));
adata[j,aind]=np.concatenate((np.array([snum]),usdata[ind1,usind1],usdata[ind2,usind2]))
gdata = adata[(adata[:,1]>1990) & (adata[:,1]<2050) & (adata[:,2]>=0) & (adata[:,2]<367),:] #filter realistic time
if len(gdata)!=0:
#(positive and less than 367 JD, leap year will have 366 days)
# and sensible year
gdata[gdata==-8190]=999
gdata[gdata==2080]=999
#print gdata[-1,0:5]
yr = gdata[:,1] #get year data
jday = gdata[:,2]+gdata[:,3]/24 #calculate fractional julian day
datenum = yr*1e3+jday #number that is ascending in time
udatenum,unind = np.unique(datenum,axis=0,return_index=True) #find only unique time stamps
if len(unind)<len(datenum):
numduptime = len(datenum)-len(unind)
print "Warning: Removed "+str(numduptime)+" entires out of: "+str(len(datenum))+" good pts from station ID: "+str(sid)+" Reason: duplicate time tags"
tind=np.argsort(datenum[unind]) #find indexes of a sort of unique values along time
gdata=gdata[tind,:] #crop data array to unique times
jday = jday[tind] #crop jday vector to unique times
yr = yr[tind]
datenum = datenum[tind] #leave only unique and sorted datenums
stnum = gdata[:,0] #get station number vector
SWin = gdata[:,4]*swincal[i] #assign and calibrate incoming shortwave
SWin[SWin<swmin]=999 #filter low
SWin[SWin>swmax]=999 #filter high
SWout = gdata[:,5]*swoutcal[i] #assign and calibrate outgoing shortwave
SWout[SWout<swmin]=999 #filter low
SWout[SWout>swmax]=999 #filter high
# #assign and calibrate net shortwave, negative and positive values
# #have different calibration coefficients according to QC code
SWnet = 999*np.ones(np.size(SWout,0))
SWnet[gdata[:,6]>=0]=gdata[gdata[:,6]>=0,6]*swnetcal_pos[i]
SWnet[gdata[:,6]<0] =gdata[gdata[:,6]<0,6]*swnetcal_neg[i]
SWnet[SWnet<-swmax]=999 #filter low
SWnet[SWnet>swmax]=999 #filter high
TC1 = gdata[:,7] #thermocouple 1
TC1[TC1<tcmin]=999 #filter low
TC1[TC1>tcmax]=999 #filter high
TC2 = gdata[:,8] #thermocouple 2
TC2[TC2<tcmin]=999 #filter low
TC2[TC2>tcmax]=999 #filter high
HMP1 = gdata[:,9] #HMP1 temp
HMP1[HMP1<hmpmin]=999 #filter low
HMP1[HMP1>hmpmax]=999 #filter high
HMP2 = gdata[:,10] #HMP2 temp
HMP2[HMP2<hmpmin]=999 #filter low
HMP2[HMP2>hmpmax]=999 #filter high
RH1 = gdata[:,11] #HMP relative humidity 1
RH1[RH1<rhmin]=999 #filter low
RH1[RH1>rhmax]=999 #filter high
RH2 = gdata[:,12] #HMP relative humidity 2
RH2[RH2<rhmin]=999 #filter low
RH2[RH2>rhmax]=999 #filter high
WS1 = gdata[:,13] #wind speed 1
WS1[WS1<wmin]=999 #filter low
WS1[WS1>wmax]=999 #filter high
WS2 = gdata[:,14] #wind speed 2
WS2[WS2<wmin]=999 #filter low
WS2[WS2>wmax]=999
WD1 = gdata[:,15] #wind direction 1
WD1[WD1<wdmin]=999 #filter low
WD1[WD1>wdmax]=999
WD2 = gdata[:,16] #wind direction 2
WD2[WD2<wdmin]=999 #filter low
WD2[WD2>wdmax]=999
pres = gdata[:,17]+poffset[i] #barometeric pressure
pres[pres<pmin]=999 #filter low
pres[pres>pmax]=999 #filter high
presd = np.diff(pres) #find difference of subsequent pressure meas
hrdif = np.diff(jday)*24. #time diff in hrs
mb_per_hr = np.absolute(np.divide(presd,hrdif,out=np.zeros_like(presd),where=hrdif!=0))
pjumps=np.argwhere(mb_per_hr>10) #find jumps > 10mb/hr (quite unnatural)
pres[pjumps+1]=999 #eliminate these single point jumps
SH1 = gdata[:,18] #hieght above snow 1
SH1[SH1<shmin]=999 #filter low
SH1[SH1>shmax]=999 #filter high
SH2 = gdata[:,19] #hieght above snow 2
SH2[SH2<shmin]=999 #filter low
SH2[SH2>shmax]=999 #filter high
SnowTemp10 = gdata[:,20:30] #10m snow temperature (many of these are non functional or not connected)
volts = gdata[:,30] #battery voltage
volts[volts<battmin]=999 #filter low
volts[volts>battmax]=999 #filter high
SWinmax = gdata[:,31]*swincal[i] #incoming shortwave max
SWinmax[SWinmax<swmin]=999 #filter low
SWinmax[SWinmax>swmax]=999 #filter high
SWoutmax = gdata[:,32]*swoutcal[i] #reflected shortwave max
SWoutmax[SWoutmax<swmin]=0 #filter low
SWoutmax[SWoutmax>swmax]=999 #filter high
SWnetmax = 999*np.ones_like(SWoutmax)
SWnetmax[gdata[:,33]>=0]=gdata[gdata[:,33]>=0,33]*swnetcal_pos[i] #net radiation max
SWnetmax[gdata[:,33]<0]=gdata[gdata[:,33]<0,33]*swnetcal_neg[i]
SWnetmax[SWnetmax<-swmax]=999 #filter low
SWnetmax[SWnetmax>swmax]=999 #filter high
tc1max = gdata[:,34]
tc1max[tc1max<tcmin]=999 #filter low
tc1max[tc1max>tcmax]=999 #filter high
tc2max = gdata[:,35]
tc2max[tc2max<tcmin]=999 #filter low
tc2max[tc2max>tcmax]=999 #filter high
tc1min = gdata[:,36]
tc1min[tc1min<tcmin]=999 #filter low
tc1min[tc1min>tcmax]=999 #filter high
tc2min = gdata[:,37]
tc2min[tc2min<tcmin]=999 #filter low
tc2min[tc2min>tcmax]=999 #filter high
ws1max = gdata[:,38] #stats
ws2max = gdata[:,39]
ws1std = gdata[:,40]
ws2std = gdata[:,41]
Tref = gdata[:,42]
# # note this code does not currently calculate the 2 and 10 m winds
# # and albedo, so this is column 1-42 of the Level C data
wdata = np.column_stack((stnum,yr,jday,SWin,SWout,SWnet,TC1,TC2,HMP1,HMP2,RH1,RH2,WS1,WS2,WD1,WD2,pres,SH1,SH2,SnowTemp10,volts,SWinmax,SWoutmax,SWnetmax,tc1max,tc2max,tc1min,tc2min,ws1max,ws2max,ws1std,ws2std,Tref)) #assemble data into final level C standard form
today = datetime.datetime.now()
day_of_year = (today - datetime.datetime(today.year, 1, 1)).days + 1
theyear = today.year
todayjday = day_of_year+today.hour/24 #calculate fractional julian day
nowdatenum = theyear*1e3+todayjday
wdata = wdata[datenum<nowdatenum,:] #only take entries in the past
numfuturepts = len(np.argwhere(datenum>nowdatenum))
if numfuturepts>0:
print "Warning: Removed "+str(numfuturepts)+" entires out of: "+str(len(wdata[:,1])+numfuturepts)+" good pts from station ID: "+str(sid)+" Reason: time tags in future"
else: #if gdata is empty after removing bad dates
wdata=np.array([])
else: #if no data in usdata still output empty wdata array so empty file is created
wdata = np.array([])
filename = str(snum)+'.csv'
if newloadflag==1:
with open(filename,'w') as fidn:
WriteCFile(fidn,wdata) #overwrite any existing files because
#newloadflag==1 means fresh run
else:
try:
fsize=os.path.getsize(filename)
if fsize!=0: #if station file already exists append to it
if len(wdata) == 0: #if no new data
indstart = 0
outdat = wdata
else: #there is some data in the array
with open(filename,"rb") as f:
lines = f.readlines()
lastline=np.genfromtxt(lines[-1:],delimiter=',') # read last line of existing file
lastyr = lastline[:,1] #get year data
lastjday = lastline[:,2]+lastline[:,3]/24 #calculate fractional julian day
lastdatenum = yr*1e3+jday #number that is ascending in time, calculate last date number of old data
indstart = np.argwhere(datenum<=lastdatenum) #find indexs of dates in new part that are before what is already in csv
if len(indstart)==0: #all data new
indstart = 0
outdat = wdata
elif len(indstart) == len(wdata[:,1]): #only dates before what is already there
outdat = np.array([])
else: #some new data some old data
outdat = wdata[int(np.max(indstart))+1:,:] #begin with index after what is already in file
#write outdat to station_id.dat
with open(filename,'a') as fidn:
WriteCFile(fidn,outdat)
except: #if filename doesnt exist create new file
with open(filename,'w') as fidn:
WriteCFile(fidn,wdata)
print "No Existing "+filename+" found. Writing new .dat for this station"