-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathNASISpedons_Extract_Pedons_from_NASIS _byTextFile.py
1630 lines (1265 loc) · 74.5 KB
/
NASISpedons_Extract_Pedons_from_NASIS _byTextFile.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
#-------------------------------------------------------------------------------
# Name: NASISpedons_Extract_Pedons_from_NASIS_by_TextFile
#
# Author: Adolfo.Diaz
# e-mail: [email protected]
# phone: 608.662.4422 ext. 216
#
# Author: Jason.Nemecek
# e-mail: [email protected]
# phone: 608.662.4422 ext. 190
#
# Created: 7/04/2016
# Last Modified: 5/18/2017
# Copyright: (c) Adolfo.Diaz 2016
# https://alexwlchan.net/2019/10/adventures-with-concurrent-futures/
# This is an exact copy of NASISpedons_Extract_Pedons_from_NASIS _MultiThreading_ArcGISPro
# but modified to work with a text file.
# ==========================================================================================
# Updated 4/29/2021 - Adolfo Diaz
# Major rewrite to introduce parallel tasking using concurrent.futures python
# module. Using this module I was able t
# ==========================================================================================
# Updated 5/26/2021 - Adolfo Diaz
# - Changed the format in which failed pedon ids are written to the error log
# file. Previously, the pedon IDs were logged as a continuous list separated by commas.
# Now, the pedon IDs are logged with a carriage return
# - Added capability to have the Pedons automatically added to the ArcGIS Pro Session
# if the pedon fc has valid pedons.
# ==========================================================================================
# Updated 6/17/2021 - Adolfo Diaz
# - Added functionality to output an SQLite Database Format
# ==========================================================================================
# Updated 3/14/2022 - Adolfo Diaz
# - updated createReferenceObjects function to set the number of fields to 9 for the siteaoverlap
# table from 6. This is b/c the metadatatable only has 6 fields and 3 additional fields are
# added (areasym, areaname and areatype)
#-------------------------------------------------------------------------------
## ===================================================================================
class ExitError(Exception):
    """Script-specific exception type; adds nothing to the built-in Exception.

    NOTE(review): presumably raised to stop the tool early -- confirm against callers.
    """
## ===================================================================================
def AddMsgAndPrint(msg, severity=0):
    """Print a message, append it to the log text file and post it to the geoprocessor.

    Every step is best effort: a failure to print, to write the log file or to
    reach arcpy is swallowed so that reporting never interrupts the caller.

    Parameters
        msg      - text to report.
        severity - 0 posts an arcpy message, 1 an arcpy warning and 2 an arcpy
                   error (the error text is prefixed with a newline). Any other
                   value posts nothing to arcpy.

    Returns
        None
    """
    try:
        print(msg)

        # Appending to the log file is optional. textFilePath is a module-level
        # name set elsewhere; if it is missing or not writable the message is
        # simply not logged. The context manager guarantees the file is closed
        # (the previous code referenced f.close without calling it).
        try:
            with open(textFilePath, 'a+') as logFile:
                logFile.write(msg + " \n")
        except Exception:
            pass

        # Add a geoprocessing message (in case this is run as a tool)
        if severity == 0:
            arcpy.AddMessage(msg)
        elif severity == 1:
            arcpy.AddWarning(msg)
        elif severity == 2:
            arcpy.AddError("\n" + msg)

    except Exception:
        # Deliberate best effort: reporting must never raise.
        pass
## ===================================================================================
def errorMsg():
    """Report the exception currently being handled through AddMsgAndPrint.

    The message is built from the second entry and the last entry of the
    formatted traceback and is posted with severity 2. If building or posting
    that message fails, a fixed fallback message is posted instead.
    """
    try:
        formattedLines = traceback.format_exception(*sys.exc_info())
        secondLine = formattedLines[1]
        finalLine = formattedLines[-1]
        AddMsgAndPrint("\t" + secondLine + "\n\t" + finalLine, 2)
    except:
        AddMsgAndPrint("Unhandled error in errorMsg method", 2)
## ================================================================================================================
def tic():
    """ Returns the value of time.time() at the moment of the call """
    startStamp = time.time()
    return startStamp
## ================================================================================================================
def toc(_start_time):
    """ Returns the time elapsed since _start_time (a time.time() value) as text.

        The elapsed seconds are rounded and reported as hours, minutes and
        seconds; leading units that are zero are left out. If anything fails,
        errorMsg() is called and None is returned."""
    try:
        elapsed = round(time.time() - _start_time)
        wholeMinutes, secs = divmod(elapsed, 60)
        hrs, mins = divmod(wholeMinutes, 60)

        # Less than a minute
        if not hrs and not mins:
            return ('{} second(s)'.format(int(secs)))

        # Less than an hour
        if not hrs:
            return ('{} minute(s): {} second(s)'.format(int(mins), int(secs)))

        return ('{} hour(s): {} minute(s): {} second(s)'.format(int(hrs), int(mins), int(secs)))
    except:
        errorMsg()
## ================================================================================================================
def splitThousands(someNumber):
    """ Returns str(someNumber) with a comma inserted between every group of
        three digits, counted from the right. Intended for integers.
        If the formatting fails, errorMsg() is called and someNumber is
        returned unchanged."""
    try:
        # Work on the reversed text so the groups of three are counted from the right
        backwards = str(someNumber)[::-1]
        withCommas = re.sub(r'(\d{3})(?=\d)', r'\1,', backwards)
        return withCommas[::-1]
    except:
        errorMsg()
        return someNumber
## ================================================================================================================
def getDictionaryOfAllPedonIDs():
    """Request the list of ALL pedon IDs in NASIS and return them as dictionary keys.

    Description
        Sends a URL request to the 'WEB_PEDON_PEIID_LIST_ALL_OF_NASIS' NASIS report.
        The pedon IDs are read from the line(s) between the line that starts with
        '<div id="ReportData">START' and the 'STOP' line, i.e.
            START 1204126, 1204127, 1204128 STOP
        The request is attempted up to 3 times; only the failure of the last
        attempt is reported.

    Returns
        A dictionary whose keys are the pedon IDs (as strings) and whose values
        are all None. False is returned if the report could not be requested,
        if no pedon IDs were found or if an unhandled error occurred.
    """
    try:
        AddMsgAndPrint("\nRequesting a list of ALL pedonIDs from NASIS")
        arcpy.SetProgressorLabel("Requesting a list of ALL pedonIDs from NASIS")

        URL = r'https://nasis.sc.egov.usda.gov/NasisReportsWebSite/limsreport.aspx?report_name=WEB_PEDON_PEIID_LIST_ALL_OF_NASIS'

        # -------------------------------------- Try connecting to NASIS to read the report
        theReport = None
        lastError = None
        for attemptLabel in (None, "2nd", "3rd"):
            if attemptLabel:
                AddMsgAndPrint("\t" + attemptLabel + " attempt at requesting data")
            try:
                theReport = urllib.request.urlopen(URL).readlines()
                break
            except Exception as requestError:
                # Earlier failures are retried silently; only the last one is reported
                lastError = requestError

        if theReport is None:
            # HTTPError is a subclass of URLError so it has to be tested first
            if isinstance(lastError, HTTPError):
                AddMsgAndPrint('HTTP Error' + str(lastError),2)
            elif isinstance(lastError, URLError):
                AddMsgAndPrint('URL Error' + str(lastError),2)
            elif isinstance(lastError, socket.timeout):
                AddMsgAndPrint("\n\t" + URL)
                AddMsgAndPrint("\tServer Timeout Error", 2)
            elif isinstance(lastError, socket.error):
                AddMsgAndPrint("\n\t" + URL)
                AddMsgAndPrint("\tNASIS Reports Website connection failure", 2)
            else:
                # Anything else is reported by the generic handler below
                raise lastError
            return False

        # -------------------------------------- Read the NASIS report
        # Initialized up front so a report without a START marker yields an
        # empty dictionary instead of an unbound name.
        pedonDict = dict()
        bValidRecord = False # boolean that marks the starting point of the pedon IDs listed in the report

        arcpy.SetProgressor("step", "Reading NASIS Report: 'WEB_PEDON_PEIID_LIST_ALL_OF_NASIS'", 0, len(theReport), 1)

        # iterate through the report until a valid record is found
        for theValue in theReport:

            # convert from bytes to string and remove white spaces
            theValue = theValue.decode('utf-8').strip()

            if bValidRecord:
                if theValue == "STOP": # written as part of the report; end of lines
                    break

                # All of the pedonIDs are expected in 1 line; IDs are accumulated
                # so blank lines or additional lines cannot wipe out earlier IDs.
                for val in theValue.split(","):
                    val = val.strip()
                    if val:
                        pedonDict[val] = None

            elif theValue.startswith('<div id="ReportData">START'):
                bValidRecord = True

            arcpy.SetProgressorPosition()

        # Resets the progressor back to its initial state
        arcpy.ResetProgressor()

        if not pedonDict:
            AddMsgAndPrint("\tThere were no pedons returned from this report",2)
            return False

        return pedonDict

    except Exception:
        errorMsg()
        return False
## ================================================================================================================
def getBoundingCoordinates(feature):
    """ This function will return WGS84 coordinates in Lat-Long format that will be passed
        over to the 'WEB_EXPORT_PEDON_BOX_COUNT' report. The coordinates are generated by
        creating a minimum bounding envelope around the input features. The envelope is then
        converted to vertices and the SW Ycoord, NE Ycoord, SW Xcoord and NE Xcoord are
        returned in that order. Geo-Processing Environments are set to WGS84 in order to
        return coords in Lat/Long.

        Parameters
            feature - input layer or feature class; if it has a selected set only the
                      selected features are used.

        Returns
            (south latitude, north latitude, west longitude, east longitude) on success.
            This assumes the 1st envelope vertex is the SW corner and the 3rd vertex is
            the NE corner.
            False if the spatial reference is unknown, the envelope could not be created,
            4 unique vertices were not found or an unhandled error occurred.
            (False, False, False, False) if no geographic transformation is known for the
            input datum.
            NOTE(review): the 4-item failure value is truthy and differs from every other
            failure path; it is kept as-is because callers may unpack it -- confirm and unify."""

    # Scratch data is tracked from the start so it can be cleaned up on every exit path
    envelope = None
    envelopePts = None
    envelopeFeature = None
    bExport = False
    bCoordSysSet = False

    try:
        # Determine if features are a subset of selected polygons OR the entire dataset
        # is being used. This was necessary b/c the output Coordinate System
        # environmental variable was not being honored if a selected set is being used.
        # Export selected set to a temporary feature class otherwise continue
        arcpy.SetProgressorLabel("Calculating bounding coordinates of input features")

        featurePath = arcpy.Describe(feature).catalogPath
        totalPolys = int(arcpy.GetCount_management(featurePath).getOutput(0))
        selectedPolys = int(arcpy.GetCount_management(feature).getOutput(0))

        if selectedPolys < totalPolys:
            envelopeFeature = arcpy.CreateScratchName("envelopeFeature",data_type="FeatureClass", workspace="in_memory")
            bExport = True
            arcpy.CopyFeatures_management(feature,envelopeFeature)
            AddMsgAndPrint("\nCalculating bounding coordinates for " + splitThousands(selectedPolys) + " feature(s)",0)
        else:
            envelopeFeature = feature
            AddMsgAndPrint("\nCalculating bounding coordinates of input features",0)

        # Set Projection and Geographic Transformation environments in order
        # to post process everything in WGS84. This will force all coordinates
        # to be in Lat/Long
        inputSR = arcpy.Describe(feature).spatialReference     # Get Spatial Reference of input features

        # The spatial reference has to be checked by name and before the datum is read
        if inputSR.name == "Unknown":
            AddMsgAndPrint("\n\tInput layer needs a spatial reference defined to determine bounding envelope",2)
            return False

        inputDatum = inputSR.GCS.datumName                     # Get Datum name of input features

        if inputDatum == "D_North_American_1983":
            arcpy.env.geographicTransformations = "WGS_1984_(ITRF00)_To_NAD_1983"
        elif inputDatum == "D_North_American_1927":
            arcpy.env.geographicTransformations = "WGS_1984_(ITRF00)_To_NAD_1927"
        elif inputDatum == "D_NAD_1983_2011":
            arcpy.env.geographicTransformations = "WGS_1984_(ITRF00)_To_NAD_1983_2011"
        elif inputDatum == "D_WGS_1984":
            arcpy.env.geographicTransformations = ""
        else:
            AddMsgAndPrint("\n\tGeo Transformation of Datum could not be set",2)
            AddMsgAndPrint("\tTry Projecting input layer to WGS 1984 Coordinate System",2)
            return False, False, False, False

        # Factory code for WGS84 Coordinate System
        arcpy.env.outputCoordinateSystem = arcpy.SpatialReference(4326)
        bCoordSysSet = True

        # ------------ Create Minimum Bounding Envelope of features ------------
        envelope = arcpy.CreateScratchName("envelope",data_type="FeatureClass",workspace="in_memory")
        envelopePts = arcpy.CreateScratchName("envelopePts",data_type="FeatureClass",workspace="in_memory")

        # create minimum bounding geometry enclosing all features
        arcpy.MinimumBoundingGeometry_management(envelopeFeature,envelope,"ENVELOPE","ALL","#","MBG_FIELDS")

        if int(arcpy.GetCount_management(envelope).getOutput(0)) < 1:
            AddMsgAndPrint("\n\tFailed to create minimum bounding area. \n\tArea of interest is potentially too small",2)
            return False

        arcpy.FeatureVerticesToPoints_management(envelope, envelopePts, "ALL")

        # ------------ Get X and Y coordinates from envelope ------------
        coordList = []
        with arcpy.da.SearchCursor(envelopePts,['SHAPE@XY']) as cursor:
            for row in cursor:
                # Vertices with an X or Y of exactly 0 are ignored
                if abs(row[0][0]) > 0 and abs(row[0][1]) > 0:

                    # Don't add duplicate coords; Last coord will also be the starting coord
                    if row[0] not in coordList:
                        coordList.append(row[0])

        if len(coordList) == 4:
            # coordList[0] is the SW corner and coordList[2] the NE corner, so the
            # SW X value is the West longitude and the NE X value is the East longitude.
            AddMsgAndPrint("\tBounding Box Coordinates:")
            AddMsgAndPrint("\t\tSouth Latitude: " + str(coordList[0][1]))
            AddMsgAndPrint("\t\tNorth Latitude: " + str(coordList[2][1]))
            AddMsgAndPrint("\t\tWest Longitude: " + str(coordList[0][0]))
            AddMsgAndPrint("\t\tEast Longitude: " + str(coordList[2][0]))
            return coordList[0][1],coordList[2][1],coordList[0][0],coordList[2][0]

        AddMsgAndPrint("\tCould not get Latitude-Longitude coordinates from bounding area",2)
        return False

    except Exception:
        errorMsg()
        return False

    finally:
        # Best-effort cleanup on every exit path; a cleanup failure must not
        # replace the value being returned.
        try:
            # Reset output Coord Sys Environment, only if this function changed it
            if bCoordSysSet:
                arcpy.env.outputCoordinateSystem = ""

            # Delete temp spatial files; the exported copy is only ours when bExport is set
            scratchData = [envelope,envelopePts]
            if bExport:
                scratchData.append(envelopeFeature)

            for tempFile in scratchData:
                if tempFile and arcpy.Exists(tempFile):
                    arcpy.Delete_management(tempFile)
        except Exception:
            pass
## ================================================================================================================
def getWebPedonNumberSum(coordinates):
    """ This function will send the bounding coordinates to the 'Web Pedon Number SUM' NASIS report
        and return the number of pedons within the bounding coordinates. Pedons include regular
        NASIS pedons and LAB pedons. Example of URL sent to the NASIS report would be:
        https://nasis.sc.egov.usda.gov/NasisReportsWebSite/limsreport.aspx?report_name=WEB_ANALYSIS_PC_PEDON_NUMBER_SUM&Lat1=43.6425577303&Lat2=43.9828939095&Long1=-89.5997555233&Long2=-89.167551308

        Parameters
            coordinates - query string that is appended to the report URL as-is,
                          i.e. '&Lat1=..&Lat2=..&Long1=..&Long2=..'

        Returns
            The first line found after the '<div id="ReportData">START' line that can be
            converted to an integer, as an int.
            False if the report could not be requested or an unhandled error occurred.
            None if the report contains no integer before the 'STOP' line.

        The request is attempted up to 3 times; only the failure of the last attempt
        is reported."""
    try:
        AddMsgAndPrint("\nDetermining if there are any pedons within the bounding coordinates")
        arcpy.SetProgressorLabel("Determining if there are any pedons within the bounding coordinates")

        # Open a network object using the URL with the search string already concatenated
        URL = r'https://nasis.sc.egov.usda.gov/NasisReportsWebSite/limsreport.aspx?report_name=WEB_ANALYSIS_PC_PEDON_NUMBER_SUM' + coordinates

        # -------------------------------------- Try connecting to NASIS to read the report
        # Every attempt reads the report as a list of byte lines because that is
        # what the parsing loop below expects.
        theReport = None
        lastError = None
        for attemptLabel in (None, "2nd", "3rd"):
            if attemptLabel:
                AddMsgAndPrint("\t" + attemptLabel + " attempt at requesting data")
            try:
                theReport = urllib.request.urlopen(URL).readlines()
                break
            except Exception as requestError:
                # Earlier failures are retried silently; only the last one is reported
                lastError = requestError

        if theReport is None:
            # HTTPError is a subclass of URLError so it has to be tested first
            if isinstance(lastError, HTTPError):
                AddMsgAndPrint('HTTP Error' + str(lastError),2)
            elif isinstance(lastError, URLError):
                AddMsgAndPrint('URL Error' + str(lastError),2)
            elif isinstance(lastError, socket.timeout):
                AddMsgAndPrint("\n\t" + URL)
                AddMsgAndPrint("\tServer Timeout Error", 2)
            elif isinstance(lastError, socket.error):
                AddMsgAndPrint("\n\t" + URL)
                AddMsgAndPrint("\tNASIS Reports Website connection failure (Socket Error)", 2)
            else:
                # Anything else is reported by the generic handler below
                raise lastError
            return False

        # -------------------------------------- Read the NASIS report
        bValidRecord = False # boolean that marks the starting point of the values listed in the report

        # iterate through the report until a valid record is found
        for theValue in theReport:

            # convert from bytes to string and remove white spaces
            theValue = theValue.decode('utf-8').strip()

            if bValidRecord:
                if theValue == "STOP": # written as part of the report; end of lines
                    break

                # The first line that is a whole number is the pedon count
                try:
                    return int(theValue)
                except ValueError:
                    continue

            elif theValue.startswith('<div id="ReportData">START'):
                bValidRecord = True

        # No pedon count was found in the report
        return None

    except Exception:
        errorMsg()
        return False
## ================================================================================================================
def getWebExportPedon(coordinates):
    """ This function will send the bounding coordinates to the 'Web Export Pedon Box' NASIS report
        and return a dictionary of pedons within the bounding coordinates. Pedons include regular
        NASIS pedons and LAB pedons. Each record in the report will contain the following values:

            Row_Number,upedonid,peiid,pedlabsampnum,Longstddecimaldegrees,latstddecimaldegrees,Undisclosed Pedon
            24|S1994MN161001|102861|94P0697|-93.5380936|44.0612717|'Y'

        Example of URL sent to the NASIS report:
        https://nasis.sc.egov.usda.gov/NasisReportsWebSite/limsreport.aspx?report_name=WEB_EXPORT_PEDON_BOX_COUNT&Lat1=44.070820&Lat2=44.596950&Long1=-91.166274&Long2=-90.311911

        Parameters
            coordinates - query string that is appended to the report URL as-is,
                          i.e. '&Lat1=..&Lat2=..&Long1=..&Long2=..'

        Returns
            A dictionary keyed by peiid; each value is the tuple
            (upedonid, pedlabsampnum or None, longitude, latitude), all kept as strings:

            {'102857': ('S1954MN161113A', '40A1694', '-93.6499481', '43.8647194'),
             '102858': ('S1954MN161113B', None, '-93.6455002', '43.8899956')}

            Undisclosed records are counted but not added to the dictionary.
            False if the report could not be requested, a record does not have 7 values,
            no pedons were found or an unhandled error occurred.

        The request is attempted up to 3 times; only the failure of the last attempt
        is reported."""
    try:
        AddMsgAndPrint("\nRequesting a list of pedonIDs from NASIS using the above bounding coordinates")
        arcpy.SetProgressorLabel("Requesting a list of pedons from NASIS")

        URL = r'https://nasis.sc.egov.usda.gov/NasisReportsWebSite/limsreport.aspx?report_name=WEB_EXPORT_PEDON_BOX_COUNT' + coordinates

        pedonDictionary = dict()

        # -------------------------------------- Try connecting to NASIS to read the report
        theReport = None
        lastError = None
        for attemptLabel in (None, "2nd", "3rd"):
            if attemptLabel:
                AddMsgAndPrint("\t" + attemptLabel + " attempt at requesting data")
            try:
                theReport = urllib.request.urlopen(URL).readlines()
                break
            except Exception as requestError:
                # Earlier failures are retried silently; only the last one is reported
                lastError = requestError

        if theReport is None:
            # HTTPError is a subclass of URLError so it has to be tested first
            if isinstance(lastError, HTTPError):
                AddMsgAndPrint('HTTP Error' + str(lastError),2)
            elif isinstance(lastError, URLError):
                AddMsgAndPrint('URL Error' + str(lastError),2)
            elif isinstance(lastError, socket.timeout):
                AddMsgAndPrint("\n\t" + URL)
                AddMsgAndPrint("\tServer Timeout Error", 2)
            elif isinstance(lastError, socket.error):
                AddMsgAndPrint("\n\t" + URL)
                AddMsgAndPrint("\tNASIS Reports Website connection failure", 2)
            else:
                # Anything else is reported by the generic handler below
                raise lastError
            return False

        # -------------------------------------- Read the NASIS report
        totalPedonCnt = 0
        labPedonCnt = 0
        undisclosed = 0
        bValidRecord = False # boolean that marks the starting point of the records listed in the report

        arcpy.SetProgressor("step", "Reading NASIS Report: 'WEB_EXPORT_PEDON_BOX_COUNT'", 0, len(theReport), 1)

        # iterate through the report until a valid record is found
        for theValue in theReport:

            # convert from bytes to string and remove white spaces
            theValue = theValue.decode('utf-8').strip()

            if bValidRecord:
                if theValue == "STOP": # written as part of the report; end of lines
                    break

                theRec = theValue.split("|")

                if len(theRec) != 7:
                    AddMsgAndPrint("\tNASIS Report: Web Export Pedon Box is not returning the correct amount of values per record",2)
                    return False

                # Undisclosed Record; Reject this record
                # NOTE(review): the sample record in the docstring shows this flag wrapped
                # in single quotes ('Y'); confirm the report really emits a bare Y.
                if theRec[6] == "Y":
                    undisclosed += 1
                    totalPedonCnt += 1
                    continue

                userPedonID = theRec[1]
                pedonID = theRec[2]
                longDD = theRec[4]
                latDD = theRec[5]

                # Lab sample or not
                if theRec[3] == 'Null' or theRec[3] == '':
                    labSampleNum = None
                else:
                    labSampleNum = theRec[3]

                # Repeated peiids are ignored. The lab counter is only advanced together
                # with the total so the NASIS pedon count reported below stays consistent.
                if pedonID not in pedonDictionary:
                    pedonDictionary[pedonID] = (userPedonID,labSampleNum,longDD,latDD)
                    totalPedonCnt += 1
                    if labSampleNum is not None:
                        labPedonCnt += 1

            elif theValue.startswith('<div id="ReportData">START'):
                bValidRecord = True

            arcpy.SetProgressorPosition()

        # Resets the progressor back to its initial state
        arcpy.ResetProgressor()

        if not pedonDictionary:
            AddMsgAndPrint("\tThere were no pedons found in this area; Try using a larger extent",1)
            return False

        AddMsgAndPrint("\tThere are " + splitThousands(totalPedonCnt) + " within this layer:")
        AddMsgAndPrint("\t\tLAB Pedons: " + splitThousands(labPedonCnt))
        AddMsgAndPrint("\t\tUndisclosed: " + splitThousands(undisclosed))
        AddMsgAndPrint("\t\tNASIS Pedons: " + splitThousands((totalPedonCnt - labPedonCnt) - undisclosed))
        return pedonDictionary

    except Exception:
        errorMsg()
        return False
## ================================================================================================================
def filterPedonsByFeature(feature):
    """Remove from pedonDict every pedon that does not intersect the input features.

    Description
        This function will temporarily plot out the pedons in pedonDict in order to
        determine which pedons intersect the user's AOI. Once determined, the extra
        pedons are removed from the pedonDict so that extra pedons are not downloaded.

    Parameters
        feature - input area of interest that will be used to intersect against the
                  temporarily plotted NASIS points. This will only be used as a reference.
                  The module-level pedonDict is read and altered directly; it is not
                  passed in. Its values are indexed as (.., lab sample number, X, Y).

    Returns
        An integer that reflects the number of pedons selected by the intersect with the
        feature AOI. False will be returned if an error occurs within this function OR
        if there are NO pedons within the feature AOI.
        The updated pedonDict is not returned since it is altered in place.

    Side effects
        arcpy.env.outputCoordinateSystem is set to WGS84 (4326) and left that way.
    """
    # Scratch data is tracked from the start so it can be cleaned up on every exit path
    aoiFeature = None
    tempPoints = None
    tempPointsLYR = None
    selectedPedons = None

    try:
        featureName = arcpy.Describe(feature).Name

        AddMsgAndPrint("\nSelecting pedons that intersect with " + featureName + " Layer",0)
        arcpy.SetProgressorLabel("Selecting pedons that intersect with " + featureName + " Layer")

        # Set everything to WGS84
        arcpy.env.outputCoordinateSystem = arcpy.SpatialReference(4326)

        # Make a copy of the user-input features - this is just in case there is a selected set
        aoiFeature = arcpy.CreateScratchName("aoiFeature",data_type="FeatureClass", workspace="in_memory")
        arcpy.CopyFeatures_management(feature,aoiFeature)

        # Create a temp point feature class to digitize ALL of the pedons within the bounding box first
        tempPoints = arcpy.CreateScratchName("tempPoints",data_type="FeatureClass", workspace="in_memory")

        # Factory code for WGS84 Coordinate System
        spatial_reference = arcpy.SpatialReference(4326)
        arcpy.CreateFeatureclass_management("in_memory", os.path.basename(tempPoints), "POINT", "#", "DISABLED", "DISABLED", spatial_reference)

        peiidFld = "peiid"
        arcpy.AddField_management(tempPoints,peiidFld,"LONG")

        # Insert one point per pedon using the peiid and XY values
        with arcpy.da.InsertCursor(tempPoints,[peiidFld,'SHAPE@XY']) as cursor:
            for pedon, pedonInfo in pedonDict.items():
                xValue = float(pedonInfo[2])
                yValue = float(pedonInfo[3])
                cursor.insertRow([pedon,(xValue,yValue)])

        # The label is set again b/c the name of the temp points stays frozen in the progress bar.
        arcpy.SetProgressorLabel("Selecting pedons that intersect with " + featureName + " Layer")

        # Select all of the pedons within the user's AOI
        tempPointsLYR = arcpy.CreateScratchName("tempPointsLYR",data_type="FeatureClass", workspace="in_memory")
        arcpy.MakeFeatureLayer_management(tempPoints,tempPointsLYR)

        arcpy.SelectLayerByLocation_management(tempPointsLYR,"INTERSECT",aoiFeature, "","NEW_SELECTION")
        pedonsWithinAOI = int(arcpy.GetCount_management(tempPointsLYR).getOutput(0))

        if pedonsWithinAOI <= 0:
            AddMsgAndPrint("\tThere are NO pedons that are completely within your AOI. EXITING! \n",2)
            return False

        # There are pedons within the user's AOI
        AddMsgAndPrint("\tThere are " + splitThousands(pedonsWithinAOI) + " pedons within this layer",0)

        # Make a copy of the selected points
        selectedPedons = arcpy.CreateScratchName("selectedPedons",data_type="FeatureClass", workspace="in_memory")
        arcpy.CopyFeatures_management(tempPointsLYR,selectedPedons)

        # Collect the selected pedonIDs; they are converted to strings in order to compare
        # against the pedonDict keys. A set keeps every membership test constant time.
        with arcpy.da.SearchCursor(selectedPedons,[peiidFld]) as rows:
            selectedPedonIDs = {str(row[0]) for row in rows}

        # delete any pedon from the pedonDict that is not in the selected set.
        # The keys are listed first b/c the dictionary cannot change during iteration.
        labPedonCnt = 0
        for pedon in list(pedonDict):
            if pedon not in selectedPedonIDs:
                del pedonDict[pedon]
            elif pedonDict[pedon][1] is not None:
                labPedonCnt += 1

        AddMsgAndPrint("\t\tLAB Pedons: " + splitThousands(labPedonCnt))
        AddMsgAndPrint("\t\tNASIS Pedons: " + splitThousands(pedonsWithinAOI - labPedonCnt))

        # Return integer reflecting number of pedons within feature AOI
        return pedonsWithinAOI

    except Exception:
        errorMsg()
        return False

    finally:
        # Best-effort removal of the scratch data on every exit path; a cleanup
        # failure must not replace the value being returned.
        try:
            for layer in (aoiFeature,tempPoints,tempPointsLYR,selectedPedons):
                if layer and arcpy.Exists(layer):
                    arcpy.Delete_management(layer)
        except Exception:
            pass
## ================================================================================================================
def createPedonDB():
    """This Function will create a new pedon database by copying an empty template database
       that sits in the same folder as this script. A SQLite template is used when the
       module-level sqliteFormat is set; otherwise a File Geodatabase template is used.
       The copy is written to outputFolder and named DBname plus the template extension
       (both are module-level names set elsewhere).

       Return False if the template is missing OR an existing database with the
       user-defined name already exists and cannot be deleted OR an unhandled error is
       encountered.

       Return the path to the new pedon database if everything executes correctly."""
    try:
        if sqliteFormat:
            AddMsgAndPrint(".\nCreating New Pedon SQLite Database",0)
            arcpy.SetProgressorLabel("Creating New Pedon SQLite Database")
        else:
            AddMsgAndPrint(".\nCreating New Pedon File Geodatabase",0)
            arcpy.SetProgressorLabel("Creating New Pedon File Geodatabase")

        # The empty templates are stored next to this script. os.path.join is used
        # so an empty script folder yields a relative path instead of a path at
        # the root of the drive.
        scriptFolder = os.path.dirname(sys.argv[0])

        if sqliteFormat:
            localPedonDB = os.path.join(scriptFolder,"NASISPedonsSQLiteTemplate.sqlite")
            ext = ".sqlite"
        else:
            localPedonDB = os.path.join(scriptFolder,"NASISPedonsFGDBTemplate.gdb")
            ext = ".gdb"

        # Return false if pedon template is not found; the basename already
        # carries its extension so it is not appended again.
        if not arcpy.Exists(localPedonDB):
            AddMsgAndPrint("\t" + os.path.basename(localPedonDB) + " template was not found!",2)
            return False

        newPedonDB = os.path.join(outputFolder,DBname + ext)

        if arcpy.Exists(newPedonDB):
            try:
                arcpy.Delete_management(newPedonDB)
                AddMsgAndPrint(".\t" + os.path.basename(newPedonDB) + " already exists. Deleting and re-creating FGDB\n",1)
            except Exception:
                AddMsgAndPrint(".\t" + os.path.basename(newPedonDB) + " already exists. Failed to delete\n",2)
                return False

        # copy template over to new location
        # NOTE: an earlier version built the schema by importing the
        # NASISpedons_XMLWorkspace.xml workspace document into an empty FGDB.
        AddMsgAndPrint(".\tCreating " + DBname + ext + " with NCSS Pedon Schema 7.4.1")
        arcpy.Copy_management(localPedonDB,newPedonDB)

        AddMsgAndPrint(".\tSuccessfully created: " + os.path.basename(newPedonDB))
        return newPedonDB

    except Exception:
        AddMsgAndPrint("Unhandled exception (createDB)", 2)
        errorMsg()
        return False
## ===============================================================================================================
def createReferenceObjects(pedonDBloc):
    """Build the two lookup dictionaries describing the tables of the pedon database.

    The metadata table (prefix + "MetadataTable") stored inside pedonDBloc is read for
    each table's physical name (tabphynm) and label (tablab).  Only tables that are
    actually present in the database are recorded; the metadata table may list more
    tables than the database template contains.

    Parameters
        pedonDBloc - Catalog path of the pedon database that was created to store pedon
                     data.  It must contain the metadata table described above.

    Returns
        A 2-item tuple (emptyPedonGDBtablesDict, tableInfoDict):
          - emptyPedonGDBtablesDict: every recorded table name (with prefix) as a key and
            an empty list as its value, i.e. {'area': [], 'areatype': []}.  The lists are
            expected to be filled with records later on by other parts of the script.
          - tableInfoDict: the same table names as keys; each value is a 2-item list of
            [alias name, expected number of values per record],
            i.e. {'croptreedetails': ['Crop Tree Details', 48]}.
            The field count lets a reader of the report detect records that were split
            across several lines.
        (False, False) is returned if the metadata table does not exist or if any
        exception is raised while gathering the information.
    """

    try:
        arcpy.SetProgressorLabel("Gathering Metadata Table and Field Information")
        AddMsgAndPrint(".\nGathering Metadata Table and Field Information")

        # Metadata table containing information about the other pedon tables
        theMDTable = pedonDBloc + os.sep + prefix + "MetadataTable"

        if not arcpy.Exists(theMDTable):
            AddMsgAndPrint(".\n\t" + theMDTable + " doesn't Exist",2)
            return False,False

        # Names of the tables present in the database.  A set is used because
        # membership is tested once per metadata row.
        arcpy.env.workspace = pedonDBloc
        tableList = arcpy.ListTables("*")
        # NOTE(review): the pedon table is added by hand, presumably because
        # ListTables does not report it (e.g. it is a feature class) -- confirm.
        tableList.append(prefix + "pedon")
        tablesInDB = set(tableList)

        #nameOfFields = ["TablePhysicalName","TableLabel"]
        nameOfFields = ["tabphynm","tablab"]

        # System-managed fields that are not counted as values of a record
        systemFields = ('objectid','oid','geometry','fid','shape')

        # Initiate 2 Dictionaries
        tableInfoDict = dict()
        emptyPedonGDBtablesDict = dict()

        with arcpy.da.SearchCursor(theMDTable,nameOfFields) as cursor:
            for row in cursor:
                physicalName = prefix + row[0]  # Physical name of table
                aliasName = row[1]              # Alias name of table

                # Skip the metadata tables themselves
                if physicalName.find(prefix + 'Metadata') > -1:
                    continue

                # Skip tables already recorded and tables that the metadata lists
                # but that are not part of this database.
                if physicalName in tableInfoDict or physicalName not in tablesInDB:
                    continue

                # Same separator as used for theMDTable above
                tblPath = pedonDBloc + os.sep + physicalName

                if physicalName == prefix + 'siteaoverlap':
                    # Siteaoverlap table has 9 fields instead of 6 b/c areaiidref is actually
                    # a NASIS client placeholder for areatypename, areasymbol, areaname, areaiidref
                    numOfValidFlds = 9
                else:
                    numOfValidFlds = len([f.name for f in arcpy.ListFields(tblPath)
                                          if f.name.lower() not in systemFields])

                    # Add 2 more fields to the pedon table for X,Y
                    if physicalName == prefix + 'pedon':
                        numOfValidFlds += 2

                tableInfoDict[physicalName] = [aliasName,numOfValidFlds]
                emptyPedonGDBtablesDict[physicalName] = []

        arcpy.SetProgressorLabel('')
        return emptyPedonGDBtablesDict,tableInfoDict

    except Exception:
        # Exception (not a bare except) so Ctrl-C / interpreter exit are not
        # reported as an "unhandled exception" of this function.
        AddMsgAndPrint("Unhandled exception (createReferenceObject)", 2)
        errorMsg()
        return False, False
## ===============================================================================================================
def parsePedonsIntoLists(pedonDict):
    """Group pedon IDs into comma-delimited strings, one string per URL request.

    Rationale (from the original author): URLs have an inherent character limit of
    2,083 and the report URL itself is about 123 characters long, so the list of
    pedon IDs appended to it must stay well below that.  With pedon IDs of about
    6 characters this works out to roughly 265 pedons per request.

    How the grouping works: IDs are accumulated as "id,id,id,".  Before each ID is
    added, the accumulated length (including trailing commas) is compared with the
    threshold of 1866 characters; once it is exceeded, the current ID is added
    without a trailing comma and the string is closed out.  A closed string can
    therefore be longer than the threshold by one ID.  The last ID always closes
    out the string being built.

    Parameters
        pedonDict - collection of pedon IDs; it must support len() and iteration
                    must yield the IDs (for a dictionary these are its keys).

    Returns
        A 2-item tuple (listOfPedonStrings, numOfPedonStrings): the list of
        comma-delimited pedon ID strings and the number of strings in that list.
        The script exits if no string could be produced (i.e. pedonDict is empty)
        or if an unexpected error occurs.
    """

    # Accumulated length that must be exceeded before a string is closed out
    maxStringLength = 1866

    try:
        arcpy.SetProgressorLabel("Determining the number of requests to send the server")

        listOfPedonStrings = list()   # completed comma-delimited pedon ID strings
        currentIDs = []               # IDs of the string currently being built
        currentLength = 0             # length of those IDs incl. one comma each
        totalPedons = len(pedonDict)

        for position, pedonID in enumerate(pedonDict, start=1):
            idText = str(pedonID)
            currentIDs.append(idText)

            # Close out the string on the last pedon or once the length
            # accumulated BEFORE this ID exceeded the threshold.
            if position == totalPedons or currentLength > maxStringLength:
                listOfPedonStrings.append(",".join(currentIDs))
                currentIDs = []
                currentLength = 0
            else:
                currentLength += len(idText) + 1

        numOfPedonStrings = len(listOfPedonStrings)  # Number of unique requests that will be sent

        if not numOfPedonStrings:
            AddMsgAndPrint("\n\t Something Happened here.....WTF!",2)
            exit()

        return listOfPedonStrings,numOfPedonStrings

    except Exception:
        # Exception (not a bare except) so the SystemExit raised by exit() above
        # is not reported a second time as an unhandled exception.
        AddMsgAndPrint("Unhandled exception (parsePedonsIntoLists)", 2)
        errorMsg()
        exit()
## ================================================================================================================
def organizeFutureInstanceIntoPedonDict(futureObject):
# Description
# This function will take in a "future" object representing the execution of the
# ThreadPoolExecutor callable. In this case, the future object represents
# the content of pedon Horizon information for a list of pedon IDs. The content
# will be organized it into a dictionary (pedonDBDict) whose schema follows
# NASIS 7.3 pedon schema.
# Parameters
# future object - Encapsulates the asynchronous execution of a callable.
# Future instances are created by Executor.submit()
# Returns
# True if the data was organized correctly
# False if the object was empty or there was an error.
# To view a sample output report go to:
# https://nasis.sc.egov.usda.gov/NasisReportsWebSite/limsreport.aspx?report_name=WEB_AnalysisPC_MAIN_URL_EXPORT&pedonid_list=14542
try:
theReport = futureObject
# There was an obvious error in opening the URL in the openURL function
if theReport == None:
return None
invalidTable = 0 # represents tables that don't correspond with the GDB
invalidRecord = 0 # represents records that were not added
validRecord = 0
bHeader = False # flag indicating if value is html junk
currentTable = "" # The table found in the report
numOfFields = "" # The number of fields a specific table should contain
partialValue = "" # variable containing part of a value that is not complete
originalValue = "" # variable containing the original incomplete value
bPartialValue = False # flag indicating if value is incomplete; append next record
""" ------------------- Begin Adding data from URL into a dictionary of lists ---------------"""
for theValue in theReport:
# convert from bytes to string and remove white spaces
theValue = theValue.decode('utf-8').strip()
# represents the start of valid table; Typically Line #19
if theValue.find('@begin') > -1:
theTable = prefix + theValue[theValue.find('@') + 7:] ## Isolate the table
numOfFields = tableFldDict[theTable][1]
# Check if the table name exists in the list of dictionaries
# if so, set the currentTable variable and bHeader
if theTable in pedonDBtablesDict:
currentTable = theTable
bHeader = True ## Next line will be the header
else:
AddMsgAndPrint("\t" + theTable + " Does not exist in the FGDB schema! Figure this out Jason Nemecek!",2)
invalidTable += 1
# end of the previous table has been reached; reset currentTable
elif theValue.find('@end') > -1:
currentTable = ""
bHeader = False
# represents header line; skip this line
elif bHeader:
bHeader = False
# this is a valid record that should be collected
elif not bHeader and currentTable:
numOfValues = len(theValue.split('|'))
# Add the record to its designated list within the dictionary
# Do not remove the double quotes b/c doing so converts the object
# to a list which increases its object size. Remove quotes before
# inserting into table
# this should represent the 2nd half of a valid value
if bPartialValue:
partialValue += theValue # append this record to the previous record
# This value completed the previous value
if len(partialValue.split('|')) == numOfFields:
pedonDBtablesDict[currentTable].append(partialValue)
validRecord += 1
bPartialValue = False
partialValue,originalValue = "",""
# appending this value still falls short of number of possible fields
# add another record; this would be the 3rd record appended and may
# exceed number of values.
elif len(partialValue.split('|')) < numOfFields:
arcpy.SetProgressorPosition()
continue
# appending this value exceeded the number of possible fields
else:
AddMsgAndPrint("\t\tIncorrectly formatted Record Found in " + currentTable + " table:",2)
AddMsgAndPrint("\t\t\tRecord should have " + str(numOfFields) + " values but has " + str(len(partialValue.split('|'))),2)
AddMsgAndPrint("\t\t\tOriginal Record: " + originalValue,2)
AddMsgAndPrint("\t\t\tAppended Record: " + partialValue,2)
invalidRecord += 1
bPartialValue = False
partialValue,originalValue = ""
# number of values do not equal the number of fields in the corresponding tables
elif numOfValues != numOfFields:
# number of values exceed the number of fields; Big Error
if numOfValues > numOfFields:
AddMsgAndPrint("\n\t\tIncorrectly formatted Record Found in " + currentTable + " table:",2)
AddMsgAndPrint("\t\t\tRecord should have " + str(numOfFields) + " values but has " + str(numOfValues),2)
AddMsgAndPrint("\t\t\tRecord: " + theValue,2)