-
Notifications
You must be signed in to change notification settings - Fork 11
/
Copy pathDataUpdateFromLink.py
332 lines (310 loc) · 13.8 KB
/
DataUpdateFromLink.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
#-------------------------------------------------------------
# Name: Data Update from Link
# Purpose: Downloads a zipped file geodatabase from a download link, then updates the data in a
# target geodatabase from the unzipped copy. Two update modes:
# Existing Mode - Only updates datasets that already exist in the target geodatabase under the
# same name. Records are deleted and re-appended, so field names need to be the same.
# New Mode - Copies every dataset from the downloaded geodatabase into the target geodatabase.
# Requires no locks on the target geodatabase.
# Author: Shaun Weston (shaun_weston@eagle.co.nz)
# Date Created: 05/09/2013
# Last Updated: 10/11/2016
# Copyright: (c) Eagle Technology
# ArcGIS Version: ArcMap 10.1+
# Python Version: 2.7
#--------------------------------
# Import main modules
import os
import sys
import logging
import smtplib
# Set global variables
# NOTE: the on/off switches below are the strings "true"/"false", not booleans -
# the rest of the script tests them with == "true".
# Logging
enableLogging = "false" # Use within code - logger.info("Example..."), logger.warning("Example..."), logger.error("Example...")
logFile = "" # e.g. os.path.join(os.path.dirname(__file__), "Example.log")
# Email logging - when sendErrorEmail is "true", errors caught in mainFunction are passed to sendEmail()
sendErrorEmail = "false"
emailServerName = "" # e.g. smtp.gmail.com
emailServerPort = 0 # e.g. 25
emailTo = ""
emailUser = "" # Used as both the SMTP login name and the From address
emailPassword = ""
emailSubject = ""
emailMessage = "" # Text placed in the email body ahead of the error message
# Proxy - when enableProxy is "true", a proxy handler for requestProtocol is installed before mainFunction runs
enableProxy = "false"
requestProtocol = "http" # http or https
proxyURL = ""
# Output
output = None # Placeholder for a result value; None means there is nothing to return
# ArcGIS desktop installed
arcgisDesktop = "true" # "true" imports arcpy and routes printMessage() through it
# If ArcGIS desktop installed
if (arcgisDesktop == "true"):
# Import extra modules
import arcpy
# Enable data to be overwritten
arcpy.env.overwriteOutput = True
# Python version check
if sys.version_info[0] >= 3:
# Python 3.x
import urllib.request as urllib2
else:
# Python 2.x
import urllib2
import zipfile
import glob
# Start of main function
def _downloadFile(downloadLink, targetPath, chunkSize=16 * 1024):
    """Stream the response for downloadLink into targetPath, chunkSize bytes at a time."""
    response = urllib2.urlopen(downloadLink)
    try:
        with open(targetPath, 'wb') as downloadedFile:
            while True:
                chunk = response.read(chunkSize)
                if not chunk:
                    break
                # Write chunk to output file
                downloadedFile.write(chunk)
    finally:
        # The Python 2 urllib2 response is not a context manager, so close it explicitly
        response.close()


def _findNewestGeodatabase(folder):
    """Return the most recently modified *.gdb path directly inside folder."""
    geodatabases = glob.glob(os.path.join(folder, "*.gdb"))
    if not geodatabases:
        # max() on an empty sequence would raise a ValueError with an unhelpful message
        raise ValueError("No file geodatabase (.gdb) found in " + str(folder) + " after extracting the download")
    return max(geodatabases, key=os.path.getmtime)


def _updateDataset(sourceName, outputDataset, updateMode, isTable):
    """Load one feature class or table into outputDataset and report its record count."""
    if (updateMode == "New"):
        # Copy the dataset into the geodatabase using the same dataset name
        if isTable:
            arcpy.TableSelect_analysis(sourceName, outputDataset, "")
        else:
            arcpy.CopyFeatures_management(sourceName, outputDataset, "", "0", "0", "0")
    elif arcpy.Exists(outputDataset):
        # Existing mode - empty the target dataset, then append the downloaded records
        if isTable:
            arcpy.DeleteRows_management(outputDataset)
        else:
            arcpy.DeleteFeatures_management(outputDataset)
        arcpy.Append_management(os.path.join(arcpy.env.workspace, sourceName), outputDataset, "NO_TEST", "", "")
    else:
        # Existing mode never creates datasets - warn and skip the record count
        arcpy.AddWarning("Warning: " + outputDataset + " does not exist and won't be updated")
        if (enableLogging == "true"):
            logger.warning(outputDataset + " does not exist and won't be updated")
        return

    datasetRecordCount = arcpy.GetCount_management(outputDataset)
    countMessage = str(outputDataset) + " record count - " + str(datasetRecordCount) + "..."
    arcpy.AddMessage(countMessage)
    if (enableLogging == "true"):
        logger.info(countMessage)


def _endLogging():
    """Log the end of the process and detach/close the log file handler, if logging is enabled."""
    if (enableLogging == "true"):
        # Log end of process
        logger.info("Process ended.")
        # Remove file handler and close log file
        logMessage.flush()
        logMessage.close()
        logger.handlers = []


def _buildErrorMessage(error):
    """Return the arguments of error joined by spaces, always as a string."""
    if not error.args:
        # Always hand back text - the message is later concatenated into the email body
        return str(error)
    if sys.version_info[0] >= 3:
        # Python 3.x
        parts = [str(argument) for argument in error.args]
    else:
        # Python 2.x
        parts = [unicode(argument).encode('utf-8') for argument in error.args]
    return " ".join(parts)


def _reportError(errorMessage):
    """Show errorMessage, log it, close the log and send the error email if enabled."""
    printMessage(errorMessage,"error")
    if (enableLogging == "true"):
        logger.error(errorMessage)
    _endLogging()
    if (sendErrorEmail == "true"):
        # Send email
        sendEmail(errorMessage)


def mainFunction(downloadLink,updateMode,geodatabase,featureDataset): # Parameters are passed in this order by the ArcGIS Desktop tool
    """Download a zipped file geodatabase and load its datasets into geodatabase.

    downloadLink   - URL of the zip file. If it contains ".gdb" the zip is saved
                     as Data.gdb.zip and extracted into a Data.gdb folder in the
                     scratch folder; otherwise it is extracted straight into the
                     scratch folder.
    updateMode     - "New" copies every downloaded dataset into geodatabase.
                     Any other value deletes and appends records, and only for
                     datasets that already exist there.
    geodatabase    - Path of the geodatabase to update.
    featureDataset - Optional feature dataset name inside geodatabase that the
                     feature classes are written to (tables always go to the
                     geodatabase root).

    Returns the module-level ``output`` value when it is set and the script is
    not running as an ArcGIS Desktop tool (in that case it is set as tool
    parameter 1 instead); otherwise returns None. Errors are not raised to the
    caller: they are shown with printMessage, logged and optionally emailed.
    """
    try:
        # --------------------------------------- Start of code --------------------------------------- #
        scratchFolder = arcpy.env.scratchFolder
        isGeodatabaseZip = ".gdb" in downloadLink

        # Download the file from the link. The file handle is kept local to the
        # helper so that it cannot shadow the module-level "output" result variable
        datasetFileName = "Data.gdb.zip" if isGeodatabaseZip else "Data.zip"
        zipPath = os.path.join(scratchFolder, datasetFileName)
        _downloadFile(downloadLink, zipPath)

        # Unzip the file to the scratch folder
        arcpy.AddMessage("Extracting zip file...")
        unzipFolder = os.path.join(scratchFolder, "Data.gdb") if isGeodatabaseZip else scratchFolder
        with zipfile.ZipFile(zipPath, mode="r") as archive:
            archive.extractall(unzipFolder)

        # Use the newest unzipped database in the scratch folder as the workspace
        arcpy.env.workspace = _findNewestGeodatabase(scratchFolder)
        # "or []" guards against arcpy handing back None instead of an empty list
        featureclassList = arcpy.ListFeatureClasses() or []
        tableList = arcpy.ListTables() or []

        arcpy.AddMessage("Copying datasets...")
        # If feature dataset provided, feature classes are written inside it
        if featureDataset:
            featureclassTarget = os.path.join(geodatabase, featureDataset)
        else:
            featureclassTarget = geodatabase
        for eachFeatureclass in featureclassList:
            datasetName = arcpy.Describe(eachFeatureclass).name
            _updateDataset(eachFeatureclass, os.path.join(featureclassTarget, datasetName), updateMode, False)

        for eachTable in tableList:
            datasetName = arcpy.Describe(eachTable).name
            _updateDataset(eachTable, os.path.join(geodatabase, datasetName), updateMode, True)
        # --------------------------------------- End of code --------------------------------------- #

        # Work out what to hand back before closing the log, so the log is
        # always closed even when there is a value to return
        returnValue = None
        if output:
            if (__name__ == '__main__') and (arcgisDesktop == "true"):
                # Called from gp tool - return the output as an arcpy parameter
                arcpy.SetParameterAsText(1, output)
            else:
                returnValue = output
        _endLogging()
        return returnValue
    # If arcpy error
    except arcpy.ExecuteError:
        _reportError(arcpy.GetMessages(2))
    # If python error
    except Exception as e:
        _reportError(_buildErrorMessage(e))
# End of main function
# Start of print message function
def printMessage(message,type):
    """Show message through arcpy when ArcGIS Desktop is in use, otherwise print it.

    type selects the arcpy severity, case-insensitively: "warning" or "error";
    any other value is shown as a plain message.
    """
    # ArcGIS desktop not installed - plain console output
    if (arcgisDesktop != "true"):
        print(message)
        return

    # ArcGIS desktop installed - pick the arcpy call that matches the severity
    severity = type.lower()
    arcpyCalls = {
        "warning": arcpy.AddWarning,
        "error": arcpy.AddError,
    }
    showMessage = arcpyCalls.get(severity, arcpy.AddMessage)
    showMessage(message)
# End of print message function
# Start of set logging function
def setLogging(logFile):
    """Create a DEBUG-level logger named after this script that writes to logFile.

    Returns a (logger, file handler) tuple; the handler is returned so the
    caller can flush and close the log file when finished.
    """
    # Logger is named after the script file
    scriptName = os.path.basename(__file__)
    scriptLogger = logging.getLogger(scriptName)
    scriptLogger.setLevel(logging.DEBUG)

    # File handler writing lines such as "31/12/2016 - 23:59:59: INFO - message"
    fileHandler = logging.FileHandler(logFile)
    fileHandler.setFormatter(
        logging.Formatter("%(asctime)s: %(levelname)s - %(message)s", "%d/%m/%Y - %H:%M:%S")
    )
    scriptLogger.addHandler(fileHandler)

    return scriptLogger, fileHandler
# End of set logging function
# Start of send email function
def sendEmail(message):
    """Email message to emailTo through the configured SMTP server using STARTTLS.

    The body is the module-level emailMessage followed by message. message may
    be any object; it is converted to text before being added to the body.
    Raises smtplib.SMTPException (or a socket error) if connecting, logging in
    or sending fails.
    """
    # Send an email - reported through printMessage so this also works without arcpy
    printMessage("Sending email...","info")
    # Server and port information
    smtpServer = smtplib.SMTP(emailServerName,emailServerPort)
    try:
        smtpServer.ehlo()
        smtpServer.starttls()
        # Identify again over the now-encrypted connection
        smtpServer.ehlo()
        # Login with sender email address and password
        smtpServer.login(emailUser, emailPassword)
        # Email content
        header = 'To:' + emailTo + '\n' + 'From: ' + emailUser + '\n' + 'Subject:' + emailSubject + '\n'
        # "%s" formatting accepts exception objects as well as str/unicode text
        body = header + '\n' + emailMessage + '\n' + '\n' + ("%s" % (message,))
        # Send the email
        smtpServer.sendmail(emailUser, emailTo, body)
    finally:
        # Always close the connection; a server that has already hung up must
        # not hide the error that got us here
        try:
            smtpServer.quit()
        except smtplib.SMTPServerDisconnected:
            pass
# End of send email function
# Entry point: lets the script run stand-alone from the command prompt or a
# Python IDE, or as a geoprocessing script tool, while staying importable
# as a module from another script
if __name__ == '__main__':
    # Collect the arguments that are handed on to mainFunction
    if (arcgisDesktop == "true"):
        # ArcGIS desktop installed - read every tool parameter as text
        parameterCount = arcpy.GetArgumentCount()
        argv = tuple([arcpy.GetParameterAsText(index) for index in range(parameterCount)])
    else:
        # ArcGIS desktop not installed - use the command line, minus the script path
        argv = sys.argv
        argv.pop(0)

    # Logging
    if (enableLogging == "true"):
        # logger and logMessage are module-level names that mainFunction uses
        loggingSetup = setLogging(logFile)
        logger = loggingSetup[0]
        logMessage = loggingSetup[1]
        # Log start of process
        logger.info("Process started.")

    # Setup the use of a proxy for requests
    if (enableProxy == "true"):
        proxySettings = {requestProtocol : proxyURL}
        proxy = urllib2.ProxyHandler(proxySettings)
        openURL = urllib2.build_opener(proxy)
        # Install the proxy for all following urlopen calls
        urllib2.install_opener(openURL)

    mainFunction(*argv)