-
Notifications
You must be signed in to change notification settings - Fork 11
/
DomainsRemoveDuplicates.py
366 lines (317 loc) · 18.5 KB
/
DomainsRemoveDuplicates.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
#-------------------------------------------------------------
# Name: Remove Duplicate Domains
# Purpose: Gets a list of used domains in the database then removes those not being used. Also looks at configuration
# file to find duplicate domains, then re-assigns a domain and removes the unused duplicate domain.
# Author: Shaun Weston ([email protected])
# Date Created: 14/04/2014
# Last Updated: 04/06/2014
# Copyright: (c) Eagle Technology
# ArcGIS Version: 10.1/10.2
# Python Version: 2.7
#--------------------------------
# Import modules
import os
import sys
import logging
import smtplib
import arcpy
import csv
# Let geoprocessing tools overwrite existing outputs
arcpy.env.overwriteOutput = True

# Script-wide settings (string flags: "true" switches a feature on)
output = None

# Logging - once enabled use logger.info("Example..."), logger.warning("Example..."), logger.error("Example...")
enableLogging = "false"
logFile = os.path.join(
    os.path.dirname(__file__),
    r"Logs\DomainsRemoveDuplicates.log",
) # os.path.join(os.path.dirname(__file__), "Example.log")

# Error email - these values are read by sendEmail() when sendErrorEmail is "true"
sendErrorEmail = "false"
emailTo = ""
emailUser = ""
emailPassword = ""
emailSubject = ""
emailMessage = ""
# Start of main function
def mainFunction(geodatabase,configFile): # Get parameters from ArcGIS Desktop tool by separating by comma e.g. (var1 is 1st parameter,var2 is 2nd parameter,var3 is 3rd parameter)
    """Delete every domain in the geodatabase that no field is using.

    The domains in use are gathered with getDomains() for feature datasets,
    feature classes, mosaic datasets and tables (getDomains also re-points
    duplicate domains listed in the configuration file). Any geodatabase
    domain that is not in that set is then deleted.

    Parameters:
        geodatabase - workspace path; also set as arcpy.env.workspace.
        configFile  - CSV of original/duplicate domain pairs, passed straight
                      through to getDomains(); may be empty.

    Returns:
        The module-level ``output`` value when it is set and the module was
        imported rather than run as a script; otherwise None.

    arcpy and Python errors are reported with arcpy.AddError (and logged /
    emailed when those options are enabled) rather than re-raised.
    """
    # Bound before the try so the error handlers and the clean-up can test
    # them even when setting up logging is what failed
    logger = None
    logMessage = None
    try:
        # Logging
        if (enableLogging == "true"):
            # Setup logging
            logger, logMessage = setLogging(logFile)
            # Log start of process
            logger.info("Process started.")

        # --------------------------------------- Start of code --------------------------------------- #
        # Get a list of assigned domains
        assignedDomains = []
        arcpy.env.workspace = geodatabase

        # Feature datasets ("or []" because arcpy list functions can return None)
        featureDatasetList = arcpy.ListDatasets("", "Feature") or []
        assignedDomains += getDomains(geodatabase,featureDatasetList,configFile,"Feature Dataset")

        # Feature classes at the root of the database
        featureClassList = arcpy.ListFeatureClasses() or []
        assignedDomains += getDomains(geodatabase,featureClassList,configFile,"Feature Class")

        # Mosaic datasets
        mosaicList = arcpy.ListDatasets("", "Mosaic") or []
        assignedDomains += getDomains(geodatabase,mosaicList,configFile,"Mosaic")

        # Tables - the table list must be passed here; passing the feature
        # class list again would leave table domains looking unused
        tableList = arcpy.ListTables() or []
        assignedDomains += getDomains(geodatabase,tableList,configFile,"Table")

        # A set makes the "is this domain used?" check a single lookup
        usedDomains = set(assignedDomains)

        # For each of the domains on the geodatabase
        for domain in arcpy.da.ListDomains(geodatabase):
            # Keep domains that are being used
            if domain.name in usedDomains:
                continue
            # Don't remove domains on wcc_encroachments feature class (Wellington City Council) as there are subtypes and it's causing issues in this script
            if ("Encroach" in domain.name):
                continue
            # Remove the domain from the geodatabase
            removalMessage = "Removing domain " + domain.name + " as not being used..."
            arcpy.AddMessage(removalMessage)
            if logger is not None:
                logger.info(removalMessage)
            arcpy.DeleteDomain_management(geodatabase, domain.name)
        # --------------------------------------- End of code --------------------------------------- #

        # Log end of process (before any return so it is never skipped)
        if logger is not None:
            logger.info("Process ended.")

        # If called from gp tool return the arcpy parameter
        if __name__ == '__main__':
            # Return the output if there is any
            if output:
                arcpy.SetParameterAsText(1, output)
        # Otherwise return the result
        elif output:
            return output
    # If arcpy error
    except arcpy.ExecuteError:
        # Build and show the error message
        errorMessage = arcpy.GetMessages(2)
        arcpy.AddError(errorMessage)
        # Log error
        if logger is not None:
            logger.error(errorMessage)
        if (sendErrorEmail == "true"):
            # Send email
            sendEmail(errorMessage)
    # If python error
    except Exception as e:
        # Build and show the error message from all the exception arguments
        errorMessage = " ".join([str(arg) for arg in e.args])
        arcpy.AddError(errorMessage)
        # Log error
        if logger is not None:
            logger.error(errorMessage)
        if (sendErrorEmail == "true"):
            # Send email
            sendEmail(errorMessage)
    finally:
        # Remove file handler and close log file on every exit path
        if logMessage is not None:
            logMessage.close()
            logger.removeHandler(logMessage)
# End of main function
# Read the duplicate domain configuration into a dictionary
def _loadDuplicateDomains(configFile):
    """Return {duplicateDomain: originalDomain} read from the configuration CSV.

    The first line is treated as a header. Column 1 is the original domain
    and column 2 the duplicate. Rows missing either value are skipped. When
    the same duplicate appears more than once the last row wins. An empty
    configFile gives an empty dictionary.
    """
    duplicateDomains = {}
    if not configFile:
        return duplicateDomains
    # The csv module wants a binary file on Python 2 and a text file opened
    # with newline="" on Python 3
    if sys.version_info[0] < 3:
        csvFile = open(configFile, 'rb')
    else:
        csvFile = open(configFile, 'r', newline='')
    with csvFile:
        rows = csv.reader(csvFile, delimiter=",")
        for count, row in enumerate(rows):
            # Ignore the first line containing headers
            if count == 0:
                continue
            # Ignore blank or incomplete rows rather than failing on them
            if len(row) < 2 or not row[0] or not row[1]:
                continue
            duplicateDomains[row[1]] = row[0]
    return duplicateDomains


# Names containing _H, VW or vw are left out of the domain search
def _isExcludedDataset(name):
    """Return True when the name contains "_H", "VW" or "vw"."""
    return ("_H" in name) or ("VW" in name) or ("vw" in name)


# Point a field (and each of its subtypes) at a different domain
def _reassignDomain(datasetPath, datasetName, fieldName, originalDomain):
    """Assign originalDomain to fieldName on datasetPath.

    datasetName is the name used to look up subtypes. When the dataset has
    subtypes the existing domain is removed and the new one assigned for
    every subtype code before the assignment without a subtype is made.
    """
    # Check for subtypes on the dataset
    defaultSubtype = arcpy.Describe(datasetName).defaultSubtypeCode
    if (defaultSubtype != -1):
        # Subtypes must be listed for the same dataset that was described
        for subtypeCode in arcpy.da.ListSubtypes(datasetName):
            # Remove existing domain
            arcpy.RemoveDomainFromField_management(datasetPath, fieldName, subtypeCode)
            # Re-assign domain to other domain for subtype
            arcpy.AssignDomainToField_management(datasetPath, fieldName, originalDomain, subtypeCode)
    # Re-assign domain to other domain
    arcpy.AssignDomainToField_management(datasetPath, fieldName, originalDomain, "")


# List the domains on one dataset, reassigning any duplicates on the way
def _collectFieldDomains(fieldSource, datasetName, datasetPath, duplicateDomains, logger):
    """Return the domain of every field on a dataset that has one.

    fieldSource is what is passed to arcpy.ListFields, datasetName is used in
    messages and for the subtype lookup, datasetPath is the path the domain
    tools are run against. A field whose domain is a key of duplicateDomains
    is reassigned and reported under the domain it now uses.
    """
    domains = []
    for field in (arcpy.ListFields(fieldSource) or []):
        # Check if field has domain
        if not field.domain:
            continue
        domain = field.domain
        originalDomain = duplicateDomains.get(domain)
        # If duplicate domain is in config file
        if originalDomain is not None:
            message = "Reassigning domain on feature class " + datasetName + " from " + domain + " to " + originalDomain + " as it is duplicated..."
            arcpy.AddMessage(message)
            # Logging
            if logger is not None:
                logger.info(message)
            _reassignDomain(datasetPath, datasetName, field.name, originalDomain)
            # The field now uses the original domain, so that is the one in use
            domain = originalDomain
        # Add the domain to the list
        domains.append(domain)
    return domains


# Get a list of domains used in the database and reassigns duplicates
def getDomains(geodatabase,datasetList,configFile,dataType):
    """Return the domains assigned to fields of the given datasets.

    Parameters:
        geodatabase - workspace path the datasets live in.
        datasetList - dataset names to inspect; None is treated as empty.
        configFile  - optional CSV of original/duplicate domain pairs. A
                      field using a listed duplicate is reassigned to the
                      original domain.
        dataType    - "Feature Dataset" makes each entry be searched for the
                      feature classes inside it; any other value treats the
                      entry itself as the dataset holding the fields.

    Returns:
        A list with one entry per field that has a domain (so a domain can
        appear more than once).
    """
    # Logging - use the handler already on the logger when there is one and
    # only create (and later remove) a handler when there is none, so that
    # repeated calls do not pile up handlers and duplicate every message
    logger = None
    ownHandler = None
    if (enableLogging == "true"):
        logger = logging.getLogger(os.path.basename(__file__))
        if not logger.handlers:
            logger, ownHandler = setLogging(logFile)

    try:
        # Read the configuration once rather than once per field
        duplicateDomains = _loadDuplicateDomains(configFile)
        assignedDomains = []

        # Loop through the datasets
        for dataset in (datasetList or []):
            # Change dataset name to be just name (remove user and schema if SDE database)
            datasetName = dataset.split('.')[-1]

            # If feature datasets
            if (dataType == "Feature Dataset"):
                # Get a list of the feature classes in the feature dataset
                featureClassList = arcpy.ListFeatureClasses("","",dataset) or []
                for featureClass in featureClassList:
                    # Change feature class name to be just name (remove user and schema if SDE database)
                    featureClassName = featureClass.split('.')[-1]
                    # Don't include _H or VW
                    if _isExcludedDataset(featureClassName):
                        continue
                    # Setup the path to the feature class inside the feature dataset
                    sourceDatasetPath = os.path.join(geodatabase + "\\" + datasetName, featureClassName)
                    assignedDomains += _collectFieldDomains(featureClassName, featureClassName, sourceDatasetPath, duplicateDomains, logger)
            # If feature classes/tables/mosaics
            else:
                # Don't include _H or VW
                if _isExcludedDataset(datasetName):
                    continue
                # The path and the field listing use the full dataset name
                sourceDatasetPath = os.path.join(geodatabase, dataset)
                assignedDomains += _collectFieldDomains(dataset, datasetName, sourceDatasetPath, duplicateDomains, logger)

        # Return a list of assigned domains
        return assignedDomains
    finally:
        # Only tidy up a handler this call created
        if ownHandler is not None:
            ownHandler.close()
            logger.removeHandler(ownHandler)
# Start of set logging function
def setLogging(logFile):
    """Return (logger, fileHandler) for writing to logFile.

    The logger is named after this script file and set to DEBUG. If the
    logger already has a file handler writing to logFile that handler is
    returned instead of adding another, so calling this more than once does
    not write every message several times. The folder for logFile is created
    when it does not exist.
    """
    # Create a logger
    logger = logging.getLogger(os.path.basename(__file__))
    logger.setLevel(logging.DEBUG)

    # FileHandler stores the absolute path of its file in baseFilename
    logPath = os.path.abspath(logFile)
    for existingHandler in logger.handlers:
        if isinstance(existingHandler, logging.FileHandler) and existingHandler.baseFilename == logPath:
            return logger, existingHandler

    # Make sure the log folder is there before the file is opened
    logFolder = os.path.dirname(logPath)
    if not os.path.isdir(logFolder):
        os.makedirs(logFolder)

    # Setup log message handler
    logMessage = logging.FileHandler(logFile)
    # Setup the log formatting
    logFormat = logging.Formatter("%(asctime)s: %(levelname)s - %(message)s", "%d/%m/%Y - %H:%M:%S")
    # Add formatter to log message handler
    logMessage.setFormatter(logFormat)
    # Add log message handler to logger
    logger.addHandler(logMessage)
    return logger, logMessage
# End of set logging function
# Start of send email function
def sendEmail(message):
    """Email message through smtp.gmail.com using the module email settings.

    The body is the module-level emailMessage followed by message. The
    sender and login name are emailUser, the recipient is emailTo and the
    subject is emailSubject. The connection is closed whether or not the
    send succeeds; any SMTP error from connecting, logging in or sending is
    left to propagate to the caller.
    """
    # Send an email
    arcpy.AddMessage("Sending email...")
    # Server and port information
    smtpServer = smtplib.SMTP("smtp.gmail.com",587)
    try:
        smtpServer.ehlo()
        smtpServer.starttls()
        # Identify again now the connection is encrypted
        smtpServer.ehlo()
        # Login with sender email address and password
        smtpServer.login(emailUser, emailPassword)
        # Email content
        header = 'To:' + emailTo + '\n' + 'From: ' + emailUser + '\n' + 'Subject:' + emailSubject + '\n'
        body = header + '\n' + emailMessage + '\n' + '\n' + message
        # Send the email
        smtpServer.sendmail(emailUser, emailTo, body)
    finally:
        # Close the connection; if the server has already gone away just
        # drop the socket so the original error is not hidden
        try:
            smtpServer.quit()
        except smtplib.SMTPException:
            smtpServer.close()
# End of send email function
# Entry point guard: the main function only runs when this file is executed
# directly (command prompt, Python IDE or geoprocessing script tool) and not
# when it is imported as a module by another script
if __name__ == '__main__':
    # Read every tool/command line parameter as text, in order, and hand
    # them to the main function as positional arguments
    argv = tuple(map(arcpy.GetParameterAsText, range(arcpy.GetArgumentCount())))
    mainFunction(*argv)