diff --git a/filehunt.py b/filehunt.py index 529525a..56a568a 100644 --- a/filehunt.py +++ b/filehunt.py @@ -6,7 +6,7 @@ # filehunt: general file searching library for use by PANhunt and PassHunt # By BB -import os, sys, zipfile, re, datetime, cStringIO, argparse, time, hashlib, unicodedata, codecs +import os, sys, zipfile, re, datetime, io, argparse, time, hashlib, unicodedata, codecs import colorama import progressbar import pst # MS-PST files @@ -37,10 +37,8 @@ def __init__(self, filename, file_dir): self.type = None self.matches = [] - def __cmp__(self, other): - - return cmp(self.path.lower(), other.path.lower()) - + def __lt__(self, other): + return self.path.lower() < other.path.lower() def set_file_stats(self): @@ -74,7 +72,7 @@ def size_friendly(self): def set_error(self, error_msg): self.errors.append(error_msg) - print colorama.Fore.RED + unicode2ascii(u'ERROR %s on %s' % (error_msg, self.path)) + colorama.Fore.WHITE + sys.stdout.buffer.write(colorama.Fore.RED.encode('ascii','ignore') + unicode2ascii('ERROR %s on %s\n' % (error_msg, self.path)) + colorama.Fore.WHITE.encode('ascii','ignore')) def check_regexs(self, regexs, search_extensions): @@ -94,7 +92,7 @@ def check_regexs(self, regexs, search_extensions): elif self.type == 'TEXT': try: - file_text = read_file(self.path, 'rb') + file_text = read_file(self.path, 'r') self.check_text_regexs(file_text, regexs, '') #except WindowsError: # self.set_error(sys.exc_info()[1]) @@ -145,7 +143,7 @@ def check_pst_regexs(self, regexs, search_extensions, hunt_type, gauge_update_fu if message.Subject: message_path = os.path.join(folder.path, message.Subject) else: - message_path = os.path.join(folder.path, u'[NoSubject]') + message_path = os.path.join(folder.path, '[NoSubject]') if message.Body: self.check_text_regexs(message.Body, regexs, message_path) if message.HasAttachments: @@ -185,7 +183,7 @@ def check_attachment_regexs(self, attachment, regexs, search_extensions, sub_pat if attachment_ext in search_extensions['ZIP']: if attachment.data: try: - memory_zip = cStringIO.StringIO() + memory_zip = io.StringIO() memory_zip.write(attachment.data) zf = zipfile.ZipFile(memory_zip) self.check_zip_regexs(zf, regexs, search_extensions, os.path.join(sub_path, attachment.Filename)) @@ -212,7 +210,7 @@ def check_zip_regexs(self, zf, regexs, search_extensions, sub_path): for file_in_zip in files_in_zip: if get_ext(file_in_zip) in search_extensions['ZIP']: # nested zip file try: - memory_zip = cStringIO.StringIO() + memory_zip = io.StringIO() memory_zip.write(zf.open(file_in_zip).read()) nested_zf = zipfile.ZipFile(memory_zip) self.check_zip_regexs(nested_zf, regexs, search_extensions, os.path.join(sub_path, decode_zip_filename(file_in_zip))) @@ -222,13 +220,13 @@ def check_zip_regexs(self, zf, regexs, search_extensions, sub_path): elif get_ext(file_in_zip) in search_extensions['TEXT']: #normal doc try: file_text = zf.open(file_in_zip).read() - self.check_text_regexs(file_text, regexs, os.path.join(sub_path, decode_zip_filename(file_in_zip))) + self.check_text_regexs(decode_zip_text(file_text), regexs, os.path.join(sub_path, decode_zip_filename(file_in_zip))) except: # RuntimeError: # e.g. zip needs password self.set_error(sys.exc_info()[1]) else: # SPECIAL try: if get_ext(file_in_zip) == '.msg': - memory_msg = cStringIO.StringIO() + memory_msg = io.StringIO() memory_msg.write(zf.open(file_in_zip).read()) msg = msmsg.MSMSG(memory_msg) if msg.validMSG: @@ -253,10 +251,10 @@ def find_all_files_in_directory(AFileClass, root_dir, excluded_directories, sear global TEXT_FILE_SIZE_LIMIT - all_extensions = [ext for ext_list in search_extensions.values() for ext in ext_list] + all_extensions = [ext for ext_list in list(search_extensions.values()) for ext in ext_list] extension_types = {} - for ext_type, ext_list in search_extensions.iteritems(): + for ext_type, ext_list in search_extensions.items(): for ext in ext_list: extension_types[ext] = ext_type @@ -379,9 +377,13 @@ def load_object(fn): def read_file(fn, open_mode="r"): - f = open(fn, open_mode) + try: + with open(fn, open_mode) as f: s = f.read() - f.close() + except: + with open(fn, "rb") as f: + b = f.read() + s = b.decode("utf-8", "ignore") return s @@ -421,13 +423,19 @@ def unicode2ascii(unicode_str): return unicodedata.normalize('NFKD', unicode_str).encode('ascii','ignore') -def decode_zip_filename(str): +def decode_zip_filename(instr): - if type(str) is unicode: - return str + if type(instr) is str: + return instr else: - return str.decode('cp437') + return instr.decode('cp437') +def decode_zip_text(instr): + + if type(instr) is str: + return instr + else: + return instr.decode('utf-8') def get_ext(file_name): diff --git a/msmsg.py b/msmsg.py index 07e5ecb..2c364f3 100644 --- a/msmsg.py +++ b/msmsg.py @@ -61,7 +61,7 @@ def get_stream(self, sector, size): def __repr__(self): - return ', '.join(['%s:%s' % (hex(sector), hex(entry)) for sector, entry in zip(range(len(self.entries)), self.entries)]) + return ', '.join(['%s:%s' % (hex(sector), hex(entry)) for sector, entry in zip(list(range(len(self.entries))), self.entries)]) @@ -102,7 +102,7 @@ def get_stream(self, sector, size): def __repr__(self): - return ', '.join(['%s:%s' % (hex(sector), hex(entry)) for sector, entry in zip(range(len(self.entries)), self.entries)]) + return ', '.join(['%s:%s' % (hex(sector), hex(entry)) for sector, entry in zip(list(range(len(self.entries))), self.entries)]) @@ -133,7 +133,7 @@ def set_entry_children(self, dir_entry): child_ids_queue.append(dir_entry.ChildID) while child_ids_queue: child_entry = self.entries[child_ids_queue.pop()] - if child_entry.Name in dir_entry.childs.keys(): + if child_entry.Name in list(dir_entry.childs.keys()): raise MSGException('Directory Entry Name already in children dictionary') dir_entry.childs[child_entry.Name] = child_entry if child_entry.SiblingID != DirectoryEntry.NOSTREAM: @@ -156,7 +156,7 @@ def get_directory_sector(self, sector): def __repr__(self): - return u', '.join([entry.__repr__() for entry in self.entries]) + return ', '.join([entry.__repr__() for entry in self.entries]) @@ -199,9 +199,8 @@ def __init__(self, mscfb, bytes): self.childs = {} - def __cmp__(self, other): - - return cmp(self.Name, other.Name) + def __lt__(self, other): + return self.Name < other.Name def get_data(self): @@ -222,7 +221,7 @@ def list_children(self, level=0, expand=False): for child_entry in sorted(self.childs.values()): line_sfx = '' if child_entry.ObjectType == DirectoryEntry.OBJECT_STORAGE: - line_sfx = '(%s)' % len(child_entry.childs.keys()) + line_sfx = '(%s)' % len(list(child_entry.childs.keys())) s += '%s %s %s\n' % (line_pfx, child_entry.Name, line_sfx) if expand: s += child_entry.list_children(level+1, expand) @@ -231,7 +230,7 @@ def list_children(self, level=0, expand=False): def __repr__(self): - return u'%s (%s, %s, %s, %s, %s, %s)' % (self.Name, self.ObjectType, hex(self.SiblingID), hex(self.RightSiblingID), hex(self.ChildID), hex(self.StartingSectorLocation), hex(self.StreamSize)) + return '%s (%s, %s, %s, %s, %s, %s)' % (self.Name, self.ObjectType, hex(self.SiblingID), hex(self.RightSiblingID), hex(self.ChildID), hex(self.StartingSectorLocation), hex(self.StreamSize)) @@ -240,7 +239,7 @@ class MSCFB: def __init__(self, cfb_file): """cfb_file is unicode or string filename or a file object""" - if isinstance(cfb_file, str) or isinstance(cfb_file, unicode): + if isinstance(cfb_file, str) or isinstance(cfb_file, str): self.fd = open(cfb_file,'rb') else: self.fd = cfb_file @@ -330,14 +329,14 @@ def __init__(self, msmsg, parent_dir_entry, header_size): property_entries_count = (len(bytes) - header_size) / 16 for i in range(property_entries_count): prop_entry = PropertyEntry(self.msmsg, parent_dir_entry, bytes[header_size + i*16: header_size + i*16 + 16]) - if prop_entry in self.properties.keys(): + if prop_entry in list(self.properties.keys()): raise MSGException('PropertyID already in properties dictionary') self.properties[prop_entry.PropertyID] = prop_entry def getval(self, prop_id): - if prop_id in self.properties.keys(): + if prop_id in list(self.properties.keys()): return self.properties[prop_id].value else: return None @@ -345,7 +344,7 @@ def getval(self, prop_id): def __repr__(self): - return u'\n'.join([prop.__repr__() for prop in self.properties.values()]) + return '\n'.join([prop.__repr__() for prop in list(self.properties.values())]) @@ -389,7 +388,7 @@ def __init__(self, msmsg, parent_dir_entry, bytes): def __repr__(self): - return u'%s=%s' % (hex(self.PropertyTag), self.value.__repr__()) + return '%s=%s' % (hex(self.PropertyTag), self.value.__repr__()) @@ -723,7 +722,7 @@ def set_recipients(self): recipient_dir_index = 0 while True: recipient_dir_name = '__recip_version1.0_#%s' % zeropadhex(recipient_dir_index, 8) - if recipient_dir_name in self.root_dir_entry.childs.keys(): + if recipient_dir_name in list(self.root_dir_entry.childs.keys()): recipient_dir_entry = self.root_dir_entry.childs[recipient_dir_name] rps = PropertyStream(self, recipient_dir_entry, PropertyStream.RECIP_OR_ATTACH_HEADER_SIZE) recipient = Recipient(rps) @@ -739,7 +738,7 @@ def set_attachments(self): attachment_dir_index = 0 while True: attachment_dir_name = '__attach_version1.0_#%s' % zeropadhex(attachment_dir_index, 8) - if attachment_dir_name in self.root_dir_entry.childs.keys(): + if attachment_dir_name in list(self.root_dir_entry.childs.keys()): attachment_dir_entry = self.root_dir_entry.childs[attachment_dir_name] aps = PropertyStream(self, attachment_dir_entry, PropertyStream.RECIP_OR_ATTACH_HEADER_SIZE) attachment = Attachment(aps) @@ -870,7 +869,7 @@ def size_friendly(size): def test_status_msg(msg_file): msg = MSMSG(msg_file) - print msg.cfb.directory + print(msg.cfb.directory) msg.close() @@ -878,19 +877,19 @@ def test_folder_msgs(test_folder): global error_log_list - s = u'' + s = '' for msg_filepath in [os.path.join(test_folder, filename) for filename in os.listdir(test_folder) if os.path.isfile(os.path.join(test_folder, filename)) and os.path.splitext(filename.lower())[1] == '.msg']: #try: - s += u'Opening %s\n' % msg_filepath + s += 'Opening %s\n' % msg_filepath error_log_list = [] msg = MSMSG(msg_filepath) #s += u'MajorVersion: %s, FATSectors: %s, MiniFATSectors: %s, DIFATSectors %s\n' % (msg.cfb.MajorVersion, msg.cfb.FATSectors, msg.cfb.MiniFATSectors, msg.cfb.DIFATSectors) #s += u'MiniStreamSectorLocation: %s, MiniStreamSize: %s\n' % (hex(msg.cfb.MiniStreamSectorLocation), msg.cfb.MiniStreamSize) #s += u'\n' + msg.cfb.directory.entries[0].list_children(level=0, expand=True) #s += u'\n' + msg.prop_stream.__repr__() - s += u'Recipients: %s\n' % u', '.join([recip.__repr__() for recip in msg.recipients]) - s += u'Attachments: %s\n' % u', '.join([attach.__repr__() for attach in msg.attachments]) - s += u'Subject: %s\nBody: %s\n' % (msg.Subject.__repr__(), msg.Body.__repr__()) + s += 'Recipients: %s\n' % ', '.join([recip.__repr__() for recip in msg.recipients]) + s += 'Attachments: %s\n' % ', '.join([attach.__repr__() for attach in msg.attachments]) + s += 'Subject: %s\nBody: %s\n' % (msg.Subject.__repr__(), msg.Body.__repr__()) s += '\n\n\n' # dump attachments: if False: @@ -917,6 +916,6 @@ def test_folder_msgs(test_folder): if __name__=="__main__": - test_folder = u'D:\\' + test_folder = 'D:\\' #test_status_msg(test_folder+'test.msg') #test_folder_msgs(test_folder) \ No newline at end of file diff --git a/panhunt.py b/panhunt.py index 251d5bd..31746a8 100644 --- a/panhunt.py +++ b/panhunt.py @@ -6,9 +6,9 @@ # PANhunt: search directories and sub directories for documents with PANs # By BB -import os, sys, zipfile, re, datetime, cStringIO, argparse, time, hashlib, unicodedata, platform +import os, sys, zipfile, re, datetime, io, argparse, time, hashlib, unicodedata, platform import colorama -import ConfigParser +import configparser import progressbar import filehunt @@ -16,16 +16,16 @@ # defaults defaults = { - 'search_dir': u'C:\\', - 'output_file': u'panhunt_%s.txt' % time.strftime("%Y-%m-%d-%H%M%S"), - 'excluded_directories_string': u'C:\\Windows,C:\\Program Files,C:\\Program Files (x86)', - 'text_extensions_string': u'.doc,.xls,.xml,.txt,.csv,.log', - 'zip_extensions_string': u'.docx,.xlsx,.zip', - 'special_extensions_string': u'.msg', - 'mail_extensions_string': u'.pst', - 'other_extensions_string': u'.ost,.accdb,.mdb', # checks for existence of files that can't be checked automatically + 'search_dir': 'C:\\', + 'output_file': 'panhunt_%s.txt' % time.strftime("%Y-%m-%d-%H%M%S"), + 'excluded_directories_string': 'C:\\Windows,C:\\Program Files,C:\\Program Files (x86)', + 'text_extensions_string': '.doc,.xls,.xml,.txt,.csv,.log', + 'zip_extensions_string': '.docx,.xlsx,.zip', + 'special_extensions_string': '.msg', + 'mail_extensions_string': '.pst', + 'other_extensions_string': '.ost,.accdb,.mdb', # checks for existence of files that can't be checked automatically 'excluded_pans_string': '', - 'config_file': u'panhunt.ini' + 'config_file': 'panhunt.ini' } search_dir = defaults['search_dir'] output_file = defaults['output_file'] @@ -69,7 +69,7 @@ def __init__(self, filename, file_dir): def check_text_regexs(self, text, regexs, sub_path): """Uses regular expressions to check for PANs in text""" - for brand, regex in regexs.items(): + for brand, regex in list(regexs.items()): pans = regex.findall(text) if pans: for pan in pans: @@ -140,11 +140,11 @@ def digits_of(n): def get_text_hash(text): - if type(text) is unicode: + if type(text) is str: encoded_text = text.encode('utf-8') else: encoded_text = text - return hashlib.sha512(encoded_text+'PAN').hexdigest() + return hashlib.sha512(encoded_text+'PAN'.encode('utf-8')).hexdigest() def add_hash_to_file(text_file): @@ -163,10 +163,10 @@ def check_file_hash(text_file): hash_in_file = text_output[hash_pos+len(os.linesep):] hash_check = get_text_hash(text_output[:hash_pos]) if hash_in_file == hash_check: - print colorama.Fore.GREEN + 'Hashes OK' + sys.stdout.buffer.write(colorama.Fore.GREEN.encode('ascii','ignore') + 'Hashes OK\n'.encode('ascii','ignore')) else: - print colorama.Fore.RED + 'Hashes Not OK' - print colorama.Fore.WHITE + hash_in_file +'\n' + hash_check + sys.stdout.buffer.write(colorama.Fore.RED.encode('ascii','ignore') + 'Hashes Not OK\n'.encode('ascii','ignore')) + sys.stdout.buffer.write(colorama.Fore.WHITE.encode('ascii','ignore') + hash_in_file +'\n' + hash_check) def output_report(search_dir, excluded_directories_string, all_files, total_files_searched, pans_found, output_file, mask_pans): @@ -179,21 +179,21 @@ def output_report(search_dir, excluded_directories_string, all_files, total_file pan_report += u'Searched %s files. Found %s possible PANs.\n%s\n\n' % (total_files_searched, pans_found, '='*100) for afile in sorted([afile for afile in all_files if afile.matches]): - pan_header = u'FOUND PANs: %s (%s %s)' % (afile.path, afile.size_friendly(), afile.modified.strftime('%d/%m/%Y')) - print colorama.Fore.RED + filehunt.unicode2ascii(pan_header) + pan_header = 'FOUND PANs: %s (%s %s)' % (afile.path, afile.size_friendly(), afile.modified.strftime('%d/%m/%Y')) + sys.stdout.buffer.write(colorama.Fore.RED.encode('ascii','ignore') + filehunt.unicode2ascii(pan_header) + '\n'.encode('ascii','ignore')) pan_report += pan_header + '\n' - pan_list = u'\t' + pan_sep.join([pan.__repr__(mask_pans) for pan in afile.matches]) - print colorama.Fore.YELLOW + filehunt.unicode2ascii(pan_list) + pan_list = '\t' + pan_sep.join([pan.__repr__(mask_pans) for pan in afile.matches]) + sys.stdout.buffer.write(colorama.Fore.YELLOW.encode('ascii','ignore') + filehunt.unicode2ascii(pan_list) + '\n'.encode('ascii','ignore')) pan_report += pan_list + '\n\n' if len([afile for afile in all_files if afile.type == 'OTHER']) <> 0: pan_report += u'Interesting Files to check separately:\n' for afile in sorted([afile for afile in all_files if afile.type == 'OTHER']): - pan_report += u'%s (%s %s)\n' % (afile.path, afile.size_friendly(), afile.modified.strftime('%d/%m/%Y')) + pan_report += '%s (%s %s)\n' % (afile.path, afile.size_friendly(), afile.modified.strftime('%d/%m/%Y')) pan_report = pan_report.replace('\n', os.linesep) - print colorama.Fore.WHITE + 'Report written to %s' % filehunt.unicode2ascii(output_file) + sys.stdout.buffer.write(colorama.Fore.WHITE.encode('ascii','ignore') + 'Report written to '.encode('ascii','ignore') + filehunt.unicode2ascii(output_file) + '\n'.encode('ascii','ignore')) filehunt.write_unicode_file(output_file, pan_report) add_hash_to_file(output_file) @@ -306,8 +306,8 @@ def hunt_pans(gauge_update_function=None): mail_extensions_string = unicode(args.mailfiles) other_extensions_string = unicode(args.otherfiles) mask_pans = not args.unmask - excluded_pans_string = unicode(args.excludepan) - config_file = unicode(args.config) + excluded_pans_string = str(args.excludepan) + config_file = str(args.config) load_config_file() set_global_parameters() diff --git a/pst.py b/pst.py index bad778b..b3be85a 100644 --- a/pst.py +++ b/pst.py @@ -26,7 +26,7 @@ def is_int(x): to_byte = ord def is_int(x): - return isinstance(x, (int, long)) + return isinstance(x, int) ############################################################################################################################## # _ _ _ ____ _ _ ___ _ ____ ______ _ @@ -284,9 +284,9 @@ class Block: 200, 161, 128, 166, 153, 152, 168, 47, 14, 129, 101, 115, 228, 194, 162, 138, 212, 225, 17, 208, 8, 139, 42, 242, 237, 154, 100, 63, 193, 108, 249, 236) if sys.hexversion >= 0x03000000: - decrypt_table = bytes.maketrans(bytearray(range(256)), bytearray(mpbbCryptFrom512)) + decrypt_table = bytes.maketrans(bytearray(list(range(256))), bytearray(mpbbCryptFrom512)) else: - decrypt_table = string.maketrans(b''.join(map(chr, range(256))), b''.join(map(chr, mpbbCryptFrom512))) + decrypt_table = string.maketrans(b''.join(map(chr, list(range(256)))), b''.join(map(chr, mpbbCryptFrom512))) btypeData = 0 btypeXBLOCK = 1 @@ -439,7 +439,7 @@ def fetch_subnodes(self, bid): block = self.fetch_block(bid) if block.block_type == Block.btypeSLBLOCK: for slentry in block.rgentries: - if slentry.nid in subnodes.keys(): + if slentry.nid in list(subnodes.keys()): raise PSTException('Duplicate subnode %s' % slentry.nid) subnodes[slentry.nid.nid] = slentry elif block.block_type == Block.btypeSIBLOCK: @@ -457,7 +457,7 @@ def get_page_leaf_entries(self, entry_type, page_offset): page = self.fetch_page(page_offset) for entry in page.rgEntries: if isinstance(entry, entry_type): - if entry.key in leaf_entries.keys(): + if entry.key in list(leaf_entries.keys()): raise PSTException('Invalid Leaf Key %s' % entry) leaf_entries[entry.key] = entry elif isinstance(entry, BTENTRY): @@ -633,7 +633,7 @@ def __init__(self, bth_data, hn): self.value = ptype.value(hn.get_hid_data(self.hid)) else: self.subnode_nid = NID(self.dwValueHnid) - if self.subnode_nid.nid in hn.subnodes.keys(): + if self.subnode_nid.nid in list(hn.subnodes.keys()): subnode_nid_bid = hn.subnodes[self.subnode_nid.nid].bidData else: raise PSTException('Invalid NID subnode reference %s' % self.subnode_nid) @@ -920,7 +920,7 @@ def __init__(self, hn): def getval(self, propid): - if propid in self.props.keys(): + if propid in list(self.props.keys()): return self.props[propid].value else: return None @@ -1016,7 +1016,7 @@ def setup_row_matrix(self): if self.hnidRows.is_hid: row_matrix_datas = [self.hn.get_hid_data(self.hnidRows)] # block data list else: - if self.hnidRows.nid in self.hn.subnodes.keys(): + if self.hnidRows.nid in list(self.hn.subnodes.keys()): subnode_nid_bid = self.hn.subnodes[self.hnidRows.nid].bidData else: raise PSTException('Row Matrix HNID not in Subnodes: %s' % self.hnidRows.nid) @@ -1037,7 +1037,7 @@ def setup_row_matrix(self): else: data_bytes = None #row_datas.append(self.get_row_cell_value(data_bytes, tcoldesc)) - if tcoldesc.wPropId in rowvals.keys(): + if tcoldesc.wPropId in list(rowvals.keys()): raise PSTException('Property ID %s already in row data' % hex(tcoldesc.wPropId)) rowvals[tcoldesc.wPropId] = self.get_row_cell_value(data_bytes, tcoldesc) self.RowMatrix[dwRowID] = rowvals #row_datas @@ -1062,7 +1062,7 @@ def get_row_cell_value(self, data_bytes, tcoldesc): return ptype.value(self.hn.get_hid_data(hid)) else: subnode_nid = NID(data_bytes) - if subnode_nid.nid in self.hn.subnodes.keys(): + if subnode_nid.nid in list(self.hn.subnodes.keys()): subnode_nid_bid = self.hn.subnodes[subnode_nid.nid].bidData else: raise PSTException('Row Matrix Value HNID Subnode invalid: %s' % subnode_nid) @@ -1079,7 +1079,7 @@ def getval(self, RowIndex, wPropId): dwRowID = self.get_row_ID(RowIndex) rowvals = self.RowMatrix[dwRowID] - if wPropId in rowvals.keys(): + if wPropId in list(rowvals.keys()): return rowvals[wPropId] else: return None @@ -1089,7 +1089,7 @@ def __repr__(self): s = 'TC Rows: %s, %s\n' % (len(self.RowIndex), self.hn) s += 'Columns: ' + ''.join([' %s' % tcoldesc for tcoldesc in self.rgTCOLDESC]) - s += '\nData:\n' + '\n'.join(['%s: %s' % (hex(dwRowID), rowvals) for dwRowID,rowvals in self.RowMatrix.items()]) + s += '\nData:\n' + '\n'.join(['%s: %s' % (hex(dwRowID), rowvals) for dwRowID,rowvals in list(self.RowMatrix.items())]) return s @@ -1269,7 +1269,7 @@ def __init__(self, nid, ltp, parent_path='', messaging=None): self.submessages = [SubMessage(self.tc_contents.RowIndex[RowIndex].nid, \ self.tc_contents.getval(RowIndex,PropIdEnum.PidTagSentRepresentingNameW), ltp.strip_SubjectPrefix(self.tc_contents.getval(RowIndex,PropIdEnum.PidTagSubjectW)), \ self.tc_contents.getval(RowIndex,PropIdEnum.PidTagClientSubmitTime)) \ - for RowIndex in range(len(self.tc_contents.RowIndex)) if RowIndex in self.tc_contents.RowIndex.keys()] + for RowIndex in range(len(self.tc_contents.RowIndex)) if RowIndex in list(self.tc_contents.RowIndex.keys())] except PSTException as e: log_error(e) @@ -1373,7 +1373,7 @@ def __init__(self, nid, ltp, nbd=None, parent_message=None, messaging=None): self.tc_attachments = None self.tc_recipients = None if self.pc.hn.subnodes: - for subnode in self.pc.hn.subnodes.values(): #SLENTRYs + for subnode in list(self.pc.hn.subnodes.values()): #SLENTRYs if subnode.nid.nidType == NID.NID_TYPE_ATTACHMENT_TABLE: self.tc_attachments = self.ltp.get_tc_by_slentry(subnode) elif subnode.nid.nidType == NID.NID_TYPE_RECIPIENT_TABLE: @@ -1476,7 +1476,7 @@ def set_message_store(self): self.message_store = self.ltp.get_pc_by_nid(NID(NID.NID_MESSAGE_STORE)) self.store_record_key = self.message_store.getval(PropIdEnum.PidTagRecordKey) - if PropIdEnum.PidTagPstPassword in self.message_store.props.keys(): + if PropIdEnum.PidTagPstPassword in list(self.message_store.props.keys()): self.PasswordCRC32Hash = struct.unpack('I', struct.pack('i', self.message_store.getval(PropIdEnum.PidTagPstPassword)))[0] else: self.PasswordCRC32Hash = None @@ -1994,15 +1994,15 @@ def export_all_messages(self, path='', progressbar = None, total_messages = 0): messages_completed = 0 for folder in self.folder_generator(): filepath = get_unused_filename(os.path.join(path, get_safe_filename(folder.path.replace('\\','_'))+'.txt')) - msg_txt = u'' + msg_txt = '' for message in self.message_generator(folder): - msg_txt += u'Subject: %s\nFrom: %s (%s)\n' % (message.Subject, message.SenderName, message.SenderSmtpAddress) - msg_txt += u'To: %s\n' % ('; '.join([u'%s (%s)' % (subrecipient.DisplayName, subrecipient.EmailAddress) for subrecipient in message.subrecipients])) - msg_txt += u'Sent: %s\nDelivered: %s\n' % (message.ClientSubmitTime, message.MessageDeliveryTime) - msg_txt += u'MessageClass: %s\n' % (message.MessageClass) + msg_txt += 'Subject: %s\nFrom: %s (%s)\n' % (message.Subject, message.SenderName, message.SenderSmtpAddress) + msg_txt += 'To: %s\n' % ('; '.join(['%s (%s)' % (subrecipient.DisplayName, subrecipient.EmailAddress) for subrecipient in message.subrecipients])) + msg_txt += 'Sent: %s\nDelivered: %s\n' % (message.ClientSubmitTime, message.MessageDeliveryTime) + msg_txt += 'MessageClass: %s\n' % (message.MessageClass) if message.HasAttachments: - msg_txt += u'Attachments: %s\n' % (u', '.join([subattachment.__repr__() for subattachment in message.subattachments])) - msg_txt += u'\n%s\n\n\n' % message.Body + msg_txt += 'Attachments: %s\n' % (', '.join([subattachment.__repr__() for subattachment in message.subattachments])) + msg_txt += '\n%s\n\n\n' % message.Body if msg_txt: write_file(filepath, unicode2ascii(msg_txt), 'w') messages_completed += 1 @@ -2030,7 +2030,7 @@ def get_total_attachment_count(self): def get_pst_status(self): - status = u'Valid PST: %s, Unicode: %s, CryptMethod: %s, Name: %s, Password: %s' % (self.header.validPST, self.header.is_unicode, self.header.bCryptMethod, self.messaging.message_store.getval(PropIdEnum.PidTagDisplayName), self.messaging.PasswordCRC32Hash) + status = 'Valid PST: %s, Unicode: %s, CryptMethod: %s, Name: %s, Password: %s' % (self.header.validPST, self.header.is_unicode, self.header.bCryptMethod, self.messaging.message_store.getval(PropIdEnum.PidTagDisplayName), self.messaging.PasswordCRC32Hash) return status @@ -2146,9 +2146,9 @@ def log_error(e): def test_status_pst(pst_filepath): pst = PST(pst_filepath) - print(unicode2ascii(pst.get_pst_status())) - print('Total Messages: %s' % pst.get_total_message_count()) - print('Total Attachments: %s' % pst.get_total_attachment_count()) + sys.stdout.buffer.write((unicode2ascii(pst.get_pst_status())) + '\n'.encode('ascii','ignore')) + print(('Total Messages: %s' % pst.get_total_message_count())) + print(('Total Attachments: %s' % pst.get_total_attachment_count())) pst.close() @@ -2163,7 +2163,7 @@ def test_dump_pst(pst_filepath, output_path): """ dump out all PST email attachments and emails (into text files) to output_path folder""" pst = PST(pst_filepath) - print(pst.get_pst_status()) + print((pst.get_pst_status())) pbar = get_simple_progressbar('Messages: ') total_messages = pst.get_total_message_count()