Commit 43c043d370486dc097159f5d52a3e2b942d3c8f7

Authored by Christian Herdtweck
1 parent 26a592fb

msodde: unify debug logging of the detected file type

Showing 1 changed file with 12 additions and 10 deletions
oletools/msodde.py
@@ -815,7 +815,6 @@ RTF_START = b'\x7b\x5c\x72\x74' # == b'{\rt' but does not mess up auto-indent @@ -815,7 +815,6 @@ RTF_START = b'\x7b\x5c\x72\x74' # == b'{\rt' but does not mess up auto-indent
815 815
816 816
817 def process_rtf(file_handle, field_filter_mode=None): 817 def process_rtf(file_handle, field_filter_mode=None):
818 - log.debug('process_rtf')  
819 """ find dde links or other fields in rtf file """ 818 """ find dde links or other fields in rtf file """
820 all_fields = [] 819 all_fields = []
821 data = RTF_START + file_handle.read() # read complete file into memory! 820 data = RTF_START + file_handle.read() # read complete file into memory!
@@ -843,30 +842,33 @@ def process_rtf(file_handle, field_filter_mode=None): @@ -843,30 +842,33 @@ def process_rtf(file_handle, field_filter_mode=None):
843 842
844 843
845 def process_file(filepath, field_filter_mode=None): 844 def process_file(filepath, field_filter_mode=None):
846 - """ decides which of process_doc/x or process_xls/x to call """ 845 + """ decides which of the process_* functions to call """
847 if olefile.isOleFile(filepath): 846 if olefile.isOleFile(filepath):
848 - log.debug('checking streams to see whether this is xls') 847 + log.debug('Is OLE. Checking streams to see whether this is xls')
849 if xls_parser.is_xls(filepath): 848 if xls_parser.is_xls(filepath):
  849 + log.debug('Process file as excel 2003 (xls)')
850 return process_xls(filepath) 850 return process_xls(filepath)
851 else: 851 else:
  852 + log.debug('Process file as word 2003 (doc)')
852 return process_doc(filepath) 853 return process_doc(filepath)
853 854
854 with open(filepath, 'rb') as file_handle: 855 with open(filepath, 'rb') as file_handle:
855 if file_handle.read(4) == RTF_START: 856 if file_handle.read(4) == RTF_START:
856 - # This is a RTF file 857 + log.debug('Process file as rtf')
857 return process_rtf(file_handle, field_filter_mode) 858 return process_rtf(file_handle, field_filter_mode)
858 859
859 try: 860 try:
860 doctype = ooxml.get_type(filepath) 861 doctype = ooxml.get_type(filepath)
861 - except Exception:  
862 - log.debug('Exception trying to xml-parse file', exc_info=True) 862 + log.debug('Detected file type: {0}'.format(doctype))
  863 + except Exception as exc:
  864 + log.debug('Exception trying to xml-parse file: {0}'.format(exc))
863 doctype = None 865 doctype = None
864 866
865 - if doctype:  
866 - log.debug('Detected file type: {0}'.format(doctype))  
867 if doctype == ooxml.DOCTYPE_EXCEL: 867 if doctype == ooxml.DOCTYPE_EXCEL:
868 - return process_xlsx(filepath, field_filter_mode)  
869 - else: 868 + log.debug('Process file as excel 2007+ (xlsx)')
  869 + return process_xlsx(filepath)
  870 + else: # could be docx; if not: this is the old default code path
  871 + log.debug('Process file as word 2007+ (docx)')
870 return process_docx(filepath, field_filter_mode) 872 return process_docx(filepath, field_filter_mode)
871 873
872 874