# -*- coding: Latin-1 -*- # # Linux OOM Analyser # # Copyright (c) 2017-2021 Carsten Grohmann # License: MIT - THIS PROGRAM COMES WITH NO WARRANTY import re DEBUG = False """Show additional information during the development cycle""" VERSION = "0.5.0 (devel)" """Version number""" # __pragma__ ('skip') # MOC objects to satisfy statical checker and imports in unit tests js_undefined = 0 class classList(): def add(self, *args, **kwargs): pass def remove(self, *args, **kwargs): pass class document(): def querySelectorAll(self, *args, **kwargs): return [element()] def getElementById(self, *arg, **kwargs): return element() def createElementNS(self, *arg, **kwargs): return element() def createElement(self, *args, **kwargs): return element() class element(): firstChild = [] classList = classList() offsetWidth = 0 def removeChild(self, *args, **kwargs): return def appendChild(self, *args, **kwargs): return # __pragma__ ('noskip') class OOMEntityState: """Enum for completeness of the OOM block""" unknown = 0 empty = 1 invalid = 2 started = 3 complete = 4 class OOMEntityType: """Enum for the type of the OOM""" unknown = 0 automatic = 1 manual = 2 def is_visible(element): return element.offsetWidth > 0 and element.offsetHeight > 0 def hide_element(element_id): """Hide the given HTML element""" element = document.getElementById(element_id) element.classList.add('js-text--display-none') def show_element(element_id): """Show the given HTML element""" element = document.getElementById(element_id) element.classList.remove('js-text--display-none') def hide_elements(selector): """Hide all matching elements by adding class js-text--display-none""" for element in document.querySelectorAll(selector): element.classList.add('js-text--display-none') def show_elements(selector): """Show all matching elements by removing class js-text--display-none""" for element in document.querySelectorAll(selector): element.classList.remove('js-text--display-none') def toggle(element_id): """Toggle the visibility of the given HTML element""" element = document.getElementById(element_id) element.classList.toggle('js-text--display-none') def escape_html(unsafe): """ Escape unsafe HTML entities @type unsafe: str @rtype: str """ return unsafe.replace('&', "&")\ .replace('<', "<")\ .replace('>', ">")\ .replace('"', """)\ .replace("'", "'") def error(msg): """Show the error box and add the error message""" show_notifybox('ERROR', msg) def internal_error(msg): """Show the error box and add the internal error message""" show_notifybox('INTERNAL ERROR', msg) def warning(msg): """Show the error box and add the warning message""" show_notifybox('WARNING', msg) def show_notifybox(prefix, msg): """Show escaped message in the notification box""" if prefix == 'WARNING': css_class = 'js-notify_box__msg--warning' else: css_class = 'js-notify_box__msg--error' show_element('notify_box') notify_box = document.getElementById('notify_box') notification = document.createElement('div') notification.classList.add(css_class) notification.innerHTML = '{}: {}
'.format(prefix, escape_html(msg)) notify_box.appendChild(notification) class BaseKernelConfig: """Base class for all kernel specific configuration""" name = 'Base configuration for all kernels' """Name/description of this kernel configuration""" EXTRACT_PATTERN = None """ Instance specific dictionary of RE pattern to analyse a OOM block for a specific kernel version This dict will be filled from EXTRACT_PATTERN_BASE and EXTRACT_PATTERN_OVERLAY during class constructor is executed. :type: None|Dict :see: EXTRACT_PATTERN_BASE and EXTRACT_PATTERN_OVERLAY """ EXTRACT_PATTERN_BASE = { 'invoked oom-killer': ( r'^(?P[\S ]+) invoked oom-killer: ' r'gfp_mask=(?P0x[a-z0-9]+)(\((?P[A-Z_|]+)\))?, ' r'(nodemask=(?P([\d,-]+|\(null\))), )?' r'order=(?P-?\d+), ' r'oom_score_adj=(?P\d+)', True, ), 'Trigger process and kernel version': ( r'^CPU: \d+ PID: (?P\d+) ' r'Comm: .* (Not tainted|Tainted:.*) ' r'(?P\d[\w.-]+) #\d', True, ), # split caused by a limited number of iterations during converting PY regex into JS regex 'Mem-Info (part 1)': ( r'^Mem-Info:.*' r'(?:\n)' # first line (starting w/o a space) r'^active_anon:(?P\d+) inactive_anon:(?P\d+) ' r'isolated_anon:(?P\d+)' r'(?:\n)' # remaining lines (w/ leading space) r'^ active_file:(?P\d+) inactive_file:(?P\d+) ' r'isolated_file:(?P\d+)' r'(?:\n)' r'^ unevictable:(?P\d+) dirty:(?P\d+) writeback:(?P\d+) ' r'unstable:(?P\d+)', True, ), 'Mem-Info (part 2)': ( r'^ slab_reclaimable:(?P\d+) slab_unreclaimable:(?P\d+)' r'(?:\n)' r'^ mapped:(?P\d+) shmem:(?P\d+) pagetables:(?P\d+) ' r'bounce:(?P\d+)' r'(?:\n)' r'^ free:(?P\d+) free_pcp:(?P\d+) free_cma:(?P\d+)', True, ), 'Memory node information': ( r'(^Node \d+ (DMA|Normal|hugepages).*(:?\n))+', False, ), 'Page cache': ( r'^(?P\d+) total pagecache pages.*$', True, ), 'Swap usage information': ( r'^(?P\d+) pages in swap cache' r'(?:\n)' r'^Swap cache stats: add \d+, delete \d+, find \d+\/\d+' r'(?:\n)' r'^Free swap = (?P\d+)kB' r'(?:\n)' r'^Total swap = (?P\d+)kB', False, ), 'Page information': ( r'^(?P\d+) pages RAM' r'(' r'(?:\n)' r'^(?P\d+) pages HighMem/MovableOnly' r')?' r'(?:\n)' r'^(?P\d+) pages reserved' r'(' r'(?:\n)' r'^(?P\d+) pages cma reserved' r')?' r'(' r'(?:\n)' r'^(?P\d+) pages in pagetable cache' r')?' r'(' r'(?:\n)' r'^(?P\d+) pages hwpoisoned' r')?', True, ), 'Process killed by OOM': ( r'^Out of memory: Kill process (?P\d+) \((?P[\S ]+)\) ' r'score (?P\d+) or sacrifice child', True, ), 'Details of process killed by OOM': ( r'^Killed process \d+ \(.*\)' r'(, UID \d+,)?' r' total-vm:(?P\d+)kB, anon-rss:(?P\d+)kB, ' r'file-rss:(?P\d+)kB, shmem-rss:(?P\d+)kB.*', True, ), } """ RE pattern to extract information from OOM. The first item is the RE pattern and the second is whether it is mandatory to find this pattern. This dictionary will be copied to EXTRACT_PATTERN during class constructor is executed. :type: dict(tuple(str, bool)) :see: EXTRACT_PATTERN """ EXTRACT_PATTERN_OVERLAY = {} """ To extend / overwrite parts of EXTRACT_PATTERN in kernel configuration. :type: dict(tuple(str, bool)) :see: EXTRACT_PATTERN """ GFP_FLAGS = { 'GFP_ATOMIC': {'value': '__GFP_HIGH | __GFP_ATOMIC | __GFP_KSWAPD_RECLAIM'}, 'GFP_KERNEL': {'value': '__GFP_RECLAIM | __GFP_IO | __GFP_FS'}, 'GFP_KERNEL_ACCOUNT': {'value': 'GFP_KERNEL | __GFP_ACCOUNT'}, 'GFP_NOWAIT': {'value': '__GFP_KSWAPD_RECLAIM'}, 'GFP_NOIO': {'value': '__GFP_RECLAIM'}, 'GFP_NOFS': {'value': '__GFP_RECLAIM | __GFP_IO'}, 'GFP_USER': {'value': '__GFP_RECLAIM | __GFP_IO | __GFP_FS | __GFP_HARDWALL'}, 'GFP_DMA': {'value': '__GFP_DMA'}, 'GFP_DMA32': {'value': '__GFP_DMA32'}, 'GFP_HIGHUSER': {'value': 'GFP_USER | __GFP_HIGHMEM'}, 'GFP_HIGHUSER_MOVABLE': {'value': 'GFP_HIGHUSER | __GFP_MOVABLE'}, 'GFP_TRANSHUGE_LIGHT': {'value': 'GFP_HIGHUSER_MOVABLE | __GFP_COMP | __GFP_NOMEMALLOC | __GFP_NOWARN & ~__GFP_RECLAIM'}, 'GFP_TRANSHUGE': {'value': 'GFP_TRANSHUGE_LIGHT | __GFP_DIRECT_RECLAIM'}, '__GFP_DMA': {'value': 0x01}, '__GFP_HIGHMEM': {'value': 0x02}, '__GFP_DMA32': {'value': 0x04}, '__GFP_MOVABLE': {'value': 0x08}, '__GFP_RECLAIMABLE': {'value': 0x10}, '__GFP_HIGH': {'value': 0x20}, '__GFP_IO': {'value': 0x40}, '__GFP_FS': {'value': 0x80}, '__GFP_COLD': {'value': 0x100}, '__GFP_NOWARN': {'value': 0x200}, '__GFP_RETRY_MAYFAIL': {'value': 0x400}, '__GFP_NOFAIL': {'value': 0x800}, '__GFP_NORETRY': {'value': 0x1000}, '__GFP_MEMALLOC': {'value': 0x2000}, '__GFP_COMP': {'value': 0x4000}, '__GFP_ZERO': {'value': 0x8000}, '__GFP_NOMEMALLOC': {'value': 0x10000}, '__GFP_HARDWALL': {'value': 0x20000}, '__GFP_THISNODE': {'value': 0x40000}, '__GFP_ATOMIC': {'value': 0x80000}, '__GFP_ACCOUNT': {'value': 0x100000}, '__GFP_DIRECT_RECLAIM': {'value': 0x400000}, '__GFP_WRITE': {'value': 0x800000}, '__GFP_KSWAPD_RECLAIM': {'value': 0x1000000}, '__GFP_NOLOCKDEP': {'value': 0x2000000}, '__GFP_RECLAIM': {'value': '__GFP_DIRECT_RECLAIM|__GFP_KSWAPD_RECLAIM'}, } """ Definition of GFP flags The decimal value of a flag will be calculated by evaluating the entries from left to right. Grouping by parentheses is not supported. Source: include/linux/gpf.h @note : This list os probably a mixture of different kernel versions - be carefully @todo: Implement kernel specific versions because this flags are not constant (see https://github.com/torvalds/linux/commit/e67d4ca79aaf9d13a00d229b1b1c96b86828e8ba#diff-020720d0699e3ae1afb6fcd815ca8500) """ ps_table_items = ['pid', 'uid', 'tgid', 'total_vm_pages', 'rss_pages', 'nr_ptes_pages', 'swapents_pages', 'oom_score_adj'] """Elements of the process table""" REC_PROCESS_LINE = re.compile( r'^\[(?P[ \d]+)\]\s+(?P\d+)\s+(?P\d+)\s+(?P\d+)\s+(?P\d+)\s+' r'(?P\d+)\s+(?P\d+)\s+(?P-?\d+)\s+(?P.+)\s*') """Match content of process table""" rec_version4kconfig = re.compile('.+') """RE to match kernel version to kernel configuration""" rec_oom_begin = re.compile(r'invoked oom-killer:', re.MULTILINE) """RE to match the first line of an OOM block""" rec_oom_end = re.compile(r'^Killed process \d+', re.MULTILINE) """RE to match the last line of an OOM block""" def __init__(self): super().__init__() if self.EXTRACT_PATTERN is None: # Create a copy to prevent modifications on the class dictionary # TODO replace with self.EXTRACT_PATTERN = self.EXTRACT_PATTERN.copy() after # https://github.com/QQuick/Transcrypt/issues/716 "dict does not have a copy method" is fixed self.EXTRACT_PATTERN = {} self.EXTRACT_PATTERN.update(self.EXTRACT_PATTERN_BASE) if self.EXTRACT_PATTERN_OVERLAY: self.EXTRACT_PATTERN.update(self.EXTRACT_PATTERN_OVERLAY) class KernelConfig_4_6(BaseKernelConfig): # Support changes: # * "mm, oom_reaper: report success/failure" (bc448e897b6d24aae32701763b8a1fe15d29fa26) name = 'Configuration for Linux kernel 4.6 or later' rec_version4kconfig = re.compile(r'^4\.([6-9]\.|[12][0-9]\.).+') # The "oom_reaper" line is optionally rec_oom_end = re.compile(r'^((Out of memory.*|Memory cgroup out of memory): Killed process \d+|oom_reaper:)', re.MULTILINE) def __init__(self): super().__init__() class KernelConfig_4_9(KernelConfig_4_6): # Support changes: # * "mm: oom: deduplicate victim selection code for memcg and global oom" (7c5f64f84483bd13886348edda8b3e7b799a7fdb) name = 'Configuration for Linux kernel 4.9 or later' rec_version4kconfig = re.compile(r'^4\.([9]\.|[12][0-9]\.).+') EXTRACT_PATTERN_OVERLAY_49 = { 'Details of process killed by OOM': ( r'^(Out of memory.*|Memory cgroup out of memory): Killed process \d+ \(.*\)' r'(, UID \d+,)?' r' total-vm:(?P\d+)kB, anon-rss:(?P\d+)kB, ' r'file-rss:(?P\d+)kB, shmem-rss:(?P\d+)kB.*', True, ), } def __init__(self): super().__init__() self.EXTRACT_PATTERN.update(self.EXTRACT_PATTERN_OVERLAY_49) class KernelConfig_5_0(KernelConfig_4_9): # Support changes: # * "mm, oom: reorganize the oom report in dump_header" (ef8444ea01d7442652f8e1b8a8b94278cb57eafd) name = 'Configuration for Linux kernel 5.0 or later' rec_version4kconfig = re.compile(r'^[5-9]\..+') EXTRACT_PATTERN_OVERLAY_50 = { # third last line - not integrated yet # oom-kill:constraint=CONSTRAINT_NONE,nodemask=(null),cpuset=/,mems_allowed=0,global_oom,task_memcg=/,task=sed,pid=29481,uid=12345 'Process killed by OOM': ( r'^Out of memory: Killed process (?P\d+) \((?P[\S ]+)\) ' r'total-vm:(?P\d+)kB, anon-rss:(?P\d+)kB, ' r'file-rss:(?P\d+)kB, shmem-rss:(?P\d+)kB, ' r'UID:\d+ pgtables:(?P\d+)kB oom_score_adj:(?P\d+)', True, ), } def __init__(self): super().__init__() self.EXTRACT_PATTERN.update(self.EXTRACT_PATTERN_OVERLAY_50) class KernelConfig_5_8(KernelConfig_5_0): # Support changes: # * "mm/writeback: discard NR_UNSTABLE_NFS, use NR_WRITEBACK instead" (8d92890bd6b8502d6aee4b37430ae6444ade7a8c) name = 'Configuration for Linux kernel 5.8 or later' rec_version4kconfig = re.compile(r'^(5\.[8-9]\.|5\.[1-9][0-9]\.|[6-9]\.).+') EXTRACT_PATTERN_OVERLAY_58 = { 'Mem-Info (part 1)': ( r'^Mem-Info:.*' r'(?:\n)' # first line (starting w/o a space) r'^active_anon:(?P\d+) inactive_anon:(?P\d+) ' r'isolated_anon:(?P\d+)' r'(?:\n)' # remaining lines (w/ leading space) r'^ active_file:(?P\d+) inactive_file:(?P\d+) ' r'isolated_file:(?P\d+)' r'(?:\n)' r'^ unevictable:(?P\d+) dirty:(?P\d+) writeback:(?P\d+)', True, ), } def __init__(self): super().__init__() self.EXTRACT_PATTERN.update(self.EXTRACT_PATTERN_OVERLAY_58) class KernelConfigRhel7(BaseKernelConfig): """RHEL7 / CentOS7 specific configuration""" name = 'Configuration for RHEL7 / CentOS7 specific Linux kernel (3.10)' rec_version4kconfig = re.compile(r'^3\..+') def __init__(self): super().__init__() AllKernelConfigs = [ KernelConfig_5_8(), KernelConfig_5_0(), KernelConfig_4_9(), KernelConfig_4_6(), KernelConfigRhel7(), BaseKernelConfig(), ] """ Instances of all available kernel configurations. The last entry in this list is the base configuration as a fallback. @type: List(BaseKernelConfig) """ class OOMEntity: """Hold whole OOM message block and provide access""" current_line = 0 """Zero based index of the current line in self.lines""" lines = [] """OOM text as list of lines""" state = OOMEntityState.unknown """State of the OOM after initial parsing""" text = "" """OOM as text""" def __init__(self, text): # use Unix LF only text = text.replace('\r\n', '\r') text = text.strip() oom_lines = text.split('\n') self.current_line = 0 self.lines = oom_lines self.text = text # don't do anything if the text is empty or does not contains the leading OOM message if not text: self.state = OOMEntityState.empty return elif 'invoked oom-killer:' not in text: self.state = OOMEntityState.invalid return oom_lines = self._remove_non_oom_lines(oom_lines) oom_lines = self._remove_kernel_colon(oom_lines) cols_to_strip = self._number_of_columns_to_strip(oom_lines[self._get_CPU_index(oom_lines)]) oom_lines = self._strip_needless_columns(oom_lines, cols_to_strip) oom_lines = self._rsyslog_unescape_lf(oom_lines) self.lines = oom_lines self.text = '\n'.join(oom_lines) if 'Killed process' in text: self.state = OOMEntityState.complete else: self.state = OOMEntityState.started def _get_CPU_index(self, lines): """ Return the index of the first line with "CPU: " Depending on the OOM version the "CPU: " pattern is in second or third oom line. """ for i in range(len(lines)): if 'CPU: ' in lines[i]: return i return 0 def _number_of_columns_to_strip(self, line): """ Determinate number of columns left to the OOM message to strip. Sometime timestamps, hostnames and or syslog tags are left to the OOM message. This columns will be count to strip later. """ to_strip = 0 columns = line.split(" ") # Examples: # [11686.888109] CPU: 4 PID: 29481 Comm: sed Not tainted 3.10.0-514.6.1.el7.x86_64 #1 # Apr 01 14:13:32 mysrv kernel: CPU: 4 PID: 29481 Comm: sed Not tainted 3.10.0-514.6.1.el7.x86_64 #1 # Apr 01 14:13:32 mysrv kernel: [11686.888109] CPU: 4 PID: 29481 Comm: sed Not tainted 3.10.0-514.6.1.el7.x86_64 #1 try: # strip all excl. "CPU:" if 'CPU:' in line: to_strip = columns.index("CPU:") except ValueError: pass return to_strip def _remove_non_oom_lines(self, oom_lines): """Remove all lines before and after OOM message block""" cleaned_lines = [] in_oom_lines = False killed_process = False for line in oom_lines: # first line of the oom message block if "invoked oom-killer:" in line: in_oom_lines = True if in_oom_lines: cleaned_lines.append(line) # OOM blocks ends with the second last only or both lines # Out of memory: Killed process ... # oom_reaper: reaped process ... if 'Killed process' in line: killed_process = True continue # next line after "Killed process \d+ ..." if killed_process: if 'oom_reaper' in line: break else: # remove this line del cleaned_lines[-1] break return cleaned_lines def _rsyslog_unescape_lf(self, oom_lines): """ Rsyslog replaces line breaks with their octal representation #012. This feature can be controlled inside the rsyslog configuration with the directives $EscapeControlCharactersOnReceive, $Escape8BitCharactersOnReceive and $ControlCharactersEscapePrefix. The replacement is only in second line (active_anon:....) of the Mem-Info block. """ lines = [] for line in oom_lines: if '#012' in line: lines.extend(line.split('#012')) else: lines.append(line) return lines def _remove_kernel_colon(self, oom_lines): """ Remove the "kernel:" pattern w/o leading and tailing spaces. Some OOM messages don't have a space between "kernel:" and the process name. _strip_needless_columns() will fail in such cases. Therefore the pattern is removed. """ oom_lines = [i.replace('kernel:', '') for i in oom_lines] return oom_lines def _strip_needless_columns(self, oom_lines, cols_to_strip=0): """ Remove needless columns at the start of every line. This function removes all leading items w/o any relation to the OOM message like, date and time, hostname, syslog priority/facility. """ stripped_lines = [] for line in oom_lines: # remove empty lines if not line.strip(): continue if cols_to_strip: # [-1] slicing needs Transcrypt operator overloading line = line.split(" ", cols_to_strip)[-1] # __:opov stripped_lines.append(line) return stripped_lines def back(self): """Return the previous line""" if self.current_line - 1 < 0: raise StopIteration() self.current_line -= 1 return self.lines[self.current_line] def current(self): """Return the current line""" return self.lines[self.current_line] def next(self): """Return the next line""" if self.current_line + 1 < len(self.lines): self.current_line += 1 return self.lines[self.current_line] raise StopIteration() def find_text(self, pattern): """ Search the pattern and set the position to the first found line. Otherwise the position pointer won't be changed. :param pattern: Text to find :type pattern: str :return: True if the marker has found. """ for line in self.lines: if pattern in line: self.current_line = self.lines.index(line) return True return False def __iter__(self): return self def __next__(self): return self.next() class OOMResult: """Results of an OOM analysis""" kconfig = BaseKernelConfig() """Kernel configuration""" details = {} """Extracted result""" oom_entity = None """ State of this OOM (unknown, incomplete, ...) :type: OOMEntityState """ oom_type = OOMEntityType.unknown """ Type of this OOM (manually or automatically triggered) :type: OOMEntityType """ error_msg = "" """ Error message @type: str """ kversion = None """ Kernel version @type: str """ oom_text = None """ OOM text @type: str """ swap_active = False """ Swap space active or inactive @type: bool """ class OOMAnalyser: """Analyse an OOM object and calculate additional values""" oom_entity = None """ State of this OOM (unknown, incomplete, ...) :type: OOMEntityState """ oom_result = OOMResult() """ Store details of OOM analysis :type: OOMResult """ def __init__(self, oom): self.oom_entity = oom self.oom_result = OOMResult() def _identify_kernel_version(self): """ Identify the used kernel version and @rtype: bool """ pattern = r'CPU: \d+ PID: \d+ Comm: .* (Not tainted|Tainted: [A-Z ]+) (?P\d[\w.-]+) #.+' rec = re.compile(pattern, re.MULTILINE) match = rec.search(self.oom_entity.text) if not match: self.oom_result.error_msg = 'Failed to extract kernel version from OOM text' return False self.oom_result.kversion = match.group('kernel_version') return True def _choose_kernel_config(self): """ Select proper kernel configuration @rtype: bool """ for kcfg in AllKernelConfigs: match = kcfg.rec_version4kconfig.match(self.oom_result.kversion) if match: self.oom_result.kconfig = kcfg break if not self.oom_result.kconfig: warning('Failed to find a proper configuration for kernel "{}"'.format(self.oom_result.kversion)) self.oom_result.kconfig = BaseKernelConfig() return True def _check_for_empty_oom(self): """ Check for an empty OOM text @rtype: bool """ if not self.oom_entity.text: self.state = OOMEntityState.empty self.oom_result.error_msg = 'Empty OOM text. Please insert an OOM message block.' return False return True def _check_for_complete_oom(self): """ Check if the OOM in self.oom_entity is complete and update self.oom_state accordingly @rtype: bool """ self.oom_state = OOMEntityState.unknown self.oom_result.error_msg = 'Unknown OOM format' if not self.oom_result.kconfig.rec_oom_begin.search(self.oom_entity.text): self.state = OOMEntityState.invalid self.oom_result.error_msg = 'The inserted text is not a valid OOM block! The initial pattern was not found!' return False if not self.oom_result.kconfig.rec_oom_end.search(self.oom_entity.text): self.state = OOMEntityState.started self.oom_result.error_msg = 'The inserted OOM is incomplete! The initial pattern was found but not the '\ 'final.' return False self.state = OOMEntityState.complete self.oom_result.error_msg = None return True def _extract_block_from_next_pos(self, marker): """ Extract a block that starts with the marker and contains all lines up to the next line with ":". :rtype: str """ block = '' if not self.oom_entity.find_text(marker): return block line = self.oom_entity.current() block += "{}\n".format(line) for line in self.oom_entity: if ':' in line: self.oom_entity.back() break block += "{}\n".format(line) return block def _extract_from_oom_text(self): """Extract details from OOM message text""" self.oom_result.details = {} # __pragma__ ('jsiter') for k in self.oom_result.kconfig.EXTRACT_PATTERN: pattern, is_mandatory = self.oom_result.kconfig.EXTRACT_PATTERN[k] rec = re.compile(pattern, re.MULTILINE) match = rec.search(self.oom_entity.text) if match: self.oom_result.details.update(match.groupdict()) elif is_mandatory: error('Failed to extract information from OOM text. The regular expression "{}" (pattern "{}") ' 'does not find anything. This can lead to errors later on.'.format(k, pattern)) # __pragma__ ('nojsiter') if self.oom_result.details['trigger_proc_order'] == "-1": self.oom_result.oom_type = OOMEntityType.manual else: self.oom_result.oom_type = OOMEntityType.automatic self.oom_result.details['hardware_info'] = self._extract_block_from_next_pos('Hardware name:') # strip "Call Trace" line at beginning and remove leading spaces call_trace = '' block = self._extract_block_from_next_pos('Call Trace:') for line in block.split('\n'): if line.startswith('Call Trace'): continue call_trace += "{}\n".format(line.strip()) self.oom_result.details['call_trace'] = call_trace # extract process table self.oom_result.details['_ps'] = {} self.oom_entity.find_text('[ pid ]') for line in self.oom_entity: if not line.startswith('['): break if line.startswith('[ pid ]'): continue match = self.oom_result.kconfig.REC_PROCESS_LINE.match(line) if match: details = match.groupdict() details['notes'] = '' pid = details.pop('pid') self.oom_result.details['_ps'][pid] = {} self.oom_result.details['_ps'][pid].update(details) def _hex2flags(self, hexvalue, flag_definition): """\ Convert the hexadecimal value into flags specified by definition @return: list of flags and the decimal sum of all unknown flags """ remaining = int(hexvalue, 16) converted_flags = [] # __pragma__ ('jsiter') for flag in flag_definition: value = self._flag2decimal(flag, flag_definition) if remaining & value: # delete flag by "and" with a reverted mask remaining &= ~value converted_flags.append(flag) # __pragma__ ('nojsiter') return converted_flags, remaining def _flag2decimal(self, flag, flag_definition): """\ Convert a single flag into a decimal value """ if flag not in flag_definition: error('No definition for flag {} found'.format(flag)) return 0 value = flag_definition[flag]['value'] if isinstance(value, int): return value tokenlist = iter(re.split('([|&])', value)) operator = None negate_rvalue = False lvalue = 0 while True: try: token = next(tokenlist) except StopIteration: break token = token.strip() if token in ['|', '&']: operator = token continue if token.startswith('~'): token = token[1:] negate_rvalue = True if token.isdigit(): rvalue = int(token) elif token.startswith('0x') and token[2:].isdigit(): rvalue = int(token, 16) else: # it's not a decimal nor a hexadecimal value - reiterate assuming it's a flag string rvalue = self._flag2decimal(token, flag_definition) if negate_rvalue: rvalue = ~rvalue if operator == '|': lvalue |= rvalue elif operator == '&': lvalue &= rvalue operator = None negate_rvalue = False return lvalue def _convert_numeric_results_to_integer(self): """Convert all *_pages and *_kb to integer""" # __pragma__ ('jsiter') for item in self.oom_result.details: if self.oom_result.details[item] is None: self.oom_result.details[item] = '' continue if item.endswith('_kb') or item.endswith('_pages') or item.endswith('_pid') or \ item in ['killed_proc_score', 'trigger_proc_order', 'trigger_proc_oomscore']: try: self.oom_result.details[item] = int(self.oom_result.details[item]) except: error('Converting item "{}={}" to integer failed'.format(item, self.oom_result.details[item])) # __pragma__ ('nojsiter') def _convert_numeric_process_values_to_integer(self): """Convert numeric values in process table to integer values""" ps = self.oom_result.details['_ps'] ps_index = [] # TODO Check if transcrypt issue: pragma jsiter for the whole block "for pid_str in ps: ..." # sets item in "for item in ['uid',..." to 0 instead of 'uid' # jsiter is necessary to iterate over ps for pid_str in ps.keys(): converted = {} process = ps[pid_str] for item in self.oom_result.kconfig.ps_table_items: if item == 'pid': continue try: converted[item] = int(process[item]) except: error('Converting process parameter "{}={}" to integer failed'.format(item, process[item])) converted['name'] = process['name'] converted['notes'] = process['notes'] pid_int = int(pid_str) del ps[pid_str] ps[pid_int] = converted ps_index.append(pid_int) ps_index.sort(key=int) self.oom_result.details['_ps_index'] = ps_index def _calc_pstable_values(self): """Set additional notes to processes listed in the process table""" tpid = self.oom_result.details['trigger_proc_pid'] kpid = self.oom_result.details['killed_proc_pid'] # sometimes the trigger process isn't part of the process table if tpid in self.oom_result.details['_ps']: self.oom_result.details['_ps'][tpid]['notes'] = 'trigger process' # assume the killed process may also not part of the process table if kpid in self.oom_result.details['_ps']: self.oom_result.details['_ps'][kpid]['notes'] = 'killed process' def _calc_trigger_process_values(self): """Calculate all values related with the trigger process""" self.oom_result.details['trigger_proc_requested_memory_pages'] = 2 ** self.oom_result.details['trigger_proc_order'] self.oom_result.details['trigger_proc_requested_memory_pages_kb'] = self.oom_result.details['trigger_proc_requested_memory_pages'] * \ self.oom_result.details['page_size_kb'] # process gfp_mask if self.oom_result.details['trigger_proc_gfp_flags'] != '': # None has been is converted to '' flags = self.oom_result.details['trigger_proc_gfp_flags'] del self.oom_result.details['trigger_proc_gfp_flags'] else: flags, unknown = self._hex2flags(self.oom_result.details['trigger_proc_gfp_mask'], self.oom_result.kconfig.GFP_FLAGS) if unknown: flags.append('0x{0:x}'.format(unknown)) flags = ' | '.join(flags) self.oom_result.details['trigger_proc_gfp_mask'] = '{} ({})'.format(self.oom_result.details['trigger_proc_gfp_mask'], flags) # already fully processed and no own element to display -> delete otherwise an error msg will be shown del self.oom_result.details['trigger_proc_gfp_flags'] def _calc_killed_process_values(self): """Calculate all values related with the killed process""" self.oom_result.details['killed_proc_total_rss_kb'] = self.oom_result.details['killed_proc_anon_rss_kb'] + \ self.oom_result.details['killed_proc_file_rss_kb'] + \ self.oom_result.details['killed_proc_shmem_rss_kb'] self.oom_result.details['killed_proc_rss_percent'] = int(100 * self.oom_result.details['killed_proc_total_rss_kb'] / int(self.oom_result.details['system_total_ram_kb'])) def _calc_swap_values(self): """Calculate all swap related values""" try: self.oom_result.swap_active = self.oom_result.details['swap_total_kb'] > 0 except KeyError: self.oom_result.swap_active = False if not self.oom_result.swap_active: return self.oom_result.details['swap_cache_kb'] = self.oom_result.details['swap_cache_pages'] * self.oom_result.details['page_size_kb'] del self.oom_result.details['swap_cache_pages'] # SwapUsed = SwapTotal - SwapFree - SwapCache self.oom_result.details['swap_used_kb'] = self.oom_result.details['swap_total_kb'] - self.oom_result.details['swap_free_kb'] - \ self.oom_result.details['swap_cache_kb'] self.oom_result.details['system_swap_used_percent'] = int(100 * self.oom_result.details['swap_total_kb'] / self.oom_result.details['swap_used_kb']) def _calc_system_values(self): """Calculate system memory""" # educated guess self.oom_result.details['page_size_kb'] = 4 # calculate remaining explanation values self.oom_result.details['system_total_ram_kb'] = self.oom_result.details['ram_pages'] * self.oom_result.details['page_size_kb'] if self.oom_result.swap_active: self.oom_result.details['system_total_ramswap_kb'] = self.oom_result.details['system_total_ram_kb'] + \ self.oom_result.details['swap_total_kb'] else: self.oom_result.details['system_total_ramswap_kb'] = self.oom_result.details['system_total_ram_kb'] total_rss_pages = 0 for pid in self.oom_result.details['_ps'].keys(): total_rss_pages += self.oom_result.details['_ps'][pid]['rss_pages'] self.oom_result.details['system_total_ram_used_kb'] = total_rss_pages * self.oom_result.details['page_size_kb'] self.oom_result.details['system_total_used_percent'] = int(100 * self.oom_result.details['system_total_ram_used_kb'] / self.oom_result.details['system_total_ram_kb']) def _determinate_platform_and_distribution(self): """Determinate platform and distribution""" kernel_version = self.oom_result.details.get('kernel_version', '') if 'x86_64' in kernel_version: self.oom_result.details['platform'] = 'x86 64bit' else: self.oom_result.details['platform'] = 'unknown' dist = 'unknown' if '.el7uek' in kernel_version: dist = 'Oracle Linux 7 (Unbreakable Enterprise Kernel)' elif '.el7' in kernel_version: dist = 'RHEL 7/CentOS 7' elif '.el6' in kernel_version: dist = 'RHEL 6/CentOS 6' elif '.el5' in kernel_version: dist = 'RHEL 5/CentOS 5' elif 'ARCH' in kernel_version: dist = 'Arch Linux' elif '-generic' in kernel_version: dist = 'Ubuntu' self.oom_result.details['dist'] = dist def _calc_from_oom_details(self): """ Calculate values from already extracted details @see: self.details """ self._convert_numeric_results_to_integer() self._convert_numeric_process_values_to_integer() self._calc_pstable_values() self._determinate_platform_and_distribution() self._calc_system_values() self._calc_trigger_process_values() self._calc_killed_process_values() self._calc_swap_values() def analyse(self): """ Extract and calculate values from the given OOM object If the return value is False, the OOM is too incomplete to perform an analysis. @rtype: bool """ if not self._check_for_empty_oom(): error(self.oom_result.error_msg) return False if not self._identify_kernel_version(): error(self.oom_result.error_msg) return False if not self._choose_kernel_config(): error(self.oom_result.error_msg) return False if not self._check_for_complete_oom(): error(self.oom_result.error_msg) return False self._extract_from_oom_text() self._calc_from_oom_details() self.oom_result.oom_text = self.oom_entity.text return True class OOMDisplay: """Display the OOM analysis""" # result ergibt an manchen stellen self.result.result :-/ oom_result = OOMResult() """ OOM analysis details @rtype: OOMResult """ example_rhel7 = u'''\ sed invoked oom-killer: gfp_mask=0x201da, order=0, oom_score_adj=0 sed cpuset=/ mems_allowed=0-1 CPU: 4 PID: 29481 Comm: sed Not tainted 3.10.0-514.6.1.el7.x86_64 #1 Hardware name: HP ProLiant DL385 G7, BIOS A18 12/08/2012 ffff880182272f10 00000000021dcb0a ffff880418207938 ffffffff816861ac ffff8804182079c8 ffffffff81681157 ffffffff810eab9c ffff8804182fe910 ffff8804182fe928 0000000000000202 ffff880182272f10 ffff8804182079b8 Call Trace: [] dump_stack+0x19/0x1b [] dump_header+0x8e/0x225 [] ? ktime_get_ts64+0x4c/0xf0 [] ? delayacct_end+0x8f/0xb0 [] oom_kill_process+0x24e/0x3c0 [] ? oom_unkillable_task+0xcd/0x120 [] ? find_lock_task_mm+0x56/0xc0 [] ? has_capability_noaudit+0x1e/0x30 [] out_of_memory+0x4b6/0x4f0 [] __alloc_pages_slowpath+0x5d7/0x725 [] __alloc_pages_nodemask+0x405/0x420 [] alloc_pages_current+0xaa/0x170 [] __page_cache_alloc+0x97/0xb0 [] filemap_fault+0x170/0x410 [] ext4_filemap_fault+0x36/0x50 [ext4] [] __do_fault+0x4c/0xc0 [] do_read_fault.isra.42+0x43/0x130 [] handle_mm_fault+0x6b1/0xfe0 [] ? do_mmap_pgoff+0x305/0x3c0 [] __do_page_fault+0x154/0x450 [] do_page_fault+0x35/0x90 [] page_fault+0x28/0x30 Mem-Info: active_anon:7355653 inactive_anon:660960 isolated_anon:0#012 active_file:1263 inactive_file:1167 isolated_file:32#012 unevictable:0 dirty:4 writeback:0 unstable:0#012 slab_reclaimable:27412 slab_unreclaimable:13708#012 mapped:4818 shmem:87896 pagetables:25222 bounce:0#012 free:39513 free_pcp:2958 free_cma:0 Node 0 DMA free:15872kB min:40kB low:48kB high:60kB active_anon:0kB inactive_anon:0kB active_file:0kB inactive_file:0kB unevictable:0kB isolated(anon):0kB isolated(file):0kB present:15992kB managed:15908kB mlocked:0kB dirty:0kB writeback:0kB mapped:0kB shmem:0kB slab_reclaimable:0kB slab_unreclaimable:0kB kernel_stack:0kB pagetables:0kB unstable:0kB bounce:0kB free_pcp:0kB local_pcp:0kB free_cma:0kB writeback_tmp:0kB pages_scanned:0 all_unreclaimable? yes lowmem_reserve[]: 0 2780 15835 15835 Node 0 DMA32 free:59728kB min:7832kB low:9788kB high:11748kB active_anon:2154380kB inactive_anon:604748kB active_file:500kB inactive_file:112kB unevictable:0kB isolated(anon):0kB isolated(file):0kB present:3094644kB managed:2848912kB mlocked:0kB dirty:0kB writeback:0kB mapped:4016kB shmem:5140kB slab_reclaimable:6448kB slab_unreclaimable:2796kB kernel_stack:1040kB pagetables:6876kB unstable:0kB bounce:0kB free_pcp:3788kB local_pcp:228kB free_cma:0kB writeback_tmp:0kB pages_scanned:28 all_unreclaimable? no lowmem_reserve[]: 0 0 13055 13055 Node 0 Normal free:36692kB min:36784kB low:45980kB high:55176kB active_anon:12301636kB inactive_anon:793132kB active_file:604kB inactive_file:176kB unevictable:0kB isolated(anon):0kB isolated(file):128kB present:13631488kB managed:13368348kB mlocked:0kB dirty:0kB writeback:0kB mapped:4108kB shmem:207940kB slab_reclaimable:47900kB slab_unreclaimable:28884kB kernel_stack:6624kB pagetables:43340kB unstable:0kB bounce:0kB free_pcp:4204kB local_pcp:640kB free_cma:0kB writeback_tmp:0kB pages_scanned:128 all_unreclaimable? no lowmem_reserve[]: 0 0 0 0 Node 1 Normal free:49436kB min:45444kB low:56804kB high:68164kB active_anon:14967844kB inactive_anon:1244560kB active_file:1552kB inactive_file:1992kB unevictable:0kB isolated(anon):0kB isolated(file):0kB present:16777212kB managed:16514220kB mlocked:0kB dirty:16kB writeback:0kB mapped:10760kB shmem:138504kB slab_reclaimable:55300kB slab_unreclaimable:23152kB kernel_stack:6176kB pagetables:50672kB unstable:0kB bounce:0kB free_pcp:3360kB local_pcp:248kB free_cma:0kB writeback_tmp:0kB pages_scanned:125777 all_unreclaimable? yes lowmem_reserve[]: 0 0 0 0 Node 0 DMA: 0*4kB 0*8kB 0*16kB 0*32kB 2*64kB (U) 1*128kB (U) 1*256kB (U) 0*512kB 1*1024kB (U) 1*2048kB (M) 3*4096kB (M) = 15872kB Node 0 DMA32: 203*4kB (UEM) 231*8kB (UEM) 259*16kB (UEM) 231*32kB (UEM) 157*64kB (UEM) 90*128kB (UEM) 49*256kB (UEM) 20*512kB (UE) 3*1024kB (UEM) 1*2048kB (M) 0*4096kB = 63668kB Node 0 Normal: 1231*4kB (UEM) 391*8kB (UEM) 456*16kB (UEM) 342*32kB (UEM) 141*64kB (UEM) 23*128kB (UEM) 0*256kB 0*512kB 0*1024kB 0*2048kB 0*4096kB = 38260kB Node 1 Normal: 2245*4kB (UEM) 732*8kB (UEM) 594*16kB (UEM) 396*32kB (UEM) 160*64kB (UEM) 16*128kB (UEM) 2*256kB (UM) 0*512kB 1*1024kB (M) 0*2048kB 0*4096kB = 50836kB Node 0 hugepages_total=0 hugepages_free=0 hugepages_surp=0 hugepages_size=1048576kB Node 0 hugepages_total=0 hugepages_free=0 hugepages_surp=0 hugepages_size=2048kB Node 1 hugepages_total=0 hugepages_free=0 hugepages_surp=0 hugepages_size=1048576kB Node 1 hugepages_total=0 hugepages_free=0 hugepages_surp=0 hugepages_size=2048kB 100155 total pagecache pages 11342 pages in swap cache Swap cache stats: add 31260615, delete 31249273, find 295999950/297583545 Free swap = 0kB Total swap = 8388604kB 8379834 pages RAM 0 pages HighMem/MovableOnly 192987 pages reserved [ pid ] uid tgid total_vm rss nr_ptes swapents oom_score_adj name [ 390] 0 390 39012 6739 78 51 0 systemd-journal [ 433] 0 433 11104 2 22 360 -1000 systemd-udevd [ 530] 0 530 13854 28 27 83 -1000 auditd [ 559] 0 559 7692 65 19 87 0 systemd-logind [ 563] 0 563 4817 41 14 36 0 irqbalance [ 569] 87 569 7684 52 20 48 -900 dbus-daemon [ 587] 32 587 16240 17 34 116 0 rpcbind [ 647] 0 647 50303 11 36 113 0 gssproxy [ 796] 0 796 193856 2897 207 112 0 rsyslogd [ 818] 0 818 13177 0 27 146 0 vsftpd [ 840] 0 840 62892 9 36 103 0 ypbind [ 868] 0 868 21663 28 43 191 -1000 sshd [ 871] 29 871 11126 2 25 222 0 rpc.statd [ 907] 0 907 8044 4 21 53 0 atd [ 916] 0 916 27509 2 10 30 0 agetty [ 934] 0 934 27509 2 10 31 0 agetty [ 1255] 0 1255 45716 1 39 337 0 rscd [ 1268] 0 1268 45746 28 38 353 0 rscd [ 1269] 0 1269 45716 29 38 311 0 rscd [ 1285] 0 1285 23290 25 45 235 0 master [ 1287] 89 1287 23379 52 47 242 0 qmgr [ 1830] 0 1830 446643 959 68 1234 0 ovcd [ 2062] 0 2062 144894 511 37 309 0 ovbbccb [ 2121] 0 2121 33138 26 19 138 0 crond [ 2136] 38 2136 7846 40 19 88 0 ntpd [ 2451] 0 2451 177827 0 36 816 0 ovconfd [ 8145] 0 8145 300303 1616 58 692 0 hpsensor [ 8204] 0 8204 31508 119 31 328 0 opcmsgi [ 8405] 0 8405 201479 1289 49 244 0 opcmsga [ 8472] 0 8472 134080 236 46 514 0 opcmona [ 8596] 0 8596 31377 172 29 301 0 opcle [ 8658] 0 8658 81199 124 34 336 0 opcacta [ 8685] 0 8685 137169 23313 97 3256 0 oacore [ 6330] 12345 6330 7520 15 18 61 0 rotatelogs [ 6331] 12345 6331 28318 0 12 83 0 run.sh [ 6576] 12345 6576 8478546 5157063 15483 1527848 0 mysqld [27171] 12345 27171 7522 10 18 58 0 rotatelogs [27172] 12345 27172 28320 3 11 94 0 run.sh [27502] 12345 27502 4029300 2716569 6505 226225 0 java [11729] 0 11729 64122 5003 79 2465 0 snmpd [12130] 0 12130 122202 565 29 175 0 hpasmlited [12166] 0 12166 11905 89 24 121 0 cmahealthd [12190] 0 12190 11871 89 24 119 0 cmastdeqd [12214] 0 12214 13707 84 31 211 0 cmahostd [12237] 0 12237 12493 38 28 352 0 cmathreshd [12276] 0 12276 12368 45 30 210 0 cmasm2d [12299] 0 12299 12485 43 26 282 0 cmaperfd [12324] 0 12324 31932 184 31 143 0 cmapeerd [12352] 0 12352 14280 48 32 169 0 cmaeventd [12379] 0 12379 14831 26 30 198 0 cmafcad [12407] 0 12407 11806 12 25 128 0 cmasasd [12436] 0 12436 14364 86 31 181 0 cmaidad [12463] 0 12463 11288 15 25 125 0 cmaided [12492] 0 12492 11805 14 26 127 0 cmascsid [12523] 0 12523 92228 129 63 433 0 cmanicd [14002] 0 14002 11803 12 25 128 0 cmasm2d [32615] 0 32615 36254 323 73 7 0 sshd [ 894] 12345 894 36254 328 70 5 0 sshd [ 895] 12345 895 3389 123 11 0 0 ksh [10620] 0 10620 36254 328 72 0 0 sshd [10634] 38714 10634 36290 329 70 8 0 sshd [10635] 38714 10635 14221 25 31 124 0 sftp-server [29021] 0 29021 36254 314 69 0 0 sshd [29025] 12345 29025 36254 316 67 0 0 sshd [29026] 12345 29026 29286 96 12 1 0 ksh [29051] 12345 29051 29494 330 12 74 0 svr05 [29979] 12345 29979 1666 42 9 0 0 less [29662] 89 29662 23316 258 43 0 0 pickup [26065] 89 26065 23317 256 45 0 0 trivial-rewrite [26066] 89 26066 23353 265 45 0 0 cleanup [26067] 89 26067 23368 271 45 0 0 smtp [26743] 0 26743 36254 314 68 0 0 sshd [26937] 12345 26937 36254 314 67 0 0 sshd [26938] 12345 26938 29286 96 11 0 0 ksh [27122] 12345 27122 29494 459 12 0 0 svr05 [28657] 0 28657 36254 314 74 0 0 sshd [28702] 12345 28702 36254 314 72 0 0 sshd [28703] 12345 28703 29286 97 11 0 0 ksh [28993] 0 28993 36254 314 72 0 0 sshd [28996] 12345 28996 29526 531 12 0 0 svr05 [29006] 12345 29006 36254 314 69 0 0 sshd [29007] 12345 29007 29286 96 11 0 0 ksh [29110] 12345 29110 29558 745 12 0 0 svr05 [29481] 12345 29481 29214 58 14 0 0 sed [29752] 12345 29752 7522 296 19 0 0 rotatelogs Out of memory: Kill process 6576 (mysqld) score 651 or sacrifice child Killed process 6576 (mysqld) total-vm:33914892kB, anon-rss:20629004kB, file-rss:0kB, shmem-rss:0kB ''' example_ubuntu2110 = u'''\ kworker/0:2 invoked oom-killer: gfp_mask=0xcc0(GFP_KERNEL), order=-1, oom_score_adj=0 CPU: 0 PID: 735 Comm: kworker/0:2 Not tainted 5.13.0-19-generic #19-Ubuntu Hardware name: QEMU Standard PC (i440FX + PIIX, 1996), BIOS ArchLinux 1.14.0-1 04/01/2014 Workqueue: events moom_callback Call Trace: show_stack+0x52/0x58 dump_stack+0x7d/0x9c dump_header+0x4f/0x1f9 oom_kill_process.cold+0xb/0x10 out_of_memory.part.0+0xce/0x270 out_of_memory+0x41/0x80 moom_callback+0x7a/0xb0 process_one_work+0x220/0x3c0 worker_thread+0x53/0x420 kthread+0x11f/0x140 ? process_one_work+0x3c0/0x3c0 ? set_kthread_struct+0x50/0x50 ret_from_fork+0x22/0x30 Mem-Info: active_anon:221 inactive_anon:14331 isolated_anon:0 active_file:18099 inactive_file:22324 isolated_file:0 unevictable:4785 dirty:633 writeback:0 slab_reclaimable:6027 slab_unreclaimable:6546 mapped:15338 shmem:231 pagetables:412 bounce:0 free:427891 free_pcp:153 free_cma:0 Node 0 active_anon:884kB inactive_anon:57324kB active_file:72396kB inactive_file:89296kB unevictable:19140kB isolated(anon):0kB isolated(file):0kB mapped:61352kB dirty:2532kB writeback:0kB shmem:924kB shmem_thp: 0kB shmem_pmdmapped: 0kB anon_thp: 0kB writeback_tmp:0kB kernel_stack:1856kB pagetables:1648kB all_unreclaimable? no Node 0 DMA free:15036kB min:352kB low:440kB high:528kB reserved_highatomic:0KB active_anon:0kB inactive_anon:0kB active_file:0kB inactive_file:0kB unevictable:0kB writepending:0kB present:15992kB managed:15360kB mlocked:0kB bounce:0kB free_pcp:0kB local_pcp:0kB free_cma:0kB lowmem_reserve[]: 0 1893 1893 1893 1893 Node 0 DMA32 free:1696528kB min:44700kB low:55872kB high:67044kB reserved_highatomic:0KB active_anon:884kB inactive_anon:57324kB active_file:72396kB inactive_file:89296kB unevictable:19140kB writepending:2532kB present:2080640kB managed:2010036kB mlocked:19140kB bounce:0kB free_pcp:612kB local_pcp:612kB free_cma:0kB lowmem_reserve[]: 0 0 0 0 0 Node 0 DMA: 1*4kB (U) 1*8kB (U) 1*16kB (U) 1*32kB (U) 0*64kB 1*128kB (U) 0*256kB 1*512kB (U) 0*1024kB 1*2048kB (M) 3*4096kB (M) = 15036kB Node 0 DMA32: 0*4kB 4*8kB (UM) 25*16kB (UME) 151*32kB (UM) 56*64kB (UM) 21*128kB (ME) 36*256kB (UME) 47*512kB (UM) 41*1024kB (UM) 32*2048kB (UM) 377*4096kB (UM) = 1696528kB Node 0 hugepages_total=0 hugepages_free=0 hugepages_surp=0 hugepages_size=2048kB 42845 total pagecache pages 0 pages in swap cache Swap cache stats: add 0, delete 0, find 0/0 Free swap = 0kB Total swap = 0kB 524158 pages RAM 0 pages HighMem/MovableOnly 17809 pages reserved 0 pages hwpoisoned Tasks state (memory values in pages): [ pid ] uid tgid total_vm rss pgtables_bytes swapents oom_score_adj name [ 323] 0 323 9458 2766 77824 0 -250 systemd-journal [ 356] 0 356 5886 1346 69632 0 -1000 systemd-udevd [ 507] 0 507 70208 4646 98304 0 -1000 multipathd [ 542] 101 542 21915 1391 69632 0 0 systemd-timesyn [ 587] 102 587 4635 1882 73728 0 0 systemd-network [ 589] 103 589 5875 2951 86016 0 0 systemd-resolve [ 602] 0 602 1720 322 53248 0 0 cron [ 603] 104 603 2159 1168 53248 0 -900 dbus-daemon [ 608] 0 608 7543 4677 94208 0 0 networkd-dispat [ 609] 107 609 55313 1248 73728 0 0 rsyslogd [ 611] 0 611 311571 8248 221184 0 -900 snapd [ 613] 0 613 3404 1668 65536 0 0 systemd-logind [ 615] 0 615 98223 3142 126976 0 0 udisksd [ 620] 0 620 1443 278 45056 0 0 agetty [ 623] 0 623 1947 1147 57344 0 0 login [ 650] 0 650 3283 1683 65536 0 -1000 sshd [ 651] 0 651 27005 5232 106496 0 0 unattended-upgr [ 661] 0 661 58546 1812 90112 0 0 polkitd [ 856] 1000 856 3789 2157 73728 0 0 systemd [ 857] 1000 857 25433 835 86016 0 0 (sd-pam) [ 862] 1000 862 2208 1373 53248 0 0 bash [ 876] 1000 876 2870 1356 57344 0 0 sudo [ 877] 0 877 1899 1052 53248 0 0 bash oom-kill:constraint=CONSTRAINT_NONE,nodemask=(null),cpuset=/,mems_allowed=0,global_oom,task_memcg=/system.slice/unattended-upgrades.service,task=unattended-upgr,pid=651,uid=0 Out of memory: Killed process 651 (unattended-upgr) total-vm:108020kB, anon-rss:8380kB, file-rss:12548kB, shmem-rss:0kB, UID:0 pgtables:104kB oom_score_adj:0 ''' sorted_column = None """Processes will sort by values in this column""" sort_order = None """Sort order for process values""" svg_namespace = 'http://www.w3.org/2000/svg' # generated with Colorgorical http://vrl.cs.brown.edu/color svg_colors_mem = [ '#aee39a', '#344b46', '#1ceaf9', '#5d99aa', '#32e195', '#b02949', '#deae9e', '#805257', '#add51f', '#544793', '#a794d3', '#e057e1', '#769b5a', '#76f014', '#621da6', '#ffce54', '#d64405', '#bb8801', '#096013', '#ff0087' ] """20 different colors for memory usage diagram""" # generated with ColorBrewer (v2.0) https://colorbrewer2.org/?type=diverging&scheme=PuOr&n=3 svg_colors_swap = [ '#f1a340', '#f7f7f7', '#998ec3' ] """3 different colors for swap usage diagram""" svg_array_updown = """ """ """SVG graphics with two black triangles UP and DOWN for sorting""" svg_array_up = """ """ """SVG graphics with one black triangle UP for sorting""" svg_array_down = """ """ """SVG graphics with one black triangle DOWN for sorting""" def __init__(self): self.oom = None self.set_HTML_defaults() self.update_toc() element = document.getElementById('version') element.textContent = "v{}".format(VERSION) def _set_item(self, item): """ Paste the content into HTML elements with the ID / Class that matches the item name. The content won't be formatted. Only suffixes for pages and kbytes are added in the singular or plural. """ elements = document.getElementsByClassName(item) for element in elements: content = self.oom_result.details.get(item, '') if isinstance(content, str): content = content.strip() if content == '': row = element.parentNode row.classList.add('js-text--display-none') if item.endswith('_pages') and isinstance(content, int): if content == 1: content = "{} page".format(content) else: content = "{} pages".format(content) if item.endswith('_kb') and isinstance(content, int): if content == 1: content = "{} kByte".format(content) else: content = "{} kBytes".format(content) if item.endswith('_percent') and isinstance(content, int): content = "{}%".format(content) element.textContent = content if DEBUG: show_element('notify_box') def update_toc(self): """ Update the TOC to show current headlines only There are two conditions to show a h2 headline in TOC: * the headline is visible * the id attribute is set """ new_toc = '' toc_content = document.querySelectorAll('nav > ul')[0] for element in document.querySelectorAll('h2'): if not (is_visible(element) and element.id): continue new_toc += '
  • {}
  • '.format(element.id, element.textContent) toc_content.innerHTML = new_toc def update_process_table(self): """ Re-create the process table with additional information """ new_table = '' table_content = document.getElementById('process_table') for pid in self.oom_result.details['_ps_index']: if pid == self.oom_result.details['trigger_proc_pid']: css_class = 'class="js-pstable__triggerproc--bgcolor"' elif pid == self.oom_result.details['killed_proc_pid']: css_class = 'class="js-pstable__killedproc--bgcolor"' else: css_class = '' process = self.oom_result.details['_ps'][pid] line = """ {} {} {} {} {} {} {} {} {} {} """.format(css_class, pid, process['uid'], process['tgid'], process['total_vm_pages'], process['rss_pages'], process['nr_ptes_pages'], process['swapents_pages'], process['oom_score_adj'], process['name'], process['notes']) new_table += line table_content.innerHTML = new_table self.set_sort_triangle() def set_sort_triangle(self): """Set the sorting symbols for all columns in the process table""" # TODO Check operator overloading # Operator overloading (Pragma opov) does not work in this context. # self.oom_result.kconfig.ps_table_items + ['notes'] will compile to a string # "pid,uid,tgid,total_vm_pages,rss_pages,nr_ptes_pages,swapents_pages,oom_score_adjNotes" and not to an # array ps_table_and_notes = self.oom_result.kconfig.ps_table_items[:] ps_table_and_notes.append('notes') for column_name in ps_table_and_notes: element_id = "pstable_sort_{}".format(column_name) element = document.getElementById(element_id) if not element: internal_error('Missing id "{}" in process table.'.format(element_id)) continue if column_name == self.sorted_column: if self.sort_order == 'descending': element.innerHTML = self.svg_array_down else: element.innerHTML = self.svg_array_up else: element.innerHTML = self.svg_array_updown def set_HTML_defaults(self): """Reset the HTML document but don't clean elements""" # hide all elements marked to be hidden by default hide_elements('.js-text--default-hide') # show all elements marked to be shown by default show_elements('.js-text--default-show') # show hidden rows show_elements('table .js-text--display-none') # clear notification box element = document.getElementById('notify_box') while element.firstChild: element.removeChild(element.firstChild) # clear process table element = document.getElementById('process_table') while element.firstChild: element.removeChild(element.firstChild) # reset sort triangles self.sorted_column = None self.sort_order = None self.set_sort_triangle() # remove svg charts for element_id in ('svg_swap', 'svg_ram'): element = document.getElementById(element_id) while element.firstChild: element.removeChild(element.firstChild) def svg_create_element(self, height, width, css_class): """Return an empty SVG element""" svg = document.createElementNS(self.svg_namespace, 'svg') svg.setAttribute('version', '1.1') svg.setAttribute('height', height) svg.setAttribute('width', width) svg.setAttribute('viewBox', '0 0 {} {}'.format(width, height)) svg.setAttribute('class', css_class) return svg def svg_create_rect(self, x=0, y=0, width=0, height=0, color=None, title=None): g = document.createElementNS(self.svg_namespace, 'g') rect = document.createElementNS(self.svg_namespace, 'rect') if x: rect.setAttribute('x', x) if y: rect.setAttribute('y', y) if width: rect.setAttribute('width', width) if height: rect.setAttribute('height', height) if color: rect.setAttribute('fill', color) if title: t = document.createElementNS(self.svg_namespace, 'title') t.textContent = title g.appendChild(t) g.appendChild(rect) return g def svg_generate_bar_chart(self, color_list, *elements): """Generate a SVG bar chart""" bar_height = 100 label_height = 80 length_factor = 4 overall_height = bar_height + label_height overall_width = 100 * length_factor css_class = 'js-mem-usage__svg' svg = self.svg_create_element(overall_height, overall_width, css_class) sum_all_elements = sum([length for unused, length in elements]) current_pos = 0 bar_group = document.createElementNS(self.svg_namespace, 'g') bar_group.setAttribute('id', 'bar_group') bar_group.setAttribute('stroke', 'black') bar_group.setAttribute('stroke-width', 2) nr_processed_elements = 0 for title, length in elements: # length is None/undefined is the regular expression doesn't find any values if not length: continue rect_len = int(100 * length / sum_all_elements) * length_factor if not rect_len: continue color = color_list[nr_processed_elements % len(color_list)] rect = self.svg_create_rect(current_pos, 0, rect_len, bar_height, color, title) bar_group.appendChild(rect) label_group = document.createElementNS(self.svg_namespace, 'g') label_group.setAttribute('id', title) color_rect = self.svg_create_rect(0, 0, 20, 20, color) color_rect.setAttribute('stroke', 'black') color_rect.setAttribute('stroke-width', 2) text = document.createElementNS(self.svg_namespace, 'text') text.setAttribute('x', '30') text.setAttribute('y', '18') text.textContent = title label_group.appendChild(color_rect) label_group.appendChild(text) # TODO replace hardcoded values x = 5 + 125 * (nr_processed_elements // 2) y = bar_height + 10 + (nr_processed_elements % 2) * 40 label_group.setAttribute('transform', 'translate({}, {})'.format(x, y)) bar_group.appendChild(label_group) current_pos += rect_len nr_processed_elements += 1 svg.appendChild(bar_group) return svg def copy_example_rhel7_to_form(self): document.getElementById('textarea_oom').value = self.example_rhel7 def copy_example_ubuntu_to_form(self): document.getElementById('textarea_oom').value = self.example_ubuntu2110 def reset_form(self): document.getElementById('textarea_oom').value = "" self.set_HTML_defaults() self.update_toc() def toggle_oom(self, show=False): """Toggle the visibility of the full OOM message""" oom_element = document.getElementById('oom') row_with_oom = oom_element.parentNode.parentNode toggle_msg = document.getElementById('oom_toogle_msg') if show or row_with_oom.classList.contains('js-text--display-none'): row_with_oom.classList.remove('js-text--display-none') toggle_msg.text = "(click to hide)" else: row_with_oom.classList.add('js-text--display-none') toggle_msg.text = "(click to show)" def analyse_and_show(self): """Analyse the OOM text inserted into the form and show the results""" self.oom = OOMEntity(self.load_from_form()) # set defaults and clear notifications self.set_HTML_defaults() analyser = OOMAnalyser(self.oom) success = analyser.analyse() if success: self.oom_result = analyser.oom_result self.show_oom_details() self.update_toc() else: # don't show results - just return return def load_from_form(self): """ Return the OOM text from textarea element @rtype: str """ element = document.getElementById('textarea_oom') oom_text = element.value return oom_text def show_oom_details(self): """ Show all extracted details as well as additionally generated information """ hide_element('input') show_element('analysis') if self.oom_result.oom_type == OOMEntityType.manual: hide_elements('.js-oom-automatic--show') show_elements('.js-oom-manual--show') else: show_elements('.js-oom-automatic--show') hide_elements('.js-oom-manual--show') for item in self.oom_result.details.keys(): # ignore internal items if item.startswith('_'): continue self._set_item(item) # Hide "OOM Score" if not available # since KernelConfig_5_0.EXTRACT_PATTERN_OVERLAY_50['Process killed by OOM'] if 'killed_proc_score' in self.oom_result.details: show_elements('.js-killed-proc-score--show') else: hide_elements('.js-killed-proc-score--show') # generate process table self.update_process_table() # show/hide swap space if self.oom_result.swap_active: # generate swap usage diagram svg_swap = self.svg_generate_bar_chart( self.svg_colors_swap, ('Swap Used', self.oom_result.details['swap_used_kb']), ('Swap Free', self.oom_result.details['swap_free_kb']), ('Swap Cached', self.oom_result.details['swap_cache_kb']), ) elem_svg_swap = document.getElementById('svg_swap') elem_svg_swap.appendChild(svg_swap) show_elements('.js-swap-active--show') hide_elements('.js-swap-inactive--show') else: hide_elements('.js-swap-active--show') show_elements('.js-swap-inactive--show') # generate RAM usage diagram ram_title_attr = ( ('Active mem', 'active_anon_pages'), ('Inactive mem', 'inactive_anon_pages'), ('Isolated mem', 'isolated_anon_pages'), ('Active PC', 'active_file_pages'), ('Inactive PC', 'inactive_file_pages'), ('Isolated PC', 'isolated_file_pages'), ('Unevictable', 'unevictable_pages'), ('Dirty', 'dirty_pages'), ('Writeback', 'writeback_pages'), ('Unstable', 'unstable_pages'), ('Slab reclaimable', 'slab_reclaimable_pages'), ('Slab unreclaimable', 'slab_unreclaimable_pages'), ('Mapped', 'mapped_pages'), ('Shared', 'shmem_pages'), ('Pagetable', 'pagetables_pages'), ('Bounce', 'bounce_pages'), ('Free', 'free_pages'), ('Free PCP', 'free_pcp_pages'), ('Free CMA', 'free_cma_pages'), ) chart_elements = [(title, self.oom_result.details[value]) for title, value in ram_title_attr if value in self.oom_result.details] svg_ram = self.svg_generate_bar_chart(self.svg_colors_mem, *chart_elements) elem_svg_ram = document.getElementById('svg_ram') elem_svg_ram.appendChild(svg_ram) element = document.getElementById('oom') element.textContent = self.oom_result.oom_text self.toggle_oom(show=False) def sort_pstable(self, column_name): """Sort process table by the values in the given column""" # TODO Check operator overloading # Operator overloading (Pragma opov) does not work in this context. # self.oom_result.kconfig.ps_table_items + ['notes'] will compile to a string # "pid,uid,tgid,total_vm_pages,rss_pages,nr_ptes_pages,swapents_pages,oom_score_adjNotes" and not to an # array ps_table_and_notes = self.oom_result.kconfig.ps_table_items[:] ps_table_and_notes.append('notes') if column_name not in ps_table_and_notes: internal_error('Can not sort process table with an unknown column name "{}"'.format(column_name)) return # reset sort order if the column has changes if column_name != self.sorted_column: self.sort_order = None self.sorted_column = column_name if not self.sort_order or self.sort_order == 'descending': self.sort_order = 'ascending' self.sort_psindex_by_column(column_name) else: self.sort_order = 'descending' self.sort_psindex_by_column(column_name, True) self.sorted_column = column_name self.update_process_table() def sort_psindex_by_column(self, column_name, reverse=False): """ Sort the pid list '_ps_index' based on the values in the process dict '_ps'. Is uses bubble sort with all disadvantages but just a few lines of code """ ps = self.oom_result.details['_ps'] ps_index = self.oom_result.details['_ps_index'] def getvalue(column, pos): if column == 'pid': value = ps_index[pos] else: value = ps[ps_index[pos]][column] # JS sorts alphanumeric by default, convert values explicit to integers to sort numerically if column not in ['name', 'notes'] and value is not js_undefined: value = int(value) return value # We set swapped to True so the loop looks runs at least once swapped = True while swapped: swapped = False for i in range(len(ps_index) - 1): v1 = getvalue(column_name, i) v2 = getvalue(column_name, i+1) if (not reverse and v1 > v2) or (reverse and v1 < v2): # Swap the elements ps_index[i], ps_index[i+1] = ps_index[i+1], ps_index[i] # Set the flag to True so we'll loop again swapped = True OOMDisplayInstance = OOMDisplay()