From 18e8a3eb56cfeeaf80d02aa6314a2696ba1a9959 Mon Sep 17 00:00:00 2001 From: Carsten Grohmann Date: Sat, 25 Nov 2017 12:52:55 +0100 Subject: [PATCH] Initial commit --- .gitignore | 10 + LICENSE.txt | 19 ++ Makefile | 65 +++++ OOMAnalyser.html | 489 ++++++++++++++++++++++++++++++++ OOMAnalyser.py | 704 +++++++++++++++++++++++++++++++++++++++++++++++ README.md | 90 ++++++ requirements.txt | 1 + 7 files changed, 1378 insertions(+) create mode 100644 .gitignore create mode 100644 LICENSE.txt create mode 100644 Makefile create mode 100644 OOMAnalyser.html create mode 100644 OOMAnalyser.py create mode 100644 README.md create mode 100644 requirements.txt diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..476ffda --- /dev/null +++ b/.gitignore @@ -0,0 +1,10 @@ +# Files to be ignored by Git + +# Byte-compiled / optimized / DLL files +*.py[cod] + +# Environments +env/ + +# IntelliJ project files +.idea \ No newline at end of file diff --git a/LICENSE.txt b/LICENSE.txt new file mode 100644 index 0000000..612136d --- /dev/null +++ b/LICENSE.txt @@ -0,0 +1,19 @@ +Copyright (c) 2017 Carsten Grohmann mail carsten-grohmann.de + +Permission is hereby granted, free of charge, to any person obtaining a copy of +this software and associated documentation files (the "Software"), to deal in +the Software without restriction, including without limitation the rights to +use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies +of the Software, and to permit persons to whom the Software is furnished to do +so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. 
IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
\ No newline at end of file
diff --git a/Makefile b/Makefile
new file mode 100644
index 0000000..e81c29e
--- /dev/null
+++ b/Makefile
@@ -0,0 +1,65 @@
+# Makefile for OOMAnalyser
+#
+# Copyright (c) 2017 Carsten Grohmann
+# License: MIT (see LICENSE.txt)
+# THIS PROGRAM COMES WITH NO WARRANTY
+
+.PHONY: help clean distclean venv venv-freeze venv-clean build
+
+# Makefile defaults
+SHELL             = /bin/sh
+
+BASE_DIR          = .
+PYTHON_BIN        = python3
+VIRTUAL_ENV       = env
+# Export the absolute venv path and put its bin/ first in PATH for all recipes
+export VIRTUAL_ENV := $(abspath ${VIRTUAL_ENV})
+export PATH := ${VIRTUAL_ENV}/bin:${PATH}
+# "help" lists each plain-named target directly preceded by a "#+" comment line
+HELP= @grep -B1 '^[a-zA-Z\-]*:' Makefile |\
+	awk 'function p(h,t){printf"%-12s=%s\n",h,t;};\
+	/\#+/{t=$$0;};\
+	/:/{gsub(":.*","");h=$$0};\
+	/^--/{p(h,t);t=h="";};\
+	END{p(h,t)}' |\
+	sed -n 's/=.*\#+/:/gp'
+
+#+ Show this text
+help:
+	$(HELP)
+
+#+ Clean python compiler files and automatically generated files
+clean:
+	@echo "Remove all automatically generated files ..."
+	@find $(BASE_DIR) -depth -type f -name "*.pyc" -exec rm -f {} \;
+	@find $(BASE_DIR) -depth -type f -name "*.pyo" -exec rm -f {} \;
+	@find $(BASE_DIR) -depth -type f -name "*.orig" -exec rm -f {} \;
+	@find $(BASE_DIR) -depth -type f -name "*~" -exec rm -f {} \;
+	@$(RM) --force --recursive __javascript__
+
+#+ Remove all automatically generated and Git repository data
+distclean: clean venv-clean
+	@echo "Remove Git repository data (.git*) ..."
+	@$(RM) --force --recursive .git .gitignore
+# Every recipe line runs in its own shell: "activate" must be chained with &&
+$(VIRTUAL_ENV)/bin/activate: requirements.txt
+	test -d $(VIRTUAL_ENV) || virtualenv --python=$(PYTHON_BIN) $(VIRTUAL_ENV)
+	. $(VIRTUAL_ENV)/bin/activate && \
+	$(VIRTUAL_ENV)/bin/pip install -Ur requirements.txt
+	touch $(VIRTUAL_ENV)/bin/activate
+
+#+ Setup the virtual environment from scratch
+venv: $(VIRTUAL_ENV)/bin/activate
+
+#+ Freeze the current virtual environment by update requirements.txt
+venv-freeze:
+	. $(VIRTUAL_ENV)/bin/activate && $(VIRTUAL_ENV)/bin/pip freeze > requirements.txt
+
+#+ Remove the virtual environment
+venv-clean:
+	rm -rf $(VIRTUAL_ENV)
+
+#+ Compile Python to JavaScript
+build: venv
+	. $(VIRTUAL_ENV)/bin/activate && \
+	transcrypt --build --map --nomin -e 6 OOMAnalyser.py
diff --git a/OOMAnalyser.html b/OOMAnalyser.html
new file mode 100644
index 0000000..353406a
--- /dev/null
+++ b/OOMAnalyser.html
@@ -0,0 +1,489 @@
+
+
+
+
+
+ OOM Analyser
+
+
+
+
+
+
+
+

Analyse and visualise Linux OOM output

+ +

+ This web page splits the content of a Linux Out Of Memory message into + smaller pieces, aggregates these and presents them in a more human friendly + format. +

+ +

+ +
+ + + +

+ +
+

Analysis results

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Trigger process
(PID )This process requests memory and thereby triggers the OOM situation
Killed process
(PID )Process killed by Linux kernel to satisfy the memory request
OOM Score
(score)
Virtual Memory
(total-vm)
Virtual memory used by this process
Resident anonymous memory
(anon-rss)
Part of the virtual process memory mapped into RAM
Resident file mapping memory
(file-rss)
Files which have been mapped into RAM (with + mmap(2)) +
Resident shared memory
(shmem-rss)
This may include System V shared memory and shared anonymous memory
Memory Usage
RAM Summary
Swap Summary
RAM usage
Active anonymous memoryRecently used anonymous memory.
+ These memory pages will usually not be swapped out. +
Inactive anonymous memoryLeast recently used anonymous memory.
+ These memory pages can be swapped out. +
Isolated anonymous memoryMemory isolation is used to separate memory between different virtual machines.
Active PagecachePagecache that has been used more recently and usually not reclaimed unless absolutely necessary.
Inactive PagecachePagecache which has been less recently used. It can be reclaimed without huge performance impact.
Isolated PagecacheMemory isolation is used to separate memory between different virtual machines.
Unevictable pagesUnevictable memory. It can't be swapped out because the pages are owned by ramfs or protected by + mlock(3) / + shmctl(SHM_LOCK). + Unevictable pages are managed by the kernel's LRU framework. +
DirtyMemory which is waiting to get written back to the + disk. + [1] +
Writeback + Memory which is actively being written back to the disk. + [1] +
UnstableNot yet committed to stable storage.
Slab Reclaimable + Slab is an in-kernel cache for data structures. This is the part of Slab that might be reclaimed, such as caches. + [1] +
+ Additional details are listed in + slabinfo(5) also. +
Slab Unreclaimable + Part of Slab that cannot be reclaimed under memory pressure. + [1] +
Mapped + Files which have been mapped into memory (with + mmap(2)), such as libraries. + [1] +
shmem + Amount of memory consumed in + tmpfs(5) + filesystems. + [1] +
Pagetables + Amount of memory dedicated to the lowest level of pagetables. + [1] +
Bounce + Memory used for block device "bounce buffers". + [1] +
free
free_pcp
free_cma
Total Pagecache
Swap usage
Swap TotalTotal amount of swap space available. + [1] +
Swap FreeAmount of swap space that is currently unused. + [1] +
Swap CachedMemory that once was swapped out, is swapped back in + but still also is in the swap file. (If memory + pressure is high, these pages don't need to be swapped out + again because they are already in the swap file. This + saves I/O). + [1] +
Swap UsedAmount of used swap space w/o cached swap
+ (SwapUsed = SwapTotal - SwapFree - SwapCache) +
Operating System
Kernel
DistributionGuessed from the kernel version
PlatformGuessed from the kernel version
Page sizeGuessed
Memory Chunks
+

+            
Process Table
+

+            
Hardware Details
+

+            
Kernel Call Trace
+

+            
+ +
+ +
+

Error messages

+
+
+ + +

Footnotes

+
    +
  1. + proc(5) - process information pseudo-filesystem (Go Back) +
  2. +
+ +
+ + + +
+

+ Copyright (c) 2017 Carsten Grohmann mail <add at here> carsten-grohmann.de +

+

+ Permission is hereby granted, free of charge, to any person obtaining a copy of + this software and associated documentation files (the "Software"), to deal in + the Software without restriction, including without limitation the rights to + use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies + of the Software, and to permit persons to whom the Software is furnished to do + so, subject to the following conditions: +

+

+ The above copyright notice and this permission notice shall be included in all + copies or substantial portions of the Software. +

+

+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR + IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, + FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE + AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER + LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, + OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE + SOFTWARE. +

+
+ + + \ No newline at end of file diff --git a/OOMAnalyser.py b/OOMAnalyser.py new file mode 100644 index 0000000..1bfde42 --- /dev/null +++ b/OOMAnalyser.py @@ -0,0 +1,704 @@ +# -*- coding: Latin-1 -*- +# +# Linux OOM Analyser +# +# Copyright (c) 2017 Carsten Grohmann +# License: MIT - THIS PROGRAM COMES WITH NO WARRANTY + +import re + +DEBUG=False +"""Show additional information during the development cycle""" + + +def hide_element(element_id): + """Hide the given HTML element""" + document.getElementById(element_id).style.display = 'none' + + +def show_element(element_id): + """Show the given HTML element""" + document.getElementById(element_id).style.display = 'block' + + +def toggle(element_id): + """Toggle the visibility of the given HTML element""" + element = document.getElementById(element_id) + display_prop = element.style.display + if display_prop and display_prop == 'block': + element.style.display = 'none' + else: + element.style.display = 'block' + + +def error(msg): + """Unhide the error box and add the error message""" + show_element("error_box") + print("ERROR: ", msg) + + +class OOM(object): + REC_TIMESTAMP = re.compile( + r'(' + r'\[\s+\d+\.\d+\]' + r'|' + r'\[[A-Z]+[\w ]+ +\d{1,2} \d{2}:\d{2}:\d{2} \d{4}\]' + r') ', re.ASCII) + + i = 0 + lines = [] + complete = False + + def __init__(self, text): + # use Unix LF only + text = text.replace('\r\n', '\r') + + # Split into lines + oom_lines = [] + inside_oom = False + + for line in text.split('\n'): + + if "invoked oom-killer:" in line: + inside_oom = True + elif not inside_oom: + continue + + # Remove leading timestamps + line = self.REC_TIMESTAMP.sub('', line) + + # remove empty lines + if not line.strip(): + continue + + oom_lines.append(line) + + # next line will not be part of the oom anymore + if "Killed process" in line: + inside_oom = False + break + + self.i = 0 + self.complete = not inside_oom + self.lines = oom_lines + self.text = '\n'.join(oom_lines) + + def back(self): + """Return the 
previous line""" + if self.i - 1 < 0: + raise StopIteration() + self.i -= 1 + return self.lines[self.i] + + def current(self): + """Return the current line""" + return self.lines[self.i] + + def next(self): + """Return the next line""" + if self.i + 1 < len(self.lines): + self.i += 1 + return self.lines[self.i] + raise StopIteration() + + def find_text(self, pattern): + """ + Search the pattern and set the position to the first found line. + Otherwise the position pointer won't be changed. + + :param pattern: Text to fine + :type pattern: str + + :return: True if the marker has found. + """ + for line in self.lines: + if pattern in line: + self.i = self.lines.index(line) + return True + return False + + def __iter__(self): + return self + + def __next__(self): + return self.next() + + +class OOMAnalyser(object): + example = u'''\ +sed invoked oom-killer: gfp_mask=0x201da, order=0, oom_score_adj=0 +sed cpuset=/ mems_allowed=0-1 +CPU: 4 PID: 29481 Comm: sed Not tainted 3.10.0-514.6.1.el7.x86_64 #1 +Hardware name: HP ProLiant DL385 G7, BIOS A18 12/08/2012 + ffff880182272f10 00000000021dcb0a ffff880418207938 ffffffff816861ac + ffff8804182079c8 ffffffff81681157 ffffffff810eab9c ffff8804182fe910 + ffff8804182fe928 0000000000000202 ffff880182272f10 ffff8804182079b8 +Call Trace: + [] dump_stack+0x19/0x1b + [] dump_header+0x8e/0x225 + [] ? ktime_get_ts64+0x4c/0xf0 + [] ? delayacct_end+0x8f/0xb0 + [] oom_kill_process+0x24e/0x3c0 + [] ? oom_unkillable_task+0xcd/0x120 + [] ? find_lock_task_mm+0x56/0xc0 + [] ? has_capability_noaudit+0x1e/0x30 + [] out_of_memory+0x4b6/0x4f0 + [] __alloc_pages_slowpath+0x5d7/0x725 + [] __alloc_pages_nodemask+0x405/0x420 + [] alloc_pages_current+0xaa/0x170 + [] __page_cache_alloc+0x97/0xb0 + [] filemap_fault+0x170/0x410 + [] ext4_filemap_fault+0x36/0x50 [ext4] + [] __do_fault+0x4c/0xc0 + [] do_read_fault.isra.42+0x43/0x130 + [] handle_mm_fault+0x6b1/0xfe0 + [] ? 
do_mmap_pgoff+0x305/0x3c0 + [] __do_page_fault+0x154/0x450 + [] do_page_fault+0x35/0x90 + [] page_fault+0x28/0x30 +Mem-Info: +active_anon:7355653 inactive_anon:660960 isolated_anon:0 + active_file:1263 inactive_file:1167 isolated_file:32 + unevictable:0 dirty:4 writeback:0 unstable:0 + slab_reclaimable:27412 slab_unreclaimable:13708 + mapped:4818 shmem:87896 pagetables:25222 bounce:0 + free:39513 free_pcp:2958 free_cma:0 +Node 0 DMA free:15872kB min:40kB low:48kB high:60kB active_anon:0kB inactive_anon:0kB active_file:0kB inactive_file:0kB unevictable:0kB isolated(anon):0kB isolated(file):0kB present:15992kB managed:15908kB mlocked:0kB dirty:0kB writeback:0kB mapped:0kB shmem:0kB slab_reclaimable:0kB slab_unreclaimable:0kB kernel_stack:0kB pagetables:0kB unstable:0kB bounce:0kB free_pcp:0kB local_pcp:0kB free_cma:0kB writeback_tmp:0kB pages_scanned:0 all_unreclaimable? yes lowmem_reserve[]: 0 2780 15835 15835 +Node 0 DMA32 free:59728kB min:7832kB low:9788kB high:11748kB active_anon:2154380kB inactive_anon:604748kB active_file:500kB inactive_file:112kB unevictable:0kB isolated(anon):0kB isolated(file):0kB present:3094644kB managed:2848912kB mlocked:0kB dirty:0kB writeback:0kB mapped:4016kB shmem:5140kB slab_reclaimable:6448kB slab_unreclaimable:2796kB kernel_stack:1040kB pagetables:6876kB unstable:0kB bounce:0kB free_pcp:3788kB local_pcp:228kB free_cma:0kB writeback_tmp:0kB pages_scanned:28 all_unreclaimable? no lowmem_reserve[]: 0 0 13055 13055 +Node 0 Normal free:36692kB min:36784kB low:45980kB high:55176kB active_anon:12301636kB inactive_anon:793132kB active_file:604kB inactive_file:176kB unevictable:0kB isolated(anon):0kB isolated(file):128kB present:13631488kB managed:13368348kB mlocked:0kB dirty:0kB writeback:0kB mapped:4108kB shmem:207940kB slab_reclaimable:47900kB slab_unreclaimable:28884kB kernel_stack:6624kB pagetables:43340kB unstable:0kB bounce:0kB free_pcp:4204kB local_pcp:640kB free_cma:0kB writeback_tmp:0kB pages_scanned:128 all_unreclaimable? 
no lowmem_reserve[]: 0 0 0 0 +Node 1 Normal free:49436kB min:45444kB low:56804kB high:68164kB active_anon:14967844kB inactive_anon:1244560kB active_file:1552kB inactive_file:1992kB unevictable:0kB isolated(anon):0kB isolated(file):0kB present:16777212kB managed:16514220kB mlocked:0kB dirty:16kB writeback:0kB mapped:10760kB shmem:138504kB slab_reclaimable:55300kB slab_unreclaimable:23152kB kernel_stack:6176kB pagetables:50672kB unstable:0kB bounce:0kB free_pcp:3360kB local_pcp:248kB free_cma:0kB writeback_tmp:0kB pages_scanned:125777 all_unreclaimable? yes lowmem_reserve[]: 0 0 0 0 +Node 0 DMA: 0*4kB 0*8kB 0*16kB 0*32kB 2*64kB (U) 1*128kB (U) 1*256kB (U) 0*512kB 1*1024kB (U) 1*2048kB (M) 3*4096kB (M) = 15872kB +Node 0 DMA32: 203*4kB (UEM) 231*8kB (UEM) 259*16kB (UEM) 231*32kB (UEM) 157*64kB (UEM) 90*128kB (UEM) 49*256kB (UEM) 20*512kB (UE) 3*1024kB (UEM) 1*2048kB (M) 0*4096kB = 63668kB +Node 0 Normal: 1231*4kB (UEM) 391*8kB (UEM) 456*16kB (UEM) 342*32kB (UEM) 141*64kB (UEM) 23*128kB (UEM) 0*256kB 0*512kB 0*1024kB 0*2048kB 0*4096kB = 38260kB +Node 1 Normal: 2245*4kB (UEM) 732*8kB (UEM) 594*16kB (UEM) 396*32kB (UEM) 160*64kB (UEM) 16*128kB (UEM) 2*256kB (UM) 0*512kB 1*1024kB (M) 0*2048kB 0*4096kB = 50836kB +Node 0 hugepages_total=0 hugepages_free=0 hugepages_surp=0 hugepages_size=1048576kB +Node 0 hugepages_total=0 hugepages_free=0 hugepages_surp=0 hugepages_size=2048kB +Node 1 hugepages_total=0 hugepages_free=0 hugepages_surp=0 hugepages_size=1048576kB +Node 1 hugepages_total=0 hugepages_free=0 hugepages_surp=0 hugepages_size=2048kB +100155 total pagecache pages +11342 pages in swap cache +Swap cache stats: add 31260615, delete 31249273, find 295999950/297583545 +Free swap = 0kB +Total swap = 8388604kB +8379834 pages RAM +0 pages HighMem/MovableOnly +192987 pages reserved +[ pid ] uid tgid total_vm rss nr_ptes swapents oom_score_adj name +[ 390] 0 390 39012 6739 78 51 0 systemd-journal +[ 433] 0 433 11104 2 22 360 -1000 systemd-udevd +[ 530] 0 530 13854 28 27 83 
-1000 auditd +[ 559] 0 559 7692 65 19 87 0 systemd-logind +[ 563] 0 563 4817 41 14 36 0 irqbalance +[ 569] 87 569 7684 52 20 48 -900 dbus-daemon +[ 587] 32 587 16240 17 34 116 0 rpcbind +[ 647] 0 647 50303 11 36 113 0 gssproxy +[ 796] 0 796 193856 2897 207 112 0 rsyslogd +[ 818] 0 818 13177 0 27 146 0 vsftpd +[ 840] 0 840 62892 9 36 103 0 ypbind +[ 868] 0 868 21663 28 43 191 -1000 sshd +[ 871] 29 871 11126 2 25 222 0 rpc.statd +[ 907] 0 907 8044 4 21 53 0 atd +[ 916] 0 916 27509 2 10 30 0 agetty +[ 934] 0 934 27509 2 10 31 0 agetty +[ 1255] 0 1255 45716 1 39 337 0 rscd +[ 1268] 0 1268 45746 28 38 353 0 rscd +[ 1269] 0 1269 45716 29 38 311 0 rscd +[ 1285] 0 1285 23290 25 45 235 0 master +[ 1287] 89 1287 23379 52 47 242 0 qmgr +[ 1830] 0 1830 446643 959 68 1234 0 ovcd +[ 2062] 0 2062 144894 511 37 309 0 ovbbccb +[ 2121] 0 2121 33138 26 19 138 0 crond +[ 2136] 38 2136 7846 40 19 88 0 ntpd +[ 2451] 0 2451 177827 0 36 816 0 ovconfd +[ 8145] 0 8145 300303 1616 58 692 0 hpsensor +[ 8204] 0 8204 31508 119 31 328 0 opcmsgi +[ 8405] 0 8405 201479 1289 49 244 0 opcmsga +[ 8472] 0 8472 134080 236 46 514 0 opcmona +[ 8596] 0 8596 31377 172 29 301 0 opcle +[ 8658] 0 8658 81199 124 34 336 0 opcacta +[ 8685] 0 8685 137169 23313 97 3256 0 oacore +[ 6330] 12345 6330 7520 15 18 61 0 rotatelogs +[ 6331] 12345 6331 28318 0 12 83 0 run.sh +[ 6576] 12345 6576 8478546 5157063 15483 1527848 0 java +[27171] 12345 27171 7522 10 18 58 0 rotatelogs +[27172] 12345 27172 28320 3 11 94 0 run.sh +[27502] 12345 27502 4029300 2716569 6505 226225 0 java +[11729] 0 11729 64122 5003 79 2465 0 snmpd +[12130] 0 12130 122202 565 29 175 0 hpasmlited +[12166] 0 12166 11905 89 24 121 0 cmahealthd +[12190] 0 12190 11871 89 24 119 0 cmastdeqd +[12214] 0 12214 13707 84 31 211 0 cmahostd +[12237] 0 12237 12493 38 28 352 0 cmathreshd +[12276] 0 12276 12368 45 30 210 0 cmasm2d +[12299] 0 12299 12485 43 26 282 0 cmaperfd +[12324] 0 12324 31932 184 31 143 0 cmapeerd +[12352] 0 12352 14280 48 32 169 0 cmaeventd 
+[12379] 0 12379 14831 26 30 198 0 cmafcad +[12407] 0 12407 11806 12 25 128 0 cmasasd +[12436] 0 12436 14364 86 31 181 0 cmaidad +[12463] 0 12463 11288 15 25 125 0 cmaided +[12492] 0 12492 11805 14 26 127 0 cmascsid +[12523] 0 12523 92228 129 63 433 0 cmanicd +[14002] 0 14002 11803 12 25 128 0 cmasm2d +[32615] 0 32615 36254 323 73 7 0 sshd +[ 894] 12345 894 36254 328 70 5 0 sshd +[ 895] 12345 895 3389 123 11 0 0 ksh +[10620] 0 10620 36254 328 72 0 0 sshd +[10634] 38714 10634 36290 329 70 8 0 sshd +[10635] 38714 10635 14221 25 31 124 0 sftp-server +[29021] 0 29021 36254 314 69 0 0 sshd +[29025] 12345 29025 36254 316 67 0 0 sshd +[29026] 12345 29026 29286 96 12 1 0 ksh +[29051] 12345 29051 29494 330 12 74 0 svr05 +[29979] 12345 29979 1666 42 9 0 0 less +[29662] 89 29662 23316 258 43 0 0 pickup +[26065] 89 26065 23317 256 45 0 0 trivial-rewrite +[26066] 89 26066 23353 265 45 0 0 cleanup +[26067] 89 26067 23368 271 45 0 0 smtp +[26743] 0 26743 36254 314 68 0 0 sshd +[26937] 12345 26937 36254 314 67 0 0 sshd +[26938] 12345 26938 29286 96 11 0 0 ksh +[27122] 12345 27122 29494 459 12 0 0 svr05 +[28657] 0 28657 36254 314 74 0 0 sshd +[28702] 12345 28702 36254 314 72 0 0 sshd +[28703] 12345 28703 29286 97 11 0 0 ksh +[28993] 0 28993 36254 314 72 0 0 sshd +[28996] 12345 28996 29526 531 12 0 0 svr05 +[29006] 12345 29006 36254 314 69 0 0 sshd +[29007] 12345 29007 29286 96 11 0 0 ksh +[29110] 12345 29110 29558 745 12 0 0 svr05 +[29481] 12345 29481 29214 58 14 0 0 sed +[29752] 12345 29752 7522 296 19 0 0 rotatelogs +Out of memory: Kill process 6576 (java) score 651 or sacrifice child +Killed process 6576 (java) total-vm:33914892kB, anon-rss:20629004kB, file-rss:0kB, shmem-rss:0kB + ''' + + REC_INVOKED_OOMKILLER = re.compile(r'^(?P[\w ]+) invoked oom-killer:', re.MULTILINE) + + REC_PID_KERNELVERSION = re.compile( + r'^CPU: \d+ PID: (?P\d+) ' + r'Comm: .* (Not tainted|Tainted:.*) ' + r'(?P\d[\w.-]+) #\d', + re.MULTILINE + ) + + # split caused by a limited number of iterations 
during converting PY regex into JS regex + REC_MEMINFO_1 = re.compile( + # head line + r'^Mem-Info:.*' + + # first line break + r'(?:\n)' + + # first line (starting with a space) + r'^active_anon:(?P\d+) inactive_anon:(?P\d+) ' + r'isolated_anon:(?P\d+)' + + # next line break + r'(?:\n)' + + # remaining lines (with leading space) + r'^ active_file:(?P\d+) inactive_file:(?P\d+) ' + r'isolated_file:(?P\d+)' + + # next line break + r'(?:\n)' + + r'^ unevictable:(?P\d+) dirty:(?P\d+) writeback:(?P\d+) ' + r'unstable:(?P\d+)' + + # # next line break + # r'(?:\n)' + # + , re.MULTILINE + ) + + REC_MEMINFO_2 = re.compile( + r'^ slab_reclaimable:(?P\d+) slab_unreclaimable:(?P\d+)' + + # next line break + r'(?:\n)' + + r'^ mapped:(?P\d+) shmem:(?P\d+) pagetables:(?P\d+) ' + r'bounce:(?P\d+)' + + # next line break + r'(?:\n)' + + r'^ free:(?P\d+) free_pcp:(?P\d+) free_cma:(?P\d+)' + + , re.MULTILINE + ) + + + REC_MEM_NODEINFO = re.compile(r'(^Node \d+ (DMA|Normal|hugepages).*(:?\n))+', re.MULTILINE) + + mem_modinfo_entries = ("active_anon_pages", "inactive_anon_pages", "isolated_anon_pages", + "active_file_pages", "inactive_file_pages", "isolated_file_pages", + "unevictable_pages", "dirty_pages", "writeback_pages", "unstable_pages", + "slab_reclaimable_pages", "slab_unreclaimable_pages", + "mapped_pages", "shmem_pages", "pagetables_pages", "bounce_pages", + "free_pages", "free_pcp_pages", "free_cma_pages", + ) + + REC_PAGECACHE = re.compile(r'^(?P\d+) total pagecache pages.*$', re.MULTILINE) + + REC_SWAP = re.compile( + r'^(?P\d+) pages in swap cache' + r'(?:\n)' + r'^Swap cache stats: add \d+, delete \d+, find \d+/\d+' + r'(?:\n)' + r'^Free swap = (?P\d+)kB' + r'(?:\n)' + r'^Total swap = (?P\d+)kB', + re.MULTILINE) + + REC_PAGEINFO = re.compile( + r'^(?P\d)+ pages RAM' + r'(?:\n)' + r'^(?P\d+) pages HighMem/MovableOnly' + r'(?:\n)' + r'^(?P\d+) pages reserved', + re.MULTILINE) + + REC_PROCESSES = re.compile( + r'^\[ pid \].*(?:\n)' + r'(^(\[[ \d]+.+)(?:\n))+', + 
re.MULTILINE) + + REC_KILLED = re.compile( + r'^Out of memory: Kill process (?P\d+) \((?P[\w ]+)\) ' + r'score (?P\d+) or sacrifice child' + r'(?:\n)' + r'Killed process \d+ \(.*\) total-vm:(?P\d+)kB, anon-rss:(?P\d+)kB, ' + r'file-rss:(?P\d+)kB, shmem-rss:(?P\d+)kB' + , + re.MULTILINE) + + lines = [] + """All lines of an OOM without leading timestamps""" + + details = {} + """Extracted details""" + + # Reference to the OOM object + oom = None + + svg_namespace = 'http://www.w3.org/2000/svg' + + svg_colours = ['#f20000', '#591616', '#cc6666', '#594343', '#d96c36', + '#7f5540', '#e6bfac', '#b27700', '#402b00', '#ffd580', + '#8c8c69', '#99e600', '#558000', '#d2e6ac', '#464d39', + '#004d00', '#36d96c', '#6cd9b5', '#005959', '#004d4d', + '#004040', '#739999', '#297ca6', '#80d5ff', '#1a2b33', + ] + + def __init__(self): + self._set_defaults() + + def _set_single_item(self, item): + """ + Set content of a single item to the HTML element with the same name. + + The content won't be formatted. + """ + element = document.getElementById(item) + if not element: + print("ERROR: HTML element not found: ", item) + return + content = self.details.get(item, '') + if type(content) is str: + content = content.strip() + element.textContent = content + if DEBUG: + show_element('error_box') + + def _set_defaults(self, clean_oom=True): + """\ + Reset the whole HTML document + """ + if clean_oom: + document.getElementById('textarea_oom').textContent = "" + + hide_element("analysis") + self.lines = [] + self.details = {} + for item in self.mem_modinfo_entries: + element = document.getElementById(item) + element.textContent = "" + + # empty terminal + element = document.getElementById('__terminal__') + element.textContent = "" + hide_element('error_box') + + # remove svg charts + element = document.getElementById('svg_swap') + while element.firstChild: + element.removeChild(element.firstChild) + + def _create_svg_element(self, height, width): + """ + Return an empty SVG element + """ + svg 
= document.createElementNS(self.svg_namespace, 'svg') + svg.setAttribute('version', '1.1') + svg.setAttribute('height', height) + svg.setAttribute('width', width) + svg.setAttribute('viewBox', '0 0 {} {}'.format(width, height)) + return svg + + def _create_svg_rect(self, x=0, y=0, width=0, height=0, colour=None): + rect = document.createElementNS(self.svg_namespace, 'rect') + if x: + rect.setAttribute('x', x) + if y: + rect.setAttribute('y', y) + if width: + rect.setAttribute('width', width) + if height: + rect.setAttribute('height', height) + if colour: + rect.setAttribute('fill', colour) + return rect + + def _generate_svg_bar_chart(self, *elements): + """ + Generate a SVG bar chart + """ + bar_height = 100 + label_height = 80 + length_factor = 4 + overall_height = bar_height + label_height + overall_width = 100 * length_factor + + svg = self._create_svg_element(overall_height, overall_width) + + sum_all_elements = sum([length for unused, length in elements]) + + current_pos = 0 + bar_group = document.createElementNS(self.svg_namespace, 'g') + bar_group.setAttribute('id', 'bar_group') + bar_group.setAttribute('stroke', 'black') + bar_group.setAttribute('stroke-width', 2) + + nr_processed_elements = 0 + for title, length in elements: + rect_len = int(100 * length / sum_all_elements) * length_factor + + if not rect_len: + continue + + colour = self.svg_colours[nr_processed_elements] + + rect = self._create_svg_rect(current_pos, 0, rect_len, bar_height, colour) + bar_group.appendChild(rect) + + label_group = document.createElementNS(self.svg_namespace, 'g') + label_group.setAttribute('id', title) + colour_rect = self._create_svg_rect(0, 0, 20, 20, colour) + colour_rect.setAttribute('stroke', 'black') + colour_rect.setAttribute('stroke-width', 2) + + text = document.createElementNS(self.svg_namespace, 'text') + text.setAttribute('x', '30') + text.setAttribute('y', '18') + text.textContent = title + + label_group.appendChild(colour_rect) + 
label_group.appendChild(text) + + # TODO replace hardcoded values + x = 5 + 125 * (nr_processed_elements // 2) + y = bar_height + 10 + (nr_processed_elements % 2) * 40 + label_group.setAttribute('transform', 'translate({}, {})'.format(x, y)) + + bar_group.appendChild(label_group) + + current_pos += rect_len + nr_processed_elements += 1 + + svg.appendChild(bar_group) + + return svg + + def _extract_block_from_next_pos(self, marker): + """ + Extract a block starting with the marker and add all lines with a leading space character + + :rtype: str + """ + block = '' + if not self.oom.find_text(marker): + return block + + line = self.oom.current() + block += "{}\n".format(line) + for line in self.oom: + if not line.startswith(' '): + self.oom.back() + break + block += "{}\n".format(line) + return block + + def _extract_from_oom_text(self): + """Extract details from OOM message text""" + match = self.REC_INVOKED_OOMKILLER.search(self.oom.text) + if match: + self.details.update(match.groupdict()) + + match = self.REC_PID_KERNELVERSION.search(self.oom.text) + if match: + self.details.update(match.groupdict()) + + self.details['hardware_info'] = self._extract_block_from_next_pos('Hardware name:') + self.details['call_trace'] = self._extract_block_from_next_pos('Call Trace:') + + match = self.REC_MEMINFO_1.search(self.oom.text) + if match: + self.details.update(match.groupdict()) + + match = self.REC_MEMINFO_2.search(self.oom.text) + if match: + self.details.update(match.groupdict()) + + match = self.REC_MEM_NODEINFO.search(self.oom.text) + if match: + self.details['mem_node_info'] = match.group() + + match = self.REC_PAGECACHE.search(self.oom.text) + if match: + self.details.update(match.groupdict()) + + match = self.REC_SWAP.search(self.oom.text) + if match: + self.details.update(match.groupdict()) + + # TODO Add to HTML + #match = self.REC_PAGEINFO.search(self.oom.text) + #if match: + # self.details.update(match.groupdict()) + + match = 
self.REC_PROCESSES.search(self.oom.text) + if match: + self.details['process_table'] = match.group() + + match = self.REC_KILLED.search(self.oom.text) + if match: + self.details.update(match.groupdict()) + + def _calc_from_oom_details(self): + """ + Calculate values from already extracted details + + @see: self.details + """ + # TODO Check if bug in transcrypt + # for item in self.details: -> "Uncaught TypeError: Result of the Symbol.iterator" + + # convert all *_pages and *_kb to integer + for item in self.details.keys(): + if item.endswith('_kb') or item.endswith('_pages'): + try: + self.details[item] = int(self.details[item]) + except: + error('Converting item {}: {} to integer failed'. format(item, self.details[item])) + + kernel_version = self.details.get('kernel_version', '') + if 'x86_64' in kernel_version: + self.details['platform'] = 'x86 64bit' + else: + self.details['platform'] = 'unknown' + + # guess distribution from kernel version + if '.el7' in kernel_version: + self.details['dist'] = 'RHEL/CentOS 7' + elif '.el6' in kernel_version: + self.details['dist'] = 'RHEL/CentOS 6' + elif '.el5' in kernel_version: + self.details['dist'] = 'RHEL/CentOS 5' + elif 'ARCH' in kernel_version: + self.details['dist'] = 'Arch Linux' + elif '_generic' in kernel_version: + self.details['dist'] = 'Ubuntu' + else: + self.details['dist'] = 'unknown' + + # educated guess + self.details['page_size'] = 4 + + self.details['swap_cache_kb'] = self.details['swap_cache_pages'] * self.details['page_size'] + del self.details['swap_cache_pages'] + + # SwapUsed = SwapTotal - SwapFree - SwapCache + self.details['swap_used_kb'] = self.details['swap_total_kb'] - self.details['swap_free_kb'] - \ + self.details['swap_cache_kb'] + + def _show_details(self): + """ + Show all extracted details as well as additionally generated information + """ + if DEBUG: + print(self.details) + + show_element("analysis") + + for item in self.details.keys(): + self._set_single_item(item) + + svg_swap = 
self._generate_svg_bar_chart( + ('Swap Used', self.details['swap_used_kb']), + ('Swap Free', self.details['swap_free_kb']), + ('Swap Cached', self.details['swap_cache_kb']), + ) + elem_svg_swap = document.getElementById('svg_swap') + elem_svg_swap.appendChild(svg_swap) + + svg_ram = self._generate_svg_bar_chart( + ('Active mem', self.details['active_anon_pages']), + ('Inactive mem', self.details['inactive_anon_pages']), + ('Isolated mem', self.details['isolated_anon_pages']), + ('Active PC', self.details['active_file_pages']), + ('Inactive PC', self.details['inactive_file_pages']), + ('Isolated PC', self.details['isolated_file_pages']), + ('Unevictable', self.details['unevictable_pages']), + ('Dirty', self.details['dirty_pages']), + ('Writeback', self.details['writeback_pages']), + ('Unstable', self.details['unstable_pages']), + ('Slab reclaimable', self.details['slab_reclaimable_pages']), + ('Slab unreclaimable', self.details['slab_unreclaimable_pages']), + ('Mapped', self.details['mapped_pages']), + ('Shared', self.details['shmem_pages']), + ('Pagetable', self.details['pagetables_pages']), + ('Bounce', self.details['bounce_pages']), + ('Free', self.details['free_pages']), + ('Free PCP', self.details['free_pcp_pages']), + ('Free CMA', self.details['free_cma_pages']), + ) + elem_svg_ram = document.getElementById('svg_ram') + elem_svg_ram.appendChild(svg_ram) + + + def analyse(self): + # reset the output elements to default + self._set_defaults(False) + element = document.getElementById('textarea_oom') + oom_text = element.textContent + self.oom = OOM(oom_text) + + if not self.oom.complete: + error('The inserted test is not a valid OOM!') + return + + self._extract_from_oom_text() + self._calc_from_oom_details() + self._show_details() + + def reset(self): + self._set_defaults() + + def copy_example(self): + document.getElementById('textarea_oom').textContent = self.example + + +oomAnalyser = OOMAnalyser() diff --git a/README.md b/README.md new file mode 100644 index 
0000000..7f46ddc --- /dev/null +++ b/README.md @@ -0,0 +1,90 @@ +# Linux OOM Analyser + +I started this project to give the Python to JavaScript compiler +[Transcrypt](https://www.transcrypt.org/) a try. + +This web page splits the content of a Linux Out Of Memory message into +smaller pieces, aggregates these and presents them in a more human-friendly +format. + + +## Design Goals + * A local copy of the web page should run offline - without an Internet + connection, without loading 3rd-party libraries or transferring data to + foreign servers + * A better understanding of Linux memory management + * Start learning JavaScript, CSS and HTML + + +## Requirements + * [Python](http://www.python.org) 3.6 or later + * [Transcrypt](https://www.transcrypt.org/) 3.6.53 or later + + +## Installation +Install the Python virtual environment + +Use the provided Makefile: + +``` +# make venv +``` + +or set up the virtual environment manually: + +``` +# virtualenv env +# . env/bin/activate +# env/bin/pip install -Ur requirements.txt +``` + +## Build +Use the provided Makefile: +``` +# make venv +``` + +or build it manually: + +``` +# . env/bin/activate +# transcrypt --build --map --nomin -e 6 OOMAnalyser.py +``` + +## Further Information + * [Transcrypt](https://www.transcrypt.org/) + * [Linux man pages online](https://man7.org/) + * [Decoding the Linux kernel's page allocation failure messages](https://utcc.utoronto.ca/~cks/space/blog/linux/DecodingPageAllocFailures) + * [Linux Kernel OOM Log Analysis](http://elearningmedium.com/linux-kernel-oom-log-analysis/) + + +## Known Bugs/Issues + +Check the bug tracker on [GitHub](https://github.com/CarstenGrohmann/OOMAnalyser/issues) for currently open bugs. +New bugs can also be reported there.
+ +## License +``` +Copyright (c) 2017 Carsten Grohmann mail carsten-grohmann.de + +Permission is hereby granted, free of charge, to any person obtaining a copy of +this software and associated documentation files (the "Software"), to deal in +the Software without restriction, including without limitation the rights to +use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies +of the Software, and to permit persons to whom the Software is furnished to do +so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. +``` + +Enjoy! +Carsten Grohmann diff --git a/requirements.txt b/requirements.txt new file mode 100644 index 0000000..10a64c8 --- /dev/null +++ b/requirements.txt @@ -0,0 +1 @@ +Transcrypt>=3.6.53