1
0
mirror of https://github.com/kellyjonbrazil/jc.git synced 2025-06-23 00:29:59 +02:00

add pidstat-s parser

This commit is contained in:
Kelly Brazil
2022-03-09 16:07:29 -08:00
parent c52ca20e28
commit 0d13909cf6
2 changed files with 168 additions and 0 deletions

View File

@ -64,6 +64,7 @@ parsers = [
'ntpq', 'ntpq',
'passwd', 'passwd',
'pidstat', 'pidstat',
'pidstat-s',
'ping', 'ping',
'ping-s', 'ping-s',
'pip-list', 'pip-list',

167
jc/parsers/pidstat_s.py Normal file
View File

@ -0,0 +1,167 @@
"""jc - JSON Convert `pidstat` command output streaming parser
> This streaming parser outputs JSON Lines
<<Short pidstat description and caveats>>
Usage (cli):
$ pidstat | jc --pidstat-s
Usage (module):
import jc
# result is an iterable object (generator)
result = jc.parse('pidstat_s', pidstat_command_output.splitlines())
for item in result:
# do something
or
import jc.parsers.pidstat_s
# result is an iterable object (generator)
result = jc.parsers.pidstat_s.parse(pidstat_command_output.splitlines())
for item in result:
# do something
Schema:
{
"pidstat": string,
# Below object only exists if using -qq or ignore_exceptions=True
"_jc_meta":
{
"success": boolean, # false if error parsing
"error": string, # exists if "success" is false
"line": string # exists if "success" is false
}
}
Examples:
$ pidstat | jc --pidstat-s
{example output}
...
$ pidstat | jc --pidstat-s -r
{example output}
...
"""
from typing import Dict, Iterable, Union
import jc.utils
from jc.streaming import (
add_jc_meta, streaming_input_type_check, streaming_line_input_type_check, raise_or_yield
)
from jc.parsers.universal import simple_table_parse
from jc.exceptions import ParseError
class info():
"""Provides parser metadata (version, author, etc.)"""
version = '1.0'
description = '`pidstat` command streaming parser'
author = 'Kelly Brazil'
author_email = 'kellyjonbrazil@gmail.com'
compatible = ['linux']
streaming = True
__version__ = info.version
def _process(proc_data: Dict) -> Dict:
"""
Final processing to conform to the schema.
Parameters:
proc_data: (Dictionary) raw structured data to process
Returns:
Dictionary. Structured data to conform to the schema.
"""
int_list = ['time', 'uid', 'pid', 'cpu', 'vsz', 'rss', 'stksize', 'stkref']
float_list = ['percent_usr', 'percent_system', 'percent_guest', 'percent_cpu',
'minflt_s', 'majflt_s', 'percent_mem', 'kb_rd_s', 'kb_wr_s',
'kb_ccwr_s', 'cswch_s', 'nvcswch_s']
for key in proc_data:
if key in int_list:
proc_data[key] = jc.utils.convert_to_int(proc_data[key])
if key in float_list:
proc_data[key] = jc.utils.convert_to_float(proc_data[key])
return proc_data
@add_jc_meta
def parse(
data: Iterable[str],
raw: bool = False,
quiet: bool = False,
ignore_exceptions: bool = False
) -> Union[Iterable[Dict], tuple]:
"""
Main text parsing generator function. Returns an iterator object.
Parameters:
data: (iterable) line-based text data to parse
(e.g. sys.stdin or str.splitlines())
raw: (boolean) unprocessed output if True
quiet: (boolean) suppress warning messages if True
ignore_exceptions: (boolean) ignore parsing exceptions if True
Yields:
Dictionary. Raw or processed structured data.
Returns:
Iterator object (generator)
"""
jc.utils.compatibility(__name__, info.compatible, quiet)
streaming_input_type_check(data)
found_first_hash = False
header = ''
for line in data:
try:
streaming_line_input_type_check(line)
output_line: Dict = {}
if not line.strip():
# skip blank lines
continue
if not line.startswith('#') and not found_first_hash:
# skip preample lines before header row
continue
if line.startswith('#') and not found_first_hash:
# normalize header
header = line.replace('#', ' ')\
.replace('/', '_')\
.replace('%', 'percent_')\
.lower()
found_first_hash = True
continue
if line.startswith('#') and found_first_hash:
# skip header lines after first one is found
continue
output_line = simple_table_parse([header, line])[0]
if output_line:
yield output_line if raw else _process(output_line)
else:
raise ParseError('Not pidstat data')
except Exception as e:
yield raise_or_yield(ignore_exceptions, e, line)