Edit File by line

#! /usr/libexec/platform-python

[0] Fix | Delete

"""

[1] Fix | Delete

Utility for converting *_clat_hist* files generated by fio into latency statistics.

[2] Fix | Delete

[3] Fix | Delete

Example usage:

[4] Fix | Delete

[5] Fix | Delete

$ fiologparser_hist.py *_clat_hist*

[6] Fix | Delete

end-time, samples, min, avg, median, 90%, 95%, 99%, max

[7] Fix | Delete

1000, 15, 192, 1678.107, 1788.859, 1856.076, 1880.040, 1899.208, 1888.000

[8] Fix | Delete

2000, 43, 152, 1642.368, 1714.099, 1816.659, 1845.552, 1888.131, 1888.000

[9] Fix | Delete

4000, 39, 1152, 1546.962, 1545.785, 1627.192, 1640.019, 1691.204, 1744

[10] Fix | Delete

...

[11] Fix | Delete

[12] Fix | Delete

@author Karl Cronburg <karl.cronburg@gmail.com>

[13] Fix | Delete

"""

[14] Fix | Delete

import os

[15] Fix | Delete

import sys

[16] Fix | Delete

import pandas

[17] Fix | Delete

import re

[18] Fix | Delete

import numpy as np

[19] Fix | Delete

[20] Fix | Delete

runascmd = False

[21] Fix | Delete

[22] Fix | Delete

err = sys.stderr.write

[23] Fix | Delete

[24] Fix | Delete

class HistFileRdr():

[25] Fix | Delete

""" Class to read a hist file line by line, buffering

[26] Fix | Delete

a value array for the latest line, and allowing a preview

[27] Fix | Delete

of the next timestamp in next line

[28] Fix | Delete

Note: this does not follow a generator pattern, but must explicitly

[29] Fix | Delete

get next bin array.

[30] Fix | Delete

"""

[31] Fix | Delete

def __init__(self, file):

[32] Fix | Delete

self.fp = open(file, 'r')

[33] Fix | Delete

self.data = self.nextData()

[34] Fix | Delete

[35] Fix | Delete

def close(self):

[36] Fix | Delete

self.fp.close()

[37] Fix | Delete

self.fp = None

[38] Fix | Delete

[39] Fix | Delete

def nextData(self):

[40] Fix | Delete

self.data = None

[41] Fix | Delete

if self.fp:

[42] Fix | Delete

line = self.fp.readline()

[43] Fix | Delete

if line == "":

[44] Fix | Delete

self.close()

[45] Fix | Delete

else:

[46] Fix | Delete

self.data = [int(x) for x in line.replace(' ', '').rstrip().split(',')]

[47] Fix | Delete

[48] Fix | Delete

return self.data

[49] Fix | Delete

[50] Fix | Delete

@property

[51] Fix | Delete

def curTS(self):

[52] Fix | Delete

ts = None

[53] Fix | Delete

if self.data:

[54] Fix | Delete

ts = self.data[0]

[55] Fix | Delete

return ts

[56] Fix | Delete

[57] Fix | Delete

@property

[58] Fix | Delete

def curDir(self):

[59] Fix | Delete

d = None

[60] Fix | Delete

if self.data:

[61] Fix | Delete

d = self.data[1]

[62] Fix | Delete

return d

[63] Fix | Delete

[64] Fix | Delete

@property

[65] Fix | Delete

def curBins(self):

[66] Fix | Delete

return self.data[3:]

[67] Fix | Delete

[68] Fix | Delete

def weighted_percentile(percs, vs, ws):

[69] Fix | Delete

""" Use linear interpolation to calculate the weighted percentile.

[70] Fix | Delete

[71] Fix | Delete

Value and weight arrays are first sorted by value. The cumulative

[72] Fix | Delete

distribution function (cdf) is then computed, after which np.interp

[73] Fix | Delete

finds the two values closest to our desired weighted percentile(s)

[74] Fix | Delete

and linearly interpolates them.

[75] Fix | Delete

[76] Fix | Delete

percs :: List of percentiles we want to calculate

[77] Fix | Delete

vs :: Array of values we are computing the percentile of

[78] Fix | Delete

ws :: Array of weights for our corresponding values

[79] Fix | Delete

return :: Array of percentiles

[80] Fix | Delete

"""

[81] Fix | Delete

idx = np.argsort(vs)

[82] Fix | Delete

vs, ws = vs[idx], ws[idx] # weights and values sorted by value

[83] Fix | Delete

cdf = 100 * (ws.cumsum() - ws / 2.0) / ws.sum()

[84] Fix | Delete

return np.interp(percs, cdf, vs) # linear interpolation

[85] Fix | Delete

[86] Fix | Delete

def weights(start_ts, end_ts, start, end):

[87] Fix | Delete

""" Calculate weights based on fraction of sample falling in the

[88] Fix | Delete

given interval [start,end]. Weights computed using vector / array

[89] Fix | Delete

computation instead of for-loops.

[90] Fix | Delete

[91] Fix | Delete

Note that samples with zero time length are effectively ignored

[92] Fix | Delete

(we set their weight to zero).

[93] Fix | Delete

[94] Fix | Delete

start_ts :: Array of start times for a set of samples

[95] Fix | Delete

end_ts :: Array of end times for a set of samples

[96] Fix | Delete

start :: int

[97] Fix | Delete

end :: int

[98] Fix | Delete

return :: Array of weights

[99] Fix | Delete

"""

[100] Fix | Delete

sbounds = np.maximum(start_ts, start).astype(float)

[101] Fix | Delete

ebounds = np.minimum(end_ts, end).astype(float)

[102] Fix | Delete

ws = (ebounds - sbounds) / (end_ts - start_ts)

[103] Fix | Delete

if np.any(np.isnan(ws)):

[104] Fix | Delete

err("WARNING: zero-length sample(s) detected. Log file corrupt"

[105] Fix | Delete

" / bad time values? Ignoring these samples.\n")

[106] Fix | Delete

ws[np.where(np.isnan(ws))] = 0.0;

[107] Fix | Delete

return ws

[108] Fix | Delete

[109] Fix | Delete

def weighted_average(vs, ws):

[110] Fix | Delete

return np.sum(vs * ws) / np.sum(ws)

[111] Fix | Delete

[112] Fix | Delete

[113] Fix | Delete

percs = None

[114] Fix | Delete

columns = None

[115] Fix | Delete

[116] Fix | Delete

def gen_output_columns(ctx):

[117] Fix | Delete

global percs,columns

[118] Fix | Delete

strpercs = re.split('[,:]', ctx.percentiles)

[119] Fix | Delete

percs = [50.0] # always print 50% in 'median' column

[120] Fix | Delete

percs.extend(list(map(float,strpercs)))

[121] Fix | Delete

if ctx.directions:

[122] Fix | Delete

columns = ["end-time", "dir", "samples", "min", "avg", "median"]

[123] Fix | Delete

else:

[124] Fix | Delete

columns = ["end-time", "samples", "min", "avg", "median"]

[125] Fix | Delete

columns.extend(list(map(lambda x: x+'%', strpercs)))

[126] Fix | Delete

columns.append("max")

[127] Fix | Delete

[128] Fix | Delete

def fmt_float_list(ctx, num=1):

[129] Fix | Delete

""" Return a comma separated list of float formatters to the required number

[130] Fix | Delete

of decimal places. For instance:

[131] Fix | Delete

[132] Fix | Delete

fmt_float_list(ctx.decimals=4, num=3) == "%.4f, %.4f, %.4f"

[133] Fix | Delete

"""

[134] Fix | Delete

return ', '.join(["%%.%df" % ctx.decimals] * num)

[135] Fix | Delete

[136] Fix | Delete

# Default values - see beginning of main() for how we detect number columns in

[137] Fix | Delete

# the input files:

[138] Fix | Delete

__HIST_COLUMNS = 1216

[139] Fix | Delete

__NON_HIST_COLUMNS = 3

[140] Fix | Delete

__TOTAL_COLUMNS = __HIST_COLUMNS + __NON_HIST_COLUMNS

[141] Fix | Delete

[142] Fix | Delete

def read_chunk(rdr, sz):

[143] Fix | Delete

""" Read the next chunk of size sz from the given reader. """

[144] Fix | Delete

try:

[145] Fix | Delete

""" StopIteration occurs when the pandas reader is empty, and AttributeError

[146] Fix | Delete

occurs if rdr is None due to the file being empty. """

[147] Fix | Delete

new_arr = rdr.read().values

[148] Fix | Delete

except (StopIteration, AttributeError):

[149] Fix | Delete

return None

[150] Fix | Delete

[151] Fix | Delete

# Let's leave the array as is, and let later code ignore the block size

[152] Fix | Delete

return new_arr

[153] Fix | Delete

[154] Fix | Delete

#""" Extract array of the times, directions wo times, and histograms matrix without times column. """

[155] Fix | Delete

#times, rws, szs = new_arr[:,0], new_arr[:,1], new_arr[:,2]

[156] Fix | Delete

#hists = new_arr[:,__NON_HIST_COLUMNS:]

[157] Fix | Delete

#times = times.reshape((len(times),1))

[158] Fix | Delete

#dirs = rws.reshape((len(rws),1))

[159] Fix | Delete

#arr = np.append(times, hists, axis=1)

[160] Fix | Delete

#return arr

[161] Fix | Delete

[162] Fix | Delete

def get_min(fps, arrs):

[163] Fix | Delete

""" Find the file with the current first row with the smallest start time """

[164] Fix | Delete

return min([fp for fp in fps if not arrs[fp] is None], key=lambda fp: arrs.get(fp)[0][0])

[165] Fix | Delete

[166] Fix | Delete

def histogram_generator(ctx, fps, sz):

[167] Fix | Delete

[168] Fix | Delete

# Create a chunked pandas reader for each of the files:

[169] Fix | Delete

rdrs = {}

[170] Fix | Delete

for fp in fps:

[171] Fix | Delete

try:

[172] Fix | Delete

rdrs[fp] = pandas.read_csv(fp, dtype=int, header=None, chunksize=sz)

[173] Fix | Delete

except ValueError as e:

[174] Fix | Delete

if e.message == 'No columns to parse from file':

[175] Fix | Delete

if ctx.warn: sys.stderr.write("WARNING: Empty input file encountered.\n")

[176] Fix | Delete

rdrs[fp] = None

[177] Fix | Delete

else:

[178] Fix | Delete

raise(e)

[179] Fix | Delete

[180] Fix | Delete

# Initial histograms from disk:

[181] Fix | Delete

arrs = {fp: read_chunk(rdr, sz) for fp,rdr in rdrs.items()}

[182] Fix | Delete

while True:

[183] Fix | Delete

[184] Fix | Delete

try:

[185] Fix | Delete

""" ValueError occurs when nothing more to read """

[186] Fix | Delete

fp = get_min(fps, arrs)

[187] Fix | Delete

except ValueError:

[188] Fix | Delete

return

[189] Fix | Delete

arr = arrs[fp]

[190] Fix | Delete

arri = np.insert(arr[0], 1, fps.index(fp))

[191] Fix | Delete

yield arri

[192] Fix | Delete

arrs[fp] = arr[1:]

[193] Fix | Delete

[194] Fix | Delete

if arrs[fp].shape[0] == 0:

[195] Fix | Delete

arrs[fp] = read_chunk(rdrs[fp], sz)

[196] Fix | Delete

[197] Fix | Delete

def _plat_idx_to_val(idx, edge=0.5, FIO_IO_U_PLAT_BITS=6, FIO_IO_U_PLAT_VAL=64):

[198] Fix | Delete

""" Taken from fio's stat.c for calculating the latency value of a bin

[199] Fix | Delete

from that bin's index.

[200] Fix | Delete

[201] Fix | Delete

idx : the value of the index into the histogram bins

[202] Fix | Delete

edge : fractional value in the range [0,1]** indicating how far into

[203] Fix | Delete

the bin we wish to compute the latency value of.

[204] Fix | Delete

[205] Fix | Delete

** edge = 0.0 and 1.0 computes the lower and upper latency bounds

[206] Fix | Delete

respectively of the given bin index. """

[207] Fix | Delete

[208] Fix | Delete

# MSB <= (FIO_IO_U_PLAT_BITS-1), cannot be rounded off. Use

[209] Fix | Delete

# all bits of the sample as index

[210] Fix | Delete

if (idx < (FIO_IO_U_PLAT_VAL << 1)):

[211] Fix | Delete

return idx

[212] Fix | Delete

[213] Fix | Delete

# Find the group and compute the minimum value of that group

[214] Fix | Delete

error_bits = (idx >> FIO_IO_U_PLAT_BITS) - 1

[215] Fix | Delete

base = 1 << (error_bits + FIO_IO_U_PLAT_BITS)

[216] Fix | Delete

[217] Fix | Delete

# Find its bucket number of the group

[218] Fix | Delete

k = idx % FIO_IO_U_PLAT_VAL

[219] Fix | Delete

[220] Fix | Delete

# Return the mean (if edge=0.5) of the range of the bucket

[221] Fix | Delete

return base + ((k + edge) * (1 << error_bits))

[222] Fix | Delete

[223] Fix | Delete

def plat_idx_to_val_coarse(idx, coarseness, edge=0.5):

[224] Fix | Delete

""" Converts the given *coarse* index into a non-coarse index as used by fio

[225] Fix | Delete

in stat.h:plat_idx_to_val(), subsequently computing the appropriate

[226] Fix | Delete

latency value for that bin.

[227] Fix | Delete

"""

[228] Fix | Delete

[229] Fix | Delete

# Multiply the index by the power of 2 coarseness to get the bin

[230] Fix | Delete

# bin index with a max of 1536 bins (FIO_IO_U_PLAT_GROUP_NR = 24 in stat.h)

[231] Fix | Delete

stride = 1 << coarseness

[232] Fix | Delete

idx = idx * stride

[233] Fix | Delete

lower = _plat_idx_to_val(idx, edge=0.0)

[234] Fix | Delete

upper = _plat_idx_to_val(idx + stride, edge=1.0)

[235] Fix | Delete

return lower + (upper - lower) * edge

[236] Fix | Delete

[237] Fix | Delete

def print_all_stats(ctx, end, mn, ss_cnt, vs, ws, mx, dir=dir):

[238] Fix | Delete

ps = weighted_percentile(percs, vs, ws)

[239] Fix | Delete

[240] Fix | Delete

avg = weighted_average(vs, ws)

[241] Fix | Delete

values = [mn, avg] + list(ps) + [mx]

[242] Fix | Delete

if ctx.directions:

[243] Fix | Delete

row = [end, dir, ss_cnt]

[244] Fix | Delete

fmt = "%d, %s, %d, "

[245] Fix | Delete

else:

[246] Fix | Delete

row = [end, ss_cnt]

[247] Fix | Delete

fmt = "%d, %d, "

[248] Fix | Delete

row = row + [float(x) / ctx.divisor for x in values]

[249] Fix | Delete

if ctx.divisor > 1:

[250] Fix | Delete

fmt = fmt + fmt_float_list(ctx, len(percs)+3)

[251] Fix | Delete

else:

[252] Fix | Delete

# max and min are decimal values if no divisor

[253] Fix | Delete

fmt = fmt + "%d, " + fmt_float_list(ctx, len(percs)+1) + ", %d"

[254] Fix | Delete

[255] Fix | Delete

print (fmt % tuple(row))

[256] Fix | Delete

[257] Fix | Delete

def update_extreme(val, fncn, new_val):

[258] Fix | Delete

""" Calculate min / max in the presence of None values """

[259] Fix | Delete

if val is None: return new_val

[260] Fix | Delete

else: return fncn(val, new_val)

[261] Fix | Delete

[262] Fix | Delete

# See beginning of main() for how bin_vals are computed

[263] Fix | Delete

bin_vals = []

[264] Fix | Delete

lower_bin_vals = [] # lower edge of each bin

[265] Fix | Delete

upper_bin_vals = [] # upper edge of each bin

[266] Fix | Delete

[267] Fix | Delete

def process_interval(ctx, iHist, iEnd, dir):

[268] Fix | Delete

""" print estimated percentages for the given merged sample

[269] Fix | Delete

"""

[270] Fix | Delete

ss_cnt = 0 # number of samples affecting this interval

[271] Fix | Delete

mn_bin_val, mx_bin_val = None, None

[272] Fix | Delete

[273] Fix | Delete

# Update total number of samples affecting current interval histogram:

[274] Fix | Delete

ss_cnt += np.sum(iHist)

[275] Fix | Delete

[276] Fix | Delete

# Update min and max bin values

[277] Fix | Delete

idxs = np.nonzero(iHist != 0)[0]

[278] Fix | Delete

if idxs.size > 0:

[279] Fix | Delete

mn_bin_val = bin_vals[idxs[0]]

[280] Fix | Delete

mx_bin_val = bin_vals[idxs[-1]]

[281] Fix | Delete

[282] Fix | Delete

if ss_cnt > 0: print_all_stats(ctx, iEnd, mn_bin_val, ss_cnt, bin_vals, iHist, mx_bin_val, dir=dir)

[283] Fix | Delete

[284] Fix | Delete

[285] Fix | Delete

dir_map = ['r', 'w', 't'] # map of directional value in log to textual representation

[286] Fix | Delete

def process_weighted_interval(ctx, samples, iStart, iEnd, printdirs):

[287] Fix | Delete

""" Construct the weighted histogram for the given interval by scanning

[288] Fix | Delete

through all the histograms and figuring out which of their bins have

[289] Fix | Delete

samples with latencies which overlap with the given interval

[290] Fix | Delete

[iStart,iEnd].

[291] Fix | Delete

"""

[292] Fix | Delete

[293] Fix | Delete

times, files, dirs, sizes, hists = samples[:,0], samples[:,1], samples[:,2], samples[:,3], samples[:,4:]

[294] Fix | Delete

iHist={}; ss_cnt = {}; mn_bin_val={}; mx_bin_val={}

[295] Fix | Delete

for dir in printdirs:

[296] Fix | Delete

iHist[dir] = np.zeros(__HIST_COLUMNS, dtype=float)

[297] Fix | Delete

ss_cnt[dir] = 0 # number of samples affecting this interval

[298] Fix | Delete

mn_bin_val[dir] = None

[299] Fix | Delete

mx_bin_val[dir] = None

[300] Fix | Delete

[301] Fix | Delete

for end_time,file,dir,hist in zip(times,files,dirs,hists):

[302] Fix | Delete

[303] Fix | Delete

# Only look at bins of the current histogram sample which

[304] Fix | Delete

# started before the end of the current time interval [start,end]

[305] Fix | Delete

start_times = (end_time - 0.5 * ctx.interval) - bin_vals / ctx.time_divisor

[306] Fix | Delete

idx = np.where(start_times < iEnd)

[307] Fix | Delete

s_ts, l_bvs, u_bvs, hs = start_times[idx], lower_bin_vals[idx], upper_bin_vals[idx], hist[idx]

[308] Fix | Delete

[309] Fix | Delete

# Increment current interval histogram by weighted values of future histogram

[310] Fix | Delete

# total number of samples

[311] Fix | Delete

# and min and max values as necessary

[312] Fix | Delete

textdir = dir_map[dir]

[313] Fix | Delete

ws = hs * weights(s_ts, end_time, iStart, iEnd)

[314] Fix | Delete

mmidx = np.where(hs != 0)[0]

[315] Fix | Delete

if 'm' in printdirs:

[316] Fix | Delete

iHist['m'][idx] += ws

[317] Fix | Delete

ss_cnt['m'] += np.sum(hs)

[318] Fix | Delete

if mmidx.size > 0:

[319] Fix | Delete

mn_bin_val['m'] = update_extreme(mn_bin_val['m'], min, l_bvs[max(0, mmidx[0] - 1)])

[320] Fix | Delete

mx_bin_val['m'] = update_extreme(mx_bin_val['m'], max, u_bvs[min(len(hs) - 1, mmidx[-1] + 1)])

[321] Fix | Delete

if textdir in printdirs:

[322] Fix | Delete

iHist[textdir][idx] += ws

[323] Fix | Delete

ss_cnt[textdir] += np.sum(hs) # Update total number of samples affecting current interval histogram:

[324] Fix | Delete

if mmidx.size > 0:

[325] Fix | Delete

mn_bin_val[textdir] = update_extreme(mn_bin_val[textdir], min, l_bvs[max(0, mmidx[0] - 1)])

[326] Fix | Delete

mx_bin_val[textdir] = update_extreme(mx_bin_val[textdir], max, u_bvs[min(len(hs) - 1, mmidx[-1] + 1)])

[327] Fix | Delete

[328] Fix | Delete

for textdir in sorted(printdirs):

[329] Fix | Delete

if ss_cnt[textdir] > 0: print_all_stats(ctx, iEnd, mn_bin_val[textdir], ss_cnt[textdir], bin_vals, iHist[textdir], mx_bin_val[textdir], dir=textdir)

[330] Fix | Delete

[331] Fix | Delete

def guess_max_from_bins(ctx, hist_cols):

[332] Fix | Delete

""" Try to guess the GROUP_NR from given # of histogram

[333] Fix | Delete

columns seen in an input file """

[334] Fix | Delete

max_coarse = 8

[335] Fix | Delete

if ctx.group_nr < 19 or ctx.group_nr > 26:

[336] Fix | Delete

bins = [ctx.group_nr * (1 << 6)]

[337] Fix | Delete

else:

[338] Fix | Delete

bins = [1216,1280,1344,1408,1472,1536,1600,1664]

[339] Fix | Delete

coarses = range(max_coarse + 1)

[340] Fix | Delete

fncn = lambda z: list(map(lambda x: z/2**x if z % 2**x == 0 else -10, coarses))

[341] Fix | Delete

[342] Fix | Delete

arr = np.transpose(list(map(fncn, bins)))

[343] Fix | Delete

idx = np.where(arr == hist_cols)

[344] Fix | Delete

if len(idx[1]) == 0:

[345] Fix | Delete

table = repr(arr.astype(int)).replace('-10', 'N/A').replace('array',' ')

[346] Fix | Delete

errmsg = ("Unable to determine bin values from input clat_hist files. Namely \n"

[347] Fix | Delete

"the first line of file '%s' " % ctx.FILE[0] + "has %d \n" % (__TOTAL_COLUMNS,) +

[348] Fix | Delete

"columns of which we assume %d " % (hist_cols,) + "correspond to histogram bins. \n"

[349] Fix | Delete

"This number needs to be equal to one of the following numbers:\n\n"

[350] Fix | Delete

+ table + "\n\n"

[351] Fix | Delete

"Possible reasons and corresponding solutions:\n"

[352] Fix | Delete

" - Input file(s) does not contain histograms.\n"

[353] Fix | Delete

" - You recompiled fio with a different GROUP_NR. If so please specify this\n"

[354] Fix | Delete

" new GROUP_NR on the command line with --group_nr\n")

[355] Fix | Delete

if runascmd:

[356] Fix | Delete

err(errmsg)

[357] Fix | Delete

exit(1)

[358] Fix | Delete

else:

[359] Fix | Delete

raise RuntimeError(errmsg)

[360] Fix | Delete

[361] Fix | Delete

return bins[idx[1][0]]

[362] Fix | Delete

[363] Fix | Delete

def output_weighted_interval_data(ctx,printdirs):

[364] Fix | Delete

[365] Fix | Delete

fps = [open(f, 'r') for f in ctx.FILE]

[366] Fix | Delete

gen = histogram_generator(ctx, fps, ctx.buff_size)

[367] Fix | Delete

[368] Fix | Delete

print(', '.join(columns))

[369] Fix | Delete

[370] Fix | Delete

try:

[371] Fix | Delete

start, end = 0, ctx.interval

[372] Fix | Delete

arr = np.empty(shape=(0,__TOTAL_COLUMNS + 1),dtype=int)

[373] Fix | Delete

more_data = True

[374] Fix | Delete

while more_data or len(arr) > 0:

[375] Fix | Delete

[376] Fix | Delete

# Read up to ctx.max_latency (default 20 seconds) of data from end of current interval.

[377] Fix | Delete

while len(arr) == 0 or arr[-1][0] < ctx.max_latency * 1000 + end:

[378] Fix | Delete

try:

[379] Fix | Delete

new_arr = next(gen)

[380] Fix | Delete

except StopIteration:

[381] Fix | Delete

more_data = False

[382] Fix | Delete

break

[383] Fix | Delete

nashape = new_arr.reshape((1,__TOTAL_COLUMNS + 1))

[384] Fix | Delete

arr = np.append(arr, nashape, axis=0)

[385] Fix | Delete

#arr = arr.astype(int)

[386] Fix | Delete

[387] Fix | Delete

if arr.size > 0:

[388] Fix | Delete

# Jump immediately to the start of the input, rounding

[389] Fix | Delete

# down to the nearest multiple of the interval (useful when --log_unix_epoch

[390] Fix | Delete

# was used to create these histograms):

[391] Fix | Delete

if start == 0 and arr[0][0] - ctx.max_latency > end:

[392] Fix | Delete

start = arr[0][0] - ctx.max_latency

[393] Fix | Delete

start = start - (start % ctx.interval)

[394] Fix | Delete

end = start + ctx.interval

[395] Fix | Delete

[396] Fix | Delete

process_weighted_interval(ctx, arr, start, end, printdirs)

[397] Fix | Delete

[398] Fix | Delete

# Update arr to throw away samples we no longer need - samples which

[399] Fix | Delete

# end before the start of the next interval, i.e. the end of the

[400] Fix | Delete

# current interval:

[401] Fix | Delete

idx = np.where(arr[:,0] > end)

[402] Fix | Delete

arr = arr[idx]

[403] Fix | Delete

[404] Fix | Delete

start += ctx.interval

[405] Fix | Delete

end = start + ctx.interval

[406] Fix | Delete

finally:

[407] Fix | Delete

for fp in fps:

[408] Fix | Delete

fp.close()

[409] Fix | Delete

[410] Fix | Delete

def output_interval_data(ctx,directions):

[411] Fix | Delete

fps = [HistFileRdr(f) for f in ctx.FILE]

[412] Fix | Delete

[413] Fix | Delete

print(', '.join(columns))

[414] Fix | Delete

[415] Fix | Delete

start = 0

[416] Fix | Delete

end = ctx.interval

[417] Fix | Delete

while True:

[418] Fix | Delete

[419] Fix | Delete

more_data = False

[420] Fix | Delete

[421] Fix | Delete

# add bins from all files in target intervals

[422] Fix | Delete

arr = None

[423] Fix | Delete

numSamples = 0

[424] Fix | Delete

while True:

[425] Fix | Delete

foundSamples = False

[426] Fix | Delete

for fp in fps:

[427] Fix | Delete

ts = fp.curTS

[428] Fix | Delete

if ts and ts+10 < end: # shift sample time when very close to an end time

[429] Fix | Delete

curdirect = fp.curDir

[430] Fix | Delete

numSamples += 1

[431] Fix | Delete

foundSamples = True

[432] Fix | Delete

if arr is None:

[433] Fix | Delete

arr = {}

[434] Fix | Delete

for d in directions:

[435] Fix | Delete

arr[d] = np.zeros(shape=(__HIST_COLUMNS), dtype=int)

[436] Fix | Delete

if 'm' in arr:

[437] Fix | Delete

arr['m'] = np.add(arr['m'], fp.curBins)

[438] Fix | Delete

if 'r' in arr and curdirect == 0:

[439] Fix | Delete

arr['r'] = np.add(arr['r'], fp.curBins)

[440] Fix | Delete

if 'w' in arr and curdirect == 1:

[441] Fix | Delete

arr['w'] = np.add(arr['w'], fp.curBins)

[442] Fix | Delete

if 't' in arr and curdirect == 2:

[443] Fix | Delete

arr['t'] = np.add(arr['t'], fp.curBins)

[444] Fix | Delete

[445] Fix | Delete

more_data = True

[446] Fix | Delete

fp.nextData()

[447] Fix | Delete

elif ts:

[448] Fix | Delete

more_data = True

[449] Fix | Delete

[450] Fix | Delete

# reached end of all files

[451] Fix | Delete

# or gone through all files without finding sample in interval

[452] Fix | Delete

if not more_data or not foundSamples:

[453] Fix | Delete

break

[454] Fix | Delete

[455] Fix | Delete

if arr is not None:

[456] Fix | Delete

#print("{} size({}) samples({}) nonzero({}):".format(end, arr.size, numSamples, np.count_nonzero(arr)), str(arr), )

[457] Fix | Delete

for d in sorted(arr.keys()):

[458] Fix | Delete

aval = arr[d]

[459] Fix | Delete

process_interval(ctx, aval, end, d)

[460] Fix | Delete

[461] Fix | Delete

# reach end of all files

[462] Fix | Delete

if not more_data:

[463] Fix | Delete

break

[464] Fix | Delete

[465] Fix | Delete

start += ctx.interval

[466] Fix | Delete

end = start + ctx.interval

[467] Fix | Delete

[468] Fix | Delete

def main(ctx):

[469] Fix | Delete

[470] Fix | Delete

if ctx.job_file:

[471] Fix | Delete

try:

[472] Fix | Delete

from configparser import SafeConfigParser, NoOptionError

[473] Fix | Delete

except ImportError:

[474] Fix | Delete

from ConfigParser import SafeConfigParser, NoOptionError

[475] Fix | Delete

[476] Fix | Delete

cp = SafeConfigParser(allow_no_value=True)

[477] Fix | Delete

with open(ctx.job_file, 'r') as fp:

[478] Fix | Delete

cp.readfp(fp)

[479] Fix | Delete

[480] Fix | Delete

if ctx.interval is None:

[481] Fix | Delete

# Auto detect --interval value

[482] Fix | Delete

for s in cp.sections():

[483] Fix | Delete

try:

[484] Fix | Delete

hist_msec = cp.get(s, 'log_hist_msec')

[485] Fix | Delete

if hist_msec is not None:

[486] Fix | Delete

ctx.interval = int(hist_msec)

[487] Fix | Delete

except NoOptionError:

[488] Fix | Delete

pass

[489] Fix | Delete

[490] Fix | Delete

if not hasattr(ctx, 'percentiles'):

[491] Fix | Delete

ctx.percentiles = "90,95,99"

[492] Fix | Delete

[493] Fix | Delete

if ctx.directions:

[494] Fix | Delete

ctx.directions = ctx.directions.lower()

[495] Fix | Delete

[496] Fix | Delete

if ctx.interval is None:

[497] Fix | Delete

ctx.interval = 1000

[498] Fix | Delete

[499] Fix | Delete