From 0c1d68ee8cc2a631d6029285e771ebbfe119995d Mon Sep 17 00:00:00 2001
From: wukong
Date: Sat, 7 Dec 2019 15:02:59 -0800
Subject: code formatting changes to lin_reg scripts; added range to output of mean scripts;

---
 mean.awk | 17 +++++++++--------
 1 file changed, 9 insertions(+), 8 deletions(-)

(limited to 'mean.awk')

diff --git a/mean.awk b/mean.awk
index 754acfe..069db4c 100644
--- a/mean.awk
+++ b/mean.awk
@@ -5,20 +5,21 @@
 
 BEGIN {
     OFS = FS
-    sign = "[+-]?"
-    decimal = "[0-9]+[.]?[0-9]*"
-    fraction = "[.][0-9]+"
-    exponent = "([Ee]" sign "[0-9]+)?"
-    number = "^" sign "(" decimal "|" fraction ")" exponent "$"
+    #sign = "[+-]?"
+    #decimal = "[0-9]+[.]?[0-9]*"
+    #fraction = "[.][0-9]*"
+    #exponent = "([Ee]" "[+-]?" "[0-9]+)?"
+    number = "^[+-]?([0-9]+[.]?[0-9]*|[.][0-9]*)([Ee][+-]?[0-9]+)?$"
 }
 
 # Welford's 'online' algorithm for variance
-NF > 0 {
+NF {
     for (n=1; n<=NF; n++) {
         if ($n ~ number) {
             count += 1
             (count == 1 || $n < min) ? min = $n : min = min
             (count == 1 || $n > max) ? max = $n : max = max
+            range = max - min
             delta0 = $n - mean
             mean += delta0/count
             delta1 = $n - mean
@@ -29,7 +30,7 @@ NF > 0 {
 }
 
 END {
-    print "mean", "std_err", "std_dev", "min", "max", "total", "count"
-    print mean, sqrt(var/count), sqrt(var), min, max, (mean*count), count
+    print "mean", "std_err", "std_dev", "range", "min", "max", "total", "count"
+    print mean, sqrt(var/count), sqrt(var), range, min, max, (mean*count), count
 }
 
-- 
cgit v1.2.3