line |
stmt |
bran |
cond |
sub |
pod |
time |
code |
1
|
|
|
|
|
|
|
#================---------=================================================# |
2
|
|
|
|
|
|
|
# Statistics::OLS -- Perform Ordinary Least Squares (with statistics) 2-D # |
3
|
|
|
|
|
|
|
# by Sanford Morton # |
4
|
|
|
|
|
|
|
#==========================================================================# |
5
|
|
|
|
|
|
|
|
6
|
|
|
|
|
|
|
# Revision history for Perl module Statistics::OLS. |
7
|
|
|
|
|
|
|
# |
8
|
|
|
|
|
|
|
# 0.01 - 22 March 1998 |
9
|
|
|
|
|
|
|
# - original version |
10
|
|
|
|
|
|
|
# |
11
|
|
|
|
|
|
|
# 0.02 - 29 March 1998 |
12
|
|
|
|
|
|
|
# - corrected array bounds check bug in setData |
13
|
|
|
|
|
|
|
# - included check for divide by zero in standard error of |
14
|
|
|
|
|
|
|
# coefficients and t-stats |
15
|
|
|
|
|
|
|
# |
16
|
|
|
|
|
|
|
# 0.03 - 31 May 1998 |
17
|
|
|
|
|
|
|
# - placed module into standard format using h2xs |
18
|
|
|
|
|
|
|
# |
19
|
|
|
|
|
|
|
# 0.04 - 13 July 1998 |
20
|
|
|
|
|
|
|
# - changed the name from Statistics::Ols to Statistics::OLS |
21
|
|
|
|
|
|
|
# |
22
|
|
|
|
|
|
|
# 0.05 - 15 Sep 1999 |
23
|
|
|
|
|
|
|
# - corrected error checking bug |
24
|
|
|
|
|
|
|
# - corrected pod documentation bug |
25
|
|
|
|
|
|
|
# |
26
|
|
|
|
|
|
|
# 0.06 - 4 July 2000 |
27
|
|
|
|
|
|
|
# - allowed data in scientific (exponential) notation |
28
|
|
|
|
|
|
|
# |
29
|
|
|
|
|
|
|
# 0.07 - 12 October 2000 |
30
|
|
|
|
|
|
|
# - _sse fix for potential precision problems |
31
|
|
|
|
|
|
|
|
32
|
|
|
|
|
|
|
package Statistics::OLS; |
33
|
|
|
|
|
|
|
|
34
|
|
|
|
|
|
|
$Statistics::OLS::VERSION = '0.07'; |
35
|
|
|
|
|
|
|
|
36
|
1
|
|
|
1
|
|
650
|
use strict; |
|
1
|
|
|
|
|
2
|
|
|
1
|
|
|
|
|
2061
|
|
37
|
|
|
|
|
|
|
|
38
|
|
|
|
|
|
|
#==================# |
39
|
|
|
|
|
|
|
# public methods # |
40
|
|
|
|
|
|
|
#==================# |
41
|
|
|
|
|
|
|
|
42
|
|
|
|
|
|
|
sub new { |
43
|
1
|
|
|
1
|
1
|
58
|
my $class = shift; |
44
|
1
|
|
|
|
|
12
|
my $self = {}; |
45
|
|
|
|
|
|
|
|
46
|
1
|
|
|
|
|
3
|
bless $self, $class; |
47
|
1
|
|
|
|
|
5
|
$self->_init (@_); |
48
|
|
|
|
|
|
|
|
49
|
1
|
|
|
|
|
2
|
return $self; |
50
|
|
|
|
|
|
|
} |
51
|
|
|
|
|
|
|
|
52
|
|
|
|
|
|
|
|
53
|
|
|
|
|
|
|
sub setData { |
54
|
|
|
|
|
|
|
# check for equal or non-numeric data |
55
|
|
|
|
|
|
|
# can receive data either as \@xdata, \@ydata or as @xydata. |
56
|
|
|
|
|
|
|
# set refs: either to $self->{'_xdata'} and $self->{'_ydata'} |
57
|
|
|
|
|
|
|
# or to $self->{'_xydata'} |
58
|
|
|
|
|
|
|
# then set $self->{'_flatDataArray'} |
59
|
1
|
|
|
1
|
1
|
6
|
my $self = shift; |
60
|
1
|
|
|
|
|
3
|
my ($arrayref1, $arrayref2) = @_; |
61
|
1
|
|
|
|
|
2
|
my ($arrayref, $i); |
62
|
|
|
|
|
|
|
|
63
|
1
|
50
|
|
|
|
4
|
if (ref $arrayref2) { # passing data as two data arrays (x0 ...) (y0 ...) |
64
|
|
|
|
|
|
|
|
65
|
0
|
0
|
|
|
|
0
|
unless ($#$arrayref1 == $#$arrayref2) { # error checking |
66
|
0
|
|
|
|
|
0
|
$self->{'_errorMessage'} = "The dataset does not contain an equal number of x and y values. "; |
67
|
0
|
|
|
|
|
0
|
return 0; |
68
|
|
|
|
|
|
|
} |
69
|
|
|
|
|
|
|
|
70
|
0
|
0
|
|
|
|
0
|
unless ($#$arrayref1 > 1) { # error checking |
71
|
0
|
|
|
|
|
0
|
$self->{'_errorMessage'} = "The data set must contain at least three points. "; |
72
|
0
|
|
|
|
|
0
|
return 0; |
73
|
|
|
|
|
|
|
} |
74
|
|
|
|
|
|
|
|
75
|
|
|
|
|
|
|
# check whether data are equal and numeric |
76
|
0
|
|
|
|
|
0
|
for ($i=0; $i<=$#$arrayref1; $i++) { |
77
|
|
|
|
|
|
|
|
78
|
0
|
0
|
|
|
|
0
|
unless ($$arrayref1[$i] =~ /^([+-]?)(?=\d|\.\d)\d*(\.\d*)?([Ee]([+-]?\d+))?$/) { |
79
|
0
|
|
|
|
|
0
|
$self->{'_errorMessage'} = "The data element $$arrayref1[$i] is non-numeric. "; |
80
|
0
|
|
|
|
|
0
|
return 0; |
81
|
|
|
|
|
|
|
} |
82
|
0
|
0
|
|
|
|
0
|
unless ($$arrayref2[$i] =~ /^([+-]?)(?=\d|\.\d)\d*(\.\d*)?([Ee]([+-]?\d+))?$/) { |
83
|
0
|
|
|
|
|
0
|
$self->{'_errorMessage'} = "The data element $$arrayref2[$i] is non-numeric. "; |
84
|
0
|
|
|
|
|
0
|
return 0; |
85
|
|
|
|
|
|
|
} |
86
|
|
|
|
|
|
|
} |
87
|
|
|
|
|
|
|
|
88
|
0
|
|
|
|
|
0
|
$self->{'_xdata'} = $arrayref1; |
89
|
0
|
|
|
|
|
0
|
$self->{'_ydata'} = $arrayref2; |
90
|
0
|
|
|
|
|
0
|
$self->{'_flatDataArray'} = 0; # passed as two data arrays |
91
|
|
|
|
|
|
|
|
92
|
|
|
|
|
|
|
} else { # passing data as a single flat data array (x0 y0 ...) |
93
|
|
|
|
|
|
|
|
94
|
|
|
|
|
|
|
# check whether array is unbalanced |
95
|
1
|
50
|
|
|
|
5
|
if ($#$arrayref1 % 2 == 0) { |
96
|
0
|
|
|
|
|
0
|
$self->{'_errorMessage'} = "The dataset does not contain an equal number of x and y values."; |
97
|
0
|
|
|
|
|
0
|
return 0; |
98
|
|
|
|
|
|
|
} |
99
|
|
|
|
|
|
|
|
100
|
1
|
50
|
|
|
|
4
|
unless ($#$arrayref1 > 4) { # error checking |
101
|
0
|
|
|
|
|
0
|
$self->{'_errorMessage'} = "The data set must contain at least three points. "; |
102
|
0
|
|
|
|
|
0
|
return 0; |
103
|
|
|
|
|
|
|
} |
104
|
|
|
|
|
|
|
|
105
|
|
|
|
|
|
|
# check whether data are numeric |
106
|
1
|
|
|
|
|
5
|
for ($i=0; $i<=$#$arrayref1; $i++) { |
107
|
22
|
50
|
|
|
|
100
|
unless ($$arrayref1[$i] =~ /^([+-]?)(?=\d|\.\d)\d*(\.\d*)?([Ee]([+-]?\d+))?$/) { |
108
|
0
|
|
|
|
|
0
|
$self->{'_errorMessage'} = "The data element $$arrayref1[$i] is non-numeric."; |
109
|
0
|
|
|
|
|
0
|
return 0; |
110
|
|
|
|
|
|
|
} |
111
|
|
|
|
|
|
|
} |
112
|
|
|
|
|
|
|
|
113
|
1
|
|
|
|
|
4
|
$self->{'_xydata'} = $arrayref1; |
114
|
1
|
|
|
|
|
3
|
$self->{'_flatDataArray'} = 1; # passed as one data array |
115
|
|
|
|
|
|
|
} |
116
|
|
|
|
|
|
|
|
117
|
1
|
|
|
|
|
2
|
$self->{'_dataIsSet'} = 1; |
118
|
1
|
|
|
|
|
2
|
$self->{'_gotMinMax'} = 0; # recalculate min-max if already calculated |
119
|
1
|
|
|
|
|
2
|
return 1; |
120
|
|
|
|
|
|
|
} |
121
|
|
|
|
|
|
|
|
122
|
|
|
|
|
|
|
|
123
|
|
|
|
|
|
|
|
124
|
|
|
|
|
|
|
sub error { |
125
|
|
|
|
|
|
|
# returns the last error message as a string |
126
|
0
|
|
|
0
|
0
|
0
|
my $self = shift; |
127
|
0
|
|
|
|
|
0
|
return $self->{'_errorMessage'}; |
128
|
|
|
|
|
|
|
} |
129
|
|
|
|
|
|
|
|
130
|
|
|
|
|
|
|
|
131
|
|
|
|
|
|
|
sub regress { |
132
|
1
|
|
|
1
|
1
|
6
|
my $self = shift; |
133
|
|
|
|
|
|
|
|
134
|
1
|
50
|
|
|
|
6
|
unless ($self->{'_dataIsSet'}) { |
135
|
0
|
|
|
|
|
0
|
$self->{'_errorMessage'} = "No datset has been registered. "; |
136
|
0
|
|
|
|
|
0
|
return 0; |
137
|
|
|
|
|
|
|
} |
138
|
|
|
|
|
|
|
|
139
|
1
|
|
|
|
|
3
|
my ($sumX, $sumY, $sumXX, $sumYY, $sumXY) = qw (0 0 0 0 0); |
140
|
1
|
|
|
|
|
2
|
my ($n, $i, $arrayref); |
141
|
|
|
|
|
|
|
|
142
|
1
|
50
|
|
|
|
4
|
if ($self->{'_flatDataArray'}) { |
143
|
1
|
|
|
|
|
2
|
$arrayref = $self->{'_xydata'}; |
144
|
1
|
|
|
|
|
2
|
$n = 1 + $#{ $arrayref }; |
|
1
|
|
|
|
|
2
|
|
145
|
1
|
|
|
|
|
4
|
for ($i=0; $i<$n; $i+=2) { |
146
|
11
|
|
|
|
|
20
|
$sumX += $self->{'_xydata'}[$i]; |
147
|
11
|
|
|
|
|
20
|
$sumY += $self->{'_xydata'}[$i+1]; |
148
|
11
|
|
|
|
|
24
|
$sumXX += $self->{'_xydata'}[$i]**2; |
149
|
11
|
|
|
|
|
15
|
$sumYY += $self->{'_xydata'}[$i+1]**2; |
150
|
11
|
|
|
|
|
30
|
$sumXY += $self->{'_xydata'}[$i] * $self->{'_xydata'}[$i+1]; |
151
|
|
|
|
|
|
|
} |
152
|
1
|
|
|
|
|
3
|
$n /= 2; # number of observations |
153
|
|
|
|
|
|
|
} else { |
154
|
0
|
|
|
|
|
0
|
$arrayref = $self->{'_xdata'}; |
155
|
0
|
|
|
|
|
0
|
$n = $#{ $arrayref }; |
|
0
|
|
|
|
|
0
|
|
156
|
0
|
|
|
|
|
0
|
$n++; # number of observations |
157
|
0
|
|
|
|
|
0
|
for ( $i=0; $i<$n; $i++ ) { |
158
|
0
|
|
|
|
|
0
|
$sumX += $self->{'_xdata'}[$i]; |
159
|
0
|
|
|
|
|
0
|
$sumY += $self->{'_ydata'}[$i]; |
160
|
0
|
|
|
|
|
0
|
$sumXX += $self->{'_xdata'}[$i]**2; |
161
|
0
|
|
|
|
|
0
|
$sumYY += $self->{'_ydata'}[$i]**2; |
162
|
0
|
|
|
|
|
0
|
$sumXY += $self->{'_xdata'}[$i] * $self->{'_ydata'}[$i]; |
163
|
|
|
|
|
|
|
} |
164
|
|
|
|
|
|
|
} |
165
|
|
|
|
|
|
|
|
166
|
|
|
|
|
|
|
# sum of squared deviations of X and Y |
167
|
1
|
|
|
|
|
4
|
$self->{'_ssdX'} = $sumXX - $sumX**2/$n; |
168
|
1
|
|
|
|
|
4
|
$self->{'_ssdY'} = $sumYY - $sumY**2/$n; |
169
|
1
|
|
|
|
|
2
|
$self->{'_ssdXY'} = $sumXY - $sumX*$sumY/$n; |
170
|
|
|
|
|
|
|
|
171
|
|
|
|
|
|
|
# num observations and sample averages |
172
|
1
|
|
|
|
|
2
|
$self->{'_n'} = $n; |
173
|
1
|
|
|
|
|
10
|
($self->{'_avX'}, $self->{'_avY'}) = ($sumX/$n, $sumY/$n); |
174
|
|
|
|
|
|
|
|
175
|
|
|
|
|
|
|
# sample var's and cov's (using n-1) |
176
|
1
|
|
|
|
|
4
|
$self->{'_varX'} = $self->{'_ssdX'} / ($n-1); |
177
|
1
|
|
|
|
|
3
|
$self->{'_varY'} = $self->{'_ssdY'} / ($n-1); |
178
|
1
|
|
|
|
|
8
|
$self->{'_covXY'} = $self->{'_ssdXY'} / ($n-1); |
179
|
|
|
|
|
|
|
|
180
|
|
|
|
|
|
|
# coefficient estimates |
181
|
1
|
50
|
|
|
|
5
|
$self->{'_b2'} = $self->{'_ssdX'} == 0 |
182
|
|
|
|
|
|
|
? undef |
183
|
|
|
|
|
|
|
: $self->{'_ssdXY'} / $self->{'_ssdX'}; # slope |
184
|
1
|
|
|
|
|
5
|
$self->{'_b1'} = ($sumY - $self->{'_b2'} * $sumX) / $n; # intercept |
185
|
|
|
|
|
|
|
|
186
|
|
|
|
|
|
|
# R-squared |
187
|
1
|
50
|
33
|
|
|
11
|
$self->{'_rsq'} = ($self->{'_ssdX'} == 0 or $self->{'_ssdY'} == 0) |
188
|
|
|
|
|
|
|
? 1.0 |
189
|
|
|
|
|
|
|
: ($self->{'_ssdXY'} / $self->{'_ssdX'}) |
190
|
|
|
|
|
|
|
* ($self->{'_ssdXY'} / $self->{'_ssdY'}) ; |
191
|
|
|
|
|
|
|
# $self->{'_rsq'} = $self->{'_b2'}**2 * $self->{'_ssdX'} / $self->{'_ssdY'}; |
192
|
|
|
|
|
|
|
|
193
|
|
|
|
|
|
|
# error (residual) sum of squares |
194
|
1
|
|
|
|
|
4
|
$self->{'_sse'} = $self->{'_ssdY'} - $self->{'_ssdX'} * $self->{'_b2'}**2; |
195
|
1
|
50
|
|
|
|
5
|
$self->{'_sse'} = 0 if $self->{'_sse'} < 0; # potential precision problems |
196
|
|
|
|
|
|
|
|
197
|
|
|
|
|
|
|
# homoscedastic standard deviation of error term |
198
|
1
|
|
|
|
|
7
|
$self->{'_sigma'} = sqrt ($self->{'_sse'}/($n-2)); |
199
|
|
|
|
|
|
|
|
200
|
|
|
|
|
|
|
# standard error of coefficients and t-stats |
201
|
1
|
|
|
|
|
4
|
$self->{'_seB1'} = $self->{'_seB2'} = undef; |
202
|
1
|
|
|
|
|
2
|
$self->{'_t1'} = $self->{'_t2'} = undef; |
203
|
|
|
|
|
|
|
|
204
|
1
|
50
|
|
|
|
4
|
unless ($self->{'_ssdX'} == 0) { |
205
|
1
|
|
|
|
|
3
|
$self->{'_seB1'} = $self->{'_sigma'} * sqrt ($sumXX / ($n*$self->{'_ssdX'})); |
206
|
1
|
|
|
|
|
3
|
$self->{'_seB2'} = $self->{'_sigma'} / sqrt $self->{'_ssdX'}; |
207
|
1
|
50
|
|
|
|
15
|
$self->{'_t2'} = $self->{'_b2'} / $self->{'_seB2'} unless $self->{'_seB2'} == 0; |
208
|
1
|
50
|
|
|
|
6
|
$self->{'_t1'} = $self->{'_b1'} / $self->{'_seB1'} unless $self->{'_seB1'} == 0; |
209
|
|
|
|
|
|
|
} |
210
|
|
|
|
|
|
|
|
211
|
|
|
|
|
|
|
# durbin-watson |
212
|
1
|
|
|
|
|
1
|
my $sum = 0; |
213
|
1
|
|
|
|
|
2
|
my ($prevErr, $currentErr); |
214
|
|
|
|
|
|
|
|
215
|
1
|
50
|
|
|
|
3
|
if ($self->{'_sse'} == 0) { |
216
|
0
|
|
|
|
|
0
|
$self->{'_dw'} = undef; |
217
|
|
|
|
|
|
|
} else { |
218
|
1
|
50
|
|
|
|
4
|
if ($self->{'_flatDataArray'}) { |
219
|
1
|
|
|
|
|
1
|
$arrayref = $self->{'_xydata'}; |
220
|
1
|
|
|
|
|
2
|
$n = 1+$#{ $arrayref }; |
|
1
|
|
|
|
|
16
|
|
221
|
1
|
|
|
|
|
5
|
$prevErr = $self->{'_xydata'}[1] |
222
|
|
|
|
|
|
|
- $self->{'_b1'} - $self->{'_b2'} * $self->{'_xydata'}[0]; |
223
|
1
|
|
|
|
|
4
|
for ($i=2; $i<$n; $i+=2) { |
224
|
10
|
|
|
|
|
22
|
$currentErr = $self->{'_xydata'}[$i+1] |
225
|
|
|
|
|
|
|
- $self->{'_b1'} - $self->{'_b2'} * $self->{'_xydata'}[$i]; |
226
|
10
|
|
|
|
|
12
|
$sum += ($currentErr - $prevErr)**2; |
227
|
10
|
|
|
|
|
18
|
$prevErr = $currentErr; |
228
|
|
|
|
|
|
|
} |
229
|
|
|
|
|
|
|
} else { |
230
|
0
|
|
|
|
|
0
|
$arrayref = $self->{'_xdata'}; |
231
|
0
|
|
|
|
|
0
|
$n = 1+$#{ $arrayref }; |
|
0
|
|
|
|
|
0
|
|
232
|
0
|
|
|
|
|
0
|
$prevErr = $self->{'_ydata'}[0] |
233
|
|
|
|
|
|
|
- $self->{'_b1'} - $self->{'_b2'} * $self->{'_xdata'}[0]; |
234
|
0
|
|
|
|
|
0
|
for ( $i=1; $i<$n; $i++ ) { |
235
|
0
|
|
|
|
|
0
|
$currentErr = $self->{'_ydata'}[$i] |
236
|
|
|
|
|
|
|
- $self->{'_b1'} - $self->{'_b2'} * $self->{'_xdata'}[$i]; |
237
|
0
|
|
|
|
|
0
|
$sum += ($currentErr - $prevErr)**2; |
238
|
0
|
|
|
|
|
0
|
$prevErr = $currentErr; |
239
|
|
|
|
|
|
|
} |
240
|
|
|
|
|
|
|
} |
241
|
1
|
|
|
|
|
3
|
$self->{'_dw'} = $sum / $self->{'_sse'}; |
242
|
|
|
|
|
|
|
} |
243
|
|
|
|
|
|
|
|
244
|
1
|
|
|
|
|
2
|
$self->{'_gotMinMax'} = 0; # should recalculate min-max's if already calculated |
245
|
1
|
|
|
|
|
3
|
return 1; |
246
|
|
|
|
|
|
|
} |
247
|
|
|
|
|
|
|
|
248
|
|
|
|
|
|
|
sub minMax { |
249
|
1
|
|
|
1
|
0
|
5
|
my $self = shift; |
250
|
1
|
50
|
|
|
|
6
|
$self->_getMinMax() unless $self->{'_gotMinMax'}; |
251
|
1
|
|
|
|
|
5
|
return ($self->{'_xmin'}, $self->{'_xmax'}, |
252
|
|
|
|
|
|
|
$self->{'_ymin'}, $self->{'_ymax'}); |
253
|
|
|
|
|
|
|
} |
254
|
|
|
|
|
|
|
|
255
|
1
|
|
|
1
|
1
|
7
|
sub coefficients { my $self = shift; return ($self->{'_b1'}, $self->{'_b2'}); } |
|
1
|
|
|
|
|
4
|
|
256
|
|
|
|
|
|
|
|
257
|
1
|
|
|
1
|
1
|
4
|
sub rsq { my $self = shift; return $self->{'_rsq'}; } |
|
1
|
|
|
|
|
4
|
|
258
|
|
|
|
|
|
|
|
259
|
1
|
|
|
1
|
1
|
4
|
sub tstats { my $self = shift; return ($self->{'_t1'}, $self->{'_t2'}); } |
|
1
|
|
|
|
|
4
|
|
260
|
|
|
|
|
|
|
|
261
|
1
|
|
|
1
|
0
|
6
|
sub av { my $self = shift; return ($self->{'_avX'}, $self->{'_avY'}); } |
|
1
|
|
|
|
|
4
|
|
262
|
|
|
|
|
|
|
|
263
|
1
|
|
|
1
|
0
|
4
|
sub var { my $self = shift; return ($self->{'_varX'}, $self->{'_varY'}, |
|
1
|
|
|
|
|
4
|
|
264
|
|
|
|
|
|
|
$self->{'_covXY'}); } |
265
|
|
|
|
|
|
|
|
266
|
1
|
|
|
1
|
0
|
4
|
sub sigma { my $self = shift; return $self->{'_sigma'}; } |
|
1
|
|
|
|
|
3
|
|
267
|
|
|
|
|
|
|
|
268
|
1
|
|
|
1
|
0
|
10
|
sub size { my $self = shift; return $self->{'_n'}; } |
|
1
|
|
|
|
|
3
|
|
269
|
|
|
|
|
|
|
|
270
|
0
|
|
|
0
|
0
|
0
|
sub dw { my $self = shift; return $self->{'_dw'}; } |
|
0
|
|
|
|
|
0
|
|
271
|
|
|
|
|
|
|
|
272
|
|
|
|
|
|
|
sub residuals { |
273
|
1
|
|
|
1
|
1
|
6
|
my $self = shift; |
274
|
1
|
|
|
|
|
1
|
my ($n, $i, $arrayref); |
275
|
1
|
|
|
|
|
2
|
my @result = (); |
276
|
|
|
|
|
|
|
|
277
|
1
|
50
|
|
|
|
3
|
if ($self->{'_flatDataArray'}) { # construct xy data array |
278
|
1
|
|
|
|
|
2
|
$arrayref = $self->{'_xydata'}; |
279
|
1
|
|
|
|
|
2
|
$n = 1+$#{ $arrayref }; |
|
1
|
|
|
|
|
1
|
|
280
|
1
|
|
|
|
|
4
|
for ($i=0; $i<$n; $i+=2) { |
281
|
11
|
|
|
|
|
20
|
$result[$i] = $self->{'_xydata'}[$i]; |
282
|
11
|
|
|
|
|
47
|
$result[$i+1] = $self->{'_xydata'}[$i+1] |
283
|
|
|
|
|
|
|
- $self->{'_b1'} - $self->{'_b2'} * $self->{'_xydata'}[$i]; |
284
|
|
|
|
|
|
|
} |
285
|
|
|
|
|
|
|
} else { # construct y data array |
286
|
0
|
|
|
|
|
0
|
$arrayref = $self->{'_xdata'}; |
287
|
0
|
|
|
|
|
0
|
$n = 1+$#{ $arrayref }; |
|
0
|
|
|
|
|
0
|
|
288
|
0
|
|
|
|
|
0
|
for ( $i=0; $i<$n; $i++ ) { |
289
|
0
|
|
|
|
|
0
|
$result[$i] = $self->{'_ydata'}[$i] |
290
|
|
|
|
|
|
|
- $self->{'_b1'} - $self->{'_b2'} * $self->{'_xdata'}[$i]; |
291
|
|
|
|
|
|
|
} |
292
|
|
|
|
|
|
|
} |
293
|
1
|
|
|
|
|
8
|
return @result; |
294
|
|
|
|
|
|
|
} |
295
|
|
|
|
|
|
|
|
296
|
|
|
|
|
|
|
sub predicted { |
297
|
1
|
|
|
1
|
1
|
38
|
my $self = shift; |
298
|
1
|
|
|
|
|
2
|
my ($n, $i, $arrayref); |
299
|
1
|
|
|
|
|
3
|
my @result = (); |
300
|
|
|
|
|
|
|
|
301
|
1
|
50
|
|
|
|
3
|
if ($self->{'_flatDataArray'}) { |
302
|
1
|
|
|
|
|
2
|
$arrayref = $self->{'_xydata'}; |
303
|
1
|
|
|
|
|
2
|
$n = 1+$#{ $arrayref }; |
|
1
|
|
|
|
|
2
|
|
304
|
1
|
|
|
|
|
4
|
for ($i=0; $i<$n; $i+=2) { |
305
|
11
|
|
|
|
|
45
|
$result[$i] = $self->{'_xydata'}[$i]; |
306
|
11
|
|
|
|
|
34
|
$result[$i+1] = $self->{'_b1'} + $self->{'_b2'} * $self->{'_xydata'}[$i]; |
307
|
|
|
|
|
|
|
} |
308
|
|
|
|
|
|
|
} else { |
309
|
0
|
|
|
|
|
0
|
$arrayref = $self->{'_xdata'}; |
310
|
0
|
|
|
|
|
0
|
$n = 1+$#{ $arrayref }; |
|
0
|
|
|
|
|
0
|
|
311
|
0
|
|
|
|
|
0
|
for ( $i=0; $i<$n; $i++ ) { |
312
|
0
|
|
|
|
|
0
|
$result[$i] = $self->{'_b1'} + $self->{'_b2'} * $self->{'_xdata'}[$i]; |
313
|
|
|
|
|
|
|
} |
314
|
|
|
|
|
|
|
} |
315
|
1
|
|
|
|
|
9
|
return @result; |
316
|
|
|
|
|
|
|
} |
317
|
|
|
|
|
|
|
|
318
|
|
|
|
|
|
|
|
319
|
|
|
|
|
|
|
#===================# |
320
|
|
|
|
|
|
|
# private methods # |
321
|
|
|
|
|
|
|
#===================# |
322
|
|
|
|
|
|
|
|
323
|
|
|
|
|
|
|
# initialization; |
324
|
|
|
|
|
|
|
# this contains a record of all private data |
325
|
|
|
|
|
|
|
# this is the place to start if you want to read the code. |
326
|
|
|
|
|
|
|
sub _init { |
327
|
1
|
|
|
1
|
|
1
|
my $self = shift; |
328
|
|
|
|
|
|
|
|
329
|
|
|
|
|
|
|
# $self->{'_flatDataArray'} = ''; # data passed as one flat or two data arrays? |
330
|
1
|
|
|
|
|
6
|
$self->{'_dataIsSet'} = 0; # return error if asking to regress |
331
|
1
|
|
|
|
|
2
|
$self->{'_errorMessage'} = ''; |
332
|
|
|
|
|
|
|
|
333
|
|
|
|
|
|
|
# will hold references to caller's data array(s) |
334
|
|
|
|
|
|
|
# $self->{'_xydata'} = $self->{'_xdata'} = $self->{'_ydata'} = ''; |
335
|
|
|
|
|
|
|
|
336
|
|
|
|
|
|
|
# $self->{'_ssdX'} = $self->{'_ssdY'} = $self->{'_ssdXY'} = ''; |
337
|
1
|
|
|
|
|
3
|
$self->{'_n'} = 0; # num observations |
338
|
|
|
|
|
|
|
# $self->{'_avX'} = $self->{'_avY'} = ''; |
339
|
|
|
|
|
|
|
# $self->{'_varX'} = $self->{'_vary'} = $self->{'_covXY'} = ''; |
340
|
|
|
|
|
|
|
|
341
|
1
|
|
|
|
|
3
|
$self->{'_gotMinMax'} = 0; # do not calculate again |
342
|
|
|
|
|
|
|
# $self->{'_xmin'} = $self->{'_xmax'} = 0; |
343
|
|
|
|
|
|
|
# $self->{'_ymin'} = $self->{'_ymax'} = 0; |
344
|
|
|
|
|
|
|
|
345
|
|
|
|
|
|
|
# $self->{'_b1'} = $self->{'_b2'} = ''; |
346
|
|
|
|
|
|
|
# $self->{'_rsq'} = $self->{'_sse'} = $self->{'_sigma'} = ''; |
347
|
|
|
|
|
|
|
|
348
|
|
|
|
|
|
|
# $self->{'_seB1'} = $self->{'_seB2'} = undef; |
349
|
|
|
|
|
|
|
# $self->{'_t1'} = $self->{'_t2'} = undef; |
350
|
|
|
|
|
|
|
# $self->{'_dw'} = undef; |
351
|
|
|
|
|
|
|
} |
352
|
|
|
|
|
|
|
|
353
|
|
|
|
|
|
|
|
354
|
|
|
|
|
|
|
# sets min and max values of all data (_xmin, _ymin, _xmax, _ymax); |
355
|
|
|
|
|
|
|
# also sets _xslope, _yslope, _ax and _ay used in _data2pxl; |
356
|
|
|
|
|
|
|
# usage: $self->_getMinMax |
357
|
|
|
|
|
|
|
sub _getMinMax { |
358
|
1
|
|
|
1
|
|
2
|
my $self = shift; |
359
|
1
|
|
|
|
|
7
|
my ($i, $n, $arrayref); |
360
|
|
|
|
|
|
|
|
361
|
1
|
50
|
|
|
|
4
|
if ($self->{'_flatDataArray'}) { |
362
|
1
|
|
|
|
|
4
|
$self->{'_xmin'} = $self->{'_xmax'} = $self->{'_xydata'}[0]; |
363
|
1
|
|
|
|
|
4
|
$self->{'_ymin'} = $self->{'_ymax'} = $self->{'_xydata'}[1]; |
364
|
1
|
|
|
|
|
1
|
$arrayref = $self->{'_xydata'}; |
365
|
1
|
|
|
|
|
2
|
$n = 1+$#{ $arrayref }; |
|
1
|
|
|
|
|
2
|
|
366
|
1
|
|
|
|
|
5
|
for ($i=2; $i<$n; $i+=2) { |
367
|
10
|
100
|
|
|
|
24
|
$self->{'_xmin'} = $self->{'_xydata'}[$i] |
368
|
|
|
|
|
|
|
if $self->{'_xydata'}[$i] < $self->{'_xmin'}; |
369
|
10
|
100
|
|
|
|
22
|
$self->{'_xmax'} = $self->{'_xydata'}[$i] |
370
|
|
|
|
|
|
|
if $self->{'_xydata'}[$i] > $self->{'_xmax'}; |
371
|
10
|
100
|
|
|
|
27
|
$self->{'_ymin'} = $self->{'_xydata'}[$i+1] |
372
|
|
|
|
|
|
|
if $self->{'_xydata'}[$i+1] < $self->{'_ymin'}; |
373
|
10
|
50
|
|
|
|
27
|
$self->{'_ymax'} = $self->{'_xydata'}[$i+1] |
374
|
|
|
|
|
|
|
if $self->{'_xydata'}[$i+1] > $self->{'_ymax'}; |
375
|
|
|
|
|
|
|
} |
376
|
1
|
|
|
|
|
3
|
$n /= 2; # number of observations |
377
|
|
|
|
|
|
|
} else { |
378
|
0
|
|
|
|
|
0
|
$self->{'_xmin'} = $self->{'_xmax'} = $self->{'_xdata'}[0]; |
379
|
0
|
|
|
|
|
0
|
$self->{'_ymin'} = $self->{'_ymax'} = $self->{'_ydata'}[0]; |
380
|
0
|
|
|
|
|
0
|
$arrayref = $self->{'_xdata'}; |
381
|
0
|
|
|
|
|
0
|
$n = 1+$#{ $arrayref }; |
|
0
|
|
|
|
|
0
|
|
382
|
0
|
|
|
|
|
0
|
for ( $i=1; $i<$n; $i++ ) { |
383
|
0
|
0
|
|
|
|
0
|
$self->{'_xmin'} = $self->{'_xdata'}[$i] |
384
|
|
|
|
|
|
|
if $self->{'_xdata'}[$i] < $self->{'_xmin'}; |
385
|
0
|
0
|
|
|
|
0
|
$self->{'_xmax'} = $self->{'_xdata'}[$i] |
386
|
|
|
|
|
|
|
if $self->{'_xdata'}[$i] > $self->{'_xmax'}; |
387
|
0
|
0
|
|
|
|
0
|
$self->{'_ymin'} = $self->{'_ydata'}[$i] |
388
|
|
|
|
|
|
|
if $self->{'_ydata'}[$i] < $self->{'_ymin'}; |
389
|
0
|
0
|
|
|
|
0
|
$self->{'_ymax'} = $self->{'_ydata'}[$i] |
390
|
|
|
|
|
|
|
if $self->{'_ydata'}[$i] > $self->{'_ymax'}; |
391
|
|
|
|
|
|
|
} |
392
|
|
|
|
|
|
|
} |
393
|
1
|
|
|
|
|
3
|
$self->{'_gotMinMax'} = 1; |
394
|
|
|
|
|
|
|
} |
395
|
|
|
|
|
|
|
|
396
|
|
|
|
|
|
|
1; |
397
|
|
|
|
|
|
|
|
398
|
|
|
|
|
|
|
__END__ |