1
/*
2
*---+----1----+----2----+----3----+----4----+----5----+----6----+----7----+----8;
3
DATA SET TITLE: ATMOSPHERIC CO2 CONC - MAUNA LOA OBSERVATORY, HAWAII,
1958-2001.
4
CONTRIBUTORS: C. D. KEELING, T. P. WHORF (AND THE CARBON DIOXIDE
RESEARCH
5
GROUP), SCRIPPS INSTITUTION OF
OCEANOGRAPHY, UNIVERSITY OF CALIFORNIA,
6
LA JOLLA, CALIFORNIA 92093-0444
7
SCOPE OF THE DATA: THE DATA FILE
CONTAINS MONTHLY AND ANNUAL ATMOSPHERIC
8
CO2
CONCENTRATIONS
DERIVED FROM THE SCRIPPS INSTITUTION OF
9
OCEANOGRAPHY'S (SIO's)
CONTINUOUS MONITORING PROGRAM AT MAUNA LOA
10
OBSERVATORY, HAWAII. THIS RECORD
CONSTITUTES THE LONGEST CONTINUOUS
11
RECORD OF ATMOSPHERIC CO2
CONCENTRATIONS AVAILABLE IN THE WORLD.
12
MONTHLY AND ANNUAL AVERAGE MOLE
FRACTIONS OF CO2 IN WATER-VAPOR-FREE AIR
13
ARE GIVEN FROM MARCH 1958 THROUGH
DECEMBER 2001, EXCEPT FOR A FEW INTERRUPTIONS.
14
DATA FORMAT: ALL CONC. ARE
EXPRESSED IN PARTS PER MILLION BY VOLUME (PPMV) IN
15
THE SIO X99 MOLE FRACTION
SCALE. MISSING VALUES ARE REPRESENTED BY
-99.99.
16
*---+----1----+----2----+----3----+----4----+----5----+----6----+----7----+----8;
17
*/
18
19
options nocenter nodate nonumber ls=80 ps=256;
20
data maunaloa; length month $ 9;
21
title1 'Trend analysis of carbon dioxide levels';
22
infile 'C:\Geaghan\EXST\EXST7015New\Fall2002\SAS\maunaloa.co2.txt'
firstobs=15 obs=58;
23
input @1 Year 4. @5 January 7.
@12 February 7. @19 March 7. @26 April 7. @33 May 7. @40
24
June 7. @47 July 7. @54 August 7. @61 September 7. @68
October 7. @75
24
November 7. @82
December
7. @89 Annual 7.;
25
time = year - 1957;
26
CO2Level = January; mo = 1; month = 'January';
output;
27
CO2Level = February; mo = 2; month = 'February'; output;
28
CO2Level = March; mo = 3; month =
'March'; output;
29
CO2Level = April; mo = 4; month =
'April'; output;
30
CO2Level = May; mo = 5; month
= 'May'; output;
31
CO2Level = June; mo = 6; month =
'June'; output;
32
CO2Level = July; mo =
7; month = 'July'; output;
33
CO2Level = August; mo = 8; month = 'August';
output;
34
CO2Level = September; mo = 9;
month = 'September'; output;
35
CO2Level = October; mo = 10;
month = 'October'; output;
36
CO2Level = November; mo = 11;
month = 'November'; output;
37
CO2Level = December; mo = 12;
month = 'December'; output;
38
drop January February March April May June July August September
39
October November December
Annual;
40
run;
NOTE: The
infile
'C:\Geaghan\EXST\EXST7015New\Fall2002\SAS\maunaloa.co2.txt' is:
File Name=C:\Geaghan\EXST\EXST7015New\Fall2002\SAS\maunaloa.co2.txt,
RECFM=V,LRECL=256
NOTE: 44
records were read from the infile
'C:\Geaghan\EXST\EXST7015New\Fall2002\SAS\maunaloa.co2.txt'.
The minimum record length was 102.
The maximum record length was 102.
NOTE: The data
set WORK.MAUNALOA has 528
observations and 5 variables.
NOTE: DATA
statement used:
real time
0.06 seconds
cpu
time
0.06 seconds
41
42
data maunaloa; set maunaloa;
43
if co2level lt 0 then co2level = .;
44
loglevel = log(co2level);
46
run;
48
*proc print noobs; run;
49
options ls=111 ps=56;
50
proc plot data=maunaloa; plot co2level*time; run;
51
options ls=80 ps=256;
NOTE: There
were 528 observations read from
the data set WORK.MAUNALOA.
NOTE: The
PROCEDURE PLOT printed page 1.
NOTE:
PROCEDURE PLOT used:
real time
0.05 seconds
cpu
time
0.03 seconds
Trend analysis
of carbon dioxide levels
Plot of
CO2Level*time. Legend: A = 1 obs, B = 2
obs, etc.
CO2Level |
|
380 +
|
|
|
|
C
|
B
C D
370
+
A C D C
|
C C C B
|
B
C B B
|
C D D B
|
C
C C A
|
C C C A
360
+
A B C B D C B
|
B
B B
D B
|
C B C C C
|
A C D C B B
|
B
E C B C B
|
C D B B B
350
+
C B C B
|
C
B E B
|
C C D B
|
C D D C
|
B
D D C B
|
B B B C B
340
+
B
C D D B
|
C C
D B B
|
C
B D C B
|
C B D A
|
B C C D C B
|
D C C C C
330
+
B C D D B
|
C C E D A B A
|
D C E C A B
|
B C B C B B
|
C D E D C B
| A C
B E D C B B
320 + B C D B B C C C B
| A C C C C D C C B
| B C D D C C B A
| C D A B A
| B B B
|
310 +
|
---+---------+---------+---------+---------+---------+---------+---------+---------+---------+
0
5
10
15
20
25
30
35
40 45
time
NOTE: 7 obs
had missing values.
53
proc mixed data=maunaloa; classes month;
54
title2 'Basic Analysis of Covariance using PROC MIXED';
55
model co2level = time month time*month / htype=1 3 DDFM=Satterthwaite;
57
run;
NOTE: 7
observations are not included
because of missing values.
NOTE: The
PROCEDURE MIXED printed page 2.
NOTE:
PROCEDURE MIXED used:
real time
0.07 seconds
cpu
time
0.07 seconds
Trend analysis
of carbon dioxide levels
Basic Analysis
of Covariance using PROC
MIXED
The Mixed
Procedure
Model Information
Data
Set
WORK.MAUNALOA
Dependent
Variable
CO2Level
Covariance
Structure
Diagonal
Estimation
Method
REML
Residual
Variance Method
Profile
Fixed Effects
SE Method
Model-Based
Degrees of
Freedom Method
Residual
Class Level Information
Class
Levels Values
month
12 April August December
February January July June March May November October September
Dimensions
Covariance
Parameters
1
Columns in
X
26
Columns in
Z
0
Subjects
1
Max Obs Per
Subject
528
Observations
Used
521
Observations
Not
Used
7
Total
Observations
528
Covariance
Parameter
Estimates
Cov
Parm
Estimate
Residual
3.5033
Fit Statistics
-2 Res Log
Likelihood 2184.8
AIC (smaller
is better) 2186.8
AICC (smaller
is better) 2186.8
BIC (smaller
is better) 2191.0
Type 1 Tests
of Fixed Effects
Num Den
Effect
DF DF F
Value
Pr > F
time
1 497
42276.8 <.0001
month
11 497
45.54 <.0001
time*month
11
497 0.26 0.9927
Type 3 Tests of Fixed Effects
Num Den
Effect
DF DF
F Value Pr > F
time
1 497
42195.7 <.0001
month
11 497
9.51 <.0001
time*month
11
497 0.26 0.9927
59
proc glm data=maunaloa; classes month;
60
title2 'Basic Analysis of Covariance using PROC GLM';
61
model co2level = time month time*month / solution;
62
run;
NOTE: The
PROCEDURE GLM printed pages 3-4.
NOTE:
PROCEDURE GLM used:
real time
0.08 seconds
cpu
time
0.08 seconds
Trend analysis
of carbon dioxide levels
Basic Analysis
of Covariance using PROC GLM
The GLM
Procedure
Class Level
Information
Class
Levels Values
month
12
April August December February January July June March May November
October September
Number of
observations 528
NOTE: Due to
missing values, only 521
observations can be used in this analysis.
Trend analysis
of carbon dioxide levels
Basic Analysis
of Covariance using PROC GLM
Dependent
Variable: CO2Level
Sum
of
Source
DF Squares
Mean Square F Value
Pr > F
Model
23 149874.8665
6516.2985 1860.02
<.0001
Error
497
1741.1612
3.5033
Corrected
Total
520
151616.0277
R-Square
Coeff Var Root MSE
CO2Level Mean
0.988516
0.550729
1.871722 339.8628
Source
DF Type I SS Mean
Square F Value
Pr > F
time
1 148110.2034
148110.2034 42276.8
<.0001
month
11
1754.7861
159.5260 45.54
<.0001
time*month
11
9.8771
0.8979 0.26
0.9927
Source
DF Type III SS Mean
Square F Value
Pr > F
time
1 147825.9593
147825.9593 42195.7
<.0001
month
11
366.6464
33.3315 9.51
<.0001
time*month
11
9.8771
0.8979 0.26
0.9927
Standard
Parameter
Estimate
Error t Value
Pr > |t|
Intercept
307.1697146 B 0.57410421
535.04
<.0001
time
1.3144369 B
0.02222108
59.15
<.0001
month
April
4.3696829 B
0.82363751
5.31
<.0001
month
August
1.5290698 B
0.81190596
1.88
0.0602
month
December 1.7211416
B
0.81190596
2.12
0.0345
month
February 1.9953236
B
0.84506816
2.36
0.0186
month
January 1.4453398
B
0.83122443
1.74
0.0827
month
July
3.3254757
B
0.81190596
4.10
<.0001
month
June
4.1589625 B
0.83122443
5.00
<.0001
month
March
3.1485337 B
0.82363751
3.82
0.0001
month
May
4.9943340 B
0.81190596
6.15
<.0001
month
November 0.7041332
B
0.81190596
0.87
0.3862
month
October -0.8184642
B
0.83122443
-0.98
0.3253
month
September 0.0000000
B
.
.
.
time*month
April
0.0302079 B
0.03170608
0.95
0.3412
time*month
August
0.0088393 B
0.03142535
0.28
0.7786
time*month
December 0.0344038
B
0.03142535
1.09
0.2741
time*month
February 0.0369158
B
0.03232065
1.14
0.2539
time*month
January 0.0290137
B
0.03198159
0.91
0.3647
time*month
July
0.0155849 B
0.03142535
0.50
0.6202
time*month
June
0.0365205 B
0.03198159
1.14
0.2540
time*month
March
0.0285085 B
0.03170608
0.90
0.3690
time*month
May
0.0280599 B
0.03142535
0.89
0.3723
time*month
November 0.0242607
B
0.03142535
0.77
0.4405
time*month
October 0.0289971
B
0.03198159
0.91
0.3650
time*month
September 0.0000000
B
.
. .
NOTE: The X'X
matrix has been found to be
singular, and a generalized inverse
was used to solve the normal equations.
Terms whose estimates are
followed by the letter 'B' are not uniquely estimable.
64
proc sort data=maunaloa; by mo; run;
NOTE: There
were 528 observations read from
the data set WORK.MAUNALOA.
NOTE: The data
set WORK.MAUNALOA has 528
observations and 6 variables.
NOTE:
PROCEDURE SORT used:
real time
0.04 seconds
cpu
time
0.04 seconds
65
proc means data=maunaloa noprint; by mo;
66
title2 'Calculate and plot means to examine pattern over a year';
67
var co2level; output out=next n=n mean=mean var=var;
68
run;
NOTE: There
were 528 observations read from
the data set WORK.MAUNALOA.
NOTE: The data
set WORK.NEXT has 12
observations and 6 variables.
NOTE:
PROCEDURE MEANS used:
real time
0.05 seconds
cpu
time
0.05 seconds
69
options ls=111 ps=56;
70
proc plot data=next; plot mean*mo; run;
71
options ls=80 ps=256;
NOTE: There
were 12 observations read from
the data set WORK.NEXT.
NOTE: The
PROCEDURE PLOT printed page 5.
NOTE:
PROCEDURE PLOT used:
real time
0.01 seconds
cpu
time
0.01 seconds
Trend analysis
of carbon dioxide levels
Calculate and
plot means to examine pattern
over a year
Plot of
mean*mo. Legend: A = 1 obs, B = 2 obs,
etc.
mean |
343 +
|
|
|
|
A
A A
|
342 +
|
|
|
|
|
341
+
A
| A
|
|
A
|
|
340 +
|
|
| A
|
|
A
339 +
|
|
|
A
|
|
338
+
A
|
|
|
|
A
|
337 +
|
|
A
|
|
|
336 +
|
---+--------+--------+--------+--------+--------+--------+--------+--------+--------+--------+--------+--
1
2
3
4
5
6
7
8
9
10
11 12
mo
73
proc mixed data=maunaloa; classes month;
74
title2 'Analysis of Covariance and Response Surface - testing';
75
model co2level = time time*time mo mo*mo mo*mo*mo mo*mo*mo*mo
76
time*mo time*mo*mo time*mo*mo*mo
time*mo*mo*mo*mo
77
time*time*mo time*time*mo*mo
time*time*mo*mo*mo time*time*mo*mo*mo*mo
78
month month*time / htype=1 3
DDFM=Satterthwaite;
79
run;
NOTE: 7
observations are not included
because of missing values.
NOTE: The
PROCEDURE MIXED printed page 6.
NOTE:
PROCEDURE MIXED used:
real time
0.07 seconds
cpu
time
0.07 seconds
Trend analysis
of carbon dioxide levels
Analysis of
Covariance and Response Surface
- testing
The Mixed
Procedure
Model Information
Data
Set
WORK.MAUNALOA
Dependent
Variable
CO2Level
Covariance
Structure
Diagonal
Estimation
Method
REML
Residual
Variance Method
Profile
Fixed Effects
SE Method
Model-Based
Degrees of
Freedom Method
Residual
Class Level Information
Class
Levels Values
month
12 April August December February January July June
March May November
October September
Dimensions
Covariance
Parameters
1
Columns in
X
39
Columns in
Z
0
Subjects
1
Max Obs Per
Subject
528
Observations
Used
521
Observations
Not
Used
7
Total
Observations
528
Covariance
Parameter Estimates
Cov
Parm
Estimate
Residual
0.5614
Fit Statistics
-2 Res Log
Likelihood 1415.2
AIC (smaller
is better) 1417.2
AICC (smaller
is better) 1417.3
BIC (smaller
is better) 1421.4
Type 1 Tests of Fixed Effects
Num Den
Effect
DF DF
F Value Pr > F
time
1 491
263837 <.0001
time*time
1 491
2618.04 <.0001
mo
1 491
820.70 <.0001
mo*mo
1
491 359.17 <.0001
mo*mo*mo
1 491
1435.04 <.0001
mo*mo*mo*mo
1 491
326.95 <.0001
time*mo
1 491
0.06 0.8069
time*mo*mo
1 491
1.27 0.2601
time*mo*mo*mo
1 491
8.25 0.0043
time*mo*mo*mo*mo
1
491 0.15 0.7009
time*time*mo
1 491
0.01 0.9111
time*time*mo*mo
1 491
0.80 0.3728
time*time*mo*mo*mo
1
491 0.14 0.7113
tim*time*mo*mo*mo*mo
1
491 0.00 0.9468
month
7 491
25.76 <.0001
time*month
7 491
0.31 0.9474
Type 3 Tests of Fixed Effects
Num Den
Effect
DF DF
F Value Pr > F
time
1 491
54.27 <.0001
time*time
1 491
36.19 <.0001
mo
0
.
. .
mo*mo
0
.
. .
mo*mo*mo
0
.
. .
mo*mo*mo*mo
0
.
. .
time*mo
0
.
. .
time*mo*mo
0
.
. .
time*mo*mo*mo
0
.
. .
time*mo*mo*mo*mo
0
.
. .
time*time*mo
1 491
0.09 0.7584
time*time*mo*mo
1
491 0.03 0.8697
time*time*mo*mo*mo
1
491 0.01 0.9357
tim*time*mo*mo*mo*mo
1
491 0.00 0.9698
month
5 491
4.95 0.0002
time*month
7 491
0.31 0.9474
81
proc mixed data=maunaloa; classes month;
82
title2 'Fit of a simplified Response Surface';
83
model co2level = time time*time mo mo*mo mo*mo*mo mo*mo*mo*mo
84
/ htype=1 3
DDFM=Satterthwaite outp=ResidDataP solution;
85
run;
NOTE: 7
observations are not included
because of missing values.
NOTE: The data
set WORK.RESIDDATAP has 528
observations and 13 variables.
NOTE: The
PROCEDURE MIXED printed page 7.
NOTE:
PROCEDURE MIXED used:
real time
0.16 seconds
cpu
time
0.16 seconds
86
quit;
Trend analysis
of carbon dioxide levels
Fit of a
simplified Response Surface
The Mixed
Procedure
Model Information
Data
Set
WORK.MAUNALOA
Dependent
Variable
CO2Level
Covariance
Structure
Diagonal
Estimation
Method
REML
Residual
Variance Method
Profile
Fixed Effects
SE Method
Model-Based
Degrees of
Freedom Method
Residual
Class Level Information
Class
Levels Values
month
12 April August December
February January July June March May November October September
Dimensions
Covariance
Parameters
1
Columns in
X
7
Columns in
Z
0
Subjects
1
Max Obs Per
Subject
528
Observations
Used
521
Observations
Not
Used
7
Total
Observations
528
Covariance
Parameter
Estimates
Cov
Parm
Estimate
Residual
0.7484
Fit Statistics
-2 Res Log
Likelihood 1391.5
AIC (smaller
is better) 1393.5
AICC (smaller
is better) 1393.5
BIC (smaller
is better) 1397.7
Solution for Fixed Effects
Standard
Effect
Estimate
Error DF
t Value Pr > |t|
Intercept
312.28 0.3637
514 858.72
<.0001
time
0.8051 0.01244
514 64.70
<.0001
time*time
0.01178 0.000266
514 44.25
<.0001
mo
-0.04612 0.3342
514 -0.14
0.8903
mo*mo
0.6626 0.09890
514
6.70 <.0001
mo*mo*mo
-0.1346 0.01121
514 -12.00
<.0001
mo*mo*mo*mo
0.006711
0.000429 514
15.66
<.0001
Type 1 Tests of Fixed Effects
Num Den
Effect
DF
DF
F Value Pr > F
time
1 514
197913 <.0001
time*time
1
514 1963.89 <.0001
mo
1 514
615.64 <.0001
mo*mo
1 514
269.43 <.0001
mo*mo*mo
1
514 1076.47 <.0001
mo*mo*mo*mo
1
514 245.26 <.0001
Type 3 Tests of Fixed Effects
Num Den
Effect
DF DF
F Value Pr > F
time
1 514
4186.59 <.0001
time*time
1
514 1958.27 <.0001
mo
1 514
0.02 0.8903
mo*mo
1 514
44.89 <.0001
mo*mo*mo
1
514 144.04 <.0001
mo*mo*mo*mo
1
514 245.26 <.0001
88
PROC UNIVARIATE DATA=ResidDataP PLOT NORMAL; VAR resid;
91
RUN;
NOTE: The
PROCEDURE UNIVARIATE printed pages
8-9.
NOTE:
PROCEDURE UNIVARIATE used:
real time
3.66 seconds
cpu
time
0.32 seconds
Trend analysis
of carbon dioxide levels
Fit of a
simplified Response Surface
The UNIVARIATE
Procedure
Variable:
Resid
Moments
N
521 Sum
Weights
521
Mean
0 Sum
Observations
0
Std
Deviation 0.86007223
Variance
0.73972425
Skewness
0.29861691
Kurtosis
-0.1936156
Uncorrected
SS 384.65661 Corrected
SS 384.65661
Coeff
Variation
. Std Error Mean
0.03768045
Basic Statistical Measures
Location
Variability
Mean
0.00000 Std
Deviation
0.86007
Median
-0.05525
Variance
0.73972
Mode
.
Range
5.03599
Interquartile
Range 1.22765
Tests for Location: Mu0=0
Test
-Statistic- -----p Value------
Student's
t t
0 Pr > |t| 1.0000
Sign
M -9.5
Pr >= |M| 0.4304
Signed
Rank S
-2031.5 Pr >= |S| 0.5551
Tests for Normality
Test
--Statistic--- -----p Value------
Shapiro-Wilk
W
0.992105 Pr < W
0.0073
Kolmogorov-Smirnov
D
0.041427 Pr > D
0.0284
Cramer-von
Mises W-Sq
0.175167 Pr > W-Sq 0.0113
Anderson-Darling
A-Sq
1.092857 Pr > A-Sq 0.0076
Quantiles
(Definition 5)
Quantile
Estimate
100%
Max 2.7313413
99%
2.0879960
95%
1.5156392
90%
1.1414107
75%
Q3 0.6015282
50%
Median
-0.0552539
25%
Q1
-0.6261222
10%
-1.0483464
5%
-1.2992655
1%
-1.6967417
0%
Min
-2.3046472
Extreme Observations
------Lowest-----
-----Highest-----
Value
Obs
Value Obs
-2.30465
392
2.17174 32
-1.99443
388
2.37034 210
-1.98929
103
2.37386 473
-1.84170
396
2.41438 472
-1.69762
371
2.73134 471
Missing Values
-----Percent Of-----
Missing
Missing
Value Count
All Obs Obs
.
7
1.33 100.00
Stem
Leaf
#
Boxplot
26
3
1 0
24
1
1 |
22
77
2 |
20 1397
4
|
18
013669
6 |
16
301478
6 |
14
014602278999
12 |
12
0027990144589
13 |
10
00112267891246667999
20 |
8
001111233557900223455567888899
30 |
6
0000111123456667990111111122333345568
37
+-----+
4
0000112333334445668999990000000122233889
40
| |
2
000012455556666777791122222346667789
36 | |
0
1111223455555566777770112222234556666788999
43
| + |
-0
8876665554433332222108877666544333222
37 *-----*
-2 98766665544332222211100998887555555444433211000
47
| |
-4
888887777644322221110009999888876655443111000
45
| |
-6
97776333222110009999876664433333222211000
41
+-----+
-8
997776666555531110887776666665322111100
39 |
-10
743211076665554432100
21 |
-12
42100008876544321000
20 |
-14
2009432100
10
|
-16
007200
6 |
-18
994
3 |
-20
|
-22
0
1
|
----+----+----+----+----+----+----+----+----+--
Multiply Stem.Leaf by 10**-1
Normal Probability Plot
2.7+
*
|
*
|
*
|
***+
|
**++
1.7+
**+
|
****
|
**+
|
***
|
****
0.7+
***
|
***
|
***
|
****
|
+**
-0.3+
****
|
***
|
****
|
****
| ***
-1.3+ *****
| ****+
| *** ++
|* +++
|++
-2.3+*
+----+----+----+----+----+----+----+----+----+----+
-2
-1
0
+1 +2
Modified: August 16, 2004
James P. Geaghan