Anda di halaman 1dari 474

StatPac for Windows

User's Guide
By StatPac Inc.

StatPac for Windows software and manual
Copyright 1999-2013 y StatPac !nc"
#ll $ights $eser%ed"
!S&' 0-91()33-12-*
StatPac+ is a registered trademar, of StatPac !nc"
Administrative
StatPac !nc"
(-09 .yndale #%e" S" /209#
&loomington0 1innesota 22320
4el5 69227 (((-2933
8a95 69227 (((-2932
Technical Support
StatPac !nc"
1200 8irst Street
Pepin0 Wisconsin 23)29
4el5 6)127 332-22-1
8a95 6)127 332-22-2
ii StatPac For Windows User's Manual
Contents
Introduction 1
:%er%iew"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1
System $e;uirements and !nstallation""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""2
.ocal PC <ardware = Software $e;uirements""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""2
Ser%er <ardware = Software $e;uirements""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""2
:ther >seful Software""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""3
!nstallation on a .ocal PC"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""3
>nregistering = $emo%ing the Software from a PC""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""3
'etwor, :peration""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""3
>pdating to a 1ore $ecent ?ersion""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""2
&ac,ing->p a Study""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-
Processing 4ime"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")
Ser%er @emands and Security""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")
4echnical Support""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""(
'otice of .iaility"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""(
Paper = Pencil and C#4! Sur%ey Process""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""9
!nternet Sur%ey Process"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""9
&asic 8ile 4ypes""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""10
Codeoo,s 6"cod7""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""10
@ata 1anager 8orms 6"frm7""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""10
@ata 8iles 6"dat7""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""10
!nternet $esponse 8iles 6"asc or "t9t7""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""10
Amail #ddress .ists 6"lst or "t9t7"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""11
Amail .ogs 6"log7""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""11
$ich 4e9t 8iles 6"rtf7""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""11
<41. 8iles 6"htm7""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""11
Perl Script 6"pl7""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""11
Password 8iles 6"te9t7""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""12
A9ported @ata 8iles 6"t9t and "cs% and "md7"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""12
Amail &ody 8iles 6"t9t or "htm7"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""12
Sample 8ile 'aming Scheme for a Sur%ey"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""12
CustomiBing the Pac,age""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""13
Basic Research Concets 1!
Prolem $ecognition and @efinition""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""12
Creating the $esearch @esign"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1-
1ethods of $esearch"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1-
Sampling"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1-
@ata Collection"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1(
$eporting the $esults""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1(
?alidity""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1(
$eliaility""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""19
Systematic and $andom Arror""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""20
8ormulating <ypotheses from $esearch Cuestions""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""20
4ype ! and 4ype !! Arrors""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""21
4ypes of @ata""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""21
Significance"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""23
:ne-4ailed and 4wo-4ailed 4ests""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""23
Procedure for Significance 4esting"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""22
&onferroniDs 4heorem""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""2-
Central 4endency"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""2)
?ariaility""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""2)
Standard Arror of the 1ean"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""2(
!nferences with Small Sample SiBes"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""2(
@egrees of 8reedom""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""2(
Code"oo# $esi%n &'
Components of a Study @esign"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""29
Alements of a ?ariale""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""30
?ariale 8ormat""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""30
?ariale 'ame""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""31
?ariale .ael"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""32
?alue .aels""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""32
?alid Codes"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""33
S,ip Codes for &ranching"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""33
@ata Antry Control Parameters"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""32
1issing :E"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""32
#uto #d%ance"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""32
Caps :nly"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""32
Codeoo, 4ools"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""3-
4he Frid""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""3-
Codeoo, .iraries""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""3)
@uplicating ?ariales""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""3(
!nsert = @elete ?ariales""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""3(
1o%e ?ariales"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""3(
Starting Columns""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""3(
Print a Codeoo,""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""39
Spell Chec, a Codeoo,"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""39
?ariale @etail Window""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""30
Codeoo, Creation Process""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""31
1ethod 1 - Create a Codeoo, from Scratch"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""31
1ethod 2 G Create a Codeoo, from a Word-Processed @ocument""""""""""""""""""""""""""32
1ultiple $esponse ?ariales"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""32
1issing @ata"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""32
Changing !nformation in a Codeoo,"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""3-
$ata Mana%er For( )'
:%er%iew"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""39
@ata !nput 8ields"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""39
8orm 'aming Con%entions"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""39
8orm Creation Process""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""20
>sing the Codeoo, to Create a 8orm"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""20
>sing a Word-Processed @ocument to Create a 8orm"""""""""""""""""""""""""""""""""""""""""""""""21
?ariale 4e9t 8ormatting"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""22
8ield Placement""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""22
?alue .aels""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""23
?ariale Separation"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""23
?ariale .ael !ndent""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""23
ii StatPac For Windows User's Manual
?alue .aels !ndent""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""23
Space etween Columns"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""23
?alid Codes"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""22
S,ip Codes""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""22
?ariale 'umers"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""22
?ariale .ist and @etail Windows"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""22
@ata !nput Settings""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""2-
Select a Specific ?ariale""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""2)
8inding 4e9t in the 8orm"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""2(
$eplacing 4e9t in the 8orm"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""2(
Sa%ing the Codeoo, or Wor,space"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""29
$ata Mana%er *1
:%er%iew"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-1
Eeyoard and 1ouse 8unctions"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-2
Create a 'ew @ata 8ile"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-2
Adit or #dd 4o an A9isting @ata 8ile""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-2
Select a @ifferent @ata 8ile"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-2
Change 8ields""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-2
Change $ecords""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-3
Anter a 'ew @ata $ecord""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-3
?iew @ata for a Specified $ecord 'umer"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-3
8ind $ecords 4hat Contain Specified @ata"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-3
8ield 4o Search"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-2
Search 8or"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-2
Search @irection"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-2
Search 1ethod""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-2
@uplicate a 8ield from the Pre%ious $ecord"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-2
@elete a $ecord"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""--
@ata !nput Settings""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""--
Compact @ata 8ile""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-)
@oule Antry ?erification"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-(
Print a @ata $ecord"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-(
?ariale .ist = @etail Windows"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-(
@ata 8ile 8ormat"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""-(
+(ail Sur,eys -1
:%er%iew""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")1
<41. Amail Sur%eys""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")1
Plain 4e9t Amail Sur%eys"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")2
&rac,ets"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")3
!tem 'umering"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")3
Codeoo, @esign for a Plain 4e9t Amail Sur%ey""""""""""""""""""""""""""""""""""""""""""""""""""""""")3
Capturing a $espondentDs Amail #ddress""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")-
8iltering Amail to a 1ailo9""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")-
Feneral Considerations for Plain 4e9t Amail""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")-
Internet Sur,eys --
:%er%iew"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""))
!nternet Sur%ey Process"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""))
Ser%er Setup""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""))
Create the <41. Sur%ey Pages""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")(
>pload the 8iles to the We ser%er""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")(
4est the sur%ey"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")(
StatPac For Windows User's Manual iii
@ownload and import the test data""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")(
@elete the test data from the ser%er"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")(
Conduct the sur%ey""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")(
@ownload and import the data"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")(
@isplay a sur%ey closed message"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")9
Ser%er Setup"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""")9
84P .ogin !nformation"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""(0
Paths = 8older !nformation""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""(0
@esign Considerations for !nternet Sur%eys"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""(3
Special ?ariales for !nternet Sur%eys""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""(2
Script to Create the <41."""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""(-
Command Synta9 = <elp"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""((
Sa%ing and .oading Styles""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""(9
Sur%ey Feneration Procedure"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""(9
Script Aditor""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""90
!medded <41. 4ags""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""90
Primary Settings""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""91
<41. 'ame"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""91
&anner !mage""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""93
<eading"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""93
8inish 4e9t = 8inish >$.""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""93
Coo,ie"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""93
!P #ddress Control""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""93
#llow Cross Site #ccess"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""93
>$. to Sur%ey 8older"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""92
#d%anced Settings"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""9-
<eader = 8ooter"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""9-
8inish = Popups"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""99
Control""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""101
8onts = Colors""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""103
Passwords - Color = &anner !mage"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""110
Passwords - 4e9t = Control""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""111
Passwords - Single %s" 1ultiple""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""113
Passwords - 4echnical 'otes""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""112
Ser%er :%errides"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""11-
&ranching and Piping""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""11(
$andomiBation 6$otations7"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""119
Sur%ey Creation Script""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""120
:%er%iew"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""120
Specify 4e9t""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""121
Spacing and pagination"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""122
!mages and .in,s""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""123
<elp Windows""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""123
Popup Windows""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""12-
Sur%ey Creation - :Hects"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""12)
$adio &uttons for a Single ?ariale"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""12)
$adio &uttons for Frouped ?ariales 6matri9 style7""""""""""""""""""""""""""""""""""""""""""""""""129
@rop@own 1enu""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""132
4e9t&o9 for a Single ?ariale"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""133
#dding a 4e9t&o9 to a $adio &utton0 Chec,&o90 or $adio &utton 1atri9""""""""""""13-
4e9t&o9es for Frouped ?ariales"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""132
Slider for Single or 1ultiple ?ariales"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""133
Chec,&o9 for 1ultiple $esponse ?ariales"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""13)
Chec,o9 for Froups of 1ultiple $esponse ?ariales 6horiBontal matri97"""""""""""""13)
.ist&o9"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""120
>ploading and @ownloading 8iles from the Ser%er"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""120
i, StatPac For Windows User's Manual
#uto 4ransfer""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""120
84P"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""121
Summary of the 1ost Common Script Commands""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""122
+(ail .ist Mana%e(ent 1!*
:%er%iew"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""12-
8ormat of an Amail #ddress 8ile""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""12-
A9tract Amail #ddresses"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""12(
.ist Statistics"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""12(
Ioin 4wo or 1ore .ists"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""129
Split a .ist"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1-0
Clean0 Sort0 and Aliminate @uplicates""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1-2
#dd !@ 'umers to a .ist"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1-2
Create a .ist of 'onresponders"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1-3
Sutract :ne .ist 8rom #nother .ist""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1-3
1erge an Amail .ist into a StatPac @ata 8ile"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1-2
Send Amail !n%itations""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1-2
>sing an !@ 'umer to 4rac, $esponses"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1-2
Amail #ddress 8ile""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1--
&ody 4e9t 8ile""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1--
Sending Amail"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1-)
Procedure Files 1-1
:%er%iew"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1)1
1ouse and Eeyoard 8unctions"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1)2
@esigning #nalyses"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1)2
Continuation .ines""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1)2
Comment .ines"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1)2
? 'umers""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1)-
Eeywords""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1)-
#nalyses""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1)-
?ariale .ist""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1)-
?ariale @etail"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1))
8ind 4e9t"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1)(
$eplace 4e9t""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1)9
:ptions""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1)9
.oad0 Sa%e0 and 1erge Procedure 8iles""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1(3
Print a Procedure 8ile""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1(3
$un a Procedure 8ile"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1(3
$esults Aditor""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1(-
Fraphics""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1(-
4ale of Contents""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""1(9
#utomatically Fenerated 4opline Procedures"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""190
/eywords 1'1
Eeyword !nde9""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""191
Eeywords :%er%iew"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""191
Categories of Eeywords""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""192
Eeyword <elp"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""192
:rdering Eeywords"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""193
Floal and 4emporary Eeywords"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""193
Permanently Change a Codeoo, and @ata 8ile""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""193
&ac,up a Study"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""192
S4>@J Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""19-
StatPac For Windows User's Manual ,
@#4# Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""19)
S#?A Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""19)
W$!4A Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""19(
1A$FA Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""202
<A#@!'F Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""202
4!4.A Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""203
8::4':4A Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""203
.#&A.S Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""203
:P4!:'S Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""20-
SA.AC4 and $AIAC4 Commands"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""20(
'AW Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""213
.A4 Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""212
S4#CE Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""21-
$AC:@A Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""21(
C:1P>4A Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""220
#?A$#FA0 C:>'4 and S>1 Commands"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""223
!8-4<A' K A.SA Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""22-
S:$4 Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""232
WA!F<4 Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""233
':$1#.!LA Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""232
.#F Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""23-
@!88A$A'CA Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""23)
@>11J Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""239
$>' Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""231
$A1 Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""232
$eser%ed Words"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""233
$eser%ed Word $AC:$@"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""233
$eser%ed Word 4:4#.""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""232
$eser%ed Word 1A#'"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""232
$eser%ed Word 4!1A"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""232
Basic 0nalyses &)-
#nalyses !nde9""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""23)
#nalyses :%er%iew"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""23)
.!S4 Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""23(
8$AC>A'C!AS Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""222
C$:SS4#&S Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""2)3
&#''A$S Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""2(1
@ASC$!P4!?A Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""299
&$A#E@:W' Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""302
44AS4 Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""309
4-4est 8or 1atched Pairs""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""309
4-4est 8or !ndependent Froups""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""310
C:$$A.#4A Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""313
0d,anced 0nalyses 11-
#d%anced #nalyses !nde9"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""31)
$AF$ASS Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""31)
S4APW!SA Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""322
.:F!4 and P$:&!4 Commands""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""33-
PC# Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""332
8#C4:$ Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""339
C.>S4A$ Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""322
@!SC$!1!'#'4 Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""3-3
,i StatPac For Windows User's Manual
#':?# Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""3)3
C#':'!C#. Command""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""393
1#P Command"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""300
#d%anced #nalyses &iliography"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""30(
Utilities )11
>tility Programs""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""311
!mport and A9port"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""312
StatPac and Prior ?ersions of StatPac Fold""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""312
#ccess0 A9cel0 Parado90 d&ase0 and .otus"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""313
@!8 8iles"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""313
Comma @elimited and 4a @elimited 8iles"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""313
8iles Containing 1ultiple @ata $ecords per Case"""""""""""""""""""""""""""""""""""""""""""""""""""313
!nternet 8iles"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""312
Amail Sur%eys"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""312
1erging @ata 8iles""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""31-
Concatenate @ata 8iles"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""31)
1erge ?ariales and @ata"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""31(
#ggregate""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""320
Codeoo,""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""323
Cuic, Codeoo, Creation""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""323
Chec, Codeoo, and @ata"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""323
Sampling"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""322
$andom 'umer 4ale"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""322
$andom @igit @ialing 4ale"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""32-
Select $andom $ecords from @ata 8ile"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""32(
Create ?ariale for Weighting""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""329
Compare @ata 8iles"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""332
Con%ersions"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""332
@ate Con%ersions""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""333
Currency Con%ersion""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""333
@ichotomous 1ultiple $esponse Con%ersion""""""""""""""""""""""""""""""""""""""""""""""""""""""""""333
Statistics Calculator )1'
Statistics Calculator 1enu""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""339
@istriutions 1enu"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""330
'ormal distriution"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""330
4 distriution""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""331
8 distriution"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""333
Chi-s;uare distriution"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""333
Counts 1enu"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""333
Chi-s;uare test""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""333
8isherDs A9act 4est""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""332
&inomial 4est""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""33-
Poisson @istriution A%ents 4est""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""33-
Percents 1enu"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""33-
Choosing the Proper 4est""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""33-
:ne Sample t-4est etween Percents""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""33(
Confidence !nter%als around a Percent"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""320
1eans 1enu""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""321
1ean and Standard @e%iation of a Sample""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""321
1atched Pairs t-4est etween 1eans"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""322
!ndependent Froups t-4est etween 1eans""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""323
Confidence !nter%al around a 1ean"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""323
StatPac For Windows User's Manual ,ii
Compare a Sample 1ean to a Population 1ean""""""""""""""""""""""""""""""""""""""""""""""""""""""322
Compare 4wo Standard @e%iations""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""32-
Compare 4hree or more 1eans""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""32-
Correlation 1enu""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""32(
$egression"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""329
Sampling 1enu"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""3-1
Sample SiBe for Percents""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""3-1
Sample SiBe for 1eans"""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""""3-2
Inde2 )*!
,iii StatPac For Windows User's Manual
Introduction
3,er,iew
StatPac is a complete data manager and analysis pac,age" !t will handle all phases of
sur%ey design and analysis"
4he steps in running StatPac are the same as in all research5
1" @esign the study
2" Collect the data
3" $un the analyses
'umerous other tas,s may e performed0 such as managing e-mail lists and
manually enteringMediting data"
4he study design contains a description of the %ariales0 their laels0 and the data file
format" 4he study design is stored in a file called the codebook" #ll codeoo, file
names end with a "cod e9tension"
#nother part of the study design is called a form" 4he form is used for data entry and
editing" Jou do not need a form unless you will e doing manual data entry or
editing" #ll form names end with a "frm e9tension" When you are processing
;uestionnaires0 the form closely resemles the ;uestionnaire itself" StatPacNs data
manager uses the form to allow entry and editing of data"
#n essential element of StatPac is the aility to create and maintain a dataase of
information to e analyBed" 4his may e ;uestionnaire data0 test scores or any other
type of OrawO information" 4he information is stored in a data file on dis," #ll data
file names end with a "dat e9tension"
When performing a We sur%ey0 the responses will e stored on the ser%er in an
#SC!! te9t file using a "asc e9tension" 6'ote5 4he default e9tension for internet
response files may e changed y modifying the !nternetA9tension setting in the
StatPac"ini file"7 When youNre ready to perform analyses0 youNll download the
response file to your local computer and import it into a StatPac data file"
4he final step is to perform the analyses" StatPac is designed for either interacti%e or
atch processing" 4his means you can run a single analysis 6interacti%e7 or many
different analyses at one time 6atch7" 4o run an analysis you will type a set of
commands that say Ofirst do thisO0 One9t do thisO0 and so on" 4hese commands are
stored in a procedure file" Procedure file names end with a "pro e9tension"
Syste( Re4uire(ents and Installation
!nstalling StatPac on a hard dis, is %ery easy and will ta,e aout fi%e minutes"
!f you ha%e any prolems installing this product0 please do not hesitate to write0 call0
or e-mail"
StatPac !nc"
4echnical Support
1200 8irst Street
Pepin0 W! 23)29
6)127 332-22-1 69-2 Central 4ime7
6)127 332-22-2 68a97
supportPstatpac"com
Please note that StatPac can legally e installed on two computers pro%ided that there
will not e simultaneous use of oth installations" !t may e installed on a networ,
dri%e" <owe%er0 access to the software will e restricted to the wor,station used for
the installation" #ny other installations are a %iolation of copyright laws" !f you wish
to install StatPac on an additional computer0 please remo%e it from the current
computer efore installing it on the new computer0 or purchase a second copy at a
reduced cost"
When conducting we sur%eys0 the <41. files that StatPac creates may e installed
on any ser%er or ser%ers" 'o special license is re;uired to upload the <41. files to
multiple ser%ers" #dditionally0 the Perl scripts pro%ided with the software may e
installed on more than one ser%er" 'o special license is re;uired for multiple
installations of the Perl scripts"
.ocal PC 5ardware 6 Software Re4uire(ents
StatPac will wor, on a PC running Windows 920 Windows 9(0 Windows 20000 '40
*P0 ?ista0 Windows )0 or Windows (" !t re;uires aout 201 of dis, space and a
minimum of 22-1 $#1" StatPacDs performance is directly related to the CP> cloc,
speed 6faster is etter7 and the amount of $#1 6more is etter7" We suggest not
using StatPac on older PCs that ha%e a CP> cloc, speed slower than 3001<B"
Ser,er 5ardware 6 Software Re4uire(ents
!f you will e conducting We sur%eys0 youNll need access to a We ser%er to QhostR
your sur%eys" 4he ser%er may e >ni9M.ini9 or any %ersion of WindowsM!!S" !t must
support CF!" 4his means you will ha%e access to a cgi-in folder on your ser%er"
'early all hosting ser%ices support CF!0 so you may need to contact your !SP for
more information" StatPac has a Perl script that you will e installed in the cgi-in
folder on your ser%er" !f you do not currently ha%e your own We ser%er0 you may
use StatPacDs free ser%er" 4he domain for our hosting ser%er is ta,e-sur%ey"com"
& Introduction StatPac For Windows User's Manual
3ther Useful Software
#ll StatPac reports are created in rich te9t format" 4hese files can e %iewed0 printed0
and manipulated in StatPac0 or you can use any word processor to %iew the reports
6e"g" 1icrosoft Word7"
8or We sur%eys0 you may also wish to use a WJS!WJF <41. editor" StatPac will
create aesthetically pleasing and fully functional !nternet sur%eys0 ut you may want
to %isually enhance their appearance with additional graphics or other design
features" !n order to do that0 you must ha%e a What-You-See-Is-What-You-Get
<41. editor" 1icrosoft 8ront Page and @reamWea%er are e9amples of a
WJS!WJF <41. editor" #ny WJS!WJF <41. editor will wor," While we do
not recommend it0 you may also use recent %ersions 1icrosoft Word to edit your
<41. files"
Installation on a .ocal PC
1" Choose Run from the Start &ar"
2" >se the &rowse utton to na%igate to your C@ 6or the file you downloaded from
our We site7" Clic, on O!nstall StatPacO"
3" Clic, :E to install the pac,age" 4he default installation folder is C5SStatPac"
?ista0 Windows )0 and Windows ( users should not change the installation folder"
System administrators5 >sers must ha%e readMwrite access to the folder where the
software is installed" Since the ?ista0 Windows )0 and Windows ( operating systems
do not allow users write access to the Program 8iles folder0 it should not e installed
in the Programs 8iles folder on ?ista0 Windows )0 or Windows ( machines"
3" #fter the installation has completed0 the 1icrosoft <elp 8ile $eader must e
installed on ?ista0 Windows )0 and Windows ( machines" >se Windows A9plorer to
na%igate to the C5SStatPac folder" !nstall the appropriate 1icrosoft help file reader y
clic,ing on it" !f you do not ,now whether you ha%e a 32 it or -3 it machine0 try
first installing the -3 it %ersion" !t will tell you if it did not install correctly and then
you can install the 32 it %ersion" 4he <elp 8ile $eader files are named5
?ista-<elp-32"msu
?ista-<elp--3"msu
Windows)-<elp-32"msu
Windows)-<elp--3"msu
Windows(-<elp-32"msu
Windows(-<elp--3"msu
2" 4he StatPac installation will create an icon on your des,top"
@oule clic, on the icon to run StatPac
-" Select <elp0 Anter >nloc, Code
)" 4ype your >ser 'ame0 Serial 'umer and >'.:CE Code and clic, :E"
(" #nswer TJesN to connect to the StatPac ser%er" 4his will turn the demo into a full
%ersion" !f you do not ha%e an internet connection or if you are unale to connect to
the StatPac ser%er0 press UAscV instead of answering TJesN" 4hen call or email StatPac
!nc" for an authoriBation ,ey" Some firewalls loc, StatPacDs online registration" Jour
networ, super%isor can adHust your firewall to allow your PC to communicate with
our ser%er" 4he !P address of the StatPac registration ser%er is )3"220"220"20
StatPac For Windows User's Manual Introduction 1
'ote5 !f you plan to use our ser%er to host your online sur%eys0 then your networ,
super%isor should also unloc, !P address5 )3"220"201"1-1 which is the address for
our hosting ser%er ta,e-sur%ey"com" StatPac uses standard 84P protocol0 which
means that ports 200 210 and all ports ao%e 1023 must e unloc,ed for that !P
address"
4hat completes the installation on your local computer"
Unre%isterin% 6 Re(o,in% the Software fro( a PC
StatPac for Windows is copyrighted and should not e registered on more than one
computer at a time 6without a 'etwor, .icense #greement7 with the following single
e9ception" StatPac !nc" specifically grants you the right to install the software on one
additional computer0 pro%ided that oth computers will not run the software
simultaneously"
A9amples of typical installations would e5 17 one home and one office computer0 27
one office computer and a laptop computer0 37 one main computer and one ac,up
computer0 37 your computer and your technical support personNs computer" Jou are
specifically prohiited from installing two copies of the software where there will e
two simultaneous users of the software"
When you register the software0 it is con%erted from a demo %ersion to a full %ersion"
#fter registering StatPac0 you can unregister it from one machine and then register it
on another machine" When you unregister the software0 it is con%erted from a full
%ersion ac, to a demo"
>nregistering the software will enale you to install and register the pac,age on a
different computer" Select <elp0 Anter >'.:CE Code" 4ype UCtrl SV" # minus sign
will e added to the eginning of the serial numer" 4ype your >'.:CE code" Clic,
:E to unregister the software" 4he copy on that computer will e changed to a demo
%ersion and you will then e ale to register it on another computer" !t is not
necessary to actually remo%e the pac,age after unregistering it" Jou may ,eep the
demo %ersion on that computer so it will e easy to reregister it on that computer in
the future"
#fter unregistering the pac,age0 you may remo%e it from that computer y selecting
Control Panel0 #ddM$emo%e Programs0 and clic, on StatPac #ll the files from the
directory where you installed the software will e remo%ed" #ll files that you created
6codeoo,s0 data files0 etc"7 will not e deleted"
7etwor# 3eration
When you purchase a 'etwor, .icense #greement0 your serial numer and password
will automatically acti%ate the networ, option" 4he networ, option will not wor,
unless you ha%e a special serial numer and password"
4he software must e installed from each station that will ha%e access to the
networ," #t the first station0 install the software to a networ, dri%e" Suse;uent
installations at different stations should install to the same networ, dri%e and folder"
Some re;uired files will e written to the local computerDs WindowsSSystem folder"
>se your serial numer and >'.:CE code to acti%ate each station after you install
it"
#fter installing the software on all stations0 perform the following two steps to use
the networ,ing capailities of StatPac for Windows"
) Introduction StatPac For Windows User's Manual
1" Create or decide upon a folder where user profiles will e stored" 4he folder can
ha%e any name" #ll users must ha%e permission to write to this folder" # profile is the
same as the StatPac"ini file and contains all the default %alues for the software" Aach
user will ha%e their own profile 6their own default %alues7"
8or e9ample0 you might create a folder called5
C5S StatPacS>sers8older
2" Create an #SC!! te9t file 6using notepad or any word processor7 and sa%e it in the
StatPac programs folder using the name O>sers"iniO" 4he first line of the te9t is the
path to the folder where user profiles are stored" 4his may e the fully ;ualified
path0 or can e a path relati%e to the folder where StatPac was installed" Suse;uent
lines in the te9t file are user names and passwords separated y commas" @o not
include any spaces unless they are actually part of the password" >pper and lower
case characters are different"
8or e9ample0 three user names and passwords are specified in this O>sers"iniO file5
C5SStatPacS>sers8older
#dministrator0&oss
@a%id0programmer
<ilda0Pastor
StatPac networ,ing will now e enaled" >ser profiles will automatically e created
and stored in the user profile folder when the user first logs into StatPac" 4he login
screen will appear each time a user runs the pac,age"
!f you need to add a new user0 first temporarily rename the >sers"ini file to
something else" 4hen install the software from the new station and acti%ate it with
the serial numer and password" 8inally0 rename the file ac, to >sers"ini and edit
the file to include the new username and password"
Udatin% to a More Recent 8ersion
We fre;uently update the software with enhancements and ug fi9es" Please chec,
our we site to see if you ha%e the most recent update" >pdates are a%ailale to all
users who ha%e a current technical support agreement"
How to update your Statac!
StatPac For Windows User's Manual Introduction !
1" $un StatPac
2" Select <elp0 Software >pdates
3" Clic, the Chec, for >pdates utton
3" @ownload the updates
2" Close StatPac and restart it"
Bac#in%9U a Study
System crashes are not commonW howe%er0 when they do happen0 it can e
de%astating" 1a,ing ac,up copies of your study files is an important part of any
data analysis procedure" Fenerally0 you should ma,e a ac,up whene%er you feel
OitDs more than youDd care to loseO"
AT A "I#I"$"% A&WAYS 'A() $ A ST$*Y '+,-R+ '+GI##I#G A#Y
A#A&YS+S -, THAT ST$*Y.
4he analysis portion of StatPac is %ery powerful" ?ariales and data may e easily
changed" 8urthermore0 these changes can easily e made a permanent part of the
study" !f you should ma,e an error0 your study information and data will reflect this
error" 4he only way to undo an error 6i"e"0 to restore the codeoo, and data to its
former state7 is to use a ac, up" !8 J:> <#?A ':4 1#@A # &#CE>P0 !4 W!..
':4 &A P:SS!&.A 4: >'@: PA$1#'A'4 C<#'FAS J:> <#?A 1#@A
4: 4<A C:@A&::E :$ @#4#"
We strongly recommend that you ma,e fre;uent ac,up copies of all StatPac
codeoo, and data files"
4here are three ways to ac, up your wor,5
17 >se Windows A9plorer to copy the codeoo, 6"cod70 data entry form 6"frm70 data
file 6"dat7 and procedure file 6"pro7 to a different folder"
27 .oad the codeoo, for the study and then select @ata0 &ac,up" JouNll then e ale
to create a ac,up folder and all the files associated with the study will e copied to
the ac,up folder" 4he new ac,up folder will e created in the same folder as the
current codeoo,"
'ote5 !n most situations0 it is desirale 6ut not necessary7 to create a separate folder
for each study" Storing each study in its own folder will ma,e it easier to ac,up and
manage the files associated with each study"
* Introduction StatPac For Windows User's Manual
37 &egin each procedure file with a simple procedure that writes a duplicate
codeoo, and data file" 4hen perform suse;uent procedures on the duplicate files
rather than the originals" &y doing this0 youDll e lea%ing the original codeoo, and
data files intact" 'o matter what happens0 youDll always e ale to re%ert ac, to your
original files"
!n this e9ample0 the original codeoo, and data file are called 1#S4A$" 4he first
procedure 6first 2 lines7 writes a new codeoo, and data file called 4A1P" 4he
second procedure egins using the 4A1P codeoo, and data file0 and all suse;uent
procedures will use the 4A1P codeoo, and data file" !f you ma,e an erroneous
transformation to the data in a suse;uent procedure0 youDll e ale to re%ert ac, to
the original codeoo, and data file y re-running the first procedure"
S4>@J 1#S4A$
W$!4A 4A1P
""
S4>@J 4A1P
6all the rest of the procedures7
Processin% :i(e
4he e9ecution time for any analysis depends upon 6in the order of importance75
1" 4he cloc, speed of the CP> in your computer"
2" 4he numer of records in the data file"
3" 4he numer and type of transformations eing performed"
3" 4he amount of $#1 in the computer"
2" 4he type of analysis eing performed"
-" 4he options used on the analysis"
When you ha%e se%eral analyses to perform0 atch processing can sa%e time" 4he
ad%antage is that you can sumit many analyses at one time and they all get added to
the same document"
Ser,er $e(ands and Security
When conducting We sur%eys0 the demands on your ser%er will e minimal"
Fenerally0 the <41. files created will e small and load ;uic,ly into a rowser" 4he
ser%er is only called upon when a sur%ey page is eing loaded into the respondentNs
rowser and when they clic, the ne9t page or sumit utton" :nce a sur%ey page has
een loaded into the respondentNs rowser0 no demands are placed on the ser%er until
the respondent sumits that page"
4he response data is collected on the ser%er and usually stored in the cgi-in folder"
4his folder is protected from unauthoriBed users" 4hus0 the information you collect is
as secure as your cgi-in folder"
#dditionally0 you may add password protection to a sur%ey to only allow access to
people who ha%e the password"
StatPac For Windows User's Manual Introduction -
:echnical Suort
1ost of the features in StatPac ha%e een de%eloped as a result of user suggestions"
!f you would li,e to suggest a program enhancement0 please feel free to write us
aout it" #ll users of StatPac will enefit"
Technical support a/reement!
@emo users recei%e 30 days of free technical support"
Purchasers of the software recei%e 90 days of free technical support" #fter that0 you
can purchase a technical support agreement" 4o renew your technical support
agreement0 select <elp0 4echnical Support0 and clic, on the lin, to renew your
support agreement"
4he support agreement includes up to 90 minutes of support for a period of one year"
!t also includes updates for that year" 4he cost for updates and a support agreement
depends upon how long you ha%e gone without an agreement"
How to find the serial number of your packa/e!
Clic, <elp0 #out StatPac for Windows to see the serial numer of your software"
@emo %ersions do not ha%e a serial numer" 4hirty days of free support is pro%ided
to demo users"
Tech support by e0mail!
1" !nclude the serial numer of your pac,age"
2" !nclude your codeoo, 6"cod70 data file 6"dat7 and procedure file 6"pro7 as
attachments" 4his will enale us to reproduce the prolem" # Bipped file is preferred"
3" Amail to5 supportPstatpac"com
Tech support by telephone!
1" 4he serial numer of your pac,age" Clic, <elp0 #out StatPac for Windows to see
your serial numer" 6@emo %ersions do not ha%e a serial numer"7
2" #ll rele%ant printouts in front of you"
3" Please try to e at the computer and phone at the same time"
3" Call 6)127 332-22-1 etween 9500 #1 and 2500 P1 Central time"
7otice of .ia"ility
StatPac for Windows is distriuted on an O#S !SO asis without warranty"
StatPac !nc" has made e9tensi%e tests on StatPac for Windows and elie%es it to e
OugO free" <owe%er0 in any set of programs as comple9 as StatPac for Windows0
there is the possiility that the programs will malfunction with unusual or in%alid
data"
; Introduction StatPac For Windows User's Manual
StatPac !nc" shall ha%e no liaility or responsiility to customer or any other person
or entity with respect to any liaility0 loss or damage caused or alleged to e caused
directly or indirectly y StatPac for Windows" 4his includes0 ut is not limited to0
any interruption of ser%ice0 loss of data0 loss of usiness or anticipatory profits0 or
conse;uential damages from the use of StatPac for Windows"
!nformation in this document is suHect to change without notice and does not
represent a commitment on the part of StatPac !nc" 4he software descried in this
document is furnished under a license agreement" 4he software may e used or
copied only in accordance with the terms of the agreement"
Paer 6 Pencil and C0:I Sur,ey Process
Paper and pencil sur%eys and C#4! 6computer assisted telephone inter%iewing7
sur%eys follow the same process5
1" Create a codeoo, 6i"e"0 the study design7" 4he codeoo, contains the ;uestions
and response choices for all the items on the sur%ey" !t also contains %alidity
chec,ing information and ranching information that allows the sur%ey to s,ip to
other ;uestions depending on a respondentNs answer"
2" Create a data entryMediting form" 4he data entry form is a template that can e used
for entering and editing data" StatPac can automatically generate a nicely formatted
form" :nce created0 forms can e easily modified 6such as adding special
instructions to inter%iewers or data entry operators7"
3" Anter the raw data" 4he data manager is used to enter the respondentsN answers
into a dataase" !nternally0 StatPac stores the data in a fi9ed record-length se;uential
#SC!! file with a carriage return and line feed at the end of each data record"
3" Create a procedure file and run the reports" # procedure file is simply a set of
instructions that tells StatPac what ,ind of reports you want"
Internet Sur,ey Process
&uilding an !nternet sur%ey can e ro,en down into se%eral distinct steps" 4he asic
process for creating !nternet sur%eys with an e-mail in%itation and follow-up
reminder to non-respondents is as follows5
1" Create a codeoo," 4he codeoo, for !nternet sur%eys is nearly identical to the
codeoo, for paper and pencil sur%eys"
2" Create a default script y selecting @esign0 !nternet Sur%ey" 4he script controls
how the <41. sur%ey pages will e created"
3" 1odify the default script as necessary"
3" Fenerate and %iew the <41. files" $epeat steps 3 and 3 as necessary"
2" >pload the files to the We site and test the sur%ey online" 4his means that you
complete the sur%ey as if you were a respondent" 4hen download the captured data
and loo, at it to ma,e sure it is correct"
-" Create the email in%itation ody and a test email list containing your email" Send
the test email to the test list" When you recei%e the test email0 try the lin, and ma,e
sure it wor,s as e9pected"
)" Clean the real email list 6and add !@ numers to the list if you intend to trac, who
responded7" Send e-mail in%itations to participate in the sur%ey"
StatPac For Windows User's Manual Introduction '
(" @ownload the file containing %isitor responses and capture them into a data file"
9" Create an e-mail list of nonresponders" Send a reminder e-mail to the
nonresponders"
10" @ownload the file containing %isitor responses and capture them into a data file"
11" Create a procedure file and run the reports in StatPac or e9port the data to
#ccess0 or a ta or comma delimited file"
Basic File :yes
StatPac creates and uses se%eral types of files" 4he file e9tensions are controlled y
the software and usually may not e changed"
Code"oo#s <.cod=
4he sur%ey design is stored in a file called the codebook" Aach item on a sur%ey is a
%ariale" 4he sur%ey design contains a description of the %ariales0 their laels0 and
their formats" #dditional information0 such as s,ip patterns 6ranching7 and %alidity
chec,ing are also stored in the codeoo," #ll codeoo, file names end with a "cod
e9tension"
$ata Mana%er For(s <.fr(=
#nother part of the study design is called a form" 4he form is used as a screen
template for manually entering and editing" !t is not uncommon for a small numer
of respondents to want to complete a hardcopy of the sur%ey rather than the !nternet
%ersion" !n those situations0 you will ha%e to manually add their information to the
rest of the data" #ll forms end with a "frm e9tension"
$ata Files <.dat=
@ata files can e created with the data manager0 imported from a file created y
another program0 or captured from an e-mail or !nternet response file"
When conducting a we sur%ey0 respondentsN answers are stored in a response file on
your ser%er" 4hese response files must e downloaded and captured efore they can
e used or e9ported" When you capture a response file from the ser%er0 it is con%erted
to a fi9ed-format se;uential #SC!! file" $esponses from multiple page sur%eys are
comined into a single data record per respondent" @ata file names end with a "dat
e9tension"
Internet Resonse Files <.asc or .t2t=
When a respondent completes a sur%ey on your we site0 their answers are stored on
your ser%er in an #SC!! te9t file" 4his file is not directly useale y other softwareW it
must first e captured y StatPac and con%erted into a fi9ed-format #SC!! te9t file"
StatPac supports multiple page sur%eys y storing the responses to each page as it is
completed" !f a respondent aandons the sur%ey efore completing all pages0 you
will still ha%e captured the information from the pages that they finished" !nternet
response file names normally end with an "asc e9tension0 although you can
alternati%ely use a "t9t e9tension" 4he !nternetA9tension setting in the StatPac"ini
defaults file can e used to set the !nternet response file e9tension"
1> Introduction StatPac For Windows User's Manual
StatPac pro%ides two methods for uploading and downloading files from your ser%er
6Ser%er0 #uto 4ransfer and Ser%er0 84P7" !f you use your own 84P client to upload
and download files0 then you must tell your 84P program that files with a "asc
e9tension are to e treated as #SC!! 6not inary7 files" !f you are unale to ma,e that
setting in your 84P program0 then you should change StatPacNs default e9tension for
internet response files from "asc to "t9t" 4he !nternetA9tension setting in the
StatPac"ini file sets the e9tension"
+(ail 0ddress .ists <.lst or .t2t=
1any we sur%eys use e-mail in%itations to re;uest participation from respondents"
Amail addresses are stored in an #SC!! te9t file with one e-mail address per line" #ll
mailing list file names created y StatPac end with a "lst or "t9t e9tension" Jou can
specify which e9tension you want to use y changing the .istA9tension setting in the
StatPac"ini defaults file" When an email address file contains more than Hust the email
addresses 6e"g"0 !@ numers0 demographic information0 etc"70 fields can e separated
from each other y tas or commas"
+(ail .o%s <.lo%=
4he StatPac we sur%ey component has a ul, e-mailing program that lets you send
thousands of indi%idualiBed e-mail in%itations in one atch" Aach time you send to an
e-mail list0 a log is ,ept of the successful and unsuccessful e-mails" 4he log file will
ha%e the same file name as the e-mail list e9cept the e9tension is "log" Aach time you
send to a particular e-mail list0 the log for that list will e appended"
Rich :e2t Files <.rtf=
1any people initially de%elop their sur%eys using a word processor" When sa%ed in
rich te9t format0 these documents can e used to facilitate the design of a codeoo,"
Jou will e ale to copy and paste information from the rich te9t file to the
codeoo," @epending on the length of the sur%ey0 this may sa%e considerale typing"
$ich te9t files end with a "rtf e9tension"
5:M. Files <.ht(=
StatPac creates standard <41. pages for a we sur%ey" 1ultiple pages are created
for multiple page sur%eys" 4hese are initially created on your local computer" 4hey
are ordinary <41. pages and may e edited and enhanced with any <41. editor
6e"g"0 8ront Page7" #fter you are satisfied with the appearance of the sur%ey we
pages0 they are uploaded to your we site" 4he sur%ey pages end with a "htm
e9tension" Jou can also use your own editor to create <41. styliBed email
in%itations"
Perl Scrit <.l=
When a respondent completes a page of a we sur%ey0 their answers are stored in a
response file on your ser%er" Jou will ha%e one response file for each sur%ey you
host" 4he Perl script is a program installed on your ser%er that controls the storage of
the data" # Perl script is often called a CF! program" 4here are two Perl scripts
pro%ided with the software5 statpac11.pl and password.pl" When you create an
!nternet sur%ey0 statpac.pl will e renamed to yoursurveyname.pl so that respondents
see a meaningful >$. in their rowser address ar" 4he password.pl script is only
used if you create a sur%ey with password protection"
StatPac For Windows User's Manual Introduction 11
Password Files <.te2t=
When creating a We sur%ey where each respondent has their own password0 a ta
delimited te9t file of %alid passwords must e pro%ided" While your password file
can ha%e any e9tension0 StatPac will create a duplicate file with a "te9t e9tension"
4his file will e uploaded to the ser%er to pro%ide password access to the sur%ey"
+2orted $ata Files <.t2t and .cs, and .(d"=
#fter the data has een captured0 you may want to e9port it to another format so a
different program can use it" StatPac lets you e9port to ta delimited 6"t9t70 comma
delimited 6"cs%70 and #ccess data ases 6"md7" 4hese common formats can then e
imported into most other software"
+(ail Body Files <.t2t or .ht(=
When you send e-mail in%itations to potential respondents0 the ody of the email is
e9tracted from an #SC!! te9t file during the mailing" 4he ody of the e-mail can e
created using any te9t editor 6e"g"0 1icrosoft Word0 'otepad0 etc"7 and should e
sa%ed as a @:S te9t file" >sually0 the e9tension will e "t9t0 ut any e9tension is
acceptale" #lternati%ely0 the e-mail ody may e a <41. file with a "htm
e9tension"
Sa(le File 7a(in% Sche(e for a Sur,ey
!n most situations0 most of the files for a gi%en sur%ey will use the same file names
and only the e9tensions will e different" 4ry to use file names that con%ey meaning
to you" 8or e9ample0 if we wanted to call our sur%ey QopinionR0 we would ha%e files
called5
opinion"cod 6codeoo,7
opinion"frm 6form for manual data entryMediting7
opinion"asc 6#SC!! te9t file of responses to a We sur%ey7
opinion"dat 6data file7
opinion"pro 6procedure file for performing analyses7
opinion"htm 6loader page of We page7
opinionX1"htm 6first user %iewale page of a We sur%ey7
opinionX2"htm 6another page of a We sur%ey or than,-you page7
opinion"pl 6Perl script created y StatPac to control page sumissions7
We might also ha%e 6or create7 se%eral other files0 ut their file names do not ha%e to
e the same" A9amples might e5
something"rtf 6a 1S Word document used to facilitate the codeoo, design7
opinion-mail"lst 6an #SC!! te9t file of e-mail addresses for the first mailing7
opinion-mail-reminder"lst 6an #SC!! te9t file of e-mail addresses of nonresponders7
1& Introduction StatPac For Windows User's Manual
opinion-ody"t9t 6an #SC!! te9t of that contains the e-mail ody for the first
mailing7 or opinion-ody"htm if you were sending an <41. email instead of plain
te9t
opinion-ody-reminder"t9t 6an #SC!! te9t of that contains the e-mail ody for the
second mailing to the nonresponders7 or opinion-ody-reminder"htm if you were
sending an <41. emails instead of plain te9t
opinion"t9t 6an e9ported ta delimited file of the data7
opinion"te9t 6a password file created control We sur%ey access7
Custo(i?in% the Pac#a%e
StatPac stores all its default %alues in a file called StatPac"ini" 4o a large degree0
these settings control the operation of StatPac" 4his file can e found in the StatPac
programs folder0 which is usually C5SStatPac" <owe%er0 if you installed StatPac in a
different folder0 it will e there instead"
1ost of the settings in the StatPac"ini file are adHusted automatically when you run
the program" <owe%er0 there are some settings that you may wish to change
manually" 4hese are noted in this manual when applicale"
>se care when manually editing the StatPac"ini file" Some information 6e"g"0
passwords7 is encrypted in the file and will appear QfunnyR on the screen" @o not
change these" :ther settings may e crucial to the proper operation of the pac,age"
We suggest only changing the settings that are mentioned elsewhere in this manual"
4he StatPac"ini file may e edited y selecting 8ile0 :pen0 System @efaults 8ile"
4his will open the StatPac"ini file in the wor,space area" 1a,e the desired change6s7
and select 8ile0 Sa%e Wor,space0 and 8ile Close"
4he StatPac"ini file is an #SC!! te9t file0 so it may alternati%ely e edited with any
te9t editor 6'otepad0 WordPad0 1S Word0 etc"7" 4o ma,e a change in the StatPac"ini
file using your own editor5
17 Close the StatPac for Windows program"
27 .oad the StatPac"ini file using any te9t editor"
37 1a,e the change and sa%e the file"
1ost users will ne%er need to directly edit the StatPac"ini file ecause nearly all the
parameters can e changed within the program itself y setting analysis options or
changing %alues in %arious settings windows" ?arious references in this manual may
refer to other settings you might wish to alter"
StatPac For Windows User's Manual Introduction 11
Basic Research Concets
Pro"le( Reco%nition and $efinition
We understand the world y as,ing ;uestions and searching for answers" :ur
construction of reality depends on the nature of our in;uiry"
#ll research egins with a ;uestion" !ntellectual curiosity is often the foundation for
scholarly in;uiry" Some ;uestions are not testale" 4he classic philosophical
e9ample is to as,0 O<ow many angels can dance on the head of a pinYO While the
;uestion might elicit profound and thoughtful re%elations0 it clearly cannot e tested
with an empirical e9periment" Prior to @escartes0 this is precisely the ,ind of
;uestion that would engage the minds of learned men" 4heir answers came from
within" 4he scientific method precludes as,ing ;uestions that cannot e empirically
tested" !f the angels cannot e oser%ed or detected0 the ;uestion is considered
inappropriate for scholarly research"
@efining the goals and oHecti%es of a research proHect is one of the most important
steps in the research process" @o not underestimate the importance of this step"
Clearly stated goals ,eep a research proHect focused" 4he process of goal definition
usually egins y writing down the road and general goals of the study" #s the
process continues0 the goals ecome more clearly defined and the research issues are
narrowed"
A9ploratory research 6e"g"0 literature re%iews0 tal,ing to people0 and focus groups7
goes hand-in-hand with the goal clarification process" 4he literature re%iew is
especially important ecause it o%iates the need to rein%ent the wheel for e%ery new
research ;uestion" 1ore importantly0 it gi%es researchers the opportunity to uild on
each otherNs wor,"
4he research ;uestion itself can e stated as a hypothesis" # hypothesis is simply the
in%estigatorDs elief aout a prolem" 4ypically0 a researcher formulates an opinion
during the literature re%iew process" 4he process of re%iewing other scholarDs wor,
often clarifies the theoretical issues associated with the research ;uestion" !t also can
help to elucidate the significance of the issues to the research community"
4he hypothesis is con%erted into a null hypothesis in order to ma,e it testale
ecause the only way to test a hypothesis is to eliminate alternati%es of the
hypothesis" Statistical techni;ues will enale us to reHect or fail to reHect a null
hypothesis0 ut they do not pro%ide us with a way to accept a hypothesis" 4herefore0
all hypothesis testing is indirect"
Creatin% the Research $esi%n
@efining a research prolem pro%ides a format for further in%estigation" # well-
defined prolem points to a method of in%estigation" 4here is no one est method of
research for all situations" $ather0 there are a wide %ariety of techni;ues for the
researcher to choose from" :ften0 the selection of a techni;ue in%ol%es a series of
trade-offs" 8or e9ample0 there is often a trade-off etween cost and the ;uality of
information otained" 4ime constraints sometimes force a trade-off with the o%erall
research design" &udget and time constraints must always e considered as part of
the design process"
Methods of Research
4here are three asic methods of research5 17 sur%ey0 27 oser%ation0 and 37
e9periment" Aach method has its ad%antages and disad%antages"
4he survey is the most common method of gathering information in the social
sciences" !t can e a face-to-face inter%iew0 telephone0 mail0 e-mail0 or we sur%ey"
# personal inter%iew is one of the est methods otaining personal0 detailed0 or in-
depth information" !t usually in%ol%es a lengthy ;uestionnaire that the inter%iewer
fills out while as,ing ;uestions" !t allows for e9tensi%e proing y the inter%iewer
and gi%es respondents the aility to elaorate their answers" 4elephone inter%iews
are similar to face-to-face inter%iews" 4hey are more efficient in terms of time and
cost0 howe%er0 they are limited in the amount of in-depth proing that can e
accomplished0 and the amount of time that can e allocated to the inter%iew" # mail
sur%ey is more cost effecti%e than inter%iew methods" 4he researcher can otain
opinions0 ut trying to meaningfully proe opinions is %ery difficult" Amail and we
sur%eys are the most cost effecti%e and fastest methods"
Observation research monitors respondentsD actions without directly interacting with
them" !t has een used for many years y #"C" 'ielsen to monitor tele%ision %iewing
haits" Psychologists often use one-way mirrors to study eha%ior" #nthropologists
and social scientists often study societal and group eha%iors y simply oser%ing
them" 4he fastest growing form of oser%ation research has een made possile y
the ar code scanners at cash registers0 where purchasing haits of consumers can
now e automatically monitored and summariBed"
!n an experiment0 the in%estigator changes one or more %ariales o%er the course of
the research" When all other %ariales are held constant 6e9cept the one eing
manipulated70 changes in the dependent %ariale can e e9plained y the change in
the independent %ariale" !t is usually %ery difficult to control all the %ariales in the
en%ironment" 4herefore0 e9periments are generally restricted to laoratory models
where the in%estigator has more control o%er all the %ariales"
Sa(lin%
!t is incument on the researcher to clearly define the target population" 4here are no
strict rules to follow0 and the researcher must rely on logic and Hudgment" 4he
population is defined in ,eeping with the oHecti%es of the study"
Sometimes0 the entire population will e sufficiently small0 and the researcher can
include the entire population in the study" 4his type of research is called a census
study ecause data is gathered on e%ery memer of the population"
1* Basic Research Concets StatPac For Windows User's Manual
>sually0 the population is too large for the researcher to attempt to sur%ey all of its
memers" # small0 ut carefully chosen sample can e used to represent the
population" 4he sample reflects the characteristics of the population from which it is
drawn"
Sampling methods are classified as either probability or nonprobability" !n
proaility samples0 each memer of the population has a known non-zero
proaility of eing selected" Proaility methods include random sampling0
systematic sampling0 and stratified sampling" !n nonproaility sampling0 memers
are selected from the population in some nonrandom manner" 4hese include
con%enience sampling0 Hudgment sampling0 ;uota sampling0 and snowall sampling"
4he ad%antage of proaility sampling is that sampling error can e calculated"
Sampling error is the degree to which a sample might differ from the population"
When inferring to the population0 results are reported plus or minus the sampling
error" !n nonproaility sampling0 the degree to which the sample differs from the
population remains un,nown"
Random sampling is the purest form of proaility sampling" Aach memer of the
population has an e;ual and ,nown chance of eing selected" When there are %ery
large populations0 it is often difficult or impossile to identify e%ery memer of the
population0 so the pool of a%ailale suHects ecomes iased"
Systematic sampling is often used instead of random sampling" !t is also called an
Nt name selection techni;ue" #fter the re;uired sample siBe has een calculated0
e%ery 'th record is selected from a list of population memers" #s long as the list
does not contain any hidden order0 this sampling method is as good as the random
sampling method" !ts only ad%antage o%er the random sampling techni;ue is
simplicity" Systematic sampling is fre;uently used to select a specified numer of
records from a computer file"
Strati!ied sampling is commonly used proaility method that is superior to random
sampling ecause it reduces sampling error" # stratum is a suset of the population
that shares at least one common characteristic" 4he researcher first identifies the
rele%ant stratums and their actual representation in the population" $andom
sampling is then used to select suHects from each stratum until the numer of
suHects in that stratum is proportional to its fre;uency in the population" Stratified
sampling is often used when one or more of the stratums in the population ha%e a
low incidence relati%e to the other stratums"
Convenience sampling is used in e9ploratory research where the researcher is
interested in getting an ine9pensi%e appro9imation of the truth" #s the name implies0
the sample is selected ecause they are con%enient" 4his nonproaility method is
often used during preliminary research efforts to get a gross estimate of the results0
without incurring the cost or time re;uired to select a random sample"
"udgment sampling is a common nonproaility method" 4he researcher selects the
sample ased on Hudgment" 4his is usually and e9tension of con%enience sampling"
8or e9ample0 a researcher may decide to draw the entire sample from one
Orepresentati%eO city0 e%en though the population includes all cities" When using this
method0 the researcher must e confident that the chosen sample is truly
representati%e of the entire population"
#uota sampling is the nonproaility e;ui%alent of stratified sampling" .i,e
stratified sampling0 the researcher first identifies the stratums and their proportions
as they are represented in the population" 4hen con%enience or Hudgment sampling is
used to select the re;uired numer of suHects from each stratum" 4his differs from
stratified sampling0 where the stratums are filled y random sampling"
Snowball sampling is a special nonproaility method used when the desired sample
characteristic is rare" !t may e e9tremely difficult or cost prohiiti%e to locate
StatPac For Windows User's Manual Basic Research Concets 1-
respondents in these situations" Snowall sampling relies on referrals from initial
suHects to generate additional suHects" While this techni;ue can dramatically lower
search costs0 it comes at the e9pense of introducing ias ecause the techni;ue itself
reduces the li,elihood that the sample will represent a good cross section from the
population"
$ata Collection
4here are %ery few hard and fast rules to define the tas, of data collection" Aach
research proHect uses a data collection techni;ue appropriate to the particular
research methodology" 4he two primary goals for oth ;uantitati%e and ;ualitati%e
studies are to ma9imiBe response and ma9imiBe accuracy"
When using an outside data collection ser%ice0 researchers often validate the data
collection process y contacting a percentage of the respondents to %erify that they
were actually inter%iewed" @ata editing and cleaning in%ol%es the process of
chec,ing for inad%ertent errors in the data" 4his usually entails using a computer to
chec, for out-of-ounds data"
#uantitative studies employ deducti%e logic0 where the researcher starts with a
hypothesis0 and then collects data to confirm or refute the hypothesis" #ualitative
studies use inducti%e logic0 where the researcher first designs a study and then
de%elops a hypothesis or theory to e9plain the results of the analysis"
Cuantitati%e analysis is generally fast and ine9pensi%e" # wide assortment of
statistical techni;ues is a%ailale to the researcher" Computer software is readily
a%ailale to pro%ide oth asic and ad%anced multi%ariate analysis" 4he researcher
simply follows the preplanned analysis process0 without ma,ing suHecti%e decisions
aout the data" 8or this reason0 ;uantitati%e studies are usually easier to e9ecute than
;ualitati%e studies"
Cualitati%e studies nearly always in%ol%e in-person inter%iews0 and are therefore
%ery laor intensi%e and costly" 4hey rely hea%ily on a researcherDs aility to e9clude
personal iases" 4he interpretation of ;ualitati%e data is often highly suHecti%e0 and
different researchers can reach different conclusions from the same data" <owe%er0
the goal of ;ualitati%e research is to de%elop a hypothesis--not to test one"
Cualitati%e studies ha%e merit in that they pro%ide road0 general theories that can e
e9amined in future research"
Reortin% the Results
4he most important consideration in preparing any research report is the nature of
the audience" 4he purpose is to communicate information0 and therefore0 the report
should e prepared specifically for the readers of the report" Sometimes the format
for the report will e defined for the researcher 6e"g"0 a thesis or dissertation70 while
other times0 the researcher will ha%e complete latitude regarding the structure of the
report" #t a minimum0 the report should contain an astract0 prolem statement0
methods section0 results section0 discussion of the results0 and a list of references"
8alidity
$alidity refers to the accuracy or truthfulness of a measurement" #re we measuring
what we thin, we areY 4his is a simple concept0 ut in reality0 it is e9tremely
difficult to determine if a measure is %alid"
1; Basic Research Concets StatPac For Windows User's Manual
8ace %alidity is ased solely on the Hudgment of the researcher" Aach ;uestion is
scrutiniBed and modified until the researcher is satisfied that it is an accurate measure
of the desired construct" 4he determination of face %alidity is ased on the
suHecti%e opinion of the researcher"
Content validity is similar to face %alidity in that it relies on the Hudgment of the
researcher" <owe%er0 where face %alidity only e%aluates the indi%idual items on an
instrument0 content %alidity goes further in that it attempts to determine if an
instrument pro%ides ade;uate co%erage of a topic" A9pert opinions0 literature
searches0 and open-ended pretest ;uestions help to estalish content %alidity"
Criterion-related validity can e either predicti%e or concurrent" When a
dependentMindependent relationship has een estalished etween two or more
%ariales0 criterion-related %alidity can e assessed" # mathematical model is
de%eloped to e ale to predict the dependent %ariale from the independent
%ariale6s7" %redictive validity refers to the aility of an independent %ariale 6or
group of %ariales7 to predict a future %alue of the dependent %ariale" Concurrent
validity is concerned with the relationship etween two or more %ariales at the same
point in time"
Construct validity refers to the theoretical foundations underlying a particular scale
or measurement" !t e9plores the underlying theories or constructs that e9plain a
phenomenon" 4his is also ;uite suHecti%e and depends hea%ily on the
understanding0 opinions0 and iases of the researcher"
Relia"ility
Reliability is synonymous with repeataility" # measurement that yields consistent
results o%er time is said to e reliale" When a measurement is prone to random
error0 it lac,s reliaility" 4he reliaility of an instrument places an upper limit on its
%alidity" # measurement that lac,s reliaility will necessarily e in%alid" 4here are
three asic methods to test reliaility5 test-retest0 e;ui%alent form0 and internal
consistency"
# test-retest measure of reliaility can e otained y administering the same
instrument to the same group of people at two different points in time" 4he degree to
which oth administrations are in agreement is a measure of the reliaility of the
instrument" 4his techni;ue for assessing reliaility suffers two possile drawac,s"
8irst0 a person may ha%e changed etween the first and second measurement"
Second0 the initial administration of an instrument might in itself induce a person to
answer differently on the second administration"
4he second method of determining reliaility is called the e&uivalent-!orm techni;ue"
4he researcher creates two different instruments designed to measure identical
constructs" 4he degree of correlation etween the instruments is a measure of
e;ui%alent-form reliaility" 4he difficulty in using this method is that it may e %ery
difficult 6andMor prohiiti%ely e9pensi%e7 to create a totally e;ui%alent instrument"
4he most popular methods of estimating reliaility use measures of internal
consistency" When an instrument includes a series of ;uestions designed to e9amine
the same construct0 the ;uestions can e aritrarily split into two groups" 4he
correlation etween the two susets of ;uestions is called the split-al! reliaility"
4he prolem is that this measure of reliaility changes depending on how the
;uestions are split" # etter statistic0 ,nown as CronachDs alpha0 is ased on the
mean 6asolute %alue7 interitem correlation for all possile %ariale pairs" !t pro%ides
a conser%ati%e estimate of reliaility0 and generally represents the lower ound to the
reliaility of a scale of items" 8or dichotomous nominal data0 the E$-20 6Euder-
$ichardson7 is used instead of CronachDs alpha"
StatPac For Windows User's Manual Basic Research Concets 1'
Syste(atic and Rando( +rror
1ost research is an attempt to understand and e9plain variability" When a
measurement lac,s %ariaility0 no statistical tests can e 6or need e7 performed"
?ariaility refers to the dispersion of scores"
!deally0 when a researcher finds differences etween respondents0 they are due to true
difference on the %ariale eing measured" <owe%er0 the comination of systematic
and random errors can dilute the accuracy of a measurement" Systematic error is
introduced through a constant ias in a measurement" !t can usually e traced to a
fault in the sampling procedure or in the design of a ;uestionnaire" Random error
does not occur in any consistent pattern0 and it is not controllale y the researcher"
For(ulatin% 5yotheses fro( Research @uestions
4here are asically two ,inds of research ;uestions5 testale and non-testale"
'either is etter than the other0 and oth ha%e a place in applied research"
A9amples of non-testale ;uestions are5
'ow do managers !eel about te reorganization(
)at do residents !eel are te most important problems !acing te community(
$espondentsD answers to these ;uestions could e summariBed in descripti%e tales
and the results might e e9tremely %aluale to administrators and planners" &usiness
and social science researchers often as, non-testale research ;uestions" 4he
shortcoming with these types of ;uestions is that they do not pro%ide oHecti%e cut-
off points for decision-ma,ers"
!n order to o%ercome this prolem0 researchers often see, to answer one or more
testale research ;uestions" 'early all testale research ;uestions egin with one of
the following two phrases5
*s tere a signi!icant di!!erence between ...(
*s tere a signi!icant relationsip between ...(
8or e9ample5
*s tere a signi!icant relationsip between te age o! managers and teir attitudes
towards te reorganization(
*s tere a signi!icant di!!erence between wite and minority residents wit respect to
wat tey !eel are te most important problems !acing te community(
# research hypothesis is a testale statement of opinion" !t is created from the
research ;uestion y replacing the words +*s tere+ with the words +,ere is+0 and
also replacing the ;uestion mar, with a period" 4he hypotheses for the two sample
research ;uestions would e5
,ere is a signi!icant relationsip between te age o! managers and teir attitudes
towards te reorganization.
,ere is a signi!icant di!!erence between wite and minority residents wit respect to
wat tey !eel are te most important problems !acing te community.
!t is not possile to test a hypothesis directly" !nstead0 you must turn the hypothesis
into a null hypothesis" 4he null hypothesis is created from the hypothesis y adding
the words OnoO or OnotO to the statement" 8or e9ample0 the null hypotheses for the
two e9amples would e5
&> Basic Research Concets StatPac For Windows User's Manual
,ere is no signi!icant relationsip between te age o! managers and teir attitudes
towards te reorganization.
,ere is no signi!icant di!!erence between wite and minority residents wit respect
to wat tey !eel are te most important problems !acing te community.
#ll statistical testing is done on the null hypothesis"""ne%er the hypothesis" 4he result
of a statistical test will enale you to either 17 reHect the null hypothesis0 or 27 fail to
reHect the null hypothesis" 'e%er use the words Oaccept the null hypothesisO"
:ye I and :ye II +rrors
4here are two types of hypothesis testing errors" 4he first one is called a ,ype *
error" 4his is a %ery serious error where you wrongly reHect the null hypothesis"
Suppose that the null hypothesis is5 @aily administrations of drug #&C will not help
patients" #lso suppose that drug #&C is really a %ery ad drug0 and it causes
permanent rain damage to people o%er -0" !n your research0 you as, for %olunteers0
and the entire sample is under -0 years of age" 4he sample seems to impro%e and
you reHect the null hypothesis" 4here could e %ery serious conse;uences if you were
to mar,et this drug 6ased on your sample7" 4ype ! errors are often caused y
sampling prolems"
# ,ype ** error is less serious0 where you wrongly fail to reHect the null hypothesis"
Suppose that drug #&C really isnDt harmful and does actually help many patients0 ut
se%eral of your %olunteers de%elop se%ere and persistent psychosomatic symptoms"
Jou would proaly not mar,et the drug ecause of the potential for long-lasting
side effects" >sually0 the conse;uences of a 4ype !! error will e less serious than a
4ype ! error"
:yes of $ata
:ne of the most important concepts in statistical testing is to understand the four
asic types of data5 nominal0 ordinal0 inter%al0 and ratio" 4he ,inds of statistical tests
that can e performed depend upon the type of data you ha%e" @ifferent statistical
tests are used for different types of data"
'ominal and ordinal data are nonparametric 6non-continuous or categorical7"
!nter%al and ratio scales are called parametric 6continuous7" Some statistical tests are
called parametric tests ecause they use parametric data" :thers are called
nonparametric tests ecause they use nonparametric data" #ll statistical tests are
designed to e used with a specific ,ind of data0 and may only e performed when
you ha%e that ,ind of data"
Nominal data
'ominal data is characteriBed y non-ordered response categories"
+1amples of nominal data
What is your se9Y
XXXX 1ale XXXX 8emale
What program are you inY
XXX #dministrationM1anagement
XXX <ealth Ser%ices
StatPac For Windows User's Manual Basic Research Concets &1
XXX Aducation
XXX <uman Ser%ices
@o you ha%e health insuranceY
XXX Jes XXX 'o XXX @onDt ,now
What school did you attendY
XXX Par, Alementary
XXX West Side
XXX :ther
What should e done with the programY
XXX Close it down
XXX See, go%ernment funding
XXX <old a pri%ate fund raiser
XXX :ther
What state do you li%e inY XXXXXXXXXXXXXXXXXXXXXXXXX
'ote5 4his ;uestion is called an open-ended ;uestion ecause it calls for a %eratim
response" A%en though the categories 6i"e"0 the states7 are not listed0 the ;uestion is
still considered nominal ecause the data can e categoriBed after it is collected"
Which of the following meats ha%e you eaten in the last wee,Y 6Chec, all that
apply7
XXX <amurger XXX Pot roast XXX .i%er
XXX <otdogs XXX &acon XXX Stea,
XXX Por, chops XXX Sausage XXX :ther
'ote5 4his ;uestion is called a multiple response item ecause respondents can chec,
more than one category" 1ultiple response simply means that a respondent can
ma,e more than one response to the same ;uestion" 4he data is still nominal ecause
the responses are non-ordered categories"
What are the two most important issues facing our country todayY
XXXXXXXXXXXXXXXXXXXXXXXX and XXXXXXXXXXXXXXXXXXXXXXXX
'ote5 4his ;uestion is an open-ended multiple response item ecause it calls for two
%eratim responses" !t is still considered nominal data ecause the issues could e
categoriBed after the data is collected"
Ordinal data
:rdinal data is characteriBed y ordered response categories"
+1amples of ordinal data
What is your highest le%el of educationY
XXX Frade school
XXX Some high school
XXX <igh school graduate
XXX Some college
XXX College graduate
&& Basic Research Concets StatPac For Windows User's Manual
XXX #d%anced degree
<ow many eers ha%e you drun, in the last wee,Y
XXX 'one XXX :ne to fi%e XXX Si9 to ten XXX :%er ten
<ow would you rate your progressY
XXX A9cellent
XXX Food
XXX 8air
XXX Poor
What has the trend een in your usiness o%er the past yearY
XXX @ecreasing XXX Stale XXX !ncreasing
Please rate the ;uality of this lectureY
XXX .ow XXX 1edium XXX <igh
>se a circle to indicate your le%el of agreement or disagreement with the following
statement5 #ortion should e a decision etween a woman and her doctor"
Strongly Strongly
#gree #gree 'eutral @isagree @isagree
1 2 3 3 2
What is your annual family incomeY
XXX >nder Z120000
XXX Z120000 to Z230999
XXX Z230000 to Z390999
XXX Z200000 to Z)30999
XXX Z)20000 or more
Interval and ratio data
!nter%al and ratio data are such that each numeric interval represents one unit of
measurement" Ratio scales also ha%e the property of an asolute OBero-pointO"
*nterval and ratio-scaled ;uestions are preferale in research design ecause they
offer the most %ersatility in the ,inds of analyses that may e performed"
+1amples of interval and ratio data
What is your ageY XXXXXXX
<ow many children do you ha%eY XXXXXXXX
What was your S#4 scoreY XXXXXXXX
<ow many years of school ha%e you completedY XXXXXXX
What percent of your wor, time do you spend """" Y XXXXXXX
<ow many collecti%e argaining sessions ha%e you een in%ol%ed inY XXXXXX
What is the a%erage class siBe in your schoolY XXXXXXXX
What was your family income last yearY XXXXXXXXXXX
<ow many units ha%e you completedY 6Circle7 0 1 2 3
StatPac For Windows User's Manual Basic Research Concets &1
What was your FP# as an undergraduate studentY XXXXX
<ow many times ha%e you een arrestedY XXXXX
Si%nificance
What does significance really meanY
1any researchers get %ery e9cited when they ha%e disco%ered a OsignificantO
finding0 without really understanding what it means" When a statistic is significant0
it simply means that you are %ery sure that the statistic is reliale" !t doesnDt mean
the finding is important"
8or e9ample0 suppose we gi%e 10000 people an !C test0 and we as, if there is a
significant difference etween male and female scores" 4he mean score for males is
9( and the mean score for females is 100" We use an independent groups t-test and
find that the difference is significant at the "001 le%el" 4he ig ;uestion is0 OSo
whatYR 4he difference etween 9( and 100 on an !C test is a %ery small
difference"""so small0 in fact0 that itNs not e%en important"
4hen why did the t-statistic come out significantY &ecause there was a large sample
siBe" When you ha%e a large sample siBe0 %ery small differences will e detected as
significant" 4his means that you are %ery sure that the difference is real 6i"e"0 it didnDt
happen y flu,e7" !t doesnDt mean that the difference is large or important" !f we had
only gi%en the !C test to 22 people instead of 100000 the two-point difference
etween males and females would not ha%e een significant"
Significance is a statistical term that tells how sure you are that a difference or
relationship e9ists" 4o say that a significant difference or relationship e9ists only
tells half the story" We might e %ery sure that a relationship e9ists0 ut is it a strong0
moderate0 or wea, relationshipY #fter finding a significant relationship0 it is
important to e%aluate its strength" Significant relationships can e strong or wea,"
Significant differences can e large or small" !t Hust depends on your sample siBe"
1any researchers use the word OsignificantO to descrie a finding that may ha%e
decision-ma,ing utility to a client" 8rom a statisticianDs %iewpoint0 this is an incorrect
use of the word" <owe%er0 the word OsignificantO has %irtually uni%ersal meaning to
the pulic" 4hus0 many researchers use the word OsignificantO to descrie a difference
or relationship that may e strategically important to a client 6regardless of any
statistical tests7" !n these situations0 the word OsignificantO is used to ad%ise a client to
ta,e note of a particular difference or relationship ecause it may e rele%ant to the
companyDs strategic plan" 4he word OsignificantO is not the e9clusi%e domain of
statisticians and either use is correct in the usiness world" 4hus0 for the statistician0
it may e wise to adopt a policy of always referring to Ostatistical significanceO rather
than simply OsignificanceO when communicating with the pulic"
3ne9:ailed and :wo9:ailed :ests
:ne important concept in significance testing is whether to use a one-tailed or two-
tailed test of significance" 4he answer is that it depends on your hypothesis" When
your research hypothesis states 6or implies7 the direction of the difference or
relationship0 then you use a one-tailed proaility" 8or e9ample0 a one-tailed test
would e used to test these null hypotheses5 8emales will not score significantly
higher than males on an !C test" &lue collar wor,ers will not ha%e significantly
lower education than white collar wor,ers" Superman is not significantly stronger
than the a%erage person" !n each case0 the null hypothesis 6indirectly7 predicts the
&) Basic Research Concets StatPac For Windows User's Manual
direction of the e9pected difference" # two-tailed test would e used to test these
null hypotheses5 4here will e no significant difference in !C scores etween males
and females" 4here will e no significant difference etween lue collar and white
collar wor,ers" 4here is no significant difference in strength etween Superman and
the a%erage person" # one-tailed proaility is e9actly half the %alue of a two-tailed
proaility"
4here is a raging contro%ersy 6for aout the last hundred years7 on whether or not it
is e%er appropriate to use a one-tailed test" 4he rationale is that if you already ,now
the direction of the difference0 why other doing any statistical tests" 4he safest et
is to always state your hypotheses so that two-tailed tests are appropriate"
Procedure for Si%nificance :estin%
Whene%er we perform a significance test0 it in%ol%es comparing a test %alue that we
ha%e calculated to some critical %alue for the statistic" !t doesnDt matter what type of
statistic we are calculating 6e"g"0 a t-statistic0 a chi-s;uare statistic0 an 8-statistic0
etc"70 the procedure to test for significance is the same"
1" @ecide on the critical alpa level 67 you will use 6i"e"0 the error rate you are
willing to accept7"
2" Conduct the research"
3" Calculate the statistic"
3" Compare the statistic to a critical value otained from a tale or compares the
proaility of the statistic to the critical alpa level"
!f your statistic is higher than the critical value from the tale or the proaility of
the statistic is less than the critical alpha le%el5
Jour finding is significant"
Jou reHect the null hypothesis"
4he proaility is small that the difference or relationship happened
y chance0 and p is less than the critical alpha le%el 6p [ 7"
!f your statistic is lower than the critical value from the tale or the proaility of the
statistic is higher than the critical alpha le%el5
Jour finding is not significant"
Jou fail to reHect the null hypothesis"
4he proaility is high that the difference or relationship happened
y chance0 and p is greater than the critical alpha le%el 6p \ 7"
1odern computer software can calculate e9act proailities for most test statistics"
When StatPac 6or other software7 gi%es you an e9act proaility0 simply compare it
to your critical alpha le%el" !f the e9act proaility is less than the critical alpha
le%el0 your finding is significant0 and if the e9act proaility is greater than your
critical alpha le%el0 your finding is not significant" >sing a tale is not necessary
when you ha%e the e9act proaility for a statistic"
StatPac For Windows User's Manual Basic Research Concets &!
Bonferroni's :heore(
&onferroniDs theorem states that as one performs an increasing numer of statistical
tests0 the li,elihood of getting an erroneous significant finding 64ype ! error7 also
increases" 4hus0 as we perform more and more statistical tests0 it ecomes
increasingly li,ely that we will falsely reHect a null hypothesis 6%ery ad7"
8or e9ample0 suppose our critical alpha le%el is "02" !f we performed one statistical
test0 our chance of ma,ing a false statement is "02" !f we were to perform 100
statistical tests0 and we made a statement aout the result of each test0 we would
e9pect fi%e of them to e wrong 6Hust y flu,e7" 4his is a rather undesirale situation
for social scientist"
&onferroniDs theorem states that we need to adHust the critical alpha le%el in order to
compensate for the fact that weDre doing more than one test" 4o ma,e the adHustment0
ta,e the desired critical alpha le%el 6e"g"0 "027 and di%ide y the numer of tests eing
performed0 and use the result as the critical alpha le%el" 8or e9ample0 suppose we
had a test with eight scales0 and we plan to compare males and females on each of
the scales using an independent groups t-test" We would use "00-22 6"02M(7 as the
critical alpha le%el for all eight tests"
&onferroniDs theorem should e applied whene%er you are conducting two or more
tests that are of the same OtypeO and the same OfamilyO" 4he same OtypeO means the
same ,ind of statistical test" 8or e9ample0 if you were going to do one t-test0 one
#':?#0 and one regression0 you would not ma,e the adHustment ecause the tests
are all different" 4he same OfamilyO is a more elusi%e concept0 and there are no hard
and fast rules" O8amilyO refers to a series of statistical tests all designed to test the
same 6or %ery closely related7 theoretical constructs" 4he ottom line is that itDs up to
the indi%idual researcher to decide what constitutes a OfamilyO"
Some things are more o%ious than others0 for e9ample0 if you were doing t-tests
comparing males and females on a series of ;uestionnaire items that are all part of
the same scale0 you would proaly apply the adHustment0 y di%iding your critical
alpha le%el y the numer of items in the scale 6i"e"0 the numer of t-tests you
performed on that scale7" 4he proailities of the tests would e called the !amily
error rates" <owe%er0 suppose you ha%e a series of independent ;uestions0 each
focusing on a different construct and you want to compare males and females on how
they answered each ;uestion" <ere is where the whole idea of &onferroniDs
adHustment ecomes philosophical" !f you claim that each t-test that you perform is a
test of a uni;ue OminiO-hypothesis0 then you would not use the adHustment0 ecause
you ha%e defined each ;uestion as a different OfamilyO" !n this case0 the proaility
would e called a statement error rate" #nother researcher might call the entire
;uestionnaire a OfamilyO0 and she would di%ide the critical alpha y the total numer
of items on the ;uestionnaire"
Why stop thereY 8rom a statisticianDs perspecti%e0 the situation ecomes e%en more
comple9" Since they are personally in the Ostatistics usinessO0 what should they call
a OfamilyOY When a statistician does a t-test for a client0 maye she should e
di%iding the critical alpha y the total numer of t-tests that she has done in her life0
since that is a way of loo,ing at her OfamilyO" :f course0 this would result in a
different adHustment for each statistician--an interesting dilemma"
!n the real world0 most researchers do not use &onferroniDs adHustment ecause they
would rarely e ale to reHect a null hypothesis" 4hey would e so concerned aout
the possiility of ma,ing a false statement0 that they would o%erloo, many
differences and relationships that actually e9ist" 4he Oprime directi%eO for social
science research is to disco%er relationships" :ne could argue that it is etter to ris,
ma,ing a few wrong statements0 than to o%erloo, relationships or differences that are
&* Basic Research Concets StatPac For Windows User's Manual
clear or prominent0 ut donDt meet critical alpha significance le%el after applying
&onferroniDs adHustment"
Central :endency
4he est ,nown measures of central tendency are the mean and median" 4he mean
a%erage is found y adding the %alues for all the cases and di%iding y the numer of
cases" 8or e9ample0 to find the mean age of all your friends0 add all their ages
together and di%ide y the numer of friends" 4he mean a%erage can present a
distorted picture of central tendency if the sample is s,ewed in any way"
8or e9ample0 letDs say fi%e people ta,e a test" 4heir scores are 100 120 130 1(0 and 93"
64he last person is a genius"7 4he mean would e the sums of the scores
10]12]13]1(]93 di%ided y 2" !n this e9ample0 a mean of 29"- is not a good
measure of how well people did on the test in general" When analyBing data0 e
careful of using only the mean a%erage when the sample has a few %ery high or %ery
low scores" 4hese scores tend to s,ew the shape of the distriution and will distort
the mean"
When you ha%e sampled from the population0 the mean of the sample is also your
est estimate of the mean of the population" 4he actual mean of the population is
un,nown0 ut the mean of the sample is as good an estimate as we can get"
4he median pro%ides a measure of central tendency such that half the sample will e
ao%e it and half the sample will e elow it" 8or s,ewed distriutions this is a etter
measure of central tendency" !n the pre%ious e9ample0 13 would e the median for
the sample of fi%e people" !f there is no middle %alue 6i"e"0 there are an e%en numer
of data points70 the median is the %alue midway etween the two middle %alues"
4he distriution of many %ariales follows that of a ell-shaped cur%e" 4his is called
a Onormal distriutionO" :ne must assume that data is appro9imately normally
distriuted for many statistical analyses to e %alid" When a distriution is normal0
the mean and median will e e;ual to each other" !f they are not e;ual0 the
distriution is distorted in some way"
8aria"ility
?ariaility is synonymous with di%ersity" 4he more di%ersity there is in a set of data0
the greater the %ariaility" :ne simple measure of di%ersity is the range 6ma9imum
%alue minus the minimum %alue7" 4he range is generally not a good measure of
%ariaility ecause it can e se%erely affected y a single %ery low or high %alue in
the data" # etter method of descriing the amount of %ariaility is to tal, aout the
dispersion of scores away from the mean"
4he %ariance and standard de%iation are useful statistics that measure the dispersion
of scores around the mean" 4he standard de%iation is simply the s;uare root of the
%ariance" &oth statistics measure the amount of di%ersity in the data" 4he higher the
statistics0 the greater the di%ersity" :n the a%erage0 -( percent of all the scores in a
sample will e within plus or minus one standard de%iation of the mean and 92
percent of all scores will e within two standard de%iations of the mean"
4here are two formulas for the %ariance and standard de%iation of a sample" :ne set
of formulas calculates the e9act %ariance and standard de%iation of the sample" 4he
statistics are called biased0 ecause they are iased to the sample" 4hey are the e9act
%ariance and standard de%iation of the sample0 ut they tend to underestimate the
%ariance and standard de%iation of the population"
StatPac For Windows User's Manual Basic Research Concets &-
Fenerally0 we are more concerned with descriing the population rather than the
sample" :ur intent is to use the sample to descrie the population" 4he unbiased
estimates should e used when sampling from the population and inferring ac, to
the population" 4hey pro%ide the est estimate of the %ariance and standard
de%iation of the population"
Standard +rror of the Mean
4he standard error of the mean is used to estimate the range within which we would
e9pect the mean to fall in repeated samples ta,en from the population 6i"e"0
confidence inter%als7" 4he standard error of the mean is an estimate of the standard
de%iation of those repeated samples"
4he formula for the standard error of the mean pro%ides an accurate estimate when
the sample is %ery small compared to the siBe of the population" !n mar,eting
research0 this is usually the case since the populations are ;uite large" <owe%er0
when the sample siBe represents a sustantial portion of the population0 the formula
ecomes inaccurate and must e corrected" 4he finite population correction factor is
used to correct the estimate of the standard error when the sample is more than ten
percent of the population"
Inferences with S(all Sa(le Si?es
When the sample siBe is small 6less than 3070 the z %alue for the area under the
normal cur%e is not accurate" !nstead of a z %alue0 we can use a t %alue to deri%e the
area under the cur%e" !n fact0 many researchers always use the t %alue instead of the
z %alue" 4he reason is that the t %alues are more accurate for small sample siBes0 and
they are nearly identical to the z %alues for large sample siBes" >nli,e the z %alue0 the
%alues for t depend upon the numer of cases in the sample" @epending on the
sample siBe0 the t %alue will change"
$e%rees of Freedo(
@egrees of freedom literally refers to the numer of data %alues that are free to %ary"
8or e9ample0 suppose ! tell you that the mean of a sample is 100 and there are a total
of three %alues in the sample" !t turns out that if ! tell you any two of the %alues0 you
will always e ale to figure out the third %alue" !f two of the %alues are ( and 120
you can calculate that the third %alue is 10 using simple algera"
-x . / . 101 2 3 4 15 x 4 15
!n other words0 if you ,now the mean0 and all ut one %alue0 you can figure out the
missing %alue" #ll the %alues e9cept one are free to %ary" :ne %alue is set once the
others are ,nown" 4hus0 degrees of freedom is e;ual to n-1"
&; Basic Research Concets StatPac For Windows User's Manual
Code"oo# $esi%n
Co(onents of a Study $esi%n
#ll sur%eys egin y creating a codebook" 4he codeoo, contains the format and
laels of each %ariale" !f your sur%ey contains 20 items0 the codeoo, will also
contain 20 items"
!f the sur%ey will e administered y paper and pencil or C#4! there will also e a
data entry form" 4he form refers to the screens that the data entry person will see
while entering and editing data" 4he codeoo, and form usually ha%e the same file
names" :nly the file e9tensions are different"
!f the sur%ey will e administered o%er the !nternet or as an e-mail sur%ey0 a data
entry form is not necessary"
4here are many ways to design the codeoo, and form" 4he est way depends upon
whether or not you already ha%e typed the sur%ey with a word-processor" When you
run the program0 the main screen will e displayed" 4he left side of the screen is for
the Wor,space window and the right side of the screen is used to show the list of
%ariales in the codeoo,"
+le(ents of a 8aria"le
4he codeoo, defines the %ariales in the study" Aach item on the sur%ey is a
%ariale" 4hus0 the numer of %ariales in the codeoo, is the same as the numer of
items" 6'ote that se%eral %ariales are re;uired to define a multiple response item0 so
the numer of %ariales in the codeoo, might actually e9ceed the numer of items
on the sur%ey"7
4here are fi%e components to a %ariale" 4hese are5
?ariale 8ormat
?ariale 'ame
?ariale .ael
?alue .aels 6including %alid codes and s,ip codes7
@ata Antry Control Parameters
4he ?ariale 8ormat is mandatory ecause it defines where and how the data is
stored in the data file" #ll other components are optional"
8aria"le For(at
4he ?ariale 8ormat defines the structure of the %ariale" 4his is the only
information that is mandatory when defining a new %ariale" :nce you define the
structure of a %ariale0 it will e9ist in the codeoo,"
4he synta9 for the ?ariale 8ormat is5
[?ar" 4ype\ ['o" of Cols\ " [@ecimal\
4he following are e9amples of %ariale formats" 4he word QcolumnsR refers to the
numer of characters that will e a%aille to hold the respondentNs answerM5
'2 a numeric %ariale using 2 columns
'2"2 a numeric %ariale using 2 columnsW
the format of the %ariale will e //"//
'2 a numeric %ariale using 2 columns
#1 an alpha %ariale using 1 column
#220 an alpha %ariale using 220 columns
Variable Type
StatPac has two types of %ariales5 numeric and alpha" @ifferent analyses can e
performed depending on the %ariale type" StatPac re;uires that a %ariale type e
specified as either ' or #"
'umeric %ariales may contain numers0 a decimal point0 a plus or minus sign and a
@ or A if scientific notation is used" #lpha %ariales may contain any character
6letters0 numers and special characters7" StatPac automatically left Hustifies alpha
%ariales and right Hustifies numeric %ariales"
#n e9ample of a numeric %ariale might e the following ;uestion on a sur%ey5
'ow many years o! !ormal education ave you completed(
4he response would always e a numer that could e contained in two columns of
the data file" 4he response would also always e numeric" # numeric-type
specification is re;uired for inter%al or ratio-type-data"
1> /eywords StatPac For Windows User's Manual
Some ;uestions ha%e coded responses and could use the alpha-type format" #n
e9ample of alpha-type ;uestion on a sur%ey would e5
)ic product do you pre!er(
6 4 %roduct 6
7 4 %roduct 7
C 4 %roduct C
N 4 No pre!erence
!n this ;uestion0 the responses are coded into categories" 4he categories are not
arithmetically related" 4hat is0 a response of C does not mean twice as much product
as response #" 'ominal and ordinal-type data can use either an alpha or numeric
format"
#nother e9ample of an alpha %ariale would e an open-ended response" 4he
respondent could answer anything to the following ;uestion5
)at could we do to improve our product(
.i,ert-scale ;uestions and preference scales are often gi%en a numeric format so that
descripti%e statistics can e calculated" 4his is a generally accepted procedure in
mar,eting and social science research0 the assumption eing that the percei%ed
inter%als etween the selections are e;ual"
Number of Columns
4he numer of columns component of the format statement is the field width
allocated for the %ariale" 4his is the numer of characters needed to write the
longest data %alue" 4here is not a ma9imum numer of columns for an alpha
%ariale0 although the practical limit for data entry is 10000 - 20000 characters" 8or a
numeric %ariale0 the ma9imum numer of columns is 22 characters"
4he field width for numeric %ariales must e large enough to hold the numer0 a
plus or minus sign0 and a decimal point 6if necessary7" 8or e9ample0 a numeric one-
to-ten scale would re;uire two charactersW racing times for a hundred meter sprint
6with accuracy to the hundredth of a second7 would re;uire fi%e characters 6two for
the seconds0 one for the decimal point0 and two for the hundredths of seconds7" #n
alpha %ariale to hold an entire open-ended sentence might re;uire 120 characters"
!t is %ery important that you lea%e a sufficient numer of columns for your data"
#fter you egin entering data0 changing the numer of columns for a %ariale will
ecome more comple9 6since this re;uires restructuring of the data already entered7"
>ser 4ip5 When in dout0 allow more columns rather than less"
Decimal Places
4he decimal format is the numer of significant decimal places that the %ariale will
contain" 4his component of the format statement is optional and may e omitted" !f
8decimal9 is not specified0 the data will e stored e9actly as entered 6with or
without a decimal point7" !n the format statement itself0 the numer of decimal digits
is preceded y a decimal point"
8aria"le 7a(e
4he %ariale name is simply a name that may e used to reference the %ariale when
designing analyses" While the %ariale name is optional0 its use is highly
recommended" #s a general rule0 the %ariale name is a short word or are%iation"
!ts primary purpose is to help you ,eep trac, of %ariales while designing analyses"
StatPac For Windows User's Manual /eywords 11
4here are se%eral rules go%erning %ariale names" #ll of these are automatically
chec,ed y StatPac so it will not e possile to enter an in%alid %ariale name"
1" # %ariale name must e uni;ue from all other %ariale names and may not e the
same as any analysis ,eyword" 64he ,eywords are listed in another section of the
manual"7
2" 4he first character of a %ariale name may not e a numer or a space"
3" # %ariale name may not e the same as a ? numer" 8or e9ample0 you cannot
name a %ariale O?12O"
3" # %ariale name may not contain a comma or period" 4he %ariale name may
include a spaceW howe%er0 for the purpose of clarity0 we recommend using an
underscore character instead of a space"
2" # %ariale name may not e @0 A0 $AC:$@0 4!1A0 .:0 <!0 W!4<0 &J0 4<A'0
4:4#. or 1A#'" 4hese words ha%e special meaning to StatPac"
8aria"le .a"el
4he %ariale lael is a written description of the %ariale" 8or sur%eys0 the %ariale
lael is usually the ;uestion itself" 4here are no restrictions on the content or length
of a %ariale lael" !t may contain any character on the ,eyoard"
When creating a series of multiple response %ariales0 identical %ariale laels
should e used for each of the multiple response items" 4his tells StatPac how to
format the data entry form0 and therey impro%es data entry"
8alue .a"els
?alue laels are used in the reports to lael the response categories" 4hey may
include any upper or lower case character e9cept a semicolon" 4he format for a %alue
lael is5
8Code948:abel9
4he code on the left of the e;uals sign is what will e typed during data entry" 4he
lael on the right of the e;uals sign is the de!inition of the code and will e used to
lael the output"
!n the following e9ample0 there are four %alue laels" 4hese are entered as four
separate lines"
14; years or less
04< to = years
3415 to 10 years
>4Over 10 years
4here are no spaces etween the code and the e;uals sign" 4here are also no spaces
etween the e;uals sign and the lael" 4he code on the left of the e;uals sign may not
e greater than the field width defined in the format statement" 4here is not a limit on
the length of the %alue lael 6on the right of the e;uals symol7W howe%er0 short %alue
laels 620 or fewer characters7 generally produce more condensed and easier to read
printouts"
8or alpha %ariales0 it is important to note that upper and lower case characters are
different" When you enter the code on the left of the e;uals sign0 the code should e
the same case as you plan to enter the data" 8or e9ample0 if the data entry person will
e entering a lower case m and f for male and female0 the %alue laels would e5
m4?ale
1& /eywords StatPac For Windows User's Manual
!4@emale
4he %alue laels also define what will e accepted as %alid data during data entry"
Whenever a value label is specified% the code 2on the left of the e3uals si/n4 will
be interpreted as a valid code durin/ data entry. If no value labels are specified%
all data will be considered valid.
1any %ariales do not need any %alue laels" They are re3uired only when a
coded response will be entered. 'umeric inter%al and ratio data0 as well as open
ended alpha data0 do not re;uire any %alue laels"
4he following ;uestions would not need %alue laels5
)at is your age(
What is your first nameY
What score did you get on the testY
What is your fa%orite numerY
What would est descrie your feelingsY
8alid Codes
When there are no %alue laels 6such as a test score %ariale70 %alid codes for data
entry can still e specified y simply typing the %alid codes or ranges" 4he format
for entering %alid codes is5
8Code or Range9
[Code or $ange\
[Code or $ange\
!n this case0 each %alid code 6or %alid range7 is entered on a different line"
#lternately0 a slash 6M7 may e used to list a series of %alid codes on the same line5
8Code or Range928Code or Range928Code or Range9
4he following e9amples illustrate %arious ways to specify %alid codes"
1232A accept codes 1B 3 C A
1-3 accept codes 1 to 3
1-3M2 accept 1 to 3 = 2
12-99 accept %alues 12 to 99
#-@ accept codes #0 &0 C and @
#-@M* accept codes #0 &0 C0 @ and *
/ accept anything
'otice that the pound symol 6/7 is used to specify Oaccept any numer or letter
during data entryO" !f the field is numeric0 this means any numer is an acceptale
%alue" !f the field is alpha0 it means that any character is acceptale input"
When the %alid codes0 laels0 and s,ips field is completely empty0 any input will e
accepted 6i"e"0 it is the same as the / symol7" !f the pounds symol is specified0 it
should e the last line of the %alue laels for the %ariale"
StatPac For Windows User's Manual /eywords 11
S#i Codes for Branchin%
Skip codes allow you to specify conditions for passing o%er certain %ariales during
data entry depending on the %alues entered for other %ariales" 4his is commonly
referred to as brancing"
8or instance0 if %ariale - contains responses to the ;uestion O<a%e you e%er read
1usic 1agaBineYO and %ariale ) stored answers to the ;uestion O<ow much do you
li,e 1usic 1agaBineYO0 you would want to s,ip to %ariale ( for a person who
responded O'oO to %ariale -"
# semicolon and Oranch toO numer may e used on a 8Code948:abel9 line to
control data entry ranching" 8or the 1usic 1agaBine e9ample ao%e0 the %alue
laels would e5
D4Des
N4No E/
'ote that the semicolon and %ariale to ranch to follow the %alue lael" !n this
e9ample0 the space efore the semicolon is for readaility only" #ll of the following
lines are e;ui%alent5
N4NoE/
N4No E/
N4No E /
#s another e9ample0 consider a ;uestionnaire that includes a OdwellingO %ariale for
which 1^#partment0 2^Condominium0 and 3^<ouse" !f three separate sections
within the ;uestionnaire corresponded to each type of dwelling0 the %alue laels and
skip codes for the dwelling %ariale could e5
146partment E1>
04Condominium E03
34'ouse E0=
4he skip codes would direct data entry to %ariales 130 23 or 29 depending on
whether a 10 2 or 3 was entered" #gain note that the spacing is for readaility only"
4he pound symol 6/7 may e used in a skip code to mean any %alue or code" 4hat
is0 it is an asolute Hump to a %ariale regardless of the data entered" 8or e9ample0
/^W13 means to Hump to %ariale 13 after entering the current field" 4his feature is
useful when you want to end a ranch and reHoin with a common %ariale0 as in the
dwelling e9ample ao%e"
Comple9 ranching is also supported" 4his means that a ranch can ased on the
response to a pre%ious %ariale" 4he following is an e9ample of how to use comple9
ranching" #ssume it is the %alue laels for %ariale 10" !f the data for %ariale 10 is
entered as a 1 or 20 the comple9 s,ip will e e%aluated" !n this e9ample0 the s,ip
pattern is the same regardless of whether a 1 or 2 is entered" !f the pre%ious response
to %ariale 2 was 1 then the s,ip will go to %ariale 220 and if the pre%ious response
to %ariale 2 was 2 then the s,ip will go to %ariale 30" # response of 3 for this
%ariale would s,ip to %ariale 32"
14Des E F$A41 E 0A F$A40 E 35
04No E F$A41 E 0A F$A40 E 35
34No 6nswer E 3A
'ote that a semicolon is used to egin the comple9 s,ip and efore each Os,ip toO
%ariale" #lso note that a pound symol is used to start each portion of the comple9
s,ip" #ll spacing is optional" Comple9 s,ip patterns are not automatically updated if
1) /eywords StatPac For Windows User's Manual
you insert or delete a %ariale from the codeoo," 4herefore0 they are generally
added after the structure of the codeoo, has een finaliBed"
!f you specify a skip to a none9istent %ariale numer0 it will e interpreted as an
instruction to ranch to the end of the ;uestionnaire" 8or e9ample0 if you ha%e a
sur%ey with fifty ;uestions0 a skip to %ariale ninety-nine would mean to
immediately end the current ;uestionnaire0 and egin a new inter%iew with the ne9t
respondent"
&e careful when defining skip codes0 as it is ;uite possile to create an endless data
entry loop"
$ata +ntry Control Para(eters
4he @ata Antry Control parameters determine how the data entry program will
operate" 4hey can e set independently for each %ariale0 and are all of the yesMno
%ariety"
Missin% 3/
4he decision whether or not to allow missing data for a particular %ariale depends
upon the %ariale itself" 8or e9ample0 !@ numer may e something you want to
ma,e mandatory during data entry 6no missing data will e allowed7" Some %ariales
howe%er0 should accept missing data" 8or e9ample0 in sur%eys0 respondents may
lea%e ;uestions lan, or simply prefer not to answer othersW in agricultural research0
some of the crop diesW in pulic health research0 participants mo%e0 etc" When in
dout0 missing data should e allowed" 4his only means that the data entry person
will e ale to s,ip o%er this %ariale if they need to"
8or !nternet sur%eys0 we strongly recommend allowing missing data for all %ariales"
4he ease in which a person can lea%e an !nternet sur%ey ma,es it e9ceedingly
important that they not ecome frustrated y the process" $e;uiring input when a
respondent does not wish to answer an item will most assuredly result in the partially
completed sur%ey"
0uto 0d,ance
When the #uto #d%ance is set0 the cursor will automatically mo%e to the ne9t field
when the current field is filled with characters" 4his means that during the data entry
process0 if you type the same numer of characters that were reser%ed for field width
6in the format statement70 you will not need to press 8enter9 to mo%e to the ne9t
field" 4his will significantly speed up the data entry process since it eliminates a
,eystro,e 6i"e"0 8enter97 for each %ariale" 4his parameter will e ignored for
!nternet sur%eys"
Cas 3nly
4he Caps :nly parameter determines whether the characters typed on the ,eyoard
will e con%erted to upper case letters in the data file" 4his is especially useful if a
field is coded alpha0 and you do not want the data entry operator to e ale to
inad%ertently enter lower case characters" !t is identical to using the caps loc, on
your ,eyoard" 4his parameter will e ignored for !nternet sur%eys"
StatPac For Windows User's Manual /eywords 1!
Code"oo# :ools
4here are two main tools for entering and changing the information in the codeoo,5
the Frid and the ?ariale @etail" Aither tool may e used at any time" Fenerally0 the
Frid is used when you are eginning a new codeoo,0 and the ?ariale @etail is used
to ma,e changes to indi%idual %ariales" 4here is also an #nalysis utility program
QCuic, Codeoo, CreationR to create a codeoo, from an e9tended format
statement"
:he Grid
:ne method of designing a codeoo, is to use the Frid" Clic, on the Frid utton and
the Frid will e displayed"
# row in the Frid represents a %ariale" !f your study has 20 %ariales0 there will e
20 rows in the Frid" When you start the Frid0 only one row will e showing" 1ore
rows will appear as needed as you enter the codeoo," When you enter a %ariale
format for the current %ariale0 a lan, row for a new %ariale will appear"
4o egin entering information into the Frid0 clic, in the name field of the first row"
>se the 4a ,ey and Shift 4a ,eys to mo%e from one column to the ne9t" Jou can
also use the left or right mouse uttons to select a field"
4he ?ariale .ael and ?alue .ael fields will display a larger window when you
enter those fields" !f either of these windows is showing0 you can minimiBe it y
clic,ing on it with the right mouse utton0 or clic,ing on another field"
1* /eywords StatPac For Windows User's Manual

Code"oo# .i"raries
4here are many features to ma,e the codeoo, design easier" :ne of these is the
aility to load %ariales from other codeoo,s" !n other words0 you can estalish a
OliraryO of commonly used ;uestions" 4he lirary can e a codeoo, that you
designed especially for this purpose0 or it can e a codeoo, that you used for a
pre%ious study"
4o load a %ariale or %ariales from a lirary0 select 8ile0 :pen .irary"
#fter loading the lirary0 you can choose one or more %ariales to copy to the new
codeoo," 4o select multiple %ariales0 hold down the control ,ey while you clic, on
the indi%idual %ariales in the lirary" #fter selecting the %ariales0 clic, on the Copy
4o Frid &utton in the top left corner of the lirary window"
StatPac For Windows User's Manual /eywords 1-
$ulicatin% 8aria"les
1any times0 consecuti%e %ariales in the codeoo, are similar" While wor,ing with
the Frid0 you can copy the information from the pre%ious %ariale to the current
%ariale" While entering a new %ariale0 clic, on the @uplicate &utton to repeat all
the information from the pre%ious %ariale" StatPac will automatically change the
%ariale name since two %ariales cannot share the same name" StatPac will not
duplicate any fields that are not lan, in the current %ariale"
4he @uplicate &utton is especially useful when creating a series of %ariales that
share the same %alue laels or a series of multiple response %ariales" 8or e9ample0 if
you are entering a series of %ariales that all use the same %alue laels0 you could
enter the %ariale format0 name0 lael0 and then clic, the @uplicate utton to repeat
the %alue laels from the pre%ious %ariale" When entering multiple response
%ariales0 you could use the @uplicate &utton to repeat the entire %ariale"
4he lirary feature can also e used to duplicate %ariales in the current codeoo,"
>nli,e the @uplicate &utton 6which duplicates only the pre%ious %ariale70 the
lirary can e used to duplicate %ariale6s7 that appear anywhere in the codeoo,"
8irst sa%e the codeoo, y clic,ing on the Sa%e utton or selecting 8ile0 Sa%e
Codeoo," 4hen clic, on the row where you want the new %ariales to e inserted"
Select 8ile0 :pen .irary and select the current codeoo, as the lirary" 8inally
select the %ariales you want to duplicate0 and clic, the Copy 4o Frid &utton"
Insert 6 $elete 8aria"les
'ormally0 while you are designing a study0 %ariales are added one after another to
the end of the e9isting %ariales" <owe%er0 you can also insert a new %ariale in the
middle of the codeoo,"
Clic, on the Frid row you want to e immediately elow the new %ariale" 4hen
clic, the !nsert &utton to open up a lan, new row in the Frid"
4o delete a %ariale0 first clic, on the Frid row you want to delete" 4hen clic, the
@elete &utton"
Mo,e 8aria"les
4he order of the %ariales can e changed using the >p and @own #rrow &uttons"
8irst0 clic, on the %ariale you want to mo%e" 4hen clic, the >p or @own #rrow
&uttons to mo%e the %ariale"
Startin% Colu(ns
Starting columns refer to the eginning location of the %ariales in the data record"
@uring data entry0 each %ariale that is entered will e stored in the data record
eginning at a certain location" 4he starting columns are these locations"
Starting columns are automatically determined0 and you do not need to e concerned
aout them" 4hat is0 starting columns are assigned y the program while entering
new %ariales into the Frid" 4hey are assigned so the data record will store %ariales
in consecuti%e 6contiguous7 columns" 4hus0 the starting columns are eing
automatically handled y the program and not displayed as part of the Frid" !f
necessary0 they will e adHusted whene%er the codeoo, is sa%ed" 4hey can e
displayed y selecting :ptions0 Show Start Columns"
1; /eywords StatPac For Windows User's Manual
Print a Code"oo#
4o print a codeoo,0 select 8ile0 Print0 Codeoo," 4he Print @ialog window will gi%e
you the opportunity to choose %arious printing options" Printing a codeoo, is
especially important if you gi%e your data file to someone else0 since the codeoo,
will tell them e9actly how the data is formatted"
4he ?ariale Selection lets you select which %ariales from the codeoo, will e
printed" 4he list of %ariales to print can use spaces or commas to separate %ariales0
and dashes to indicate a range of %ariales"
# codeoo, printout will always include the %ariale numers0 names0 and formats
for the %ariales" 4he OWhat 4o PrintO items let you select what additional
information from the codeoo, will e printed"
?ariale .aels - When this parameter is set0 %ariale laels will e printed"
?alue .aels - When this parameter is set0 %alue laels will e printed"
?alid Codes - When this parameter is set0 %alid codes will e printed" 4his
specifically refers to %alid codes that are not part of a 8Code948:abel9"
S,ip Codes- When this parameter is set0 s,ip patterns will e printed as part of the
%alue laels"
Sell Chec# a Code"oo#
4o chec, the spelling in a codeoo,0 select @esign0 Spell Chec," 4he spelling
chec,er dialog o9 will e shown"
StatPac For Windows User's Manual /eywords 1'
4he default dictionary for the spelling chec, is #merican Anglish" 4he software also
includes spelling dictionaries for &ritish Anglish0 8rench0 Spanish0 and Ferman" 4o
change the dictionary that StatPac uses0 you must edit the StatPac"ini file" 8ind the
line that says GictionaryName 4 Hnglis" Change the word OHnglisO to O7ritisO0
O@rencO0 OSpanisO0 or OIermanO"
8aria"le $etail Window
4o show the ?ariale @etail window0 select ?iew0 ?ariale @etail" !f the ?ariale .ist
window is showing0 you can also doule clic, on a %ariale to e%o,e the ?ariale
@etail window" 4he %ariale window gi%es you the aility to add or modify nearly all
the information in the codeoo," While the layout is different0 it gi%es you the same
functionality as the Frid"
4he ?ariale @etail window can e mo%ed around the screen y pressing the mouse
utton on any gray area of the window and dragging the window to a new location"
When you change any of the fields in the ?ariale @etail window0 the change is
instantly reflected in the codeoo," See Alements of a ?ariale for a complete
description of each field"
)> /eywords StatPac For Windows User's Manual
Code"oo# Creation Process
4he asic steps in%ol%ed in designing a codeoo, depend upon whether or not you
ha%e a sur%ey typed with a word processor"
"ethod 55 !f you do not ha%e a word-processed sur%ey0 you are essentially Ostarting
from scratchO and it will e necessary to manually enter the laeling for the
codeoo," :nce completed0 StatPac can automatically create a form for data entry
and that can e loaded into your word-processor0 an !nternet sur%ey0 or an e-mail
sur%ey"
"ethod 65 !f you already ha%e a word-processed sur%ey0 considerale time can e
sa%ed y loading it into the Wor,space window and then copying te9t from it to the
codeoo, laels in the ?ariale @etail window"
Method 1 9 Create a Code"oo# fro( Scratch
4here are three ways to set up a new codeoo,5
1" >se the codeoo, design features that are uilt into the program" 4he Frid and
?ariale @etail tools let you create and edit %ariales0 as well as eing ale to e9tract
%ariales from other studies or libraries o! &uestions" # lirary of ;uestions is simply
a codeoo, with commonly as,ed ;uestions" $ather than retyping a ;uestion with
each new sur%ey0 you can e9tract it from a lirary"
2" >se Cuic, Codeoo, Creation 6an #nalysis utility program7 to enter a format
statement that descries the %ariales and their format" 4his is the fastest way to
create a new codeoo," <owe%er0 the codeoo, it creates will not ha%e any %ariale
names0 laels or %alue laels 6although these can easily e added later7"
3" !f you import data from another format0 a codeoo, will e created" @epending on
the import format0 the codeoo, may or may not ha%e %ariale names"
StatPac For Windows User's Manual /eywords )1
Method & A Create a Code"oo# fro( a Word9
Processed $ocu(ent
Sa%e the sur%ey with your word processor in "rtf 6$ich 4e9t 8ormat7" !n StatPac0
select 8ile0 :pen0 $ich 4e9t 8ile0 and load the word-processed document into the
wor,space"
#cti%ate the ?ariale @etail window y selecting ?iew0 ?ariale @etail0 or y doule
clic,ing on Q['ew\R in the ?ariale .ist window" 4hen create the codeoo, one
%ariale at a time y specifying a format for the %ariale0 and copying selected te9t
from the form to the ?ariale @etail window"
When creating a new %ariale0 first type its format into the ?ariale 8ormat field"
4hen copy te9t from the wor,space to the ?ariale @etail window to fill in the rest of
the %ariale information"
4o copy te9t0 first highlight the te9t on the form" !t will automatically e copied to
the clipoard when you highlight it" 4hat is0 it is not necessary to select Adit0 Copy0
or press [Ctrl C\" 'e9t0 clic, on one of the fields in the ?ariale @etail window" 4he
te9t will e copied to the ?ariale @etail window" Jou can copy te9t from the form to
the ?ariale 'ame0 ?ariale .ael0 or ?alue .aels fields" @epending on the te9t0
you may need to edit it in the ?ariale @etail window" 4his feature may e turned off
y selecting 8ormat0 and then unchec,ing Semi-#utomatic CopyMPaste"
Multile Resonse 8aria"les
!f an item on a ;uestionnaire allows for more than one response0 it is called a
multiple response item" 8or instance0 in the following ;uestion we would need to
allow for fi%e possile responses5
)ic o! te !ollowing brands o! tootpaste ave you used in te last year( -Ceck
all brands youJve used1
KKKKK Ileem
KKKKK Colgate
KKKKK %epsodent
KKKKK Crest
KKKKK Oter
Aach of the fi%e choices is %iewed as a uni;ue %ariale" 4hat is0 fi%e %ariales would
e re;uired to accommodate all possile responses"
When designing a study in the Frid0 using the @uplicate utton will properly create
all multiple response %ariales"
Fenerally0 the following con%entions are oser%ed when creating multiple response
%ariales"
1" 4he format for all multiple response %ariales must e the same"
2" 4he same 6identical7 %ariale lael should e gi%en to each of the multiple
response %ariales"
3" !f you will e creating a We sur%ey from the codeoo,0 the numer of %ariales
must e the same as the numer of %alue laels" Since there are fi%e choices 6%alue
laels70 there must e fi%e identical %ariales"
4he fi%e %ariales for our e9ample would contain the following information5
)& /eywords StatPac For Windows User's Manual
?1 8ormat5 '1
?1 'ame5 4oothpaste
?1 .ael5 Which of the following rands of toothpaste
ha%e you used in the last yearY
?1 ?alue .aels5 1^Fleem
2^Colgate
3^Pepsodent
3^Crest
2^:ther
W-
4he second0 third0 fourth and fifth %ariales would e identical to the first %ariale0
e9cept the %ariale names would e5 4oothpasteX20 4oothpasteX30 4oothpasteX30 and
4oothpasteX2"
'ote the ao%e e9ample uses %alue laels and a s,ip code" 4he s,ip code says to s,ip
to %ariale si9 if nothing is entered for a %ariale"
4he 1issing :E parameter should e set to OJesO for all fi%e %ariales"
'ote that during data entry0 any toothpaste code can e entered for any %ariale"
4hat is0 if a person had only chec,ed Crest0 a O3O would e typed for the first
%ariale" 8or the second %ariale0 the data entry person would Hust press 8enter9
and this would cause the program to s,ip to %ariale si9 6the continuation of the
;uestionnaire7"
Sometimes sur%eys as, ;uestions that limit the numer of responses" 8or e9ample0
the following ;uestionnaire item limits the respondent to two choices0 e%en though
there are fi%e items listed" 'ote that the following method of limiting the numer of
choices may not e used for We sur%eys"
@rom te !ollowing listB coose te two items most important to you. -,wo only
please1
KKKKK @riendsip
KKKKK :ove
KKKKK @inancial security
KKKKK @reedom
KKKKK Spirituality
!n this e9ample0 we controlled the numer of responses y the way we as,ed the
;uestion" 4wo %ariales need to e created to hold the responses to this item 6one for
each chec,7"
4he study design would contain two %ariales for these multiple response %ariales5
?1 8ormat5 '1
?1 'ame5 !mportant
?1 .ael5 8rom the following list0 chose the two items
most important to you"
?1 ?alue .aels5 1^8riendship
2^.o%e
3^8inancial security
3^8reedom
StatPac For Windows User's Manual /eywords )1
2^Spirtuality
W3
?2 8ormat5 '1
?2 'ame5 !mportantX2
?2 .ael5 8rom the following list0 chose the two items
most important to you"
?2 ?alue .aels5 1^8riendship
2^.o%e
3^8inancial security
3^8reedom
2^Spirituality
&oth items ha%e the same format and %ariale lael" ?ariale and %alue laels are
only assigned to the first %ariale" 4he second %ariale will accept %alid codes 1-2"
'otice that the first %ariale also contains a s,ip pattern that says Hump to %ariale
three if nothing is specified for the first %ariale"
4he two %ariales !1P:$4#'4 and !1P:$4#'4X2 are not weighted" 4hat is0
they could e swapped without affecting the results of any analysis 6one is not more
important than the other7" Codes were assigned to each of the possile responses"
!f the ao%e ;uestion was as,ed in the following way0 the %ariales would e
weightedW that is0 one %ariale is more important than the other5
@rom te !ollowing listB write a 1 next to te item tat is most important to you and a
0 next to te item tat is second most important to you"
KKKKK @riendsip
KKKKK :ove
KKKKK @inancial security
KKKKK @reedom
KKKKK Spirituality
'otice that this is no longer a true multiple response ;uestionW it is really as,ing two
different ;uestions 6which is first and which is second7" >nli,e the pre%ious
e9amples0 oth responses are not weighted e;ually" Whene%er a ;uestion as,s the
respondent to ran, a list of items in some sort of prioritiBed order0 it is not multiple
response" !nstead0 it is essentially a series of separate 6ut related7 %ariales" 4wo
%ariales would e created for this ;uestion0 each ha%ing its own %ariale name0
lael and %alue laels5
?1 8ormat5 '1
?1 'ame5 1ostX!mportant
?1 .ael5 8rom the following list0 what item
is the most important to you"
?1 ?alue .aels5 1^8riendship
2^.o%e
3^8inancial security
3^8reedom
2^Spirituality
)) /eywords StatPac For Windows User's Manual
?2 8ormat5 '1
?2 'ame5 SecondX1ostX!mpt
?2 .ael5 8rom the following list0 what item
is the second most important to you"
?2 ?alue .aels5 1^8riendship
2^.o%e
3^8inancial security
3^8reedom
2^Spirituality
While oth %ariales in this e9ample share the same %alue laels0 they are still
considered to e separate %ariales" 4he criteria to determine whether or not a
;uestion is multiple response is the issue of priority" !f all responses are weighted
e;ually0 the ;uestion is appropriate for multiple response" !f the ;uestion in%ol%es
any sort of ran,ing of the items0 it is est %iewed as a series of indi%idual %ariales"
When StatPac copies %ariales from the codeoo, to the data entry form0 %ariales
with the same %ariale lael are interpreted as multiple response %ariales0 and they
will e automatically grouped together on the data entry template and in the <41.
created for We sur%eys"
Missin% $ata
1issing data may e handled in one of two ways" $egardless of the method used0 it
is easy to change missing data using the #nalysis program"
!n most cases0 no special pro%isions need to e made regarding what to do with
missing data" !f any %ariale in the data file is left lan,0 it will e treated as a
missing %alue and will e e9cluded from the analysis" 4he analysis will print the
numer of missing cases0 ut will not include these when performing any statistical
test"
4he other method of handling missing cases is to enter an additional %alue lael"
64; years or less
74< to = years
C415 to 10 years
G4Over 10 years
4?issing Cases
'ote that the code 6on the left of the e;uals sign7 is a space" #ll missing data in
StatPac is stored as spaces 6or lan,s7 during data entry"
When a %ariale is numeric0 it is not appropriate to specify a %alue lael of
8space9^?alue .ael" Since a space is not a %alid numeric code0 it cannot e
included in a numeric calculation" 4herefore0 missing data will automatically e
e9cluded from most analyses of inter%al or ratio numeric data" !t is possile0
howe%er0 to recode missing data to a %alid numeric %alue 6such as Bero70 so that it
will e included in the analyses" #lso0 se%eral multi%ariate procedures include an
option to use mean sustitution for missing data"
!t is important to understand the conse;uences of recoding numeric missing data to
something else" Lero and missing are not the same" #nalytical techni;ues in%ol%ing
computations on a %ariale treat Bero differently than missing data" 1issing data is
StatPac For Windows User's Manual /eywords )!
e9cluded from all numerical calculations0 whereas Beros are treated Hust li,e any
other numeric %alue"
Chan%in% Infor(ation in a Code"oo#
When initially designing a codeoo, and form0 you can change any information for
any %ariale" Jou can also insert new %ariales and delete e9isting %ariales" 4his
will continue to e true up to the time that data is entered into a data file" #fter that0
StatPac will issue a warning when you load a codeoo, that has an associated data
file" StatPac gi%es this warning ecause these operations 6i"e"0 adding new %ariales
and deleting e9isting %ariales7 would ma,e the e9isting data file no longer match
the codeoo," Jou can0 howe%er0 change any other study design information at any
time"
!f you recei%e the warning message0 StatPac will let you acti%ate a safety feature that
pre%ents inad%ertent additions or deletions of %ariales y disaling the !nsert and
@elete &uttons"
!f you choose not to utiliBe the safety feature0 e careful not to inad%ertently add0
delete0 or change the order of any %ariales since this would ma,e the e9isting data
file incompatile with the modified codeoo," <owe%er0 you may still ma,e changes
to any other codeoo, information including a %arialeDs format"
!f you change the format of a %ariale0 the associated data file adHusted accordingly"
8or e9ample0 if you change a %ariale format from #20 to #1000 all the e9isting data
records would e 20 characters too short" <owe%er0 when you sa%e the re%ised
codeoo,0 each data record will e padded with spaces so it matches the new
codeoo, information" 'ote that this feature normally only changes one data file 6the
one with the same name as the codeoo,7" #d%anced users may wish to change
multiple data files that all use the same codeoo," 4o enale changing multiple data
files0 edit StatPac"ini and set 6llow?ultipleGata@iles 4 1"
#d%anced users may wish to turn on or turn off the safety feature so the prompt is
not displayed" 4he CodebookSa!ety parameter can e edited in the StatPac"ini file to
control this feature" Set CodebookSa!ety 4 1 to always enale the safety feature0
CodebookSa!ety 4 0 to always disale the safety feature0 and CodebookSa!ety 4 5
6the default7 to as, you each time that a codeoo, is loaded"
'ote that the ao%e information applies only when you load a codeoo, for which
there is an associated data file"
)* /eywords StatPac For Windows User's Manual
4his is important ecause entering a few records of dummy data is often the est way
to disco%er errors in the study design" Jou would egin a typical proHect y
designing the %ariales and creating a form" 4hen you could enter a few records into
the data file as a test"
Antering a few dummy records is one of the est ways to test your codeoo," Jou
might disco%er a %ariale on the ;uestionnaire that was inad%ertently omitted from
the study0 an alpha field thatDs not wide enough to hold a response0 or some other
maHor change to the study design" !f you donDt need the data file 6i"e"0 itDs Hust dummy
test data70 you can simply delete the data file" 4o delete a data file0 select 8ile0 :pen0
@ata 8ile" $ight clic, on the data file you wish to delete and select @elete"
!f you ha%e already entered a sustantial numer of real data records0 and then
disco%er you need to add a new %ariale0 you cannot simply add the %ariale to the
codeoo," @oing so would ma,e the format of the codeoo, different than the data
file" !nstead0 new %ariales should e created in an analysis0 where oth the
codeoo, and the data file will e updated to include the new %ariale" See the .A4
command"
StatPac For Windows User's Manual /eywords )-
$ata Mana%er For(
3,er,iew
4he form is a simply a template that can e used to enter and edit data" !t can e
created automatically y StatPac0 or you can create it manually 6with StatPac or your
word processor7" 4o create an automatic data manager form0 first load the codeoo,
and then select @esign0 @ata 1anager 8orm0
4here are two components to the form" :ne is the te9t itself" 4he te9t is simply the
;uestions on the sur%ey" 4he te9t can e typed directly into the 8orm window or
loaded from an e9isting word-processed document" 4he other component is the data
input !ields" 4he data input fields define where the answers will e typed on the
form" 4he form is a comination of te9t and data input fields"
$ata Inut Fields
@ata input fields will e shown on the form in another color 6ma,ing them easy to
identify7" 4hey will appear as a %ariale numer enclosed in rac,ets" 8or e9ample0
%ariale twel%e might loo, li,e this U12V" Fenerally0 the form will ha%e one data
input field for each %ariale in the codeoo,"
@ata input fields can e inserted or deleted from the form during the study design
process"
4o insert a data input field on the form0 first select the desired %ariale from the
?ariale .ist or ?ariale @etail window" 4hen hold the #lt ,ey and clic, the left
mouse utton where you want the field to e located on the form" 4he current
%ariale will e incremented each time you insert a data input field"
4o delete a data input field from the form0 highlight it on the form and clic, on the
Cut &utton0 or select Adit0 Cut 6or use the Ctrl * shortcut7" Jou can highlight
multiple data input fields delete them all at once"
@ata input fields will e automatically placed on the form when you copy %ariales
from the codeoo, to the form"
For( 7a(in% Con,entions
!n most cases0 the codeoo,0 form0 and data file will share the same name" #
codeoo, called $ASA#$C< would ha%e an associated form called $ASA#$C<0
and you would proaly enter the data into a data file called $ASA#$C<" Jou will
use this simple naming scheme for nearly all studies"
<owe%er0 there are situations where you may want to use different names for the
codeoo,0 form0 and data file" 4he form is simply a template for displaying the data"
# form can e used to display all the %ariales0 or Hust some of them" Jou can ha%e
se%eral different forms for a gi%en codeoo," Aach form would ha%e its own name0
and each could show 6or not show7 any of the %ariales" 4hus0 different forms could
e used to gi%e different O%iewsO of the same data
For( Creation Process
4here are two asic ways to create a form" :ne is to use the codeoo, to
automatically create the form0 and the other is to use te9t from a word-processed file
as the foundation for the form" !n nearly all cases0 you will use the codeoo, to
create the form and then you can modify it as necessary"
Usin% the Code"oo# to Create a For(
4he form is created after the codeoo, has een completed"
#utomatic form creation in%ol%es copying %ariales from the codeoo, to the form0
and formatting them according to your specifications" 4o create an automatic form0
first load the codeoo," 4hen copy all the %ariales from the codeoo, to the form
y selecting @esign0 Copy ?ariale6s7 4o 8orm" 4he ?ariale 4e9t 8ormatting
controls how the %ariales will e formatted on the form"
!f you want to delete some or all of the %ariales from the form0 highlight the te9t
you want to delete and clic, the Cut &utton 6or choose Adit0 @elete7 to delete the
%ariales from the form" 4o delete all the %ariales on a form 6for e9ample0 to Hust
start o%er70 choose Adit0 Select #ll0 and then clic, the Cut &utton or choose Adit0
@elete" The codebook is not affected by any chan/es made to the form.
!f you inad%ertently delete an input field or entire %ariale it can e easily re-
inserted" 4o insert only a data input field on the form0 first select the desired %ariale
from the ?ariale .ist or ?ariale @etail window" 4hen hold the #lt ,ey and clic,
!> /eywords StatPac For Windows User's Manual
where you want the field to e located on the form" 4he current %ariale will e
incremented each time you insert a data input field" 4o insert a data input field and
the te9t for the %ariale0 hold the Ctrl ,ey and clic, where you want to insert it on the
form"
4he font name and font siBe that will e used to create the formatted %ariale can e
set y selecting 8ormat0 Set @efault 8onts" 4he @efault 4e9t 8ont will e used to
create the te9t on the form" 4he @ata !nput 8ont will e used during data entry to
enter the data into the fields"
Usin% a Word9Processed $ocu(ent to Create a
For(
!f you already ha%e typed your sur%ey with a word-processor0 you can use it as the
foundation of the form" Jou proaly already used it to e9pedite the creation of the
codeoo,"
8irst0 using your word-processor0 sa%e the sur%ey in $ich 4e9t 8ormat 6"rtf7"
'e9t you need to create a lan, form" .oad the codeoo, and the select @esign0 @ata
1anager 8orm" Clic, Copy Selected ?ariales and type 0 for the ?ariales to Copy"
4hen clic, :E" # lan, form will e created"
:pen the rich te9t file in the Wor,space window" Select Adit0 Select #ll0 Adit Copy
6or type Ctrl #0 Ctrl C7" :pen the lan, for and Select Adit0 Paste 6or type Ctrl ?7"
4he te9t from the rich te9t document will now e part of the @ata 1anager form"
4he final step is to insert the data input fields on the form" 4hese must e added
manually" 4o insert a data input field on the form0 first select the desired %ariale
from the ?ariale .ist or ?ariale @etail window" 4hen hold the #lt ,ey and clic, the
mouse where you want the data input field to e located on the form" 4he current
%ariale will e incremented each time you insert a data input field" Continue until
you ha%e a data input field for all %ariales on the form"
!f you clic, the mouse in the wrong place0 use the Cut &utton to delete the data input
field0 and the Paste &utton to insert it at the correct location" # data input field cannot
e deleted with the @elete or &ac,space ,eys" !t can e deleted with the Cut &utton
or y selecting Adit0 Cut"
StatPac For Windows User's Manual /eywords !1
8aria"le :e2t For(attin%
6utomatic variable creation is an important part of oth manual and automatic form
creation" 4he purpose of automatic %ariale creation is to reduce typing" StatPac will
allow you to selecti%ely transfer information from the codeoo, to the form0 and it
gi%es you the aility to automatically format this information in a %ariety of ways"
4he ?ariale 4e9t 8ormatting @ialog window lets you adHust the parameters that
control the format for this information on the form" Select :ptions0 ?ariale 4e9t
8ormatting to modify the formatting specifications"
Aach component of the ?ariale 4e9t 8ormatting @ialog window can e modified"
Field Place(ent
8ield placement refers to the location for the data input field 6i"e"0 where you want
the cursor located when youDre ready to enter data for the %ariale7" @ata input fields
will e displayed in a different color on the form" 4here are si9 possile field
placements5 left0 far left0 right0 far right0 elow0 and far elow"
Field placement set to Left
U1V 1. 'ow would you rate your expectation !or tis seminar(
Field placement set to Far Left
U1V 1. 'ow would you rate your expectation !or tis seminar(
!& /eywords StatPac For Windows User's Manual
Field placement set to Rigt
1. 'ow would you rate your expectation !or tis seminar( U1V
Field placement set to Far Rigt
1. 'ow would you rate your expectation !or tis seminar( U1V
Field placement set to !elo"#
1. 'ow would you rate your expectation !or tis seminar(
U1V
14 'ig 04?edium 34:ow
Field placement set to Far !elo"#
1. 'ow would you rate your expectation !or tis seminar(
14 'ig 04?edium 34:ow
U1V
8alue .a"els
4he ?alue .aels parameter lets you format the %alue laels in single or multiple
columns"
Value labels set to $ingle Column
64:ow
74?edium
C4'ig
Value labels set to %ultiple Columns
64:ow 74?edium C4'ig
8aria"le Searation
4he ?ariale Separation parameter controls the spacing etween %ariales" !t is
especially useful when copying multiple %ariales from the codeoo, to the form"
4he parameter can e set to lan, line6s70 a page feed0 or a horiBontal line"
!f you want to create a form with one %ariale per page0 you would use a page feed
as the %ariale separator0 and set the ?iew mode to Page ?iew efore sa%ing the
form" @uring data entry0 each %ariale will e displayed on its own page"
8aria"le .a"el Indent
4he %ariale lael indent refers to the numer of inches that the %ariale lael will e
indented from the left margin" 4his is especially useful when the field placement is
set to 8ar .eft
StatPac For Windows User's Manual /eywords !1
&'ample# Variable label indent set to ( inc
U1V 1. 'ow would you rate your expectation !or tis seminar(
&'ample# Variable label indent set to ) inc
U1V 1. 'ow would you rate your expectation !or tis seminar(
8alue .a"els Indent
4he %alue laels indent refers to the numer of inches that the first column of %alue
laels will e indented0 with reference to the position of the %ariale lael" 4he
following e9amples will illustrate the %alue laels indent5
&'ample# Value label indent set to * inces
U1V 1. 'ow would you rate your expectation !or tis seminar(
64:ow
74?edium
C4'ig
&'ample# Value label indent set to ( inc
U1V 1. 'ow would you rate your expectation !or tis seminar(
64:ow
74?edium
C4'ig
Sace "etween Colu(ns
4he space etween columns refers to the numer of inches that will e used to
separate the columns of %alue laels" 4his parameter only applies when the ?alue
.aels parameter is set to multiple columns" 4he actual space re;uired for a column
is determined y the lengths of the %alue laels themsel%es"
&'ample# $pace bet"een columns set to + inc
U1V 1. 'ow would you rate your expectation !or tis seminar(
64:ow 74?edium C4'ig
&'ample# $pace bet"een columns set to ( inc
U1V 1. 'ow would you rate your expectation !or tis seminar(
64:ow 74?edium C4'ig
!) /eywords StatPac For Windows User's Manual
8alid Codes
When the ?alid Codes parameter is set0 the %alid codes will e included with the
%alue laels" 4his specifically refers to those %alid codes that are not part of a
[Code\^[.ael\ line"
&'ample# Valid codes is set
U1V 1. 'ow would you rate your expectation !or tis seminar(
1-A 54GonJt know
S#i Codes
When the S,ip Codes parameter is set0 all s,ip codes will appear as part of the %alue
laels" Fenerally0 s,ip codes would not e shown as part of the data entry form since
the ranching will occur automatically"
8aria"le 7u("ers
When the ?ariale 'umer parameter is set0 the %ariale numer will e included as
part of the %ariale lael" When included0 it will precede the %ariale lael and ha%e
a period terminator" !t is important to note that the %ariale numer might not e the
same as the item numer on the sur%ey" Sur%eys often contain multiple response
items or groups of Qsu-;uestionsO under the same Oitem numerO on the sur%ey"
8aria"le .ist and $etail Windows
4he ?ariale .ist window allows the user to %iew the %ariale names and %ariale
numers while entering data" Clic,ing on a %ariale in the ?ariale .ist window will
ma,e that %ariale the current %ariale" @oule clic,ing on a %ariale in the ?ariale
.ist window will acti%ate the ?ariale @etail window"
4he ?ariale @etail window gi%es complete information on the current %ariale" !t
can e turned on or off y selecting ?iew0 ?ariale @etail" @oule clic,ing on a field
will also acti%ate the ?ariale @etail window"
4he ?ariale @etail window can e dragged around the screen y clic,ing and
holding the left mouse utton on any gray area in the ?ariale @etail window"
StatPac For Windows User's Manual /eywords !!
$ata Inut Settin%s
Jou can set the default data input settings" 4hese can e changed during data entry"
Select :ptions0 @ata !nput Settings to change the settings"
4he #utomatic $ecord #d%ance option controls whether the current record will e
automatically incremented when data entry person reaches the last field in the
current record"
!* /eywords StatPac For Windows User's Manual
!f the #utomatic $ecord #d%ance option is set0 the program will automatically
ad%ance to the ne9t record when the last field of the current record has een entered"
4his way0 the data entry person will e ale to enter a large numer of records
without clic,ing on the 'ew $ecord &utton for each record"
4he @isale S,ips @uring Aditing option controls whether s,ip codes should e
acti%e when editing an e9isting record" When this option is set0 s,ip codes will wor,
when entering a new record and will not wor, when editing an e9isting record"
4he final @ata !nput Settings let you change the colors for the fields" @uring the
Study @esign0 all data input fields will e shown with the OCurrent 8ieldO colors"
@uring data entry0 only the current data input field will use the OCurrent 8ieldO
colors0 and the other fields will e displayed with the O:ther 8ieldO colors"
Select a Secific 8aria"le
4here are three ways to select a specific %ariale5
When the ?ariale .ist Window is displayed0 you can select a %ariale y clic,ing on
it" @oule clic,ing on a %ariale will also display the ?ariale @etail window"
When the ?ariale @etail window is displayed0 you can select a %ariale y selecting
it from the %ariale name field"
!f the form already contains an input field for a %ariale0 you can select the %ariale
y clic,ing on the input field" @oule clic,ing on an input field will also display the
?ariale @etail window"
4he three highlighted areas show the three places you can clic, to select a %ariale"
StatPac For Windows User's Manual /eywords !-
Findin% :e2t in the For(
>se the 8ind @ialog window to search for specific te9t in the form" Select Adit0 8ind
6or use the Ctrl 8 shortcut7 to display the 8ind @ialog window"
4o egin a search0 type the search te9t and clic, on the 8ind 'e9t &utton" #fter a
search has een started and a match has een found0 you can continue the search y
clic,ing on the 8ind 'e9t &utton" >pper and lower case differences will e ignored
in the search"
Relacin% :e2t in the For(
>se the $eplace @ialog window to replace specified te9t in the form" Select Adit0
$eplace 6or use the Ctrl < shortcut7 to display the $eplace @ialog window"
#lternati%ely0 you can clic, the $eplace &utton from the 8ind @ialog window"
>pper and lower case differences will e ignored when finding te9t" <owe%er0
replaced te9t will use the e9act te9t typed into the $eplace With window"
!; /eywords StatPac For Windows User's Manual
Sa,in% the Code"oo# or Wor#sace
Select 8ile0 Sa%e Codeoo, or Sa%e Wor,space to sa%e the codeoo, or Wor,space
window" It is recommended that you save your work at re/ular intervals. Jou
may e9it from a partially completed codeoo, or form and finish them at another
time" Clic, the Sa%e icon 6a picture of a dis,ette7 to sa%e oth the codeoo, and the
Wor,space window"
StatPac For Windows User's Manual /eywords !'
$ata Mana%er
3,er,iew
4he @ata 1anager is used to enter new data0 edit e9isting data0 %erify data using a
doule entry method0 and print data using a form created with the Study @esign
program" #ll of the uttons on the opening screen will e disaled until a data file
has een loaded"
!n order to use the @ata 1anager0 you must ha%e first created a data manager form" !t
is not possile to enter new data or edit e9isting data without a form"
4he form pro%ides the data entry template 6i"e"0 what the data entry person will see
on the screen7" 4he @ata 1anager will attempt to show the current field near the
middle of the screen" 4his means that during data entry0 the cursor will appear to
remain relati%ely stationary near the middle of the screen0 and the form will scroll
after each field is entered"
4here are two ways to run the @ata 1anager" !f the data file already e9ists0 and you
want to add0 edit0 or delete records0 select 8ile0 :pen0 @ata 8ile" !f a data file does yet
e9ist0 you can select @ata0 $un @ata 1anager"
/ey"oard and Mouse Functions
4he following are the asic ,eyoard functions for record and field selections5
Anter #d%ance to the ne9t field using s,ip pattern if present
4a #d%ance to the ne9t field using s,ip pattern if present
Shift 4a 1o%e to the pre%ious field" @oes not follow s,ip
patterns"
@own #rrow #d%ance to the ne9t field using s,ip pattern if present
>p #rrow 1o%e to the pre%ious field" 8ollows s,ip patterns that
were used"
Page >p 1o%e to pre%ious record"
Page @own #d%ance to ne9t record"
Create a 7ew $ata File
4o create a new data file0 first run the @ata 1anager" 4hen select 8ile0 :pen0 and
type a new file name" !n nearly all cases0 the data file name will e the same as the
codeoo, and form names" 4he program will first as, for the name of the form you
want to use as your data entry template" 4hen it will as, for the name of the data file"
4he form will load and you will e ale to egin entering data"
+dit or 0dd :o an +2istin% $ata File
4o edit or add records to an e9isting data file0 first run the @ata 1anager" 4hen select
8ile0 :pen and select the data file" !f there is a form with the same name 6most
situations70 it will e loaded and you will e ale to edit or enter data" !f there is not a
form with the same name0 you will e as,ed to enter the name of the form"
Select a $ifferent $ata File
!t is not necessary to close the current data file efore choosing to edit a different
data file" 4o change data files select 8ile0 :pen and select the data file" 4he current
data file will e closed automatically efore the program opens the new file"
Chan%e Fields
4he current field is the one you are ready to enter data into" !t will e highlighted on
the form using the color scheme de%eloped during the design of the form 6although
the colors can e changed with the @ata 1anager program7"
*& /eywords StatPac For Windows User's Manual
@uring normal data entry0 the current field will change automatically following s,ip
patterns if necessary" 4he user0 howe%er0 is free to manually change to any field at
any time" 4here are many ways to change fields"
Clic,ing the mouse on any field will ma,e it the current field" Clic,ing the mouse on
the Pre%ious 8ield &utton or the 'e9t 8ield &utton will change to the pre%ious or
ne9t field" Jou can also type a field numer into the Current 8ield window and press
enter"
!f the ?ariale .ist window is displayed0 clic,ing on a %ariale will ma,e that
%ariale the current field" !f the ?ariale @etail window is displayed0 selecting a new
%ariale will ma,e it the current field" 4he ?ariale .ist and ?ariale @etail windows
can e displayed y selecting ?iew"
8inally0 the following ,eys can also e used to manually change fields"
Anter #d%ance to the ne9t field using s,ip pattern if present
4a #d%ance to the ne9t field using s,ip pattern if present
Shift 4a 1o%e to the pre%ious field" @oes not follow s,ip patterns
that were used"
@own #rrow #d%ance to the ne9t field using s,ip pattern if present
>p #rrow 1o%e to the pre%ious field" 8ollows s,ip patterns that
were used
"
Chan%e Records
4he #utomatic $ecord #d%ance option controls whether the current record will e
automatically incremented when data entry person reaches the last field in the
current record"
!f the #utomatic $ecord #d%ance option is set0 the program will automatically
ad%ance to the ne9t record when the last field of the current record has een entered"
4his way0 it is possile to enter a large numer of records without clic,ing on the
'ew $ecord &urton for each record" 4o change the #utomatic $ecord #d%ance
option0 select :ptions0 @ata !nput Settings"
4here are se%eral ways to manually change records" Clic,ing on the Pre%ious $ecord
&utton or the 'e9t $ecord &utton will change to the pre%ious or ne9t record" Jou
can also type a record numer into the Current $ecord window and press enter"
8inally0 the following ,eys can also e used to manually change records"
Page >p 1o%e to pre%ious record"
Page @own #d%ance to ne9t record
"
+nter a 7ew $ata Record
4here are two ways to enter a new data record" 4he first is to clic, on the 'ew
$ecord &utton0 and the second is to select Adit0 &egin 'ew $ecord" 4he current
StatPac For Windows User's Manual /eywords *1
record numer window will e updated to show the record numer for the new
record" !f you do not enter any data for the new record0 it will not e sa%ed" !f any
data is entered0 the new record will e added to the end of the data file" !t is not
possile to insert a new record into the middle of and e9isting data file"
8iew $ata for a Secified Record 7u("er
4here are two ways to %iew the data for a record with a ,nown record numer" 4he
first is to type the desired record numer into the current record numer window and
press enter 6or clic, anywhere on the form7" 4he second is to select Adit0 Fo 4o
$ecord 6or use the Control F shortcut7"
When finished0 the selected record will e displayed0 and the focus will remain on
the currently selected field" 4he current record numer window will e updated to
show the record numer for the selected record"
Find Records :hat Contain Secified $ata
StatPac ma,es it easy to find data records that contain specified data" 4o egin a
search0 clic, the 8ind &utton0 or select Adit0 Search @ata 8ile 6or use the Control 8
shortcut7" 4he 8ind dialog window will e displayed"
#fter a search has een started and a match has een found0 you can continue the
search y selecting Adit0 Continue Search 6or use the U83V shortcut ,ey7" 4he 8ind
dialog window does not ha%e to e displayed to continue a pre%ious search0 although
if it is displayed0 you can also clic, on 8ind 'e9t to egin the search" 'ote that the
search often happens so ;uic,ly that it seems instantaneous" 4he user can watch the
current record numer to confirm the record numer that they are %iewing following
a search"
4here are four components in the 8ind dialog window"
*) /eywords StatPac For Windows User's Manual
Field :o Search
Select the %ariale 6i"e"0 field7 you want to search" 4he default will e the current
%ariale"
Search For
4his is the te9t or %alue you want to search for" !f you want to search for missing
data0 lea%e this field lan,"
Search $irection
Select #ll0 8orward0 or &ac,wards"
When the Search @irection is set to #ll0 the search will egin with the record
following the current record 6e"g"0 if record 2 is displayed on the screen0 the search
will start with record -7" !f no match is found y the end of the file0 the search will
continue with record 1 and continue until all records ha%e een e9amined" !f no
match is found0 StatPac will report it0 and the current record will continue to e
displayed" When the Search @irection is set to 8orward or &ac,ward0 the search will
go only to the end or eginning of the file 6respecti%ely7"
Search Method
Select A9act 1atch0 Partial 1atch or Sounde9"
>pper and lower case differences will e ignored for all searches regardless of the
method used" !f you search for I:<' I:'AS0 Iohn Iones will e found"
!f you set the Search 1ethod to an A9act 1atch0 then the data must e9actly match
the search string 6with the e9ception of case differences7" !f you search for Iones0
StatPac will not find a record that contains Iohn Iones in the search field
!f you set the Search 1ethod to a Partial 1atch0 then the search will find records that
contain the search string regardless of other te9t in the field" !f you search for Iones0
StatPac will find records that contain Iohn Iones"
# Sounde9 search is one that uses the sound of the word instead of its e9act spelling"
4his ma,es it possile to find te9t e%en when there are spelling or data entry errors"
!f you set the Search 1ethod to a Sounde9 Search0 then the search will find records
that contain the sound of the search string regardless of other te9t in the field" !f you
search for Ionathan0 StatPac will find records that contain Iohn Ionethon0 8red
Iohnathon0 1ary #nn Ionathon0 etc"
$ulicate a Field fro( the Pre,ious Record
!t is sometimes desirale to e ale to repeat data from the pre%ious record" 8or
e9ample0 assume one of the %ariales in your study is the full city name" @uring data
entry you would type the city name for the first record" When entering data for the
city field in the second 6and suse;uent7 records0 you could duplicate the response
from the pre%ious record" 4he duplicate field function is disaled during doule entry
%erification"
4here are two ways to duplicate the data from the pre%ious record" 4he first is to
clic, on the @>P &utton0 and the second is to select Adit0 @uplicate 8ield 8rom
Pre%ious $ecord 6or use the U82V shortcut ,ey7" 4he duplicate function will copy the
contents of the pre%ious record to the current record for the current field"
StatPac For Windows User's Manual /eywords *!
$elete a Record
@eleting a record is a fairly common procedure ecause duplicate records are often
disco%ered in a data file" 4here are two ways to delete a record" 4he first is to clic,
on the @A. &utton and the second is to select Adit0 @elete Current $ecord"
StatPac will not actually delete the record at this time" !nstead0 the contents of all
%ariales in the record are set to lan,s 6missing7" !n this way0 the record is mar,ed
for deletion rather than actually eing deleted" 4he rationale eing that deleting a
record would cause all suse;uent records to mo%e down in the data file0 in effect
changing their record numers" Since editing is often done y record numer0 it is
important that the record numers do not change during an editing session"
$ecords mar,ed for deletion cannot automatically e undeleted" When you mar, a
record for deletion0 it is actually stored as lan,s in the data file0 so there is no way
to reco%er the information" Jou can0 howe%er0 re-enter the data for that record" !f
you enter any data in a record mar,ed for deletion0 it will not e deleted since it now
contains data"
When you e9it the @ata 1anager0 you will ha%e the opportunity to compact the file
6i"e"0 eliminate the deleted records7" 4his will change the record numers for future
editing sessions" !f you want to preser%e the record numers for the ne9t editing
session0 donDt compact the file"
Jou can also manually compact the data file at any time y selecting :ptions0
Compact @ata 8ile" Jou will e as,ed to confirm your selection ecause the
procedure will change the record numers" 4he delete record function is disaled
during doule entry %erification"
!f you ha%e deleted records0 it is important to compact the data file efore performing
any statistical analysis" :therwise0 the deleted records would e counted as missing
data in the analysis"
$ata Inut Settin%s
1ost data entry control parameters are specified in the Study @esign program"
<owe%er0 a few parameters can e altered y the data entry person" Select :ptions0
@ata !nput Settings to change the settings"
** /eywords StatPac For Windows User's Manual
4he #utomatic $ecord #d%ance option controls whether the current record will e
automatically incremented when data entry person reaches the last field in the
current record"
!f the #utomatic $ecord #d%ance option is set0 the program will automatically
ad%ance to the ne9t record when the last field of the current record has een entered"
4his way0 it is possile to enter a large numer of records without clic,ing on the
'ew $ecord &urton for each record"
4he @isale S,ips @uring Aditing option controls whether s,ip codes should e
acti%e when you are editing an e9isting record" When this option is set0 s,ip codes
will wor, when you are entering a new record and will not wor, when editing an
e9isting record" !f you are entering a new data record0 and temporarily return to a
pre%ious record0 and then ac, to the new record you were wor,ing on0 then you will
no longer e entering a QnewR data record" !n other words0 a record ecomes
permanent as soon as you change records 6e%en if only some of the information was
entered for that record7" S,ip codes will e disaled when you return to the QnewR
record that you were entering unless the @isale S,ips @uring Aditing is unchec,ed"
4he final @ata !nput Settings let you change the colors for the fields"
Co(act $ata File
When you delete a record with the @ata 1anager0 StatPac ma,es it a lan, record
without actually deleting the physical record from the data file" !f you ha%e deleted
records0 it is important to compact the file y deleting the lan, records" :therwise0
the deleted records would e counted as missing data in the analysis" 4o compress a
file0 select :ptions0 Compact @ata 8ile" See @eleting # $ecord" 4he compact data
file function is disaled during doule entry %erification"
StatPac For Windows User's Manual /eywords *-
$ou"le +ntry 8erification
StatPac performs %alidity and range chec,ing on all data entered" <owe%er0 some
people prefer to use a @oule Antry ?erification method to further reduce data entry
error" >sing this method0 all the data is first entered into a data file" 4hen the data is
entered again and compared against the first data during the second data entry
process" @iscrepancies are rought to the attention of the data entry person and they
are resol%ed in real time during data entry"
4o egin @oule Antry ?erification open the data file to e %erified and select
:ptions0 @oule Antry ?erification" #ll the e9isting data will e OhiddenO from the
user0 and it will appear that you are ready to egin entering data eginning with the
first record" #s each field is entered it is compared with the e9isting data" S,ip
patterns will e followed as if this were the same as entering a new data record"
@iscrepancies will e highlighted and you will e ale to specify whether to use the
new data or original data" :nce a field has een %erified0 its data will no longer e
hidden"
:%iously0 @oule Antry ?erification wor,s only if sur%eys are entered in e9actly the
same order as the original data entry" When operating in the @oule Antry
?erification mode0 each time a new record is displayed0 the field data will appear
lan, e%en if that record was already %erified" 4hus0 if the data entry person stops
midway through the %erification process0 it is important they note the record numer
they were wor,ing on when they stopped0 so they can egin at that record when they
return"
Print a $ata Record
4o print a data record select 8ile0 Print" 4he current record will e printed using the
form as a template"
8aria"le .ist 6 $etail Windows
4he ?ariale .ist window allows the user to %iew the %ariale names and %ariale
numers while entering data" Clic,ing on a %ariale in the ?ariale .ist window will
ma,e that %ariale the current %ariale" @oule clic,ing on a %ariale in the ?ariale
.ist window will acti%ate the ?ariale @etail window"
4he ?ariale @etail window gi%es complete information on the current %ariale" !t
can e turned on or off y selecting ?iew0 ?ariale @etail" @oule clic,ing on a field
will also acti%ate the ?ariale @etail window"
4he ?ariale @etail window can e dragged around the screen y clic,ing and
holding the left mouse utton on any gray area in the ?ariale @etail window"
$ata File For(at
StatPac stores its data files in se;uential #SC!! fi9ed format with a carriage return
and line feed at the end of each record" 4his is sometimes referred to as a flat #SC!!
file" 4he data file also contains an end of file mar, -Ctrl L or 6SC** 0;1 at the end of
the file" 4his is the most uni%ersally accepted data file format0 and many data ase
managers refer to it as S@8 format
*; /eywords StatPac For Windows User's Manual
When using data created y another program0 you can determine if it is an #SC!! file
y loading into a te9t editor" !f the data does not appear as garage0 itDs proaly
#SC!!" !f all records appear to contain the same numer of characters0 itDs proaly
fi9ed format" @ata in any other format must e imported into StatPac"
# OrecordO or OcaseO in StatPac is defined as a string of characters terminated with a
carriage return and line feed" 8i9ed format means that all records are e9actly the
same length 6i"e"0 they contain the same numer of characters7 as all other records"
4wo different fi9ed format data files are shown as follows5
Single %ariale file 1ultiple %ariale file
$ecord 1 13 13#31(31)2
$ecord 2 29 29C201(0-1
$ecord 3 0- 0-&9012103
and so on """"
'otice that a data file is Hust a series of numers 6or letters7" #ll the records are
always the same length" !n this e9ample0 the single %ariale file uses two columns
per record and the multiple %ariale file uses ten columns per record 6with an
un,nown numer of %ariales7" 4he end of each data record contains an in%isile
carriage return and line feed0 so each record actually contains two more characters
per record 6one for the carriage return and one for the line feed7"
!f you already ha%e a data file stored in se;uential #SC!! format0 you can use it with
StatPac y gi%ing it a "dat e9tension" Jou only need to set up a codeoo, to match
the format of the data file" 'o other changes are necessary"
1ost data downloaded from a mainframe0 read-in from a scanner0 or recei%ed from a
data entry company will e in se;uential #SC!! format" 4o use this data with
StatPac0 perform the following three steps5
1" Set up a study design with StatPac that e9actly matches the format of the data file"
4he format of the study design must e9actly match the format of the data you will e
using" !f the data file contains unused columns0 dummy %ariales should e created
in StatPac to Opass-o%erO the lan, portions of the data record"
2" Copy the data file to your wor, sudirectory" 4hen rename it to the same name as
the codeoo, e9cept with a "dat e9tension"
!f you need to use a data file that is not stored in se;uential #SC!! format0 you must
import it into StatPac" 4he #nalysis program has a utility to import most foreign data
files into StatPacDs format" 4his ma,es it easy to e9change data with other software
pac,ages0 including most data ase managers and spreadsheets"
StatPac For Windows User's Manual /eywords *'
+(ail Sur,eys
3,er,iew
When most people refer to an email survey0 they mean an email in%itation with a
emedded lin, to an !nternet sur%ey" !f this is what you want0 then refer to the
!nternet sur%ey section and Amail .ist 1anagement sections of this manual"
4his chapter is for users who want to send emails0 where the email itself is the
sur%ey"
#n email sur%ey is one where the ody of the email contains the sur%ey itself" 4his is
in contrast to an !nternet sur%ey where you send an email in%itation and the ody of
the email contains a lin, to the !nternet sur%ey"
4he prolem with email sur%eys is that you donDt ,now what ,ind of email reader
your respondents are using" # sur%ey that loo,s fine in one email reader might appear
distorted in another email reader" 4herefore0 we discourage you from sending email
sur%eys"
'e%ertheless0 there are two ,inds of email sur%eys5 <41. and plain te9t"
5:M. +(ail Sur,eys
!n an <41. Amail sur%ey0 the email you send is the sur%ey itself" When the
respondent %iews the email0 they will see the sur%ey"
8ollow the same procedure as you would if creating an !nternet sur%ey0 including
uploading the sur%ey to the !nternet" 4hen0 instead of sending the respondents a lin,
to the sur%ey0 you send them the first page of the sur%ey 6i"e"0 the X1"htm file7"
When they open the email0 they will see the first page of the sur%ey0 and when they
clic, the Sumit utton0 the responses will e stored on the ser%er and the second
page or than, you page will e displayed" @ata is retrie%ed from the ser%er as if it
were an !nternet sur%ey"
Conceptually0 <41. email sur%eys are wonderful" <owe%er0 in reality0 <41. email
sur%eys can cause se%eral prolems" Some people ha%e their email readers set to not
display <41." :ther people ha%e their email readers set to disallow e9ecutales
which means they delete the Ia%aScript in the <41. that StatPac relies on" 4his will
cause them to see a Ia%aScript error when they %iew the email" #dditionally0 you
cannot use coo,ies or !@ numers to trac, who responded and who didnDt"
8or these reasons0 we discourage you from sending <41. email sur%eys" !f you
choose to send them anyhow0 please do so ,nowing that some respondents are li,ely
to ha%e prolems"
Plain :e2t +(ail Sur,eys
# plain-te9t Amail is one where you create a sur%ey using #SC!! te9t and include it
as part of the ody te9t in a regular Amail" 4he sur%ey is emailed to a potential
respondent" 4hey clic, their $eply utton0 complete the sur%ey0 and then clic, the
Send utton to return the completed sur%ey to you" >pon receipt of their reply0 you
can immediately import it into a StatPac data file0 or filter it to a mailo9 6i"e"0 file7
with other returned Amails and import all the responses at once" !mporting returned
Amails appends the respondentNs answers to the end of a StatPac data file"
4here are two ,inds of %ariales that can e included in a plain-te9t Amail" :ne is
where the respondent uses an * to chec, the appropriate response6s7" 4he other is
where the respondent fills in a te9t or numerical response" 4he following simple
sur%ey shows oth ,inds of %ariales" 4he first fi%e sur%ey items are O* the o9O and
the last fi%e items are Ofill in the lan,O5
4: P#$4!C!P#4A0 P.A#SA C.!CE 4<A $AP.J &>44:'"
4ype an * etween the rac,ets to indicate your selection"
1" Fender U V 1ale U V 8emale
2" Athnicity5
U V &lac,
U V White
U V :ther
3" What is your fa%orite randY
U V &rand * U V &rand J
U V &rand L U V >ndecided
3" :%erall0 how would you rate our productY
64ype an * etween the rac,ets to indicate your response"7
A9cellent Poor
U V U V U V U V U V U V U V
1 2 3 3 2 - )
2" Where did you hear aout the productY
64ype an * etween all rac,ets that apply"7
U V $adio
U V 4?
U V 'ewspaper
-& /eywords StatPac For Windows User's Manual
-" :%erall0 how would you rate our productY
A9cellent Poor
1 2 3 3 2 - )
4ype the numer of your rating here" U V
)" <ow old are youY U V
64ype your age etween the rac,ets7
(" What do you feel would e a fair price for this productY
U V 4ype the dollar amount etween the rac,ets""
9" What is your fa%orite randY
64ype the name of your fa%orite rand etween the rac,ets7"
U V
10" What could we do to ma,e our product etterY
64ype your answer etween the rac,ets7"
U
V
C.!CE 4<A SA'@ &>44:' 4: 8!'!S< 4<!S S>$?AJ"
4<#'E J:> 8:$ J:>$ P#$4!C!P#4!:'"
Brac#ets
'otice that the rac,ets are used to show respondents where to type their answers"
4he te9t of the Amail is completely free-form0 e9cept that rac,ets may only e used
to specify where respondents are supposed to type their answer" Jou may not use
rac,ets anywhere else in the Amail"
Ite( 7u("erin%
4he numering of the sur%ey items is optional" 4he purpose of these numers is to
guide the respondent from one ;uestion to the ne9t" 4hey are not necessarily the
same as the %ariale numers in the codeoo," 4hat is0 some sur%ey items might e
multiple response and occupy multiple %ariales in the codeoo," 8or e9ample0
sur%ey item 2 is multiple response and ta,es three codeoo, %ariales" 8rom that
point on0 the item numering on the sur%ey is no longer is the same as the codeoo,
%ariales"
'umering the items on an Amail sur%ey also ser%es an additional purpose" When a
respondent replies to your Amail0 StatPac will e9tract their answers from the Amail
y loo,ing at whatDs etween the rac,ets" !f a respondent inad%ertently deleted one
of the rac,ets0 StatPac might get confused on which %ariale it was e%aluating"
When item numering is not used0 StatPac will report the error and not add any of
that respondentDs answers to the data file" When item numering is used0 StatPac will
StatPac For Windows User's Manual /eywords -1
e ale to identify the start of a new %ariale or series of multiple response %ariales0
and it will lea%e only the defecti%e item lan," StatPac will report the error0 ut the
rest of the data for that respondent will e added to the data file" 4hus0 item
numering allows StatPac to Ore-synchO with the %ariales in the codeoo,0 e%en
when a rac,et has een deleted"
!f you do use item numering on your Amail sur%ey0 the numer may egin with the
letter C 6a common are%iation for ;uestion7" !t must also end in a period followed
y a space0 and it may not contain non-numeric characters" Aach of the following
would e correct usage of item numering"
2" Where did you hear aout the productY
C2" Where did you hear aout the productY
C2" 6a7 Where did you hear aout the productY
4he following would e incorrect usage of item numering" 4he first e9ample does
not ha%e a period following the numer" 4he second e9ample has a space after the C"
4he third e9ample has the letter OaO efore the period and space"
2 Where did you hear aout the productY
C 2" Where did you hear aout the productY
C2a" Where did you hear aout the productY
Code"oo# $esi%n for a Plain :e2t +(ail Sur,ey
4he codeoo, for an Amail sur%ey is the same as any other codeoo," 4he rule is0 if
you want the respondent to use an * to show her response0 the codeoo, must
specify a %alue lael for each response" !f you want the respondent to fill in an
answer0 do not specify any %alue laels for that %ariale"
?ariales can e alpha or numeric" When multiple sets of rac,ets 6o9es7 are
re;uired0 they can e placed horiBontally 6items one and four7 or %ertically 6items
two and fi%e7" !f you specify more than one column of o9es 6item three70 they must
e positioned horiBontally" 4hat is0 the first o9 is associated with %alue lael 1 and
the o9 to the right of it is associated with %alue lael 2" !n the second row0 the first
o9 is associated with %alue lael 30 and the o9 to the right of it is associated with
%alue lael 3"
<ere is the codeoo, for the first fi%e items5
?1" Fender 6#17
1^1ale
8^8emale
?2" Athnicity 6'17
1^&lac,
2^White
3^:ther
?3" What is your fa%orite randY 6'17
1^&rand *
2^&rand J
-) /eywords StatPac For Windows User's Manual
3^&rand L
3^>ndecided
?3" :%erall0 how would you rate our productY 6'17
1^A9cellent
2^
3^
3^
2^
-^
)^Poor
?2" Where did you hear aout the productY 6'17
1^$adio
2^4?
3^'ewspaper
?-" Where did you hear aout the productY 6'17
1^$adio
2^4?
3^'ewspaper
?)" Where did you hear aout the productY 6'17
1^$adio
2^4?
3^'ewspaper
4he last fi%e items on the sample sur%ey are fill-in-the-lan, items" 4he %ariale
formats in the codeoo, specify the ma9imum response length for each of the items"
4he actual distance etween the opening and closing rac,et on the Amail sur%ey can
e any length" !f the respondent OstretchesO the space etween the rac,ets y typing
a longer response0 the data will e recorded properly in the data file pro%ided the
answer does not e9ceed the field length specified in the codeoo," !f the respondentDs
answer does e9ceed the field length0 StatPac will allow you to adHust the codeoo, so
that all fields are sufficient to hold the responses" #lso note that the opening and
closing rac,ets do not need to e on the same line of the Amail" !tem ten in the
e9ample offers the respondent se%eral lines for their answer" <ere is the codeoo, for
the second fi%e items

?(" :%erall0 how would you rate our productY 6'17
?9" <ow old are youY 6'27
?10" What do you feel would e a fair price for this productY 6'-7
?11" What is your fa%orite randY 6#327
?12" What could we do to ma,e our product etterY 6#2007
!f a respondent prefi9es a numeric response with a dollar symol 6as might readily
happen for ?1070 the dollar symol will e eliminated from response when importing
the Amail file"
4he asic te9t for an e-mail sur%ey can e created y selecting @esign0 Amail
Sur%ey" 4his will pro%ide a foundation for the ody of your email" !t is e9pected that
you will edit the te9t as necessary for your specific application and audience"
StatPac For Windows User's Manual /eywords -!
Caturin% a Resondent's +(ail 0ddress
4o capture the respondentsD Amail addresses0 include a %ariale in the codeoo, that
has the name A1#!." Fi%e it a format sufficient to hold all Amail addresses 6e"g"0
#)07 "4he A1#!. %ariale may e placed anywhere in the codeoo," @o not
indicate anything on the Amail sur%ey itself" StatPac will properly capture the
respondentDs Amail address when e%er the A1#!. %ariale name is specified in the
codeoo,"
>nli,e plain-te9t Amail0 CF! Amail cannot automatically capture the respondentDs
email address" 4herefore0 in order to capture the respondentDs Amail address you
must e9plicitly specify it as a field on your we page"
Filterin% +(ail to a Mail"o2
#ll e-mail programs allow you to automatically or manually send a recei%ed e-mail
to a mailo9 or te9t file" #utomatic OfilteringO is often used to sort the incoming
Amail into a series of mailo9es" 4hese mailo9es are simply te9t files containing all
the Amails that ha%e een routed to the mailo9" 4he naming con%ention for the
mailo9es is different for each Amail program" Audora and :utloo, A9press
programs use a "m9 e9tension" 4he first step is to determine the name of the
mailo9" 4hat is0 the name of the file that contains the completed sur%eys 6i"e"0 that"
holds the filtered Amails7" 4his is the file that you will import into StatPac" !f you do
not ha%e an Amail program that has filtering to mailo9es0 you could import the
incoming Amail sur%eyDs into StatPac one at a time from the clipoard0 ut this might
e slow" # etter techni;ue might e to use notepad to copyMpaste all the Amails into
one file that can then e imported into StatPac"
General Considerations for Plain :e2t +(ail
&ecause of the wide di%ersity in e-mail readers0 we suggest that you limit e%ery line
of your e-mail sur%ey to -0 characters" 4his will a%oid unintentional word wrap"
Create your email using a non-proportional font 6e"g"0 Courier7 to ma,e it perfectly
clear as to you how long a -0 character line will e"
We suggest that <41. tags not e used to enhance the appearance of your e-mail"
1any e-mail readers do not recogniBe the control se;uences used y <41. tags0
and these potential respondents will see control codes as part of their e-mail" 1a,e
your e-mail sur%eys generic loo,ing so they will display properly with all e-mail
readers"
&efore actually sending out the sur%eys0 send se%eral copies of the e-mail sur%ey to
yourself" 1a,e sure the sur%eys loo, e9actly the way you want the respondent to see
them" 4hen reply to each of the sur%eys" 'ow chec, your mail to ma,e sure that they
get filtered to the correct mailo9 and chec, the import procedure to ma,e sure that
the data is eing properly imported" Chec,ing the entire import process is crucial for
e-mail and !nternet sur%eys"
-* /eywords StatPac For Windows User's Manual
Internet Sur,eys
3,er,iew
StatPac can create single page or multiple page !nternet sur%eys from a codeoo," !n
order to use the !nternet sur%ey feature you must ha%e a We site that supports CF!"
>sually0 this means you will ha%e access to a cgi-in folder on your ser%er" 'early all
hosting ser%ices support CF!0 so you may need to contact your !SP for more
information" StatPac has a Perl script that you will install in your cgi-in folder" !f
you do not wish to host your own sur%ey0 StatPac can pro%ide a ser%er for you"
:ptionally0 you will ha%e a WJS!WJF <41. editor" StatPac will create
aesthetically pleasing and fully-functional !nternet sur%eys0 ut you may want to
%isually enhance their appearance with graphics or other design features" !n order to
do that0 you must ha%e a What-You-See-Is-What-You-Get <41. editor" 1icrosoft
8ront Page and 1acromedia @reamwea%er are e9amples of WJS!WJF <41.
editors" <owe%er0 any WJS!WJF <41. editor will wor,K e%en recent %ersions
of 1icrososft Word"
#fter StatPac creates the <41. pages0 you may edit them0 ut if you were to
suse;uently regenerate the pages with StatPac0 all edits would e lost" 4herefore0
donNt edit the <41. until you are satisfied with StatPacNs pages" 4est the StatPac
generated <41. pages online efore using an <41. editor to enhance the
appearance of the pages"
1any of the features of !nternet sur%eys will only wor, when the sur%ey is online"
4hings li,e ranching0 coo,ies0 piping0 popup windows0 help windows0 and page
sumissions will not wor, on your local computer" >se your local computer to %iew
and edit the pages0 ut the sur%ey must e on a ser%er to test the functionality of
these features"
Internet Sur,ey Process
4he asic process for creating and using !nternet sur%eys is as follows" We suggest
that you follow this process for each !nternet sur%ey you conduct"
Ser,er Setu
!f you will e using your own ser%er to host the sur%ey and you ha%e not already
setup your ser%er0 select Ser%er \ Setup to specify your ser%er settings"
!f you will e using StatPacDs ser%er to host the sur%ey0 youDll e ale to select a
pri%ate folder name when you design your first sur%ey"
Create the 5:M. Sur,ey Pa%es
1" Create a codeoo,"
2" Create a default script y selecting @esign \ !nternet Sur%ey"
3" 1odify the Primary Settings and script as necessary"
3" Fenerate and %iew the <41. files" $epeat this step as necessary"
Uload the Files to the We" ser,er
Select Ser%er \ #uto 4ransfer " Clic, the >pload Sur%ey utton"
:est the sur,ey
4est the sur%ey y repeatedly ta,ing it online as if you were a respondent" 4est
ranching and %alidity chec,s"
$ownload and i(ort the test data
Select Ser%er \ #uto 4ransfer" Clic, the @ownload $esponses utton" 4he responses
will e downloaded and imported into StatPac"
#lternati%ely0 you may manually download the file of responses y selecting Ser%er
\ 84P" !n the top pane0 na%igate to the folder containing the responses 6usually cgi-
in7" @rag the response file from the top pane to the lower pane to download the file"
#fter downloading the response file to your local computer0 select @ata \ !mport \
!nternet $esponse 8ile to import the data into StatPac"
$elete the test data fro( the ser,er
Select Ser%er \ #uto 4ransfer Select the @elete ta and clic, the @elete $esponses
utton"
#lternati%ely0 you can manually delete the responses using 84P"
!f you are using the StatPac ser%er0 select Ser%er \ 84P \ StatPac" Select ?iew \
$esponse 8older" $ight clic, on the response file and select @elete"
!f you are using your own ser%er0 select Ser%er \ 84P \ DourServerName" !n the top
pane0 na%igate to the folder containing the responses 6usually cgi-in7" $ight clic, on
the response file and select @elete"
Conduct the sur,ey
Amail in%itations or somehow ma,e respondents aware of the lin, to the sur%ey"
$ownload and i(ort the data
!f you are using your own ser%er0 select Ser%er \ #uto 4ransfer \ JourSer%er" Clic,
the @ownload $esponses utton"
!f you are using StatPacDs ser%er0 select Ser%er \ #uto 4ransfer \ StatPac" Select the
#uto 4ransfer ta and clic, the @ownload $esponses utton"
-; /eywords StatPac For Windows User's Manual
#lternati%ely0 you may manually download the file of responses y selecting Ser%er
\ 84P" !n the top pane0 na%igate to the folder containing the responses 6usually cgi-
in7" @rag the response file from the top pane to the lower pane to download the file"
#fter downloading the response file to your local computer0 select @ata \ !mport \
!nternet $esponse 8ile to import the data into StatPac"
4he ser%er will always contain the entire data set unless you delete the response file
on the ser%er 6i"e"0 downloading the response file does not erase it from the ser%er7"
4herefore0 you can download the data at any time from a sur%ey in progress and the
download would contain the entire data set from the eginning to that point in time"
When you import the data0 you would o%erwrite the e9isting file ecause the newly
downloaded file contains the entire data set"
$islay a sur,ey closed (essa%e
Select Ser%er \ #uto 4ransfer " Select the @elete ta and clic, the @elete Sur%ey
utton" 4he sur%ey will e deleted and the sur%ey closed page will e shown to
people attempting to access the sur%ey" !f you repeat this process0 the sur%ey closed
page will e deleted"
#lternati%ely0 you can use 84P to manually close a sur%ey" Select Ser%er \ 84P" !n
the top pane0 na%igate to the folder containing the sur%ey" $ight clic, on the
SurveyName.tm file and rename it to something else" $ight clic, on the
SurveyNameKclosed.tm file and rename it to SurveyName.tm0
Ser,er Setu
&efore you can create an !nternet sur%ey on your own ser%er0 you must tell StatPac
aout that ser%er" Select Ser%er \ Setup"
StatPac For Windows User's Manual /eywords -'
!f you already ha%e setup a ser%er or ser%ers0 use the arrow ,eys to scroll through
your ser%er list"
4o create a new ser%er profile0 clic, the 'ew utton" 4o delete the ser%er profile that
is currently displayed0 clic, the @elete utton"
Jour !SP will e ale to tell you the following 84P login and folder information"
F:P .o%in Infor(ation
$erver Type
4here are asically two types of ser%ers5 17 >ni9 M .inu9 and 27 Windows '4 M !!S"
When you ma,e a Ser%er 4ype selection0 the most li,ely Paths and 8olders settings
will e filled in
Domain Name
4he domain name should e specified without an http or www prefi9" 8or e9ample0
statpac.com or webpoll.org"
FTP $erver
4he 84P Ser%er is the address of the 84P ser%er" !tDs usually your domain name with
an ftp prefi9" 8or e9ample0 !tp.statpac.com or !tp.webpoll.org" !t might also e Hust
the domain name 6i"e"0 statpac.com or" webpoll.org7" !t could e%en e an !P address"
,sername and Pass"ord
Jour >sername and Password will e pro%ided y your !SP" >sernames and
passwords are usually case sensiti%e0 so use care when entering the information"
Paths 6 Folder Infor(ation
We sur%eys will not function properly unless you get all of the settings right" 4here
is a good chance that the default settings are correct0 ut not necessarily" So please e
careful" :n a >ni9 or .inu9 ser%er0 this information is case sensiti%e and is typically
lower case"
FTP Pat to --- Root Folder
When you log in to your ser%er using an 84P program0 youDll e sitting in a folder on
the ser%er" Jour wwwroot folder is the folder where you put your We site <41.
files" Jou should see your We site home page in that folder" !t might e the 84P
login folder or it might e a sufolder #ll of these are li,ely sufolder names"
pulicXhtml
wwwroot
docs
yourdomain name"com
!f your 84P login folder is the same as your wwwroot folder0 then lea%e this setting
lan," !f your wwwroot folder is in a sufolder0 specify the sufolder name"
!f you donDt ,now0 contact your !SP or try to disco%er it yourself y e9ploring your
ser%er" Select 8ile \ A9it" Select Ser%er \ 84P and select the ser%er you are trying to
set up" 4he top pane will e your 84P login folder" @o you see any <41. files in
that folderY !f not0 do you see any of the ao%e sufolder namesY Jou can doule
;> /eywords StatPac For Windows User's Manual
clic, on the sufolder names to see the contents of that folder" JouNre loo,ing for the
folder that contains files with e9tensions of "htm or "html 6e"g"0 inde9"htm or
default"html7" Close the 84P program and return to the Ser%er Setup program to enter
the folder name"
FTP Pat to C.I $cript Folder
4his folder is easy to identify ecause it is nearly always called cgi-in or cgi" !t is
usually a sufolder of the wwwroot folder" Specify the path as the full path to the
folder eginning at the 84P login folder"
+1ample 5 7 The wwwroot folder is a subfolder 2typical $ni18&inu1 server4
4he ser%er folder structure is5
84P .ogin 8older
pulicXhtml
cgi-in
4he 84P path to the wwwroot folder would e5 pulicXhtml
4he 84P path to the CF! script folder would e5 pulicXhtmlMcgi-in
+1ample 6 7 The wwwroot folder is a subfolder 2typical Windows IIS server4
4he ser%er folder structure is5
84P .ogin 8older
wwwroot
cgi-in
4he 84P path to the wwwroot folder would e5 wwwroot
4he 84P path to the CF! script folder would e5 wwwrootMcgi-in
+1ample 9 7 The wwwroot folder is the wwwrootfolder 2e./.% /odaddy.com4
4he ser%er folder structure is5
84P .ogin 8older is the wwwroot folder
cgi
4he 84P path to the wwwroot folder would e5 lea%e lan,
4he 84P path to the CF! script folder would e5 cgi
+1ample : 7 The wwwroot folder is a subfolder called mydomain.com and the
c/i script folder is at the same folder level as mydomain.com
4he ser%er folder structure is5
84P .ogin 8older
mydomain"com
cgi-in
4he 84P path to the wwwroot folder would e5 mydomain"com
4he 84P path to the CF! script folder would e5 cgi-in
StatPac For Windows User's Manual /eywords ;1
Response $torage Folder
4his is the folder where respondentsN answers will e stored" !t is specified
differently depending of the type of ser%er"
$ni1 or &inu1 Server
:n a >ni9M.inu9 ser%er0 it is e9pressed as either an asolute ser%er path or a path
relati%e to the cgi script folder" We hi/hly recommend leavin/ the settin/ as .8
which means to store responses in the c/i script folder. 4he cgi script folder is not
%isile to the outside world on a properly configured ser%er"
4here are numerous ways to specify the storage folder on a >ni9 or .inu9 ser%er"
4he setting may e specified as asolute ser%er path or relati%e to the cgi-in folder"
#solute ser%er paths always egin with a forward slash"
#ll of these would store the results in the cgi-in folder"
Storage8older^MhomeMusernameMpulicXhtmlMcgi-in 6asolute ser%er path7
Storage8older^""Mcgi-in 6two periods7
Storage8older^"M 6one period7
#ll of these would store the results in a folder called OstorageO which is immediately
elow the cgi-in folder"
Storage8older^MhomeMusernameMpulicXhtmlMMcgi-inMstorage
Storage8older^""Mcgi-inMstorage 6two periods7
Storage8older^"Mstorage 6one period7
4hese would store the results in a folder called Opri%ateO which is at the same le%el as
pulicXhtml 6and therefore not accessile to the outside world7"
Storage8older^MhomeMusernameMpri%ate 6asolute ser%er path7
Storage8older^""M""Mpri%ate 6two periods7
4hese would store the results file in a folder called OstorageO which is immediately
elow the pulicXhtml folder" 'ote that this may pose a security ris, ecause the
storage folder would e accessile to the world"
Storage8older^MhomeMusernameMpulicXhtmlMstorage 6asolute path7
Storage8older^MpulicXhtmlMstorage
Storage8older^""Mstorage 6two periods7
#T% Windows% or IIS Server
:n an '4 or !!S ser%er the setting is specified using a @:S path 6i"e"0 the full path
eginning with a dri%e letter to the folder where responses should e stored7" >sers
must ha%e readMwrite access to the folder" #n e9ample might e5
;& /eywords StatPac For Windows User's Manual
Storage8older^c5SinetpuSwwwrootScgi-in
!n order to use 84P to retrie%e the data0 the wwwroot folder name must part of the
Storage8older path" 8or e9ample0 you would not e ale to use 84P to retrie%e this
data ecause the storage folder is not elow the wwwroot folder"
Storage8older^d5Sdatastorage
Some older '4 ser%ers re;uire that you use doule ac,slashes instead of single
ac,slashes" !f you recei%e a QSer%er &usyR message after clic,ing the sumit utton
on a sur%ey0 try changing the path to doule ac,slashes in place of single
ac,slashes5
Storage8older^c5SSinetpuSSwwwrootSScgi-in
$erver Pat to Perl
4ype the asolute path where Perl is installed on your ser%er" Jour !SP will e ale to
tell you this information" 4he default settings are most li,ely correct" 4he synta9 for
this setting is different for >ni9M.inu9 and '4M!!S ser%ers"
$ni1 or &inu1 server!
Perl^MusrMinMperl
Windows 2#T or IIS4 server!
Perl^c5SperlSinSperl"e9e
%ail %etod
4here are 3 mail methods to select from" 4he defaults are proaly correct" 8or
>ni9M.inu9 ser%ers0 we suggest >ni9 Send1ail" 8or '4M!!S we suggest S14P 1ail
Ser%er"
$ni1 Sendmail
>se this method on >ni9M.inu9 ser%ers only" Set the ser%er path to the mail program
to pint to the asolute ser%er path" Jour !SP should e ale to gi%e you the path and
name of your ser%er mailing program" 8or e9ample0 usrMsinMsendmail
erl "ail! Sendmail
StatPac For Windows User's Manual /eywords ;1
4his method may e used with any ,ind of ser%er" !t uses the perl 1ail55Sendmail
module" Jou must ha%e the perl module installed on your ser%er to use this method""
S"T "ail Server
4his method may e used with any ,ind of ser%er" !t uses your S14P ser%er to send
emails"
erl #et! S"T
4his method may e used with any ,ind of ser%er" !t uses the perl 'et5S14P module"
Jou must ha%e the perl module installed on your ser%er to use this method""
$%TP Port
When you choose one of the S14P methods you must also specify the S14P port"
Port 22 is the default and it is most li,ely correct for your ser%er although some
ser%ers use a different port" Jour !SP to will e ale to tell you your S14P mail port
numer"
$esi%n Considerations for Internet Sur,eys
4he first step in any sur%ey is to create a codeoo," Fenerally0 this would e done
using the Frid" 4here are only a few special considerations in designing a codeoo,
for an !nternet sur%ey"
1" >se a short lower case codeoo, name without spaces0 dashes0 or special
characters"
2" Eeep your sur%ey pages short" $esponses are only collected when the user clic,s
the sumit utton" !f the user gets frustrated and lea%es your We site without
completing the sur%ey0 none of her responses will e recorded" Jou can dramatically
increase response y ,eeping your sur%eys short 6e"g"0 under 20 ;uestions7" !f your
sur%ey needs to e longer0 use a multiple page sur%ey so that responses are stored at
the end of each page" A%en if a respondent fails to finish the entire sur%ey0 data will
e captured for each page they completed"
3" #llow missing response for most items" When you do not allow missing response
and the user clic,s the sumit utton without answering all the items0 they will e
presented with a message to complete the missing item" !f they ecome frustrated
and lea%e your We site0 none of their responses on that page will e recorded e%en
though only one item might actually e missing"
3" Specify a %ariale name for each %ariale" @o not use special characters in the
%ariale name e9cept the underscore character" # good %ariale naming scheme is
C10 C20 C3a0 C30 etc"
2" When creating multiple response %ariales0 there must e the same numer of
%ariales as %alue laels0 and all the %alue laels must e specified for each of the
%ariales of the multiple response %ariales" 8or e9ample0 if you ha%e a sur%ey with
a ;uestion that says QChec, all that applyR0 and there are fi%e response choices 6%alue
;) /eywords StatPac For Windows User's Manual
laels70 then the codeoo, must contain fi%e %ariales with identical %ariale and
%alue laels"
-" .imit ranching to %ariales that will use radio uttons" &ranching out of te9t
o9es or chec, o9es is not supported" &oth simple and comple9 ranching are
supported"
)" 4est your sur%ey online efore going li%e" 4his in%ol%es completing the sur%ey
se%eral times and importing the data into StatPac" @o not assume that if the sur%ey
%isually loo,s o,ay0 it is o,ay" When you test the sur%ey online0 specify an answer
for e%ery ;uestion" 8or multiple response chec,o9es0 chec, e%ery o9" 4his is the
only way to guarantee that you ha%e not made any errors" ?isually inspect the "asc
response file 6using notepad7" !f any numeric fields ha%e more than one %alue 6with a
comma separator70 it means that you ha%e made an error in the codeoo, or StatPac
script 6two %ariales ha%e the same name or the %ariale is specified twice in the
script7"
(" 4est your email in%itation y sending an in%itation to yourself" 1a,e sure the lin,
in the in%itation wor,s li,e you e9pect it to" !n other words0 try it_
4esting is a mandatory component of e%ery internet sur%ey" @o not ypass this step_
Secial 8aria"les for Internet Sur,eys
4here are three special %ariales for !nternet sur%eys5 *%6ddress0 ,oday0 and
Respondent*G" !f you add these %ariales to your codeoo,0 you will e ale to
capture the !P address of the respondent0 the date that they completed the sur%ey0 and
a uni;ue $espondent !@ numer" #fter generating an !nternet sur%ey0 StatPac will
as, if you want to add these %ariales to the codeoo," !n most cases0 you should
answer yes"
#lternati%ely0 you can manually add these %ariales to the codeoo, during the study
design" 4he *%6ddress and Respondent*G %ariales should ha%e an #12 format and
the ,oday %ariale should ha%e an '( format" When capturing the date0 it will e
stored in the data file in JJJJ11@@ format" 4hese %ariales may e placed
anywhere in the codeoo," 4hey will not e shown on the we pages and are for
internal use only"
4here is an additional '2 %ariale0 SecondsB that will e automatically added to
!nternet sur%ey codeoo,s" 4his %ariale is used to hold the numer of seconds it
too, the respondent to complete the sur%ey" !f a respondent did not complete the
sur%ey0 the Seconds %ariale will e lan," 4he name for the Seconds %ariale is set
in the StatPac"ini file with the Seconds?ar'ame ^ parameter" !f the parameter is left
lan,0 then seconds will not e added to the codeoo, or calculated"
4he Respondent*G %ariale can e used to match respondentNs data with an e9isting
data ase of information" 8irst0 include Respondent*G as an #12 %ariale in the
codeoo," When you generate the !nternet sur%ey0 it will not appear on the sur%ey"
4he Respondent*G %ariale must e included in the codeoo, if you intend to trac,
who responded to the sur%ey" !n a typical we sur%ey0 you would use StatPacNs ul,
e-mail program to send potential respondents an in%itation to ta,e your sur%ey and
there would e a lin, in the e-mail to the sur%ey >$." !n order to trac, who
responded or to match respondentsD data with the data ase0 the >$. lin, must e
appended with a ;uestion mar, and the respondentDs !@ numer" 8or e9ample0 when
sending the e-mail to respondent whose !@ in the data ase was 9123-0 you would
use this as the lin, >$. in the email to that respondent" 4he respondent !@ may
consist of any alpha or numeric characters"
StatPac For Windows User's Manual /eywords ;!
http5MMwww"yourdomain"comMsur%eyname"htmYid^9123-
'ote5 !f you are using password protection for the sur%ey0 the lin, might e5
http5MMwww"yourdomain"comMcgi-inMsur%eyname"plYid^9123-
StatPacNs ul, e-mail program will automatically append an Yid^ to the >$. lin, in
the e-mail in%itation" !f you use StatPac to send email in%itations0 !@ handling is
automatic"
Scrit to Create the 5:M.
4he second step in creating an !nternet sur%ey is to create a script that defines all the
characteristics of the <41. pages" 4he script is a set of commands that tells StatPac
how to generate the <41. sur%ey files that will ecome your !nternet sur%ey" 4he
script language is ;uite easy to understand0 and there are only a few commands that
youDll need to ,now" !n most cases0 the default script created y StatPac will re;uire
only minor editing"
4o create a default script0 first open the codeoo," Select @esign \ !nternet Sur%ey
and the !nternet script window will show the current script" !f a script has not een
pre%iously created for this codeoo,0 a default script will e created" 4he default
script is StatPacDs est guess of how you want your sur%ey to loo,0 ut in most cases
youNll e ale to impro%e on its appearance y editing the script"
#gain0 you do not need to ,now or understand all the script commands" >sually
minor editing will e sufficient" 4he script is di%ided into sections to ma,e it easier
to understand" 4here are three maHor sections5 Primary Settings0 #d%anced Settings0
and Sur%ey Creation"
4he Primary settings must e specified for each sur%ey" 4hey control parameters that
are uni;ue to a gi%en sur%ey"
4he #d%anced settings control te9t attriutes such as fonts0 colors0 and spacing"
4hese settings often remain the same from one sur%ey to another" 4he #d%anced
settings can e sa%ed in a style sheet so they can e used in a future sur%ey"
4he Sur%ey Creation section has commands to control the order and appearance of
oHects 6i"e"0 radio uttons0 chec, o9es0 te9t o9es0 etc"7"
When Settings is not chec,ed0 only the Sur%ey Creation section will show in the
script" When Settings is chec,ed0 all the settings will e shown" 4he Primary and
#d%anced settings may e edited directly in the script window 6if Settings is
chec,ed70 or you may clic, the Adit utton to use the Script editor"
;* /eywords StatPac For Windows User's Manual
4he asic process is to let StatPac create a default script and generate the !nternet
sur%ey <41. pages" 4hen %iew the sur%ey pages and note the things you would li,e
to change" 1a,e changes in the script and regenerate the pages" ?iew the <41.
pages again and continue ma,ing changes to the script until you are satisfied with the
sur%ey"
:nce you are satisfied with the appearance of a sur%ey0 you can clic, the Ser%er
utton to upload it to the !nternet"
Jou will want to ma,e changes to the Primary Settings0 ut only the >$. to sur%ey
folder is critical ecause it defines the ser%er and folder that will host the sur%ey
online"
StatPac For Windows User's Manual /eywords ;-
Co((and Synta2 6 5el
1ost script commands ha%e two parts" 4he part to the left of the e;uals symol is a
,eyword for the script" 4he part to the right of the e;uals symol is the te9t for the
,eyword" !f the te9t part 6to the right of the e;uals symol7 is longer than one line
Hust continue typing without pressing UAnterV0 so the te9t automatically wraps to the
ne9t line6s7" >nli,e a procedure file0 an indented line will not e interpreted as a
continuation of the pre%ious line"
While %iewing the script0 you can right clic, on any line to learn more aout that
command" !f the command in%ol%es a file or color selection0 the right clic, will also
offer a settings choice"
4he actual window for the script has standard editing features" >se Ctrl *0 Ctrl C0
and Ctrl ? to cut0 copy0 and paste te9t within the window" 4here is also a semi-
automatic copy and paste feature to e9pedite changes to the script" Jou may highlight
te9t from other selected areas of the screen and then clic, in the script window to
automatically paste them into the te9t 6without actually selecting copy and paste7"
4he copy will wor, from the wor,space or the @etail window" 4o copy a %ariale
name0 select the %ariale on the right from the list and doule-clic, in the script
window on the line where the %ariale name should appear" ?ariale names will
always e added to the end of the line"
:nce created for a gi%en codeoo,0 the script is automatically sa%ed" !f you
suse;uently select @esign0 !nternet Sur%ey for the same codeoo,0 the pre%iously
createdMedited script will e shown" 4he script itself is an #SC!! te9t file with the
name Ocodebookname.scriptO" 4he script is created from the codeoo,0 ut once
created0 it is independent of the codeoo," 8or e9ample0 say you are wor,ing on a
;; /eywords StatPac For Windows User's Manual
codeoo, and then create a script Hust to see what the !nternet sur%ey will loo, li,e
6so far7" 4hen you go ac, to the Frid and add more %ariales" 4he ne9t time you
select @esign0 !nternet Sur%ey0 the pre%ious script will e shown -- without the new
%ariales" Clic, the 'ew Script utton to recreate Sur%ey Creation portion of the
script with the new %ariales" #lternati%ely0 you can manually add the commands to
the Sur%ey Creation portion of the script"
!f you want to completely start o%er with the default script for a gi%en codeoo,0
close StatPac0 delete the codebookname.script file0 rerun StatPac0 load the
codeoo,0 and select @esign0 !nternet Sur%ey"
Sa,in% and .oadin% Styles
4he #d%anced settings control the Oloo, and feelO of a sur%ey" 8onts and colors are
part of the ad%anced settings"
Jou can sa%e the QstyleR to a file so that you can recall and use the style on a future
sur%ey" 4he style includes most of the ad%anced settings 6colors0 and page layout
parameters7" 4he QStyle &uttonsR let you sa%e the current style or load a pre%ious
style" QStyle filesR ha%e the e9tension of "style and the default folder for style files is
the installation folder 6although you can sa%e or load styles to and from any folder7"
While wor,ing on a sur%ey0 sa%e the style y clic,ing on the Style Sa%e &utton and
typing a name for the style" .oad a pre%ious style y clic,ing on the Style :pen
&utton and select the style" When you generate the <41. files0 the current style will
control the appearance of the sur%ey"
4he actual style file is an #SC!! te9t file that contains most of the #d%anced settings"
When you first select @esign \ !nternet Sur%ey0 StatPac loads a style called
@efault"style from the installation folder" !f you want to change your default style0
sa%e the desired style to the installation folder using the name O@efaultO and
o%erwrite the e9isting @efault"style"
Sur,ey Generation Procedure
Fenerally0 the procedure youDll follow will e to first clic, the :E utton" 4his will
run the script that creates the !nternet sur%ey" StatPac will create se%eral <41.
pages5 a loader page0 one for each page of the sur%ey0 a than,-you page0 and a
sur%ey-closed page" :ther <41. files0 including help and popup windows0 and a
coo,ie-cutter might also e created"
When the Pre%iew o9 is chec,ed0 the sur%ey will e shown in a pre%iew window" !n
the Pre%iew window0 select ?iew to select the page you want to loo, at"
Jou may also select the &rowser .ocal utton to launch Windows A9plorer and %iew
the sur%ey you created" !f your sur%ey contains multiple pages0 you will ha%e to loo,
at each page indi%idually" #fter e9amining the appearance of the sur%ey0 close
A9plorer" !f necessary0 ma,e changes to the script and repeat the process" Jou can
continue ma,ing changes to the script until you are satisfied with the appearance of
the !nternet sur%ey" !t is important to note that many features 6including the continue
and sumit uttons7 will not wor, properly until the files are actually uploaded to the
!nternet"
StatPac For Windows User's Manual /eywords ;'
Scrit +ditor
&oth the Primary Settings section and the #d%anced Settings section of the script can
e edited using the Script editor" 8or ine9perienced users0 this will e easier than
editing the script directly0 although oth methods achie%e the same goal"
4he Script Aditor offers the aility to ma,e changes to the Primary and #d%anced
sections of the script using a form interface" 4he tas represent different sections of
the script" Changes made using the Script Aditor will e reflected in the script itself
when you e9it the script editor"
!n the Primary and #d%anced settings section of this manual that follow0 the ,eyword
in the script is specified" When using the Script editor0 you do not need to e
concerned with the ,eywords themsel%es"
Clic, the Adit utton to e%o,e the Script editor" $ight clic, on any line in the script
editor to get help for that command"
I("edded 5:M. :a%s
<41. tags may e imedded in te9t settings to control the appearance of the te9t"
4hese are5
Start and stop old5 [\ and [M\
Start and stop underlining5 [u\ and [Mu\
'> /eywords StatPac For Windows User's Manual
Start and stop italics5 [i\ and [Mi\
!nsert a line rea,5 [r\
4han,s^[\4his entire te9t is old"[M\
4e9t^:nly one word is [u\underlined[Mu\"
!nstructions^[\[i\4his is old = italics"[Mi\[M\
Closed^4han, you for your interest"[r\ [r\ 4he sur%ey is closed"
Pri(ary Settin%s
4he Primary settings will always e shown at the eginning of the script" 4his is the
only section of the script that you must complete" !t specifies critical information that
is li,ely to %ary from sur%ey to sur%ey" 4here are eight Primary settings"
5:M. 7a(e
<41. 'ame sets the name for all sur%ey pages" 4he default will e the same as the
codeoo, name ut you may change it" 4his will e the name of the sur%ey on the
We and it will e part of the lin, to the sur%ey" #n e9ample would e5
<41.'ame^$esearch
StatPac For Windows User's Manual /eywords '1
4he first %iewale page of the sur%ey is named ',?:NameK1.tm" #ll suse;uent
pages of the sur%ey 6including the than,-you page7 will ha%e file names with an
underscore and numer suffi9" 4he last numered file is the than,-you page0 which is
the page that respondents will e shown when they clic, the final sumit utton"
# one-page sur%ey would ha%e the following files"
$esearch"htm 6.oader7
$esearchX1"htm 61st page7
$esearchX2"htm 64han,-you page7
# three-page sur%ey would ha%e the following files"
$esearch"htm 6.oader7
$esearchX1"htm 61st page7
$esearchX2"htm 62nd page7
$esearchX3"htm 63rd page7
$esearchX3"htm 64han,-you page7
#dditionally0 the <41.'ame command is used to name se%eral other files"
$esearchXclosed"htm 6Sur%ey is closed page7
$esearchXcoo,ieXcutter"htm 6@elete the coo,ie7
$esearchXpopupX1"htm 61st popup window7
$esearchXpopupX2"htm 62nd popup window7
$esearchXhelpX1"htm 61st help window7
$esearchXhelpX2"htm 62nd help window7
$esearchXstart"htm 6.oader page for password protected sur%eys7
4he <41.'ameXclosed"htm page can e used after a sur%ey has een closed" #fter
a sur%ey is closed you can delete the sur%ey from your ser%er" <owe%er0 you
proaly also want to pre%ent late responders from getting a page not found
message" 4herefore0 when you delete a sur%ey0 the sur%ey closed page will e shown
to respondents"
When coo,ies ha%e een used to pre%ent %isitors from ta,ing the sur%ey more than
once0 then you also need to upload a file named codeoo,nameXcoo,ieXcutter"htm"
4his file is necessary to test your installation" When a respondent finishes a page of
the sur%ey0 they will e gi%en a coo,ie as they ad%ance to the ne9t page" 4he coo,ie
contains the !@ numer0 and controls whether they will e ale to return to a
pre%ious page and it will redirect their rowser to the proper page if they ;uit the
sur%ey without completing it and come ac, to finish it at a future time" When you
test your sur%ey online0 you too will recei%e the coo,ie" 4hus0 you could test it once
ut you might e unale to test it again" 4o delete the coo,ie from your computer0 set
your rowser to ',?:NameKcookieKcutter.tm and the coo,ie will e deleted"
JouDll then e ale to test the sur%ey again"
'& /eywords StatPac For Windows User's Manual
Banner I(a%e
&anner!mage sets the image that will e shown at the top of the page" 4o select the
image0 right clic, on the &anner!mage command line" !f youDre doing a sur%ey for a
client0 &anner!mage is proaly your clientDs logo"
&anner!mage^c5SimagesSlogo"Hpg
1ultiple anner images may e show side y side" #fter right clic,ing on the line0
select the first anner image" 4hen right clic, on the line again and select the second
anner image" 4hey will e separated on the command line y a semicolon"
&anner!mage^c5SimagesSlogo#"HpgWc5SimagesSlogo&"gif
4o erase any or all pre%iously selected anner images0 simple delete them from the
&anner!mage command line"
4ip5 4o capture a clientDs logo0 go to their We site" $ight clic, on their logo and
select Sa%e Picture #s" Jou may need to edit the logo with image editing software
such as Photo Shop or Paint Shop Pro"
5eadin%
<eading sets the te9t for the page heading" !t is generally the title of the sur%ey"
<eading^#cme !nc" Amployee Sur%ey
Finish :e2t 6 Finish UR.
8inish4e9t sets the te9t for a lin, on the than, you page and 8inish>$. sets the >$.
for the lin," !f you are doing a sur%ey for a client0 this is proaly a lin, to their
home page" !f the sur%ey is for your company0 itDs proaly a lin, to your home page"
8inish4e9t^Clic, here for the StatPac home page
8inish>$.^http5MMstatpac"com
!f oth are left lan,0 then the finish page will not ha%e an outgoing lin," !f the
8inish4e9t is specified and the 8inish>$. is left lan,0 the te9t on the than,-you
page will appear as te9t only without a hyperlin,"
Coo#ie
Coo,ie sets the type of coo,ie that will e used to pre%ent multiple sumissions from
the same computer" 4he %alid settings are5 'one0 !@0 Partial0 or 8ull"
Coo,ie^'one
Coo/ie0ID
StatPac For Windows User's Manual /eywords '1
4he respondentNs computer will e gi%en a coo,ie so that a respondent who attempts
to ta,e the sur%ey multiple times will e assigned the same !@ numer as pre%ious
administrations" !f they finish the sur%ey or ;uit prematurely and attempt to ta,e it
again0 they will start at the first page of the sur%ey and will e assigned the same !@
numer as their first access" !f they change pre%iously entered data0 their most recent
entry will e captured y the program"
Coo/ie0Partial
# coo,ie will e gi%en when the respondent reaches the than,-you page to pre%ent
them from ta,ing the sur%ey again" 4hus0 the respondent will e ale to page ac,
and forth within the sur%ey0 ut not after they ha%e completed the sur%ey" :nce
theyN%e completed the sur%ey0 they will not e ale to access it again"
Coo/ie0Full
# coo,ie will e gi%en when the respondent sumits each page" 4hus0 if a respondent
stops ta,ing the sur%ey on a gi%en page and tries to ta,e the sur%ey again at a future
time0 their rowser will automatically e redirected to the page where they left off"
Setting Coo,ie^8ull turns the sur%ey into a Qforward onlyR sur%ey" $espondents will
e ale to go forward to the ne9t page of the sur%ey0 ut they will not e ale to go
ac, to a pre%ious page" !n other words0 their rowserNs &ac, &utton will not wor,"
:nce theyN%e completed the sur%ey0 they will not e ale to access it again"
IP 0ddress Control
!PControl sets whether !P addresses will e used to pre%ent multiple sumissions
from the same !P address" 4he %alid settings are5 Jes or 'o

!PControl^Jes

When a respondent completes the sur%ey0 their !P address will e recorded in an !P
log file" !f they attempt to ta,e the sur%ey again0 their !P address will e found in the
log file and they will e pre%ented from ta,ing the sur%ey again"
!PControl is more effecti%e than coo,ies ecause coo,ie loc,ers are sometimes
installed on respondentsD computers" !PControl cannot e loc,ed" <owe%er0
!PControl should only e used when you ha%e reason to elie%e that each potential
respondent has a different !P address" 8or e9ample0 if you are sur%eying different
companies and you want to allow only one respondent from each company0
!PControl could e used" !PControl would not e appropriate if you were sur%eying
multiple people from the same company"
When using coo,ie or !P control0 the ',?:NameKcutter.tm will allow you to delete
the coo,ie or your !P address" Since the ',?:NameKcutter.tm can e accessed
from your rowser0 it means that anyone can access it" 4he ',?:KSecureCutter
setting in the StatPac"ini system defaults file can e used to control whether you will
e re;uired to enter your StatPac serial numer to access the ',?:NameKcutter.tm
file. !f <41.XSecureCutter^10 you will e re;uired to enter your serial numer and
if <41.XSecureCutter^00 you will not"
0llow Cross Site 0ccess
Cross site access might e a useful feature" Jou can place the loader page on your
domain 6the >$. respondents will see7 and host the sur%ey itself on the StatPac
ser%er" 4he loader page is named ',?:name.tm and its purpose is to load the first
') /eywords StatPac For Windows User's Manual
page of the sur%ey 6named ',?:nameK1.tm7" When cross site access is allowed0
the loader page can e hosted on a ser%er that is different than the sur%ey itself"
#llowing cross site access has ris,s ecause it ma,es your sur%ey more con%enient
to hac,ing attempts" StatPac was written to minimiBe the possiility of eing hac,ed0
and we are not aware of any successful attempts" <owe%er0 we are aware of many
situations where hac,ers ha%e tried to defeat StatPacDs security" 4his is especially true
for sur%eys from financial institutions and Opopularity pollsO for the young adult
audience" #llowing cross site access ma,es it more con%enient for someone to try to
hac, the sur%ey0 so we recommend not using cross site access unless you actually
need it"
4he ',?:K6llowCrossSite setting in the StatPac"ini system defaults file is used to
control cross site access" When <41.X#llowCrossSite ^ 10 cross site access will e
allowed" When <41.X#llowCrossSite ^ 00 an 6ccess Genied message will e
displayed0
UR. to Sur,ey Folder
We8older>$. sets the ser%er and optionally the folder where the sur%ey will reside"
!t is the full >$. to the folder that will hold the sur%ey" #ll of the sur%ey pages are
uploaded to this folder"
If you "ill be using te $tatPac server#
Specify StatPac as the We8older>$. setting5
We8older>$.^ta,e-su%ey"com
!f you want to use StatPacDs secure SS. ser%er0 add an ttpsM22www. prefi9"
We8older>$.^https5MMwww"ta,e-su%ey"com
When you clic, :E to generate the <41.0 the setting will e changed to reflect
your current pri%ate folder on the StatPac ser%er0 and the <41. will e created
using the modified setting" When using SS.0 the www" prefi9 is re;uired and will e
added y the software if you inad%ertently omit it when using https5MM"
4he lin, to your sur%eys on the StatPac ser%er will e5
http5MMta,e-sur%ey"comMfoldernameMsur%eyname"htm
or
https5MMwww"ta,e-sur%ey"comMfoldernameMsur%eyname"htm
4o change your pri%ate folder name 6when Settings is chec,ed70 right clic, on the
We8older>$. line and select Ser%er 8older Setting" #lternati%ely0 select
Ser%er\#uto 4ransfer and clic, the 8older ta"
#fter you change you folder name0 you must regenerate the <41. so that the sur%ey
incorporates the new folder name and not the old folder name" 4he We8older>$.
StatPac For Windows User's Manual /eywords '!
setting will e adHusted when to your new folder name when you generate the
<41."
If you "ill be using your o"n server#
Specify the full >$. to the folder that will hold your sur%eys"
!f your domain name is acme"com and you place the sur%ey in the home directory0
then you would set this parameter to5
We8older>$.^http5MMwww"acme"com
!f you want to place your sur%ey in a Osur%eyO folder immediately elow the home
directory0 then you would set We8older>$. to5
We8older>$.^http5MMwww"acme"comMsur%ey
!f you want to run the sumission process o%er a secure 6SS.7 ser%er0 then you must
use the fully ;ualified secure soc,et >$.5
We8older>$.^https5MM www"acme"com Msur%ey
0d,anced Settin%s
4he #d%anced Settings can e %iewed in the script y chec,ing the #d%anced
Settings chec,o9" <owe%er0 it is usually easier to clic, the Settings &utton"
5eader 6 Footer
4he <eader = 8ooter settings let you control what will appear at the top and ottom
of each page"
'* /eywords StatPac For Windows User's Manual
Repeat!annerImage
$epeat&anner!mage sets whether the anner image 6as defined in the Primary
Settings7 will e repeated on each page" $epeat&anner!mage may e set to Jes or
'o"
$epeat&anner!mage^Jes
Repeat1eading
$epeat<eading sets whether the page heading 6defined in the Primary Settings7 will
e repeated on each page" $epeat<eading may e set to Jes or 'o"
$epeat<eading^'o
PageNumbers
Page'umers sets whether page numers will e shown at the top of each page"
When a anner image is displayed0 page numers will appear in a small font elow
the anner image" !f no anner image is displayed0 they will appear elow the page
heading" Page'umers may e set to Jes or 'o"
StatPac For Windows User's Manual /eywords '-
Page'umers^'o
Continue!uttonTe't
Continue&utton4e9t sets the te9t on the continue utton for multiple page sur%eys"
:n a single page sur%ey0 this setting is ignored"
Continue&utton4e9t^Continue
4he Continue&utton4e9t may e used more than once in the Sur%ey Creation section
of the script to change the continue utton te9t on each page"
[Commands to create the first page go here\
Continue&utton4e9t^Clic, here for the second page
'ewPage
[Commands to create the second page go here\
Continue&utton4e9t^Clic, here for the third page
'ewPage
$ubmit!uttonTe't
Sumit&utton4e9t sets the te9t on the final sumit utton for the last sur%ey page"
Clic,ing this utton will ta,e the respondent to the than, you page"
Sumit&utton4e9t^8inish
Progress!ar
Progress&ar sets whether a progress ar will e shown at the ottom of each page" !t
applies only to multiple page sur%eys" 4he progress ar uses two graphics0 lue"gif
and grey"gif" 4hus0 when using the progress ar0 oth of these graphics must e
uploaded to the same ser%er folder as the sur%ey" #uto 4ransfer will automatically
upload these files when necessary" Progress&ar may e set to Jes or 'o"
Progress&ar^Jes
FootnoteTe't 2 Footnote,RL
8ootnote4e9t sets the te9t for a lin, that will e shown at the ottom of each page
and 8ootnote>$. sets the >$. for the lin," 4his is usually a lin, that a respondent
can clic, if they ha%e prolems with the sur%ey" !f oth settings are lan,0 no
footnote will e shown" !f 8ootnote4e9t is specified and 8ootnote>$. is left lan,0
the footnote will appear as te9t only"
8ootnote>$.^http5MMstatpac"com
8ootnote>$.^mailto5adminPstatpac"comYsuHect^Sur%ey <elp
'; /eywords StatPac For Windows User's Manual
Finish 6 Pous
4he 8inish and Popup settings let you control the message respondents will see when
the sur%ey is completed0 and the characteristics of popup windows if they are used"
Tan/s
4han,s sets the te9t for the than, you page" 4he te9t will use the 4itle command
attriutes ut may e modified using asic html tags to control the te9t appearance
and line spacing"
4han,s^Jour response has een recei%ed"[r\4han, you for completing
the sur%ey"
Closed
Closed sets the te9t for the sur%ey closed page" &y default0 the te9t will use the 4itle
attriutes0 ut may e modified using asic html tags to control the te9t appearance
and line spacing"
Closed^4han, you for your interest"[r\ 4he sur%ey is closed"
StatPac For Windows User's Manual /eywords ''
1elp-indo"-idt 2 1elp-indo"1eigt
<elpWindowWidth sets the <elp window width in pi9els and <elpWindow<eight
sets the <elp window height in pi9els"
<elpWindow<eight^220
<elpWindowWidth^320
1elpLin/Te't
<elp.in,4e9t sets the te9t that the respondent will see on the sur%ey for the help
lin," !f not specified0 the default is O<elpO"
<elp.in,4e9t^Clic, here for help
<elp commands may e used together to insert a pre-e9isting help file" 4he ,eyword
O<elpWindowO determines where the lin, will e inserted"

<elpWindow<eight^-00
<elpWindowWidth^1000
<elp.in,4e9t^Clic, here for help"
<elp8ile'ame^help-file-name"htm
<elpWindow
Lin/Te't
.in,4e9t sets the te9t for the .in, command which is used to insert a hyperlin, into
the sur%ey" .in,4e9t and .in,>$. should e set efore using the .in, command"
.in,4e9t^Clic, here to see our home page
.in,>$.^http5MMwww"statpac"com
.in,
Popup!annerImage
Popup&anner!mage sets whether the anner image will e displayed at the top of
popup windows" Popup&anner!mage may e set to Jes or 'o"
Popup&anner!mage^Jes
PopupFull$creen
Popup8ullScreen sets the siBe of popup pages" Popup8ullScreen may e set to Jes or
'o" When set to Jes0 popup pages will fill the respondentNs entire screen" When set
to 'o0 popup pages will only fill the current window display area 6i"e"0 the rowser
toolar and >$. address ar will not e oscured y the popup page7" When there
are no popup pages0 the setting is ignored" # full screen popup is preferred if the
popup window contains more than a couple of ;uestions"
Popup8ullScreen^'o
1>> /eywords StatPac For Windows User's Manual
Control
4he Control ta lets you change settings that control the asic operation of the
sur%ey
%etod
1ethod sets the method that will e used to capture respondentsD answers" 1ethod
may e set to Amail0 8ile0 or &oth" When 1ethod^Amail0 the responses will e
emailed to you" When 1ethod^8ile0 they will e sa%ed in a file on the ser%er" When
1ethod^&oth0 responses will e emailed to you and stored in a file on the ser%er"
4he suggested method is 8ile"
1ethod^8ile
&mail
Amail sets the suffi9 or full email address where the completed sur%ey responses will
e mailed" 4his command is ignored when using the 8ile method"
!n the first form of the command0 only the suffi9 is specified and the email will e
sent to your codeoo, name at the specified domain" 8or e9ample0 if you create an
!nternet sur%ey for a codeoo, named OresearchO0 the completed responses will e
mailed to researchPdomain"com" !n the second form of the command0 the entire
email address is specified"
StatPac For Windows User's Manual /eywords 1>1
A1ail^Pacme"com
A1ail^Iohn"@oePacme"com
Restart$econds
$estartSeconds sets the numer of seconds that the than, you page is displayed
efore the sur%ey is restarted" 4his feature is useful for ,ios, sur%eys or when using
a We sur%ey as the mechanism for data entry" When $estartSeconds is set to lan,
or Bero0 the than, you page will e displayed indefinitely" When set to a %alue greater
than 00 the than, you page will show for the specified numer of seconds0 and then
the sur%ey will e loaded again eginning with the first page"
$estartSeconds^12
%a'imi3e-indo"
1a9imiBeWindow sets whether the sur%ey will attempt to ma9imiBe the respondents
rowser window to full screen" 1a9imiBeWindow may e set to Jes or 'o"
1a9imiBeWindow^Jes
!rea/Frame
&rea,8rame sets whether the sur%ey will attempt to rea, out of an <41. frame"
@o not use this feature unless you are lin,ing to the sur%ey from within a frame set"
&rea,8rame may e set to Jes or 'o"
&rea,8rame^'o
4uto4dvance
#uto#d%ance sets whether the screen will automatically scroll to the ne9t ;uestion
when a radio utton is clic,ed" !t is often disconcerting for respondents to see the
screen scroll on its own0 so the recommended setting is 'o" #uto#d%ance may e set
to Jes or 'o"
#uto#d%ance^'o
!rancDelay
&ranch@elay sets whether ranching is immediate or delayed until the page is
sumitted" &ranch@elay may e set to Jes or 'o" When the last %ariale on a page
contains a ranch0 it will always e delayed until the page is sumitted"
When set to 'o0 all other ranching will happen immediately when the radio utton
is clic,ed" When set to Jes0 all ranching on that page will e delayed until the
respondent finishes the page and clic,s the sumit utton" &ranch@elay may e used
multiple times to change the setting from page to page or within a page"
&ranch@elay^Jes
1>& /eywords StatPac For Windows User's Manual
Cace
Cache sets whether the respondentsD rowsers will cache the sur%ey pages" Cache
may e set to Jes or 'o" !f you e9pect respondents to fre;uently use the ac, utton
to re%iew pre%ious answers0 set Cache to Jes so their pages load faster" :therwise0
the setting is not important"
Cache^Jes
Inde'
!nde9 sets whether search engine spiders will e allowed to inde9 and follow lin,s
on the sur%ey pages" !nde9 may e set to Jes or 'o" Aach sur%ey page will include
the roots meta tag with instructions to search engine spiders to include or e9clude
the page from their inde9" Some search engine spiders ignore meta tags so setting
!nde9 to 'o will not guarantee that a page will not e inde9ed"
!nde9^'o
ForceLoader$ubmit
8orce.oaderSumit sets the method used to load the first page of the sur%ey"
8orce.oaderSumit may e set to Jes or 'o" 4he lin, to the sur%ey is actually a lin,
to a loader page" 4he loader can display the first page of the sur%ey using two
different methods"
When set to 'o 6fastest method70 the loader page is replaced with the first page of the
sur%ey" >sing this method0 you will not e ale to tell how many people Hust loo,ed
at the sur%ey without completing any ;uestions" @ata will only e captured when
they clic, a sumit utton"
When set to Jes0 the loader page is processed as if a sumit utton were clic,ed" 4he
respondentDs !P address and data and time are captured" A%en if they donDt complete
any actual sur%ey ;uestions0 youDll ,now that they loo,ed at first page of the sur%ey"
8orce.oaderSumit^Jes
&'traTall!lan/Line
A9tra4all&lan,.ine sets the height when the &lan,.ine command is used"
A9tra4all&lan,.ine may e set to Jes or 'o" # setting of Jes increases the height of
a lan, line0 and 'o decreases it"
A9tra4all&lan,.ine^'o
RadioTe'tPosition
$adio4e9tPosition sets the position of the te9t that is adHacent to a radio utton"
$adio4e9tPosition may e set to .eft or $ight" When set to .eft0 the te9t will appear
to the left of a radio utton0 and when set to $ight0 the te9t will e displayed to the
right of the radio utton"
A9ample5 $adio4e9tPosition^$ight
StatPac For Windows User's Manual /eywords 1>1
$adio4e9tPosition may e used multiple times to display some ;uestions with the
te9t to the left of the radio uttons and some ;uestions to the right of the radio
uttons" 8or e9ample0 these lines would show two groups of ;uestions with radio
uttons in a horiBontal format" 4he first group would ha%e the te9t 6;uestions7 appear
to the right of the radio uttons0 and the second group would ha%e the te9t appear to
the left of the radio uttons"
Cuestion^Please indicate the importance of these items5
$adio4e9tPosition^$ight
$adio !mptX1 - !mptX2
&lan,.ine
$adio4e9tPosition^.eft
Cuestion^Please indicate your satisfaction with the following items5
$adio SatX1 - SatX2
Te't!o'Te'tPosition
4e9t&o94e9tPosition sets the position of the te9t that is adHacent to a te9t o9"
4e9t&o94e9tPosition may e set to .eft or $ight" When set to .eft0 the te9t will e to
the left of the te9t o90 and when set to $ight0 the te9t will e displayed to the right
of the te9t o9" 4e9t&o94e9tPosition may e used multiple times to display some
;uestions with the te9t to the left and other ;uestions with the te9t to the right of the
te9t o9"
4e9t&o94e9tPosition^.eft
LargeTe't!o'Position
.arge4e9t&o9Position sets the position of a large te9t o9" .arge4e9t&o9Position
may e set to .eft or Center" When set to .eft0 a te9t o9 will e left Hustified0 and
when set to Center0 a large te9t o9 will e centered on the page"
.arge4e9t&o9Position may e used multiple times to show some large te9t o9es to
the left and some centered" #pplies to large te9t o9es only 6i"e"0 multiple lines7"
.arge4e9t&o9Position^.eft
LargeTe't!o'Progress!ar
.arge4e9t&o9Progress&ar sets whether a large te9t o9 will ha%e a progress ar
underneath of it to show respondents how much of the ma9imum te9t space they
ha%e typed" .arge4e9t&o9Progress&ar may e set to Jes or 'o" !f the field width of
the %ariale is %ery long0 then the progress ar is unnecessary" !f you elie%e that
respondents might attempt to type te9t that is longer than the field width then a
progress ar is desirale"
.arge4e9t&o9Progress&ar^'o
Fonts 6 Colors
4here are numerous commands to insert te9t into a sur%ey page" 4hese are5
1>) /eywords StatPac For Windows User's Manual
<eading^4his is a large heading"
4itle^4his is a title with smaller te9t"
4e9t^4his is normal te9t"
8ootnote^4his is the footnote at the ottom of the page"
!nstructions^4his is te9t in a frame"
Cuestion^4his is more te9t in a frame"
4he attriutes for these commands control the siBe0 color0 spacing0 Hustification0 and
features li,e old0 underline and italics"
.lobal 4ttributes
4he Floal #ttriutes specify the default Hustifications0 colors0 and tale attriutes
for the %arious components of the sur%ey" 4he first letter of each attriute indicates
that it is a gloal command 6OFO stands for gloal70 and applies to the we page as a
whole"
FIustification^Center
FColor^/000000
F&gColor^/888888
F&order^0
StatPac For Windows User's Manual /eywords 1>!
FCellpadding^2
FCellspacing^0
FWidth^)2`
F&orderColor^/C0C0C0
Wallpaper^c5SStatPacSWallpaperSac,ground"Hpg
FIustification sets the gloal Hustification" 6.eft0 Center0 or $ight7
FColor sets the gloal font color" 4o select a color while editing the script0 right clic,
on the command line"
F&gColor sets the ac,ground color when a wallpaper is not specified" 4o select a
color while editing the script0 right clic, on the command line"
F&order sets the gloal order thic,ness in pi9els"
FCellpadding sets the space etween the gloal frame and tale cells in pi9els"
FCellspacing sets the amount of space etween the contents of a cell and the cell
wall in pi9els"
FWidth sets the sur%ey width as a percent of the total screen width in percent"
F&orderColor sets the gloal order color when there is a order" 4o select a color
while editing the script0 right clic, on the command line"
Wallpaper sets the ac,ground wallpaper for the sur%ey" 4o select the wallpaper0
right clic, on the command line"
1eading5 Title5 Te't5 2 Footnote 4ttributes
4here are four commands that can e used to insert te9t into the sur%ey without a
frame 6i"e"0 the gloal ac,ground color or wallpaper will appear as the ac,ground
ehind the te9t7" 4hese are the <eading0 4itle0 4e9t and 8ootnote commands"
Aach of these has its own attriutes" Fenerally0 heading is the largest font and
footnote is the smallest"
----- <eading #ttriutes -----
<eading8ont8ace^#rial
<eading8ontSiBe^1(
<eading&old^Jes
<eading>nderline^'o
<eading!talics^'o
<eadingIustification^center
<eadingColor^/000000
----- 4itle #ttriutes -----
4itle8ont8ace^#rial
4itle8ontSiBe^12
4itle&old^Jes
4itle>nderline^'o
4itle!talics^'o
1>* /eywords StatPac For Windows User's Manual
4itleIustification^left
4itleColor^/000000
----- 4e9t #ttriutes -----
4e9t8ont8ace^#rial
4e9t8ontSiBe^10
4e9t&old^'o
4e9t>nderline^'o
4e9t!talics^'o
4e9tIustification^left
4e9tColor^/000000
----- 8ootnote #ttriutes -----
8ootnote8ont8ace^#rial
8ootnote8ontSiBe^(
8ootnote&old^'o
8ootnote>nderline^'o
8ootnote!talics^'o
8ootnoteIustification^center
8ootnoteColor^/000000
X8ont8ace sets the font face" 6#ny font name7
X8ontSiBe sets the font siBe" 68ont siBe in points7
X&old sets whether the te9t will e old" 6Jes or 'o7
X>nderline sets whether the te9t will e underline" 6Jes or 'o7
X!talics sets whether the <eading will e italics" 6Jes or 'o7
XIustification sets the Hustification for the te9t" 6.eft0 Center0 or $ight7
XColor sets the font color for the te9t" 4o select a color while editing the script0 right
clic, on the command line"
Instructions5 6uestion5 and Response 4ttributes
4here are three ,inds of framed te9t" 4his te9t will appear in a frame with a order"
4he ac,ground color of the frame may e different from the gloal ac,ground
color" 4wo of these 6!nstructions and Cuestion7 may e inserted into the page y
using the command"
!nstructions^Please answer the following items"
Cuestion^Select you le%el of agreement or disagreement with the
following5
4he response attriutes controls the appearance of the response choice frame" 4hat is0
the frame that displays the response choices and contains radio uttons0 chec, o9es0
or te9t o9es"
StatPac For Windows User's Manual /eywords 1>-
4he first letter of the command indicates which type of attriute is eing modified"
O!O stands for instructions0 which is special te9t that can e shown to the user" 4he
instruction attriutes control the appearance of the instruction te9t"
OCO stands for the ;uestion itself 6i"e"0 the %ariale lael7" 4he ;uestion attriutes
control the appearance of the ;uestion te9t"
O$O is for the response categories or response te9t 6i"e"0 the %alue laels7" 4he
response attriutes control the appearance of the response choices"
4here are se%eral attriutes for each of the framed components" 4hese lines descrie
the attriutes that will e used to create the !nternet sur%ey" :nce you ha%e set your
preferences0 they will rarely need to e changed in the script commands"
----- !nstruction #ttriutes -----
!8ont8ace^#rial
!8ontSiBe^10
!&old^Jes
!>nderline^'o
!!talics^'o
!Iustification^left
!Color^/000000
!&gColor^/888888
!&order^0
!Cellpadding^2
!Cellspacing^0
!Width^100`
!&orderColor^/C0C0C0
----- Cuestion #ttriutes -----
C8ont8ace^#rial
C8ontSiBe^10
C&old^Jes
C>nderline^'o
C!talics^'o
CIustification^left
CColor^/000000
C&gColor^/@@@@@@
C&order^1
CCellpadding^2
CCellspacing^0
CWidth^100`
C&orderColor^/C0C0C0
----- $esponse #ttriutes -----
1>; /eywords StatPac For Windows User's Manual
$8ont8ace^#rial
$8ontSiBe^10
$&old^'o
$>nderline^'o
$!talics^'o
$Iustification^left
$Color^/000000
$&gColor^/888888
$&order^1
$Cellpadding^2
$Cellspacing^0
$Width^100`
$&orderColor^/C0C0C0
$&arColor^/808080
X8ont8ace sets the font face" 6#ny font name7
X8ontSiBe sets the font siBe" 68ont siBe in points7
X&old sets whether the te9t will e old" 6Jes or 'o7
X>nderline sets whether the te9t will e underline" 6Jes or 'o7
X!talics sets whether the <eading will e italics" 6Jes or 'o7
XIustification sets the Hustification for the te9t" 6.eft0 Center0 or $ight7
XColor sets the font color for the te9t" 4o select a color while editing the script0 right
clic, on the command line"
X&FColor sets the ac,ground color of the frame" 4o select a color while editing the
script0 right clic, on the command line"
X&order sets the siBe of the order around the frame in pi9els"
XCellpadding sets the space etween the gloal order and the frame order in
pi9els" XCellpadding is used to control the amount of space that the te9t will e
indented" 8or e9ample0 if RCellpadding45 then the oHect for the response choices
6radio uttons0 chec, o9es0 etc"7 will e flush left" !f RCellpadding4A then the
oHect for the response choices will e indented fi%e spaces 6characters7" <ere are
two e9amples" :n the first one0 RCellpadding43 and on the second0
RCellpadding415"
1" What is your genderY
1ale
8emale
1" What is your genderY
1ale
8emale
XCellspacing sets the space etween the frame order and the te9t in the ;uestions
cell in pi9els"
StatPac For Windows User's Manual /eywords 1>'
XWidth sets the width of the frame as a percent of the gloal width 6usually 100`7"
X&orderColor sets the ;uestions order color when there is a order"
$&arColor sets the ac,ground color of e%ery other row in matri9 style response
choices"
Passwords 9 Color 6 Banner I(a%e
Password protected sur%eys are one way to control who has access to the sur%ey"
Login!annerImage
Sets the image that will appear at the top of the login page" 4o select the image while
editing the script0 right clic, on the command line"
.ogin&anner!mage^c5SimagesSlogo"Hpg
Login!.Color
Sets the ac,ground color for the login page when no login wallpaper is specified"
4o select a color while editing the script0 right clic, on the command line"
.ogin&gColor^/888888
11> /eywords StatPac For Windows User's Manual
Login-allpaper
Sets the ac,ground wallpaper for the login page" 4o select the wallpaper while
editing the script0 right clic, on the command line"
.oginWallpaper^c5SimagesSac,ground"Hpg
Login-indo"Color
Sets the ac,ground cell color for the login window" 4o select a color while editing
the script0 right clic, on the command line"
.oginWindowColor^/888888
Passwords 9 :e2t 6 Control
Pass"ordType
Paswword4ype sets the method that will e used for password protection"
Password4ype may e set to type to 'one0 Single0 or 1ultiple"
When %assword,ype4None0 there will e no password protection" 'one of the other
parameters in the Password Section need to e set" 4hey are only important if
%assword,ype is set to Single or ?ultiple"
StatPac For Windows User's Manual /eywords 111
When %assword,ype4Single0 there will e one password for all respondents who
access the sur%ey"
When %assword,ype4?ultiple0 each person who accesses the sur%ey will ha%e a
uni;ue password"
Password4ype^1ultiple
LoginTe't
.ogin4e9t sets the te9t shown at the top of the login window" !t is the heading for the
login window"
.ogin4e9t^Please .og !n
Pass"ordTe't
Password4e9t sets the te9t on the login screen that prompts the respondent for the
password" !t will appear to the left of the te9to9 where a respondent enter their
password"
Password4e9t^Password
Login!uttonTe't
.ogin&utton4e9t sets the te9t for the utton on the login screen"
.ogin&utton4e9t^.og !n
FailTe't
8ail4e9t sets the message that will e shown to a respondent who enters an in%alid
password"
8ail4e9t^!n%alid .ogin #ttempt to
Fail!uttonTe't
Sets the te9t on the retry utton that will e shown to a respondent who enters an
in%alid password"
8ail&utton4e9t^4ry #gain
$o"Lin/
Show.in, sets whether the finish page hyperlin, 6usually a lin, to your home page7
will also e displayed on the login page" Show.in, may e set to Jes or 'o" 4he
Primary settings of 8inish4e9t and 8inish>$. control the creation of the lin,"
Show.in,^Jes
&mail%e
Amail1e sets the conditions when you will e emailed a notification of a login"
Amail1e may e set to 'one0 ?alid0 !n%alid0 or &oth"
11& /eywords StatPac For Windows User's Manual
Amail1e^'one 'o e-mail will e sent to you for either %alid or in%alid login
attempts"
Amail1e^?alid #n email will e sent to you when there has een a %alid login"
Amail1e^!n%alid #n email will e sent to you when there has een an unsuccessful
attempt to login"
Amail1e^&oth #n email will e sent to you when there has een a %alid or in%alid
login attempt"
Amail1e^'o
7eepLog
Eeep.og sets what ,ind of access will e sa%ed in a ser%er log" Eeep.og may e set
to 'one0 ?alid0 !n%alid0 or &oth" 4he actual log file will e named
codebookname.log and will e stored in the same folder as the script 6usually the cgi-
in folder7" 4his is an #SC!! te9t ta delimited file and may e downloaded and
e9amined with any editor"
Eeep.og^'one 'o messages will e written to the ser%er log"
Eeep.og^?alid # message will e written to the ser%er log when there has een a
%alid login"
Eeep.og^!n%alid # message will e written to the ser%er log when there has een
an unsuccessful attempt to login"
Eeep.og^&oth # message will e written to the ser%er log when there has een an
%alid or in%alid attempt to login"
Eeep.og^&oth
Passwords 9 Sin%le ,s. Multile
4he script editor will as, for slightly different information depending on the
password method 6single or multiple7" 4he lin, to a password protected sur%ey is the
same as a non-password protected sur%ey"
Pass"ord 8single pass"ord metod9
Password sets the password for the sur%ey" 4he same password is used for all
respondents" 4he password can e any comination of letters and numers" !t is not
case sensiti%e" We recommend short numeric passwords consisting of three to fi%e
digits or simple words or acronyms" #ccess to the sur%ey will e limited to people
,nowing the password"
Password^Secret
Pass"ordFile 8multiple pass"ords metod9
Password8ile sets the name of the file containing the passwords" 1ultiple password
sur%eys use a data ase of passwords stored on the ser%er in the cgi-in folder" 4he
password file is in ta delimited #SC!! te9t format" !t must contain at least one field
6the %alid passwords70 ut it may contain other fields as well" !t is often the same file
that used to send e-mail in%itations to participate in the sur%ey" When a respondent
StatPac For Windows User's Manual /eywords 111
types a password at the login screen0 the password file associated with the sur%ey is
e9amined to see if there is a match" 4o select a password file0 right clic, on the
command line"
Password8ile^c5Ssur%eyS#(3passwords"t9t
Pass"ordField 2 ID Field 8multiple pass"ords metod9
Suppose you had an A9cel file of email addresses and employee !@ numers" 4he
first thing you would do is use A9cel to write the two fields to a ta delimited file"
4he file would now loo, li,e this5
HohnPsomedomain"com 3-2-32
maryPanotherdomain"com 3)--2)
!f you wanted to use employee !@ as the password for the login0 you would set
Password8ield^2" Amployee !@ would e used as the password"
Password8ield^2
!f you want to e ale to trac, who responded and who didnDt then you need to also
specify an !@8ield" !@8ield identifies what field will e used as StatPacDs internal
$espondent!@ to identify that respondent" !n the ao%e e9ample0 if you wanted to
use Amployee !@ to trac, respondents0 then you would also set !@8ield^2"
Password8ield^2
!@8ield^2
!f you wanted to use employee !@ as the password for the login ut ,eep the sur%ey
anonymous0 you would set Password8ield^2 and lea%e the !@8ield lan," When
!@8ield is left lan,0 a random !@ numer will e generated when a respondent
egins ta,ing the sur%ey" 4his will not allow you to trac, who responded and who
didnDt" !t is the only method to create a password protected anonymous sur%ey"
Password8ield^2
!@8ield^
Jou could use the e-mail list management programs to add a random !@ numer to
the ta delimited file for trac,ing respondents" StatPac always adds the !@ numer as
the second field0 so after running the program to add an !@ numer0 the file might
loo, li,e this5
HohnPsomedomain"com 9(-)323 3-2-32
maryPanotherdomain"com 32)9-(3 3)--2)
11) /eywords StatPac For Windows User's Manual
Jou would set Password8ield^3 and set !@8ield^2" 4hen0 respondents would enter
their Amployee !@ numer as the password and a random !@ numer would e used
to trac, respondents" 'ote that this method is not anonymous ecause the random !@
numer could e used to lin, a particular respondent with their responses to the
sur%ey"
Password8ile^c5SofficeSemployee"t9t
Password8ield^3
!@8ield^2
Pass"ordControl
PasswordControl sets the progress control that will e used on password protected
sur%eys" !t is only a%ailale for multiple password sur%eys and can e set to 'one0
:nce0 or 8orward"
:nce means that a respondent can complete the sur%ey only once" 4hey can log in
multiple times 6always eginning on page one70 ut after theyD%e reached the than,
you page0 they will not e ale to log in again"
8orward means that they can log in multiple times0 ut they will always egin on the
page where they left off" #fter theyDre reached the than, you page0 they will not e
ale to log in again" 8orward control only applies to multiple page sur%eys"
PasswordControl^:nce
Passwords 9 :echnical 7otes
4he information in this section is not re;uired to run StatPac" StatPacDs #uto 4ransfer
feature ma,es it unnecessary to ,now what files need to e uploaded to what folders"
<owe%er0 the information is important should you decide to manually upload or
download files"
When you create a password protected sur%ey StatPac does numerous things Oehind
the scenesO"
8or a single password method0 a file called studyname.text is created in the proHect
folder" !t contains a single line consisting of the password" 8or a multiple password
method0 the password file you specify is written to the proHect folder using the name
studyname.text" #uto 4ransfer uploads this file to the cgi-in folder"
# file called password.pl will e created in your proHect folder" #uto 4ransfer
uploads the file to the cgi-in folder on your ser%er and sets the permissions to )22"
4his is the program that reads the data ase to determine if the respondent has
entered a %alid password"
4he first page of the sur%ey 6studyname"htm7 is renamed to studynameXstart"htm and
the login page is named studyname"htm" #uto 4ransfer uploads studynameXstart"htm0
StatPac For Windows User's Manual /eywords 11!
Ser,er 3,errides
When using your own ser%er0 you can o%erride your ser%er settings y using these
commands" We do not recommend the use of these commands since the appropriate
way to ma,e a change is to change your ser%er settings" 4o use these commands0
remo%e the leading a so the command is left Hustified in the script"
4ctionTag
#ction4ag sets the full >$. to StatPacDs Perl script" 4he #ction4ag setting will
ecome part of the action tag in the html source code for the sur%ey" 4he function of
the Perl script is to ta,e the answers from the html page and store them in a file on
the ser%er or email them to you" When a respondent clic,s the sumit utton0 it will
direct the process to the location of the Perl script on the ser%er"
4he name of the Perl script on your local computer is statpac11"pl" $espondents will
see the #ction4ag setting in the address ar of their rowser while ta,ing the sur%ey"
8or e9ample0 they would see5
http5MMwww"yourdomain"comMcgi-inMstatpac11"pl
4herefore0 the default script will change the name of statpac11"pl to your
surveyname.pl. 8or e9ample0 if you are doing a sur%ey for *JL company0 you might
name the html files O*JLO" 4he default #ction4ag setting would e5
#ction4ag^http5MMwww"yourdomain"comMcgi-inM*JL"pl
4hat way0 respondents will see the company name in their address ar while they are
ta,ing the sur%ey" :n most ser%ers0 the www is optional and could e5
#ction4ag^http5MMyourdomain"comMcgi-inM*JL"pl
!f you are running on a secure ser%er will SS. and your We8older>$. uses a
https5MM prefi90 then the #ction4ag should also use https5MM
#ction4ag^https5MMyourdomain"comMcgi-inM*JL"pl
Jou may name the Perl file to anything you want 6e9cept it must ha%e a "pl
e9tension7" !f you manually upload the files to your ser%er0 then you need to
manually rename the file on your ser%er from statpac11"pl to *JL"pl" 4he important
thing is that the name of the "pl file on your ser%er is e9actly the same as the
#ction4ag setting in the script"
>ni9M.inu9 ser%ers are case sensiti%e0 so ma,e sure you use the same case for the
file name that you plan to gi%e to respondents"
$torageFolder
Storage8older sets the path to the folder where responses will e stored on the ser%er"
4ypically0 responses are stored in the cgi-in folder ecause it in not readily
11* /eywords StatPac For Windows User's Manual
accessile to the outside world" When left lan,0 StatPac will use the cgi-in folder
to store responses"
4he actual file name for storing responses will e codebookname.asc"
4he setting is specified differently for >ni9 and Windows ser%ers"
$ni1 or &inu1 Server
4here are numerous ways to specify the storage folder on a >ni9 or .inu9 ser%er"
4he setting may e specified as asolute or relati%e to the cgi-in folder"
#ll of these would store the results in the cgi-in folder"
Storage8older^MhomeMusernameMpulicXhtmlMcgi-in
Storage8older^""Mcgi-in 6two periods7
Storage8older^"M 6one period7
#ll of these would store the results in a folder called OstorageO which is immediately
elow the cgi-in folder"
Storage8older^MhomeMusername pulicXhtmlMMcgi-inMstorage
Storage8older^""Mcgi-inMstorage 6two periods7
Storage8older^"Mstorage 6one period7
4his would store the results in a folder called Opri%ateO which is at the same le%el as
pulicXhtml 6and therefore not accessile to the outside world7"
Storage8older^""M""Mpri%ate 6two periods7
4hese would store the results file in a folder called OstorageO which is immediately
elow the pulicXhtml folder" 'ote that this may pose a security ris, ecause the
storage folder would e accessile to the world"
Storage8older^MhomeMusernameMpulicXhtmlMstorage
Storage8older^""Mstorage 6two periods7
#T% Windows% or IIS Server
:n an '4 or !!S ser%er the setting is specified using a @:S path 6i"e"0 the full path
eginning with a dri%e letter to the folder where responses should e stored7" >sers
must ha%e readMwrite access to the folder" #n e9ample might e5
Storage8older^c5SinetpuSwwwrootScgi-in
!n order to use 84P to retrie%e the data0 the wwwroot folder name must part of the
Storage8older path" 8or e9ample0 you would not e ale to use 84P to retrie%e this
data ecause the storage folder is not elow the wwwroot folder"
StatPac For Windows User's Manual /eywords 11-
Storage8older^d5Sdatastorage
Some !!S ser%ers re;uire that you use doule ac,slashes instead of single
ac,slashes" !f you recei%e a QSer%er &usyR message after clic,ing the sumit utton
on a sur%ey0 try changing the path to doule ac,slashes in place of single
ac,slashes5
Storage8older^c5SSinetpuSSwwwrootSScgi-in
$criptFolder
Script8older sets the full >$. of the cgi-in folder 6including the trailing M7"
Script8older^http5MMwww"yourdomain"comMcgi-inM
Perl
Perl is set to the asolute path where Perl is installed on your ser%er" Jour !SP will e
ale to tell you this information" 4he synta9 for this setting is different for
>ni9M.inu9 and '4M!!S ser%ers"
$ni1 or &inu1 server!
Perl^MusrMinMperl
Windows 2#T or IIS4 server!
Perl^c5SperlSinSperl"e9e
%ailProgram
1ailProgram is set to point to the mail program on your ser%er" 4he 1ailProgram
parameter only needs to e set if you are using password protection and want e-mail
notification of login acti%ity"
1ailProgram^MusrMsinMsendmail
Branchin% and Piin%
7rancing is set up in the codeoo, using a semi-colon to indicate a s,ip pattern"
#ny s,ip patterns specified in the codeoo, will wor, for internet sur%eys" 'othing
special needs to e done" &ranching is supported for radio uttons"
# ranch to another ;uestion on the same page will e immediate" #s soon as the
respondent clic,s one of the radio uttons0 the screen will scroll to the ranched
%ariale" # ranch to a %ariale on another page may e immediate 6when the
11; /eywords StatPac For Windows User's Manual
respondent clic,s the radio utton7 or delayed until the respondent clic,s the sumit
utton"
4he &ranch@elay command may e used multiple times in the script to set the
ranching to immediate or delayed" !t may e set to Jes or 'o" 8or e9ample0 the
following command would delay the ranching to another page until the sumit
utton is clic,ed"
&ranch@elay^Jes
%iping refers to displaying an answer from a pre%ious ;uestion to a suse;uent
;uestion" Piping is supported for multiple page sur%eys" Jou may pipe a response
from one page to another page0 ut not to the current page"
8or %ariales that contain %alue laels0 the piped te9t will e the %alue lael of the
selected response choice" 8or %ariales that do not contain %alue laels0 the piped
te9t will e the actual te9t entered y the respondent" # piped response is re;uested
on a suse;uent page using the 6b?ariale'ameb7 synta9 in either an !nstruction
command0 Cuestion command0 a %ariale lael or %alue lael in the codeoo,"
8or e9ample0 suppose you had a %ariale named Fender with %alue laels of 1^male
and 2^female" Jou also ha%e a two open ended %ariales named 8irst'ame and #ge"
4he script for the sur%ey might e5
4e9t&o9 8irst'ame
&lan,.ine
$adio Fender
&lan,.ine
4e9t&o9 #ge
'ewPage
!nstructions^<ello 6b8irst'ameb7_ 4han,s for ta,ing our sur%ey"
!nstructions^Jou indicated that you are a 6b#geb7 year old 6bFenderb7"
&lan,.ine
Cuestion^<ow would most 6bFenderb7 s respond to these itemsY
$adio ?22-?30
Piping may also e used to prefill a te9to9 with a response to a ;uestion from a
pre%ious page" !n order to prefill a te9to90 you must use the W6b?ariale'ameb7
synta9 as a %alue lael in the codeoo," 'ote that the synta9 egins with a
semicolon when it is specified as a %alue lael" 8or e9ample0 if a pre%ious ;uestion
had as,ed for QJour'ameR0 and a ;uestion on a suse;uent page as,ed for the 'ame
of the CA:0 you could prefill the 'ame of the CA: te9to9 with QJour'ameR0 y
adding a %alue lael to the 'ame of the CA: %ariale in the codeoo," 4he %alue
lael would e W6bJour'ameb7 on a line y itself"
Rando(i?ation <Rotations=
StatPac supports %alue lael randomiBation for radio uttons and chec,o9es" !t also
supports %ariale randomiBation when groups of %ariales are displayed horiBontally"
StatPac For Windows User's Manual /eywords 11'
4raditional paper and pencil ;uestionnaires typically use rotations for nominal data
in order to %ary the order in which response choices are presented to respondents"
4his is done to reduce ias that might e introduced y the order in which choices
are listed on the page" !nternet sur%eys ha%e an ad%antage ecause they can
randomiBe 6not rotate7 the order of the %alue laels 6i"e"0 response choices7"
4he M$ switch can e added to the end of the $adio or Chec,&o9 commands to
randomiBe the order that the response choices will e displayed in the respondentNs
rowser" Aach respondent will see a uni;ue se;uence of the response choices" 8or
e9ample0 the following two commands would randomiBed the response choices for
the %ariale 1 radio uttons and the multiple response %ariales 2 through -" >se a
space to separate the M$ from the rest of the command"
$adio ?1 M$
Chec,&o9 ?2-?- M$
When used in the ao%e form0 all of the %alue laels will e randomiBed" 4his is
sometimes undesirale when the last %alue lael is an QotherR response" 4ypically0
you would want to lea%e the QotherR choice as the last one displayed e%en though the
other choices are randomiBed"
#dd a numer suffi9 to the M$ switch to tell how many %alue laels should e
e9cluded from the randomiBation" 8or e9ample0 if the last two %alue laels for
%ariale 1 were QotherR and QdonNt ,nowR choices0 the following command would
e9clude oth %alue laels from the randomiBation 6i"e"0 they will always e displayed
as the last two choices7"
$adio ?1 M$2
!n a similar e9ample0 the last %alue lael would not e included in the randomiBation"
Chec,&o9 ?2-?- M$1
4he following would randomiBe the order of the %ariales in a series of horiBontal
radio uttons"
$adio ?9- ?y M$
$andomiBation will only wor, when the sur%ey is online" !t will not wor, on your
local computer and the %ariale and %alue laels will always appear in the order
specified in the codeoo,"
Sur,ey Creation Scrit
1ost te9t in the sur%ey will e generated from the codeoo," 4here are many
situations though where you will want to insert additional te9t into the sur%ey 6e"g"0
to gi%e a section a heading7"
3,er,iew
4he MMMMM S>$?AJ C$A#4!:' MMMMM line is inserted as part of the initial script as a
comment to let you ,now where the portion of the script egins that controls the
%ariales" *o not delete or chan/e the location of this line" !t is re;uired for
StatPac to properly uild the <41. sur%ey pages"
1&> /eywords StatPac For Windows User's Manual
&lan, lines in the script are ignored" !n long and comple9 sur%eys0 you can add lan,
lines to the script to ma,e it easier for you to ,eep trac, of pages" Jou can also egin
any line with an apostrophe to ma,e it a comment"
DStart the sur%ey
4e9t^4han, you for your participation"
&lan,.ine
4e9t^ 'o indi%idual firms are identified and only aggregate data are made
pulic"
&lan,.ine
4itle^@emographics
$adio #ge
&lan,.ine
$adio Fender
&lan,.ine
'ewPage
D&egin second page
4itle^#ttitudes
Cuestion^Please rate the importance of each of the following items"
$adio :pinionX1 - :pinionX2
'ewPage
D&egin third page
4e9t&o9 C)
,sing Commands %ore tan Once in a $cript
4he Primary settings are only specified once at the eginning of the scrip" 1ost
#d%anced settings can e specified repeatedly in the Sur%ey Creation portion of the
script to change te9t0 fonts0 Hustifications0 colors0 and tale attriutes for the %arious
;uestions of the sur%ey"
8or e9ample0 you could egin a sur%ey with one color scheme and change to a
different color scheme midway through the sur%ey" 4o change an attriute0 insert the
command in the script at the place where you want the new %alue to ta,e effect"
Secify :e2t
4here are - ways to specify te9t"
1eading
<eading is used to insert te9t using the heading attriutes 6usually %ery large font7"
4here will e no frame around the te9t"
StatPac For Windows User's Manual /eywords 1&1
<eading^@A1:F$#P<!C SAC4!:'
Title
4itle is used to insert te9t using the title attriutes" 4here will e no frame around the
te9t"
4itle^#out Jou
Te't
4e9t is used to insert te9t using the te9t attriutes" 4here will e no frame around the
te9t"
4e9t^4han, you for your participation" [r\ [r\ 4he information
will e reported in aggregate and no indi%idual will e identified"
FootnoteTe't
8ootnote4e9t sets the te9t at the ottom of the page using the footnote attriutes"
8ootnotes will always appear at the ottom of the page regardless of where you
insert the command in the script"
8ootnote4e9t^Sponsored y StatPac !nc"
Instructions
!nstructions displays te9t in a frame using the instructions attriutes"
!nstructions^Please answer all items"
6uestion
Cuestion displays te9t in a frame using the ;uestion attriutes" !t is most often used
to add the ;uestion to grouped te9t o9es or a series of matri9 style radio uttons"
Cuestion^Please rate the importance of each of the following items"
$adio :pinionX1 - :pinionX2
Cuestion^Please ran, the three most important items from this list y
typing a 10 20 and 3"
4e9t&o9 !temsX1 - !temsX10
Sacin% and a%ination
1&& /eywords StatPac For Windows User's Manual
!lan/Line
4he 7lank:ine command has no e;uals symol or parameters" !t is inserted into the
script at desired locations to create a lan, line on the <41. page" !t is usually
inserted etween each ;uestion"
$adio #ge
&lan,.ine
$adio Fender
&lan,.ine
Ne"Page
4he New%age command has no e;uals symol or parameters" !nsert this line into the
script when you want to end the current sur%ey page and egin a new sur%ey page"
Aach time the New%age command appears0 StatPac will create a new <41. page"
StatPacDs default script for a sur%ey is for the entire sur%ey to appear on a single
page" !f you want to create a multi-page sur%ey0 youDll ha%e to manually insert the
New%age commands where you want to egin a new page"
'ewPage
I(a%es and .in#s
Image
4he *mage command may e used to insert one or more graphics images into the
sur%ey" 4ype !mage^ and then right clic, to select the desired graphics file 6"gif0
"Hpg0 or "mp7" 4he format for the command is5
!mage^c5SStatPacS@ataSPicture"Hpg
Jou can place multiple images side y side y specifying multiple filenames
separated y semicolons"
!mage^8ilenameW8ilenameW8ilename
#fter the <41. is generated0 you can use an <41. editor to manually insert a
graphic0 you must use either the fully ;ualified >$. as the source file path or the
special filename prefi9 of dot slash dot slash dot slash 6i"e"0 "M"M"M7 8or e9ample0 either
of the following would e acceptale methods of specifying a graphics source file5
[img src^Rhttp5MMwww"statpac"comMsur%eyMgraphic"gifR\
[img src^R"M"M"Mgraphic"gifR\
When manually inserting a graphic with and <41. editor and you plan to use #uto
4ransfer to upload your files0 the graphic must e in the proHect folder"
StatPac For Windows User's Manual /eywords 1&1
Lin/
!nserts a hyperlin, into the sur%ey" !t may e added to the script as a line y itself or
may e added as a suffi9 to other commands"
&efore using the .in, command0 first set the hyperlin, information with the
.in,>$. and .in,4e9t commands"

.in,>$.^http5MMwww"statpac"com
.in,4e9t^Clic, here to see our home page
4hen insert the .in, command 6without the e;uals symol7 where you would li,e the
lin, to appear" !t may e inserted on a line y itself in the script or may e added as a
suffi9 to other commands" Aach of the following would e correct uses of the .in,
command0 and each would create a lue hyperlin, on the sur%ey page that a
respondent could clic, on
!nstructions^Please answer these ;uestions" .in,
Cuestion^Please rate each of the following items5 .in,
$adio C1 .in,
@rop@own Choices .in,
4e9to9 :pinion .in,
.ist&o9 ?12 .in,
4he .in, commands may e used to ma,e it easier for the respondent to email you"
8or e9ample0 if you ha%e done an anonymous sur%ey and you want respondents to e
ale to re;uest a copy of the final report without any chance of lin,ing their e-mail
address to their responses0 you could insert these three commands into the script5
.in,>$.^mailto5adminPstatpac"comYsuHect^Please send the report
.in,4e9t^Clic, here to send an e-mail re;uesting a copy of the report
.in,
5el Windows
<elpWindow inserts a hyperlin, into the sur%ey for a popup help window" 4hat is0 it
lets respondent to see additional te9t that does not appear on the sur%ey itself 6e"g"0 a
help screen7" 4he command may e added to the script as a line y itself or may e
added as a suffi9 to other commands"
4he actual appearance of the lin, created y the <elpWindow command and the
contents of the popup window are controlled y three parameters" 4hese parameters
should e set in the script efore using the <elpWindow command" When the
<elpWindow command is e9ecuted0 it will use the current settings of the three
parameters" 4he three parameters are5
<elp.in,4e9t^4e9t
<elp4e9t^4e9t
<elp8ile'ame^8ilename
1&) /eywords StatPac For Windows User's Manual
<elp.in,4e9t is the lue lin, te9t that the respondent will see on the sur%ey" !f not
specified0 the default is O<elpO"
<elp4e9t is the actual te9t that will appear in the popup window when opened" !t
may use imedded <41. tags to control fonts and spacing"
<elp.in,4e9t^Please clic, here for more information
<elp4e9t^4his additional information is pro%ided to help you answer the
;uestion[r\Please try to e oHecti%e answering this ;uestion" !t is
important that you are truthful and gi%e your est answer"
<elpWindow
!f you already ha%e an "htm file that you want to use as the contents of the popup
window0 then you would not use the <elp4e9t command" !nstead0 use the
<elp8ile'ame command to specify the name of the e9isting "htm file" !f you plan to
use #uto 4ransfer to upload your files0 this file must e in the proHect folder"
<elp.in,4e9t^Clic, here for an e9planation
<elp4e9t^
<elp8ile'ame^c5SStatPacS@ataSe9planation"htm
<elpWindow

#fter setting the parameters0 the <elpWindow command" #ctually creates the
window" 4he <elpWindow command may appear on a line y itself in the script or
may e added as a suffi9 to other commands" 8or e9ample0 each of the following
would e correct uses of the <elpWindow command0 and each would create a lin,
on the sur%ey page that a respondent could clic, on to e%o,e the help window5
<elpWindow
!nstructions^Please answer these ;uestions" <elpWindow
Cuestion^Please rate each of the following items5 <elpWindow
$adio ?2 <elpWindow
@rop@own ?9 <elpWindow
4e9to9 ?32 <elpWindow
.ist&o9 ?12 <elpWindow
4he names of the popup window pages will e Osur%eynameXhelp1"htmO0
Osur%eynameXhelp2"htmO0 etc" 8or each occurrence of the <elpWindow command in
the script0 a new popup page will e created" 4he popup window pages are "htm files
and must e uploaded to the ser%er to the same folder as your sur%ey"
<ere is an e9ample of a script that creates three lin,s in the sur%ey that a respondent
could clic, on to e%o,e three different popup windows" !t will also create three
different help files"
<elp.in,4e9t^Clic, <ere for !nformation aout our sponsor
StatPac For Windows User's Manual /eywords 1&!
<elp4e9t^4his sur%ey is sponsored y StatPac !nc"[r\Jou can call us
at 6)127 332-22-1
<elpWindow
&lan,.ine
<elp.in,4e9t^:ur Pri%acy Policy
<elp4e9t^We donDt tell anyone anything_
!nstructions^Please answer all ;uestions <elpWindow
&lan,.ine
<elp.in,4e9t^<elp
<elp4e9t^Please answer this ;uestion from the perspecti%e of your a%erage
customer" 4ry to answer how you thin, your typical customer would
respond"
$adio ?1 <elpWindow
Pou Windows
Popup windows pro%ide another way of ranching" 4hey are useful when you want
to as, 6or not as,7 a few additional ;uestions depending on the respondentNs answer
to another ;uestion without changing pages from the respondentDs perspecti%e"
#n e9ample would e a ;uestion where you say0 Q!f yes0 please answer the
following"R !n a multiple page sur%ey0 you would place the yesMno ;uestion on one
page0 the conditional ;uestion6s7 on a second page0 and the rest of the ;uestions on
suse;uent pages" 4he popup window offers the same functionality0 e9cept the
conditional ;uestions will appear in a new 6popup7 window0 and the rest of the
;uestions are on the same html page as the yesMno ;uestion"
4he actual ranching instructions are set up in the codeoo, using the semicolon
synta9" 8or e9ample0 suppose we ha%e a codeoo, with a ranch so people who
drin, coffee are as,ed ;uestions 1a and 10 while people who donNt drin, coffee are
not as,ed those ;uestions" #ll %alue laels immediately prior to the popup must
specify a ranch 6e%en if itDs Hust to the ne9t %ariale0 which is in the popup window7"
?ariale .ael 15 1" @o you drin, coffeeY
1^Jes W 2
2^'o W 3
?ariale .ael 25 1a" What is your fa%orite rand of coffeeY
?ariale .ael 35 1" <ow often do you drin, coffeeY
?ariale .ael 35 2" <ow old are youY
Jou can adHust the StatPac script so that ;uestions 1a and 1 will appear on a popup
window" 4he PopupStart and PopupAnd commands may e inserted into the script to
create the popup window" !n this e9ample0 the script might e5
$adio ?1
&lan,.ine
PopupStart
1&* /eywords StatPac For Windows User's Manual
4e9t&o9 ?2
&lan,.ine
4e9t&o9 ?3
&lan,.ine
PopupAnd
4e9t&o9 ?3
4he sur%eynameX1"htm file will ha%e ;uestions 1 and 3" 4he popup page
sur%eynameXpopup1"htm file will ha%e ;uestions 2 and 3" 4he first page the
respondent sees will ha%e ;uestions 1 and 2" 4hey will egin y answering ;uestion
1" !f they select QyesR0 a popup window will appear Qon topR of the page they are
seeing" 4he popup window will show ;uestions 1a and 1" When they press the
continue utton on the popup window0 it will close0 and the respondent will see the
main page again0 showing ;uestions 1 6already answered7 and 2"
Popup windows are regular html pages" 4he only difference from a regular sur%ey
page is the way in which they are e%o,ed" Popup windows will e named
sur%eynameXpopup1"htm0 sur%eynameXpopup2"htm0 sur%eynameXpopup3"htm0 etc"
4here are se%eral rules and limitations for using popup windows5
1" Popup windows will only wor, online" Jou may %iew the popup page on your
local computer0 ut you cannot test the popup feature until the files are uploaded to a
ser%er"
2" Jou may ranch within a popup window0 ut you may not ranch out of a popup
window" 4hat is0 you may not ranch to a %ariale that is not in the popup window"
Comple9 ranching is not supported within a popup window"
3" Piping is not supported within a popup window" Jou cannot pipe to or from a
popup window"
3" !n the %ariale that e%o,es the popup window0 all %alue laels must specify a
ranch0 e%en if itDs to the ne9t %ariale 6which will e in the popup window7"
Popup windows are ideal for situations where you ha%e a small numer of
conditional ;uestions" When there are many conditional ;uestions0 use the 'ewPage
command instead of a popup window"
Sur,ey Creation 9 3"Bects
4he input methods 6called oHects7 include radio uttons0 drop down menus0 te9t
o9es0 chec, o9es0 and list o9es" When StatPac first creates the default script0 it
will select the oHects that seem most appropriate to the ;uestions" <owe%er0 after the
default script has een created0 the oHects can e changed y simply changing the
Sur%ey Creation portion of the script"
4he following is a description of the commands that can e used to create oHects" !n
all of commands0 %ariale names can e used instead of the O?O numers"
Radio Buttons for a Sin%le 8aria"le
$ynta'# Radio V' :or: Radio 8parameters9 V'
StatPac For Windows User's Manual /eywords 1&-
4he $adio command will create a radio utton for each %alue lael" !t is most
appropriate when there are a small numer of choices" 4he first form of the
command will create all the radio utton in a single column" 4he second form of the
command will allow you to specify %arious display parameters" 4he parameters are5
? < %ertical or horiBontal
1 2 one or two columns of radio uttons 6applies to %ertical format only7
# A lael all points or lael only the end points
J ' show numeric codes 6yes or no7
Parameters may e any comination in any order 6upper or lower case7" 4he
following would create a group of horiBontal radio uttons for %ariale nine with
only the end points laeled and numeric codes ao%e each radio utton"
$adio 6<AJ7 ?9
!n creating the default script0 if there are si9 or fewer %alue laels0 the default will e
one column" !f there are )-12 %alue laels0 the default will e two columns" 8or more
than 12 %alue laels0 the default will e a @rop@own menu"
When creating horiBontal radio uttons 6either single ;uestions or a matri970 one or
two minus signs can e included in the parameters to hide the codes for the one or
two highest %alue laels" 8or e9ample0 suppose you ha%e a 1-2 .i,ert scale and you
also ha%e -^'o :pinion" !ncluding a minus sign in the parameters would still show
'o :pinion te9t0 ut hide the - code in the numeric scale" !f the two highest response
choices were -^'o :pinion and )^'ot #pplicale0 then two consecuti%e minus
signs in the parameters would hide the numeric codes for oth categories" 4his
feature can e used for single %ariales in a horiBontal format or matri9 style radio
uttons"
$adio 6<#J--7 ?9

1&; /eywords StatPac For Windows User's Manual

$adio 6-7 C2a - C2f
&lan,.ine

Radio Buttons for Groued 8aria"les <(atri2 style=
$ynta'# Radio V' ; Vy :or: Radio 8parameters9 V' : Vy
When your sur%ey has a series of .i,ert scale or semantic differential scale items0 a
horiBontal radio utton format can e specified" <oriBontally grouped radio uttons
are often referred to as matrix ;uestions"
4he first form of the command will create all the radio utton in a single column"
4he second form of the command will allow you to specify %arious display
parameters" 4he parameters are5
. $ radio uttons to left or right of te9t
# A lael all points or lael only the end points
J ' show numeric codes 6yes or no7
C @ descries codeoo, format as close or distant for two
side-y-side radio utton groups
4he . and $ parameters may e used to show the ;uestions to the left or right of the
radio uttons" 4he default can e set with the Radio,ext%osition command"
4he # and A parameters may e used to lael all points or Hust the end points of the
scale" 4he # parameter will lael e%ery response choice" 4he A parameter will lael
only the anchors of the scale"
4he J and ' parameters control whether numeric codes are used to lael the scale"
Parameters may e any comination in any order 6upper or lower case7" 4he
following would create a group of horiBontal radio uttons for %ariales C2a to C2f
with te9t to the left of the uttons0 only the end points laeled0 and numeric codes
ao%e each radio utton"
StatPac For Windows User's Manual /eywords 1&'
$adio 6.AJ7 C2a - C2f
Jou will need to manually edit the default script to display a series of items in this
format" When you create the default script0 StatPac doesnDt ,now which items should
e grouped together0 so each item will e specified as an indi%idual radio utton
%ariale" 4he default script might loo, li,e this5
$adio C2a
&lan,.ine
$adio C2
&lan,.ine
$adio C2c
&lan,.ine
$adio C2d
&lan,.ine
$adio C2e
&lan,.ine
$adio C2f
&lan,.ine
4o con%ert these to matri9 format0 you would change the script so the items to e
grouped together are specified as a range on a single script line instead of each on
their own script line"
$adio C2a - C2f
&lan,.ine
!f you want to show a single %ariale in horiBontal matri9 style format0 include the
dash without the second %ariale0 as in5 $adio ?9- or $adio 6parameters7 ?9-"
4he C 6close7 or @ 6distant7 parameter should only e used when you want two
groups of radio uttons to appear side y side" 8or e9ample0 you may ha%e three
11> /eywords StatPac For Windows User's Manual
attriute %ariales" Jou want to as, respondents to rate each of the three attriutes
and you also want them to assign an importance rating to each attriute" Jou want
the layout on the screen to loo, li,e this5
#ttriute 1 $ating 1 !mportance 1
#ttriute 2 $ating 2 !mportance 2
#ttriute 3 $ating 3 !mportance 3
Jou can set up the codeoo, two different ways" 4he C or @ descries which way
the codeoo, is set up"
!n this codeoo,0 the $ating and !mportance %ariales are close to each other"
?1 #ttriute 1 $ating
?2 #ttriute 1 !mportance
?3 #ttriute 2 $ating
?3 #ttriute 2 !mportance
?2 #ttriute 3 $ating
?- #ttriute 3 !mportance
4he command would e5
$adio 6C7 %1-%-
!n this codeoo,0 the $ating and !mportance %ariales are distant from each other"
?1 #ttriute 1 $ating
?2 #ttriute 2 $ating
?3 #ttriute 3 $ating
?3 #ttriute 1 !mportance
?2 #ttriute 2 !mportance
?- #ttriute 3 !mportance
4he command would e5
$adio 6@7 %1-%-
<ere is an e9ample for 3 attriutes rated on ;uality and o%erall impression5 4he
%ariales are5
?1 #ttriute 1 G :%eral Cuality
?2 #ttriute 2 G :%erall !mpression
?3 #ttriute 3 - @ocumentation Cuality
?3 #ttriute 3 - @ocumentation !mpression
StatPac For Windows User's Manual /eywords 111
?2 #ttriute 1 G Power Cuality
?- #ttriute 2 G Power !mpression
?) #ttriute 3 G Support Cuality
?( #ttriute 3 G Support !mpression
4he command to create the side-y-side radio utton matri9 would e5
Cuestion^Please ran, the ;uality and your o%erall impression of each of the
following"
$adio 6C'7 ?1-?(
&lan,.ine
# te9to9 can e placed ne9t to the :ther response category" When used with a side-
y-side matri90 the :ther %ariale must follow the last %ariale in the %ariale list" !n
oth e9amples0 ?) would e the :ther %ariale"
$ro$own Menu
$ynta'# DropDo"n V' :or: DropDo"n 8y9 V'
4he dropdown menu is used when there are a large numer of possile categories for
the respondent to choose from" 4he most common e9ample of this is when as,ing for
a country or state" 4he first form of the command will create a dropdown menu
where only one line shows until the menu is selected y the user" Jou can set the
default te9t for the line y inserting the command5 @rop@own@efault^some te9t" !n
the second form of the command0 you can specify the numer of %alue laels to
display in the dropdown window efore the dropdown occurs" J is the numer of
lines you want to display efore the user selects the menu" !f y e;uals the numer of
%alue laels0 then all the %alue laels will e shown all the time"
@rop@own 627 Country
11& /eywords StatPac For Windows User's Manual
:e2tBo2 for a Sin%le 8aria"le
$ynta'# Te't!o' V' :or: Te't!o' 8parameters9 V'
# 4e9t&o9 is used when re;uesting that the user type something rather than choose
from a menu of items" 4he default script will use a te9to9 if there are no %alue
laels for a %ariale and the %ariale has a field width greater than 1" When the field
width for a %ariale is a long alpha field 6greater than #-070 the te9to9 will ha%e
multiple lines and a scroll ar" !f you want to force a long alpha field to use a single
line 4e9t&o90 then use the command format of5 4e9t&o9 617 ?9
4he parameters for the te9to9 are5
. C left Hustify or center the 4e9t&o9 in the frame
n numer of lines to show in the 4e9t&o9 61 to 27
P ' progress ar or no progress ar 6multiple line 4e9t&o9 only7
4he following 4e9t&o9 was centered0 shows fi%e lines0 and show no progress ar as
the respondent is typing5
4e9t&o9 6C2'7 C)
StatPac has a special feature that lets you attach a te9to9 to the last item of a radio
utton %ariale0 set of multiple response %ariales0 and a series of horiBontal radio
StatPac For Windows User's Manual /eywords 111
uttons" <ere is an e9ample of a te9to9 that has een attached to a radio uttton
%ariale"
4o use this feature0 simply create an alpha %ariale immediately following the
%ariale 6or %ariales7 that you want to contain the te9t o9" >se the word O:therO as
the %ariale lael for the alpha %ariale and do not specify the alpha %ariale in the
StatPac script" 4he codeoo, for the ao%e e9ample would e5
?ariale 1 .ael5 What is your fa%orite randY
1^&rand *
2^&rand J
3^&rand L
3^:ther
?ariale 2 .ael5 :ther
4he two criteria necessary to use this feature are5 17 the alpha %ariale has a %ariale
lael of O:therO0 and 27 the StatPac script doesnDt include the alpha %ariale" !n the
ao%e e9ample0 the"StatPac script would omit %ariale 2 6i"e"0 it would not include a
command line5 4e9t&o9 ?27"
<ere is an e9ample of a te9to9 that has een attached to the last in a series of
multiple response %ariales" 4here are four multiple response %ariales followed y a
single alpha %ariale with a %ariale lael of O:therO"
4he codeoo, to produce this e9ample would e5
?ariale 1 .ael5 Where did you hear aout the product 6chec, all7
1^$adio
2^4?
3^'ewspaper
11) /eywords StatPac For Windows User's Manual
3^:ther 6specify7
?ariale 2 .ael5 Where did you hear aout the product 6chec, all7
1^$adio
2^4?
3^'ewspaper
3^:ther 6specify7
?ariale 3 .ael5 Where did you hear aout the product 6chec, all7
1^$adio
2^4?
3^'ewspaper
3^:ther 6specify7
?ariale 3 .ael5 Where did you hear aout the product 6chec, all7
1^$adio
2^4?
3^'ewspaper
3^:ther 6specify7
?ariale 2 .ael5 :ther
8inally0 here is an e9ample of a te9to9 that has een attached to a group of
horiBontal radio uttons"
4he last two %ariales in the codeoo, used to create this e9ample are5
?ariale - .ael5 :ther 6please specify7
1^A9cellent
2^
3^
3^Poor
?ariale ) .ael5 :ther
StatPac For Windows User's Manual /eywords 11!
Jou can change the %ariale lael used to trigger this feature y editing the
StatPac"ini file" Search for ',?:KOter,ext 4 Oter and change it to the %ariale
lael you want to use to e%o,e this feature"
0ddin% a :e2tBo2 to a Radio ButtonC Chec#Bo2C or
Radio Button Matri2
StatPac has a special feature that lets you attach one or more te9to9es to a radio
utton %ariale0 set of multiple response %ariales0 or a series of horiBontal radio
uttons" 4here are two ways to do this depending on the numer and position of the
te9to9es you want to add" !n its simplest form0 one te9to9 is added to the last item"
!n the more comple9 form0 a te9to9 can e added to one or more radio uttons or
chec,o9es"

!n all of the following e9amples0 the te9to9 %ariales are specified as alpha format
and should use a field length long enough to hold the longest e9pected comment0 !n
these e9amples a format of #200 for the te9to9 %ariales would most li,ely e
sufficient"
4ttacing One Te'tbo' to te Last Item
StatPac has a special feature that lets you attach a te9to9 to the last item of a radio
utton %ariale0 set of multiple response %ariales0 and a series of horiBontal radio
uttons" <ere is an e9ample of a te9to9 that has een attached to a radio utton
%ariale"


4o use this feature0 simply create an alpha %ariale immediately following the
%ariale 6or %ariales7 that you want to contain the te9t o9" >se the word O:therO as
the %ariale lael for the alpha %ariale and do not specify the alpha %ariale in the
StatPac script" 4he codeoo, for the ao%e e9ample would e5

?ariale 1 'ame5 &rand
?ariale 1 .ael5 What is your fa%orite randY
1^&rand *
2^&rand J
3^&rand L
3^:ther
?ariale 2 'ame5 :therX&randXSpecified
?ariale 2 .ael5 :ther

11* /eywords StatPac For Windows User's Manual
4he two criteria necessary to use this feature are5 17 the alpha %ariale has a %ariale
lael of O:therO0 and 27 the StatPac script doesnDt specify the alpha %ariale"
!n the ao%e e9ample0 the StatPac script would omit %ariale 2 6i"e"0 it would not
include a command line5 4e9t&o9 :therX&randXSpecified7" 4he command to
produce the ao%e e9ample would e5

$adio &rand
&lan,.ine

Similarly0 a te9to9 can e attached to the last in a series of multiple response
%ariales" 4here are four multiple response %ariales followed y a single alpha
%ariale with a %ariale lael of O:therO"


4he codeoo, to produce this e9ample would e5

?ariale 1 'ame5 <earX1
?ariale 1 .ael5 Where did you hear aout the product 6chec, all7
1^$adio
2^4?
3^'ewspaper
3^:ther 6specify7
?ariale 2 'ame5 <earX2
?ariale 2 .ael5 Where did you hear aout the product 6chec, all7
1^$adio
2^4?
3^'ewspaper
3^:ther 6specify7
?ariale 3 'ame5 <earX3
?ariale 3 .ael5 Where did you hear aout the product 6chec, all7
1^$adio
2^4?
3^'ewspaper
3^:ther 6specify7
?ariale 3 'ame5 <earX3
?ariale 3 .ael5 Where did you hear aout the product 6chec, all7
1^$adio
2^4?
StatPac For Windows User's Manual /eywords 11-
3^'ewspaper
3^:ther 6specify7
?ariale 2 'ame5 <earX:therXSpecified
?ariale 2 .ael5 :ther

!n this e9ample0 the StatPac script would not specify %ariale 2" 4he command to
produce the ao%e e9ample would e5

Chec,&o9 <earX1 - <earX3
&lan,.ine

8inally0 here is an e9ample of a te9to9 that has een attached to the last %ariale in a
horiBontal radio utton matri9"


4he last two %ariales in the codeoo, used to create this e9ample are5

?ariale - 'ame5 :therX$ating
?ariale - .ael5 :ther 6please specify7
1^A9cellent
2^
3^
3^Poor
?ariale ) 'ame5 :therX$atingXSpecified
?ariale ) .ael5 :ther
4he StatPac script would not specify %ariale )" 4he command to produce the ao%e
e9ample would e5

$adio 4aste - :therX$ating
&lan,.ine

11; /eywords StatPac For Windows User's Manual
!n all of the ao%e e9amples0 the %ariale lael O:therO is used to e%o,e this feature"
Jou can change the %ariale lael used to trigger this feature y editing the
StatPac"ini file" Search for ',?:KOter,ext 4 Oter and change it to the %ariale
lael you want to use to e%o,e this feature"
4ttacing %ore tan One Te'tbo'
When you want to attach a te9to9 to more that one item in a radio utton %ariale0
set of multiple response %ariales0 or a series of horiBontal radio uttons0 a different
form of the synta9 is re;uired" 4his synta9 can e used to attach a te9to9 to any of
the items 6not only the last item7"
4he %ariale name for the te9to9 %ariales is how you control which radio uttons
will ha%e te9to9es" #ll te9to9 %ariale names end with OX:therO"
<ere is an e9ample of a radio utton %ariale that has three te9to9es attached to it"

4he te9to9 items immediately follow the radio utton %ariale" 4heir %ariale name
has three parts with an underscore separating the parts5 17 the name of the radio
utton %ariale0 27 the %alue lael code in the radio utton %ariale0 and 37 the word
O:therO"
4he codeoo, to produce the ao%e e9ample would loo, li,e this5

?ariale 1 'ame5 $esidence
?ariale 1 .ael5 1" Where do you li%eY
1^1inneapolis0 1'
2^St" Paul0 1'
3^:ther city in 1innesota 6specify75
3^1adison0 W!
2^1ilwau,ee0 W!
-^:ther city in Wisconsin 6specify75
)^:ther state 6specify75
?ariale 2 'ame5 $esidenceX3X:ther
?ariale 3 'ame5 $esidenceX-X:ther
?ariale 3 'ame5 $esidenceX)X:ther

StatPac For Windows User's Manual /eywords 11'
4he %ariales for the te9to9es are not specified in the StatPac script0 So the script
for this e9ample would simply e5

$adio $esidence
&lan,.ine

1ore than one te9to9 can also e included in a set of multiple response %ariales"
<ere is an e9ample where two te9to9es are attached to a set of multiple response
%ariales5


4he te9to9 %ariales immediately follow the multiple response %ariales" 4he
te9to9 %ariale names ha%e two parts separated y an underscore5 17 the name of
the multiple response %ariale0 and 27 the word O:therO"
<ere is the codeoo, for the pre%ious e9ample5

?ariale 3 'ame5 <earX1
?ariale 3 .ael5 3" Where did you hear aout StatPacY 6chec, all7
1^!nternet
2^1agaBine 6please specify75
3^Word of mouth
3^:ther 6please specify7
?ariale 2 'ame5 <earX2
?ariale 2 .ael5 3" Where did you hear aout StatPacY 6chec, all7
1^!nternet
2^1agaBine 6please specify75
3^Word of mouth
3^:ther 6please specify7
?ariale - 'ame5 <earX3
?ariale - .ael5 3" Where did you hear aout StatPacY 6chec, all7
1^!nternet
2^1agaBine 6please specify75
3^Word of mouth
3^:ther 6please specify7
?ariale ) 'ame5 <earX3
?ariale ) .ael5 3" Where did you hear aout StatPacY 6chec, all7
1^!nternet
2^1agaBine 6please specify75
1)> /eywords StatPac For Windows User's Manual
3^Word of mouth
3^:ther 6please specify7
?ariale ( 'ame5 <earX2X:ther
?ariale ( .ael 6optional75 1agaBine specified
?ariale 9 'ame5 <earX3X:ther
?ariale 9 .ael 6optional75 :ther specified

4he %ariales for the te9to9es are not specified in the StatPac script0 So the script
for this e9ample would e5

Chec,&o9 <earX1 - <earX3
&lan,.ine

4e9to9es can also e attached to any or all items in a horiBontal radio utton matri9"
<ere is an e9ample where two te9to9es are attached to all of the items in a radio
utton matri95


4he te9to9 %ariales immediately follow the last matri9 %ariale" 4he te9to9
%ariale names ha%e two parts separated y an underscore5 17 the name of the matri9
%ariale0 and 27 the word O:therO"
<ere is the codeoo, for the matri9 e9ample5

?ariale 1 'ame5 Cuality
?ariale 1 .ael5 Cuality5
1^?ery Food
2^Food
3^8air
3^Poor
2^?ery Poor
?ariale 2 'ame5 Ser%ice
?ariale 2 .ael5 Ser%ice5
1^?ery Food
2^Food
3^8air
StatPac For Windows User's Manual /eywords 1)1
3^Poor
2^?ery Poor
?ariale 3 'ame5 ?alue
?ariale 3 .ael5 ?alue5
1^?ery Food
2^Food
3^8air
3^Poor
2^?ery Poor
?ariale 3 'ame5 CualityX:ther
?ariale 2 'ame5 Ser%iceX:ther
?ariale - 'ame5 ?alueX:ther

4he %ariales for the te9to9es are not specified in the StatPac script0 So the script
for this e9ample would e5

Cuestion^Please rate our product on each of the following criteria" 8eel free
to add comments"
$adio Cuality - ?alue
&lan,.ine
:e2tBo2es for Groued 8aria"les
$ynta'# Te't!o' V' : Vy :or: Te't!o' 8parameters9 V' : Vy
1ore that one 4e9t&o9 can e inserted into a single frame y specifying a %ariale
range" 8ields with less than 30 characters will shown as a single line 4e9t&o9 and
longer fields will e shown as a multiple line te9t o9 with a scroll ar"
Parameters may e used to control the numer of lines in each 4e9t&o9 and the
location of the te9t" 4e9t may e placed to the left0 right0 top0 or ottom of the
4e9t&o9 using the .$4& parameters" 4he numer of lines for the 4e9t&o9 can also
e specified" 8or e9ample0 in the following command0 parameters were used to set
the te9t to the right and to create single-line 4e9t&o9es5
Cuestion^Please ran, each of the following y typing a 1 for the most
important0 2 for the second most important0 and so on"
4e9t&o9 6$17 4aste - Pac,age
1)& /eywords StatPac For Windows User's Manual
4here are two special %alidity chec,s that can e applied to grouped te9t o9es"
4hese chec,s can e added to the sur%ey y inserting a line in the script"
Constant $um Validity Cec/ for Te't!o'es
4he first is a constant sum0 where you want the responses to add up to a certain
%alue" #n e9ample would e OWhat percent of your total time do you spendKO and
you want the percents for each of the items to add to 100" 4he Sum command may
e inserted anywhere in the script" 4he format of the command is5 Sum 6the desired
sum7 ?9 G ?y" 4he desired sum is enclosed in parentheses0 and ?9 and ?y should e
the same as the 4e9t&o9 command" #n e9ample would e5
Cuestion^What percent of your total time do you spendK
4e9t&o9 Aating G Sleeping
Sum 61007 Aating G Sleeping
!n !nternet sur%eys it is %ery important not to frustrate respondents" Sometimes
respondentsD sums are off a little it 6e"g"0 they may add to 99 or 101 instead of 1007"
4he MA switch may e added to the end of the Sum command to specify the amount
of error that can e accepted efore the respondent will get an error message" 8or
e9ample0 if you were willing to accept sums that were etween 9( and 1020 the
commands would e5
Cuestion^What percent of your total time do you spendK
4e9t&o9 Aating G Sleeping
Sum 61007 Aating G Sleeping MA2
# special M4 switch may also e added to the end of the Sum command" 4his will add
a disaled 4e9t&o9 at the ottom laeled 4otal" !t will e updated dynamically as
respondents type numers into the other fields of the 4e9t&o9 Froup" 4his feature is
useful when you ha%e as,ed respondents to ma,e their responses total a gi%en
numer ecause it lets them see their current total in real time and ma,e adHustments
to their responses to achie%e the desired total"
Cuestion^1a,e the following items total Z100
4e9t&o9 8ood - !nsurance
Sum 61007 8ood - !nsurance M4
Jou may want to allow respondents to lea%e a series of constant sum 4e9t&o9es
lan," 4hat is0 respondents can lea%e the items lan, or they can fill in the items so
they add to a constant sum" 4he 1issing #llowed field in the codeoo, controls this
feature" When 1issing #llowed is chec,ed in the codeoo, for the first %ariale in
the series 6i"e"0 ?970 then the respondent can lea%e all the items lan, or they can fill
them in so they add to a constant sum" When 1issing #llowed is not chec,ed0 they
will e re;uired to ma,e the items add to a constant sum and will not ha%e the option
to lea%e them lan,"
StatPac For Windows User's Manual /eywords 1)1
Ran/ing Validity Cec/ for Te't!o'es
4he second type of %alidity chec, that can e applied to grouped te9t o9es is for
ran,ing ;uestions" $espondents are often as,ed to ran, items 6e"g"0 type a 1 for the
most important item0 a 2 for the ne9t most important item0 etc"7" 4he ran,ing %alidity
chec, will chec, for duplicate or missing ran,s" 4he $an, command may appear
anywhere in the script" 4he synta9 of the command is5 $an, 6numer of ran,s7 ?9 G
?y" 4he desired numer of ran,s is enclosed in parentheses0 and ?9 and ?y should
e the same as the 4e9t&o9 command" !f the parentheses and desired numer of
ran,s is omitted0 all items in the list will need to e ran,ed y the respondent"
#n e9ample where you as, respondents to ran, the top two items only would e5
Cuestion^$an, the two most important items5
4e9t&o9 Salary - &enefits
$an, 627 Salary - &enefits
Jou might want to allow respondents to lea%e a series of ran,ing 4e9t&o9es lan,"
4hat is0 respondents can lea%e the items lan, or they can ran, the items" 4he
1issing #llowed field in the codeoo, controls this feature" When 1issing #llowed
is chec,ed in the codeoo, for the first %ariale in the series 6i"e"0 ?970 then the
respondent can lea%e all the items lan, or they can ran, them as specified y the
$an, command" When 1issing #llowed is not chec,ed0 they will e re;uired to ran,
the items and will not ha%e the option to lea%e them lan,"
Slider for Sin%le or Multile 8aria"les
$ynta'# $lider V' : Vy :or: $lider 8parameters9 V' : Vy
4he Slider command is used to creates one or more sliders with a scaled ruler and a
handle that allows a respondent to %isually set a %alue y mo%ing the handle with the
mouse" 4he general appearance of a slider is5
.aeling for the slider scale is controlled either y %alue laels or specified
parameters" 4he slider will always show an adHacent 4e9t&o9 to allow the respondent
to manually type the response0
4he Slider command may e used as an alternati%e way to present psychometric
scaling items or a te9to9 re;uiring a numeric response" 4he slider will ne%er e
created as a default oHect" !f you want to use a slider0 you must modify the script y
changing a $adio or 4e9to9 command to a Slider command"
4he Slider is appropriate for .i,ert and semantic differential scales 6e"g" agree to
disagree0 %ery important to not important0 fa%or to oppose0 etc70 4hese scales are
usually 1-20 1-)0 or 1-10" #n e9ample might e5
Variable 2 Label: How important is the amendment?
1=Not Important
2=
1)) /eywords StatPac For Windows User's Manual
3=
4=
5=Very Important
4he default script would e5 $adio ?2
Jou would change the script to e5 Slider ?2

4he Slider is also appropriate for ;uestions where you as, the respondent to rate one
or more items5
8or e9ample5 Please rate your le%el of optimism aout the economy on a scale from
0 to 100" !n the codeoo,0 you would define the %ariale as '3 and set the %alue
laels to 0-100"
4he default script would e5 4e9t&o9 ?2
Jou would change the script to e5 Slider ?2
Parameters can e used for laeling the slider" 4he parameters are separated from
each other y commas" 4he format for the parameters is5
-,itleB :ow :abelB ?iddle :abelB 'ig :abel1
4he title will appear ao%e the scaled ruler" 4he low0 middle0 and high laels will e
ta,en from the %alue laels or can e specified or changed with the parameters"
A9amples might e5
A9ample5 Slider 6Percent7 ?9
6Create a slider for ?9 with a title of Percent0 and use the e9isting %alue laels to
lael the lowest0 middle0 and highest positions of the slider7"
A9ample5 Slider 6Percent0'egati%e0'eutral0Positi%e7 ?10
6Create a slider for ?10 with a title of Percent" .ael the left end of the slider
'egati%e0 the middle 'eutral0 and the right end Positi%e"
A9ample5 Slider 6 0.owest0 0<ighest7 ?10 - ?12
6Create three grouped sliders for ?100 ?110 and ?12" 4here will e no title and no
middle laeling" 4he left end of the slider will e laeled .owest and the right end
will e laeled <ighest" 6'ote that commas are used to indicate lael separation0
e%en if a lael is lan,7"
#dditional A9amples5
Suppose in your codeoo,0 you ha%e a %ariale to measure satisfaction on a 1 to 10
scale" 4he codeoo, is5
$ariable < :abelM 'ow satis!ied are you wit te program(
$ariable < @ormatM N0
$ariable < $alue :abelsM
14Not at all Satis!ied
04
34
>4
A4
;4
<4
/4
=4
154$ery Satis!ied
StatPac For Windows User's Manual /eywords 1)!
4he default script would e5
$adio 627 ?)
&lan,.ine
Jou would modify the default script to5
Slider ?)
&lan,.ine
4he slider would e created and the endpoints would e laeled 'ot at all Satisfied
and ?ery Satisfied" 4he slider would not ha%e a title and the middle point of the
slider would not e laeled"
4he following would add a title to the slider5
Slider 6.e%el of Satisfaction7 ?)
&lan,.ine
!n another e9ample0 suppose in your codeoo,0 you ha%e two %ariales to measure
respondentsD pessimismMoptimism for their country and their company" Jou plan to
use a scale of -10 to ]10" 4he codeoo, would e5
$ariable 1 :abelM ,e country were you live.
$ariable 1 @ormatM N3
$ariable 1 $alid CodesM -15 - .15
$ariable 0 :abelM ,e company were you work.
$ariable 0 @ormatM N3
$ariable 0 $alid CodesM -15 - .15
4he default script would e5
4e9t&o9 ?1
&lan,.ine
4e9t&o9 ?2
&lan,.ine
Jou would modify the default script to5
Cuestion^Please indicate your le%el of pessimism or
optimism y mo%ing the slider handle with your mouse"
Slider 6PessimismM:ptimism $ating0 ?ery Pessimistic0
'eutral0 ?ery :ptimistic7 ?1 - ?2
&lan,.ine
1)* /eywords StatPac For Windows User's Manual
'ote5 4he slider oHect uses acti%e scripting" @epending on your rowser security
settings0 you may e as,ed for permission to run the script when pre%iewing the
<41. page on your local computer" Permission is not re;uired to run the script after
it has een uploaded to a We hosting ser%er"
Chec#Bo2 for Multile Resonse 8aria"les
$ynta'# Cec/!o' V' : Vy :or: Cec/!o' 8<9 V' : Vy
4he Chec,&o9 is used for multiple response" When creating !nternet sur%eys with
multiple response %ariales0 there must e the same numer of %ariales as there are
%alue laels" 8urthermore0 all the %alue laels must e specified in each of the
%ariales" !n the following e9ample0 there would e 3 identical %ariales0 each with 3
%alue laels"
4he first form of the command will create all the Chec,&o9es in a single column"
4he second form of the command will create two columns of Chec,&o9es" !n
creating the default script0 if there are si9 or fewer %alue laels0 the default will e
one column" !f there are )-12 %alue laels0 the default will e two columns" 4he
Chec,&o9 is the only input method for multiple response"
Chec#"o2 for Grous of Multile Resonse
8aria"les <hori?ontal (atri2=
$ynta'# Cec/bo' V' : Vy
Sometimes you might ha%e se%eral multiple response %ariales that are etter shown
in a horiBontal matri9 8or e9ample0 suppose you ha%e the following ;uestion5
)at role did you play in selecting eac o! te !ollowingM -ceck all tat apply1
4he codeoo, loo,s li,e this5
$=aK1 :abelM ?agazine 6
14Getermine need
04Recommend
346pprove
$=aK0 :abelM ?agazine 6
14Getermine need
04Recommend
346pprove
$=aK3 :abelM ?agazine 6
14Getermine need
04Recommend
346pprove
StatPac For Windows User's Manual /eywords 1)-
$=bK1 :abelM ?agazine 7
14Getermine need
04Recommend
346pprove
$=bK0 :abelM ?agazine 7
14Getermine need
04Recommend
346pprove
$=bK3 :abelM ?agazine 7
14Getermine need
04Recommend
346pprove
$=cK1 :abelM Oter ?agazine
14Getermine need
04Recommend
346pprove
$=cK0 :abelM Oter ?agazine
14Getermine need
04Recommend
346pprove
$=cK3 :abelM Oter ?agazine
14Getermine need
04Recommend
346pprove
$=cKOter :abelM Oter
4he default script would treat each of the three groups of %ariales indi%idually0 and
would loo, li,e this5
A9ample5
Chec,&o9 C9aX1 - C9aX3
&lan,.ine
Chec,&o9 C9X1 - C9X3
&lan,.ine
Chec,&o9 C9cX1 - C9cX3

4o switch to a matri9 format0 change the script so that all %ariales are in the same
chec,o9 command"

Cuestion^What role did you play in selecting each of the following5
6chec, all that apply7
Chec,&o9 C9aX1 - C9cX3
1); /eywords StatPac For Windows User's Manual

Validity Cec/s for Cec/!o'es
4he #t.east command is used when you want to re;uire the respondent to chec, at
least 9 Chec,&o9es" 4he #t.east command may e inserted anywhere in the script"
4he format of the command is5 #t.east 6minimum numer of chec,s7 ?9 G ?y" 4he
minimum numer of chec,s is enclosed in parentheses0 and ?9 and ?y should e the
same as the Chec,&o9 command" #n e9ample would e5
Cuestion^Please select at least two of the following items"
Chec,&o9 ?20-?30
#t.east 627 ?20-?30
4he >p4o command is used when you want to limit the numer of Chec,&o9es a
respondent can chec," 4he >p4o command may e inserted anywhere in the script"
4he format of the command is5 >p4o 6ma9imum numer of chec,s7 ?9 G ?y" 4he
ma9imum numer of chec,s is enclosed in parentheses0 and ?9 and ?y should e
the same as the Chec,&o9 command" #n e9ample would e5
Cuestion^Please select up to three items"
Chec,&o9 ?20-?30
>p4o 637 ?20-?30
4he A9actly command is used when you want to re;uire the respondent to chec,
e9actly 9 Chec,&o9es" 4he A9actly command may e inserted anywhere in the
script" 4he format of the command is5 A9actly 6numer of chec,s7 ?9 G ?y" 4he
numer of chec,s is enclosed in parentheses0 and ?9 and ?y should e the same as
the Chec,&o9 command" #n e9ample would e5
Cuestion^8rom the following list0 please select your three fa%orite items"
Chec,&o9 ?20-?30
A9actly 637 ?20-?30
Jou might want to allow respondents to lea%e all the Chec,&o9es unchec,ed"
<owe%er0 if they chec, any o9es they must chec, the numer specified in the
#t.east or A9actly commands" 4he 1issing #llowed field in the codeoo, controls
this feature" When 1issing #llowed is chec,ed in the codeoo, for the first %ariale
in the series 6i"e"0 ?970 then the respondent can lea%e all the items unchec,ed" When
StatPac For Windows User's Manual /eywords 1)'
1issing #llowed is not chec,ed0 they will e re;uired to chec, at least the numer of
Chec,&o9es specified in the #t.east command or e9actly the numer of
Chec,&o9es specified in the A9actly command"
.istBo2
$ynta'# List!o' V'
4he .ist&o9 may e used as an alternati%e to radio uttons" 8unctionally0 the
.ist&o9 is identical to the radio uttons"
Uloadin% and $ownloadin% Files fro( the Ser,er
0uto :ransfer
,ploading a $urvey
4he easiest way to upload files to the !nternet is to use the #uto 4ransfer feature0 #ll
necessary files will e uploaded automatically" Changes to the Perl scripts are made
automatically"
$un #uto 4ransfer from the script window y clic,ing the Ser%er utton" $un #uto
4ransfer at other times y loading your codeoo, and then selecting Ser%er \ #uto
4ransfer"
!f We8older>$. 6a Primary setting in the script7 is set to your own ser%er0 #uto
4ransfer will e to and from that ser%er" !f We8older>$. specifies the StatPac
ser%er0 then #uto 4ransfer will e to and from your current folder on the StatPac
ser%er"
!f you change pri%ate folders on the StatPac ser%er0 #uto 4ransfer will automatically
adHust your <41. to reflect the new folder name" Jou do not ha%e to regenerate the
<41. or ma,e other changes to your script"
Do"nloading Responses
When you download responses using #uto 4ransfer they will e imported into
StatPac" StatPac assumes that your are always downloading the entire data set from
the eginning of the sur%ey" Aach time you download0 StatPac will o%erwrite the
e9isting data file with the newly downloaded data" 4hus0 there are only two
situations where you should delete a response file from the ser%er5 17 to delete the
test data file0 and 27 to delete the real data after you ha%e finished the sur%ey
analysis"
1!> /eywords StatPac For Windows User's Manual
Jou can edit the StatPac"ini file so that StatPac will prompt you on whether to
o%erwrite or append to the e9isting data file" Set @ataCuery ^ 1 to use the prompt"
F:P
84P 6file transfer protocol7 is the method used to transfer files to and from a remote
We ser%er" #uto 4ransfer also uses 84P 6it Hust happens Oehind the scenesO7"
!n order to use 84P0 you need to ,now the locations of the wwwroot folder and the
CF! folder on your ser%er"
4he wwwroot folder is where your We site pages are located" :n a >ni9M.inu9
ser%er this is proaly pulicXhtml" :n a Windows '4 or !!S ser%er0 it is proaly
wwwroot" When you login %ia 84P0 you might already e in the wwwroot folder0 or
you might ha%e to change to another sufolder 6e"g"0 pulicXhtml7"
4he CF! folder is almost always immediately elow the wwwroot folder and it is
usually called cgi-in or cgi"
4o run StatPacDs 84P program0 select Ser%er \ 84P \ server
4wo panes will e displayed" 4he top pane is your ser%er and the ottom pane is your
local computer" Jou can drag and drop files from one pane to the other" <ighlight
one or more files in one page and drag those to the other pane" 4he current folder is
shown in the te9t on top of the pane" 4hat is the folder where files will e dropped"
4o drop to a displayed folder0 first doule clic, on that folder to ma,e it the current
folder"
Jou can also right clic, on a file in either pane for additional options" @oule clic,
on a folder to change to that folder"
StatPac For Windows User's Manual /eywords 1!1
When using the StatPac ser%er0 you will only ha%e access to two ser%er folders0 17
the folder where your sur%eys reside0 and 27 the folder where your response files are
written" Select ?iew to change folders"
@emo users all share the folder name of guest and therefore will not ha%e 84P access
to the StatPac ser%er" When using your own ser%er0 you will ha%e complete 84P
na%igation"
,ploading a $urvey
4he We8older>$. setting specifies the folder where the sur%ey will reside" !f it is
Hust a >$. without a folder name0 then the sur%ey should e uploaded to the
wwwroot folder"
We8older>$.^http5MMyourser%er"com
<owe%er0 if it also specifies a folder name0 then the <41. files should e uploaded
to that folder"
We8older>$.^http5MMyourser%er"comMsur%ey
1!& /eywords StatPac For Windows User's Manual
While #uto 4ransfer creates the folder if it doesnDt e9ist0 you may ha%e to manually
create it if using 84P" !n the ser%er pane 6top70 change to the wwwroot folder 6if
necessary7" 4hen right clic, on the pane and select 'ew 8older"
#ll of the following files will e found in your current proHect folder"
4he following files need to e uploaded to the sur%ey folder"
Sur%ey'ame"htm 6.oader7
Sur%ey'ameX1"htm 61st page7
Sur%ey'ameX2"htm 62nd page7
Sur%ey'ameX3"htm 63rd page7
Sur%ey'ameX3"htm 64han,-you page7
#dditionally0 the <41.'ame command is used to name se%eral other files"
Sur%ey'ameXclosed"htm 6Sur%ey is closed page7
Sur%ey'ameXcoo,ieXcutter"htm 6@elete the coo,ie7
Sur%ey'ameXpopupX1"htm 61st popup window7
Sur%ey'ameXpopupX2"htm 62nd popup window7
closepopup"htm 6internal file to close popup windows7
Sur%ey'ameXhelpX1"htm 61st help window7
Sur%ey'ameXhelpX2"htm 62nd help window7
Sur%ey'ameXstart"htm 6.oader page for password protected sur%eys7
#ny graphics used 6including lue"gif and grey"gif7
4he following file needs to e uploaded to the cgi-in folder"
Sur%ey'ame"pl 6Processes data when respondent clic,s sumit7
#fter uploading the "pl file0 right clic, on it and set the permissions to )22"
!f you ha%e a password protected sur%ey0 you also must upload two additional files to
the cgi-in folder5
password"pl 6Controls the login7
Sur%ey'ame"te9t 6@ata ase containing one or more passwords7
#fter uploading password"pl0 right clic, on it and set the permissions to )22"
Do"nloading Responses
$esponses will always e sa%ed in the cgi-in folder and ha%e a" asc e9tension"
!n the ser%er pane 6top70 na%igate to the cgi-in folder0 drag the Su%ey'ame"asc file
to your current proHect folder"
While #uto 4ransfer automatically imports the data0 when you use 84P0 you ha%e to
manually import the "asc file to create the data file" Close the 84P window and select
@ata \ !mport"
StatPac For Windows User's Manual /eywords 1!1
1!) /eywords StatPac For Windows User's Manual
Su((ary of the Most Co((on Scrit Co((ands
4his is a summary of the most commonly use commands in the Sur%ey Creation
section of the script"
(ommands to display te1t
<eading^4e9t @isplays %ery large te9t
4itle^4e9t @isplays large te9t
4e9t^4e9t @isplays normal te9t
8ootnote^4e9t Sets the footnote te9t
!nstructions^4e9t @isplays te9t using instructions color scheme
Cuestion^4e9t @isplays te9t using ;uestion color scheme
(ommands for spacin/ and pa/ination
&lan,.ine !nserts lan, line
'ewPage &egins a new sur%ey page
(ommands to insert ima/es and links
!mage^8ilename6s7 !nsert one or more images
.in,>$.^>$. Sets the >$. for the ne9t hyperlin,
.in,4e9t^4e9t Sets the te9t for the ne9t lin, on the sur%ey
.in, !nserts the hyperlin, in the sur%ey
(ommands for help and popup windows
<elp.in,4e9t^4e9t Sets the te9t for the help lin, on the sur%ey
<elp4e9t^4e9t Sets the te9t that will appear in the popup help window
<elp8ile'ame^8ilename Sets the name of an e9isting popup help window file
<elpWindow !nserts the help window hyperlin, into the sur%ey
PopupStart &egin a popup window
PopupAnd And a popup window
(ommands to create ob;ects
$adio ?9 !nserts radio uttons for %ariale 9
$adio ?9-?y !nserts horiBontal radio uttons for %ariales 9-y 6matri9
format7
@rop@own ?9 !nserts a dropdown o9 for %ariale 9
4e9t&o9 ?9 !nserts a single or multiple line te9t o9 for %ariale 9
6depending on the field width of the %ariale7
4e9t&o9 ?9-?y !nserts te9t o9es for %ariales 9-y into a single frame
Slider ?9-?y !nserts sliders for %ariales 9-y into a single frame
.ist&o9 ?9 !nserts a list o9 for %ariale 9
StatPac For Windows User's Manual /eywords 1!!
+(ail .ist Mana%e(ent
3,er,iew
StatPac contains a complete e-mail list management system" Select0 Amail0 .ist
1anagement to access these features"
For(at of an +(ail 0ddress File
#n e-mail list is simply an #SC!! te9t file of e-mail addresses" 4he file may
optionally contain other information" Amail address lists may use a "lst0 "t9t0 or "cs%
e9tension for the file name" When StatPac creates or writes an e-mail list0 it will
always use a "lst e9tension" 4hese are ta delimited #SC!! te9t files" !f necessary for
compatiility with other software pac,ages0 "lst files may e renamed to "t9t"
4he file should contain one record 6line7 for each person that will e sent an e-mail"
!n its simplest form0 this is Hust a file of e-mail addresses 6one per line7" #n address
file with three names might loo, li,e this5
da%idPstatpac"com
HohnXsmithPmindspring"com
1!* /eywords StatPac For Windows User's Manual
fred2(9Paol"com
:ptionally0 the te9t file can also contain a uni;ue !@ numer or identifier" !f
included0 it should e separated from the email address y a comma or a ta" !n other
words0 it is a comma or ta delimited file with two %ariales" 4he first %ariale is the
email address and the second %ariale is a uni;ue !@" 4he uni;ue !@ can contain
numers and letters0 ut not special characters li,e ;uestion mar,s0 pound symols0
or spaces" 4he !@ numer will always e the second %ariale in an e-mail address
line"
da%idPstatpac"com0912)(3
HohnXsmithPmindspring"com0)2)-
fred2(9Paol"com032-(0-3
#dditional information may also e included in the e-mail address file" Aach
additional field is separated from the other %ariales y a comma or ta" #ll records
in the e-mail address file must contain the same numer of %ariales" :ne reason you
might ha%e additional %ariales in an e-mail address file is to e ale to customiBe
the e-mails" 8or e9ample0 instead of Q<ello CustomerR0 you could egin your e-mail
with Q<ello @a%idR" #nother reason you might ha%e additional information is to e
ale to merge that data with the completed sur%eys" 4hat is0 you can Hoin data from
an e9isting data ase with the answers to a sur%ey"
#dditional information in an e-mail address file always egins with the third
%ariale" 4he first %ariale is the email address0 the second %ariale is the !@ numer0
and the additional information egins is the third %ariale" 8or e9ample0 this e-mail
address file contains the first and last names0 and these could e used in the ody of
the e-mail"
da%idPstatpac"com0912)(30@a%id0Walonic,
HohnXsmithPmindspring"com0)2)-0Iohn0Smith
fred2(9Paol"com032-(0-308red0Iones
!n all of the ao%e e9amples0 the first record in the e-mail address file contained
actual data" 1any other software programs write a header row when creating an
delimited te9t file 6i"e"0 an e-mail address file7" 4hat is0 the first record in the e-mail
address file contains %ariale names instead of data" #n e9ample would e5
Amail0!@08irst0.ast
da%idPstatpac"com0912)(30@a%id0Walonic,
HohnXsmithPmindspring"com0)2)-0Iohn0Smith
fred2(9Paol"com032-(0-308red0Iones

StatPac can e set to use or not use a header row for all e-mail address lists" Adit
StatPac"ini and set Amail.ist<eader$ow ^ 1 to use a header row or
Amail.ist<eader$ow ^ 0 to not use a header row"
StatPac For Windows User's Manual /eywords 1!-
+2tract +(ail 0ddresses
!t is often desirale to e ale to e9tract e-mail addresses from a file or from the
clipoard" 4his is especially helpful if you are uilding an e-mail list" !t can e used
to capture ounced e-mail addresses that you want to eliminate from an address file"
4he file you want to e9tract e-mail addresses from can e in any te9t format" StatPac
will find and e9tract the addresses and write them to an e-mail address file 6"lst
e9tension7" 4he e9tract program will not e9tract e-mail addresses from compressed
data ase formats such as #ccess" Jou should e9port the data to a te9t file efore
attempting to e9tract the e-mail addresses"
4here are two prolems you might encounter when e9tracting e-mail addresses" 4he
first is that you might e9tract e-mail addresses that are generated y a ser%er" 8or
e9ample0 postmasterPsomedomain"com is proaly not an address youNd want to
add to an e-mail address file" Jour own domain is proaly also an address you want
to e9clude" 4he reHection filter may e used to omit those addressesMdomains that you
do not want to e added to an e-mail address file e%en when they e9ist in the
document you are e9tracting from" 4he reHection filter should contain one word per
line" !f that word is part of an e-mail address0 it will not e captured y the program"
$eHection filter te9t is not case sensiti%e"
4he other prolem you might encounter is that many ser%ers issue a long numerical
e-mail address as part of the header for a ounced or reHected e-mail" 4hese might
loo, li,e this5 1)3-(3-)3((3-393))3Psomedomain"com" Jou can set the ma9imum
consecuti%e digits parameter to filter out long numerical e-mail addresses generated
y a ser%er"
.ist Statistics
4he .ist Statistics program can e used to count the numer of e-mail addresses in a
file and tell when the last update was made to that file"

1!; /eywords StatPac For Windows User's Manual
Doin :wo or More .ists
4here will e many situations where you ha%e gathered e-mail addresses from
multiple sources and stored them in separate files" >se this program to comine lists
from multiple files and create a new file consisting of addresses from all the lists"
Select the files to e Hoined using the &rowse &utton0 or type them one per line"
Specify a new e-mail address file that will contain the addresses from all the files"
4his program does not chec, for the e9istence of duplicate e-mail addresses" !t only
comines the files into one ig list" 4herefore0 after comining multiple e-mail files0
it is ad%isale to run the e-mail management program to clean0 sort0 and eliminate
duplicates"
StatPac For Windows User's Manual /eywords 1!'
Slit a .ist
4here are many situations where you might want to split a list5 17 Jou ha%e a %ery
large list and you want to e-mail to only a specific numer of respondents 27" Jou
ha%e a %ery large list and you want to split it up to ma,e it more manageale0 37 Jou
want to randomly select winners for a drawing0 etc"
StatPac can split a list using three different methods5 se;uential0 systematic and
random" Which method you use depends upon your application"
When the se;uential method is selected0 a new file will e created and e-mail
addresses will e written to the new file until a certain numer of addresses ha%e
een written" 4hen another new file will e created and the ne9t x addresses will e
written to that file" Aach of the new e-mail address files will contain the same
numer of records as the pre%ious file6s70 e9cept the last one that is written"
4he 8ile 'ame Prefi9 for Sulists is the eginning of the file name for the new
smaller lists" 4he actual file names for the sulists will end with X10 X20 X30 etc"
1*> /eywords StatPac For Windows User's Manual
Systematic selection is often called 'th 'ame Selection" A%ery 'th name will e
selected from an e-mail list file and written to a new e-mail list file" :ptionally0 you
can also write the non-selected addresses to a different e-mail address file"
Systematic selection is fre;uently used to draw a sample for a sur%ey from a larger
list" !t is considered to e as good as random selection pro%ided that the order of the
e-mail list is not related to the focus of the study"
4he third method of splitting a list is the random selection method" $ecords will e
randomly selected from the e-mail list" Jou only need to specify the numer of
random records that will e drawn from the e-mail address file" :ptionally0 you may
also specify a file name for the records that are not randomly selected"
!t should e noted that this method in%ol%es true random selection" 4hus0 running the
program twice on the same list will not select the same e-mail addresses"
StatPac For Windows User's Manual /eywords 1*1
CleanC SortC and +li(inate $ulicates
1any e-mail lists are dynamic0 in that you are continually updating0 adding0 and
deleting e-mail addresses from the list" 4he Clean0 Sort0 and Aliminate @uplicates
program can e used to maintain a clean list" !n%alid and duplicate e-mail addresses
will e eliminated"
0dd I$ 7u("ers to a .ist
!@ numers are used to ,eep trac, of those who respond to your sur%ey" Jou can
conduct we sur%eys without !@ numers0 ut there will e no way to determine who
responded and who didnDt" !f you are planning on sending e-mailing follow-up
in%itations to those who did not respond to the first in%itation0 then !@ numers are
essential" !@ numers are used to lin, the names in an e-mail address file to the
sur%ey respondents"
!f you already ha%e an !@ numer in an e9isting data ase0 it can e used pro%ided
that it does not contain any special characters0 li,e ;uestion mar,s0 pound symols0
or spaces" !t must e the second %ariale in the e-mail address file 6which is ta or
comma delimited #SC!! te9t7"
4he #dd !@ 'umers to a .ist program may e used to create random !@ numers
and add them to an e9isting e-mail address list" 4he !@ numers will e inserted as
the second %ariale in the list" !f there is already more than one %ariale in the list0
the !@ numer will e inserted as %ariale two and all the other %ariales will e
mo%ed to the right" 8or e9ample0 suppose you ha%e this e-mail list consisting of three
%ariales 6e-mail address0 company0 and city7"
da%idPstatpac"com0 StatPac !nc"0 1inneapolis
1*& /eywords StatPac For Windows User's Manual
HohnXsmithPmindspring"com0 #cme Widgets Co"0 Chicago
#fter adding !@ numers0 the list would appear li,e this5
da%idPstatpac"com0 21)-9(310 StatPac !nc"0 1inneapolis
HohnXsmithPmindspring"com0 (932)9120 #cme Widgets Co"0 Chicago
Create a .ist of 7onresonders
!n a typical we sur%ey0 you might send out hundreds 6or thousands7 of e-mail
in%itations to ta,e the sur%ey" Within a few days0 you will recei%e aout 90` of the
total response that youDll get" #fter a wee, has passed0 you can sustantially oost the
response rate y sending a reminder e-mail to those who ha%e not yet responded" 4he
purpose of this program is to create an e-mail list consisting of Hust those people who
ha%e not yet responded to the sur%ey"
4he process is straight forward0 although there are se%eral steps in%ol%ed"
17 #dd the Respondent*G %ariale to the codeoo," When you create an !nternet
sur%ey0 StatPac will as, if you want to add the special %ariales to the codeoo, if
they ha%e not already een added" Fenerally0 you would answer yes"
27 $un the e-mail management program to add !@ numers to the e-mail address file"
37 Send e-mail in%itations using StatPacDs ul, e-mail program"
37 #ppro9imately one wee, later0 download and import the !nternet response file
6#uto 4ransfer7"
27 $un this program and create an e-mail list of nonresponders" 4his list will e
identical to the original e-mail list e9cept it will only contain the e-mail addresses of
those who ha%e not yet responded to the sur%ey"
-7 Send a reminder e-mail to the nonresponders using StatPacDs ul, e-mail program"
4he only two parameters in the ul, e-mail program you will need to change are the
name of the e-mail address file 6which will e the nonresponders file instead of the
original file7 and the file containing the ody te9t 6which will presumale e
different than the original in%itation7"
StatPac For Windows User's Manual /eywords 1*1
)7 #fter another wee,0 re-download the !nternet response file" When you download
an !nternet response file from your ser%er0 it is not deleted from your ser%er" 4hus0
when you re-download the !nternet response file0 you should o%erwrite the e9isting
data file rather than appending to it"
(7 #nalyBe the data"
Su"tract 3ne .ist Fro( 0nother .ist
!t is %ery common for e-mail addresses to e wrong" People change accounts and e-
mail addresses fre;uently" 4yping errors in e-mail addresses are aundant" !t would
not e unusual for 10`-20` of the addresses in an e-mail address file to e in%alid"
When you send ul, e-mail to the names in an e-mail address file0 in%alid addresses
will ounce ac, to you" 4hese ounced e-mails can e captured with the e-mail
management program to e9tract e-mail addresses" #fter you ha%e an e-mail list of the
ounced e-mails0 you will proaly want to remo%e them from the e-mail address
file that was used to send the in%itations" 4his is especially true if you want to use the
e-mail list again in the future" Jou can sutract 6i"e"0 remo%e7 the ounced e-mail
addresses from the e-mail file using this program"
1*) /eywords StatPac For Windows User's Manual
Mer%e an +(ail .ist into a StatPac $ata File
When you recei%e responses to an !nternet sur%ey0 the file will not contain the e-mail
address of the respondent" !n fact0 there is no way to capture the-mail addresses of
people ta,ing the sur%ey unless the sur%ey itself specifically as,s for their e-mail
address as one of the %ariales"
<owe%er0 if you used $espondent !@ numers0 youDll e ale to match respondentDs
with their entry in the e-mail address file" 4he e-mail address file will contain the
respondentDs e-mail address0 !@ numer0 and possily other data ase information"
4he e-mail list management program will merge the e-mail list information into the
StatPac data file" Jou should wait until the sur%ey is closed efore using this
program" !n other words0 do not run this program if you are e9pecting additional
response"
Send +(ail In,itations
Amail is a popular way of in%iting potential respondents the opportunity of
participating in an !nternet sur%ey" 4he Send Amail !n%itations program will allow
you to send a large numer of customiBed e-mails at high speed"
&efore eginning0 you need two files" 4he first is a list of e-mail addresses" 4he
second is an #SC!! te9t file containing the ody te9t of the e-mail" >sually0 you
would create this file with 'otepad or 1SWord"
Usin% an I$ 7u("er to :rac# Resonses
:ne important feature of the e-mail program is that it lets you serialiBe the e-mails
with a uni;ue !@ numer that can e used to trac, respondents"
!n the ody of the e-mail0 there will e a lin, to the sur%ey on the we site" 4his lin,
will contain the respondentDs uni;ue !@ numer0 so when they clic, on the lin,0 it
will ta,e them to the sur%ey we page 6and StatPac will ,now the !@ numer of the
StatPac For Windows User's Manual /eywords 1*!
person who is responding7" 1oreo%er0 their !@ numer will e stored with their
responses on your ser%er" 4he !@ numer may contain alpha characters as well as
numers" 4his feature can e used to match information from an e9isting data ase
with respondentsD answers" !n the following e9ample of a lin, with an !@ numer0
notice the >$. has a Yid^1(2- suffi9 and the !@ numer is 1(2-"
http5MMwww"statpac"comMonline-sur%eysMmultipage-sur%ey"htmYid^1(2-
+(ail 0ddress File
!t is ?A$J important that you create a short test file of one to three e-mail
addressees" #ll the e-mail addresses in the test file should e your own e-mail
address" 4his will allow you to send test e-mails to yourself to chec, their
appearance efore you send to the real respondents" 'ame this file something li,e
O4est.ist"lstO so you will immediately ,now what it is y loo,ing at its name" Jou
can also use the 4est 1ode y typing your e-mail address into the te9t o9 so that
instead of sending to the specified e-mail list0 only one e-mail will e sent to you" &e
sure to completely erase your e-mail address from the te9t o9 when you are ready to
send to the entire list"
Body :e2t File
4he ody te9t file is the actual e-mail message you will e sending to potential
respondents" !t may e plain te9t or <41." Jou can use 'otepad or 1SWord to
create a plain te9t ody file0 or 1S8rontPage of 1SWord to create an <41. email"
8or a plain te9t email0 StatPac can include attachments to the email" !f it is an <41.
email0 StatPac will automatically include the graphics in the ody of the email" When
using an <41. ody file with graphics0 the Osrc^O tag in the <41. source should
point to the image on your local computer 6not the internet7"
?ariale sustitution can e used in the ody te9t file to include the >$. of the
sur%ey" !f the address file is a StatPac data file0 then you can also use %ariale
sustitution for any %ariale in the codeoo," Sustitution is specified using 6b and
b7 to egin and end the %ariale name"
<ere is an e9ample of a ody te9t file that uses three sustitution %ariales" #ssume
%ariale 3 in the e-mail address file is O8irstX'ameO and %ariale 3 in the e-mail
address file is O.astX'ameO" !n this e9ample0 %ariale sustitution is eing used to
customiBe the greeting" !t also uses 6burlb7 to specify where the lin, should e placed
in the e-mail" 4he 6b3b7 and 6b3b7 can e specified in the ody te9t ecause they are
%ariales in the e-mail address file"
<ello 6b3b7 6b3b70
We are doing a sur%ey and would li,e your participation"
Please clic, here to ta,e the sur%ey
6burlb7
4han, you"
1** /eywords StatPac For Windows User's Manual
$egards0
@a%id Walonic,
StatPac !nc"
http5MMwww"statpac"com
6)127 332-22-1
!f the email is <41. then the lin, to the >$. is still 6burlb7" 8or e9ample0 the
source in the <41. might loo, li,e this5
[a href^O6burlb7O\Please clic, here to ta,e the sur%ey[Ma\
!f the e-mail address file contains a header row of %ariale names0 then the names in
the header row can e used for %ariale sustitution instead of the %ariale numer"
8or e9ample0 the greeting could e written as5
<ello 6b8irstX'ameb7 6b.astX'ameb70
When creating a plain te9t ody file0 we recommend limiting all lines to a ma9imum
of -0 characters and inserting a hard return at the end of each line" 64his means to
press UAnterV after each -0-character line when you are typing the ody te9t7" While
not necessary0 it will produce a more uniform appearance in the %ariety of e-mail
readers that potential respondents might e using"
Sendin% +(ail
#fter you ha%e created the e-mail address and ody te9t files0 youDll e ready to test
your wor," Select Amail0 Send Amail to egin show the ul, e-mail sending screen"
StatPac For Windows User's Manual /eywords 1*-
4he 6pparent Hmail 6ddress o! Sender should contain the e-mail address that you
want to appear as the sender of the e-mails" Similarly0 the 6pparent Company Name
o! Sender should e set to the name you want to appear as the sender" SubNect is what
will appear on the suHect line of the e-mails"
!f you want the Reply ,o Hmail 6ddress to e different than the 6pparent Hmail
6ddress o! Sender0 then enter a different e-mail address" !f it is the same0 then lea%e
this field lan," 4he Reply ,o Hmail 6ddress is the address that the respondent will
see if they clic, the reply utton in their e-mail program"
>se the rowse utton to select the 7ody ,ext @ile" 4his can e a plain te9t file or an
<41. file"
>se the rowse utton to select your O4est.ist"t9tO file for the Hmail 6ddress @ile"
#lways egin with your test list until you are satisfied with the appearance of the e-
mails" 4hen change Hmail 6ddress @ile to your actual list of e-mail addresses" !t is
generally a good idea to limit the siBe of your Hmail 6ddress @iles to less than fi%e
thousand addresses0 as some ser%ers stop responding to e9tended S14P sending"
!f sending a plain te9t ody file0 you can also specify 6ttacments. 1ultiple
attachments may e specified y clic,ing the #ttachments rowse utton multiple
times or y holding down the control ,ey to select multiple attachments"
1*; /eywords StatPac For Windows User's Manual
@ull OR: to Survey is the >$. of the sur%ey on your we site" !t should e the fully
;ualified path to your sur%ey0 eginning with http5MM #n e9ample would e5
http5MMwww"statpac"comMonline-sur%eysMmultipage-sur%ey"htm !f you are using
password protection0 the lin, might e http5MMwww"statpac"comMcgi-inMmultipage-
sur%ey"pl @o not inad%ertently end the >$. with a period" 4he >$. is case
sensiti%e0 so type it e9actly as it is on your we site" @o not add a ;uery string to the
>$." 4hat is0 do not include a ;uestion mar, in the >$." 4he ;uery string is
reser%ed for the respondent !@ numer and will e added automatically y the
software during the send"
!f your e-mail list has !@ numers 6as the second %ariale70 chec, the >se !@
'umers in >$. o9" 4he !@ numer will ecome the ;uery string during the
sending of the e-mails" !f you do not chec, the o90 no !@ numers will e used in
the e-mails and a random !@ numer will e assigned when a respondent clic,s on
the lin,"
Hmail S?,% Server is the mail ser%er you will e using" !t will e something li,e
mail"yourdomain"com" Jour !SP will e ale to tell you what to specify here"
#lternati%ely0 you can chec, the S14P settings in your own e-mail program and set
StatPac to the same thing"
!f your ser%er re;uires authentication to send emails0 and chec, 6utentication o9
type your >sername and Password" Some ser%ers re;uire QP:P-efore-S14PR
protocol" !f the StatPacNs ul, email program wonNt send0 this is the most li,ely
reason" 4o fi9 this prolem0 chec, %O% 7e!ore S?,% and type the name of your
P:P3 mail ser%er 6often the same as your S14P ser%er7" When QP:P-efore-S14PR
protocol is used0 !SPs usually limit sessions to aout half hour0 so email address list
siBes should e limited to what can e sent in that time"
S?,% %ort is the port used y your S14P ser%er" 4he standard is port 220 ut
occasionally !SPs will use a different port numer" @o not change this unless your
!SP re;uires the use of a different port"
Jou must e logged onto your ser%er efore you egin sending the e-mails" Clic,
Start to egin sending the e-mails"
When your are satisfied with the e-mail appearance 6y sending se%eral to yourself70
change the Amail #ddress 8ile to your real file and clic, Start to egin sending the e-
mails" 4he status window will show the progress"
4he speed at which the e-mails are sent will depend on your e-mail S14P ser%er"
StatPac can easily send three or more e-mails per second" 4his may e too fast for
some ser%ers and you may ha%e to slow StatPac down a it" 4o slow StatPac down0
edit the StatPac"ini file 6select 8ile M :pen M System @efaults 8ile7 and change
Amail@elay from 0 to a delay %alue 6in thousands of a second7" 8or e9ample0 if you
set Amail@elay ^ 1000 then there will e a 1M10 of a second delay etween each
email"
While sending e-mails0 you can temporarily pause y clic,ing the Pause utton" !f
you clic, the $esume utton0 the e-mails will continue to e sent from the point
where you paused" !f you close the Send Amail !n%itations window0 ma,e note of the
record numer so you will e ale to continue where you left off"
Some e-mails might fail to e sent ecause of either ad addresses or the ser%er
ecomes temporarily usy" 8ailed e-mails will e sa%ed in a new a Hmail 6ddress
@ile with a Q-@6*:HGR suffi9 as part of the file name" Jou may attempt to resend
these y changing the Hmail 6ddress @ile to the failed list"
4hree words of caution are in order"
StatPac For Windows User's Manual /eywords 1*'
1" StatPacDs Send Amail !n%itations program is a general purpose ul, e-mailer that
can send thousands of e-mails per hour" !f you use it to send SP#1 to people0 there
is a good chance that someone will contact your !SP0 and the most li,ely result is that
your !SP will cancel your account" Please donDt use this program to send SP#1"
2" Some !SP ser%ers are set to automatically detect and refuse ul, sending of emails"
4hey detect multiple emails eing originated y the same S14P ser%er connection"
4wo StatPac settings can e used to minimiBe the possiility of eing flagged as
SP#1 y your !SP" &oth are in the StatPac"ini file 6select 8ile M :pen M System
@efaults 8ile7" !f Amail@elay is set to a %alue higher than Bero0 a new S14P
connection will e estalished for each email" !f Amail.imitPerConnection is set to a
%alue higher than 00 the software will close and reopen the S14P connect at that
limit" Jou can set either or oth %alues"
3" Some hosting ser%ices ha%e a ;uota on the numer of emails you can send in a
day" 4hey do this in order to pre%ent spammers from ausing their S14P mail
ser%er" !f your !SP has such a policy0 they will usually increase your ;uota y a
simple re;uest stating the reason why you need a higher ;uota"
1-> /eywords StatPac For Windows User's Manual
Procedure Files
3,er,iew
# procedure in StatPac refers to a set of commands that perform one or more tas,s" #
procedure may specify a single analysis or se%eral analyses of the same type"
Procedures can also contain commands to perform transformations and write
sufiles"
4he commands to perform an analysis 6or series of analyses70 can e stored in a file
called a Oprocedure fileO" 4his means that you can easily recall a pre%iously e9ecuted
procedure0 and ma,e changes to it without ha%ing to retype the commands" 4he
procedure file is automatically stored on dis, with the study name and a "P$:
e9tension" Jou can also store procedure files using different names" Procedure files
can e sa%ed0 loaded and merged with other procedure files"
Clic, on the #nalysis &utton to start the procedure file editor" 4he commands to run
analyses are typed into the te9t window on the left of the screen" 4he ?ariale .ist
window 6on the right of the screen7 will show the names of the %ariales in the
current study"
Mouse and /ey"oard Functions
4he procedure file editor is similar to any te9t editor0 although it has numerous uilt
in features to simplify editing procedure files"
%ouse Functions
Clic, 1o%e cursor to point of clic,
Shift]Clic, A9tend selection to the point of clic,"
@oule-clic, Selects the word that is clic,ed on 6when no %ariales are
selected in the ?ariale .ist window7W otherwise0 transfers
selected %ariales from the ?ariale .ist window to the te9t"
@rag Select te9t from point of utton down to point where utton
is released"
@oule-clic, and drag A9tend the selection from word to word"
4riple-clic, and drag A9tend the selection from row to row"
7eyboard Functions
<:1A 1o%e cursor to the eginning of the line"
A'@ 1o%e cursor to the end of the line"
6.eft #rrow7 1o%e cursor one character to the left"
6$ight #rrow7 1o%e cursor one character to the right"
6>p #rrow7 1o%e cursor one line up"
6@own #rrow7 1o%e cursor one line down"
C4$.]6.eft #rrow7 1o%e cursor to the eginning of the current word"
C4$.]6$ight #rrow7 1o%e cursor to the eginning of the ne9t word"
C4$.]<:1A 1o%e cursor to start of te9t"
C4$.]A'@ 1o%e cursor to end of te9t"
C4$.]' 1o%e cursor to ne9t procedure
C4$.]P 1o%e cursor to pre%ious procedure
@A. @elete selected te9t"
C4$.]* or S<!84]@A. Copy selected te9t to the Clipoard and delete the
selection"
C4$.]C or C4$.]!'S Copy selected te9t to the clipoard"
C4$.]? or S<!84]!'S !nsert te9t from the clipoard"
C4$.]6&ac,space7 @elete pre%ious word"
$esi%nin% 0nalyses
StatPac uses an easy programming language for designing procedures" !t also has a
large selection of automatic features to simplify the process"
8or e9ample0 a simple procedure might e5
S4>@J S>$?AJ
8$AC>A'C!AS $#CA
""
1-& /eywords StatPac For Windows User's Manual
4his procedure consists of a single tas, using a study called S>$?AJ 6i"e"0 a
codeoo, called S>$?AJ"C:@ and a data file called S>$?AJ"@#47" 4he
procedure says to use the study called S>$?AJ0 and perform a fre;uency analysis of
the $#CA %ariale" 'otice that a procedure always ends with two dots 6periods7"
# more comple9 procedure would e5
S4>@J S>$?AJ
8$AC>A'C!AS $#CA0 !'C:1A0 SA*
""
4his procedure contains three tas,s0 each using the same study 6and data file7" !f you
e9ecute this procedure0 the program will first do a fre;uency analysis of $#CA0 then
of !'C:1A0 and finally of SA*" 4here is no limit to the numer of tas,s that can e
specified in a single procedure"
# procedure file may also contain many different procedures" 4he only re;uirement
is that the procedures e separated from each other y two dots" 8or e9ample0 the
following commands specify three procedures5
S4>@J S>$?AJ
8$AC>A'C!AS $#CA
""
C$:SS4#&S $#CA &J #FA
""
8$AC>A'C!AS #FA0 !'C:1A0 SA*0 P$A8A$A'CA
""
4he first procedure contains one tas,0 the second one tas,0 and the third four tas,s"
4hese commands would actually run si9 analyses" 'otice that the study name is only
specified once 6in the first procedure7" Suse;uent procedures will automatically use
the same study and data file" >sually0 the S4>@J command is used only once"
4he use of the S4>@J ,eyword in the first procedure is mandatory since it defines
the codeoo, and data file names for all the following procedures" <owe%er0 the
S4>@J ,eyword may also e used in suse;uent procedures" !f the ,eyword
S4>@J is specified in another procedure0 that procedure0 and the procedures
following it0 will use the new codeoo, and data file"
4he following commands contain two procedures0 each ha%ing two tas,s" 4he
S4>@J command is used in oth procedures" 4his means that the first procedure
will analyBe data from one study 6S>$?AJ17 and the second procedure will analyBe
data from another study 6S>$?AJ27"
S4>@J S>$?AJ1
8$AC>A'C!AS #FA0 P$A8A$A'CA
""
S4>@J S>$?AJ2
8$AC>A'C!AS #FA0 P$A8A$A'CA
""
4he S4>@J ,eyword not only specifies the name of the codeoo, to e analyBed0
ut it also implicitly specifies the name of the data file" !n most cases0 the codeoo,
and the data file name are the same 6e9cept for the e9tensions7" # codeoo, called
S>$?AJ would usually use a data file called S>$?AJ"@#4"
StatPac For Windows User's Manual /eywords 1-1
Sometimes0 the codeoo, name and data file names will not e the same" 8or
e9ample0 if the same study had een performed each year0 you might ha%e se%eral
data files with the same codeoo, name0 ut with different data file names" 4he
@#4# ,eyword may e used to analyBe different data files 6all using a common
codeoo, name7"
S4>@J S>$?AJ
@#4# @#4#-9)
8$AC>A'C!AS #FA0 #44!4>@A
""
@#4# @#4#-9(
8$AC>A'C!AS #FA0 #44!4>@A
""
!n the ao%e e9ample0 each procedure uses the @#4# ,eyword to specify what data
file should e analyBed y that procedure" &oth procedures will use the codeoo,
called S>$?AJ"C:@" A%en though the S4>@J command is only specified in the
first procedure0 suse;uent procedures will use the same codeoo, name unless
another S4>@J ,eyword is used to change it" 4he first procedure will read data
from a file called @#4#-9)"@#4 and the second procedure will read from a data file
called @#4#-9("@#4"
Whene%er you use the S4>@J or @#4# commands0 the last specification will
remain in effect until changed y another S4>@J or @#4# command" 8or e9ample0
all three of the following procedures will use a codeoo, called :P!'!:'"C:@ and
a data file called 1#$EA4"@#4"
S4>@J :P!'!:'
@#4# 1#$EA4
C$:SS4#&S !'C:1A W!4< P$A8A$A'CA
""
&#''A$S #FA $#CA !'C:1A W!4< P$A8A$A'CA
""
@ASC$!P4!?A #FA
""
When you use the S4>@J command to specify a new codeoo,0 the data file will e
changed to the new codeoo, name automatically" !n other words0 using the S4>@J
command o%errides all pre%ious S4>@J and @#4# command specifications" !n the
following e9ample0 the second procedure will use a data file called S4>@J-2"@#40
e%en though the @#4# command was used in the first procedure to specify a data
file called SA'S:$J"@#4"
S4>@J S4>@J-1
@#4# SA'S:$J
44AS4 P$A4AS4 W!4< P:S44AS4
""
S4>@J S4>@J-2
.!S4 $A1#$ES
""
1-) /eywords StatPac For Windows User's Manual
Continuation .ines
!f a command is too long to fit on one line 6e"g"0 a long %ariale list70 StatPac will
automatically indent suse;uent lines" Jou can simply continue typing and the word-
wrap feature will ta,e care the indentation for you" Jou can also use an e9plicit
6hard7 return to egin the ne9t line" # rea, etween lines should always occur
etween words or etween sets of parentheses" # continuation line is denoted y
indenting at least one character 6typing at least one space at the start of the line7" 4he
following procedure will perform a fre;uency analysis on eight %ariales" Since the
second line is indented0 StatPac will interpret it as a continuation of the pre%ious line"
S4>@J F:?4
8$AC>A'C!AS #FA $#CA SA* !'C:1A S4#4>S
C#4AF:$J <:>S!'F 4$#'SP:$4#4!:'
""
Sometimes0 continuation lines can e used to ma,e a procedure easier to read" 4he
following procedure will perform descripti%e statistics on three %ariales" &ecause
the %ariale names are indented0 they will e interpreted as a continuation of the
@ASC$!P4!?A line"
S4>@J &>@FA4
@ASC$!P4!?A !'C:1A
A*PA'SA
P$:8!4
""
Co((ent .ines
Comment lines may e included in a procedure file" 4heir purpose is to allow you to
imed notes within a procedure file" 4hey are especially helpful when re%iewing a
procedure file that you ha%e not used for a long time" Comment lines will e ignored
when performing an analysis" # comment line egins with an apostrophe0 or the
word $A1" 4here are no restrictions on the te9t that may e included in a comment
line" Comment lines may also use continuation lines" 8or e9ample0 the following
procedure contains two comment lines" 4he second comment also has a continuation
line5
$A1 4his procedure has two comment lines
S4>@J S>$?AJ12
D 4his procedure will only use the first 20 records
for the analysis ecause the SA.AC4 command is used
SA.AC4 1-20
8$AC>A'C!AS #44!4>@A
""
Comment lines can e useful when deugging a procedure that contains an un,nown
error" &y selecti%ely ma,ing each line a comment 6adding an apostrophe to the
eginning of the line70 you can essentially eliminate that line as a possile cause of
the error"
StatPac For Windows User's Manual /eywords 1-!
Jou can also turn entire loc,s of te9t in a procedure file into comment lines" .ines
eginning with Mb can e used to start a comment loc,0 and lines eginning with bM
can e used to end a comment loc," #ll the lines etween the start and end
comments loc,s will e ignored during processing"
8 7u("ers
1ost of the e9amples in this manual use %ariale names" <owe%er0 it is important to
note that either %ariale names or ? numers may e used interchangealy" 8or
e9ample0 if #FA is %ariale twel%e in a study0 the following two commands would
produce identical results5
@ASC$!P4!?AS #FA
@ASC$!P4!?AS ?12
/eywords
@esigning a procedure with StatPac consists of typing a series of commands" With
the e9ception of comment lines and continuation lines0 each line in the procedure
will egin with a ,eyword or analysis command"
Eeywords are used to modify an analysis" 4hey may e used in a procedure to
change laeling and perform transformations" !n fact0 they are used for e%erything
e9cept the actual selection of an analysis type" 4he S4>@J and @#4# commands
are ,eywords" # listing of the ,eywords can e displayed y selecting ?iew0 Synta9
<elp" 4he ,eyword menu will appear in a window"
A sin/le procedure can contain many keyword commands% but only one analysis
command. !n the following e9ample0 the analysis output will ha%e a page heading
and title ecause of the inclusion of two ,eywords in the procedure"
S4>@J SJS4A1
<A#@!'F #cme $esearch0 !nc" - System #nalysis Study
4!4.A Crosstas etween Shift and Afficiency $ating
C$:SS4#&S S<!84 &J $#4!'F
""
0nalyses
While many ,eywords can e used in a procedure0 only one analysis command can
e specified" # listing of the analysis commands can e displayed y selecting ?iew0
Synta9 <elp" 4he help window will appear"
8aria"le .ist
4he ?ariale .ist window enales you to %iew and select %ariales for an analysis" !t
can e displayed y selecting ?iew0 ?ariale .ist" 4he width of the ?ariale .ist
1-* /eywords StatPac For Windows User's Manual
window can e adHusted y dragging the ar that separates the procedure file te9t
from the ?ariale .ist window"
:ne con%enient feature of the ?ariale .ist window is the aility to transfer %ariale
names to the procedure te9t" 4o select a %ariale0 highlight it in the ?ariale .ist
window" 4o select multiple %ariales0 hold down the shift or control ,ey while
clic,ing on the desired %ariales in the ?ariale .ist window"
4o transfer selected %ariales from the ?ariale .ist window to the te9t of the
procedure file0 first select the desired %ariales in the ?ariale .ist window" 4hen
doule clic, in the procedure file where you want the %ariale names to appear" 4he
highlighted %ariales in the ?ariale .ist window will e copied to the procedure file
te9t0 and the %ariale6s7 will e deselected in the ?ariale .ist window"
8aria"le $etail
4he ?ariale @etail window lets you see detailed information aout any %ariale0 or
change the information for a %ariale" 4o display the ?ariale @etail window0 select
?iew0 ?ariale @etail" Jou can also doule-clic, on a %ariale in the ?ariale .ist
window to e%o,e the ?ariale @etail window
#ll information for a %ariale can e changed e9cept its format" Changes made in the
?ariale @etail window 6e"g"0 re%ised laeling7 will e sa%ed in the codeoo,0 and
therefore will appear in the analyses"
StatPac For Windows User's Manual /eywords 1--
4he current %ariale displayed in the ?ariale @etail window can e changed y
using the drop-down %ariale selection or y clic,ing on the desired %ariale in the
?ariale .ist window"
4he ?ariale @etail window can e dragged to any location on the screen" Press and
hold the left mouse utton anywhere on the gray orders of the window" @rag the
?ariale @etail window to the desired location and release the mouse utton to drop
the window at that location"
Jou can hide the ?ariale @etail window y selecting ?iew0 ?ariale @etail"
#lternati%ely0 clic, on the * in the top right corner of the ?ariale @etail window"
Find :e2t
>se the 8ind @ialog window to search for specific te9t in the procedure file or the
results" Select Adit0 8ind 6or use the Ctrl 8 shortcut7 to display the 8ind @ialog
window"
4o egin a search0 type the search te9t and clic, on the 8ind 'e9t &utton" #fter a
search has een started and a match has een found0 you can continue the search y
clic,ing on the 8ind 'e9t &utton 6or y pressing the U83V shortcut7" >pper and lower
case differences will e ignored in the search"
1-; /eywords StatPac For Windows User's Manual
Relace :e2t
>se the $eplace @ialog window to replace specified te9t in the procedure file or
results" Select Adit0 $eplace 6or use the Ctrl < shortcut7 to display the $eplace
@ialog window" #lternati%ely0 you can clic, the $eplace &utton from the 8ind
@ialog window"
>pper and lower case differences will e ignored when finding te9t" <owe%er0
replaced te9t will use the e9act te9t typed into the $eplace With window"
3tions
:ptions are used to control the analysis" :ptions allow you to modify the defaults for
an analysisW that is0 they allow you to customiBe the analysis parameters themsel%es"
#nalysis options may e changed temporarily or permanently" When changed
permanently0 the current procedure and all future procedures will use the new
defaults" When changed temporarily0 only the current procedure will use the new
options"
Some options are gloal and apply to all analyses" :ther options are specific to the
type of analyses eing performed" !f you select :ptions when there is no procedure
file or when the cursor is in a procedure that does not specify an analysis0 only the
gloal options will e displayed" 4hey allow you to set the pitch 6point siBe7 for the
report0 the page margins and paper orientation0 the ne9t page numer to e printed0
Boom factor0 and weighting"
4he margins are e9pressed in inches" 4he paper orientation may e set to :$^P
6portrait7 or :$^. 6landscape7" 4he Boom factor is any easy way to reduce the siBe
of a tale so it will fit on one page" 'ormally0 L8^100 and the printouts will e
displayed at 100` their normal siBe" Setting L8^(0 would display the tales at (0`
of their normal siBe0 so more columns would e ale to fit on a page" 4he ecology
option may e used to sa%e paper" When AC^J and you are sa%ing the output to a
atch file0 all page rea,s will e e9cluded" #t the conclusion of the atch run0 select
System0 Current &atch 8ile0 to print the file" When running interacti%ely or atch to
printer0 AC^J will only suppress page rea,s within each tas, or procedure"
4he W4 6weighting7 option lets you weight the data ased on the %alue of another
%ariale0 and the 8C 6fractional counts7 option controls whether the reports will show
StatPac For Windows User's Manual /eywords 1-'
integer or fractional counts" 4hey currently apply to all analyses in the &asic
Statistics 1odule"
4o %iew the options for an analysis0 mo%e the cursor to the procedure where the
analysis command is specified and select :ptions" !f no analysis is specified in the
current procedure0 only the gloal options will e shown"
4he options for each analysis are different" !f the current procedure contains an
options line that changes the default %alues0 the modified %alues will e displayed in
yellow" #ny errors in the option line will e displayed in red" 4o change the option
temporarily0 simply type the new %alue for the option" 4o ma,e a permanent option
change0 type the new %alue and add an e9clamation point as a suffi9" 8or e9ample0
typing J changes an option to yes for the current procedure only" 4yping J_ changes
the option permanently so that all future analyses will use the default of J"
4utomatic $election of Non:%issing Data Option
!n all analyses in the &asic Statistics 1odule an option can e used to select cases if
the desired data in not lan," 4he #S option is gloal and will apply to all analyses"
8or e9ample0 if you specify #S^J_ in the first procedure0 it will apply to all
suse;uent procedures until the #S^'_ option is specified"
4he #S option is a simple way to replace !8-4<A'-SA.AC4 command when you
want to include only records where the %ariale eing analyBed is not missing"
8or e9ample0 you you wanted to do a fre;uency analysis of %ariale 90 and only
include records where ?9 was not lan,0 you could do it with any of these three
procedures" #ll three would produce identical results"
1;> /eywords StatPac For Windows User's Manual
!8 ?9 [\ RR 4<A' SA.AC4
8$AC>A'C!AS ?9
""
!8 ?9 ^ RR 4<A' $AIAC4
8$AC>A'C!AS ?9
""
8$AC>A'C!AS ?9
:P4!:'S #S^J
""
4he ad%antage of the #S option ecomes clear when your %ariale list contains
multiple %ariales" !f you had a %ariale list0 such as5
8$AC>A'C!AS ?9 ?11 ?12
Jou would ha%e to run each one as a separate procedure in order to select the non-
missing data for each %ariale5
!8 ?9 [\ RR 4<A' SA.AC4
8$AC>A'C!AS ?9
""
!8 ?11 [\ RR 4<A' SA.AC4
8$AC>A'C!AS ?11
""
!8 ?12 [\ RR 4<A' SA.AC4
8$AC>A'C!AS ?12
""
'ow you can use the #S option to accomplish the same thing5
8$AC>A'C!AS ?9 ?11 ?12
:P4!:'S #S^J
""
When doing this for fre;uencies0 the P& option will no longer ha%e an effect ecause
there will e no missing cases"
4he #S option is especially useful when using the .!S4 command to list comments"
4ypically0 you would use an !8-4<A'-SA.AC4 command to list only records that
made a comment5
!8 Comment [\ RR 4<A' SA.AC4
.!S4 C:11A'4
:P4!:'S .&^0 &.^J
""
4he same thing can e accomplished with the #S optrion5
StatPac For Windows User's Manual /eywords 1;1
.!S4 C:11A'4
:P4!:'S #S^J .&^0 &.^J
""
When creating &anner tales0 the #S option applies to the stu %ariale or stu
%ariale list 6the ones down the side of the page7" !f will select only records where
the stu %ariale is non-missing"
#ll three of the the following procedures would select the same data5
!8 Stu?ar [\ RR 4<A' SA.AC4
&#''A$S Stu?ar &J 4otal &anner?ars
""
!8 Stu?ar ^ RR 4<A' $AIAC4
&#''A$S Stu?ar &J 4otal &anner?ars
""
&#''A$S Stu?ar &J 4otal &anner?ars
:P4!:'S #S^J
""
-eigt and Fractional Counts Options
4he W4 option lets you apply non-integer 6fractional7 weighting to procedures" !t is
used when the sample differs from ,nown population parameters" 4o apply case
weighting0 you must first create a %ariale that contains a weight"
4he following e9ample computes weights for each of three groups and sa%es the
weight for suse;uent analyses" 4he CaseWeight %ariale will ecome the last
%ariale in the study"
S4>@J SAF1A'4
'AW 6')7 OCaseWeightO
!8 F$:>P ^ 1 4<A' C:1P>4A CaseWeight ^ 0"31)2
!8 F$:>P ^ 2 4<A' C:1P>4A CaseWeight ^ 0"()32
!8 F$:>P ^ 3 4<A' C:1P>4A CaseWeight ^ 1"09-3
S#?A
""
Suse;uent procedures could then apply weights to the analyses using the W4
option" Parentheses are re;uired around the %ariale name" Since an e9clamation
point is used as a suffi90 weighting will ecome the default for all suse;uent
analyses" !n this e9ample0 oth the fre;uencies and descripti%e statistics procedures
would weight the data" !f the e9clamation point had een e9cluded0 weighting would
only e used in the fre;uencies procedure"
S4>@J SAF1A'4
8$AC ?1-?10
:P4!:'S W4^6CaseWeight7_
""
@ASC ?11
""
1;& /eywords StatPac For Windows User's Manual
>nli,e other options0 the W4 option 6with a _ suffi97 only applies to the current
StatPac session" !f you ;uit StatPac and restart it0 the W4 option will e set to '
6'one7" 4his is done to pre%ent a potentially serious mista,e" 8or e9ample0 suppose
you run a procedure file with weighting and then end StatPac" 4he ne9t day you run
StatPac and egin processing a different procedure file" !f the W4 option was
persistent0 weighting might inad%ertently e applied to the new procedure file when
you didnDt intend it to eK and worse0 you might not realiBe it"
Jou can turn weighting on and off y using W4^6?ariale'ame7 and W4^'" !n the
following e9ample0 weighting is applied to the first0 second procedures0 ut not the
third and fourth procedures"
S4>@J 1J$ASA#$C<
4!4.A Weighted 8re;uencies for5 6/7
8$AC ?1
:P4!:'S W4^6Weight?ariale7_
""
4!4.A Weighted @escripti%e Statistics for5 6/7
@ASC ?2
""
4!4.A >nweighted 8re;uencies for5 6/7
8$AC ?1
:P4!:'S W4^'_
""
4!4.A >nweighted @escripti%e Statistics for5 6/7
@ASC ?2
""
4he 8C 6fractional counts7 option my e set to J or '" !t sets whether the 'Ds
6counts7 in the reports will e shown as integers or decimal %alues" 4he 8C option
only applies when weighting is used" !n unweighted data0 the counts will always e
integer %alues 6whole numers7"
Weights are easily calculated as the desired percentage di%ided y the oser%ed
percentage 6or the desired count di%ided y the oser%ed count7" 8or e9ample0
suppose you ,now that the population has 22` males and 32` females" 4his is
called a known population parameter" Jour sur%ey sample0 howe%er0 has 30` males
and -0` females" !f the responses to other %ariales were different for males and
females0 your reports might present a distorted estimate of the population" Weighting
would e used to eliminate the gender sampling error" 4he weight for males would
e 22M30 and the weight for females would e 32M-0" !n the following e9ample0 the
first procedure calculates a FA'@A$WA!F<4 %ariale and sa%es it" 4he second
procedure uses the W4 option to weight the data ased on the FA'@A$WA!F<4
%ariale"
'AW 6'27 OFA'@A$WA!F<4O
!8 SA*^O1O 4<A' C:1P>4A FA'@A$WA!F<4 ^ 22M30
!8 SA*^O8O 4<A' C:1P>4A FA'@A$WA!F<4 ^ 32M-0
S#?A
""
8$AC S:1A?#$!#&.A
:P4!:'S W4^6FA'@A$WA!F<47
StatPac For Windows User's Manual /eywords 1;1
""
Important $ser Tip
4he first few times you run StatPac for Windows0 e9periment with the options to find
the %alues that produce the report formatting you want" $ather than setting these
options in each procedure0 use the e9clamation point suffi9 to ma,e them permanent"
#fter running a few procedures0 youDll ha%e configured the default formats for
StatPac to produce the reports you most often use"
.oadC Sa,eC and Mer%e Procedure Files
4he 8ile selection of the menu allows you to load0 merge0 and sa%e procedure files"
4o open a new procedure file0 select 8ile0 :pen0 or clic, the :pen &utton" 4o sa%e
the current te9t in a procedure file0 select 8ile0 Sa%e0 or clic, the Sa%e &utton"
4o egin a new procedure file0 select 8ile0 :pen0 and change the 8iles of 4ype to
codeoo,s" Select the codeoo, and clic, :E" 4he S4>@J command will e
inserted as the first line of the procedure"
Procedure files are always sa%ed with a "pro e9tension" While we recommend using
StatPac for creating and editing procedure files0 they are plain #SC!! te9t0 and may
e edited with any te9t editor 6such as notepad7"
!f loading a new file0 and the current procedure file te9t has changed0 StatPac will
chec, to see if you want to sa%e the current te9t efore aandoning it and loading the
new file" 'ote that anytime you run a procedure% the entire procedure file will be
saved before the procedure is run" 4hus0 if you load a new file immediately after
running a procedure0 it is not necessary to sa%e the current procedure file efore
loading the new procedure file ecause it will already ha%e een sa%ed"
4o merge the te9t from a procedure file pre%iously stored on dis, into the current te9t
window0 position the cursor where you want the te9t to e loaded and then select
8ile0 1erge" 4he te9t will e inserted ahead of the cursor"
Print a Procedure File
4he current procedure file can e printed y selecting 8ile0 Print" Select the
procedures you want to print and clic, :E"
!f you choose to specify procedures0 you must type the procedure numers that you
want to e printed" Procedure numers can e separated from each other y commas
or spaces" # dash can e used to indicate a range of procedures" 8or e9ample0 the
following would print procedures 10 20 (0 90 10 and 12
10 20 (-100 12
Run a Procedure File
Clic, on the $un utton to e9ecute the commands in the te9t window 6i"e"0 to run the
analysis7" StatPac will gi%e you the option to specify which procedures should e
1;) /eywords StatPac For Windows User's Manual
run0 the operating mode0 disposition of the output0 name of a file to store the output0
and the starting page numer for the output"
#fter setting these parameters0 clic, :E to run the analyses"
Procedure8s9 To Run
4he OProcedure6s7 4o $un may e an indi%idual procedure or range of procedures"
4he default will e the procedure where the cursor was located when the $un utton
was clic,ed" !f you highlight te9t efore clic,ing the $un utton0 the default
procedure6s7 will e all the procedures that contained highlighted te9t" # range of
procedures may e specified with a dash" 4o run procedures one through ten0 you
would type 1-10 in the Procedure6s7 to $un field" 4o run from procedure 2 to the last
procedure0 you would type 2- in the Procedure6s7 to run field" 4o run a single
procedure0 simply type the procedure numer"
%ode
4he 1ode selection allows you to set the analysis to operate interacti%ely0 atch0 or
in the test mode" When interacti%e is selected0 all output will first e displayed on the
screen efore eing sent to its final disposition 6printer or file7" Jou will e ale to
%iew0 edit0 print0 and sa%e the outputW and you must manually tell StatPac when to go
on to the ne9t tas, or procedure"
4he &atch mode is similar to the !nteracti%e mode" 4he difference is that the program
will automatically go on to the ne9t tas, or procedure after showing the results for 3
seconds" @uring the 3-second display time0 you can freeBe the screen and %iew the
output of the current tas, in more detail" Jou can then continue or cancel the atch
run"
4he 4est mode will simply chec, the synta9 of the selected procedures without
actually running them"
When you egin to run an analysis0 StatPac will first chec, the synta9 of your
procedure6s7" 4he synta9 chec,er will catch all maHor errors" !t is0 howe%er0 only a
synta9 chec,er" !t can tell if the synta9 is correct0 not if the commands will do what
you want" !t also cannot chec, for data dependent errors0 since these can only e
disco%ered through actual data processing" !f a synta9 error is disco%ered0 correct the
error and re-run the procedure"
StatPac For Windows User's Manual /eywords 1;!
Output
4he :utput selection will e displayed when processing in the &atch mode" !t refers
to the final disposition of the output 6i"e"0 where you want the results of the analysis
to e sent7" Jou may send the output to the printer or a file" When you choose to send
the output to a file0 you will also e ale to enter a file name for the output" 4he
output will e sa%ed in $ich 4e9t 8ormat"
!n the &atch mode0 the results of all analyses will first e displayed on the screen for
3 seconds" !f you do nothing0 the results will then e sent to the :utput 6printer or
file7" <owe%er0 if you temporarily freeBe the output y pressing the Pause utton0
you will ha%e the choice whether to sa%e or print the results"
$tarting Page Number
4he Starting Page 'umer is especially useful when processing in the &atch mode"
StatPac will automatically increment the page numers with each tas," !f you stop a
atch run0 or decide to rerun a particular tas,0 you will need to manually set the
starting page for the ne9t run"
!f the Starting Page 'umer is left lan,0 no page numers will e printed on the
output"
4he page numer will e placed on the page in the location specified in the header or
footer template"
No Delay
When running in the atch mode0 the results will normally e shown on the screen
for a few seconds efore eing printed or written to file" 4his gi%es you time to
re%iew the results efore printing or sa%ing them" When the 'o @elay o9 is
chec,ed0 the results will e immediately sent to the output de%ice"
Results +ditor
#fter StatPac has finished processing an analysis0 the results will e displayed" 6!n a
atch run0 the results will only e displayed for 3 seconds unless you freeBe the
program with the Pause utton in the results editor7" 4he results editor will allow you
to e9amine and edit the results efore printing or sa%ing them"
#ll files sa%ed or loaded with the $esults Aditor will e in $ich 4e9t 8ormat with a
"rtf e9tension" 4hese files can also e loaded with your word processor"
Grahics
Fraphics are a%ailale when performing fre;uencies0 crosstas0 descripti%e statistics0
rea,downs0 and correlation analyses" # colorful graphics utton will e shown on
the $esults Aditor tool ar for these analyses" Clic,ing the utton will let you select
and edit the graphs"
1;* /eywords StatPac For Windows User's Manual
4o modify the appearance of a graph0 select Adit0 .egend = .aels" 4his will gi%e
you the opportunity to change any of the te9t on the graph0 including legend
information 6if there is one7" 4he legend information can e sa%ed y selecting the
Sa%e #s @efault chec, o9" 8uture graphs with legends will then use the new
settings"
StatPac For Windows User's Manual /eywords 1;-
4he actual creation of the graphs happens while the analysis is eing performed" Jou
can control the ,inds of graphs that will e created and the laeling methods y
selecting Adit0 Creation Settings" 4his option is also a%ailale in the #nalysis Aditor
y selecting System0 Fraph Creation Settings"
1;; /eywords StatPac For Windows User's Manual
#fter you are satisfied with the appearance of the graph0 you can do se%eral things
with it5
1" Print the graph immediately y selecting 8ile0 Print"
2" #dd the graph to the ne9t page of the results y selecting Adit0 Copy Fraph 4o
$eport" When you e9it the Fraphics Aditor and return to the $esults Aditor0 the graph
will ha%e een added to the end of the current results"
3" Sa%e the graph as a file 6"Hpg0 "mp0 or "wmf7 y selecting 8ile0 Sa%e Fraph
!mage"
3" Sa%e the graph in the clipoard y selecting Adit0 Copy Fraph 4o Clipoard"
2" Create a ta delimited file of the laels and data used to create the graph 6not the
graph itself7 y selecting 8ile0 Sa%e @elimited 8ile"
Jou can also right clic, on the graph itself to ma,e changes to the graph"
:a"le of Contents
When processing in the atch mode a tale of contents will e created if page
numering is used" #fter the atch processing is finished0 you can display and print
the tale of contents y selecting System0 Current 4ale of Contents"
StatPac For Windows User's Manual /eywords 1;'
4he 4itle ,eyword in each procedure of the atch run will e used to create the entry
in the tale of contents" !f a procedure had no title0 the tale of contents will contain
the analysis command line in the procedure"
4he current tale of contents will e erased and a new tale of contents will e
started when the starting page is set to 1 in the $un dialog" Setting the starting page
numer to a %alue greater than 1 will add to the e9isting tale of contents"
#fter completing a atch run0 select System0 Current 4ale of Contents" 4ype [Ctrl
#\ to select the te9t and [Ctrl C\ to copy it to the clipoard" 4hen open the atch
file in 1SWord and paste the contents of the clipoard to the new page using [Ctrl
?\" Jour document will then egin with a tale of contents"
Jou can also create a tale of contents that will ha%e hyperlin,s into the atch file
document0 so when you hold down the control ,ey and clic, on an entry in the tale
of contents0 it will display the referenced page" 8irst0 in the System @efaults change
<yperlin,4:C ^ 0 to <yperlin,4:C ^1 and sa%e" 4hen0 when you run a atch file
with page numers0 the tale of contents will ha%e hyperlin,s" #fter completing a
atch file run0 select SystemMCurrent 4ale of Contents" 4his will open a Word
document containing the tale of contents" Copy the entire document to the clipoard
6Ctrl #\[Ctrl C\7" 4hen open the atch file document" 4he cursor will e positioned
at the eginning of the document" Select AditMPaste Special and select 8ormatted
4e9t 6$487 instead of Hust Paste" 4he hyperlin,ed tale of contents will e inserted at
the eginning of the document"
0uto(atically Generated :oline Procedures
# ,opline contains asic analyses for all the %ariales in a study" !t consists of
fre;uencies0 descripti%e statistics0 and listings of open-ended comments"
When you clic, on the #nalysis utton0 select System0 #utomatic 4opline"
4he report generated y an automatic ,opline will pro%ide a good summary of the
data" !f youDre Hust after OanswersO and not particularly concerned aout laeling0 the
automatic ,opline procedures can e run Oas isO" !f you want a Ocamera-readyO
report0 youDll want to edit the procedures 6especially the 4ile and :ptions
commands7" 1ost users will %iew the automatically generated 4opline a solid
foundation rather than and end-product"
1'> /eywords StatPac For Windows User's Manual
/eywords
/eyword Inde2
4hese ,eywords may e used in a procedure to control laeling and perform
transformations"
#%erage Compute Count @ata
@ifference @ummy 8ootnote <eading
!f"""4hen"""Alse .aels .ag .et
1erge 'ew 'ormaliBe :ptions
$ecode $em $un Sa%e
SelectM$eHect Sort Stac, Study
Sum 4itle Weight Write
/eywords 3,er,iew
Eeywords are used in a procedure for e%erything e9cept selecting the analysis type"
4hese words 6commands7 are recogniBed y StatPac when used at the eginning of a
line" 4hey are used for study and data specifications0 laeling output0 and data file
transformations"
Some ,eywords will e used often 6e"g"0 S4>@J0 <A#@!'F0 4!4.A and
:P4!:'S7" :ther ,eywords will e used only rarely 6e"g"0 .#F0 @!88A$A'CA0
S>17" 1ost analyses can e designed using only a few ,eywords"
#ll procedure files must use the S4>@J ,eyword once in the first procedure" 4he
use of all other ,eywords is optional and depends upon the situation"
4he following is the list of ,eywords supported y StatPac
S4>@J0 @#4#0 S#?A0 W$!4A0 1A$FA0 <A#@!'F0 4!4.A0 8::4':4A0
.#&A.S0 :P4!:'S0 SA.AC40 $AIAC40 'AW0 .A40 S4#CE0 $AC:@A0
C:1P>4A0 C:>'40 S>10 #?A$#FA0 !8-4<A'-A.SA0 S:$40 WA!F<40
':$1#.!LA0 .#F0 @!88A$A'CA0 @>11J0 and $>'"
Cate%ories of /eywords
Eeywords can e logically di%ided into four categories" 4he categories are5
1" Commands for selecting0 loading and sa%ing files"
S4>@J
@#4#
S#?A
W$!4A
1A$FA
2" Commands for laeling"
<A#@!'F
4!4.A
8::4':4A
.#&A.S
3" Commands for setting analysis options"
:P4!:'S
3" Commands for creating new %ariales and transforming data"
SA.AC4
$AIAC4
'AW
.A4
S4#CE
$AC:@A
C:1P>4A
C:>'4
S>1
#?A$#FA
!8""4<A'""A.SA
S:$4
WA!F<4
':$1#.!LA
.#F
@!88A$A'CA
@>11J
$>'
/eyword 5el
1ost ,eywords re;uire one or more parameters" 4hese parameters are go%erned y
the synta9 re;uirements of the ,eyword" Aach ,eyword has its own synta9" 4o
;uic,ly display help for a ,eyword0 select <elp0 Eeywords0 and clic, on the desired
,eyword to display the help information"
1'& /eywords StatPac For Windows User's Manual
While a procedure can contain only one analysis specification command0 it can ha%e
many ,eyword commands" Eeywords are often used in comination with each other
to form more comple9 procedures" !n the following procedure0 the first four lines are
,eyword commands and the fifth line is an analysis specification command"
S4>@J #44!4>@AS
<A#@!'F StatPac #nalysis of the #ttitude Sur%ey
4!4.A :%erall #ttitude &ro,en @own &y Se9
:P4!:'S P8^'$C4 F$^J
C$:SS4#&S S>11#$J &J SA*
""
3rderin% /eywords
Eeywords can e used in comination with each other to perform %irtually any
selection or transformation" 4he order of the ,eywords in a procedure may or may
not e important depending on the indi%idual procedure"
Fenerally0 it is important to consider the order of ,eywords whene%er a procedure
in%ol%es more than one transformation" !f the results of one transformation are
dependent upon another transformation0 then proper order is imperati%e"
8or e9ample0 in the following procedure three C:1P>4A ,eywords are used to
calculate %alues for three different %ariales" Since all of the computations are
independent from each other 6one doesnDt depend on the results of another one70 the
order of the ,eyword commands doesnDt ma,e any difference" 4he following
C:1P>4A commands could e specified in any order"
S4>@J SC!A'CA
C:1P>4A ?#$X1 ^ 0
C:1P>4A ?#$X2 ^ 1
C:1P>4A ?#$X3 ^ 2
S#?A
""
When one ,eyword command depends upon the result of a different ,eyword
command0 the order of the commands is important" !n the following e9ample0 each
C:1P>4A command uses the result of a pre%ious command to perform its
computation" 4herefore0 the order of the commands must e correctly specified"
S4>@J SC!A'CA
C:1P>4A ?#$X1 ^ 0
C:1P>4A ?#$X2 ^ ?#$X1 ] 1
C:1P>4A ?#$X3 ^ ?#$X2 ] 1
S#?A
""
StatPac For Windows User's Manual /eywords 1'1
Glo"al and :e(orary /eywords
:nly three ,eywords are gloal 6S4>@J0 @#4# and <A#@!'F7" :nce used0
suse;uent procedures will use the same study0 data file andMor page heading" 4hese
parameters can e changed in any procedure and suse;uent procedures will use the
new parameters"
#ll other ,eywords are temporary and apply only to the procedure in which they
appear" !n the following e9ample0 the first procedure will use only the first 1000
records for the descripti%e statistics analysis" 4he second procedure0 howe%er0 will
use all the records ecause the SA.AC4 ,eyword only applies to the procedure in
which it appears" 4he S4>@J and <A#@!'F 6gloal ,eywords7 will e the same
for oth procedures"
S4>@J C$:PS
<A#@!'F Summary Statistics
SA.AC4 1-1000
@ASC$!P4!?A J!A.@
""
@ASC$!P4!?A C:S4
""
Per(anently Chan%e a Code"oo# and $ata File
4wo ,eywords 6S#?A and W$!4A7 allow you to ma,e permanent changes to studies
and data files" #ny transformations in a procedure will ecome permanent if the
S#?A command is included anywhere in that procedure" Permanent means that the
study information and data file are irretrievable changed to reflect the
transformations re;uested y the ,eywords" !f you had a study of 100000 records0 the
following procedure file might result in a hu/e loss of data and e de%astating_
S4>@J 1#$EA4
SA.AC4 1001-2000
S#?A
""
'ote that the inclusion of the S#?A ,eyword ma,es the selection permanent" 4hat is0
after e9ecuting this procedure0 the data file will contain only 1000 records" #ll other
records will ha%e een eliminated y the SA.AC4 command" 4he implications of
this are o%ious" *on<t use the SA=+ command unless you have a backup of the
study information and data file"
We recommend that all procedure files egin y sa%ing duplicates of the codeoo,
and data0 and suse;uent procedures use the duplicates 6lea%ing the original
codeoo, and data intact7" !f the pre%ious e9ample were changed to the following0
the 1#$EA4 codeoo, and data file would not e affected y the use of the S#?A
command in the second procedure"
S4>@J 1#$EA4
W$!4A 1#$EA41
""
1') /eywords StatPac For Windows User's Manual
S4>@J 1#$EA41
SA.AC4 1001-2000
S#?A
""
Bac#u a Study
We stron/ly recommend ma,ing a ac,up of all study information and data files
efore eginning any analyses" !f you ha%e a ac,up0 you will always e :E and you
wonDt ha%e to worry aout sa%ing erroneous transformations" !f you donDt ha%e a
ac,up0 and you accidentally sa%e an unwanted transformation0 nothing can e done
to reco%er the data"
1a,ing a ac,up of a study is easy""" you Hust ha%e to rememer to do it" Please0 if
you plan to use the S#?A command0 ma,e a ac,up first"
4here are three asic ways to ac,up StatPac information5
1" >se Windows A9plorer to copy the desired files to another folder or dri%e"
2" Select @ata0 &ac,up to create a ac,up folder and copy all files from the current
data folder to the new folder
3" $un a procedure using the W$!4A command to sa%e a copy of the codeoo, and
data file"
4o ma,e a ac,up of a codeoo, and data file0 you need to run a two-line procedure"
4he first line specifies the codeoo, name 6and its associated data file7 and the
second line uses the W$!4A command to specify the study name for the ac,up
files" 8or e9ample0 if we ha%e a study called S>$?AJ0 the following procedure will
create a ac,up called &-S>$?AJ" 4he ac,up will contain oth the study
information and the data file"
S4>@J S>$?AJ
W$!4A &-S>$?AJ
""
4he W$!4A command is used to specify the name of the ac,up files" 4he name
may include a dri%e or path" 8or e9ample0 if you wanted to store a ac,up copy on a
dis,ette in the # dri%e0 you would run the following procedure"
S4>@J S>$?AJ
W$!4A #5S&-S>$?AJ
""
4he pre%ious e9amples would not create a ac,up of the data entry form" 4he form
itself is only used for data entry and editing0 which is normally finished y the time
you egin running analyses" 4herefore0 the form is not altered y any transformation
or analysis" Jou can0 howe%er0 manually ma,e a ac,up of a form"
We suggest that you start all procedure files with a two-line procedure that creates a
duplicate codeoo, and data file0 and in the second procedure0 egin using the new
files0 thus lea%ing your original file unchanged" !n this e9ample0 the first procedure
reads the S>$?AJ codeoo, and data file0 and creates a new codeoo, and data file
called S>$?AJ2" 4he second procedure says to use the S>$?AJ2 codeoo, and
data for the second and all suse;uent procedures" 4hus0 if any serious mista,es are
StatPac For Windows User's Manual /eywords 1'!
made in transforming data0 you could easily re%ert ac, to the original codeoo, and
data y rerunning the first procedure"
S4>@J S>$?AJ
W$!4A S>$?AJ2
""
S4>@J S>$?AJ2
6egin your procedures here7
""
#s you ecome more e9perienced with StatPac0 you may include other lines in the
first procedure" Jou might want to create a few new %ariales that you intend to use
later on in the procedure file" 8or e9ample0 you might want to always egin your
procedure files y creating an asolute record numer %ariale 6useful for identifying
ad data7 and a net %ariale that can e used in anner tales" 4he following might
e the eginning of the procedure file5
S4>@J 1JS4>@J
C:1P>4A 6'27 $AC ^ $AC:$@
'AW 6'17 Q'A4R 4otals
.#&A.S 'A4 6^7
W$!4A 4A1P-1JS4>@J
""
S4>@J 4A1P-1JS4>@J
6egin your procedures here7
S:U$E Co((and
4he S4>@J command is used to specify the name of the codeoo, and data file
eing analyBed" !t must e specified in the first procedure" Suse;uent procedures
will use the same study name unless another S4>@J command is used to change it"
4he S4>@J command may only e used once in any gi%en procedure"
4he synta9 of the command is as follows5
S4>@J [8ile name\
4he file name 6or study name7 may include a path specification" !f no path is
specified0 StatPac will assume that the study resides in default data sudirectory" #o
e1tension should be used when specifyin/ a study name.
#ll the following are e9amples of the proper use of the S4>@J command5
S4>@J 1#$EA4
S4>@J C5S@#4#S&::E
S4>@J #5S>$?AJ
1'* /eywords StatPac For Windows User's Manual
$0:0 Co((and
4he @#4# command may e used to specify the name of the data file to e analyBed"
!t is only used when the data file name is not the same as the study name" 4he @#4#
command may e used only once in a gi%en procedure"
4he synta9 of the command is as follows5
@#4# [8ile name\
4he file name may include a path specification" !f no path is specified0 StatPac will
assume that the data file resides in the default data sudirectory" !t is not necessary to
use the e9tension "@#4 when specifying the data file nameW StatPac will
automatically use this e9tension for all data files"
>sing the @#4# command changes the data file for the current and all suse;uent
procedures" 4he data file will continue to e analyBed until changed y another
@#4# or S4>@J command"
#ll the following are e9amples of the proper use of the @#4# command5
@#4# $#W@#4#
@#4# #5$AS>.4S
@#4# C5SS4#4P#CS<A#.4<SS>$?AJ
S08+ Co((and
4he S#?A command is used to ma,e all transformations in a gi%en procedure
permanent"
4here are two forms of synta9 for the S#?A command" !n the first form0 the S#?A
command is specified on a line y itself" When used this way0 all transformations
will e sa%ed to the current codeoo, and data file" #s a safety precaution0 do not use
the S#?A command in this way unless you ha%e a ac, up of the study information
and data file"
S#?A
4he other form of the S#?A command lets you sa%e the codeoo, and data to a
different file" 4his form of the command is functionally identical to the W$!4A
command e9cept that a %ariale list may not e specified" !f a path is not specified as
part of the output file name0 the default data sudirectory will e assumed" !f the file
name contains spaces0 you must enclose the file name in ;uotes or parenthesis"
S#?A [8ile name\
8or e9ample0 the following procedure creates a new fi%e-character %ariale called
#?F 6the a%erage of eight test scores70 and stores this as a permanent part of the
codeoo, and data file"
StatPac For Windows User's Manual /eywords 1'-
S4>@J SC:$AS
#?A$#FA 6'2"17 #?F ^ SC:$A1 - SC:$A(
S#?A
""
#fter running this procedure0 the codeoo, SC:$AS"C:@ and data file
SC:$AS"@#4 will ha%e one more %ariale than they had efore the procedure was
run" 4he S#?A command ma,es the new %ariale permanent"
#s another e9ample0 consider the following two procedures" 4he first procedure uses
the S:$4 command to sort the data file in ascending order y last name" &ecause the
S#?A command is used0 the data file will e sa%ed in sorted order" #lso notice that
the sa%e command specifies a file name0 so the sorted data will e sa%ed to the new
file" 4he second procedure egins with the S4>@J command to tell StatPac to use
the new file and then prints a listing of three %ariales" 4he listing will e in sorted
order ecause this is now the way the new data file is stored"
S4>@J '#1AS
S:$4 6#7 .#S4X'#1A
S#?A O1y 'ew 8ile 'ameO
""
S4>@J 1y 'ew 8ile 'ame
.!S4 8!$S4X'#1A .#S4X'#1A P<:'A
""
!f you specify a file name with the S#?A command0 your original codeoo, and data
remains untouched0 and you ne%er ha%e to worry aout ma,ing a mista,e" A%en
when you do not specify a file name0 a mista,e doesnDt necessarily mean you should
panic" 4he only transformations that are irre%ersile are those that change the
original %ariales" #s long as your raw data is intact0 you should e ale to reco%er
from any mista,e"
WRI:+ Co((and
4he W$!4A command is used to sa%e transformed data in a file or write only
selected %ariales to a file" >nli,e the S#?A command 6that sa%es the
transformations in the original file70 the W$!4A command is usually used to sa%e the
transformed data in a different file"
4he synta9 for the W$!4A command is5
W$!4A [8ile name\ [?ariale list\
4he W$!4A command actually creates a new codeoo, and data file called a sub!ile"
4he sufile is Hust li,e any other study" 4he difference etween the original study and
the sufile is that the sufile reflects all transformations performed in the procedure"
While the S#?A command sa%es all transformations in the original file 6unless a
filename is specified70 the W$!4A command always creates a new codeoo, and
data file and sa%es all transformations in the new files" 4he [?ariale list\ parameter
is used to control what %ariales should e written to the sufile" When the [?ariale
list\ is not specified0 all %ariales will e included in the sufile"
1'; /eywords StatPac For Windows User's Manual
4he following procedure would use a codeoo, called '#1AS 6and an implied data
file called '#1AS7" 4he procedure will sort the file y last name and sa%e the sorted
study as a sufile using a new study name S:$4'#1A" #ll %ariales from the
original file will e included in the sufile"
S4>@J '#1AS
S:$4 6#7 .#S4X'#1A
W$!4A S:$4'#1A
""
!n a similar e9ample0 this procedure file selects e%ery tenth name from the original
file 6'#1AS7 and creates a new study 6sufile7 called 1!'!8!.A" 4he sufile will
contain the same %ariales as the original study0 howe%er0 there will e only one-
tenth as many records" 4he second procedure uses the S4>@J command to access
the sufile and list three selected %ariales"
S4>@J '#1AS
C:1P>4A 6')"17 $AC ^ $AC:$@
C:1P>4A 6')"17 !$AC ^ $ACM10
C:1P>4A !$AC ^ !'46!$AC7b10
!8 $AC ^ !$AC 4<A' SA.AC4
W$!4A 1!'!8!.A
""
S4>@J 1!'!8!.A
.!S4 8!$S4X'#1A .#S4X'#1A P<:'A
""
4he original data file 6'#1AS"@#47 is called the input file" !t is the input data for
the transformation procedure" 4he transformed data file 61!'!8!.A"@#47 is called
the output file" !t contains the output from the transformation procedure" 4he second
procedure uses the S4>@J command to access the output file from the first
procedure" 1!'!8!.A is now0 in effect0 its own study" 4he procedure created a
1!'!8!.A"C:@ codeoo, and 1!'!8!.A"@#4 data file"
When the output file name is different from the input file name0 the input file will
remain intact0 and the new output file will contain the transformed data" When the
input file name and the output file name are the same0 the W$!4A command
functions identically to the S#?A command" !n the following e9ample0 the output
file will write o%er the input file and the original 6pre-transformed7 data will e lost"
>nless you ha%e an up-to-date ac,up0 we recommend specifying a uni;ue file name
when using the W$!4A command to eliminate the possiility of losing data"
S4>@J 8::@
C:1P>4A $!SE ^ .:F6 $!SE 7
W$!4A 8::@ 6causes a loss of the original $!SE data7
""
4he output file name parameter must e specified whene%er the W$!4A command is
used" !f a path is not specified as part of the output file name0 the default data
sudirectory will e assumed" !f the output file name contains spaces0 then you must
enclose the name in ;uotes or parenthesis" 8or e9ample5
StatPac For Windows User's Manual /eywords 1''
W$!4A #':4<A$ 8!.A Wrong
W$!4A O#':4<A$ 8!.AO Correct
W$!4A 6#':4<A$ 8!.A7 Correct
When a procedure does not create any new %ariales or change any laels0 you can
use the W$!4A command to sa%e a new data sufile without sa%ing the codeoo," !t
is not necessary to resa%e the information if none of the study information has een
changed y transformations" 4o sa%e a data file without sa%ing the study information0
add a "@#4 e9tension to the file name parameter" Suse;uent procedures could use
the same 6original7 study information0 ut would re;uire a @#4# command to access
the new data sufile" !n the following e9ample0 the first procedure selects males from
the file and writes a data sufile consisting of Hust males" 4he second and third
procedures access this sufile with the @#4# command and perform analyses on it"
4he analyses will only include those records selected in the first procedure" 'ote that
the @#4# command is re;uired only in the second procedure ecause it remains in
effect until changed y a S4>@J command or another @#4# command"
S4>@J S4#4>S
!8 SA* ^ O1O 4<A' SA.AC4
W$!4A 1#.AS"@#4
""
4!4.A !ncome Statistics for 1ale $espondents
@#4# 1#.AS
@ASC$!P4!?A !'C:1A
""
4!4.A <ousing !nformation for 1ale $espondents
8$AC>A'C!AS <:>S!'F
""
4he W$!4A command may e used to create a sufile of selected %ariales simply
y specifying which %ariales are to e contained in the sufile" 4he [?ariale list\
parameter allows you to control which %ariales 6and in which order7 will e written
to the sufile" #ll the pre%ious e9amples did not specify a %ariale list so StatPac
would write all the e9isting and newly created %ariales to the sufile" !n the
following e9ample0 two %ariales 6:?A$#.. and .#S4JA#$7 will e written to
the new sufile S>11#$J"
S4>@J #44!4>@AS
W$!4A S>11#$J :?A$#.. .#S4JA#$
""
4he %ariale list may e specified as indi%idual %ariales0 a range of %ariales0 or a
comination of the two" !t may include oth %ariale names and ? numers" Aither
commas andMor spaces may e used to separate %ariales" Continuation lines may e
used for long %ariale lists" #ll of the following W$!4A commands contain %alid
%ariale lists5
W$!4A S>11#$J ?1-?3 ?10 ?11 ?12
W$!4A S>11#$J ?10 ?2 0?30 ?100 ?110 ?12
W$!4A S>11#$J #FA !'C:1A ?9-?13 ?9)
&>> /eywords StatPac For Windows User's Manual
W$!4A S>11#$J 4AS41-4AS49 ?3-?) ?1-?3
4he W$!4A command may also e used to change the order of the %ariales" When
the new output file is created0 %ariales will e written in the same order as specified
in the %ariale list" 4hus0 it is easy to restructure the order of %ariales in a codeoo,
and data file"
8or e9ample0 suppose you ha%e finished creating a codeoo, and data entry form" #s
you egin to enter data0 you realiBe that you forgot to include a %ariale in the study
design" !f you ha%e only entered a small amount of data0 the easiest way to correct
the prolem is to5
17 delete the data file
27 add the new %ariale to the codeoo, and form using Study @esign
37 egin entering data again"
<owe%er0 if you ha%e already entered a large amount of data0 you may not want to
delete the data you ha%e already entered" !n this case0 the W$!4A command can e
used to correct the prolem"
!n this e9ample0 you might want to add a new open-ended response %ariale
immediately following %ariale 22 in a study called 1JS4>@J" 4he codeoo,
currently contains (( %ariales" 4he following procedure creates a new %ariale
called :4<A$0 and then resa%es the codeoo, and data file inserting the new
%ariale into the middle of the study" #fter running the procedure0 the study and data
file will contain (9 %ariales" 4he new %ariale 6:4<A$7 will e lan, for all
e9isting records in the data file" 4he data entry form is not automatically updated0 so
you will also need to add the new %ariale to the form efore using it to edit or enter
data"
S4>@J 1JS4>@J
'AW 6#207 O:4<A$O :ther &rand Specified
W$!4A 1JS4>@J ?1-?22 :4<A$ ?2--?((
""
4he W$!4A command can also e used to increase the length of an open-ended
response %ariale" Suppose that %ariale 12 in the study is called C!4J0 and it is 12
characters in length 6i"e"0 the format is #127" #fter entering a large numer of records
into the data file0 you come across a city name that is 1( characters in length0 and
you want to increase the length of the C!4J field from 12 to 20 characters" 8irst0 run
the following procedure to create a new 2 character dummy %ariale and write it as
the 13th %ariale in the study 6immediately following the C!4J %ariale7" 4his will
insert 2 lan, spaces after the current 12 character C!4J field" 4hen0 go to the study
design0 delete the dummy %ariale and change the format for the C!4J field to #20"
#gain0 the data entry form is not automatically modified y this procedure0 and
therefore0 it needs to e changed to reflect the new field length for the C!4J
%ariale"
S4>@J 1JS4>@J
'AW 6#27 O@>11JO
W$!4A 1JS4>@J ?1-?12 @>11J ?13-?((
""
StatPac For Windows User's Manual /eywords &>1
M+RG+ Co((and
4he 1A$FA command is used to merge a study and data file into the current study
and data file" !t is usually appears as the only line in a procedure" 4he synta9 of the
1A$FA command is5
1A$FA [filename\
4he [filename\ is the name of the study and data file that you want to merge into the
current study" #fter running the procedure0 the %ariales 6and data7 from the merge
file will e added to the end of your original %ariales" 4hat is0 after running the
procedure0 the numer of %ariales in your original codeoo, will increase" 4he new
%ariales will appear in the ?ariale .ist window"
&oth the current study and the file to e merged must ha%e the same numer of
records and they must e in the same order" !n other words0 record one in the current
data file is the same respondent as record one in the data to e merged"
4he 1A$FA command does not automatically delete the files after the merge is
completed" 4he study and data will e merged into your current study0 ut they will
also remain on dis, in their original form" !f you want to delete the study and data
after the merge is completed0 add a ME to the end of the [filename\" 8or e9ample0 the
following 1A$FA command would add the %ariales and data from a file called
@A1:F$#P<!CS to the current study 6$ASA#$C<70 and then delete the
@A1:F$#P<!CS codeoo, and data after the merge has een successfully
completed"
S4>@J $ASA#$C<
1A$FA @A1:F$#P<!CS ME
""
5+0$I7G Co((and
4he <A#@!'F command is the method used to place a page heading on the
printouts" !t will appear in the top left corner of all printouts" 4he synta9 for the
<A#@!'F command is5
<A#@!'F [Page heading\
4he use of the <A#@!'F command is optional" !f it is not included in a procedure
file0 the default page heading will e used"
.i,e the S4>@J command0 the <A#@!'F command is usually specified in the first
procedure" Suse;uent procedures will use the same heading as the pre%ious
procedures unless the <A#@!'F command is used to change the page heading"
A9amples of the <A#@!'F command might e5
<A#@!'F 8amily Planning #ttitudes Study - 1999
&>& /eywords StatPac For Windows User's Manual
<A#@!'F StatPac !nc" - Computer Software @i%ision
<A#@!'F C.#SS!8!A@ !'8:$1#4!:' - SAC>$!4J C.A#$#'CA
$AC>!$A@
4here are no restrictions on the content of the heading" &oth upper and lower case
characters may e used" 4he heading may e printed as a lan, line if the ,eyword
<A#@!'F is used y itself with no other characters on the line"
4he <A#@!'F command may e used only once in any gi%en procedure" #ll tas,s
in that procedure will use the same heading" Suse;uent procedures will0 y default0
use the last heading specified0 or0 the heading may e changed y using the
<A#@!'F command to reassign a new page heading to the output"
:I:.+ Co((and
4he 4!4.A command is used to place a procedure or tas, title on the printouts" !t
will appear in the top left corner elow the page heading"
4he synta9 for the 4!4.A command is5
4!4.A [Procedure title\
4he use of the 4!4.A command is optional" >nli,e the <A#@!'F command0 it
applies to only the procedure in which it appears" !f a title is not specified for a
procedure0 no title will appear on the output"
4here are no restrictions on the content of the title" &oth upper and lower case
characters may e used" 4he title may e printed as a lan, line if the ,eyword
4!4.A is followed y two or more spaces0 with no other characters on the line"
A9amples of the 4!4.A command might e5
4!4.A 8irst $un of the @ata - @escripti%e Statistics
4!4.A 8re;uency #nalysis of Product #cceptance Cuestions
4!4.A Comparisons of 1ales = 8emales
4here is a special feature that may e used in the 4!4.A command" 4he three-
characters 6/7 may e sustituted in the title in place of the %ariale name" 4he title
on the printout will contain the %ariale lael instead of the 6/7 symols" 8or
e9ample0 the following procedure would produce three different titles" Aach title will
sustitute the correct %ariale lael in place of the 6/7 symols"
S4>@J S>$?AJ
4!4.A 8re;uency #nalysis of 6/7
8$AC>A'C!AS #FA $#CA SA*
""
4his is especially useful when creating anner tales" When running the same
anners on a series of stu %ariales0 it is often desirale to place the %ariale lael
for the stu %ariale on the top of the page" 4he following commands would run 22
different anner tales 6one per page7 and the title for each tale would e the
StatPac For Windows User's Manual /eywords &>1
%ariale lael from on the stu" 4he C: option turns off compression so that only
one stu %ariale gets printed per page"
S4>@J S>$?AJ
4!4.A 6/7
&#''A$S ?1-?22 &J #FA $#CA SA*
:P4!:'S C:^'
""
F33:73:+ Co((and
4he 8::4':4A command may e specified in any procedure to place a footnote at
the ottom of each page of output" :nly one 8::4':4A command may appear in a
procedure" 4he synta9 for the 8::4':4A command is5
8::4':4A [Page footnote\
4he use of the 8::4':4A command is optional" !f it is not included in a procedure
file0 no footnote will e printed" 4here are no restrictions on the content of the
footnote" &oth upper and lower case characters may e used"
A9amples of the 8::4':4A command might e5
8::4':4A 4his #nalysis Was Produced &y StatPac !nc"
8::4':4A 'ote5 !ncludes all data collected through 1991"
4he functionality of the 8::4':4A command is li,e the <A#@!'F command0
where once specified0 the footnote will apply to all suse;uent procedures" 4o cancel
a pre%iously specified footnote0 use the 8::4':4A command without any footnote
te9t 6a lan, footnote7"
.0B+.S Co((and
4he .#&A.S command may e used to assign %alue laels to a newly created
%ariale or to change the %alue laels for an e9isting %ariale" !t may also e used to
change a %ariale lael" 4he synta9 of the command to change one or more %alue
laels is5
.#&A.S [?ariale list\ 6[Code\^[.ael\76[Code\^[.ael\7"""
4he synta9 of the command to change one or more %ariale laels is5
.#&A.S [?ariale list\ ^ ['ew ?ariale .ael\
&>) /eywords StatPac For Windows User's Manual
Fenerally0 when the .#&A.S command is used to change a %ariale lael0 only a
single %ariale is specified 6although a %ariale list could e used to change the
%ariale laels for a series of multiple response %ariales7" 4his e9ample changes the
%ariale lael for %ariale fi%e to O<ow do you feel aout the programYO" 'ote that
the %ariale lael te9t is not enclosed in parentheses or ;uotes"
.#&A.S ?2 ^ <ow do you feel aout the programY

When used to change %alue laels0 the .#&A.S command is often used in
conHunction with the $AC:@A command" 8or e9ample0 letDs say a sur%ey as,ed the
respondentDs age 6#FA7" 8or our purposes0 it is sufficient to report the age as either
Ounder 21O or O21 and o%erO" 4he $AC:@A command would e used to recode the
data0 and the .#&A.S command would e used to assign %alue laels to the new
categories5
S4>@J ?:4!'F
$AC:@A #FA 6.:-20^17621-<!^27
.#&A.S #FA 61^>nder 21762^21 and :%er7
8$AC>A'C!AS #FA
""
Continuation lines are allowed in the .#&A.S command" 8or e9ample0 if #FA were
to e di%ided into fi%e groups0 the .#&A.S command could e entered as5
$AC:@A #FA 6.:-20^17 621-30^27 631-30^37 631-20^37 621-<!^27
.#&A.S #FA 61^>nder 217 62^21-30 Jears7 63^31-30 Jears7 63^31-20
Jears7 62^:%er 20 Jears7
""
When used to change %alue laels0 two restrictions apply to the use of the .#&A.S
command" 4he first is that some discretion should e used in the length of the %alue
laels" A9cessi%e %alue laels will ma,e printouts difficult to read" # good guideline
is to limit %alue laels to aout 30 characters" 4he second restriction is that the code
on the left of the e;uals sign must not contain more characters than the field width"
?alue laels eing assigned to a new or e9isting %ariale will e temporary and apply
only to the current procedure" 4he %alue laels can e made permanent y using the
S#?A or W$!4A commands"
4he .#&A.S command may e used more than once in a procedure and it may e
used to assign new laels to more than one %ariale" 8or e9ample0 the following
procedure file uses the .#&A.S command to assign new %alue laels to ten
consecuti%e items on a ;uestionnaire0 and to another %ariale called :P!'!:'"
&ecause the S#?A command is also specified in the procedure0 the new laels will
ecome a permanent part of the study information0 replacing any pre%ious laels"
S4>@J S>$?AJ
.#&A.S !4A11-!4A110 6#^?ery much7 6&^Somewhat7 6C^'ot at all7
.#&A.S :P!'!:' 61^Positi%e7 62^>ndecided7 63^'egati%e7
S#?A
""
StatPac For Windows User's Manual /eywords &>!
When using the .#&A.S command to change a single %alue lael or add new %alue
laels0 it is not necessary to retype all the %alue laels" #dding an e9clamation mar,
to the end of the .#&A.S command instructs StatPac to update the current laels
rather than completely replace them"
8or e9ample0 if you want to show the no-responses on a printout0 e%en though there
is not a %alue lael for the no-responses0 Hust add an e9clamation point to the end of
the line and StatPac will update the e9isting %alue laels" 4he following command
would add a O'o responseO %alue lael to %ariale one" 4he %alue laels that already
e9ist for %ariale one would remain intact"
.#&A.S ?1 6 ^'o response7_
!n another e9ample0 suppose two of the %alue laels for an income %ariale are5
O1^.ess than Z100000 per yearO and O2^1ore than Z320000 per yearO" #fter
re%iewing a anners tale0 you decide that it would loo, etter if the %alue laels
were are%iated" 4he following line could e used to change the %alue laels for
codes 1 and 2 without affecting the %alue laels for codes 20 30 and 3"
.#&A.S ?1 61^[1000007 62^\3200007_
#ny %alue lael in the .#&A.S command may include a %ertical ar to force a new
line in the printout" 64he %ertical ar appears as two stac,ed %ertical ars on the
,eyoard7" 4his is especially useful in anner tales when you want to force the
location of a rea, in the anner heading" 8or e9ample0 the following %alue lael will
cause the word O$esponsiilityO to print on two lines with a hyphen after the letter
OnO5
.#&A.S ?1 61^$espon-csiility7
3P:I37S Co((and
4he :P4!:'S command is used in conHunction with any of the analysis commands"
!ts purpose is to specify the computational parameters used to control the analysis0
and to select the ,inds of printouts desired"
4he default parameters for each analysis are stored in the StatPac"!ni file" When you
run an analysis without specifying any options0 the analysis will e run using the
default parameters" 4he :P4!:'S command is simply a way to o%erride or change
these settings" !f the :P4!:'S command is e9cluded0 the %alues in the tale will e
used for the analysis"
4he analysis editor allows you to display and modify the options for the current
procedure y selecting :ptions" 4he options will appear0 and you will e ale to
modify them" Jou can also type options directly on the :P4!:'S line in a
procedure"
Aach analysis has its own options" #fter selecting :ptions0 the options and their
default %alues will e displayed" Jou can temporarily change any options y simply
entering the desired %alue" 4he change will e temporary in that it will only apply to
the current procedure" 4o permanently change an option0 add an e9clamation point
&>* /eywords StatPac For Windows User's Manual
suffi9 6_7 to the desired %alue" 4he default %alue for the option will e permanently
changed so that the new %alue ecomes the default"
4he following information is only necessary if you choose to manually enter the
options"
#ll of the analysis options are designated y two-letter codes" >se one or more
spaces to separate the options" 4he format for the :P4!:'S command is5
:P4!:'S [Code\^[?alue\ [Code\^[?alue\ [Code\^[?alue\"""
4o set an option0 type the two-letter code followed y an e;uals symol and the
%alue you want to gi%e the option" 8or e9ample0 to set one decimal place on the
report 6option @P70 you could type5
:P @P^1 6'ote5 :P4!:'S can e are%iated as :P7
!f there are too many option codes to fit on a single line0 continue typing and let the
automatic word-wrap ta,e care of indenting the continuation line !f you use a hard
return at the end of a line0 ma,e sure that the rea, etween lines occurs etween
two options so that no option specification is di%ided y the rea," 8or e9ample5
:P4!:'S @S^' $S^J $C^' 1S^J S4^J 8:^2 PS^J
@P^1 #C^J P$^J
#lternately0 multiple options statements may e specified in the same procedure"
4hey will e interpreted as if they were one option line" 4he pre%ious options line
could ha%e een specified as5
:P4!:'S P!^12 @S^' $S^J $C^' 1S^J S4^J 8:^2 PS^J
:P4!:'S @P^1 #C^J P$^J
Fenerally0 options only apply to the procedure in which they appear" !f an
e9clamation point is added as a suffi9 to the option0 it will ecome the default for all
future analyses unless changed y another option" !n the following e9ample0 the
:P4!:'S line in the first procedure sets the default for the percentage ase to the
numer of cases" &ecause0 the P& option ends with e9clamation point0 the second
procedure 6and all suse;uent procedures7 will continue to use the same percentage
ase 6i"e"0 P&^'7"
S4>@J 1JS4>@J
8$AC ?1-?20
:P4!:'S P&^'_
""
8$AC ?-0-?)0
""
StatPac For Windows User's Manual /eywords &>-
S+.+C: and R+D+C: Co((ands
4he SA.AC4 and $AIAC4 commands are used to create a suset of the data that
consists of Hust some of the records from the original file" 4he commands are
temporary and apply only to the procedure in which they are specified"
Jou can use the SA.AC4 or $AIAC4 commands to select or reHect y record numer
range or y other criteria" 4he synta9 for the SA.AC4 and $AIAC4 commands are
identical" $ecords will e selected or e9cluded from the procedure ased upon the
selection or reHection criteria"
4he format for the SA.AC4 and $AIAC4 commands to select y record numer
range is5
SA.AC4 [.ow record / - <igh record /\
$AIAC4 [.ow record / - <igh record /\
4ype the ,eyword SA.AC4 followed y the record numer range" 8or e9ample0 to
select Hust the first 20 records from your data file0 you would type5
SA.AC4 1-20
4his would cause the first 20 records to e selected for further processing"
Jou could e9clude a single record from an analysis 6say record 227 with the
following command5
$AIAC4 22
Jou may e9clude the high record numer if you want the entire last part of the file to
e used in the procedure" 8or e9ample0 the following SA.AC4 command would s,ip
the first )3 records from the data file" 4he procedure will use all the records from )2
on"
SA.AC4 )2-
Similarly0 the following command would select only the first 20 records for an
analysis 6records 21 to the last record would e reHected75
$AIAC4 21-
When the SA.AC4 or $AIAC4 command is specified0 suse;uent procedures will
use the full data set 6not Hust the selected records7" !n the following e9ample0 the first
procedure lists 20 records0 while the second procedure lists the entire data file"
&>; /eywords StatPac For Windows User's Manual
S4>@J C>AS4!:'
SA.AC4 1-20
.!S4 !@ :P!'!:' F$:>P
""
.!S4 !@ :P!'!:' F$:>P
""
4he W$!4A command is used to create a sufile of the selected data so that
suse;uent procedures could access the sufile" When the W$!4A command is not
specified0 the selected records will e used for all the tas,s in the procedure0 ut will
not e written to a permanent sufile"
#ever use the SA=+ command in the same procedure as the S+&+(T command
unless you have a backup of the study information and data. @oing so will
eliminate records from your data file0 and they will not e reco%erale without a
ac,up"
#n alternate form of the Select command may e used to randomly select a specified
numer of records from the data file" 4he synta9 is5
SA.AC4 ['umer of records\ M$
8or e9ample0 the following command would randomly select 30 records from the
data file and write a new codeoo, and data file called $'@5
SA.AC4 30 M$
W$!4A $'@
""
#gain0 do not use the S#?A command in the same procedure as the SA.AC4
command" @oing so would erase the original data file and replace it with a data file
containing the selected records 6resulting in a loss of data7" !nstead0 use the W$!4A
command to create a new data file that contains Hust the selected records"
Aach time a procedure with the SA.AC4 command and the M$ option is run0 a new
set of random records will e selected" $unning the ao%e procedure multiple times
would produce a different set of random records with each run" 4his can e altered
y setting an e9plicit random numer seed"
!n the System @efaults 8ile 6StatPac"ini70 the default for the $andom'umerSeed
parameter is lan, and will e shown as5
$andom'umerSeed ^
# lan, random numer seed means that a new set of random numers will e
created each time the random numer generator is e%o,ed" !f you change
$andom'umerSeed to any numeric %alue 68ile\:pen\System @efauts 8ile70
StatPac will use the same random numer se;uence each time itNs run" 4he numer
itself determines the random se;uence 6which you cannot control70 so it really
StatPac For Windows User's Manual /eywords &>'
doesnNt matter what numer you enter0 although different numers will produce
different random numer se;uences" # gi%en numer will always produce the same
se;uence"
$andom'umerSeed ^ 22
#nother form of the SA.AC4 and $AIAC4 commands is used in conHunction with
the !8-4<A' command" 8or e9ample0 to select Hust males for an analysis0 you would
enter the command5
!8 SA*^O1O 4<A' SA.AC4
# record will e selected if the criteria is met 6i"e"0 if SA* is e;ual to 17" 4he
following would also select Hust the males y eliminating the females5
!8 SA*^O8O 4<A' $AIAC4
4he general form of this command is5
!8 [Statement\ 4<A' SA.AC4
4he spaces in the synta9 are mandatory" 4here must e at least one space after the !8
and at least one space on each side of the 4<A'" Spacing within the [Statement\
portion of the command doesnDt matter"
!f the [Statement\ portion of the command is true for a gi%en record0 that record will
e selected and written to the output file andMor included in the analysis" !f the
[Statement\ portion is false for a record0 it will e s,ipped 6omitted from the
procedure7"
4he ;uotation mar,s around the code to e selected are mandatory for alpha-type
data only" 8or numeric-type %ariales0 the ;uotation mar,s are unnecessary" 4he
following procedure would first select students that had a grade point a%erage of 3"2
or higher0 and then perform two fre;uency analyses using the selected records"
S4>@J S4>@A'4S
!8 FP# \ ^ 3"2 4<A' SA.AC4
8$AC>A'C!AS SA* $#CA
""
Similarly0 the following analyses would only e performed on students who had at
least a 2"0 grade point a%erage5
S4>@J S4>@A'4S
!8 FP# [ 2"0 4<A' $AIAC4
8$AC>A'C!AS SA* $#CA
""
&1> /eywords StatPac For Windows User's Manual
4he SA.AC4 Command can perform an 'th record selection when used in
comination with compute commands" 8or e9ample0 the following procedure would
list e%ery tenth record" 'ote that the integer function is used to chec, for the record
numers that are e%enly di%isile y ten" #lso note that the $AC %ariale was
computed so that the listing would show the record numer from the original data
file instead of its se;uence numer in the selected suset"
S4>@J 1#$EA4
C:1P>4A 6'27 $AC ^ $AC:$@
C:1P>4A 6'27 !'4AFA$ ^ !'46$ACM107
C:1P>4A 6'27 $A#. ^ $ACM10
!8 !'4AFA$ ^ $A#. 4<A' SA.AC4
.!S4 $AC '#1A P<:'A
""
4he SA.AC4 or $AIAC4 command may e used to e9clude missing data from an
analysis y selecting only non-lan, records" 8or e9ample0 either of these two
commands could e used to select non-lan, records for an analysis of an attitude
;uestion0 you would enter the command5
!8 #44!4>@A [\ O O 4<A' SA.AC4
!8 #44!4>@A ^ O O 4<A' $AIAC4
'otice that a space is used to indicate missing data" 4he SA.AC4 command says to
select all records where #44!4>@A is une;ual to a lan," 4he $AIAC4 command
says to e9clude all records where #44!4>@A is e;ual to a lan," 4he result of either
command will e the same" $ecords with non-missing data will e selected" When
selecting missing data0 ;uotation mar,s are re;uired regardless of whether the
%ariale is alpha or numeric" 4here does not ha%e to actually e a space etween the
;uotation mar,s 6i"e"0 two ;uotation mar,s together would accomplish the same
thing7"
4he SA.AC4 and reHect commands are often used in conHunction with the .!S4
command to list open-ended comments" 4he purpose is to eliminate records where
the respondent made no comment" &oth of these procedures would produce identical
printouts"
!8 C:11A'4 [\ O O 4<A' SA.AC4
.!S4 C:11A'4
""
!8 C:11A'4 ^ O O 4<A' $AIAC4
.!S4 C:11A'4
""
4he SA.AC4 and $AIAC4 commands may also e used in comination with #'@
and :$ relational operators to select or reHect records ased on multiple criteria"
>sing #'@ and :$ relational operators can sometimes e confusing" $efer to the
!8""4<A' statement for a full discussion of relational operators"
#s a simple e9ample0 suppose we wanted to perform an analysis of people o%er -0
who rate their health as good 61^Food 2^8air 3^Poor7" &oth criteria must e true
StatPac For Windows User's Manual /eywords &11
efore weDll select the record 6a person must e o%er -0 A#* they must e in good
health7" 4he command would e5
!8 #FA \ -0 #'@ <A#.4< ^ 1 4<A' SA.AC4
When the #'@ operator is used0 oth statements must e true efore the record will
e selected" 4he :$ operator wor,s differently" When :$ is used0 the record will e
selected if either statement is true" 8or e9ample0 the following command will select
people that are @emocrats -R people that ha%e no political affiliation 6@^@emocrat
$^$epulican '^'one75
!8 #88!.!#4!:' ^ O@O :$ #88!.!#4!:' ^ O'O 4<A' SA.AC4
# statement can contain as many #'@ and :$ operators as needed" When there are
no parenthesis0 #'@ and :$ statements will e e%aluated from left to right"
Parentheses may e used to control the order that the statement will e e%aluated" 8or
e9ample0 the following command would select all males o%er 1( and all females o%er
21"
!8 6SA*^O1O #'@ #FA\1(7 :$ 6SA*^O8O #'@ #FA\217 4<A'
SA.AC4
StatPac contains a special feature that simplifies the synta9 of comple9 :$
statements" 8or e9ample0 suppose you want to select respondents from groups 10 30 )
and 9" >sing :$ operators0 you would type5
!8 F$:>P^1 :$ F$:>P^3 :$ F$:>P^) :$ F$:>P^9 4<A'
SA.AC4
4he same command in using the simplified :$ synta9 would e5
!8 F$:>P ^ O1M3M)M9O 4<A' SA.AC4
!n the first statement0 the record will e selected if any part of the statement is true"
!n the second statement0 the :$ relational operator is replaced y the slash" When
using this method to perform a multiple selection0 the codes 6O1M3M)M9O7 must e
enclosed in ;uotes0 regardless of the %ariale type 6alpha or numeric7" 4here is no
limit on the numer of slashes that may e used in the statement to replace :$
relational operators" !dentical synta9 may e used with the $AIAC4 command"
#s another e9ample0 if some data entry operators entered upper case codes0 while
other data entry operators entered lower case codes0 we would want to select if the
code was either upper :$ lower case" 4he following two statements would produce
identical results5
!8 SA* ^ O1O :$ SA* ^ OmO 4<A' SA.AC4
&1& /eywords StatPac For Windows User's Manual
!8 SA* ^ O1MmO 4<A' SA.AC4
7+W Co((and
4he 'AW command is one of se%eral ,eywords that allows you to create new
%ariales" !ts primary application is for creating new alpha-type %ariales" 4he
ad%antage of the 'AW command o%er other ways of creating new %ariales is that it
allows you to specify a %ariale lael"
4he synta9 for the command is as follows5
'AW [68ormat7\ [O?ariale nameO\ [?ariale lael\
4he format defines the type0 field width and decimal formatting 6if numeric7 for the
new %ariale" !t is specified using the same con%entions as in the study design e9cept
that it is enclosed in parentheses"
4he [8ormat\ for creating new alpha %ariales is5
6#97 where 9 is the field width
4he following command would create a new one-column alpha %ariale named
F$:>P" 4he %ariale lael for F$:>P would e Froup !dentification Code"
'AW 6#17 OF$:>PO Froup !dentification Code
Cuotation mar,s must e included around the %ariale name" 4he %ariale name
itself should e rief 6e"g"0 less than 20 characters in length7" 4he %ariale lael may
use a continuation line if the entire lael will not fit on the first line" 4he new
%ariale will e initialiBed to lan,s 6i"e"0 the %ariale e9ists0 ut its %alue is missing7"
'umeric %ariales may also e created with the 'AW command"
4he [8ormat\ portion of the synta9 for creating new numeric %ariales is5
6'97 where 9 is the total field width for the %ariale
or
6'9"y7 where 9 is the total field width and y is the
numer of decimal characters
When wor,ing with integer data0 the first format is preferale" 8or e9ample0 the
following command would create a two-column numeric %ariale" 4he %ariale name
is F$#'@-4:4#. and its %ariale lael is O4he sum of the indi%idual scoresO" 4he
%ariale does not ha%e any specified formatting"
'AW 6'27 OF$#'@-4:4#.O 4he sum of the indi%idual scores
StatPac For Windows User's Manual /eywords &11
When creating %ariales that will contain decimal formatting0 the precision for the
formatting should e specified" While this is not mandatory0 it is highly
recommended" 8or e9ample0 letDs create a new numeric %ariale called P$:8!4-
.:SS" Jour study now contains two %ariales0 A*PA'@!4>$AS 6?17 and
!'C:1A 6?27" 4he first step is to gi%e the new %ariale a name andMor lael" 4ype5
'AW 6'10"27 OP$:8!4-.:SSO 4he ottom line
4his would create a new numeric %ariale called P$:8!4-.:SS" !t will ecome the
third %ariale in the study" 4he %ariale will ha%e a total field width of ten characters
6se%en to the left of the decimal point0 the decimal point itself0 and two to the right of
the decimal point7" 4he field width refers to the total numer of characters reser%ed
for the %ariale" 4his includes the space necessary for a decimal point andMor minus
sign" !n other words0 you must ha%e an idea of the magnitude of the new %ariale
efore creating it"
#fter entering the 'AW command0 the new %ariale can e referenced y the new
%ariale name 6P$:8!4-.:SS7 or y the new ? numer 6?37" 4he C:1P>4A
statement could then e used to calculate a %alue for the new %ariale P$:8!4-
.:SS"
4o create se%eral new %ariales in the same run0 simply type se%eral 'AW statements
on successi%e lines" Aach 'AW command will create one new %ariale"
When running a procedure with the 'AW and S#?A commands0 the new %ariale
will e created and sa%ed at the end of the codeoo, and data files" !f you attempt to
run the same procedure again0 StatPac will tell you that you are attempting to create
a new %ariale with the same name as an e9isting %ariale 6i"e"0 it was created and
sa%ed the first time you ran the procedure" 4he StatPac"ini file can e edited so
StatPac ignores this situation" Set !gnore@uplicate'ewCommand ^ 1 in the
StatPac"ini file to tell StatPac to ignore the 'AW command if a %ariale already
e9ists with that %ariale name"
When using the 'AW command0 the %ariale name is suHect to the same restrictions
as during the study design"
1" Shorter %ariale names are preferale"
2" # %ariale name must e uni;ue from all other %ariale names and may
not e the same as any ,eyword"
3" 4he first character of a %ariale name may not e a numer or a space"
3" # %ariale name may not e the same as a ? numer" 8or e9ample0 you
cannot name a %ariale O?12O"
2" # %ariale name may not contain a comma or period" 4he %ariale name
may include a spaceW howe%er0 for the purpose of clarity0 we
recommend using a dash or underline character instead of a space"
-" # %ariale name may not e @0 A0 $AC:$@0 4!1A0 .:0 <!0 W!4<0 &J0
4<A'0 4:4#. or 1A#'" 4hese words ha%e special meaning to
StatPac"
&1) /eywords StatPac For Windows User's Manual
.+: Co((and
4he .A4 command is used to create a new %ariale from an e9isting %ariale or to
assign a new %alue to an e9isting %ariale" 4he synta9 of the command is5
.A4 ['ew or e9isting %ariale name\ ^ [A9isting %ariale name\
4he .A4 command is often used as a way of ma,ing transformations to a data file
without destroying the raw data" 8or e9ample0 suppose #FA had een entered in the
data file as the respondentDs actual age" 4his would pro%ide e9cellent descripti%e
statistics 6mean0 median0 etc"70 ut it is not conduci%e to crossta and anner tales"
8or these analyses0 we want categorical data" !f we recode the #FA %ariale into
groups0 the original data will e destroyed0 since the #FA %ariale would then
contain recoded data 6not the raw data7" 4he following procedure o%ercomes this
prolem y first using the .A4 command to create a duplicate copy of a %ariale0
and then recoding the new %ariale rather than the original %ariale"
S4>@J 1#$EA4
.A4 #FAXF$:>P ^ #FA
$AC:@A #FAXF$:>P 6.:-20^17 621-30^27 631-30^37 631-<!^37
.#&A.S #FAXF$:>P 61^>nder 217 62^21-307 63^31-307 63^:%er 307
S#?A
""
4he new %ariale #FAXF$:>P is created with the .A4 command" A%erything is
duplicated e9cept the %ariale name" #FAXF$:>P will ha%e the same format0
%ariale lael0 %alue laels0 and data as the original %ariale #FA" 4he only thing
changed is the %ariale name" 4he $AC:@A command recodes #FAXF$:>P
6lea%ing #FA intact70 and the .#&A.S command assigns new %alue laels to the
recoded data" 4he S#?A command ma,es the transformations permanent so
suse;uent procedures will ha%e access to the new %ariale #FAXF$:>P as well as
the original raw data #FA"
When using the .A4 command to create a new %ariale0 the new %ariale name is
suHect to the same restrictions as during the study design"
4he .A4 command in conHunction with the 'AW command can e used to increase
the field width of a %ariale" Suppose you had created a 20 character alpha %ariale
called C!4J" #fter entering se%eral records of data0 you decide that you really need
30 characters for the C!4J field" Jou cannot simply change the codeoo, ecause
you ha%e already entered data0 and the e9isting data needs to e changed in addition
to the codeoo," 4he .A4 command pro%ides an easy solution"
4his procedure creates a new %ariale called 'AWC!4J and assigns the contents of
the e9isting C!4J %ariale to the new %ariale for all e9isting records" #fter running
this procedure0 you would add the 'AWC!4J %ariale to the data entry form"
S4>@J C:'4#C4S
'AW 6#307 O'AWC!4JO City
.A4 'AWC!4J^C!4J
S#?A
""
StatPac For Windows User's Manual /eywords &1!
When you create a new %ariale0 it is added to the end of the codeoo," !n the
pre%ious e9ample0 the 'AWC!4J %ariale would ecome the last %ariale in the
study" 4he C!4J %ariale would still e in the codeoo, and on the data entry form"
# etter solution is to use the W$!4A command to eliminate the original C!4J
%ariale and replace it with the 'AWC!4J %ariale" !n this e9ample0 C!4J was
originally %ariale 22 in the codeoo," 4he W$!4A command is used to set
'AWC!4J as %ariale 22 and the original C!4J %ariale is omitted"
S4>@J C:'4#C4S
'AW 6#307 O'AWC!4JO City
.A4 'AWC!4J^C!4J
W$!4A C:'4#C4S ?1-?23 'AWC!4J ?2--?100
""
4he .A4 command can also e used to con%ert an alpha 6#17 %ariale to a numeric
6'27 %ariale" 4his is useful when you ha%e data coded as #0 &0 CK and you would
li,e to ha%e it coded as 10 20 3" Jou could recode the data 6#^176&^276C^370 sa%e
the recoded data0 and then manually change the codeoo, format from #1 to '10 and
change the %alue laels" #lternati%ely0 you can use the 'AW and .A4 commands to
do the recode" Suppose #PP.A is an 6#17 %ariale coded as #^1 apple0 &^2 apples0
and C^3 apples" 4he following two commands would create a new %ariale 6and
data7 called '>1X#PP.A that was coded as 1^1 apple0 2^2 apples0 and 3^3 apples"
4he new numeric %ariale must e specified with an '2 format"
'AW 6'27 O'>1X#PP.AO 'umer of #pples
.A4 '>1X#PP.A^#PP.A
S:0C/ Co((and
# S4#CE command is used to create new %ariales that consist of all the possile
cominations of categories from two to four other %ariales" !t is especially useful
for creating special %ariales in anner tales"
4he synta9 for the S4#CE command is5
S4#CE ['ew %ariale name\ ^ [?ariale list\
4he S4#CE command may e used only to create a new %ariale 6i"e"0 it cannot e
used to calculate a new %alue for an e9isting %ariale7" 4he format of the new
%ariale will always e alpha0 and the field width will e the sum of the indi%idual
%ariales in the %ariale list" 4he %alue laels for the new %ariale will e
automatically created from the cominations of the %alue laels of the %ariales in
the %ariale list" 4he S4#CE command is temporary and the new %ariale will only
e9ist in the procedure where the command appears unless the S#?A or W$!4A
command is used"
#s an e9ample0 if your study contains a %ariale called SA* and another %ariale
called #FA0 SA* is coded5 1^1ale and 8^8emale" #FA is coded5 1^Joung0
&1* /eywords StatPac For Windows User's Manual
2^1iddle and 3^:ld" 4he following command would create a new %ariale called
SA*#FA that contained si9 %alue laels5
S4#CE SA*#FA ^ SA* #FA
4he new SA*#FA %ariale would e a two-column alpha %ariale0 and its %alue
laels would e5
11 ^ 1ale Joung
12 ^ 1ale 1iddle
13 ^ 1ale :ld
81 ^ 8emale Joung
82 ^ 8emale 1iddle
83 ^ 8emale :ld
4he S4#CE command is a method of adding multiple dimensions to an analysis" !f
an analysis is performed using the new SA*#FA %ariale0 the results would e
ased on oth the SA* and #FA dimensions"
4he S4#CE command [%ariale list\ may stac, up to four %ariales" 8or e9ample0 a
third dimension ased on a %ariale called $#CA0 could e added with the following
command5
S4#CE SA*#FA$#CA ^ SA* #FA $#CA
4he $#CA %ariale 6coded5 W^White0 &^&lac, and C^:ther7 would add a third
dimension to the @A1:F$#P<!C %ariale" 4he new %alue laels would e5
11W ^ 1ale Joung White
11& ^ 1ale Joung &lac,
11: ^ 1ale Joung :ther
12W ^ 1ale 1iddle White
12& ^ 1ale 1iddle &lac,
12: ^ 1ale 1iddle :ther
13W ^ 1ale :ld White
13& ^ 1ale :ld &lac,
13: ^ 1ale :ld :ther
81W ^ 8emale Joung White
81& ^ 8emale Joung &lac,
81: ^ 8emale Joung :ther
82W ^ 8emale 1iddle White
82& ^ 8emale 1iddle &lac,
82: ^ 8emale 1iddle :ther
83W ^ 8emale :ld White
83& ^ 8emale :ld &lac,
83: ^ 8emale :ld :ther
StatPac For Windows User's Manual /eywords &1-
'ote that the numer of %alue laels in the new stac,ed %ariale is the product of the
numer of %alue laels in each of the indi%idual %ariales in the %ariale list"
Stac,ing more than two %ariales in a single command can potentially result in a
huge numer of %alue laels"
#lso note that the new %alue laels are created y adding together the %alue laels
that already e9ist in the study" 4he %alue lael creation feature of the S4#CE
command wor,s est when each of the %alue laels for the stac,ed %ariales are
short"
R+C3$+ Co((and
4he $AC:@A command is used to recode a %ariale into groups" !t is a data
reduction techni;ue used for summariBing data" &oth alpha and numeric data may e
recoded" 4he simplest form of the command is5
$AC:@A [?ariale or %ariale list\ 6[:ld %alue\ ^ ['ew %alue\7
8or e9ample0 assume we ha%e a %ariale called !'@!C#4:$0 and we want to change
all %alues of 0 to a %alue of 2" We would type5
$AC:@A !'@!C#4:$ 60^27
4he space after $AC:@A and after the %ariale name is mandatory" Se%eral
%ariales can e recoded with the same command y specifying a %ariale list
instead of a single %ariale" 4he following command would perform the same recode
on ten consecuti%e !'@!C#4:$ %ariales"
$AC:@A !'@!C#4:$1 - !'@!C#4:$10 60^27
4here are se%eral other formats for the $AC:@A command" :ne of them allows you
to string se%eral recode statements together" 8or e9ample0 letDs say you want to
change all %alues of 1 and 2 to a %alue of 10 all %alues of 3 and 3 to a %alue of 20 and
all %alues of 2 to a %alue of 3" 4he recode statement would e5
$AC:@A $#4!'F 62^1763^2763^2762^37
'ote that it is not necessary to specify 61^17 as part of the recode command" #s in
the pre%ious e9ample0 a %ariale list could e specified instead of a single %ariale"
!f you prefer0 you could reference the %ariale $#4!'F y its %ariale numer rather
than its %ariale lael" Iust prefi9 the %ariale numer with the letter ?" 8or e9ample0
if $#4!'F was the third %ariale in our data file0 we could ha%e typed the pre%ious
command as5
$AC:@A ?3 62^1763^2763^2762^37
&1; /eywords StatPac For Windows User's Manual
4he final format for the $AC:@A command is used to specify a %alue range to e
recoded instead of an asolute %alue" 4he synta9 for this type of statement is5
$AC:@A [?ar" or %ar" list\ 6[.ow %alue\ - [<igh %alue\ ^ ['ew %alue\7
8or e9ample0 letDs say we want to recode all the %alues from 1 to 20 and gi%e them a
new %alue of 10 and we want to recode all %alues from 21 to 30 and gi%e them a new
%alue of 20 and finally0 all %alues o%er 30 should e gi%en a new %alue of 3" :ur
$AC:@A command would e5
$AC:@A #FA 61-20^17621-30^27631-99^37
4he ,eywords .: and <! may e included in a $AC:@A command" .: refers to the
lowest %alue in a data file while <! refers to the highest %alue in the file" 8or
e9ample0 letDs say you ha%e a %ariale called !'?A'4:$J" 4o change all %alues
from the lowest through 39 to a new %alue of 0 and also change all %alues from 20
through the highest to a new %alue of 10 you would use the following $AC:@A
command5
$AC:@A !'?A'4:$J 6.:-39^07620-<!^17
1issing information is stored in StatPac data files as spaces" Spaces may e used in
the $AC:@A command to indicate missing data" 8or e9ample0 letDs ta,e the
following sur%ey ;uestion5
<ow well do you li,e our spaghettiY
1" # lot
2" Somewhat
3" 'ot at all
3" 'o opinion
4o recode all the Ono opinionO responses to missing data0 type5
$AC:@A :P!'!:' 63^ 7
'otice that a lan, is used as part of the $AC:@A statement to indicate missing
data"
#s a similar e9ample0 after downloading a twenty-%ariale data file 6@#4#8!.A7
from a mainframe0 you disco%er that all missing data was coded as 99 instead of
lan,s" Since StatPac recogniBes only lan,s as missing data0 you decide to recode
all the %ariales and sa%e the recoded data" 4he following commands are used to
recode the data file and write a new data file5
S4>@J @#4#8!.A
$AC:@A ?1-?20 699^ 7
StatPac For Windows User's Manual /eywords &1'
S#?A
""
Jou may use any of the ao%e formats or comination of formats to create $AC:@A
commands" 1any different $AC:@A commands can e specified in a single
procedure" #ll recodes will e temporary in nature and will e applied to all the tas,s
in the procedure" # recode can e made permanent y using the S#?A or W$!4A
commands in the same procedure"
C3MPU:+ Co((and
4he C:1P>4A command is one of the most %ersatile ,eywords" !t is used to
perform algeraic andMor trigonometric functions on numeric %ariales" 4he
C:1P>4A command may e used whene%er you want to use arithmetic to
transform an e9isting %ariale or calculate a new %ariale" #ll operations are
performed using doule precision arithmetic"
4he synta9 for a compute statement is almost identical to the synta9 that the &#S!C
interpreter uses to e%aluate your programs" 4he format for the compute statement is5
C:1P>4A [?ariale\ ^ [A;uation\
8or e9ample0 the following e;uation will add three %ariales together0 calculate the
mean a%erage0 and replace the contents of %ariale 9 with the result5
C:1P>4A ?9 ^ 6?3 ] ?3 ] ?27 M 3
'otice that the letter ? is used to distinguish a %ariale numer from a constant" Jou
may also use the actual %ariale names in the e;uation rather than a ? numer" 8or
e9ample0 the same e;uation could e written5
C:1P>4A @AP4X#?F ^ 6@AP4X:'A ] @AP4X4W: ] @AP4X4<$AA7
M 3
Compute statements may use fi%e numeric operators and twel%e intrinsic functions"
4hey are5
] addition
- sutraction
b multiplication
M di%ision
d e9ponentiation
SC$ s;uare root
.:F natural log
S!' sine
C:S cosine
&&> /eywords StatPac For Windows User's Manual
4#' tangent
#S' arcsign
#4' arctangent
#&S asolute %alue
A*P e9ponent
$'@ random 6random integer etween 1 and the argument7
!'4 integer 6rounds argument up or down7
8!* integer 6drops decimal portion of the argument7
A;uations may also use parentheses to specify the order of computations" !f no
parentheses are included0 computations will e performed in the standard
hierarchical order 6intrinsic functions M e9ponentiation M multiplication = di%ision M
addition = sutraction7" !f no hierarchy e9ists0 the e;uation will e e%aluated from
left to right" Spaces in an e;uation will e ignored"
4he following are e9amples of %alid e;uations5
C:1P>4A ?11 ^ 6?22 b 1"37 M 6?21 ] ?1-7
C:1P>4A ?9 ^ 66?--?)7b1"327M9"31
C:1P>4A ?2 ^ 0
C:1P>4A C!$C>18A$A'CA ^ 3"13129 b @!#1A4A$
C:1P>4A ?3 ^ 3"13129 b ?2 d 2
C:1P>4A ?12 ^ .:F6@:..#$S7
C:1P>4A 4:4#.-S#.AS ^ SC$6?12 - 1-"27
C:1P>4A 1:@!8!A@ ^ S!'66:$!F!'#.-3"127]:$!F!'#.7
C:1P>4A $:>'@A@-'>1&A$ ^ !'46'>1&A$7
C:1P>4A 4$>'C#4A@-'>1&A$ ^ 8!*6'>1&A$7
4he following are in%alid e;uations5
C:1P>4A ?1) ^ 66?3M?27 61ismatched parentheses7
C:1P>4A ?9 ^ ?-M0 6@i%ision y Bero is illegal7
C:1P>4A ?9 ] ?3 ^ ?2 6:nly one %ariale allowed to the left
of the e;uals sign7
#ll computations 6including the intrinsic functions7 are performed using doule
precision" 4he result will e rounded to the precision specified y the %ariale eing
computed 6i"e"0 the decimal formatting of the %ariale7"
8or e9ample0 letDs say we want to compute an a%erage of three %ariales" 4he
%ariale eing computed has a format of '2"2" We would write a compute statement
to add the three %ariales and di%ide y three" !f the sum of the three %ariales is 1000
the mean a%erage will e calculated as 33"33333333333333 and the result would e
rounded to 33"33"
When no decimal formatting e9ists for the %ariale eing computed0 the result will
e e9pressed with the ma9imum decimal precision possile" 8or e9ample0 if the
StatPac For Windows User's Manual /eywords &&1
format of the computed %ariale were ')0 the pre%ious e9ample would e rounded to
33"3333 6a total field width of se%en characters including the decimal point7" !f the
format were '20 the result would e rounded to 33"
!f a computed %ariale ecomes too large for the field width of the %ariale0 the
precision of the result may e diminished" !n the e9treme case0 where the integer
portion of the result would e changed0 the result will e set to lan,s 6missing data7"
!n the pre%ious e9ample0 if the format of the computed %ariale were '10 the result
would e stored as missing data ecause the result 633"333"""7 could not e e9pressed
using an '1 format" !t is0 therefore0 %ery important that you ha%e an idea of the
magnitude of the numer you will e computing"
#s another e9ample0 suppose we want to add three %ariales 6SC:$A10 SC:$A2
and SC:$A37" 4he scores are etween 0"0 and 99"9 so the %ariales were originally
defined using '3"1 formats" 4he sum of the %ariales could e9ceed 99"9 6four
characters70 so the new %ariale that holds the sum 64:4#.XSC:$A7 should e
created with an '2"1 format"
'AW 6'2"17 O4:4#.XSC:$AO Sum of the three test scores
C:1P>4A 4:4#.XSC:$A ^ SC:$A1 ] SC:$A2 ] SC:$A3
4he C:1P>4A statement can also e used to create a new %ariale directly without
first using the 'AW command" 4he synta9 to create a new %ariale is5
C:1P>4A 6[8ormat\7 ['ew %ariale name\ ^ [A;uation\
4he only disad%antage of using the C:1P>4A command to create a new %ariale is
that a %ariale lael cannot e specified"
4he command for the ao%e e9ample is5
C:1P>4A 6'2"17 4:4#.XSC:$A ^ SC:$A1 ] SC:$A2 ] SC:$A3
# new fi%e-character numeric %ariale would e created and called 4:4#.XSC:$A"
!t will ha%e three digits to the left of the decimal point and one digit to the right"
'otice that the format for the new %ariale is enclosed in parentheses"
:ften0 e;uations will ecome %ery comple9 and re;uire many le%els of parentheses"
While StatPac can handle %irtually any le%el of comple9ity0 it is sometimes easier to
rea, an e;uation into se%eral smaller e;uations and store the intermediate results in
the %ariale eing computed"
8or e9ample0 the following comple9 e;uation could e ro,en down into smaller
e;uations5
C:1P>4A 6'-"27 'AW?#$ ^ 6?)-?-7 ] 13"(2

Could e e9panded to5
'AW 6'-"27 O'AW?#$O
&&& /eywords StatPac For Windows User's Manual
C:1P>4A 'AW?#$ ^ ?) - ?-
C:1P>4A 'AW?#$ ^ 'AW?#$ ] 13"(2
'otice that a new %ariale 6'AW?#$7 was first created with the 'AW command0
and then computed as the difference etween %ariales ) and -" 8inally0 it was
recomputed to its current %alue0 ] 13"(2" &ecause 'AW?#$ is not already a %ariale
lael in the file0 it will ecome the ne9t a%ailale %ariale" !n this e9ample0 if there
were 1( %ariales already in the file0 'AW?#$ would ecome the %ariale name for
%ariale 19"
Sometimes you will need se%eral C:1P>4A statements to accomplish a tas,"
Surprisingly0 one of the most difficult formulas you might use is to find the numer
of days etween two dates" Se%eral C:1P>4A statements are re;uired" Aach date
re;uires three %ariales in your study 6month0 day and year7" 1onth and day each
re;uire two columns0 and year re;uires four columns" !n the following e9ample0 the
%ariale names for each date are5 1:'4<1 @#J1 JA#$1 and 1:'4<2 @#J2
JA#$2" !f the names in your study are different0 you must modify this procedure"
4he @!88 %ariale contains the numer of days etween the two dates"
4his suroutine can e merged into your procedure file" 'ote that this e9ample
assumes that four digits were used in your study to store the years"
C:1P>4A 6'37 J$1 ^ JA#$1
C:1P>4A 6')7 4!1A1"0 ^ 3-2 b JA#$1 ] @#J1
!8 1:'4<1 \ 2 4<A' C:1P>4A 4!1A1 ^ 4!1A1 -
!'461:'4<1b"3]2"37
!8 1:'4<1 \ 2 4<A' C:1P>4A J$1 ^ J$1 ] 1
C:1P>4A 4!1A1 ^ !'464!1A1 ] 6J$1-17 M 3 ] 1:'4<1 b 317
C:1P>4A 6'37 J$2 ^ JA#$2
C:1P>4A 6')7 4!1A2 ^ 3-2 b J$2 ] @#J2
!8 1:'4<2 \ 2 4<A' C:1P>4A 4!1A2 ^ 4!1A2 -
!'461:'4<2b"3]2"37
!8 1:'4<2 \ 2 4<A' C:1P>4A J$2 ^ J$2 ] 1
C:1P>4A 4!1A2 ^ !'464!1A2 ] 6J$2-17 M 3 ] 1:'4<2 b 317
C:1P>4A 6'27 @!88 ^ #&S64!1A2 - 4!1A17
4he year 2000 is not a prolem with the pre%ious procedure ecause the year was
stored using four digits" !f you ha%e data that uses only two digits to store the year0
then the procedure can e modified to correct the millennium change"
8irst0 determine the oldest year in the data" Suppose in the following e9ample0 the
oldest %alue for JA#$1 or JA#$2 is 1921 6stored in the data as 217" &y chec,ing
each date and comparing it to 210 you can determine if it is a 1999 or 2099 year"
#gain0 the @!88 %ariale contains the numer of days etween the two dates"
C:1P>4A 6'27 :88SA4^21
'AW 6'37 OJ$1O
!8 JA#$1 [ :88SA4 4<A' C:1P>4A J$1 ^ JA#$1 ] 2000
A.SA J$1 ^ JA#$1 ] 1900
C:1P>4A 6')7 4!1A1"0 ^ 3-2 b J$1 ] @#J1
StatPac For Windows User's Manual /eywords &&1
!8 1:'4<1 \ 2 4<A' C:1P>4A 4!1A1 ^ 4!1A1 -
!'461:'4<1b"3]2"37
!8 1:'4<1 \ 2 4<A' C:1P>4A J$1 ^ J$1 ] 1
C:1P>4A 4!1A1 ^ !'464!1A1 ] 6J$1-17 M 3 ] 1:'4<1 b 317
'AW 6'37 OJ$2O
!8 JA#$2 [ :88SA4 4<A' C:1P>4A J$1 ^ JA#$2 ] 2000
A.SA J$1 ^ JA#$2 ] 1900
C:1P>4A 6')7 4!1A2 ^ 3-2 b J$2 ] @#J2
!8 1:'4<2 \ 2 4<A' C:1P>4A 4!1A2 ^ 4!1A2 -
!'461:'4<2b"3]2"37
!8 1:'4<2 \ 2 4<A' C:1P>4A J$2 ^ J$2 ] 1
C:1P>4A 4!1A2 ^ !'464!1A2 ] 6J$2-17 M 3 ] 1:'4<2 b 317
C:1P>4A 6'27 @!88 ^ #&S64!1A2 - 4!1A17
4here are se%eral types of errors that may occur while using C:1P>4A statements
6e"g"0 di%ision y Bero or the s;uare root of a negati%e numer7" 4he result of any
in%alid computation will e set to lan,s 6missing data7"
08+R0G+C C3U7: and SUM Co((ands
4he #?A$#FA0 C:>'4 and S>1 commands are pro%ided to perform calculations
in situations in which the C:1P>4A command would fail ecause of missing data"
4he synta9 for all three commands is identical"
4he #?A$#FA command calculates the mean a%erage of all non-missing %alues in a
list of %ariales" 4he synta9 of the #?A$#FA command is5
#?A$#FA [?ariale\ ^ [?ariale list\
4he C:>'4 command counts the numer of non-missing %alues in a list of
%ariales" 4he synta9 of the C:>'4 command is5
C:>'4 [?ariale\ ^ [?ariale list\
4he S>1 command adds the non-missing %alues in a list of %ariales" 4he synta9 of
the S>1 command is5
S>1 [%ariale\ ^ [%ariale list\
4he reason for these commands is of the way the C:1P>4A command handles
missing data" !f any of the %ariales in the C:1P>4A statement are missing0 the
result will e missing" # %alue calculated y the #?A$#FA command is missing
only when all %alues in the list of %ariales are missing" 8or e9ample0 the following
C:1P>4A command would fail if either @AP4X:'A0 @AP4X4W:0 or
@AP4X4<$AA contained a missing %alue"
&&) /eywords StatPac For Windows User's Manual
C:1P>4A @AP4X#?F ^ 6@AP4X:'A ] @AP4X4W: ] @AP4X4<$AA7
M 3
4his C:1P>4A command would store a lan, result in @AP4X#?F for any record
in which @AP4X:'A0 @AP4X4W:0 or @AP4X4<$AA is missing" !nstead0 the
#?A$#FA command could e used to calculate the mean of the non-missing %alues
of the three %ariales in each record" 4he commands to accomplish this tas, would
e5
S4>@J !'C:1A
'AW 6'9"27 O@AP4X#?FO #%erage !ncome of @epartments 1-3
#?A$#FA @AP4X#?F ^ @AP4X:'A @AP4X4W: @AP4X4<$AA
S#?A
""
!n this e9ample0 the @AP4X#?F %ariale was created y a 'AW command" 4he
format of @AP4X#?F 6'9"27 specifies two places to the right of the decimal point"
4herefore0 the result of the #?A$#FA command will e e9pressed to two significant
decimal places"
4he #?A$#FA command itself may also e used to create a new %ariale 6ma,ing
the use of the 'AW command unnecessary7" 4he synta9 of the command is changed
only y the inclusion of the new %ariale format"
#?A$#FA 6[8ormat\7 ['ew %ariale name\ ^ [?ariale list\
4he pre%ious procedure could ha%e een5
S4>@J !'C:1A
#?A$#FA 6'9"27 @AP4X#?F ^ @AP4X:'A @AP4X4W:
@AP4X4<$AA
S#?A
""
'ote that the format must e enclosed in parentheses" 4he only disad%antage of using
the #?A$#FA command to create the new %ariale is that the new %ariale will not
contain a %ariale lael"
4he C:>'4 command counts the numer of non-missing %alues from a %ariale
list" !tD use is identical to the #?A$#FA command0 e9cept that the result is the
numer of non-missing %alues instead of the a%erage of the non-missing %alues" .i,e
the #?A$#FA command0 it may also e used to create a new %ariale" # %alue
calculated y the C:>'4 command is always an integer etween Bero and the
numer of %ariales specified in the list"
4he following procedure creates a new %ariale @AP4XC:>'4 and counts the
numer of non-missing %alues in each record" 'ote that the new %ariale will always
e an integer etween 0 and 30 and therefore uses an 6'17 format"
S4>@J !'C:1A
C:>'4 6'17 @AP4XC:>'4 ^ @AP4X:'A @AP4X4W: @AP4X4<$AA
S#?A
StatPac For Windows User's Manual /eywords &&!
""
4he S>1 command adds all the non-missing %alues from a %ariale list" 4he result
is the sum of these %alues" .i,e the #?A$#FA and C:>'4 commands0 a new
%ariale may e created" 4he following procedure would create a new %ariale called
@AP4X4:4#. that contains the sum of the three departments5
S4>@J !'C:1A
S>1 6'107 @AP4X4:4#. ^ @AP4X:'A @AP4X4W: @AP4X4<$AA
S#?A
""
4he final e9ample shows all three commands in one procedure5
S4>@J !'C:1A
#?A$#FA 6'9"27 @AP4X#?F ^ @AP4X:'A @AP4X4W:
@AP4X4<$AA
C:>'4 6'17 @AP4XC:>'4 ^ @AP4X:'A @AP4X4W: @AP4X4<$AA
S>1 6'107 @AP4X4:4#. ^ @AP4X:'A @AP4X4W: @AP4X4<$AA
S#?A
""
4he result of sa%ing these transformations in a data file could e5
@AP4X1 c @AP4X2 c @AP4X3 c @AP4X#?F c @AP4XC:>'4 c @AP4X4:4#.
3- c 33 c 32 c 30"33 c 3 c 121
39 c 23 c c 21"20 c 2 c 103
2) c -0 c 3( c 32"00 c 3 c 132
31 c c c 31"00 c 1 c 31
c c c c 0 c
33 c 33 c 21 c 32"-) c 3 c 12(
IF9:5+7 F +.S+ Co((and
4he $AC:@A0 C:1P>4A and SA.AC4 commands may e modified so that they
ecome conditional" 4hat is0 the recode0 compute or select will e performed or not
performed on a gi%en record depending on whether something else is true or false"
4he synta9 for the !8-4<A' modifier is5
!8 [Statement\ 4<A' $AC:@A [?ariale\ [$ecode statement\
!8 [Statement\ 4<A' C:1P>4A [?ariale\ ^ [A;uation\
!8 [Statement\ 4<A' SA.AC4
'ote that the portions to the right of the $AC:@A and C:1P>4A commands ha%e
synta9 identical to the command when there is no !8-4<A' modifier" !f the
[Statement\ portion of the command is true for a gi%en record0 4<A' the record
&&* /eywords StatPac For Windows User's Manual
will e recoded0 computed or selected" !f the [Statement\ portion is false0 4<A' the
record will e s,ipped"
4he following e9ample uses three !8-4<A' commands to compute a weighted score
ased on a group numer" &ecause the S#?A command is used0 the weighted score
could e referenced in suse;uent procedures"
S4>@J SAF1A'4
'AW 6'10"37 OWSO Weighted Score
!8 F$:>P ^ 1 4<A' C:1P>4A WS ^ SC:$A b 0"31)2
!8 F$:>P ^ 2 4<A' C:1P>4A WS ^ SC:$A b 0"()32
!8 F$:>P ^ 3 4<A' C:1P>4A WS ^ SC:$A b 1"09-3
S#?A
""
!n the e9ample ao%e0 F$:>P was a numeric %ariale and it was not necessary to
enclose the %alues in ;uotes" !f F$:>P had een an alpha %ariale0 the procedure
would ha%e re;uired ;uotation mar,s around the group codes"
S4>@J SAF1A'4
'AW 6'10"37 OWSO Weighted Score
!8 F$:>P ^ O1O 4<A' C:1P>4A WS ^ SC:$A b "31)2
!8 F$:>P ^ O2O 4<A' C:1P>4A WS ^ SC:$A b "()32
!8 F$:>P ^ O3O 4<A' C:1P>4A WS ^ SC:$A b 1"09-3
S#?A
""
When performing an !8-4<A'-C:1P>4A command0 the A.SA ,eyword may e
used to specify an alternate computation if the [statement\ portion is false" 4he
following e9ample uses different formulas for males and females to calculate a
%ariale called #@I>S4A@-SC:$A" 4he spacing for the continuation lines is for
readaility only"
S4>@J SC:$AS
'AW 6'3"27 O#@I>S4A@XSC:$AO
!8 SA* ^ O1O 4<A' C:1P>4A #@I>S4A@XSC:$A ^ SC:$A b "29
A.SA
#@I>S4A@XSC:$A ^ SC:$A b 1"3)
S#?A
""
4he 'AW statement in this e9ample could e eliminated y specifying the %ariale
format as part of the C:1P>4A statement"
S4>@J SC:$AS
!8 SA* ^ O1O 4<A' C:1P>4A 6'3"27 #@I>S4A@XSC:$A ^
SC:$A b "29 A.SA 6'3"27 #@I>S4A@XSC:$A ^ SC:$A b 1"3)
S#?A
""
StatPac For Windows User's Manual /eywords &&-
4he following is another e9ample of how ;uotes are used for referencing alpha-type
%ariales" !f the format of SA* was #10 6coded 1 or 870 this procedure would select
Hust the males for a descripti%e statistics analysis of #FA5
S4>@J S>$?AJ
!8 SA* ^ O1O 4<A' SA.AC4
@ASC$!P4!?A #FA
""
When you want to reference missing data0 use two ;uote mar,s 6with or without a
space etween them7" 8or e9ample0 if you want to select all non-missing data from
the C:11>'!4J %ariale0 either of the following commands would produce the
desired results regardless of whether C:11>'!4J is alpha or numeric format"
!8 C:11>'!4J [\ O O 4<A' SA.AC4
!8 C:11>'!4J ^ OO 4<A' $AIAC4

4he !8-4<A' modifier is often used in conHunction with the C:1P>4A command
to eliminate the possiility of computational errors" 8or e9ample0 letDs say we want to
compute the s;uare root of P$:8!4.:SS" Since we cannot ta,e the s;uare root of a
negati%e numer0 we only want to perform the transformation if the P$:8!4.:SS
%ariale is positi%e" !n other words0 if P$:8!4.:SS is greater than Bero0 ta,e the
s;uare rootW otherwise0 s,ip it"
!n our e9ample0 the statement would e5
!8 P$:8!4.:SS \ 0 4<A' C:1P>4A P$:8!4.:SS ^
SC$6P$:8!4.:SS7
:nce again0 notice that the last part of the statement is identical to the C:1P>4A
command without the !8-4<A' modifier" 4he only difference is in the !8
[Statement\ 4<A' part of the command" 4he %alid relationships supported y
StatPac are5
^ A;ual to
\ Freater than
\^ Freater than or e;ual to
[ .ess than
[^ .ess than or e;ual to
[\ >ne;ual to
^^ !s found within the te9t string
With the e9ception of the ^^ symol0 all the relational operators are standard
algeraic notation" 4he purpose of the ^^ relational operator is to locate a target
string within another string" !ts primary use is to search %eratim open-ended
responses for selected words or phrases" 8or e9ample0 suppose ?10 ?20 and ?3 were
open-ended multiple response0 and respondentsD %eratim answers were entered into
these three fields" Jou could use the ^^ relational operator to list comments that
mentioned the word OhoursO" 4he !8-4<A' SA.AC4 line says to search %ariales
&&; /eywords StatPac For Windows User's Manual
one through three for the specified te9t string 6<:>$S70 and select any record that
contains the string" >pper and lower case differences will e ignored when using the
^^ operator"
C:1P>4A 6'27 $AC ^ $AC:$@
!8 ?1 - ?3 ^^ O<:>$SO 4<A' SA.AC4
.!S4 $AC ?1 - ?3
:P4!:'S 1$^6?1 - ?37
""
:ften0 it may e desirale to search for more that one ,ey word or phrase" 4he
following procedure tells StatPac to search %ariales one through three for se%eral
,ey words5 hours0 time0 longer0 shorter0 duration0 and length" 4he .!S4 command
will display the comments that contain any of the search strings"
C:1P>4A 6'27 $AC ^ $AC:$@
!8 ?1 - ?3 ^^
O<:>$SM4!1AM.:'FA$MS<:$4A$M@>$#4!:'M.A'F4<MO
4<A' SA.AC4
.!S4 $AC ?1 - ?3
:P4!:'S 1$^6?1 - ?37
""
!t is important to note that the ^^ relational operator wor,s on the sound of the word0
and not the e9act spelling" 8or e9ample0 the following procedure might e used to
list respondentsD positi%e comments to a multiple response open-ended ;uestion"
!8 #44!4>@A^^O<appyMFladMSatisfiedMPleasedO 4<A' SA.AC4
.!S4 #44!4>@A
""
4he report might loo, li,e this" 'otice that StatPac found the word OsatsfiedO e%en
though it was misspelled"
Comments
! am %ery happy with the current program and ! cannot thin, any changes to ma,e"
! am completely satsfied with the new procedures"
! am glad you finally added an e%aluation component"
8inally0 a program that holds my interest" ! am %ery pleased"
When used in conHunction with other commands0 the ^^ relational operator can e
used to create a new coded categorical %ariale from the %eratim te9t" !n a simply
e9ample0 suppose you as,ed respondents0 OWhat do you feel is the numer one
prolem in societyYO Jou are especially interested in responses relating to crime0
drugs0 %iolence0 and the economy" 4he following procedure would create a new
%ariale and perform a fre;uency analysis on it"
StatPac For Windows User's Manual /eywords &&'
'AW 6'17 OP$:&.A1O W<#4 !S 4<A '>1&A$ :'A P$:&.A1 !'
S:C!A4JY
.#&A.S P$:&.A1 61^C$!1A762^@$>FS763^?!:.A'CA7
63^AC:':1J762^:4<A$7
!8 ?1 [\ O O 4<A' C:1P>4A P$:&.A1 ^ 2
!8 ?1 ^^ OC$!1AMC$!1!'#.SMO 4<A' C:1P>4A P$:&.A1 ^ 1
!8 ?1 ^^ O@$>FSM#.C:<:.MC:C#!'AM'#$C:4!CSO 4<A'
C:1P>4A P$:&.A1 ^ 2
!8 ?1 ^^ O?!:.A'CAM?!:.A'4MO 4<A' C:1P>4A P$:&.A1 ^ 3
!8 ?1 ^^ OAC:':1JMAC:':1!CM&>@FA4M1:'AJMO 4<A'
C:1P>4A P$:&.A1 ^ 3
8$AC P$:&.A1
""
StatPac also supports relational operators #'@ and :$" 4hey may e used in
conHunction with the C:1P>4A0 $AC:@A and SA.AC4 ,eywords 6with or
without parentheses7 to ma,e comple9 !8-4<A' statements" 4he general synta9 is5
!8 [Statement\ #'@ [Statement\ 4<A' $AC:@A [?ariale\ [$ecode
statement\
!8 [Statement\ :$ [Statement\ 4<A' $AC:@A [?ariale\ [$ecode
statement\
!8 [Statement\ #'@ [Statement\ 4<A' C:1P>4A [?ariale\ ^
[A;uation\
!8 [Statement\ :$ [Statement\ 4<A' C:1P>4A [?ariale\ ^
[A;uation\
!8 [Statement\ #'@ [Statement\ 4<A' SA.AC4
!8 [Statement\ :$ [Statement\ 4<A' SA.AC4
8or e9ample0 letDs say we want to compute the following e;uation5
'AW?#$ ^ SC$6!'@A*17 ] SC$6!'@A*27
8or this computation to e successful0 oth !'@A*1 and !'@A*2 must e greater
than Bero" 6!t is not possile to ta,e the s;uare root of a negati%e numer"7
!n this e9ample0 you could eliminate the possiility of error with the following
statement5
!8 !'@A*1 \ 0 #'@ !'@A*2 \ 0 4<A' C:1P>4A
'AW?#$ ^ SC$6!'@A*17 ] SC$6!'@A*27
&ecause the second line is indented0 it is interpreted as a continuation of the pre%ious
line" 4he computation will e performed only if oth !'@A*1 and !'@A*2 are
greater than 0"
&1> /eywords StatPac For Windows User's Manual
When using #'@ relational operators0 oth statements must e true efore the
operation 6compute0 select or recode7 will e performed" When using the :$
relational operator0 if either statement is true0 the operation will e performed"
Parentheses may e used in conHunction with #'@ and :$ relational operators to
create comple9 statements" 4here is no limit on the numer of parentheses that may
e used in an !8-4<A' statement"
Comple9 weighting schemes can e de%eloped y using cominations of C:1P>4A
commands" 4he following procedure creates a weighted sufile where the file is
weighted y oth age 6'27 and se9 6#17"
S4>@J @A1:
'AW 6'-"37 OC#SAXW4O
!8 #FA[21 #'@ SA*^O1O 4<A' C:1P>4A C#SAXW4 ^ "9013
!8 #FA[21 #'@ SA*^O8O 4<A' C:1P>4A C#SAXW4 ^ 1"203)
!8 6#FA\^21 #'@ #FA[317 #'@ SA*^O1O 4<A' C:1P>4A
C#SAXW4 ^ "31(2
!8 6#FA\^21 #'@ #FA[317 #'@ SA*^O8O 4<A' C:1P>4A
C#SAXW4 ^ "(109
!8 #FA\^31 #'@ SA*^O1O 4<A' C:1P>4A C#SAXW4 ^ ")(92
!8 #FA\^31 #'@ SA*^O8O 4<A' C:1P>4A C#SAXW4 ^ "((10
WA!F<4 C#SAXW4
W$!4A W4X@A1:
""
StatPac contains a special pro%ision that allows the condensation of se%eral :$
relational operators" 4he condensation may pertain to %alues or %ariales"
8or e9ample0 the following command will select a record if the F$:>P %ariale is
10 30 2 or )" !f the F$:>P %ariale is any other %alue0 the record will not e selected"
!8 F$:>P^1 :$ F$:>P^3 :$ F$:>P^2 :$ F$:>P^) 4<A'
SA.AC4
4his same command could e condensed as5
!8 F$:>P^O1M3M2M)O 4<A' SA.AC4
When using this form of the :$ relational operator0 the %alues are separated from
each other y slashes" 'ote that whether you are chec,ing alpha or numeric %alues0
you must enclose the list of %alues in ;uotation mar,s to indicate that there is more
than one %alue to e chec,ed"
Similarly0 the following command will select a record if any of the three %ariales
are e;ual to one5
!8 $ASP:'SAX1^1 :$ $ASP:'SAX2^1 :$ $ASP:'SAX3^1 4<A'
SA.AC4
4his same command could e condensed as5
StatPac For Windows User's Manual /eywords &11
!8 $ASP:'SAX1-$ASP:'SAX3^1 4<A' SA.AC4
4he %ariales in the %ariale list portion of the statement can e listed separately0 or
as a %ariale range 6or comination of the two7" 4he pre%ious command could also
e5
!8 $ASP:'SAX1 $ASP:'SAX2 $ASP:'SAX3 ^ 1 4<A' SA.AC4
S3R: Co((and
!t is sometimes desirale to sort a data file" 4his is especially true when you will e
listing the file and you want the listing to e in some meaningful order" 8or e9ample0
you may want to sort y L!P code efore printing a name and address file"
4here are two other situations where a data file must e sorted5 17 efore merging
two files y a common %ariale oth files must e sorted y the common %ariale0
and 27 efore creating an aggregate file0 the file must first e sorted y the aggregate
%ariale"
4he synta9 for the S:$4 command is straightforward5
S:$4 6:rder7 [?ariale or %ariale list\
4he sort order refers to either ascending or descending order and may e specified as
6#7 or 6@7" 4he sort %ariale6s7 may e alpha or numeric format"
#n e9ample of the S:$4 command would e5
S4>@J 'A!F<&:$
S:$4 6#7 L!P
.!S4 '#1A #@@$ASS C!4J S4#4A L!P P<:'A
""
4he result of this procedure is that the data file will e sorted so the lowest Bip code
is first and the highest Bip code is last" Selected %ariales from the data will then e
listed in sorted order" 4he S:$4 command only applies to the procedure in which it
appears" Suse;uent procedures will use the unsorted data unless the S#?A or
W$!4A commands were also used in the procedure"
4he S:$4 command is always the last ,eyword that will e e9ecuted in a procedure
regardless of where it appears in the procedure 6i"e"0 a file is sorted only after all
other transformations ha%e een completed7" 4herefore0 if in the same procedure a
%ariale is oth sorted and assigned a new %alue in a C:1P>4A statement0 the file
will e sorted according to the newly computed %alues0 regardless of the order of the
S:$4 and C:1P>4A lines in the procedure" !f you wish to sort y a %ariale efore
it is computed0 you must sort the %ariale in a separate procedure efore the
procedure that computes the %ariale"
&1& /eywords StatPac For Windows User's Manual
Jou can use the S:$4 command to perform a multidimensional sort y specifying a
list of %ariales to e sorted" 4he %ariales should e listed in decreasing order of
significanceW that is0 the first %ariale in the list is the primary sorting %ariale0 the
second %ariale is used only when two %alues of the first %ariale are identical0 and
so on" 8or e9ample0 if you had a file which contained information aout people
including their last name 6.#S4X'#1A70 first name 68!$S4X'#1A70 and year of
irth 6&!$4<XJA#$70 and you wanted to sort the file according to these three
%ariales0 you could use the command5
S:$4 6#7 .#S4X'#1A0 8!$S4X'#1A0 &!$4<XJA#$
4he records in the output file '#1AS:$4 would e ordered alphaetically
according to last name" !f two or more people in the file had the same last name0 their
first names would determine who was placed first" !f more than one person had the
same first and last names0 the year of irth would e used to put the records in order"
'ote that alpha and numeric %ariales can e comined in the %ariale list for the
S:$4 command" #ll %ariales in the list are sorted in the same order0 either
ascending or descending"
W+IG5: Co((and
:ften0 there are ,nown iases in the sample0 and the researcher may want to adHust
the sample y weighting cases" 4his will create a data file that compensates for the
ias"
!nteger case weighting always produces a fi9ed output" !f a case has a weight of two0
it will e duplicated twice in the weighted file" !f a case has a weight of three0 it will
e duplicated three times in the output file"
'on-integer case weighting is ased on a proaility function and will0 therefore0
produce different results with each run" !f a case has a weight of 2"30 it will e
duplicated twice in the weighted file0 and there is a 30` chance that it will e
duplicated a third time" !f a case has a weight of "(310 there is an (3"1` chance that
it will appear in the output file
4his command will allow you to use weights that are already contained in the file0 or
weights may e assigned to each case depending on the %alue of another %ariale in
the file"
4here are two forms of the command synta9" 4he first is used when there is a
numeric %ariale in the file that already contains the case weight" 4he synta9 for this
form of the WA!F<4 command is5
WA!F<4 [?ariale\
8or e9ample0 if there were a %ariale called C#SAWA!F<40 the synta9 would e5
WA!F<4 C#SAWA!F<4
4his %ariale must e numeric and contain the weight of the case" !f C#SAWA!F<4
is missing in any record0 the record will e interpreted as if the weight were Bero"
StatPac For Windows User's Manual /eywords &11
!f the file does not contain a case weight %ariale0 the other form of the command
can e used to assign the weights" 4he synta9 for this form of the command is5
WA!F<4 [?ariale\ 6[Code\^[Weight\76[Code\^[Weight\7"""
8or e9ample0 to weight the file ased on the respondentDs se9 6SA*70 you would
weight each case depending on whether it is coded as 1 or 8" !n this e9ample0 you
want to assign a weight of 1"2 to males and 2"3 to females" 4he synta9 to perform
this is5
WA!F<4 SA* 61^1"2768^2"37
Jou should enter a weight for each of the codes that e9ists in the file" 4he code 6on
the left of the e;uals sign7 may e alpha or numeric data0 while the weight 6on the
right of the e;uals sign7 must e numeric" !f a code e9ists in the file that is not
reflected in the WA!F<4 command0 it will e assigned a weight of Bero"
'otice that the WA!F<4 command can produce a file that contains many more
records than the original file" Jou can control the siBe of the weighted file y
adHusting the %alues of the weights"
!f you want the weighted file to contain appro9imately the same numer of records
as the input data file0 determine the weight for each code y di%iding the desired
percentage of records containing the code y the oser%ed percentage of records
containing the code"
8or instance0 suppose you ha%e a sur%ey consisting of 120 respondents 6100 males
and 20 females70 and you want to create a weighted data file with 120 records" #lso0
you want the new file to contain aout the same numer of males and females 6)2
males and )2 females7" 4he weight for the male code would e calculated as "2M"-) or
")2" 4he weight for the female code would e calculated as "2M"33 or 1"2" 4he
command to produce the weighted file would e5
WA!F<4 SA* 61^")27 68^1"27
'ote that you can also calculate the weights y di%iding the desired numer of
records y the oser%ed numer of records for each code" 4he weight for males 6")27
is e;ui%alent to )2M1000 and the weight for females 61"27 is e;ui%alent to )2M20"
&ecause the non-integer portion of the weight is ased on a proaility function0 the
output file will usually not contain the e9act numer of records as the input file"
Comple9 weighting schemes can e de%eloped y using cominations of C:1P>4A
commands" 4he following procedure creates a weighted sufile where the file is
weighted y oth race and se9"
S4>@J @A1:
'AW 6'-"37 OC#SAXW4O
!8 $#CA^OWO #'@ SA*^O1O 4<A' C:1P>4A C#SAXW4 ^ "9013
!8 $#CA^O&O #'@ SA*^O1O 4<A' C:1P>4A C#SAXW4 ^ 1"203)
!8 $#CA^O:O #'@ SA*^O1O 4<A' C:1P>4A C#SAXW4 ^ "31(2
&1) /eywords StatPac For Windows User's Manual
!8 $#CA^OWO #'@ SA*^O8O 4<A' C:1P>4A C#SAXW4 ^ "(109
!8 $#CA^O&O #'@ SA*^O8O 4<A' C:1P>4A C#SAXW4 ^ "9392
!8 $#CA^O:O #'@ SA*^O8O 4<A' C:1P>4A C#SAXW4 ^ "((10
WA!F<4 C#SAXW4
W$!4A W4X@A1:
""
!t is especially important to include the W$!4A command when you use the
WA!F<4 command" Since StatPacDs weighting is ased on a proaility function0
different sets of weighted data will e created each time you run the procedure" 4hus0
if your intent is the weight the data0 and used the weighted data in a series of
suse;uent analyses0 you should use the W$!4A command to create a weighted data
file that can e used in the suse;uent analyses"
S4>@J 1yStudy
WA!F<4 CaseWeight
W$!4A 1yStudy2
""
S4>@J 1yStudy2
6the rest of the procedures7
73RM0.IG+ Co((and
# normaliBed %ariale is one in which all the %alues are e9pressed in terms of
standard de%iations 6L scores7 rather than as the raw data itself" Jou can normaliBe
any %ariale or list of %ariales with the ':$1#.!LA command"
4he formula for a normaliBed %ariale is5
L ^ 6* - *&ar7 M S@
where5
* is the raw data %alue
*&ar is the mean a%erage
S@ is the standard de%iation
# normaliBed %ariale will ta,e on positi%e and negati%e %alues" # positi%e %alue of
L indicates that the data is ao%e the mean y L standard de%iations0 while a negati%e
%alue indicates that the data is elow the mean y L standard de%iations" 4he format
for the ':$1#.!LA command is straightforward5
':$1#.!LA [?ariale list\
8or e9ample0 to normaliBe a S#.AS %ariale0 we would type5
':$1#.!LA S#.AS
StatPac For Windows User's Manual /eywords &1!
!t is also possile to normaliBe se%eral %ariales using the same command" >sing a
similar e9ample0 letDs say we want to normaliBe three %ariales 6S#.AS0
#@?A$4!S!'F and @!$AC4X1#!.7" 4here are se%eral different ways we could
use the ':$1#.!LA command to normaliBe all three %ariales" 4his in%ol%es
simply specifying all three %ariales in the %ariale list5
':$1#.!LA ?30 ?30 ?2
':$1#.!LA ?3-?2
':$1#.!LA S#.AS0 #@?A$4!S!'F0 @!$AC4X1#!.
':$1#.!LA S#.AS - @!$AC4X1#!.
'otice that the only difference etween the ao%e commands is the way in which the
%ariale list is specified" 4he results from each of these would e identical" 4he
%ariale list may list the %ariales indi%idually 6separated y commas70 or y %ariale
range 6.ow %ariale - <igh %ariale7 or y any comination of the two" Aither
%ariale numers or %ariale names may e used"
'ormaliBed data are non-integer %alues and contain decimal portions" 4he numer of
decimal places is determined y the format of the %ariale6s7 eing normaliBed"
Fenerally0 you will not want to normaliBe the raw data" !nstead0 create a new %ariale
with the C:1P>4A command0 sa%e it0 and then normaliBe it in the ne9t procedure"
4he C:1P>4A command will allow you to control the decimal precision of the
normaliBed data"
S4>@J S#.AS
C:1P>4A 6'10"27 O':$1XS#.ASO ^ S#.AS
S#?A
""
':$1#.!LA ':$1XS#.AS
S#?A
""
4he ':$1#.!LA command may only e used to normaliBe an e9isting %arialeW it
may not e used to normaliBe a new0 computed0 recoded0 or selected %ariale"
4herefore0 if you want to preser%e the original data0 you will need to run two
procedures as illustrated in the pre%ious e9ample"
.0G Co((and
.agging a %ariale is often used in simple and multiple regression" When one
%ariale has an effect on another %ariale0 ut the effect occurs at a future time0 the
%ariale is said to ha%e a lagged effect" # simplified e9ample might e the
relationship etween our ad%ertising udget and sales" !f we doule our ad%ertising
udget this month0 sales will proaly increase ne9t month" !n other words0
ad%ertising udget has a lagged effect on sales" 4he two %ariales are related0 ut one
lags ehind the other y a specific time period"
4he .#F command may e used to lag one or more %ariales a specified numer of
time periods" 4he synta9 for the .#F command is5
&1* /eywords StatPac For Windows User's Manual
.#F 6['umer of lags\7 [?ariale list\
8or e9ample0 letDs say we wanted to lag %ariale two y three time periods" 4he .#F
command would e5
.#F 637 ?2
!n essence0 when you lag a %ariale 9 times0 you are pushing the data down 9 records
for that %ariale 69 refers to the numer of lags you specify7" 4he conse;uence of this
action is that the data set ecomes longer" 4he following data set illustrates lagging5
$aw data .ag of one .ag of two
3 1issing 1issing
9 3 1issing
12 9 3
- 12 9
2 - 12
2 -
2
>sing our e9ample where #@?A$4!S!'F has a lagged effect on S#.AS0 we could
loo, at the two %ariales efore and after #@?A$4!S!'F is lagged5
&A8:$A .#F #84A$ .#F
$ecord / Sales #d%ertising Sales #d%ertising
1 22 30 22 1issing
2 -2 30 -2 30
3 (0 20 (0 30
3 9( -3 9( 20
2 1issing -3
When you lag a %ariale in a multiple %ariale file0 the new file will e longer than
the original file y the numer of lags you specified" 4he most recent %alues for the
%ariales that were not lagged will e missing in the new file"
$IFF+R+7C+ Co((and
@ifferencing data is a method for remo%ing trend andMor seasonality" &asically0
differencing in%ol%es sutracting successi%e oser%ations from each other" 4he
@!88A$A'CA command is easy to use and can ta,e differences from data %alues
one or more time periods apart" 4o illustrate the concept of differencing0 letDs loo, at
the following data set" 'ote that the original data has a well-defined trend 6with no
irregular %alues70 while the result of the differencing produces a stationary series
with no trend"
StatPac For Windows User's Manual /eywords &1-
'umers used to compute @ifferenced
$aw data a difference data
3 - - 3 3
- 9 - - 3
9 12 - 9 3
12 12 - 12 3
12 1( - 12 3
1(
#lso note that differencing has the effect of reducing the numer of records y one"
Aach time you difference your data0 the numer of records is reduced"
4he format for the @!88A$A'CA command is5
@!88A$A'CA 6[Periodicity\7 [?ariale list\
!n the pre%ious e9ample0 if the %ariale were C#S<-:'-<#'@0 the command
would e5
@!88A$A'CA 617 C#S<-:'-<#'@
!f there is more than one %ariale to difference0 simply specify a %ariale list rather
than a single %ariale name" >se commas or spaces to separate the %ariale names
from one another" 4he periodicity parameter refers to how many time lags are to e
used to calculate the difference" !n this e9ample0 we are sutracting adHacent %alues0
so the periodicity is one" 4his is often referred to as a regular or OshortO difference
ecause we sutract adHacent %alues" !t has the effect of eliminating trend"
4o eliminate seasonality from a data set0 do not sutract successi%e 6adHacent7 %alues"
!nstead0 sutract %alues from the ne9t seasonal period" 8or e9ample0 letDs ta,e the
following series that has seasonality with a cycle 6periodicity7 of si9 periods" 4hat is0
the seasonal pattern repeats itself e%ery si9 periods" !n this case0 differencing consists
of sutracting a %alue from the corresponding %alue in the ne9t season" !t is ,nown as
a seasonal or OlongO difference"
A9ample of seasonal differencing 6Periodicity ^ -7
$ec" / $aw 'umers used to compute @ifferenced
64ime7 data a difference data
1 3 3 - 3 64) - 417 0
2 3 3 - 3 64( - 427 0
3 2 2 - 2 649 - 437 0
3 3 3 - 3 6410 - 437 0
2 3 3 - 3 6411 - 427 0
- 2 2 - 2 6412 - 4-7 0
) 3 3 - 3 6413 - 4)7 0
( 3 3 - 3 6413 - 4(7 0
&1; /eywords StatPac For Windows User's Manual
9 2 2 - 2 6412 - 497 0
10 3 3 - 3 641- - 4107 0
11 3 3 - 3 641) - 4117 0
12 2 2 - 2 641( - 4127 0
13 3 3 - 3 6419 - 4137 0
13 3 3 - 3 6420 - 4137 0
12 2 2 - 2 6421 - 4127 0
1- 3 3 - 3 6422 - 41-7 0
1) 3 3 - 3 6423 - 41)7 0
1( 2 2 - 2 6423 - 41(7 0
19 3
20 3
21 2
22 3
23 3
23 2
'ote that the result of seasonal differencing on a series that contains no trend or
irregular %alues produces a perfectly stationary series" @ifferencing will always
result in the loss of data" When you difference for seasonality0 the amount of data lost
will e e;ual to one seasonal period" !n our e9ample0 we lost eight data points
ecause the seasonal period was eight" 4he command synta9 is identical to a Oshort
differenceO e9cept that the periodicity parameter is greater than one 6i"e"0 e;ual to the
periodicity7"
@!88A$A'CA 6(7 C#S<-:'-<#'@
@ifferencing can0 therefore0 e used to reduce or eliminate oth trend and
seasonality0 depending on the time lag used for differencing" When the lag is one0 the
effect will e to eliminate trend" When the time lag is e;ual to the seasonal period0
the effect is to eliminate seasonality"
$UMME Co((and
@ummy %ariales are used in multiple regression to include nominal or ordinal-type
data in the regression e;uation" 'ormally0 only inter%al or ratio-type data may e
used in multiple regression" @ummy %ariales may only ta,e on %alues of one or
Bero" 4hey may e used as independent %ariales in multiple regression"
.etDs say we ha%e a %ariale that indicates the presence or asence of a credit history"
4his %ariale could e coded as a one 6meaning there is a credit history70 or Bero
6meaning there is no credit history7" 4his %ariale could then e included in a
multiple regression prolem" !t is ,nown as a dummy %ariale ecause it represents
nominal data"
4he situation ecomes somewhat more comple9 when there is more than a simple
dichotomy 6yesMno7" .etDs ta,e an e9ample where there are se%eral nominal type
categories" A9tending the pre%ious e9ample0 the information for the %ariale
StatPac For Windows User's Manual /eywords &1'
OC$A@!4-<!S4:$JO might ha%e een coded5 1^A9cellent history 2^Food history
3^8air history 3^Poor history" 4his could e e9pressed with dummy %ariales y
creating four new %ariales" 4he first new %ariale would e OA9cellent historyO and
would e coded as one 6yes7 or Bero 6no7" 4he second new %ariale would e OFood
historyO and would also e coded as one or Bero0 and so on" 4he coding scheme can
e illustrated y the following tale5
$aw 'ew %ar 1 'ew %ar 2 'ew %ar 3 'ew %ar 3
@ata A9cellent Food 8air Poor
1 1 0 0 0
2 0 1 0 0
3 0 0 1 0
3 0 0 0 1
'otice that each of the new dummy %ariales is assigned a %alue of one or Bero
depending on the original data %alue" :%iously0 it would e ;uite time consuming to
re-enter four new %alues 6the four new dummy %ariales7 for each record" 4he
@>11J command will perform this tas, for you" 4he synta9 for the command is5
@>11J [?ariale\
8or e9ample0 to create dummy %ariales for the pre%ious e9ample0 the command
would e5
@>11J C$A@!4-<!S4:$J
4his would automatically create four new dummy %ariales and fill in the %alues
with ones and Beros0 depending on the data set" # dummy %ariale will e created for
each uni;ue %alue that e9ists in the original data file for that %ariale" Aach dummy
%ariale will e a one-digit numeric %alue" 4he result of using the @>11J
command will e the creation of new %ariales that may then e included in a
multiple regression"
4he new dummy %ariale names will e the %alue laels from the study" 8or
instance0 if a %ariale were coded #^Anglish0 &^8rench and C^Spanish0 the
@>11J command would create three new %ariales named A'F.!S<0 8$A'C<
and SP#'!S<" !f the %ariale does not contain %alue laels0 the %ariale names for
the new dummy %ariales will e O@>11J-?9-yO0 where 9 is the %ariale that was
used to create the dummy %ariales and y is the code from the data that defines the
group it came from" 8or e9ample0 if %ariale 32 were used to create dummy
%ariales0 and the data file contained codes #0 & and C0 the %ariale names will e
O@>11J-?32-#O0 O@>11J-?32-&O and O@>11J-?32-CO"
4he @>11J command will only wor, if the total numer of %ariales 6including
the new dummy %ariales7 is not greater than fifty" @o not con%ert inter%al or ratio
data to dummy %ariales" 4his is unnecessary and will usually result in e9ceeding the
fifty %ariale limit"
'ote that a dummy %ariale will e created for each uni;ue %alue of the original
%ariale" !n order to use these dummy %ariales in multiple regression0 it is necessary
to call one of them the OstandardO and not include it in the regression prolem" >sing
all the new dummy %ariales in the regression e;uation will result in a singular
matri90 and it will not e possile to perform the matri9 in%ersion necessary for
&)> /eywords StatPac For Windows User's Manual
regression" Choose one of the dummy %ariales0 call it the OstandardO0 and e9clude it
from the multiple regression analysis"
4he @>11J command may only e used on a %ariale that already e9ists in the
data file" # %ariale that is dummied cannot e computed0 recoded0 or selected in the
same procedure" !f you want to apply the @>11J command to a transformed
%ariale0 you must perform the transformation in a separate procedure efore the
procedure in which the %ariale is dummied"
RU7 Co((and
4he $>' command may e added to the end of any procedure file to enale atch
processing of multiple procedure files" !t is useful for unattended processing of large
Hos0 where the siBe of a procedure file would ecome e9cessi%e" !t allows the user to
process a series of procedure files in a single atch"
4he $>' command may e added as a single line procedure at the end of any
procedure file"
4he command synta9 is5
$>' [Procedure file name\ [&atch output file name\
4he [Procedure file name\ is the name of the ne9t procedure file to e run" 8or
e9ample0 the following procedure file would first run a fre;uency analysis and a
crossta0 and then a new procedure file 6P$:C27 would e loaded and run"
S4>@J $ASA#$C<
8$AC ?1
""
C$:SS4#& ?1 &J ?2
""
$>' P$:C2
""
1ultiple procedure files can e run in a atch y adding the $>' command to the
end of each procedure file so that at the completion of each procedure file0 a new
procedure file would e loaded and run" Pre-analysis synta9 chec,ing will e
performed only on the initial procedure file"
4he [&atch output file name\ may e optionally specified in the $>' command
line to change the atch output file name for the new procedure file" 8or e9ample0 the
following command would load the P$:C2 procedure file and run it writing the
output to 8!.A2"rtf"
$>' P$:C2 8!.A2
!f a [&atch output file name\ is specified in the $>' command0 the new procedure
file will write the results to the [&atch output file name\" !f page numering is eing
used0 the new output file will egin with page one0 and the tale of contents will e
StatPac For Windows User's Manual /eywords &)1
appended so that the final tale of contents will contain the page numers for all the
procedure files that were run"
R+M Co((and
4he purpose of the $A1 command is to allow you to imed notes within a procedure
file" Comments are especially helpful when re%iewing a procedure file that you ha%e
not used for a long time" Comment lines will e ignored when performing an
analysis" # comment line egins with an apostrophe0 or the word $A1" 4here are no
restrictions on the te9t that may e included in a comment line" Comment lines may
also use continuation lines" 8or e9ample0 the following procedure contains two
comment lines" 4he second comment also has a continuation line5
$A1 4his procedure has two comment lines
S4>@J S>$?AJ12
D 4his procedure will only use the first 20 records
for the analysis ecause the SA.AC4 command is used
SA.AC4 1-20
8$AC>A'C!AS #44!4>@A
""
Comment lines can e useful when deugging a procedure that contains an un,nown
error" &y selecti%ely ma,ing each line a comment 6adding an apostrophe to the
eginning of the line70 you can essentially eliminate that line as a possile cause of
the error"
Writing comple9 procedures is often an iterati%e process" JouNll try something0 see if
it wor,s0 and then modify it" 4ry it again0 and modify itK and so on until you get the
result youNre loo,ing for" :ften times0 youNll want to sa%e what youN%e written0 and
then try something new"
:ne way to do this is to insert an apostrophe at the eginning of each line you
wanted to ma,e a comment ecause lines eginning with an apostophe are ignored
when processing a procedure file" !f you had a procedure file with 3 procedures0 and
you wanted to completely ignore procedure 20 youNd insert an apostrophe at the
eginning of each line in procedure 20 li,e this5
8re; ?1
""
T 4itle 6/7
T @esc ?2
T ""
4itle 6/7
&anners ?2 &y 4otal ?1
""
Jou can also turn entire loc,s of te9t in a procedure file into comment lines" .ines
eginning with Mb can e used to start a comment loc,0 and lines eginning with bM
can e used to end a comment loc,"
&)& /eywords StatPac For Windows User's Manual
!n the following e9ample0 procedure 2 would not e e9ecuted ecause it is enclosed
in start and end comment loc, symols 6Mb to start and bM to end7"
8re; ?1
""
Mb &egin ignoring lines from here on
4itle 6/7
@esc ?2
bM Stop ignoring lines
""
4itle 6/7
&anners ?2 &y 4otal ?1
""
Jou can include multiple comment loc,s and as many procedures 6or indi%idual
lines7 as you want in each comment loc," #ll lines within a comment loc, will e
ignored while processing a procedure file"
#nother way to start and end a comment loc, is to egin a line with bb to start and
end a comment loc," 4he first line eginning with bb will start a comment loc,
and the ne9t line eginning with bb will end the loc,"
8re; ?1
""
bbbbbbbb &egin a comment loc, bbbbbbb
4itle 6/7
@esc ?2
bbbbbbbb And a comment loc, bbbbbbb
""
4itle 6/7
&anners ?2 &y 4otal ?1
""
!f you use the bb synta9 to start and end comment loc,s0 then e careful ecause
they wor, in pairs" !f you ha%e a start and stop comment and you remo%e the start
comment bb while inad%ertantly forgetting to remo%e the stop comment bb0 then the
stop comment bb would act li,e a start comment bb and all lines after it would e
ignored"
Reser,ed Words
!n addition to ,eywords0 StatPac recogniBes se%eral reserved words" Where
,eywords are always used at the eginning of a line0 reser%ed words are always used
somewhere in the middle of a line" $eser%ed words are specified as a parameter
following a ,eyword or analysis specification command" 4he reser%ed words are5
$AC:$@0 4!1A0 4:4#.0 1A#'0 .:0 <!0 W!4<0 &J0 4<A'0 and A.SA" 4hese
words ha%e special meaning and should not e used as %ariale names" 4hese
reser%ed words may e imedded in command lines as parameters of ,eywords0 ut
may not e used as ,eywords themsel%es"
StatPac For Windows User's Manual /eywords &)1
Reser,ed Word R+C3R$
4he word $AC:$@ is a reser%ed %ariale name" !t is an implicit name uilt into the
command processor and should not e used as one of your %ariale names" 4he
$AC:$@ %ariale will always contain the %alue of the current record numer
6se;uence7 that is eing read from the data file"
4he word $AC:$@ may e used to create a time-series regression" 8or e9ample0 the
following command would perform a multiple regression analysis using time
6$AC:$@7 and &>@FA4 as the independent %ariales and S#.AS as the dependent
%ariale5
$AF$ASS 627 S#.AS0 $AC:$@0 &>@FA4
!f we had collected yearly data ut had not entered the year as a %ariale0 we could
use the reser%ed word $AC:$@ to create the year" 4he following procedure will
create a new sufile 6'AW8!.A7 that contains %ariales one through nine of the
!'C:1A study0 and the new %ariale JA#$ as the tenth %ariale"
S4>@J !'C:1A
'AW 6'37 OJA#$O
C:1P>4A JA#$"0 ^ $AC:$@ ] 1931 6:ur data egins in 19327
W$!4A 'AW8!.A ?1-?9 JA#$
""
Important $ser Tip
4here is one caution that should e oser%ed when using $AC:$@" !f the SA.AC4
or S:$4 commands are used0 the record numers will change so that the record
numers reflect the selected or sorted records" 8or e9ample0 suppose we wanted to
list the record numers of all the cases where #FA is greater than si9ty" 4he
following procedure is wrong"
S4>@J $A4!$A
!8 #FA \ -0 4<A' SA.AC4
.!S4 $AC:$@
""
!nstead0 you must first compute the record numer0 and then reference the computed
%ariale to display the record numer" 4he following procedure is correct"
S4>@J $A4!$A
C:1P>4A 6'27 $ACX'>1 ^ $AC:$@
!8 #FA \ -0 4<A' SA.AC4
.!S4 $ACX'>1
""
&)) /eywords StatPac For Windows User's Manual
Reser,ed Word :3:0.
4he reser%ed word 4:4#. is used in anners to specify row and column totals in the
tale" !ts use is descried in detail under the O$ow 4otals and Column 4otalsO section
of the &#''A$S command documentation"
Reser,ed Word M+07
4he reser%ed word 1A#' is used in anners to specify row and column mean
a%erages in the tale" !ts use is descried in detail under the O1eans and Standard
@e%iationsO section of the &#''A$S command documentation"
Reser,ed Word :IM+
4he reser%ed word 4!1A will e used in a future %ersion of StatPac for Windows"
StatPac For Windows User's Manual /eywords &)!
Basic 0nalyses
0nalyses Inde2
4hese commands may e used in a procedure to set the type of analysis to e
performed"
&anners &rea,down Correlate Crosstas
@escripti%es 8re;uencies .ist 4test
4hese additional commands may e used in a procedure when the #d%anced
#nalyses module has een installed"
#':?# Canonical Cluster @iscriminant
8actor .ogit 1ap PC#
Proit $egress Stepwise
0nalyses 3,er,iew
4here are many different types of analyses that can e performed with StatPac" 1ost
commands are easy to use since much of the re;uired analysis information comes
from the default parameter tale"
With the e9ception of the :P4!:'S command all other analysis commands are
mutually e9clusi%e in any gi%en procedure" !n other words0 a single procedure cannot
perform more than one ,ind of analysis" # procedure file0 howe%er0 may contain
many procedures0 each performing a different ,ind of analysis"
4he :P4!:'S command may e used in any procedure to o%erride the default
%alues in the parameter tale" !t is used to control printing and analysis parameters"
4he analysis commands a%ailale in StatPacDs asic pac,age are5 .!S40
8$AC>A'C!AS0 @ASC$!P4!?A0 &$A#E@:W'0 C$:SS4#&S0 &#''A$S0
44AS40 and C:$$A.#4A"
4he analysis commands a%ailale in the StatPac #d%anced Statistics module are5
$AF$ASS0 @!SC$!1!'#'40 PC#0 8#C4:$0 #':?#0 C#':'!C#.0
C.>S4A$0 and 1#P"
Important $ser Tip
#ny of the analysis commands may e are%iated y using only the first two
characters of the ,eyword" 8or e9ample0 8$AC>A'C!AS could e are%iated to
8$0 8#C4:$ could e are%iated as 8#0 and :P4!:'S could e are%iated as
:P"
.IS: Co((and
4he .!S4 command is used to list selected %ariales in the data file" 4he command
synta9 is5
.!S4 [?ariale list\
!f the .!S4 command does not specify a %ariale or %ariale list0 all %ariales will e
listed" When used in this fashion0 %alue laels will e listed instead of the raw data"
8or e9ample0 letDs say you want to print a report consisting of only two columns" 4he
first column is %ariale ) 6#FA7 and the second column is %ariale 13 6SA*7" Aither
%ariale numers or names may e used to specify the %ariale list" 4he command
line would e entered as either5
.!S4 ?) ?13
.! #FA SA* 6 .!S4 may e are%iated as .!7
4he ,eyword $AC:$@ may e used as part of the %ariale list to print the record
numer as one of the columns" 8or e9ample0 the following parameter line will
produce a report consisting of four columns0 the first column eing the se;uence of
the case in the data file5
.!S4 $AC:$@ ?12 ?31 ?(3
Jou may specify as many %ariales to e included in the report that can e
accommodated y the pitch and orientation of the output" !f too many %ariales are
specified0 the output will e truncated" 1issing data will e displayed as a series of
dashes"
4he .!S4 command is often used as a way to troule-shoot a procedure that is not
wor,ing" 8or e9ample0 if the following procedure didnDt wor, properly0 we might try
the .!S4 command to figure out what went wrong5
S4>@J A*#1P.A
C:1P>4A 6'3"17 #?F ^ ?1 b ?2 M 2
@ASC$!P4!?A #?F
&); Basic 0nalyses StatPac For Windows User's Manual
""
We could replace the @ASC$!P4!?A command with the .!S4 command and list the
rele%ant %ariales" #lso note that we added the SA.AC4 command to limit the
printout to the first twenty-fi%e records 6e"g"0 we donDt need to list the whole file to
find out why it is not wor,ing7"
S4>@J A*#1P.A
C:1P>4A 6'3"17 #?F ^ ?1 b ?2 M 2
SA.AC4 1-22
.!S4 $AC:$@ ?1 ?2 #?F
""
&'ample of a List Printout
4o list an open-ended %ariale0 simply specify it in the .!S4 command" 4he
following would list a %ariale called OCommentO" 4he C:1P>4A line is used to
calculate a record numer so it can e included in the printout" 4he !8-4<A'-
SA.AC4 line is used to select only those who made a comment" 4he :P4!:'S line
is used insert a lan, line etween each response"
C:1P>4A 6'27 $AC^$AC:$@
!8 Comment [\ O O 4<A' SA.AC4
.!S4 $ec Comment
:P4!:'S &.^J
""
4he output might loo, li,e this5
StatPac For Windows User's Manual Basic 0nalyses &)'
&'ample of a Verbatim Listing
%ultiple Response 2 Combining Variables
4here are two options 61$ and C&7 to control the way that data gets displayed with
the .!S4 command"
4he 1$ option is used to specify %ariales you want to e stac,ed on top of each
other in a single column" 4he specified %ariales will e listed in a single column
rather than using multiple columns on the listing" 4he %ariales do not ha%e to e
true multiple response %ariales in the codeoo,W you may use the 1$ option for any
%ariales"
4he C& option is used to specify %ariales that you want to comine into a single
field instead of eing treated as indi%idual fields" 8or e9ample0 if City0 State0 and Lip
were separate %ariales0 you could display them together using the C& option"
'ormally0 all %ariales in a listing would appear side-y-side" 4he 1$ and C&
options are used to create an easier to read format"
8or e9ample0 suppose %ariales si90 se%en0 and eight are eing used to hold
respondentsD %eratim answers to a ;uestion on a restaurant sur%ey5 OWhat three
things could we do to impro%e your dining e9perienceYO 4hree #)0 %ariales were
used" 4he following command would produce a listing of the data in a %ertical
format" >p to three lines in the report would e displayed for each respondent" 4he
SA.AC4 command is used to eliminate suHects who did not answer the ;uestion"
!8 ?- [\ O O 4<A' SA.AC4
.!S4 ?--?(
:P4!:'S 1$^6?--?(7
&!> Basic 0nalyses StatPac For Windows User's Manual
""
#n e9ample of a single record in the printout might loo, li,e this5
8aster ser%ice"
$educe prices"
Freater selection"
!f the C& option were used instead of the 1$ option0 all three responses would e
comined into a single field 6gi%ing the appearance that the three responses we part
of the same sentence or paragraph"
!8 ?- [\ O O 4<A' SA.AC4
.!S4 ?--?(
:P4!:'S C&^6?--?(7
""
4he C& option formats the printout so each record in the listing will use the numer
of lines that it needs to show the data" 4he listing might appear as follows5
8aster ser%ice" $educe prices" Freater selection"
4he 1$ and C& options may e used in conHunction with each other to produce
desired outputs" 8or the ne9t e9ample0 assume the following %ariales5
?1 'ame
?2 StreetX#ddress
?3 City
?3 State
?2 Lip
?- PhoneX'umer
?) 8a9X'umer
?( AmailX#ddress
We might want to stac, 'ame0 #ddress0 City0 State0 and Lip into a single column on
the printout" We might also want to stac, the Phone and 8a9 numers into a single
column" !n the following procedure0 the C& option is used to comine City0 State0
and Lip into a single field0 and the 1$ option is used to specify which %ariales
should e displayed in a %ertical column"
.!S4 ?1-?(
:P4!:'S C&^6?3-?27 1$^6?1-?276?--?)7
""
4he output might loo, li,e this5
StatPac For Windows User's Manual Basic 0nalyses &!1
&'ample of a Listing ,sing te %R and C! Options
:abeling and Spacing Options
3tion Code Function
.aeling .& Sets the column headings to print the %ariale lael
6.&^A70 the %ariale name 6.&^'70 or the %ariale
numer 6.&^C7" #lso0 .&^0 suppresses laeling0
and .&^* suppresses all laeling and page feeds"
Column Width CW Sets the minimum width of the columns 6in inches7"
Column Spacing CS Sets the spacing 6in inches7 etween the columns of
the listing"
1a9imum Width 1W Sets the ma9imum width 6in inches7 that will e
used for long alpha %ariales and multiple response
%ariales"
&lan, .ine &etween $ows &. When &.^J0 a lan, line will e printed etween
each row of the listing" When &.^'0 no lan, line
will e printed"
1a9imum Pages 1P 4he 1P option may e set to the ma9imum numer
of pages that will e printed" !ts purpose is to
pre%ent an unintentional listing of hundreds or e%en
thousands of pages" !f 1P^00 then the listing will
ecome as long as necessary to print all the output"
!f 1P is set to any other numer0 that will ecome
the ma9imum numer of pages that will e printed"
FR+@U+7CI+S Co((and
# fre;uency analysis is the simplest of all statistical procedures" !t is ideal for data
which has een coded into groups or categories" 4he coding can e either alpha or
numeric-type data"
4he synta9 of the command to run a fre;uency analysis is5
&!& Basic 0nalyses StatPac For Windows User's Manual
8$AC>A'C!AS [?ariale list\
8or e9ample0 to find the percent of males and females in a sample0 you would
re;uest a single analysis5
8$ SA* 6 8$AC>A'C!AS may e are%iated as 8$7
Se%eral fre;uency analyses can e re;uested with a single command" 8or e9ample0 to
get a fre;uency analysis of SA* 6?370 $#CA 6?27 and !'C:1A 6?-70 the re;uest
could e specified in se%eral ways5
8$AC>A'C!AS SA*0 $#CA0 !'C:1A
8$AC>A'C!AS SA* $#CA !'C:1A
8$AC>A'C!AS ?3 ?2 ?-
8$AC>A'C!AS ?3-?-
'otice that either the %ariale name or the %ariale numer may e specified as part
of the %ariale list"
# fre;uency analysis may e run on alpha or numeric-type %ariales" 1issing data
will e included in the fre;uencies only if there is a %alue lael for missing data0
6e"g"0 [&.#'E\^'o response7"
Table Format
4hree types of printout formats are uilt into the program5 e9panded0 condensed and
automatic" 4he option to control the tale format is5
:P4!:'S 48^' 6'o tale will e printed7
:P4!:'S 48^# 68ormatting will e automatic7
:P4!:'S 48^A 68ormatting will e e9panded7
:P4!:'S 48^C 68ormatting will e condensed7
Condensed formatting is especially useful when there are many unlaeled %alues"
8or e9ample0 if one of the %ariales is !@ '>1&A$0 there are generally no %alue
laels associated with this %ariale" !t is often a good idea to chec, the data to e
sure that no records were inad%ertently entered twice 6i"e" duplicate !@ numers7" #
condensed fre;uencies printout would allow you to ;uic,ly determine if any !@
'>1&A$ is specified more than once" #n e9ample of condensed formatting might
loo, li,e this5
StatPac For Windows User's Manual Basic 0nalyses &!1
&'ample of a Compressed Fre=uencies Printout
#utomatic formatting is generally recommended since it minimiBes the amount of
paper that will e used" !f automatic formatting is used and there are more than 20
unlaeled categories 6no %alue laels70 the printout will automatically e con%erted to
condensed format" !n most cases0 this will result in the e9panded format" #n e9ample
of e9panded formatting might loo, li,e this5
&'ample of an &'panded Fre=uencies Printout
Print >ero Values
Sometimes there may e a category listed in the %alue laels that has no
accompanying data" 8or e9ample0 noody in the sample may e o%er 30 years old or
ma,e o%er Z300000 a year" Whether or not you want the lael to appear with a count
of Bero is a matter of preference" !f you want the reader of your report to ,now that a
category was a%ailale0 youDd proaly want to print Bero %alues 6L?^J7" !f you are
interested in sa%ing space0 you might want to e9clude Bero %alues 6L?^'7"
$ort Type 2 $ort Order
8re;uency analyses are often more meaningful when the output is displayed in sorted
order" When wor,ing with nominal-type data and few categories0 the order in which
categories are presented is not %ery important" 6e"g" !t really doesnDt ma,e much
difference whether males or females are listed first"7 <owe%er0 as the numer of
categories increases0 it may e desirale to list those with the highest count first0
&!) Basic 0nalyses StatPac For Windows User's Manual
followed y those with lower counts" 4his would e a sort y fre;uency of response
in descending order" !t would e re;uested with the following options5
:P4!:'S S4^8 S:^@ 6Sort 4ype y fre;uency of response7
6Sort :rder is descending7
When data is ordinal0 it is more appropriate to present the output in order defined y
the categories themsel%es" >sually this is the same as the alpha or numeric code used
to represent a category" 8or e9ample0 ta,e the following two sur%ey ;uestions5
<ow old are youY What is your annual incomeY
#^>nder 21 1^>nder Z100000
&^21-30 2^Z100000-Z200000
C^31-30 3^Z210000-Z300000
@^:%er 30 3^:%er Z300000
&oth ;uestions are ordinalW the first one is coded alpha and the second is numeric" !t
would e desirale to ha%e the fre;uencies printout appear in ascending order y the
code 6the same way they are listed ao%e7" 4he options statement to do this is5
:P4!:'S S4^C S:^# 6Sort 4ype is y category code7
6Sort :rder is ascending7
'otice that this type of sort is generally the way the information would e specified
in the %alue laels" !f this is the case0 sorting y category code will ha%e no effect"
Sorting y category codes is useful if you did not enter %alue laels for the %ariale"
!f no sort type is specified 6S4^'70 the output will e displayed in the same order as
specified y the %alue laels" !f the %alue laels do not contain all the %alues in the
data file 6such as mispunched data70 the unlaeled %alues will appear on the printout
in the order that they are encountered in the data file"
#dditionally0 a digit may e added as a suffi9 to the S:^# or S:^@" !t is used to
sort the %alue laels e9cluding the last one or more %alue laels" 4his is useful when
the last %alue lael is an OotherO category0 and you want to sort the %alue laels0 ut
still lea%e the Oother O as the last row in the report" 8or e9ample S4^8 S:^@1 would
sort the %alue laels in descending order y fre;uency0 e9cept it would lea%e the last
%alue lael as the last row regardless of its fre;uency"
Truncate Labels
?ery long %alue laels may sometimes e9ceed the space allocated for them in the
printout" !n those situations0 you may set the program to either truncate the %alue
laels 64.^J e9cludes the ending portion of the lael70 or to use multiple lines to
print the entire %alue lael 64.^'7"
Cumulative Percents
When the fre;uency tale is printed in e9panded format0 you may print or e9clude
cumulati%e percents with the CP option" 4his would e specified as5
StatPac For Windows User's Manual Basic 0nalyses &!!
:P4!:'S CP^J 64urn on cumulati%e percents7
:P4!:'S CP^' 64urn off cumulati%e percents7
Confidence Intervals
Confidence inter%als for proportions can e re;uested with the C! option" 8or
e9ample0 to re;uest the 92` confidence inter%als0 you would use the option C!^920
and the 99` confidence inter%als could e re;uested y C!^99" Confidence inter%als
allow us to estimate the proportions in the population for each of the response
categories" !f repeated samples are ta,en from the population0 we would e9pect the
category proportions to fall within the confidence inter%als" When confidence
inter%als are re;uested0 cumulati%e percents will not e printed regardless of the
setting of the CP option"
Confidence inter%als are calculated y first computing the estimated standard error of
the proportion0 and then using the t distriution to find the actual inter%al" 'ote that
the finite population correction factor 61-nM'7 is used to adHust the standard error if
the sample represents a large proportion 6say greater than ten percent7 of the
population" When the sample is large0 use the 8P options to specify the population
siBe 6i"e"0 8P^90 where 9 is the siBe of the population7" !f the 8P option is not
specified0 no correction will e applied"
&'ample of an Confidence Intervals 4round 4 Percent
Critical T Probability
#fter performing a fre;uency analysis0 researchers are often interested in
determining if there is a significant difference etween the %arious categories" 4he
Chi-s;uare statistic is often used to determine if the oser%ed fre;uencies mar,edly
differ from the e9pected fre;uencies" 4he prolem with the Chi-s;uare statistic is
that it does not isolate the significant differences 6i"e"0 it only tells whether or not one
e9ists7" StatPac uses a t-test to compare all possile pairs of categories to determine
where the actual differences lie"
4he C4 option may e set etween 0 and 1" When C4^00 no t-tests will e performed
or printed" !f C4^10 the t-statistic and proaility will e printed for all possile pairs
of categories" # typical setting for the critical t proaility is 2` 6C4^"027" !n this
case0 StatPac will print the t-statistic and two-tailed proaility for all pairs of
categories that ha%e a proaility of p^"02 or less" StatPac uses the following
formula to calculate the t-statistic5
&!* Basic 0nalyses StatPac For Windows User's Manual
&'ample of a Critical T Probability 4nalysis
Percentage !ase
4he percentage ase on a fre;uency analysis can either e the numer of respondents
6'7 or the total numer of responses" !f P&^'0 the denominator for calculating
percentages will e the numer of respondents" !f P&^$0 the denominator will e the
total numer of responses for all indi%iduals"
%ultiple Response
Sur%eys often include ;uestions in which the respondent is as,ed to ma,e more than
one response to a single ;uestion" #n e9ample of the ,ind of ;uestion that is
appropriate for multiple %ariale response is5
1" Which of the following ser%ices did you useY
6Chec, all that apply7
XX Counseling
XX Io placement
XX $emedial reading
XX $emedial math
XX $esume writing
4he multiple response fre;uency analysis is used to summariBe these ,inds of items"
When designing a study that includes this type of ;uestion0 each choice is considered
as a separate %ariale" 4he %alue laels need to e specified only for the first
%ariale0 ut it is fine if they are specified for all the multiple response %ariales"
StatPac For Windows User's Manual Basic 0nalyses &!-
?1 OSer%icesX1O Ser%ices >sed
1^Counseling
2^Io placement
3^$emedial reading
3^$emedial math
2^$esume writing
?2 OSer%icesX2O Ser%ices >sed
?3 OSer%icesX3O Ser%ices >sed
?3 OSer%icesX3O Ser%ices >sed
?2 OSer%icesX2O Ser%ices >sed
4he synta9 for the multiple response fre;uency analysis is5
8$AC>A'C!AS [?ariale list\
:P4!:'S 1$^J
!n this e9ample0 all the %ariales in the %ariale list will e treated as one multiple
response %ariale" #nother way to use the 1$ option is to re-specify the %ariale
numers 6not the %ariale names7 that should e grouped"
8$AC>A'C!AS [?ariale list\
:P4!:'S 1$^6[?ariale list\7
'ote that the parentheses are re;uired around the %ariale list in the options line" !n
the ao%e e9ample0 the commands would e5
8$AC>A'C!AS ?1-?2
:P4!:'S 1$^6?1-?27
4he output will contain the counts and percents for each of the response %alues" 4hat
is0 how many times code 1 6counseling7 was chosen for any %ariale0 how many
times code 2 6Ho placement7 was chosen for any %ariale0 etc" !n other words0 it will
print the total numer of times that each response was recorded for %ariales 10 20 30
3 and 2 comined"
4he options line may e used to specify se%eral multiple response analyses y using
additional sets of parentheses in the 1$ option" 4he following commands would
perform three different tas,s 6each one eing a multiple response analysis on a new
set of %ariales7"
8$AC>A'C!AS ?1-?20
:P4!:'S 1$^6?1-?1076?11-?1276?1--?207
&!; Basic 0nalyses StatPac For Windows User's Manual
1ultiple response may also e used when the ;uestionnaire limits the choices to less
than the numer of possile responses" 8or e9ample0 the following ;uestion as,s for
two responses from the same %alue laels list5
1) = 1(" Write the numers of your two fa%orite foods from the list elow"
XXXXX XXXXX
1 ^ <otdogs
2 ^ <amurgers
3 ^ 8ish
3 ^ $oast &eef
2 ^ Chic,en
- ^ Salad
'otice that there are two %ariales 61) = 1(7 that hold the information for this
;uestion" &oth %ariales use the same %alue laels and the responses to oth
%ariales are weighted e;ually 6i"e" the first one is not more important than the
second7" 1ultiple response assumes that all %ariales to e analyBed ha%e the same
%alue laels" !n this e9ample0 the command would e5
8$AC>A'C!AS ?1) ?1(
:P4!:'S 1$^6?1) ?1(7
&'ample of a %ultiple Response Fre=uency 4nalysis
!f you ha%e imported the data from an e9ternal source0 the multiple response data
might not e in StatPac format" Se%eral other commercial software pac,ages use
dichotomous multiple response0 where the data for all multiple response %ariales is
either one or lan,""
StatPac For Windows User's Manual Basic 0nalyses &!'
4he 1*^Code option can e used in conHunction with the 1$ option to tell StatPac
that the data for the %ariales are dichotomous" 4he OCodeO is the single character
%alue that indicates the item is selected" !n the ao%e e9ample0 the data was coded as
ones and lan,s0 so 1* would e set to 1" !f the data had een coded as J and '0
then 1* would e set to J"

8re;uencies ?1-?3
:ptions 1$^J 1*^1
""

>sing this method does not actually change the data file" StatPac Hust reads the data
differently for the fre;uencies procedure" #n e9clamation mar, cannot e used to
permanently set the 1* option" !t must e e9plicitly specified in each procedure
where you want to use it" !f you want to permanently change the data0 use the
Con%ersion >tility program"
Category Creation
4he actual categories in the fre;uency analysis can e created either from the study
design %alue laels 6CC^.7 or from the data itself 6CC^@7" When the categories are
created from the laels0 the %alue laels themsel%es will e used to create the
categories for the analysis0 and data that does not match up with a %alue lael code
will e counted as missing" 4hat is0 mispunched data will e counted as missing"
When categories are created from the data0 all data will e considered %alid whether
or not there is a %alue lael for it"
One 4nalysis
4he one-analysis option allows you to print fre;uency analyses for se%eral %ariales
on one page" 4his option is especially useful for management reporting when the
information needs to e condensed and concise"
#ll the %ariales specified with the :# option must ha%e the same %alue laels" #n
e9ample might e a series of JesM'o ;uestions or .i,ert scale items" 4he important
point is that each %ariale has e9actly the same %alue laels as the other %ariales"
8or e9ample0 suppose that %ariales 21-30 are ten items as,ing the respondents to
rate the item as low0 medium or high" 4he following commands would produce a one
page summary of all ten items5
8$AC>A'C!AS ?21-?30
:P4!:'S :#^J
4he one analysis option is limited y the numer of characters that can e printed on
a line 6i"e"0 y the pitch and carriage width of the printer7" !f there are too many
different %alue laels0 they will not e ale to fit on one line and the analysis will e
s,ipped" !f this should happen0 try rerunning the analysis using a compressed pitch"
#s a general rule0 each %alue lael will re;uire ten spaces on the output"
&'ample of a One:4nalysis Printout
&*> Basic 0nalyses StatPac For Windows User's Manual
4he :# option is used in fre;uency analyses to summariBe the fre;uencies of se%eral
%ariales that all contain the same %alue laels" 'ote the difference etween the :#
and 1$ options" With the multiple response option 61$70 the items are treated as if
they are a single %ariale" 4he one analysis option 6:#70 howe%er0 treats each item as
a separate analysis" 4he results0 howe%er0 will e summariBed on one page"
4he ,eyword $AC:$@ in the %ariale list creates a lan, line in the report" 8or
e9ample0 the following will print three rows0 a lan, row0 and then two more rows
8re; ?1 ?3 ?) $ecord ?9 ?12
:ptions :#^J
""
When the 1$ option is used in conHunction with the :# option0 the %ariales in the
1$ options list will e treated as multiple response %ariales" 4his ma,es it easy to
create nets in a fre;uencies with the :#^J option"
8or e9ample0 if ?1-?20 are the twenty %ariales0 we could add a net y first creating
a duplicate copy of ?1 with a new name0 and then including the 1$ option to
comine the %ariales to ma,e the net" 4he net will e the sum of the counts of the
indi%idual %ariales that ma,e up the 1$ %ariale list"
S4>@J Jourstudy
'AW 6'17 OFrand-4otalO
C:1P>4A Frand-4otal ^ ?1
.#&A.S Frand-4otal 61^#gree762^'eutral763^@isagree7
8$AC Frand-4otal ?2-?20 ?1-?20
:P4!:'S :#^J 1$^6Frand-4otal ?2-?207
""
4he results might loo, li,e this5
StatPac For Windows User's Manual Basic 0nalyses &*1
#gree 'eutral @isagree
Frand-4otal -------- -------- --------
?ariale 1 -------- -------- --------
?ariale 2 -------- -------- --------
?ariale 3 -------- -------- --------
etc"
4he following is another e9ample shows how you can use 1$ option in conHunction
with the :# option to create comple9 nets" !t also shows how the reser%ed word
O$AC:$@O can e used to create lan, lines in the report"
Suppose we are conducting of sur%ey of go%ernment policies" We ha%e nine
O#greeM@isagreeO items coded as 1^#gree and 2^@isagree" 4he first three items deal
with OSocial PolicyOW the ne9t three items with O8oreign PolicyOW and the last three
items with O8iscal PolicyO" We would li,e to produce a report that loo,s something
li,e this5
Peoples #ttitudes 4owards Fo%ernment Policies
6'^97 #gree @isagree
:?A$#.. ----- -----
S:C!#. P:.!CJ ----- -----
!tem 1 ----- -----
!tem 2 ----- -----
!tem 3 ----- -----
8:$A!F' P:.!CJ ----- -----
!tem 3 ----- -----
!tem 2 ----- -----
!tem - ----- -----
8!SC#. P:.!CJ ----- -----
!tem ) ----- -----
!tem ( ----- -----
!tem 9 ----- -----
4here are four different nets in this report" 4he :?A$#.. net includes all %ariales"
4he S:C!#. P:.!CJ net includes the first three items0 the 8:$A!F' P:.!CJ net
the ne9t three items0 and the 8!SC#. P:.!CJ net the last three items" 8or this
e9ample !tems 1-9 are stored in %ariales 1 to 9"
4he spacing 6indentation7 in this e9ample is used only to ma,e the procedure easier
to understand" !t is not necessary to use the this type of spacing in your procedures"
S4>@J Jourstudy
&*& Basic 0nalyses StatPac For Windows User's Manual
<A#@!'F Peoples #ttitudes 4owards Fo%ernment Policies
C:1P>4A 6'17 :?A$#..^?1
C:1P>4A 6'17 S:C!#. P:.!CJ^?1
C:1P>4A 6'17 8:$A!F' P:.!CJ^?3
C:1P>4A 6'17 8!SC#. P:.!CJ^?)
.#&A.S :?A$#..
S:C!#. P:.!CJ
8:$A!F' P:.!CJ
8!SC#. P:.!CJ
61^#gree762^@isagree7
8$AC :?A$#.. ?2-?9 Produces o%erall net
$AC:$@ Produces a lan, line
S:C!#. P:.!CJ ?2-?3 Produces social policy net
?1-?3 Produces 3 social policy %ariales
$AC:$@ Produces a lan, line
8:$A!F' P:.!CJ ?2-?- Produces foreign policy net
?3-?- Produces 3 foreign policy %ariales
$AC:$@ Produces a lan, line
8!SC#. P:.!CJ ?(-?9 Produces fiscal policy net
?)-?9 Produces 3 fiscal policy %ariales
:P4!:'S S?^' :#^J
1$^6:?A$#.. ?2-?97
6S:C!#. P:.!CJ ?2-?37
68:$A!F' P:.!CJ ?2-?-7
68!SC#. P:.!CJ ?(-?97
""
$pecial Value Label 1ID&
When performing a fre;uencies with the :# option0 it is often desirale to only
display some of the response categories" $ecoding undesirale categories to missing
is one method to e9clude it from the tale" 4his will eliminate the column from the
tale and from any calculations of percentages on the tale"
8or e9ample0 assume the following counts for ?15
1 2 3
#gree 'eutral @isagree 'o $esponse 4otal '
30 20 30 10 100
!f P&^'0 6denominator e;uals numer of respondents70 the percents will e5
#gree 'eutral @isagree
30` 20` 30`
!f P&^$0 6denominator e;uals numer of responses70 the percents will e5
StatPac For Windows User's Manual Basic 0nalyses &*1
#gree 'eutral @isagree
30M90^33` 20M90^22` 30M90^33`
We could use the following $AC:@A command to eliminate the O'eutralO category
from the tale5
$AC:@A ?1 62^ 7
!f P&^'0 the percents will still e ased on a denominator of 100" !f howe%er0 P&^$0
then the percents will e ased on a denominator of )0 630]3075
#gree @isagree
30M)0^33` 30M)0^2)`
4he special %alue lael O<!@AO may e used to suppress printing of a %alue lael
without reducing the denominator for the percents calculations" 4he following
.#&A.S command could e used to eliminate the O'eutralO category from the tale0
while still including the O'eutralO count in the denominator5
.#&A.S ?1 61^#gree762^<ide763^@isagree7
#ny row or column that has a %alue lael of O<!@AO will not e printed0 ut it will
e included in the percent calculations when P&^$" 'ote that the percentages are
ased on the counts for all %alue laels 6including the O'eutralO category70 e%en
though all the %alue laels are not displayed in the tale"
#gree @isagree
30M90^33` 30M90^33`
!f you only wanted the O#greeDsO to show in the tale0 you could use the following
statements in the procedure" 4he percentages in the tale would still e ased on 905
.#&A.S ?1 61^#gree762^<ide763^<ide7
:P4!:'S P&^$
Print Format
4he results from the one analysis option may e printed as row percents 6P8^$70 as
counts 6P8^'70 or oth 6P8^'$7" When row percents are re;uested0 the denominator
used to calculate the percents will e the numer of non-missing responses for that
particular item" 4hat is0 when there is missing data0 the numer of %alid responses to
a particular ;uestion may e different than the numer of %alid responses for any of
the other ;uestions"
&*) Basic 0nalyses StatPac For Windows User's Manual
Print Total
4he P4 option may e used in conHunction with the :# 6one-analysis7 option to print
the total ' for each %ariale" When there is considerale missing data0 this option is
highly recommended since each of the %ariales may e using a different ' 6numer
of %alid responses7" 8or e9ample0 the following commands would produce a one-
page report summariBing %ariales 21 to 30" #n additional column will e included
on the output that lists the numer of %alid cases for each of the %ariales"
8$AC>A'C!AS ?21-?30
:P4!:'S :#^J P4^J
$ort Variables
When performing a fre;uency analysis with the :#^J option0 you can sort the
%ariales y the contents of the first column of the results" 4he S? 6sort %ariales7
option may e set to O'O for no sort0 O#O to sort in ascending order0 or O@O to sort in
descending order" When no sort is specified0 the %ariales will e listed in the order
that they appear in the analysis command %ariale list" 4he S? option is applicale
only when the :#^J option is specified" <owe%er0 if the 1$ option is also
specified0 the S? option should e set to '"
#dditionally0 a digit may e added as a suffi9 to the S?^# or S?^@" !t is used to
sort the %ariales e9cluding the last one or more %ariales when the :#^J option is
specified" 4his is useful when the last %ariale is an OotherO %ariale0 and you want to
sort the %ariales0 ut still lea%e the Oother O as the last %ariale" 8or e9ample S?^@1
would sort the %ariales in descending order0 e9cept it would lea%e the last %ariale
as the last row regardless of its %alue"
$upplemental 1eading
4he supplemental heading will only e printed when the :#^J option is specified" !t
is a line of te9t that will appear efore the first row of the tale" 4he supplemental
heading may contain any te9t and should e enclosed in ;uotes" When the pounds
symol is used in the supplemental heading0 it will e printed as the numer of
cases" 4he S< option is usually used to indicate who is included in the tale" 4he
following is an e9ample of a supplemental heading5
:P4!:'S S<^O4:4#. $ASP:'@A'4S ^ /O
%inimum Denominator
Percentages can e misleading if they are ased on a small denominator" 4he 1@
option may e used to suppress the printing of percentages that are ased on a small
denominator" 4he 1@ option sets the minimum denominator that StatPac will use for
calculating percents" 8or e9ample0 if 1@^20 StatPac will calculate percentages if the
denominator is greater than or e;ual to 2" !f a denominator were less than 20 StatPac
would print dashes instead of the percent" ?alid %alues for 1@ are etween 0 and
100" !f 1@^00 all percentages will e printed"
Print %ean
4he mean a%erage is generally not calculated for a fre;uency ecause it in%ol%es the
assumption of inter%al data" <owe%er0 there are some situations where you may want
to display the mean as part of a fre;uency analysis" 4he 1A option may e used to
StatPac For Windows User's Manual Basic 0nalyses &*!
re;uest the mean 6and standard de%iation7" When 1A^'0 no mean will e printed" !f
1A^J0 the mean will e printed0 and if 1A^S0 oth the mean and standard de%iation
will e printed" When used in conHunction with the :#^J option0 a separate mean
will e printed for each %ariale"
%ean Position
When the 1A option is used with the :#^J option0 the means 6and standard
de%iations7 can e printed as the first or last column" !f 1P^80 the means will e
printed as the first column0 and when 1P^.0 they will e printed in the last column"
When means are printed in the first column 61P^870 and the S? option is used to
sort the %ariales0 they will e sorted y the means instead of the percents"
:abeling and Spacing Options
3tion Code Function
.aeling .& Sets the column headings to print the %ariale lael
6.&^A70 the %ariale name 6.&^'70 or the %ariale
numer 6.&^C7"
.aeling Width .W Set the ma9imum width 6in inches7 for the %ariale
laels on the stu when :#^J"
4runcate .aels 4. Sets long %alue laels to e truncated when 4.^J"
A9act Width AW When :#^J and AW^J0 the laeling width for the
stu will e e9actly what is specified with the .W
option" When AW^'0 the width of the stu will
self-adHust ased on the length of the stu laels"
Column Width CW Sets the minimum width of the columns 6in inches7
when :#^J"
Column Spacing CS Sets the spacing 6in inches7 etween the columns of
the listing when :#^J"
A9tra Spacing AS When AS^J0 a lan, line will e printed elow the
tale headings When AS^'0 no lan, line will e
printed"
&lan, .ine &etween $ows &. Sets the numer of lan, lines etween rows when
:#^J"
Print Percent Symol PP Sets whether percentage symols will e shown"
@ecimal Places @P Sets the numer of decimal digits that will e
shown"
Print Codes PC Sets whether the code 6to the left of the e;uals
symol7 will e shown with the %alue laels"
Open:&nded Response Coding
!t is often useful to code open-ended responses into response categories in order to
perform a fre;uency analysis or crosstas" 4he 8$AC>A'C!AS command with the
:A option allows you to e9amine and code open-ended alpha %ariales"
:pen-ended response coding is re;uested y performing a fre;uency analysis on the
%ariales containing the %eratim te9t and setting the option :A^J" @o not use an
!8-4<A' SA.AC4 command in the same procedure"
8$AC Comment
:P4!:'S :A^J
""
&** Basic 0nalyses StatPac For Windows User's Manual
When a %eratim response is held in more that one %ariale0 it is not necessary to
specify the 1$ 6multiple response7 option" #ll %ariales listed in the 8re;uencies
command will e considered to e part of the same %eratim comment" 4he
following procedure says to egin an open-ended response coding session on
%ariales one through three" 'ote that the te9t for all three %ariales will e displayed
at the same time during the coding session"
8$AC ?1 - ?3
:P4!:'S :A^J
""
Aach time you complete a coding session0 StatPac will create a new study and data
file called S4#4P#C-?A$&#4!1" 4he S4#4P#C-?A$&#4!1 study contains the
coded %eratim data0 and the fre;uency analysis will e performed on this file 6i"e"0
the coded data7" Jour original study and data file are not affected y the coding
process" #ll of the coded information is stored in the S4#4P#C-?A$&#4!1 file" !n
order to use this coded information in future analyses0 the S4#4P#C-?A$&#4!1
files must e merged with your study and data files using the 1A$FA command"
:ccasionally0 you may start a coding session0 and for one reason or another0 not e
ale to finish" Jou can ;uit the current coding session and continue at a future time"
4o continue with a pre%iously unfinished coding session 6i"e"0 one that you started
coding efore0 ut did not finish70 simply run the procedure again" StatPac will detect
the e9istence of a partially completed S4#4P#C-?A$&#4!1 file0 and as, if you
want to continue with the pre%ious %eratim coding0 or delete the e9isting %eratim
coding and egin a new coding session"
Clic, on the Continue Pre%ious Session utton to continue with the pre%ious coding0
or the Start 'ew Coding Session utton to delete the e9isting S4#4P#C-
?A$&#4!1 files" !f your intent is to continue with a pre%ious session0 you can
ypass this ;uestion y changing the :A option from :A^J to :A^C 6continuation7"
Verbatim !laster
StatPac for Windows has the ?eratim &laster module uilt in and it will
automatically pre-code all open-ended responses"
?eratim &laster processes open-ended responses in two steps" 4he first step is
called pre-coding0 and the second step is called !inal coding" Jou may modify or
interact with the coding process at either or oth steps"
4he pre-coding step will e performed first" ?eratim &laster will read the file and
count all the uni;ue words that occur in the te9t" !t attempts to comine %ariations of
StatPac For Windows User's Manual Basic 0nalyses &*-
the same word into a single root word" 8or e9ample0 it would attempt to comine
singulars and plurals0 different tenses0 prefi9es and suffi9es into a single root word"
4he pre-coding is not perfect0 ut it will catch nearly all %ariations on each root
word"
4he result of the pre-coding will e to present you with a list of root words along
with the numer and percent of respondents who used each word" 4he list will e
initially sorted in descending order y fre;uency of occurrence in the te9t" 4hus0 the
words at the top of the list appeared most often in the te9t" !f a respondent used the
same word more than once0 it will only e counted as one occurrence in calculating
the fre;uencies"
4he pre-coding screen appears5

$tep ) : &'amine -ords
4he most important tas, in Step 1 6pre-coding7 is to familiariBe yourself with the
asic content of the %eratim comments"
When no words are selected 6highlighted7 in the word list0 the Pre%ious and 'e9t
uttons will show the pre%ious and ne9t records"
# more important feature is the aility to e9amine the conte9t in which specific
words are used" 8irst select the word or words you are interested in e9ploring y
clic,ing on those words in the word list" 4hen the Pre%ious and 'e9t uttons can e
used to find the pre%ious and ne9t comments that used any of the selected words" 4he
selected word6s7 will e shown in red to draw your eyes to that portion of the
comment"
Clic,ing on a word that is not already selected will select the word" Clic,ing on a
word that is already selected will deselect the word"
&*; Basic 0nalyses StatPac For Windows User's Manual
?oin -ord Variations
@uring pre-coding0 one of the maHor functions of ?eratim &laster is to comine all
the %ariations of each root word" !t is generally a good idea to re%iew the words and
to comine any %ariations that ?eratim &laster may ha%e missed" !t will usually not
miss any0 ut itDs still a good idea to chec,"
!n the 4ype of Sort window0 clic, on #lphaetic" 4hen use scroll ar to scroll through
the list" !t will e easy to spot %ariations of the same root word that were not
comined since they will appear ne9t to each other in the alphaetically sorted list"
!f you should find two %ariations of the same root word0 you will want to Hoin them
together so ?eratim &laster treats them as a single uni;ue word" 8irst select the
words to e Hoined y clic,ing once on each word" 4he selected words will e
highlighted" Jou may Hoin more than two words at once y clic,ing on each word"
4hen clic, the Ioin utton" 4he words will e Hoined and the count and percent will
e modified to reflect the new %alues" 4he important thing is to Hoin words that are
%ariations of the same root word or words that ha%e the same meaning"
Jou may Hoin words during pre-coding or final coding" <owe%er0 Hoining word
%ariations is easiest during the pre-coding process ecause of the aility to perform
an alphaetical sort"
When you ha%e finished Hoining words0 clic, on 8re;uency in the 4ype of Sort
window to re-sort the list in descending order y fre;uency of occurrence" @uring
the final coding process0 it is usually most con%enient to ha%e the most common
responses appear near the top of the response category list"
Delete and &'clude -ords
4here are many words that add little meaning to a sentence" Words li,e o!0 te0 !or0
by0 tis0 and hundreds of others donDt add much to the meaning of a respondentDs
statement" 4hese words could e e9cluded from a sentence without sustantially
distracting from its meaning"
1odifiers are words that are used to descrie the ;uantity or magnitude of the word
or phrase that follows the modifier" 4hey are usually ad%ers" A9amples are usually0
mostly0 and greatly" 1odifiers do add meaning to a sentence0 ut they are generally
not helpful in determining the maHor topic of a sentence"
?eratim &laster maintains a list of e9clusionMmodifier words in a file called
A*C.>@A"4*4" 4his file is an #SC!! te9t file and may e edited with any word
processor or te9t editor" !t contains an alphaetical listing of words that do not help
identify the primary topic of a sentence"
4he first thing ?eratim &laster does when you as, it to analyBe a te9t file is to
eliminate the e9clusionMmodifier words" !t doesnDt really eliminate the wordsW it Hust
pretends theyDre not there"
4he e9clusionMmodifier list distriuted with ?eratim &laster is fairly complete"
<owe%er0 specific applications may re;uire that you add new words to this list" Jou
can use any te9t editor to modify the A*C.>@A"4*4 file" Words added with a te9t
editor will e sorted into alphaetic order the ne9t time that ?eratim &laster is run"
Jou can also add e9clusionMmodifier words to this file during pre-coding" !f you see
a word that doesnDt add sustantial meaning to sentence0 add it to the
e9clusionMmodifier list y clic,ing on the word to select it0 and then clic,ing on the
A9clude utton" 4he word6s7 will e added to the A*C.>@A"4*4 file and will e
e9cluded from all future open-ended coding session"
@eleting words is different that e9cluding words" @eleting a word with the delete
utton will delete the word from the current session only" 8uture coding sessions
StatPac For Windows User's Manual Basic 0nalyses &*'
with other %eratim te9t would show the word" 4o delete a word0 clic, on the word to
highlight it and clic, the @elete utton"
$et te %inimum Percent to Display
# typical te9t file might contain 300 to 200 uni;ue root words 6e%en after comining
all the %ariations of the same words and eliminating the e9clusion words7" >sually0
we wouldnDt want to loo, at a list of this siBe" !nstead0 weDre most often interested in
responses that were made y more than one respondent" ?eratim &laster lets you
adHust the siBe of the word list y specifying a minimum percent" 4his is the
minimum proportion of respondents that used a word" 8or e9ample0 if you set the
minimum percent e;ual to fi%e0 ?eratim &laster will display words that were used
y at least fi%e percent of the respondents" Words that were used y less than fi%e
percent of the respondents would e hidden from your %iew"
#t any time during pre-coding0 you may change the minimum percent" When the
minimum percent is set to Bero0 all words will e displayed" 4o change the minimum
percent0 simply type the new minimum percent and press enter"
$tep < : $elect -ords for Categories
4he purpose of pre-coding is to identify the important words that are mentioned y
respondents" O!mportantO is0 of course0 a suHecti%e decision" 4he minimum percent
feature will narrow the numer of words to a manageale list" Step 2 is to select
those words that seem to hit upon the ,ey concepts in respondentsD answers"
Sometimes these will e easy to identify0 and other times they wonDt" !f the sur%ey
;uestion was e9tremely specific0 it will proaly e easy to identify the ,ey concept
words0 and if the sur%ey ;uestion was ;uite general0 it might e e9tremely difficult to
identify the ,ey concepts"
OSelect Words for CategoriesO refers to identifying the ,ey concept words that will e
carried forward to the final coding process" 4o select a word0 or to deselect a word
that has already een selected0 clic, on it in the word list"
!f you select any words0 only those words will e carried forward to the final coding
process0 and words not selected will e e9cluded" !f you do not select any words0 all
displayed words will e carried forward to final coding"
$tep @ : Final Coding
4he final coding process is where you refine the coding and the response category
laels" 4he words selected in the pre-coding process pro%ide the foundation for the
final response categories" 4hese are the laels you gi%e to the ,ey concepts" 4he
initial response categories will e the words that were selected during pre-coding"
4he final coding process in%ol%es re%iewing the actual open-ended responses for
each respondent0 and using your understanding of the comment6s7 to refine the
response category laels" # response category lael can e changed at any time" 4o
change the te9t in a response category lael0 doule clic, on the lael"
4he text window 6respondentDs %eratim te9t7 will appear at the left of the screen0 and
the response categories window will appear on the right" 4here will e an arrow to
the left of all response categories that were mentioned y the respondent0 and the ,ey
words in the te9t will e highlighted"
&-> Basic 0nalyses StatPac For Windows User's Manual
$elect and Deselect a Response Category
>se the mouse to select and deselect a response category" When a response category
is selected0 an arrow will appear to the left of that category" 4his means that the
current respondent made a comment related to that response category" !f a response
category is not selected0 there will e no arrow" Clic,ing to the left of the response
category lael 6in the small area reser%ed for the arrows7 will select or deselect that
response category"
Cange Records
# record is the same as a respondent" 4hus0 when we say canging records0 it simply
means displaying a different respondentDs answer" 4here are two ways to change
records"
4he first way is used to show a specific desired record" Clic, on the record numer
shown on the top left of the Conte9t window" #fter clic,ing on the record numer0
change it to the desired record and press enter"
4he second way is to use the Pre%ious and 'e9t uttons to change to the pre%ious
and ne9t records" When no response category laels are highlighted0 the Pre%ious and
'e9t uttons will ad%ance to the pre%ious or ne9t record numers" When one or more
response category laels are highlighted0 the pre%ious or ne9t record that has een
pre-coded into that category will e displayed" 4he current record numer will e
displayed ao%e and to the left side of the conte9t windows"
:ne method of performing the final coding would in%ol%e repeatedly clic, the 'e9t
utton to re%iew the coding eginning with the first respondent and going to the last
respondent" ?eratim &laster will s,ip o%er respondentDs who did not ma,e a
comment"
#nother method of pre-coding would e to e9amine the comments for each response
category" 8irst0 highlight the response category 6or categories7 you want to search for"
StatPac For Windows User's Manual Basic 0nalyses &-1
4hen clic, the 'e9t utton to search for the ne9t record that contains a reference to
that response category" Aach time you clic, the 'e9t utton0 the ne9t record with a
reference to that response category will e displayed" When the last record in the te9t
file is reached0 the search will e stopped"
4he search feature pro%ides a ;uic, way to gain a etter understanding of a particular
response category" !t lets you scan all comments related to a specific response
category" While using the search feature0 the search will e limited to the response
category currently eing searched" 4his ma,es it e9tremely easy to scan the rele%ant
te9t" Scanning a particular response category will gi%e you a etter understanding of
the comments coded into that category"
Cange a Response Category Label
Sometimes0 it might e necessary to change or delete an e9isting response category0
or to create a new category" 4he response category laels can e changed at any time
y simply typing the new te9t" @oule-clic, on the response category lael you want
to change and then you will e ale to edit the category lael"
Delete and Create Ne" Response Categories
4o create a new response category0 highlight a response category and clic, the Create
Category utton" 4his will insert a lan, line in the response categories so you can
type the new response category lael on that line" !f you create a new response
category using this method0 you will need to go through each record and decide
whether or not that record falls into the newly created response category" ?eratim
&laster does not automatically code responses ased on the words you type"
4o delete a response category0 highlight it and clic, the @elete Category utton" 4he
response category will e immediately eliminated" 4here is no automatic OundeleteO0
so e careful" Jou might use @elete Category utton to eliminate a response category
you consider to e unimportant"
?oin T"o Response Categories
Sometimes you will want to comine response categories that you initially thought
were different" Jou may Hoin response categories 6at any time7 into a single category"
Clic, the Ioin utton" 4hen drag and drop one of the categories onto the other
category" 4he category you dragged will e deleted and all the responses that were
initially assigned to that category will e reassigned to the category you drop it on"
4o drag a category0 mo%e the mouse pointer o%er that category" Press and hold the
left mouse utton" While still holding the mouse utton0 mo%e the mouse so the
category outline is o%er the category to e Hoined and then release the mouse utton"
'ote that once you use the Hoin category feature0 there is no way to return to the
unHoined %ersion" 4here is no automatic OunHoinO0 so e careful"
Create a Net Response Category
Creating a net category is a useful method of aggregating responses" !t is similar to
Hoining response categories e9cept that the secondary response category is not
remo%ed as a uni;ue entry in the response category list"
4he most common use of a net category is to summariBe a group of related response
categories without affecting the e9isting categories" 8or e9ample0 suppose you were
e%aluating respondents preferences for a new food and there were response
categories of red0 green0 and lue" Jou might want to create a net category called
color" Jou could use the Ioin utton to Hoin the three categories0 ut you would then
e unale to rea, down the respondents y their indi%idual color choices" Creating a
net category is the solution to the prolem"
&-& Basic 0nalyses StatPac For Windows User's Manual
4o create a net category0 first create a new lan, line for the 'et category" <ighlight
a category and clic, on the !nsert Category utton to open up a lan, line in the
response category list" 4his lan, line will ecome the net category" 'e9t clic, the
'et utton to egin net creation" 8inally0 drag the category you want to net and drop
it on the lan, line" #dditional response categories can now e added to the new net
category" Clic, 'et again0 and drag another category to the new 'et category"
$esponse categories may e included in a net one at a time using this method"
!f you ma,e a mista,e while creating or adding to a net0 clic, on the Cancel utton to
cancel the process" !f you inad%ertently add a wrong %ariale to a net0 delete the net
with the @elete Category utton and recreate the net"
Cange te Order of te Response Categories
!t is sometimes desirale to rearrange the order of the response categories" 4o mo%e a
response category0 clic, the 1o%e utton" 4hen select a category0 drag it to a new
position0 and drop it in the new position in the response category laels list
Finis te Coding Process
!f you wish to e9it the open-ended response coding program efore finishing the
coding process0 ma,e a note of the current record numer and clic, the Stop 8or
'ow utton" 4o continue where you left off at a future time0 run the same procedure
again0 and select Continue Pre%ious Session" 4hen clic, on the current record
numer on the top left of the Conte9t window0 type the record numer where you left
off0 and press enter"
4o finish the coding process0 and run the fre;uency analysis on the coded data0 clic,
the #nalyBe utton" 4he fre;uency analysis will e performed on the coded data"
#fter %iewing the results of the analysis0 StatPac will as, if you want to merge the
coded %eratim responses" 8or e9ample0 you may want to use the coded %eratim
information in other analyses 6e"g" crosstas of the %eratim responses with other
%ariales7" Since StatPac can only analyBe one study at a time0 you should merge the
coded responses 6i"e"0 the S4#4P#C-?A$&#4!1 file7 with your original study and
#fter running the merge procedure0 your original file will contain all the original data
6including the original %eratim comments7 and the new coded %eratim comments"
4he coded comments 6from the S4#4#C-?A$&#4!1 file7 will e added to the end
of your original %ariales0 so running the procedure will increase the numer of
%ariales in your original study"
Produce a List of Verbatim Comments for &ac Response
Category
#fter merging a coded %eratim file0 you can merge the S4#4P#C-?A$&#4!1
procedure file into your e9isting procedure file" 4he S4#4P#C-?A$&#4!1
procedure file is created automatically when you do a merge" !t contains a series of
procedures to print a listing of the %eratim responses that were coded into each
response category" 4o merge the file0 position the cursor at the eginning of the line
StatPac For Windows User's Manual Basic 0nalyses &-1
following two dots" 4hen select 8ile0 1erge0 and select S4#4P#C-?A$&#4!1 as
the file to merge"
CR3SS:0BS Co((and
Crosstas is one of the easiest ways to loo, at the relationship etween two %ariales0
and one of the most popular ways of e9amining categorical data"
4he synta9 for the crosstas analysis is5
C$:SS4#&S [?ariale list\ &J [?ariale list\
8or e9ample0 letDs loo, at how peopleDs e9pectations for learning 6A*PAC4#4!:'7
are related to their satisfaction with a lecture 6S#4!S8#C4!:'7" 4he command to
re;uest this crossta analysis is5
C$ A*PAC4#4!:' &J S#4!S8#C4!:'
6C$:SS4#&S may e are%iated C$7
4he results will e printed in the form of a two-dimensional matri9" 4he first %ariale
6A*PAC4#4!:'7 will y printed on the y a9is0 while the second %ariale
6S#4!S8#C4!:'7 will e printed on the 9 a9is" 4he ,eyword &J is a mandatory
part of the statement"
!f se%eral different crosstas are desired0 re;uest them y specifying a %ariale list
instead of an indi%idual %ariale" 8or e9ample0 you might e interested in oth
S#4!S8#C4!:' with the lecture and the amount of actual .A#$'!'F that
occurred" 4he command to run this analysis would e5
C$:SS4#&S A*PAC4#4!:' &J S#4!S8#C4!:'0 .A#$'!'F
4he matri9 siBe that the crosstas program can accommodate depends on the
a%ailale $#1" 4he %ariales themsel%es may e alpha or numeric" StatPac will not
print a row or column when total count for that row or column is Bero" 1issing data
6lan,s7 will e e9cluded from the analysis unless there is a %alue lael for lan,
data 6e"g"0 &.#'E^1issing data7"
4hree-way crosstas may e re;uested y the following command5
C$:SS4#&S [?ar" list\ &J [?ar" list\ &J [?ar" list\
# three-way crossta is essentially a series of two-way crosstas controlled for a
third %ariale" 4hat is0 the two-way crosstas are performed on susets of the data as
defined y the third %ariale" 8or e9ample0 consider the following crosstas
command5
C$:SS4#&S A*PAC4#4!:' &J S#4!S8#C4!:' &J SA*
&-) Basic 0nalyses StatPac For Windows User's Manual
4his command will produce two different crossta tales0 one for males and the other
for females" 4he same results could e otained y e9ecuting the following two
procedures5
!8 SA*^O1O 4<A' SA.AC4
C$:SS4#&S A*PAC4#4!:' &J S#4!S8#C4!:'
""
!8 SA*^O8O 4<A' SA.AC4
C$:SS4#&S A*PAC4#4!:' &J S#4!S8#C4!:'
""
CountAPercent 2 ObservedA&'pected Tables
4here are two common ways to print crosstas" :ne is numer0 row percent0 column
and total percent" 4he second is oser%ed0 e9pected0 oser%ed minus e9pected0 and
the cells contriution to the total chi-s;uare" &oth of these tales may e printed or
e9cluded using J or ' options" 4o print oth tales0 use the following options5
:P4!:'S CP^J :A^J
4he chi-s;uare is an important statisticW it is used to test whether two %ariales are
independent of each other" !n other words0 do the oser%ed fre;uencies in the cells
de%iate mar,edly from the fre;uencies we would e9pect if the two %ariales were not
related to each otherY
# large chi-s;uare statistic indicates that the oser%ed fre;uencies differ significantly
from the e9pected fre;uencies" # crossta with r rows and c columns is said to ha%e
6r-17 times 6c-17 degrees of freedom"
>sing the chi-s;uare distriution and its associated degrees of freedom0 you can
calculate the proaility that the differences etween the oser%ed and e9pected
fre;uencies occurred y chance" Fenerally0 a proaility of "02 or less is considered
to e a significant differenceW this proaility is termed Oproaility of chanceO in the
output"
When a crossta contains many cells with counts less than fi%e0 the proaility of
chance for the chi-s;uare statistic can e inaccurate" 4herefore0 the user should
consider grouping some rows andMor columns if many cells ha%e e9pected %alues less
than fi%e"
4he second way of printing crosstas 6oser%edMe9pected tale7 is useful in
e9plaining the significance of the chi-s;uare statistic" 4he cells with high %alues in
the Ocontriution to the chi-s;uareO are the ones that OcontriuteO the most to the
significance of the chi-s;uare" 4his is useful in the discussion of the results of a study
as there are often only a few cells which de%iate from independency"
StatPac For Windows User's Manual Basic 0nalyses &-!
&'ample of a CountAPercent Table
Print Format
Aach cell of the crosstas tale may contain up to four numers" 4heir meanings are
laeled in the upper left corner of the tale" Jou may choose to print or suppress any
of these numers y using the P8 option" 4he parameters for this option are5
' 'umer or oser%ed fre;uency
$ $ow percent or e9pected fre;uency
C Column percent or oser%ed minus e9pected
4 4otal percent or contriution to chi-s;uare
:ne or more parameters may e used with the P8 option" 4hese should not e
separated from each other" 8or e9ample0 if you want to print the numer and total
percent0 use the following option5
:P4!:'S P8^'4
!f a tale is too large to fit on one page0 it will e split to use as many pages as
necessary" 4he actual numer of columns that can fit on a page is determined y the
pitch and carriage width of your printer"
Category Creation
4he actual categories 6rows and columns7 in the crossta analysis can e created
either from the study design %alue laels 6CC^.7 or from the data itself 6CC^@7"
&-* Basic 0nalyses StatPac For Windows User's Manual
When the categories are created from the laels0 the %alue laels themsel%es will e
used to create the categories for the analysis0 and data that does not match up with a
%alue lael code will e counted as missing" 4hat is0 mispunched data will e
counted as missing" When categories are created from the data0 all data will e
considered %alid whether or not there is a %alue lael for it"
$ort Codes
4he actual laeling for the 9 and y a9es are ta,en from the %alue laels" !n most
circumstances0 the order that you entered the %alue laels 6during the study design7
reflects the order in which you want the %alue laels to e listed" Jou can o%erride
the order of the %alue laels in the study design y using the option 6SC^J7" 4he
%alue laels will then e displayed in ascending alphaetical or numeric order" 4his
feature is especially useful when the study design itself does not contain any %alue
laels" !f this option is not used 6i"e"0 SC^'70 the order of the %alue laels on the
printout will reflect the order in which %alues are encountered in the data file"
$tatistics
When the statistics option is specified0 se%eral other statistics will e calculated and
printed"
&'ample of a $tatistics Printout
# discussion of each statistic follows5
Pi
4he Phi statistic is calculated and printed for two-y-two tales" !t may e
interpreted as a measure of the strength of the relationship etween two %ariales"
When there is no relationship0 Phi is Bero" When there is a perfect positi%e
relationship0 Phi is one" When there is a perfect negati%e relationship0 Phi is minus
one"
When comparing one crossta tale to another0 Phi is preferale to the chi-s;uare
ecause it corrects for the fact that the chi-s;uare statistic is directly proportional to
the numer of cases" !n other words0 Phi could e used to compare two crosstas
with une;ual 'Ds"
CramerBs V
!f Phi is calculated for tales larger than two-y-two0 there is no upper limit to its
%alue" 4herefore0 the Phi statistic is not printed for tales greater than two-y-two"
!nstead0 CramerDs ? is printed" CramerDs ? adHusts the Phi for the numer of rows and
columns so that its ma9imum %alue is also one" !t may e interpreted e9actly li,e the
Phi 6e"g"0 a large CramerDs ? indicates a high degree of association etween the two
%ariales7"
StatPac For Windows User's Manual Basic 0nalyses &--
Contingency Coefficient
4he contingency coefficient is another measure of association ased on the chi-
s;uare statistic" !t may e calculated for any siBe of taleW howe%er0 its ma9imum
%alue will %ary depending on the numer of rows or columns" 4herefore0 the
contingency coefficient should only e used to compare tales with the same
numers of rows and columns"
7endallBs Tau $tatistics
EendallDs tau statistics are used to measure the correlation etween two sets of
ran,ings" !t is the numer of concordant pairs of oser%ations minus the numer of
discordant pairs adHusted so it has a range of minus one to plus one" 4here are three
different methods for standardiBing tau 6tau-a0 tau- and tau-c7" 'ote that tau- is
only calculated for s;uare tales"
.amma
Famma is similar to the tau statistics e9cept that it may e interpreted directly as the
difference in proaility of li,e rather than unli,e orders for the two %ariales when
they are chosen at random" Famma has a %alue of plus one when all the data is in the
diagonal that runs from the upper-left corner to the lower-right corner of the tale" !t
has a %alue of minus one when all the data is concentrated in the upper-right to
lower-left diagonal"
CoenBs 7appa
CohenDs Eappa is another measure of the degree to which the data falls on the main
diagonal" !t is only calculated for s;uare tales"
$omersB d
SomersD d is a measure of association for ordered contingency tales when there is a
dependent and independent %ariale" !t may e interpreted in the same fashion as a
regression coefficient"
Odds ratio
4he odds ratio is calculated for two-y-two tales" !ts %alue may %ary etween Bero
and infinity" # %alue greater than one indicates a positi%e relationship while a %alue
near Bero represents a negati%e relationship" # %alue of one indicates statistical
independence" 'ote that this is different than most measures of association"
CuleBs 6 and Cules C
JuleDs C is a function of the odds ratio" .i,e the odds ratio0 its %alue will %ary
etween Bero and oneW unli,e the odds ratio0 a %alue of Bero indicates statistical
independence0 while %alues of minus one and one represent perfect negati%e and
positi%e relationships" !t will e calculated for two-y-two tales"
&ntropy
Antropy is a measure of disorderW that is0 the e9tent to which the data is randomly
distriuted in a contingency tale" 4he greater the disorder0 the greater the entropy
statistic" !t is useful for comparing different crossta tales with each other" # low
entropy 6near Bero7 indicates that the data tends to e clustered in only a few of the
possile categories" # high entropy indicates that the data is e%enly distriuted
among all the possile categories"
&-; Basic 0nalyses StatPac For Windows User's Manual
CateBs Correction
!f degrees of freedom e;uals one 6i"e"0 when the crosstas produces a two-y-two
tale70 the chi-s;uare statistic can ha%e the JateDs correction applied and e printed as
the OCorrected chi-s;uareO" 4he option J#^J will enale JateDs correction for two-
y-two tales0 while J#^' will disale it"
Residual 4nalysis
$esidual analysis is one method used for identifying the categories responsile for a
significant chi-s;uare statistic" 4his in%ol%es calculating the standardiBed residual for
each cell and adHusting it for its %ariance" 4he normal distriution is used to find the
proaility of the adHusted residual using a two-tailed test of significance" #
significant adHusted residual indicates that the cell made a significant contriution to
the chi-s;uare statistic"
4he residual analysis may e turned on or off with the option $#^J and $#^'0
respecti%ely" # sample printout of a residual analysis would loo, li,e this5
&'ample of a Residual 4nalysis Printout
Interaction 4nalysis
While many of the statistics indicate whether or not two %ariales are related0
FoodmanDs interaction analysis is a method of finding out if the magnitude of the
relationship is caused more y one part of the tale than another" !ts purpose is to
e%aluate all possile cominations of two-y-two tales for interaction effects"
4he interaction is defined as the natural log of the odds ratio" 4he purpose of the log
function is to ta,e into account the possiility of a cur%ilinear relationship" 4he
standard error of the interaction is calculated as well as the standardiBed interaction"
4he standardiBed interaction is used to calculate a two-tailed proaility using a
normal distriution"
StatPac For Windows User's Manual Basic 0nalyses &-'
4he interaction analysis may e re;uested with the !#^J option" # sample printout
would loo, li,e this5
&'ample of an Interaction 4nalysis Printout
&=ui"eigting
A;uiweighting is a techni;ue to eliminate distortions from most measures of
association caused y column marginal disparities" Jou should use A;uiweighting
whene%er there is a dependentM independent %ariale relationship 6implying
causality7 and the column totals differ mar,edly for each of the categories" 'ote that
A;uiweighting only applies to the oser%edMe9pected tale and the statistics that are
printed with the tale" #fter A;uiweighting0 cell fre;uencies will no longer e integer
%alues" A;uiweighting may e re;uested with the AC^J option"
&;> Basic 0nalyses StatPac For Windows User's Manual
:abeling and Spacing Options
3tion Code Function
.aeling .& Sets the column headings to print the %ariale lael
6.&^A70 the %ariale name 6.&^'70 or the %ariale
numer 6.&^C7"
.aeling Width .W Set the ma9imum width 6in inches7 for the %ariale
laels on the stu"
A9act Width AW When AW^J0 the laeling width for the stu will
e e9actly what is specified with the .W option"
When AW^'0 the width of the stu will self-adHust
ased on the length of the stu laels"
Column Width CW Sets the minimum width of the columns 6in inches7"
Column Spacing CS Sets the spacing 6in inches7 etween the columns"
Eey EJ Sets whether the top left corner of the anner will
show a legend of the cell contents"
Print Percent Symol PP Sets whether percentage symols will e shown"
@ecimal Places @P Sets the numer of decimal digits that will e
shown"
Print Codes PC Sets whether the code 6to the left of the e;uals
symol7 will e shown with the %alue laels"
.ael Iustification .I Sets the Hustification for the anner %ariale lael"
.ael >nderline .> Sets whether the anner %ariale lael will e
underlined"
Column Iustification CI Sets the Hustification for the anner %alue lael
columns"
Column >nderline C> Sets whether the anner %alue lael columns will
e underlined"
&ottom Iustify &I Sets whether the anner laels will e ottom
Hustified"
B077+RS Co((and
&anner crosstas are often used in mar,eting research when it is important to display
se%eral crossta tales as part of the same printout" !t is similar to the crosstas
program e9cept that multiple %ariales may e specified for the 9 andMor y a9is" 4he
%ariales across the top of the page are called the anners and the %ariales down the
side of the page are called the stu" !t has an ad%antage o%er regular crosstas in that
there is much more control o%er the appearance of the output" 4he disad%antage is
that not all the statistical measures of association are a%ailale with anners"
4he synta9 for the command to run anners is5
&#''A$S [Stu %ariale list\ &J [&anner %ariale list\
4he ,eyword &J is a mandatory part of the command synta9" 4he first %ariale list
6called the stu7 will e displayed down the side of the page0 and the second %ariale
StatPac For Windows User's Manual Basic 0nalyses &;1
list 6called the anner7 will e displayed across the top of the page" 4he ma9imum
tale siBe is 220 rows and -0 columns" 4he %ariales may e alpha or numeric"
4o print anners with %ariales 1 = 2 on the y a9is and %ariales 3 to ) on the 9 a9is0
enter the command5
&# ?1 ?2 &J ?3 - ?) 6&#''A$S may e are%iated as &#7
!f a tale is too large to fit on one page0 it will e split o%er as many pages as
necessary"
?ertical ars may e inserted into the anner %ariale list to force a page rea, at that
position etween anner %ariales" 4he following would create at least two pages"
?ariales 3 and 3 would e the anner for the first page and %ariales 20 -0 and )
would e the anner for the second page" 4he %ertical ar is inserted in the list as if
it were a %ariale 6separated y commas or spaces from the other %ariales7"
&# ?- &J ?3 ?3 c ?2 ?- ?)
""
1ultiple %ertical ars can e used and each c will create a page rea, at that position
in the tale"
4he actual numer of columns that can fit on one page is determined y the many
parameters including font siBe 6pitch70 column width0 spacing etween anner
columns0 spacing etween anner %ariales0 and Boom factor" 1ost users run their
anner tales in the landscape mode 6:$^.7 in order to increase the numer of
columns that can fit on a page"
?alue laels appearing in the anner heading will e split into multiple lines as
necessary to fit in the anner column widths" 4he actual positions of the word splits
can e controlled y inserting a %ertical ar into the %alue laels at the locations
where you want the words to split" 8or e9ample0 a %alue lael of QFo%ernmentR
might rea, into two lines in the anner heading" Jou could force the rea, to occur
etween the n and m y changing the %alue lael to Fo%erncment or Fo%ern-cment"
>se a .#&A.S statement with a _ suffin9 to change the %alue laels"
.#&A.S :rganiBation 61^Fo%erncment762^Pri%ate763^'on-cProfit7_
&#''A$S ?9 &J 4:4#. :rganiBation
""
Type of Data
4wo types of anner tales can e printed" 4he most common type is the
countMpercent tale" 4he data for the rows and columns is categorical 6nominal or
ordinal7" Aach row and column in the tale represents a category" Set 4J^C to select
the countMpercent tale" >nli,e crosstas0 the banners pro/ram defines its row and
columns from the value labels in the study desi/n. 4hat is0 the program uses the
%alue laels to create the anner rows and columns" #ny data %alue not ha%ing a
matching %alue lael in the study design will e counted as missingW therefore0 set up
the study design laels to reflect the headings and laeling for the anners"
4he second type of tale is when the stu %ariales are inter%al or ratio data" 4here
arenDt any defined categories for the rows" !nstead of counts and percents0 we would
&;& Basic 0nalyses StatPac For Windows User's Manual
want to see means and standard de%iations in the tale" Set 4J^P to indicate that the
stu %ariales are parametric" 4he tale will show means and standard de%iations
instead of counts and percents"
Print Format
Aach cell of the anners tale may contain up to four numers" 4o print or suppress
any of these numers0 use the P8 option"
4he parameters for this option are5
' 'umer
$ $ow percent
C Column percent
4 4otal percent
:ne or more parameters may e used with the P8 option" 4hese should not e
separated from each other" 8or e9ample0 to print the numer and total percent0 use
the following option5
:P4!:'S P8^'4
StatPac For Windows User's Manual Basic 0nalyses &;1
&'ample of a !anners Printout
4lternate Format
When 4J^P 6the stu is parametric data70 each cell of the anners tale may contain
up to fi%e numers" 4o print or suppress any of these numers0 use the #8 option"
4he parameters for this option are5
' 'umer
1 1ean
S Standard @e%iation
A Standard Arror
@ 1edian
:ne or more parameters may e used with the #8 option" 4hese should not e
separated from each other" 8or e9ample0 to print the numer0 mean0 standard
de%iation and median0 use the following option5
&#''A$S !ncome &y 4otal IoXPosition
:P4!:'S 4J^P #8^'1S@
""
Category Creation
!n most cases you will want the rows and columns of a anners tale to e a
reflection of the %alue laels" When CC^. the categories 6what StatPac defines as a
row or column7 will e created from the %alue laels in the codeoo," 4hat is0 a row
on the stu or column in the anners will e created for each %alue lael in the
codeoo," !f a %ariale does not ha%e %alue laels0 it will not e included in the tale"
!n some cases0 howe%er0 you might not ha%e pre%iously assigned %alue laels to a
%ariale ut still want the %ariale to e included in the tale" Set CC^@ to create the
categories from the data itself instead of the %alue laels" 8or e9ample0 if you had a
%ariale with data %alues of 1-2 ut no %alue laels0 you could include this %ariale
&;) Basic 0nalyses StatPac For Windows User's Manual
in the anner tale y setting CC^@" #lternati%ely0 you could use the .#&A.S
command in the procedure to specify %alue laels for the %ariale"
%eans 2 $tandard Deviations
4he reser%ed word 1A#' may e used to print the mean a%erage of any row or
column %ariale" 4he mean will e the a%erage of the %alue codes 6not the %alue
laels7" 4he word 1A#' should e included in the %ariale list immediately
following any %ariale that you want to calculate the mean a%erage of" Aither row or
column means may e specified" 8or e9ample0 the following command has two
%ariales on each a9is 6?1 and ?2 &J ?3 and ?37" 1eans will e printed for oth
the first and second row %ariales0 and following only the first column %ariale"
&#''A$S ?1 1A#' ?2 1A#' &J ?3 1A#' ?3
4he standard de%iations or standard errors may also e printed elow the means y
specifying the S@^@ or S@^A option0 respecti%ely" When S@^A and the 8P option is
used to specify a finite population siBe0 the standard error will e calculated using the
finite population correction factor" 6See the :P4!:'S Command in the Eeywords
section of this manual"7
Ro" 2 Column Totals
4he reser%ed word 4:4#. can e used with the &#''A$S command to specify
row andMor column totals anywhere in the tale" 4he word 4:4#. can e used as a
%ariale name in any position 6and as many times as desired7 in either 6or oth7
%ariale lists" When 4:4#. is used in the first %ariale list 6for the J a9is70 a row is
included that displays the totals for all columns in the tale" When 4:4#. is used in
the second %ariale list 6for the * a9is70 the tale includes a column that contains row
totals" #s an e9ample0 a command to print totals in the first row and first column of
the anners tale would e5
&#''A$S 4:4#.0 S#4-SC:$A0 FP# &J 4:4#.0 C.#SS
# row or column total reflects the numer of cases throughout the entire data file in
which the %alue for the row or column appears" 4herefore0 the numers for one
particular pair of intersecting %ariales may not add up to the numer for the row or
column total" 8or e9ample0 if a %ariale which recorded se9 6maleMfemale7 is placed
on the * a9is against a %ariale on the J a9is which recorded ma,e of car owned0
and 20 of the 100 women who completed the sur%ey did not answer the car ;uestion0
the column total for females would e 1000 ut the sum of the females in all the rows
of the car %ariale would e only (0"
1ale 8emale 4otal
8ord 20 20 100
:ther 30 -0 100
4otal 100 100
!t is easy to create a total column that reflects the row totals irrespecti%e of the other
cell counts" 8irst use the 'AW command to create a new %ariale called 'A4" 4he
%alue of 'A4 will e initialiBed as missing for all cases" 4hen use the .#&A.S
StatPac For Windows User's Manual Basic 0nalyses &;!
command to assign a lael to missing data" Since the anners program uses %alue
laels to determine what is a row and what is a column0 it is necessary to use the
.#&A.S command0 e%en though the lael is set to lan," 8inally0 specify the new
'A4 %ariale instead of the 4:4#. ,eyword in the &#''A$S command"
'AW 6'17 O'A4O 4otals
.#&A.S 'A4 6^7
&#''A$S 4:4#. SC:$A &J 'A4 C.#SS
$ort $tub
4he actual laeling for the 9 and y a9es are ta,en from the study design information
in the codeoo," !n most circumstances0 the %alue laels will reflect the order in
which you want the category codes to e listed" !t is possile to o%erride the order of
the %alue laels in the study design y using the option 6SS^# or SS^@7" 4he
category codes 6%alue laels7 on the stu will then e displayed in ascending or
descending numeric order y fre;uency"
#dditionally0 a digit may e added as a suffi9 to the SS^# or SS^@" !t is used to sort
the stu e9cluding the last one or more %alue laels" 4his is useful when the last
%alue lael is an OotherO or OdonDt ,nowO category0 and you want to sort the stu0 ut
still lea%e the Oother Oor OdonDt ,nowO as the last row on the stu" 8or e9ample
SS^@1 would sort the stu in descending order y fre;uency0 e9cept it would lea%e
the last %alue lael as the last row regardless of its fre;uency"
$ort !anners
4he S& option 6sort anner7 can e used to sort the anner %ariales" 4he anner
%ariales to e sorted can e specified0 as well as the sort order"
4he S& option is enclosed in parentheses and will contain two entries for each
anner %ariale to e sorted" Parameters may e separated y commas or spaces"
4he first parameter is # for ascending and @ for descending" # numer may e used
as a suffi9 to indicate the numer of %alues that should not e included in the sort"
8or e9ample0 if the last %alue lael was Q:therR and you wanted it to remain as the
last column 6e%en after the other columns were sorted70 the first parameter would e
@1 for descending order and #1 for ascending order""
Jou can also indicate whether you want to sort to e done ased on the fre;uencies
6counts7 or the %alue lael category codes y including a 8 or C" 4he default is a sort
y fre;uencies" 8or e9ample0 @2 would indicate a sort y fre;uencies 6the default7
in descending order lea%ing the last two columns not sorted" !t could e specified as
8@2" Specifying 8C2 would e the same sort y category codes"
4he second parameter is the %ariale numer 6with a ?7 or the %ariale name" 8or
e9ample0 the following would sort the first 6?17 and third 6?)7 anner %ariales" 4he
second and fourth anner %ariales would remain in the order specified y the %alue
laels ecause they are not specified in the S& option" 4he first anner %ariale 6?17
would e in descending order y fre;uency and the third anner %ariale 6?)7 would
e in ascending order y fre;uency"
&anners Stu?ar &y 4otal ?1 ?2 ?) ?3
:ptions S&^6@ ?1 # ?)7
""
&;* Basic 0nalyses StatPac For Windows User's Manual
!f you add an e9clamation point immediately following the closing parenthesis0 the
same sorts will apply to all suse;uent procedures in this StatPac session"
:ptions S&^6@ ?1 # ?)7_
Jou can change the sort in a suse;uent procedure" Jou can or cancel it y either
closing StatPac0 or adding S&^' or S&^67 to a procedure
Compress Output
Compression refers to the way the program creates page rea,s" When compression
is on 6C:^J70 the program will attempt to fit as many columns and rows on a page
as possile" 4hat is0 page rea,s may occur etween different %alue laels of the
same %ariale" When compression is off 6C:^'70 the program will rea, pages
etween each %ariale on the y-a9is" :f course0 when there are many categories for a
%ariale0 it may e necessary to split up a %ariale o%er successi%e pages regardless
of the compression setting" Setting C:^J or C:^' will apply to oth the stu and
anner" Compression my e selecti%ely applied to either the stu or anner using
C:^S and C:^&0 respecti%ely" When compression is set to the stu 6C:^S70 page
rea,s will occur etween %ariales 6not etween %alue laels70 howe%er0 the
program will still attempt to ma9imiBe the numer of %ariales that can fit on a page"
Percentage !ase
4he percentage ase on a anners analysis can either e the numer of respondents
6'7 or the total numer of responses" !f P&^'0 the denominator for calculating
percentages will e the numer of respondents" !f P&^$0 the denominator will e the
total numer of responses for all indi%iduals"
$pecial Value Label 1ID&
When creating a anner tale0 it is often desirale to display only some of the
response categories" 4he .#&A.S command may e used to eliminate undesirale
categories from the tale" 4his will eliminate the column from the tale and from any
calculations of percentages on the tale"
8or e9ample0 assume the following counts for ?15
1 2 3
#gree 'eutral @isagree 'o $esponse 4otal '
30 20 30 10 100
!f P&^'0 6denominator e;uals numer of respondents70 the percents will e5
#gree 'eutral @isagree
30` 20` 30`
!f P&^$0 6denominator e;uals numer of responses70 the percents will e5
#gree 'eutral @isagree
30M90^33` 20M90^22` 30M90^33`
StatPac For Windows User's Manual Basic 0nalyses &;-
We could use the following .#&A.S command to eliminate the O'eutralO category
from the tale5
.#&A.S ?1 61^#gree763^@isagree7
!f P&^'0 the percents will still e ased on a denominator of 100" !f howe%er0 P&^$0
then the percents will e ased on a denominator of )0 630]3075
#gree @isagree
30M)0^33` 30M)0^2)`
4he special %alue lael O<!@AO may e used to suppress printing of a %alue lael
without reducing the denominator for the percents calculations" 4he following
.#&A.S command could e used to eliminate the O'eutralO category from the tale0
while still including the O'eutralO count in the denominator5
.#&A.S ?1 61^#gree762^<ide763^@isagree7
#ny row or column that has a %alue lael of O<!@AO will not e printed0 ut it will
e included in the percent calculations when P&^$" 'ote that the percentages are
ased on the counts for all %alue laels 6including the O'eutralO category70 e%en
though all the %alue laels are not displayed in the tale"
#gree @isagree
30M90^33` 30M90^33`
!f you only wanted the O#greeDsO to show in the tale0 you could use the following
statements in the procedure" 4he percentages in the tale would still e ased on 905
.#&A.S ?1 61^#gree762^<ide763^<ide7
:P4!:'S P&^$
""
%ultiple Response
1ultiple response %ariales can e included in anner crosstas y using the 1$
option to comine those %ariales that should e interpreted as a single %ariale" 4he
synta9 to comine multiple response %ariales is5
:P4!:'S 1$^6[list 1\76[list 2\7""""6[list n\7
Aach %ariale list represents a group of multiple response items that should e
grouped as if they were a single %ariale" Aach group must e enclosed in
parentheses and specified as a %ariale list 6indi%idual %ariales are separated y
&;; Basic 0nalyses StatPac For Windows User's Manual
commas or spaces0 and ranges are specified with a dash7" Aither %ariale names or
%ariale numers may e specified in the 1$ option %ariale list" 4he ? prefi9 is
optional for %ariale numers"
4he se;uence of %ariales specified in a multiple response group list must match a
se;uence of the 9 or y a9is anner list" 8or e9ample0 consider the following
&#''A$S command5
&#''A$S ?2 - ?(0 ?100 ?11 &J ?1 - ?30 ?20 ?-
1ultiple response %ariales y-a9is5 2-(010011 9-a9is5 1-3020-
:P4!:'S 1$^61-37 Froups %ars" 10 2 = 3 on the 9-a9is
:P4!:'S 1$^62037 Froups %ars" 2 = 3 on the 9-a9is
:P4!:'S 1$^6(010-117 Froups %ars" (0 10 = 11 on the y-a9is
:P4!:'S 1$^620-7 Froups %ars" 2 = - on the 9 = y-a9is
4he following groupings might cause prolems5
:P4!:'S 1$^61--7 Froups %ars" 10 2 = 3 on the 9-a9is0
ut not %ariales 2 or - ecause
%ariale 3 was not part of the anners
%ariale list
:P4!:'S 1$^6--117 Froups %ars" -0 ) = ( on the y-a9is0
ut not %ariales 10 or 11 ecause
%ariale 9 was not part of the anners
%ariale list
:P4!:'S 1$^610-127 Froups %ars" 10 = 11 on the y-a9is and
ignores the e9tra %ariales
:P4!:'S 1$^63-)7 'o %ariales grouped
:P4!:'S 1$^611-207 'o %ariales grouped
:P4!:'S 1$^6302017 'o %ariales grouped
:P4!:'S 1$^6(0110107 'o %ariales grouped
!n general0 the 1$ option will ne%er cause a fatal error" !f an in%alid grouping is
found0 it is simply ignored and the %ariales will not e grouped on the output" 4he
anners program uses the %alue laels from the first %ariale specified in each group
list" 4he 1$ option should e used only to group %ariales which share a list of
common %alue laels" 4he %alue laels must e specified in the study design 6i"e"0
they will not automatically e determined from the data file7" 4his was implemented
to pre%ent mispunched or spurious data from creating its own row or column in the
output"
Net Codes
'et categories may e created and displayed on the stu using the '4 option in
conHunction with the 1$ option" 4he '4 option specifies the codes on the stu
%ariale that are to e interpreted as net categories" 'et categories are e9cluded from
StatPac For Windows User's Manual Basic 0nalyses &;'
the calculations of totals and means" 1ultiple categories are separated with a slash
and enclosed in ;uotes" 4he general format is5
:P4!:'S '4^OcodeMcodeMcodeO
8or e9ample0 suppose you want to create a anner tale where the stu 6?27 is a fi%e-
point .i,ert scale" 4he scale is coded5 61^?ery good7 62^Food7 63^8air7 63^Poor7
62^?ery poor7" Jou want the stu to contain two net %ariales and loo, li,e this5
1^?ery Food
2^Food
'A45 ?ery Food or Food
3^8air
'A45 Poor or ?ery Poor
3^Poor
2^?ery Poor
1ean = S@
4he first step is to create a 'A4 %ariale and compute it e;ual to %alues not used in
the originally coded %ariale" !n this e9ample0 -0 )0 (0 90 and 0 are unused0 so we
could use any of them for the new 'A4 %ariale" 4hen use the .#&A.S command to
relael the stu categories in the order you want them to appear" !nclude the new
'A4 %ariale in the &#''A$S command as if it were a multiple response %ariale"
>se the 1$ option to specify multiple response and use the '4 option to specify
which codes are the net categories"
'ew 6'17 O'A4O
!f ?2^O1M2O 4hen Compute 'A4^-
!f ?2^O3M2O 4hen Compute 'A4^)
.aels ?2 61^?ery Food7 62^Food7 6-^'A45 ?ery Food or Food7
63^8air7 6)^'A45 Poor or ?ery Poor7 63^Poor7 62^?ery Poor7
&anners ?2 'A4 1ean &y 4otal #ge Fender Froup
:ptions 1$^6?2 'A47 '4^O-M)O
""
-eigting
Weighting is useful when the true incidence in the population is ,nown0 ut data
collection yielded a different incidence" !n other words0 there was a sampling error
6the sample does not ade;uately represent the population7" Weighting can e used to
mathematically increase or decrease the counts of any anner %ariales so they more
accurately reflect the ,nown population parameters"
4he WA!F<4 command in StatPac will create a weighted file using integer case
weights where a proaility function is used for the non-integer portion of the
weights" 4he W4 option in the &#''A$S command will not create a new data file0
ut rather0 simply adHusts the counts in the anner tale" 4he WA!F<4 command and
the W4 option in anners are different methods of accomplishing the same goal and
should not e used together in the same procedure"
&'> Basic 0nalyses StatPac For Windows User's Manual
4he easiest way to create a weighting %ariale is to use the >tility program0
Sampling \ Create ?ariale for Weighting" !t will allow you to create a weighting
%ariale that can e used in any of the StatPac procedures" !f youNre weighting y
more than one %ariale simultaneously0 the utility program is the est way to create
the weights"
4he following e9planation is if you want to manually create a weighting %ariale" !t
is presented here to show the mathematical concepts in%ol%ed in weighting" While
you can create a weighting %ariale manually0 we recommend using the utility
program"
4a,e for e9ample a simple anner tale with an automatic total row and a mean row5
4itle 6/7
&anners ?1 &y 4otal Fender
:ptions #4^J #1^J PC^J
""
4he tale might loo, li,e this5
.oo,ing at the 4otal row0 we see that our sample had -3"-` males and 32"3`
females" <owe%er0 we ,now that the population actually has 22` males and 32`
females0 so the 4otal column might e producing an inaccurate reflection of the total
population due to a sampling error" 4o correct the prolem0 we would weight the
gender %ariale so the tale reflects the 22` and 32` proportions that we ,now e9ist
in the population"
4he first step is to calculate the weights for males and females" 4he weights are
easily calculated y the following formula5
StatPac For Windows User's Manual Basic 0nalyses &'1
)eigt 4 Gesired %ercentage 2 Observed %ercentage
4hus0 the weight for males would e 22 di%ided y -3"- ^ "(213 and the weight for
females would e 32 di%ided y 32"3 ^ 1"2)12"
4ypically0 youDll want to weight the entire anner tale0 &egin y creating a %ariale
that contains the weight for each case" Suse;uent procedures would specify the W4
option to weight the entire anner tales y the case weight %ariale
S4>@J SAF1A'4
'AW 6')7 OCaseWeightO
!8 FA'@A$ ^ 1 4<A' C:1P>4A CaseWeight ^ 0"(213
!8 FA'@A$ ^ 2 4<A' C:1P>4A CaseWeight ^ 1"2)12
S#?A
""
&anners ?1 &y 4otal #ge Fender Froup
:ptions W4^6CaseWeight7
""
&anners ?11-?20 &y 4otal #ge Fender Froup
:ptions W4^6CaseWeight7
""
4he other form of the W4 option lets you weight indi%idual anner %ariales with
their own weights
4he first step is to calculate the weights for males and females using the same
formula as ao%e" 4he ne9t step is to add the W4 option to the anners procedure"
4he format for the W4 option is5
:P4!:'S W4^6%ariale code^weight code^weight7
Spaces or commas may e used within the parentheses to separate each of the
components of the option"
!n this e9ample0 the codeoo, specifies 1^1ale and 2^8emale so the W4 options
would use codes of 1 and 2"
4itle 6/7
&anners ?1 &y 4otal Fender
:ptions #4^J #1^J PC^J W4^6Fender 1^"(213 2^1"2)127
""
$erunning the procedure would produce a weighted analysis with an adHusted total
row and total column"
&'& Basic 0nalyses StatPac For Windows User's Manual
1ore than one anner %ariale may e weighted" 4he synta9 is the same e9cept
additional sets of parentheses are added for each %ariale to e weighted"
:P4!:'S W4^6%ariale code^weight code^weight7 6%ariale code^weight
code^weight code^weight7
When the W4 option is used0 the total column will reflect the weighted %alues of the
%ariale that follows it" !f more than one %ariale is weighted0 it would e wise to
specify more than one total column" 8or e9ample0 if ethnicity were coded as an alpha
%ariale 6W^White and &^&lac,70 the following commands would produce a total
column for gender and a total column for ethnicity0 and oth would e weighted5
&anners ?1 &y 4otal Fender 4otal Athnicity
:ptions #4^J #1^J PC^J W4^6Fender 1^"(213 2^1"2)1276Athnicity
W^"2-)2 &^1"(1317
""
Fractional Counts
4he 8C option may e used in conHunction with the W4 option to display fractional
cell counts" 8C^J will show the decimal portion of the cell counts and 8C^' will
display them as integers" While weighting does create fractional cell counts0 it is
often confusing 6e"g"0 how could there e 1)("- malesY7" >sing 8C^' will round all
cell counts to whole numers0 while 8C^J will show the decimal portions"
StatPac For Windows User's Manual Basic 0nalyses &'1
$upplemental 1eading
4he supplemental heading is a line of te9t that will appear after the heading and title0
ut efore the anner tale" !t may contain any te9t and should e enclosed in ;uotes"
When the pound symol is used in the supplemental heading0 it will e printed as
the numer of cases" 4he S< option is usually used to indicate who is included in the
anner tale" 4he following is an e9ample if a supplemental heading5
:P4!:'S S<^O&#SA5 #.. $ASP:'@A'4S 6'^/7O
N &=uals
4he sample siBe can e displayed in the top left corner of the tale with the 'A
option" !t may contain any te9t and should e enclosed in ;uotes" When the pound
symol is used in the ' A;uals option0 it will e printed as the numer of cases" 4he
'A option is usually used to indicate who is included in the anner tale" 4he
following is an e9ample of the ' A;uals option5
:P4!:'S 'A^O6'^/7O
$ignificance Tests
StatPac offers significance testing in anner tales" 4o ypass all significance testing0
set the S4 option to none 6S4^'7" 4he following options control the type of
significance tests5
:P4!:'S S4^' 6no significance tests7
:P4!:'S S4^P 6t-test etween percents only7
:P4!:'S S4^1 6t-tests etween means only7
:P4!:'S S4^4 6t-tests etween percents and means7
:P4!:'S S4^C 6chi-s;uare tests for each sutale7
:P4!:'S S4^# 6t-tests etween means and percents and chi-s;uare tests7
T:Tests !et"een Proportions and %eans
4wo-tailed t-tests etween column percents and means can e performed with the S4
option" When specified0 StatPac will automatically set the anner to include a code
letter for each column0 eginning with column O#O" #n independent samples t-test
will e performed etween all cominations of anner columns0 and the results will
e displayed in the tale if they are significant at the alpha le%els set y the C1 and
C2 options"
>pper case letters indicate Ohigh significance5 and lower case letters indicate
Omoderate significanceO 6high and moderate eing defined y the %alues of C1 and
C27" 8or e9ample0 suppose C1^"02 and C2^"01" #fter running the analysis0 you see a
cell with the letters OCeO" 4his means that the percentage in this cell is significantly
different from the percentage in column C at the "01 le%el0 and significantly different
from the percentage in column A at the "02 le%el"
Ci:$=uare Tests
&anner crossta tales may e ro,en down into se%eral cominations of smaller
tales0 consisting of one %ariale on each a9is" 8or e9ample0 the following
&#''A$S statement could e ro,en down into three sutales5
&') Basic 0nalyses StatPac For Windows User's Manual
&#''A$S ?1 &J ?20 ?-0 ?9
4he sutales would e ?1 y ?20 ?1 y ?-0 and ?1 y ?9" !t is then possile to
calculate a chi-s;uare statistic for each sutale" >se the option S4^C to re;uest a
chi-s;uare analysis for all the cominations of sutales" 4he chi-s;uare0 degrees of
freedom and proaility of chance will e printed for each sutale"
!t is not possile to calculate chi-s;uare statistics for tales with completely missing
rows or columnsW therefore0 if any row or column in a sutale is completely
missing0 it will not e included in the calculation of the chi-s;uare statistic or degrees
of freedom 6e%en though it may e displayed in the countMpercent tale7"
&'ample of a T"o:-ay Ci:$=uare $tatistics Printout
When S4^#0 all types of significance testing will e performed" 4he output will
include the t-tests etween percents and means and two-way chi-s;uare tests"
CateBs Correction
!f degrees of freedom e;uals one 6i"e"0 when the anners program produces a two-y-
two tale70 the chi-s;uare statistic can ha%e the JateDs correction applied" 4he option
J#^J will enale JateDs correction for two-y-two tales0 while J#^' will disale
it"
>ero Ro"s 2 Columns
Jou may choose whether or not to print Bero rows and columns" 4his situation 6of
Bero rows or columns7 could occur if there are %alue laels in the study design for
which there is no data" !f you want the reader of your report to ,now that a category
e9ists0 you will proaly want to print rows and columns with Bero counts 6L$^J
LC^J7" !n most cases0 howe%er0 conser%ing space is more important0 so you would
set L$^' and LC^'"
4utomatic Page Title Creation
When performing a series of anner analyses0 each ha%ing the same anner columns0
and only one y a9is %ariale 6per page70 it may e desirale to ma,e the page title the
same as the y a9is %ariale lael" When the title is set to a pounds symol in
parentheses0 the title will ecome the %ariale lael for the y a9is %ariale" 64his can
e changed to the 9 a9is lael using a patch7"
StatPac For Windows User's Manual Basic 0nalyses &'!
8or e9ample0 letDs say you had se%eral demographic %ariales as your anner points0
and you wanted to loo, at se%eral other %ariales on the y a9is 6down the stu7" Jou
want a series of tales that loo, li,e this5
Special Study 6Page <eading7
4he %ariale lael of the OSome ?arialeO on the y a9is 64itle7
#ge Se9 !ncome
>nder 21 1ale 8emale .ow 1iddle <igh
Some ------- ----- ----- ----- ----- -----
?ariale ------- ----- ----- ----- ----- -----
4he following procedure would produce fi%e similar tales0 each on a different page0
and each with a different title5
S4>@J Jourstudy
<A#@!'F Special Study
4!4.A 6/7
&#''A$S ?1-?2 &J #FA SA* !'C:1A
:P4!:'S C:^' S<^OO
""
Total Ro" Position
When the 4:4#. ,eyword is imedded etween other %ariales in the anners
command line0 the 4P option is used to determine whether the total should e printed
for the pre%ious %ariale or the ne9t %ariale" !n the following e9ample0 the total row
could e the last stu for ?1 or it could e the first stu for ?20 depending on the
setting of the 4P option"
&#''A$S ?1 4:4#. ?2 &J #FA SA* !'C:1A
!f 4P^.0 the last row for ?1 will e a total row" !f 4P^80 the first row for ?2 will e
a total row"
Total Counts
4he 4C option ma,es it possile to print only the counts 6without the percents7 in
total rows and total columns0 e%en when percentages are eing printed in the rest of
the tale" !f 4C^J0 total rows and total columns will only contain the counts" !f
4C^'0 total rows and columns will e defined y the P8 option0 and will contain the
same numer of %alues as the other cells in the tale"
Total 4dDustment
4he 4# option may e used to set how total columns are calculated" !f 4#^'0 the
total columns will e ased on the numer of non missing cases for the stu %ariale"
!f 4#^J0 the total column counts will e the sum of the counts for the %ariale that
follows it" !f there are no missing data for the anner %ariale0 the counts will e the
&'* Basic 0nalyses StatPac For Windows User's Manual
same0 ut if the anner %ariale that follows the 4:4#. ,eyword has missing data0
the counts in the total column will e different" 4hus0 when setting 4#^J0 you could
insert the wor, 4:4#. efore each anner %ariale and each total column might
contain different counts"
Total Ro" Denominator
'ormally0 a total row will e ased on the same denominator at specified y the P&
option 6either ' the numer of cases0 or $ the numer of respondents7" !f P& is set to
$0 you can force the percentages in a total row to e calculated using ' as the
denominator y setting 4@^J" 4his is sometimes handy when the anner contains
multiple response %ariales"
Total Total Intersections
When printing a tale that contains oth total rows and total columns0 there will e at
least one intersection of a total row and a total column" Jou must set the precedence
as to how the intersection cell is calculated" !t may e ased on the sum of the row
counts 644^$7 or the sum of the column counts 644^C7"
4utomatic Total Ro"
4he #4 option may e used to automatically print a total row for each %ariale on the
stu" !ts purpose is to eliminate the necessity of ha%ing to type the 4:4#. ,eyword
for each of the stu %ariales" !n the pre%ious e9ample0 if you wanted each stu
%ariale to egin with a total row0 the command would e5
&#''A$S 4:4#. ?1 4:4#. ?2 4:4#. ?3 4:4#. ?3 4:4#. ?2 &J
#FA SA* !'C:1A
:P4!:'S C:^'
""
!f the #4 option is set to OJO0 the total rows will e included in the output0 e%en when
the 4:4#. ,eyword is not included in the stu %ariale list" 4he following
procedure would produce the same output as the pre%ious procedure5
&#''A$S ?1-?2 &J #FA SA* !'C:1A
:P4!:'S C:^' #4^J 4$^8
""
4he 4$ option is used in conHunction with the #4 option to determine whether the
total row will e the first or last row on the stu" 'ote that if you use the option
#4^J0 then you should not use the 4:4#. ,eyword anywhere in the stu %ariale
list"
4utomatic %ean Ro"
4he #1 option may e used to automatically print a row of means for each %ariale
on the stu" !ts purpose is to eliminate the necessity of ha%ing to type the 1A#'
,eyword for each of the stu %ariales" !n the pre%ious e9ample0 if you wanted each
stu %ariale to include a row of means0 the command would e5
&#''A$S ?1 1A#' ?2 1A#' ?3 1A#' ?3 1A#' ?2 1A#' &J
#FA SA* !'C:1A
:P4!:'S C:^'
StatPac For Windows User's Manual Basic 0nalyses &'-
""
!f the #1 option is set to OJO0 a row of means will e included in the output0 e%en
when the 1A#' ,eyword is not included in the stu %ariale list" 4he following
procedure would produce the same output as the pre%ious procedure5
&#''A$S ?1-?2 &J #FA SA* !'C:1A
:P4!:'S C:^' #1^J
""
Labeling and $pacing Options
3tion Code Function
.aeling .& Sets the column headings to print the %ariale lael
6.&^A70 the %ariale name 6.&^'70 or the %ariale
numer 6.&^C7"
.aeling Width .W Set the ma9imum width 6in inches7 for the %ariale
laels on the stu"
A9act Width AW When AW^J0 the laeling width for the stu will
e e9actly what is specified with the .W option"
When AW^'0 the width of the stu will self-adHust
ased on the length of the stu laels"
Column Width CW Sets the minimum width of the columns 6in inches7"
Column Spacing CS Sets the spacing 6in inches7 etween the columns"
?ariale Spacing ?S Sets the spacing 6in inches7 etween the anner
%ariales"
Eey EJ Sets whether the top left corner of the anner will
show a legend of the cell contents"
Print Percent Symol PP Sets whether percentage symols will e shown"
@ecimal Places @P Sets the numer of decimal digits that will e
shown"
Print Codes PC Sets whether the code 6to the left of the e;uals
symol7 will e shown with the %alue laels"
>nderline Stu ?ariale
.aels
>. Sets whether the stu %ariale laels will e
underlined"
&ottom Iustify &I Sets whether the anner laels will e ottom
Hustified"
<eading Iustification <I Sets the Hustification for the anner %ariale laels
&ottom Iustify <eading &< Sets whether the anner %ariale laels will e
ottom Hustified"
?alue .ael Iustification .I Sets the Hustification for the anner %alue laels"
&ottom Iustify ?alue .aels &. Sets whether the anner laels will e ottom
Hustified"
A9tra Spacing AS When AS^J0 a lan, line will e printed ao%e and
elow the anner %alue laels" When AS^'0 no
lan, lines will e printed"
Code Iustification CI Sets the Hustification for the %alue lael codes"
Print Stu ?ariale .ael S. Sets whether the stu %ariale laels are shown"
Stu ?ariale Spacing ?J Sets the numer of lan, rows etween %ariales
on the stu"
&'; Basic 0nalyses StatPac For Windows User's Manual
Stu .ael Spacing .J Sets the numer of lan, rows etween %alue
laels on the stu"
%inimum Cell Count
$esearchers often choose not to show the percentages for cells containing a small '"
4he 1C option may e used to suppress the printing of percentages of cells with low
counts" 8or e9ample0 if 1C^20 StatPac will print cell counts that are greater than or
e;ual to 2" !f a cell has a count of less than 20 StatPac would print dashes instead of
the percent" !f 1C^10 StatPac will print dashes for cells where the count is Bero"
?alid %alues for 1C are etween 0 and 100" !f 1C^00 all cell counts will e printed"
%inimum Denominator
Percentages can e misleading if they are ased on a small denominator" 4he 1@
option may e used to suppress the printing of percentages that are ased on a small
denominator" 4he 1@ option sets the minimum denominator that StatPac will use for
calculating percents" 8or e9ample0 if 1@^20 StatPac will calculate percentages if the
denominator is greater than or e;ual to 2" !f a denominator were less than 20 StatPac
would print dashes instead of the percent" ?alid %alues for 1@ are etween 0 and
100" !f 1@^00 all percentages will e printed"
$+SCRIP:I8+ Co((and
@escripti%e statistics are usually the first step in the analysis of inter%al or ratio data"
4hey re%eal central tendency and the shape of the distriution"
4he synta9 of the command to run descripti%e statistics is5
@ASC$!P4!?A [?ariale list\
8or e9ample0 if you are e9amining college entrance e9am scores for $A#@!'F
6?)70 #$!4<1A4!C 6?127 and ?A$&#. 6?197 s,ills0 descripti%e statistics could
e re;uested with any of the following commands5
@ASC$!P4!?A $A#@!'F0 #$!4<1A4!C0 ?A$&#.
@ASC$!P4!?A ?)0 ?120 ?19
@A ?) ?12 ?19 6@ASC$!P4!?A may e are%iated as @A7
4here are a wide %ariety of descripti%e statistics a%ailale" 4o print or e9clude
indi%idual statistics0 use the appropriate option"
1issing data 6lan,s7 will always e e9cluded from the calculation of descripti%e
statistics" !t will e reported as the numer of missing cases ut will not e used for
any calculations"
One 4nalysis
4he one-analysis option allows you to print selected descripti%e statistics for se%eral
%ariales on one page" 4his option is especially useful for summary reporting0 when
you only need a few descripti%e statistics for a large numer of %ariales"
StatPac For Windows User's Manual Basic 0nalyses &''
#ll the %ariales specified with the :# option must e numeric" 8or e9ample0
suppose that %ariales 22-33 are ten numeric scores" 4he following commands would
produce a one-page summary of selected descripti%e statistics for each of the ten
items5
@ASC$!P4!?A ?22-?33
:P4!:'S :#^J
&'ample of a Descriptive $tatistics One:4nalysis Printout
When the :# option is used0 the ,eyword $AC:$@ in the %ariale list will lea%e a
lan, line in the report" 4his allows you to %isually group %ariales" 8or e9ample0
this will print fi%e rows of descripti%e statistics0 a lan, row0 and then fi%e more
rows"
@A %1-%2 $ecord ?--%10
:P4!:'S :#^J
""
$tatistics
When the :# option is specified0 you may select which descripti%e statistics you
want with the S4 option" 4he codes for the S4 option are the same as the specific
statistic codes descried elow" 64he only e9ception is 'C0 which stands for the
numer of %alid cases7" 8or e9ample0 the following commands would report the
mean0 median0 uniased standard de%iation and numer of cases for %ariales 22-335
@ASC$!P4!?A ?22-?33
:P4!:'S :#^J S4^61A 1@ >S 'C7
1>> Basic 0nalyses StatPac For Windows User's Manual
'ote that the commands are identical to the pre%ious e9ample e9cept the S4 option is
used to identify the specific statistics you want calculated" 4he parentheses around
the list of statistics is mandatory"
$ort Variables
When performing descripti%e statistics with the one-analysis option 6:#^J70 you
can sort the %ariales y the contents of the first column of the results" 4he S? 6sort
%ariales7 option may e set to O'O for no sort0 O#O to sort in ascending order0 or O@O
to sort in descending order" When no sort is specified0 the %ariales will e listed in
the order that they appear in the analysis command %ariale list" 4he S? option is
applicale only when the :#^J option is specified"
#dditionally0 a digit may e added as a suffi9 to the S?^# or S?^@" !t is used to
sort the %ariales e9cluding the last one or more %ariales" 4his is useful when the
last %ariale is an OotherO %ariale0 and you want to sort the %ariales0 ut still lea%e
the Oother O as the last %ariale" 8or e9ample S?^@1 would sort the %ariales in
descending order0 e9cept it would lea%e the last %ariale as the last row regardless of
its %alue"
%inimum5 %a'imum5 Range5 2 $um
4here are four %ery simple measures of dispersion that gi%e an o%erall picture of the
data" 4hese are the minimum data %alue0 ma9imum data %alue0 range 6ma9imum
minus the minimum70 and sum of the data" #n option line that would enale all of
these features is5
:P4!:'S 1!^J 1#^J $#^J S>^J
%ean5 %edian5 2 %ode
4he est ,nown descripti%e statistics are the mean0 median and mode" 4hey descrie
the central tendency of a distriution" 4he mean 6a%erage7 is the most popular" !t is
found y adding the %alues for all the 6non-missing7 cases and di%iding y the
numer of 6non-missing7 cases" 8or e9ample0 to find the mean age of all your
friends0 add all their ages together and di%ide y the numer of friends" 4he mean
a%erage can present a distorted picture of central tendency if the sample is s,ewed in
any way"
8or e9ample0 letDs say fi%e people ta,e a test" 4heir scores are 100 120 130 1(0 and 93"
64he last person is a genius"7 4he mean would e the sums of the scores
10]12]13]1(]93 di%ided y 2" !n this e9ample0 a mean of 29"- is not a OgoodO
measure of how well people did on the test in general" When analyBing data0 e
careful of using only the mean a%erage when the sample has a few %ery high or %ery
low scores" 4hese scores tend to s,ew the shape of the distriution and will distort
the mean"
4he median pro%ides a measure of central tendency such that half the sample will e
ao%e it and half the sample will e elow it" 8or s,ewed distriutions this is a etter
measure of central tendency" !n the pre%ious e9ample0 13 would e the median for
the sample of fi%e people"
4he mode is the most common score or category - the one which occurred most
fre;uently" !t is possile to ha%e more than one mode if there is not a single Omost
fre;uent scoreO" 8or e9ample0 the following set of data has two modes5 12 and 1-"
12 12 12 13 13 12 12 1- 1- 1- 1) 1(
StatPac For Windows User's Manual Basic 0nalyses 1>1
4he distriution of many %ariales follows that of a ell-shaped cur%e" 4his is called
a Onormal distriutionO" :ne must assume that data is appro9imately normally
distriuted for many statistical analyses to e %alid" When a distriution is normal0
the mean0 median and mode in the population will all e e;ual" !f they are not e;ual0
the distriution is distorted in some way"
$/e"ness5 7urtosis5 2 7olmogorov:$mirnov
4here are asically two ways that a distriution can e distorted5 s,ewness and
,urtosis" S,ewness refers to Otop hea%yO or Oottom hea%yOW 6i"e"0 the tail of the
cur%e7" !f the longest tail of the cur%e goes to the right 6the cur%e is top hea%y70 it is
positi%ely s,ewed" !f it is ottom hea%y 6the longest tail of the cur%e goes to the left70
it is negati%ely s,ewed" # %alue of Bero for s,ewness represents a symmetrical
distriution0 such as the normal distriution mentioned ao%e"
Eurtosis refers to how pea,ed or flat the cur%e is" # %ery flat cur%e is called
Oplaty,urticO and has a ,urtosis of less than three" # %ery pea,ed cur%e is called
Olepto,urticO and has a ,urtosis greater than three" # %alue of three for ,urtosis
indicates normal pea,edness and the distriution is termed Omeso,urticO"
4he Eolmogoro%-Smirno% statistic pro%ides a ;uic, chec, to determine the degree of
normality in the data" 4he %alue pro%ides a relati%e indication of normalityW as the
%alue mo%es further away from Bero0 we can e more certain that the data does not
appro9imate a normal distriution" 4he distriution is non-normal5
at the "12le%el if ES \ "))2
at the "10le%el if ES \ "(19
at the "02le%el if ES \ "(92
at the "022 le%el if ES \ "922
at the "01le%el if ES \ 1"032
$tandard Deviation 2 Variance
4he standard de%iation is a %ery useful statistic that measures the dispersion of scores
around the mean" :n the a%erage0 -( percent of all the scores in a sample will e
within plus or minus one standard de%iation of the mean and 92 percent of all scores
will e within two standard de%iations of the mean"
4he %ariance is calculated directly from the distriution of raw scores" !t is the sum
of the s;uared de%iations of each score from the arithmetic mean di%ided y '" 4he
standard de%iation is simply the s;uare root of the %ariance" 4he uniased estimates
should e used when sampling from the population" 4he formula for the uniased
estimates of the %ariance and standard de%iation is the same e9cept that '-1 is used
in the denominator"
$tandard &rror 2 Confidence Intervals
Confidence inter%als are %ery important" 4hey allow us to predict where the mean
would fall if another sample is ta,en" 4he standard error of the mean is used to
estimate the range within which we would e9pect the mean to fall"
.etDs say the 92 percent confidence inter%al for the mean is 12"3 to 22"(" !n repeated
samples of the same siBe0 the mean would e e9pected to fall etween these two
%alues 92 percent of the time" # similar interpretation can e made for the 99 percent
confidence inter%al" 4he 92 and 99 percent confidence inter%als may e re;uested
using the C2 and C9 options respecti%ely5
1>& Basic 0nalyses StatPac For Windows User's Manual
:P4!:'S C2^J C9^J
4he ao%e formula for the standard error of the mean is used when the sample siBe is
small relati%e to the population siBe 6say0 less than ten percent7" When the sample
siBe represents a sustantial proportion 6greater than ten percent7 of the population0
the standard error is modified y the finite population correction factor 4his has the
effect of reducing the standard error and narrowing the confidence inter%al and"
When the 8P option is used to specify a population siBe0 the standard error will e
adHusted and printed as the OCorrected Standard Arror :f 4he 1eanO" 6See the
:P4!:'S command in the Eeywords section of this manual for information on
using the 8P option"7
Confidence inter%als are accurate only if the distriution of the data resemles a
normal cur%e" &e carefulW using confidence inter%als from non-normal data is ris,y
usiness"
&'ample of a Descriptive $tatistics Printout
6uartiles 2 .eneral E:ilesE
Cuartiles are often used in education to di%ide a distriution into 3 groups of e;ual
'" # ;uartile printout will contain three %alues 6one less than the numer of groups7"
!f0 for e9ample0 the %alue for the first 6lowest7 ;uartile is 200 it means that 22` of the
sample had a score of 20 or less" Jou can specify any di%ision with the !. option"
StatPac For Windows User's Manual Basic 0nalyses 1>1
8or e9ample0 if you specify !.^100 then deciles will e printed" !f the ninth decile
6highest7 %alue is (20 it means that 90` of the distriution had a score of (2 or less0
and 10` scored e;ual to or higher than (2" 4he O-ileO %alues are interpolated when
necessary" Set !.^1 to disale the Oany ilesO option
&'ample of a 6uartile Printout
Labeling and $pacing Options
3tion Code Function
.aeling .& Sets the laeling to print the %ariale lael 6.&^A70
the %ariale name 6.&^'70 or the %ariale numer
6.&^C7"
.aeling Width .W Set the ma9imum width 6in inches7 for the %ariale
laels on the stu"
A9act Width AW When AW^J0 the laeling width for the stu will
e e9actly what is specified with the .W option"
When AW^'0 the width of the stu will self-adHust
ased on the length of the stu laels"
Column Spacing CS Sets the spacing 6in inches7 etween the columns"
@ecimal Places @P Sets the numer of decimal digits that will e
shown"
.ael Iustification .I Sets the Hustification for the anner %ariale lael"
A9tra Spacing AS When AS^J0 a lan, line will e printed etween
each %ariale on the stu" When AS^'0 no lan,
lines will e printed"
BR+0/$3W7 Co((and
4he rea,down program gi%es descripti%e statistics for one or more criterion
%ariales ro,en down y one or more sugroup %ariales" !n other words0 the
rea,down program pro%ides a way of summariBing descripti%e statistics for many
sugroups" 4he same information could e otained y performing multiple
descripti%e statistics analyses using the !8-4<A'-SA.AC4 command to limit each
analysis to the desired sugroup"
4he synta9 for the command to e%o,e the rea,down program is5
&$A#E@:W' [Criterion %ar" list\ &J [Sugroup %ar" list\
8or e9ample0 letDs say you want descripti%e statistics for #FAW howe%er0 you want
these statistics ro,en down y $#CA0 SA* and !'C:1A le%el" !n other words0
you are interested in comparing age for each of the sugroups 6e"g"0 a%erage age of
males %ersus a%erage age of females7"
# data file for this analysis would loo, li,e this5
1>) Basic 0nalyses StatPac For Windows User's Manual
#113- 6record 1 - race is coded as #
se9 is coded as 1
income le%el is coded as 1
age is 3-7
&8332 6record 2 - race is coded as &
se9 is coded as 8
income le%el is coded as 3
age is 327
4he criterion %ariale is #FA 6?37" !t is this %ariale that you will e calculating
descripti%e statistics for0 so it must e inter%al or ratio-type data"
>p to ten sugroup %ariales may e included in the sugroup %ariale list" 4hese
%ariales may e either alpha or numeric" !n our e9ample0 these would e5 $#CA
6?170 SA* 6?27 and !'C:1A 6?37" Aach of the sugroup %ariales may contain up
to 100 categories 6%alue laels7"
#ny of the following commands would perform the analysis5
&$A#E@:W' #FA &J $#CA0 SA*0 !'C:1A
&$A#E@:W' #FA &J $#CA - !'C:1A
&$A#E@:W' #FA &J $#CA SA* !'C:1A
&$ ?3 &J ?1 - ?3 6&$A#E@:W' may e are%iated as &$7
'otice that the ,eyword &J is mandatory" 4his is necessary ecause you may want a
rea,down on se%eral criterion %ariales" 4hat is0 se%eral different %ariales may e
ro,en down y the same sugroup %ariales"
When a criterion %ariale list is specified0 it is e;ui%alent to performing a different
rea,down for each criterion %ariale" 8or e9ample0 oth #FA and !CSC:$A could
e ro,en down y $#CA0 SA* and !'C:1A5
&$A#E@:W' #FA !CSC:$A &J $#CA SA* !'C:1A
When a criterion %ariale list 6#FA and !CSC:$A7 is specified0 it is the same as
re;uesting a separate analysis for each %ariale in the list" !n this e9ample0 two tas,s
will e performed" 4hey are5
&$A#E@:W' #FA &J $#CA SA* !'C:1A
&$A#E@:W' !CSC:$A &J $#CA SA* !'C:1A
When specifying a criterion %ariale list0 care must e ta,en to insure that each
%ariale in the criterion %ariale list is different from those in the sugroup %ariale
list" 4hat is0 a %ariale cannot e ro,en down y itself"
4he output from the rea,down program will print the mean0 standard de%iation0
numer of cases0 and percent for each of the sugroups"
StatPac For Windows User's Manual Basic 0nalyses 1>!
&'ample of a !rea/do"n Printout
$ort Type 2 $ort Order
4he output from the rea,down analyses may e more meaningful when the
sugroup categories are displayed in sorted order" !f no sort is selected 6S4^'70 the
sugroup categories will e displayed in the order they appear in the study design" !f
the study design does not contain all the %alues in the data file 6such as mispunched
data70 the unlaeled %alues will appear on the printout in the order that they are
encountered in the data file"
Jou can sort the sugroup categories y fre;uency of response using the option
S4^80 or y the category codes themsel%es 6S4^C7" 8or e9ample0 the following
option would sort the categories y fre;uency of response in descending order" !t
would e re;uested with the following options5
:P4!:'S S4^8 S:^@ 6Sort 4ype y fre;uency of response7
6Sort :rder is descending7
!n most cases0 youDll proaly want to ha%e the rea,down printout appear in
ascending order y the code" 4he options statement to do this is5
:P4!:'S S4^C S:^# 6Sort 4ype is y category code7
6Sort :rder is ascending7
'otice that this type of sort is generally the way the information would e listed in
the study design" !f this is the case0 sorting y category code will ha%e no effect"
Sorting y category codes is useful if you did not enter %alue laels for the sugroup
%ariale"
Print %issing
When a sugroup %ariale is missing0 it may e included or e9cluded from the
analysis with the P1 option" When P1^J0 all sugroup %ariales that are missing
1>* Basic 0nalyses StatPac For Windows User's Manual
will e grouped into a uni;ue category and descripti%e statistics for the criterion
%ariale will e reported for the Omissing categoryO"
Category Creation
Sometimes there may e a sugroup category listed in the study design that has no
accompanying data" 8or instance0 noody in the sample may e o%er -0 years old"
Whether or not you want the lael to appear with a count of Bero is a matter of
preference"
4he actual categories 6%alue laels7 in the rea,down analysis can e created either
from the study design %alue laels 6CC^.7 or from the data itself 6CC^@7" When the
categories are created from the laels0 the %alue laels themsel%es will e used to
create the categories for the analysis0 and data that does not match up with a %alue
lael code will e counted as missing" When categories are created from the data0 all
data will e considered %alid whether or not there is a %alue lael for it"
Percentage !ase
!n addition to means and standard de%iations0 the rea,down analysis also prints
counts and percents for each of the categories" 4he denominator for the percentages
can either e the numer of respondents or the total numer of responses" !f P&^'0
the denominator for calculating percentages will e the numer of respondents 6i"e"0
the numer of records in the data file7" !f P&^$0 the denominator will e the total
numer of responses for all indi%iduals"
Labeling 2 $pacing Options
3tion Code Function
.aeling .& Sets the column headings to print the %ariale lael
6.&^A70 the %ariale name 6.&^'70 or the %ariale
numer 6.&^C7"
.aeling Width .W Set the ma9imum width 6in inches7 for the %ariale
laels on the stu when :#^J"
A9act Width AW When AW^J0 the laeling width for the stu will
e e9actly what is specified with the .W option"
When AW^'0 the width of the stu will self-adHust
ased on the length of the stu laels"
Column Spacing CS Sets the spacing 6in inches7 etween the columns
when :#^J"
@ecimal Places @P Sets the numer of decimal digits that will e
shown"
Print Percent Symol PP Sets whether the percent symol is shown"
Print Codes PC Sets whether the codes are printed with the %alue
laels"
.ael Iustification .I Sets the Hustification for the anner %ariale lael
when :#^J"
A9tra Spacing AS When AS^J0 a lan, line will e printed after each
%ariale name or lael on the stu" When AS^'0 no
lan, lines will e printed"
StatPac For Windows User's Manual Basic 0nalyses 1>-
::+S: Co((and
4he t-test is a relati%ely simple statistic to test the difference etween two means
e%en when the sample siBes are small 6less than 307" 4he two %ariales must e
inter%al or ratio-type data" StatPac lets you test the difference if the 'Ds are e;ual or
une;ual" 4he primary ad%antage of the t statistic is that it allows us to test the
difference etween samples with small numers of cases"
4he t distriution depends on the siBe of the samples" With small samples0 the t
distriution is lepto,urticW howe%er0 as the sample siBe e9ceeds 300 the t distriution
approaches that of the normal cur%e" 4he standard error of the difference is used to
estalish a range where the difference etween the true means of the two populations
would e e9pected to fall"
4he significance of the t statistic depends upon the hypothesis the researcher plans to
test" 4his hypothesis should e de%eloped efore collecting the data" !f interested in
determining whether there is a significant difference etween two means0 ut you do
not ,now which of the means is greater0 use the two-tailed test" !f interested in
testing the specific hypothesis that one mean is greater than the other0 use the one-
tailed test"
4here are two asic ,inds of t-testsW one for matched pairs and the other for
independent groups"
:9:est For Matched Pairs
!f each suHect or unit eing tested was measured in oth groups0 then the appropriate
t-test is for matched pairs" 4o perform this type of analysis0 you must enter the data
so that oth oser%ations for a suHect are in the same data record" #n e9ample of an
appropriate use of the t-test for matched pairs might e to compare pretest and
posttest scores where each person too, oth a P$A4AS4 6?17 and a P:S44AS4
6?27" &oth %alues are contained in each data record" #n e9ample of a data file for
this analysis would loo, li,e this5
(292 6record 1 - Pretest ^ (2 = Posttest ^ 927
)-(9 6record 2 - Pretest ^ )- = Posttest ^ (97
22)- 6record 3 - Pretest ^ 22 = Posttest ^ )-7
4he synta9 of the command to perform one or more matched pairs t-tests is5
44AS4 [?ariale list\ W!4< [?ariale list\
4he ,eyword W!4< is mandatory if a %ariale list is specified 6i"e"0 more than one t-
test is re;uested7" !f only one t-test is eing re;uested0 the ,eyword W!4< may e
omitted" !n our pretest-posttest e9ample0 the commands would e5
44AS4 P$A4AS4 W!4< P:S44AS4
44AS4 P$A4AS4 P:S44AS4
44 ?1 W!4< ?2 644AS4 may e are%iated as 447
1>; Basic 0nalyses StatPac For Windows User's Manual
!n a matched pairs t-test0 it does not matter which %ariale is listed first in the
command" !dentical results would e otained with the command5
44AS4 P:S44AS4 W!4< P$A4AS4
When a %ariale list is specified as part of the 44AS4 command0 more than one t-test
analysis will e performed" 8or e9ample0 the following command will perform four
t-test analyses 6?1 with ?90 ?1 with ?230 ?) with ?90 and ?) with ?2375
44AS4 ?1 ?) W!4< ?9 ?23
&'ample of a t Test for %atced Pairs Printout
:9:est For Indeendent Grous
4he other ,ind of t-test is for independent groups and it is used for noncorrelated
data" !f each case in the data file is to e assigned to one group or the other ased on
another %ariale0 use the t-test for independent groups" 8or e9ample0 to compare
reading scores etween males and females0 split the reading scores into two groups
depending upon whether the person is male or female" 6Aach record in the data file is
assigned to one group or the other"7
1(3 6record 1 - male with score of (37
891 6record 2 - female with score of 917
8(3 6record 3 - female with score of (37
4he synta9 for the command to perform an independent groups t-test is5
44AS4 [?ar" list\ W!4< [Frouping %ar" list\^6[Code 1\76[Code 2\7
StatPac For Windows User's Manual Basic 0nalyses 1>'
#s in the matched pairs t-test0 the ,eyword W!4< is only mandatory if a %ariale list
is specified for the analyBed %ariale or the grouping %ariale" !f only one t-test is
re;uested0 its use is optional"
!n the ao%e e9ample0 SC:$A is the %ariale under analysis and SA* is the %ariale
used to assign records to one group or the other" 4he commands to perform this t-test
are5
44AS4 SC:$A W!4< SA*^617687
44AS4 SC:$A W!4< SA*^61Mm768Mf7
!n the second e9ample0 notice that oth upper and lower case codes are specifiedW
they are separated from each other y a slash" 4his is done Hust in case our data entry
operators were not consistent in the way they entered the data" 4hat is0 sometimes a
male was designated with an O1O0 and other times with an OmO" !f you are certain
that upper case was always used0 you could use the first command"
When a %ariale list is specified0 se%eral t-tests will e performed" 8or e9ample0 the
following statement would re;uest three different t-tests etween males and females
6one for each type of score75
44AS4 SC:$A1 SC:$A2 SC:$A3 W!4< SA*^617687
4here is no limit on the numer of codes that can e specified as part of a group" 8or
e9ample0 letDs say an !'C:1A %ariale is coded into fi%e income groups5
What is your annual incomeY
1^>nder Z100000
2^Z100000 - Z200000
3^Z210000 - Z300000
3^Z310000 - Z300000
2^:%er Z300000
4o compare scores for those that ma,e up to Z300000 with those that ma,e o%er
Z300000 per year0 the command would e5
44AS4 SC:$A W!4< !'C:1A^61M2M3763M27
When performing a t-test for independent groups0 the program will accept a wide
%ariety of user styles and formats" 4wo asic formats are possile" 4hese are5
6[Code\M[Code\7 or 6[Code\-[Code\7
#ll of the following would e %alid re;uests when entering the code6s7 or %alue6s7 to
split the data into two groups" 'otice that the reser%ed words .: and <! are %alid
when specifying a range of codes or %alues"
11> Basic 0nalyses StatPac For Windows User's Manual
6#M&M@7 6Place all cases with codes #0 & or @ in this group7
6#-@7 6Place all cases with codes # to @ in this group7
6.:-@7 6Place all cases with codes up to @ in this group7
6--97 6Place all cases with codes --9 in this group7
6.:-217 6Place all cases with up to a 21 in this group7
622-<!7 6Place all cases with a 22 or higher in this group7
&'ample of a t:Test for Independent .roups Printout
Non:Parametric $tatistics
4he non-parametric e;ui%alents of the t-test can e re;uested with the 'P^J option"
Aither the Wilco9on test or the 1ann-Whitney > test will e printed depending on
whether you are performing a matched pairs or independent groups t-test"
4he Wilco9on test for correlated samples is the non-parametric e;ui%alent of the
matched pairs t-test" 4he data is assigned ran, %alues and the differences etween the
ran,s are computed" 4he Wilco9on test statistic is the minimum of positi%e and
negati%e differences in ran,s" !f the numer of cases is greater than or e;ual to ten0
the proaility is calculated from the normal distriution" When there are fewer than
ten cases0 refer to the appendi9 to determine the proaility"
&'ample of -ilco'on $tatistic Printout
4he 1ann-Whitney > test is the non-parametric e;ui%alent of the t-test for
independent groups" !t may e used to e%aluate the difference etween two
population distriutions" 4he data is first ran,ed" 4he 1ann-Whitney > is the
numer of times that one group is smaller than the other"
StatPac For Windows User's Manual Basic 0nalyses 111
8or sample siBes of less than twenty0 refer to the appendi9 to find the proaility of
>" !f the sample siBe is twenty or more0 the distriution appro9imates the normal
distriution0 and the normal de%iate will e used to calculate the proaility" 4he
1ann-Whitney > may e selected y using 1W^J or suppressed y using 1W^'"
&'ample of %ann:-itney , $tatistic Printout
Labeling and $pacing Options
3tion Code Function
.aeling .& Sets the column headings to print the %ariale lael
6.&^A70 the %ariale name 6.&^'70 or the %ariale
numer 6.&^C7"
.aeling Width .W Set the ma9imum width 6in inches7 for the %ariale
laels on the stu"
A9act Width AW When AW^J0 the laeling width for the stu will
e e9actly what is specified with the .W option"
When AW^'0 the width of the stu will self-adHust
ased on the length of the stu laels"
Column Spacing CS Sets the spacing 6in inches7 etween the columns"
@ecimal Places @P Sets the numer of decimal digits that will e
shown"
Print Percent Symol PP Sets whether the percent symol is shown"
.ael Iustification .I Sets the Hustification for the anner laels"
&lan, .ines &etween $ows &. Sets the numer of lan, lines etween each
%ariale on the stu when :#^J"
C3RR+.0:+ Co((and
Correlation is a measure of association etween two %ariales" # correlation
coefficient can e calculated for ordinal0 inter%al or ratio-type data" 4his program can
print descripti%e statistics and a correlation matri9 for up to (( %ariales"
4he synta9 of the command to run a correlation analysis is5
C:$$A.#4A [?ariale list\
8or e9ample0 to run a simple correlation of A@>C#4!:' and !'C:1A0 you could
type the command as5
11& Basic 0nalyses StatPac For Windows User's Manual
C:$$A.#4A A@>C#4!:' !'C:1A
C:$$A.#4A ?10 ?2
C: ?1 ?2 6C:$$A.#4A can e are%iates as C:7
4he correlation program can also correlate more than two %ariales" 8or e9ample0 to
print a correlation matri9 of #FA0 !'C:1A0 #SSA4S and 4AS4-SC:$A0 you
would type the command5
C:$$A.#4A #FA0 !'C:1A0 #SSA4S0 4AS4-SC:$A
4he output would contain a correlation matri9 of all possile cominations of
%ariale pairs" Se%eral statistics can e printed for each pair of %ariales" 4hese are
the correlation coefficient0 numer of %alid records0 standard error of the estimate0 t
statistic and proaility of t"
Type of Correlation Coefficient
StatPac can calculate two different ,inds of correlation coefficients5 SpearmanDs
ran,-difference correlation coefficient and PearsonDs product-moment correlation
coefficient" When calculating a correlation coefficient for ordinal data0 choose
SpearmanDs ran,-difference techni;ue" 8or inter%al or ratio-type data0 select PearsonDs
product-moment formula"
!t is your responsiility to select the appropriate type of statistic" 4his can e
accomplished y using the 4J option" 4he 4J option may e specified as S
6SpearmanDs7 or P 6PearsonDs7" 8or e9ample0 when analyBing inter%al-type %ariales0
type5
:P4!:'S 4J^P
Descriptive $tatistics
@escripti%e statistics can e selected or reHected with the option @S^J or @S^'" !f
PearsonDs product-moment correlation is selected0 the output will include the numer
of records0 mean and standard de%iation" :nly the numer of records will e printed
if SpearmanDs ran,-difference correlation is selected"
&'ample of a Descriptive $tatistics Printout
StatPac For Windows User's Manual Basic 0nalyses 111
$imple Correlation %atri'
4he correlation matri9 may e printed or suppressed with the SC^J or SC^' option
respecti%ely" 1ost of the time0 youDll proaly want to print the correlation matri9"
<owe%er0 there may e times when you only want descripti%e statistics andMor
CronachDs alpha reliaility statistic"
Correlation Coefficient
4he correlation coefficient6s7 can e printed with the CC option" 4he option CC^J
will print the correlation coefficient while CC^' will suppress it"
4he %alue of a correlation coefficient can %ary from minus one to plus one" # minus
one indicates a perfect negati%e correlation0 while a plus one indicates a perfect
positi%e correlation" # correlation of Bero means there is no relationship etween the
two %ariales"
Number Of Cases
4he numer of cases 6records7 used to calculate the correlation coefficient can e
printed with 'C^J" 4his may or may not e the same as the numer of records in the
data file" !f either the * or J %alue is missing from a pair of data0 the record will e
s,ipped and not included in the analysis"
$tandard &rror
4he standard error of the estimate for a correlation coefficient measures the standard
de%iation of the data points as they are distriuted around the regression line" 4he
standard error of the estimate can e used to specify the limits and confidence
inter%al for a correlation coefficient" !t can only e calculated for inter%al or ratio-
type data" 4he standard error can e printed using the option SA^J"
T $tatistic
4he significance of the correlation coefficient is determined from the studentDs t
statistic" 4he formula to calculate the t statistic depends upon which type of
correlation coefficient is specified" 4he t statistic can e printed or not y using the
option 44^J or 44^'0 respecti%ely" #lthough StatPac does not calculate the 8
statistic0 it is simply the s;uare of the t statistic"
Probability Of Cance
4he proaility of the t statistic indicates whether the oser%ed correlation
coefficient occurred y chance if the true correlation is Bero" !t can e printed with
the option P$^J" StatPac uses a two-tailed test to deri%e this proaility from the t
distriution" Proailities of "02 or less are generally considered significant0 implying
that there is a relationship etween the two %ariales"
When the t statistic is calculated for SpearmanDs ran,-difference correlation
coefficient0 there must e at least 30 cases efore the t distriution can e used to
determine the proaility" !f there are fewer than 30 cases0 use the tale in the
appendi9 to find the proaility of the correlation coefficient"
11) Basic 0nalyses StatPac For Windows User's Manual
&'ample of a Correlation %atri' Printout
CronbacBs 4lpa
CronachDs alpha is a measure of the internal consistency of a group of items" !t
pro%ides a uni;ue estimate of reliaility for a gi%en test administration" 4he %alue of
CronachDs alpha may %ary etween Bero and one" !n general0 it is a lower ound to
the reliaility of a scale of items" !n other words0 CronachDs alpha tends to e a %ery
conser%ati%e measure of reliaility"
#s well as eing a measure of the reliaility of a scale of items0 CronachDs alpha
may also e interpreted as an estimate of the correlation of one test with an
alternati%e form containing the same numer of items"
Labeling and $pacing Options
3tion Code Function
.aeling .& Sets the laeling for descripti%e statistics to print
the %ariale lael 6.&^A70 the %ariale name
6.&^'70 or the %ariale numer 6.&^C7"
Column Width CW Sets the minimum width of the columns 6in inches7"
Column Spacing CS Sets the spacing 6in inches7 etween the columns"
@ecimal Places @P Sets the numer of decimal digits that will e
shown"
StatPac For Windows User's Manual Basic 0nalyses 11!
0d,anced 0nalyses
0d,anced 0nalyses Inde2
4he #d%anced #nalyses module adds multi%ariate procedures that are not a%ailale
in the asic StatPac for Windows pac,age" 4hese commands may e used in a
procedure when the #d%anced #nalyses module has een installed"
#':?# Canonical Cluster @iscriminant
8actor .ogit 1ap PC#
Proit $egress Stepwise
R+GR+SS Co((and
4he $AF$ASS command may e used to perform ordinary least s;uares regression
and cur%e fitting" :rdinary least s;uares regression 6also called simple regression7 is
used to e9amine the relationship etween one independent and one dependent
%ariale" #fter performing an analysis0 the regression statistics can e used to predict
the dependent %ariale when the independent %ariale is ,nown"
People use regression on an intuiti%e le%el e%ery day" !n usiness0 a well-dressed man
is thought to e financially successful" # mother ,nows that more sugar in her
childrenDs diet results in higher energy le%els" 4he ease of wa,ing up in the morning
often depends on how late you went to ed the night efore"
Cuantitati%e regression adds precision y de%eloping a mathematical formula that
can e used for predicti%e purposes"
4he synta9 of the command to run a simple regression analysis is5
$AF$ASS [@ependent %ariale\ [!ndependent %ariale\
- or -
$AF$ASS [@ependent %ariale list\ W!4< [!ndependent %ariale list\
8or e9ample0 a medical researcher might want to use ody weight 6?1^WA!F<47 to
predict the most appropriate dose for a new drug 6?2^@:SA7" 4he command to run
the regression would e specified in se%eral ways5
$AF$ASS @:SA W!4< WA!F<4
$AF$ASS @:SA WA!F<4
$A ?2 W!4< ?1 6'ote5 $AF$ASS may e are%iated as $A7
$A ?2 ?1
'otice that the ,eyword W!4< is an optional part of the synta9" <owe%er0 if you
specify a %ariale list for either the dependent or independent %ariale0 the use of the
W!4< ,eyword is mandatory" When a %ariale list is specified0 a separate regression
will e performed for each comination of dependent and independent %ariales"
4he purpose of running the regression is to find a formula that fits the relationship
etween the two %ariales" 4hen you can use that formula to predict %alues for the
dependent %ariale when only the independent %ariale is ,nown"
4he general formula for the linear regression e;uation is5
y ^ a ] 9
where5
9 is the independent %ariale
y is the dependent %ariale
a is the intercept
is the slope
Curve Fitting
8re;uently0 the relationship etween the independent and dependent %ariale is not
linear" Classical e9amples include the traditional sales cur%e0 learning cur%e and
population growth cur%e" !n each case0 linear 6straight-line7 regression would present
a distorted picture of the actual relationship"
Se%eral classical non-linear cur%es are uilt into StatPac and you can simply as, the
program to find the est one" 4ransformations are used to find an e;uation that will
ma,e the relationship etween the %ariales linear" # linear least s;uares regression
can then e performed on the transformed data"
4he process of finding the est transformation is ,nown as Ocur%e fittingO" &asically0
it is an attempt to find a transformation that can e made to the dependent andMor
independent %ariale so that a least s;uares regression will fit the transformed data"
4his can e e9pressed y the e;uation5
6transformed y7 ^ intercept ] slope b 6transformed 97
'otice the similarity to the least s;uares e;uation" 4he difference is that we are
transforming the independent %ariale and predicting a transformed dependent
%ariale" 4o sol%e for y0 use the formula to untransform y and apply it to oth sides
of the e;uation"
11; 0d,anced 0nalyses StatPac For Windows User's Manual
y ^ >ntransformation of 6intercept ] slope b 6transformed 977
!n addition to the uilt-in transformations0 any non-linear relationship that can e
e9pressed as a mathematical formula can e e9plored with the C:1P>4A
statement" !t is possile to transform oth the dependent and independent %ariales
with the C:1P>4A statement"
4he transformations that are uilt into StatPac are ,nown as &o9-Co9
transformations" 4hey are5
3tions :ransfor(ation
4*^# or 4J^# #utomatic
4*^& or 4J^& $eciprocal
4*^C or 4J^C $eciprocal root
4*^@ or 4J^@ $eciprocal fourth root
4*^A or 4J^A .og
4*^8 or 4J^8 8ourth root
4*^F or 4J^F S;uare root
4*^< or 4J^< 'o transformation
4*^! or 4J^! $oust techni;ue 6no transformation7
8or e9ample0 to apply a s;uare root transformation to the independent %ariale and
no transformation to the dependent %ariale0 the options statement would e5
:P4!:'S 4*^F 4J^<
4he following option statement would try to fit your data to a classical S-Cur%e" !t
says to apply a reciprocal transformation to the independent %ariale and a log
transformation to the dependent %ariale5
:P4!:'S 4*^& 4J^A
4he program also contains an automatic feature to search for the est transformation"
When 4* or 4J is set to automatic0 the program will select the transformation that
produces the highest r-s;uared" 4o get a complete tale of all cominations of the
transformations0 set oth 4* and 4J to automatic"
:P4!:'S 4*^# 4J^#
4he result will produce a tale of all possile cominations of transformations and
the $-S;uared statistics5
StatPac For Windows User's Manual 0d,anced 0nalyses 11'
&'ample of a Transformation Table
4he &o9-Co9 transformations can e e9pressed mathematically5
:ransfor(ation Untransfor(ation
$eciprocal B ^ 1M6y],7 y ^ 6B7-1 - ,
$eciprocal root B ^ 1M6y],7d"2 y ^ 6B7d-2 - ,
$eciprocal fourth root B ^ 1M6y],7d"22 y ^ 6B7d-3 - ,
.og B ^ .og6y],7 y ^ A9p6B7 - ,
8ourth root B ^ 6y],7d"22 y ^ 6B7d3 - ,
S;uare root B ^ 6y],7d"2 y ^ 6B7d2 - ,
'otes5
B is the transformed data %alue
y is the original data %alue
, is a constant used in the transformation
4wo cautions should e noted when using transformations"
1" When a reciprocal transformation is used0 the sign of the correlation coefficient
may no longer indicate the direction of the relationship in the untransformed data"
2" Some transformations may not e possile for some data" 8or e9ample0 it is not
possile to ta,e the log or s;uare root of a negati%e numer or the reciprocal of Bero"
When necessary0 StatPac will automatically add a constant to the data to pre%ent this
type of error"
:ne prolem with least s;uares regression is its susceptiility to e9treme or unusual
data %alues" !n many cases0 e%en a single e9treme data %alue can distort the
regression results" # techni;ue called roust regression is included in StatPac to
o%ercome this prolem" $oust regression mathematically adHusts e9treme data
%alues through an iterati%e process" 4he effect is to reduce the distortion in the
regression line caused y the outlying data %alue6s7"
4he roust process ma,es successi%e adHustments to e9treme data %alues y
e9amining the median residual and using a weighted least s;uares regression to
adHust the outliers"
1&> 0d,anced 0nalyses StatPac For Windows User's Manual
!f roust regression is specified for either the 9 or y transformation0 no other uilt-in
transformations will e used 6e%en if a transformation is specified for the other
%ariale7"
$tatistics
4he regression statistics pro%ide the information needed to ade;uately e%aluate the
Ogoodness-of-fitOW that is0 how well the regression line e9plains the actual data" 4he
statistics include correlation information0 descripti%e statistics0 error measures and
regression coefficients" 4his data can e used to predict future %alues for the
dependent %ariale and to de%elop confidence inter%als for the predictions"
&'ample of a $tatistics Printout
Correlation is a measure of association etween two %ariales" StatPac calculates the
Pearson product-moment correlation coefficient" !ts %alue may %ary from minus one
to plus one" # minus one indicates a perfect negati%e correlation0 while a plus one
indicates a perfect positi%e correlation" # correlation of Bero means there is no
relationship etween the two %ariales" When a transformation has een specified0
the correlation coefficient refers to the relationship of the transformed data"
4he coefficient of determination 6r-s;uared7 is the s;uare of the correlation
coefficient" !ts %alue may %ary from Bero to one" !t has the ad%antage o%er the
correlation coefficient in that it may e interpreted directly as the proportion of
%ariance in the dependent %ariale that can e accounted for y the regression
e;uation" 8or e9ample0 an r-s;uared %alue of "39 means that 39` of the %ariance in
the dependent %ariale can e e9plained y the regression e;uation" 4he other 21` is
une9plained error"
4he standard error of estimate for regression measures the amount of %ariaility in
the points around the regression line" !t is the standard de%iation of the data points as
they are distriuted around the regression line" 4he standard error of the estimate can
e used to specify the limits and confidence of any prediction made and is useful to
otain confidence inter%als for yD gi%en a fi9ed %alue of 9"
StatPac For Windows User's Manual 0d,anced 0nalyses 1&1
$egression analysis enales us to predict one %ariale if the other is ,nown" 4he
regression line 6,nown as the Oleast s;uares lineO7 is a plot of the e9pected %alue of
the dependent %ariale for all %alues of the independent %ariale"
4he difference etween the oser%ed and e9pected %alue is called the residual" !t can
e used to calculate %arious measures of error" 4he measures of error in StatPac are
the mean percent error 61PA70 mean asolute percent error 61#PA7 and the mean
s;uared error 61SA7"
>sing the regression e;uation0 the %ariale on the y a9is may e predicted from the
score on the 9 a9is" 4he slope of the regression line 67 is defined as the rise di%ided
y the run" 4he y intercept 6a7 is the point on the y a9is where the regression line
would intercept the y a9is" 4he slope and y intercept are incorporated into the
regression e;uation as5 y ^ a ] 9
4he significance of the slope of the regression line is determined from the studentDs t
statistic" !t is the proaility that the oser%ed correlation coefficient occurred y
chance if the true correlation is Bero" StatPac uses a two-tailed test to deri%e this
proaility from the t distriution" Proailities of "02 or less are generally
considered significant0 implying that there is a relationship etween the two
%ariales" #lthough StatPac does not calculate the 8 statistic0 it is simply the s;uare
of the t statistic for the slope"
Data Table
4he data tale pro%ides a detailed method to e9amine the errors etween the
predicted and actual %alues of the dependent %ariale" StatPac allows printing of the
tale to more closely study the residuals" 4yping the option @4^J will cause the
output to include a data tale"
&'ample of a Data Table
Outlier Definition and 4dDustment
:utliers 6e9treme data points7 can ha%e dramatic effects on the slope of the
regression line" :ne method to deal with outliers is to use roust regression 64*^! or
4J^!7" 4here are two other common methods to deal with outliers" 4he first is to
simply eliminate any records that contain an outlier and then rerun the regression
without those data records" 4he other method is ,nown as data trimming0 where the
highest and lowest e9treme %alues are replaced with a %alue that limits the
standardiBed residual to a predetermined %alue" 4he :# option is used to set the
1&& 0d,anced 0nalyses StatPac For Windows User's Manual
outlier adHustment method" !t may e set to :#^' 6none70 :#^@ 6delete70 or :#^#
6adHust7"
&oth methods use a two-step process" 8irst the regression is performed using the
actual %alues for the dependent %ariale and standardiBed residuals are calculated for
each predicted %alue" When a standardiBed residual e9ceeds a gi%en B-%alue0 the
record is flagged" 4hen the regression is run again and the flagged records are either
eliminated 6:#^@70 or the %alue of the dependent %ariale is adHusted to the %alue
defined y the outlier definition B-%alue 6:#^#7" 8or e9ample0 if the outlier
definition is set to 1"9- standard de%iations 6:@^1"9-70 the upper and lower two and
a half percent of the outliers would e flagged" 4hen the dependent %ariales for the
flagged records would e modified to a %alue that would produce an outlier of plus
or minus 1"9-" 8inally0 the regression would e rerun using the modified dependent
%ariale %alues for the flagged records" 8lagged data records will e shown with an
asteris, in the data tale"
!t is important to note that the outlier adHustment process is only performed once
ecause each regression would produce a new set of standardiBed residuals that
would e9ceed the outlier definition %alue 6:@^B7" 4hat is0 any set of data with
sufficient sample siBe will yield a set of outliers0 e%en if the data has already een
adHusted" #llowing the outlier adHustment process to repeat indefinitely would
e%entually result in an adHustment to nearly e%ery data record"
When outlier adHustment is used0 the program will also report adHusted means and
standard de%iations for the dependent %ariale" 4his refers to the recalculated mean
after deleting or adHusting the data"
Confidence Intervals 2 Confidence Level
Confidence inter%als pro%ide an estimate of %ariaility around the regression line"
'arrow confidence inter%als indicate less %ariaility around the regression line" 4he
option C!^J will include the confidence inter%als in the data tale"
Prediction inter%als0 rather than confidence inter%als0 should e used if you intend to
use the regression information to predict new %alues for the dependent %ariale" &oth
the confidence inter%als and the prediction inter%als are centered on the regression
line0 ut the prediction inter%als are much wider" 4he option C!^P will print the
prediction inter%als in the data tale"
4he actual confidence or prediction inter%al is set with the C. option" 4he C. option
specifies the percentage le%el of the inter%al" 8or e9ample0 if C!^P and C.^920 the
92` prediction inter%als would e printed in the data tale"
Residual 4utocorrelation Function Table
A9amining the autocorrelation of the residuals is often used in time-series analysis to
e%aluate how well the regression wor,ed" !t is a way of loo,ing at the Ogoodness-of-
fitO of the regression line" !f the residuals contain a pattern0 the regression did not do
as well as we might ha%e desired"
# residual autocorrelation tale is the correlation etween %alues that occur at
%arious time lags" 8or e9ample0 at time lag one0 you are loo,ing at the correlation
etween adHacent %aluesW at time lag two0 you are loo,ing at the correlation etween
e%ery other %alue0 etc" 4o select the residual autocorrelation function tale0 type the
option #C^J"
&'ample of a Residual 4utocorrelation Function Table
StatPac For Windows User's Manual 0d,anced 0nalyses 1&1
&'panding $tandard &rror
Jou may use the A* option to set the standard error limits of the residual
autocorrelation function to a fi9ed %alue or to e9pand with increasing time lags"
# study of sampling distriutions on autocorrelated time series was made y &artlett
in 193-" <e found that0 as one goes out further in time0 the standard error increases
with successi%e time lags" 6O4heoretical Specifications of Sampling Properties of
#utocorrelated 4ime SeriesO0 &artlett0 193-"7 !t is only in recent years that his
findings ha%e een accepted y the forecasting community"
When A*^J0 the residual autocorrelation function error limits will widen with each
successi%e time lag" !f A*^'0 the standard error limits will remain constant"
Force Constant to >ero
4he option CL^J can e used to calculate a regression e;uation with the constant
e;ual to Bero" !f this is done0 the regression line is forced through the origin" 'ote
that forcing the constant to Bero disales calculation of the correlation coefficient0 r-
s;uared0 and the standard error of estimate" 8or this reason0 it is not possile to set
the transformation parameter for either the independent or dependent %ariale to
automatic0 ecause there are no r-s;uared statistics to compare" 8urthermore0
confidence inter%als0 which are calculated from the standard error of estimate0 cannot
e computed" 4he option CL^' results in a standard regression e;uation"
$ave Results
1any times researchers want to sa%e results for future study" &y using the option
S$^J0 the predicted %alues0 residuals and confidence or prediction inter%als can e
sa%ed so they can e merged with the original data file" #t the completion of the
analysis0 you will e gi%en the opportunity to merge the predictions and residuals"
Predict Interactively
When performing a regression0 predicting %alues for the dependent %ariale for
specific %alues of the independent %ariale may e desired" 4his is ,nown as
interacti%e prediction" Select interacti%e prediction y entering the option P$^J"
#fter the completion of the taular outputs0 the user will e prompted to enter a
%alue for the independent %ariale" 4he program will predict the %alue for the
1&) 0d,anced 0nalyses StatPac For Windows User's Manual
dependent %ariale ased on the regression e;uation" Confidence andMor prediction
inter%als will also e gi%en"
Labeling and $pacing Options
3tion Code Function
.aeling .& Sets the laeling for descripti%e statistics to print
the %ariale lael 6.&^A70 the %ariale name
6.&^'70 or the %ariale numer 6.&^C7"
@ecimal Places @P Sets the numer of decimal digits that will e
shown"
S:+PWIS+ Co((and
1ultiple regression is an e9tension of simple regression" !t e9amines the relationship
etween a dependent %ariale and two or more e9planatory %ariales 6also called
independent or predictor %ariales7" 1ultiple regression is used to5
1" Predict the %alue of a dependent %ariale using some or all of the independent
%ariales" 4he aim is generally to e9plain the dependent %ariale accurately with as
few independent %ariales as possile"
2" 4o e9amine the influence and relati%e importance of each independent %ariale on
the dependent %ariale" 4his in%ol%es loo,ing at the magnitude and sign of the
standardiBed regression coefficients as well as the significance of the indi%idual
regression coefficients"
4he synta9 of the command to run a stepwise regression is5
S4APW!SA [@ependent %ariale\ [!ndependent %ariale list\
8or e9ample0 we might try to predict annual income 6?1^!'C:1A7 from age
6?2^#FA70 numer of years of school 6?3^SC<::.70 and !C score 6?3^!C7" 4he
command to run the regression could e specified in se%eral different ways5
S4APW!SA !'C:1A0 #FA0 SC<::.0 !C
S4APW!SA ?10?20?30?3
S4 !'C:1A ?2-?3 6'ote5 S4APW!SA may e are%iated as S47
S4APW!SA ?1-?3
!n each e9ample0 the dependent %ariale was specified first0 followed y the
independent %ariale list" 4he %ariale list itself may contain up to 200 independent
%ariales and can consist of %ariale names andMor %ariale numers" Aither a comma
or a space can e used to separate the %ariales from each other"
4he multiple regression e;uation is similar to the simple regression e;uation" 4he
only difference is that there are se%eral predictor %ariales and each one has its own
regression coefficient"
4he multiple regression e;uation is5
StatPac For Windows User's Manual 0d,anced 0nalyses 1&!
JD ^ a ] 1 91 ] 2 92 ] 3 93 ] """ n 9n
where
JD is the predicted %alue
# is a constant
&1 is the estimated regression coefficient for %ariale 1
*1 is the score for %ariale 1
&2 is the estimated regression coefficient for %ariale 2
*2 is the score for %ariale 2
Descriptive $tatistics
4he mean and standard de%iations for all the %ariales in the e;uation can e printed
with the @S^J option"
&'ample of a Descriptive $tatistics Printout
Regression $tatistics
4he regression statistics can e selected with option $S^J" 4hey gi%e us an o%erall
picture of how successful the regression was"
4he coefficient of multiple determination0 fre;uently referred to as r-s&uared0 can e
interpreted directly as the proportion of %ariance in the dependent %ariale that can
e accounted for y the comination of predictor %ariales" # coefficient of multiple
determination of "(2 means that (2 percent of the %ariance in the dependent %ariale
can e e9plained y the comined effects of the independent %arialesW the remaining
12 percent would e une9plained"
4he coefficient of multiple correlation is the s;uare root of the coefficient of multiple
determination" !ts interpretation is similar to the simple correlation coefficient" !t is
asically a measure of association etween the predicted %alue and the actual %alue"
4he standard error of the multiple estimate pro%ides an estimate of the standard
de%iation" !t is used in conHunction with the in%erted matri9 to calculate confidence
inter%als and statistical tests of significance"
1&* 0d,anced 0nalyses StatPac For Windows User's Manual
When there are fewer than 100 records0 StatPac will apply an adHustment to the
ao%e three statistics0 and the adHusted %alue will e printed" 4he adHustment is for a
small n and its %alue should e used"
4he %ariaility of the dependent %ariale is made up of %ariation produced y the
Hoint effects of the independent %ariales and some une9plained %ariance" 4he o%erall
8-test is performed to determine the proaility that the true coefficient of multiple
determination is Bero" 4ypically0 a proaility of "02 or less leads us to reHect the
hypothesis that the regression e;uation does not impro%e our aility to predict the
dependent %ariale"
&'ample of te Regression $tatistics Printout
Regression Coefficients
4he regression coefficients can e printed with the $C^J option" 4he output
includes the constant0 coefficient0 eta weight0 8-ratio0 proaility0 and standard error
for each independent %ariale"
Aach coefficient pro%ides an estimate of the effect of that %ariale 6in the units of the
raw score7 for predicting the dependent %ariale" 4he eta weights0 on the other
hand0 are the standardiBed regression coefficients and represent the relati%e
importance of each independent %ariale in predicting the dependent %ariale"
4he 8-ratio allows us to calculate the proaility that the influence of the predictor
%ariale occurred y chance" 4he t-statistic for each independent %ariale is e;ual to
the s;uare root of its 8-ratio"
4he standard error of the ith regression coefficient can e used to otain confidence
inter%als aout each regression coefficient in conHunction with its 8-ratio"
&'ample of Regression Coefficients Printout
StatPac For Windows User's Manual 0d,anced 0nalyses 1&-
$imple Correlation %atri'
#fter performing a regression analysis0 it is a good idea to re%iew the simple
correlation matri9 6SC^J7" !f two %ariales are highly correlated0 it is possile that
the matri9 is not well conditioned and it might e eneficial to run the regression
again without one of the %ariales" !f the coefficient of multiple determination does
not show a significant change0 you might want to lea%e the %ariale out of the
e;uation"
&'ample of a $imple Correlation Printout
Partial Correlation %atri'
4he partial correlation matri9 6often called the %ariance-co%ariance matri97 is
otained from the in%erse of simple correlation matri9" !t can e selected with the
option PC^J" 4his is useful in studying the correlation etween two %ariales while
holding all the other %ariales constant"
1&; 0d,anced 0nalyses StatPac For Windows User's Manual
# significant partial correlation etween %ariales # and & would e interpreted as
follows5 When all other %ariales are held constant0 there is a significant relationship
etween # and &" 4he partial correlation matri9 will e printed for those %ariales
remaining in the e;uation after the stepwise procedure"
&'ample of a Partial Correlation %atri' Printout
Inverted Correlation %atri'
4he solution to a multiple regression prolem is otained through a techni;ue ,nown
as matri9 in%ersion" 4he in%erted correlation matri9 is the in%ersion of the simple
correlation matri9" !t may e selected with the option !C^J"
!n e9amining the in%erted matri90 we are specifically interested in the %alues along
the diagonal" 4hey pro%ide a measure of how successful the matri9 in%ersion was" !f
all the %alues on the diagonal are close to one0 the in%ersion was %ery successful and
we say the matri9 is Owell conditionedO" !f0 howe%er0 we ha%e one or more diagonal
%alues that are high 6greater than ten70 we ha%e a prolem with collinearity 6high
correlations etween independent %ariales7"
StatPac For Windows User's Manual 0d,anced 0nalyses 1&'
&'ample of an Inverted %atri' Printout
Print &ac $tep
Jou can print the statistics for each step of the stepwise procedure using the option
PS^J" 4his may e important when you want to study how the inclusion or deletion
of a %ariale affects the other %ariales"
&'ample of te Print $teps Output
$ummary Table
# good way to get an o%er%iew of how the steps proceeded and what effect each step
had upon the r-s;uared is to print a summary tale" 4o print the summary tale0 use
the option S4^J"

11> 0d,anced 0nalyses StatPac For Windows User's Manual
&'ample of a $ummary Table
Data Table
4he data tale pro%ides a detailed method to e9amine the residuals" StatPac allows
printing of the tale to more closely study the residuals" >sing the option @4^J will
cause the output to include a data tale"
# OresidualO is the difference etween the oser%ed %alue and the predicted %alue for
the dependent %ariale 6the error in the prediction7" 4he standardiBed residuals which
appear in the data tale are the residuals di%ided y the standard error of the multiple
estimate" 4herefore0 the standardiBed residuals are in standard de%iation units" !n
large samples0 we would e9pect 92 percent of the standardiBed residuals to lie
etween -1"9- and 1"9-"
&'ample of a Data Table
Outlier Definition and 4dDustment
:utliers 6e9treme data points7 can ha%e a dramatic effect on the staility of a
multiple regression model" 4here are two common methods to deal with outliers in
multiple regression models" 4he first is to simply eliminate any records that contain
an outlier and then rerun the regression without those data records" When using
:#^@ 6setting the outlier adHustment to delete70 records containing the highest and
lowest e9treme residuals are deleted from the analysis" 4he other method is where
the dependent %ariale is adHusted for records with the highest and lowest e9treme
residuals" 4hat is0 the dependent %ariale is modified to a %alue that limits the
standardiBed residual to a predetermined %alue" 4he :# option is used to set the
StatPac For Windows User's Manual 0d,anced 0nalyses 111
outlier adHustment method" !t may e set to :#^' 6none70 :#^@ 6delete70 or :#^#
6adHust7"
&oth methods use a two-step process" 8irst the regression is performed using the
actual %alues for the dependent %ariale and standardiBed residuals are calculated for
each predicted %alue" When a standardiBed residual e9ceeds a gi%en B-%alue0 the
record is flagged" 4hen the regression is run again and the flagged records are either
eliminated 6:#^@70 or the %alue of the dependent %ariale is adHusted to the %alue
defined y the outlier definition B-%alue 6:#^#7" 8or e9ample0 if the outlier
definition is set to 1"9- standard de%iations 6:@^1"9-70 the upper and lower two and
a half percent of the outliers would e flagged" 4hen the dependent %ariales for the
flagged records would e modified to a %alue that would produce an outlier of plus
or minus 1"9-" 8inally0 the regression would e rerun using the modified dependent
%ariale %alues for the flagged records" 8lagged data records will e shown with an
asteris, in the data tale"
4he stepwise procedure presents a prolem for data trimming" 4he stepwise
procedure often reduces the numer of independent %ariales to a suset of the
original list of independent %ariales" @ata trimming in%ol%es using the standardiBed
residuals to adHust the %alue of the dependent %ariale for some records" $erunning
the stepwise procedure with different %alues for some of the dependent %ariales
could result in a different set of independent %ariales eing stepped into the model0
especially when there are highly correlated independent %ariales" 4o a%oid this
prolem0 StatPac reruns the multiple regression using the same independent %ariales
selected in the first stepwise procedure" 4hese %ariales are forced into the model so
that the analysis runs in the non-stepwise mode"
!t is important to note that the outlier adHustment process is only performed once
ecause each regression would produce a new set of standardiBed residuals that
would e9ceed the outlier definition %alue 6:@^B7" 4hat is0 any set of data with
sufficient sample siBe will yield a set of outliers0 e%en if the data has already een
adHusted" #llowing the outlier adHustment process to repeat indefinitely would
e%entually result in an adHustment to nearly e%ery data record"
!t is suggested that the user actually e9amine records that are flagged as e9treme
outliers efore allowing the program to ma,e any adHustments" :utlier adHustments
assume that the data for all independent %ariales is acceptale" # mispunched data
%alue for an independent %ariale could result in an e9treme prediction that gets
flagged as an outlier" 4herefore0 %isual inspection is the est way to guarantee the
successful handling of outliers"
Confidence Intervals 2 Confidence Level
Confidence inter%als pro%ide an estimate of %ariaility around the regression line"
'arrow confidence inter%als indicate less %ariaility around the regression line" 4he
option C!^J will include the confidence inter%als in the data tale"
Prediction inter%als0 instead of confidence inter%als0 should e used if you intend to
use the regression information to predict new %alues for the dependent %ariale" &oth
the confidence inter%als and the prediction inter%als are centered on the regression
line0 ut the prediction inter%als are much wider" 4he option C!^P will print the
prediction inter%als in the data tale"
4he actual confidence or prediction inter%al is set with the C. option" 4he C. option
specifies the percentage le%el of the inter%al" 8or e9ample0 if C!^P and C.^920 the
92` prediction inter%als would e printed in the data tale"
11& 0d,anced 0nalyses StatPac For Windows User's Manual
Number of Variables to Force
4he aility to force %ariales into an e;uation is important for se%eral reasons5
1" # researcher often wishes to replicate the analysis of another study and0 therefore0
to force certain core %ariales into the e;uation0 letting stepwise regression choose
from the remaining set"
2" Some %ariales may e cheaper or easier to measure0 and the user may want to see
whether the remaining %ariales add anything to the e;uation"
3" !t is common to force certain design %ariales into the e;uation"
3" When independent %ariales are highly correlated0 one of them may e more
accurate than the rest0 and you may want to force this %ariale into the e;uation"
4he 8: option specifies the numer of %ariales to force into the regression
e;uation" 4o perform a standard 6non-stepwise7 multiple regression0 set the 8:
option to the numer of independent %ariales or higher" 8:^200 will always force
all independent %ariales into the e;uation" 4hus0 the 8: option may e used to
eliminate the stepwise part of the multiple regression procedure" !f you force all
%ariales into the e;uation0 the multiple regression will contain only one step0 where
all %ariales are included in the e;uation"
4he %ariales to e forced are ta,en in order from the list of independent %ariales"
8or instance0 the option 8:^3 forces the first three %ariales from the list of
independent %ariales" 4herefore0 any %ariales you want to force should e
specified at the eginning of the independent %ariale list"
F to &nter 2 F to Remove
When faced with a large numer of possile e9planatory %ariales0 two opposed
criteria of selecting a regression e;uation are usually in%ol%ed5
1" 4o ma,e the e;uation useful for predicti%e purposes0 we would li,e our model to
include as many of the independent %ariales as possile so that reliale fitted %alues
can e determined"
2" &ecause of the costs in%ol%ed in otaining information on a large numer of
independent %ariales0 and suse;uently monitoring them0 we would li,e the
e;uation to include as few of the independent %ariales as possile"
4he compromise etween these two e9tremes is generally called Oselecting the est
regressionO" 4his in%ol%es multiple e9ecutions of multiple regression in an attempt to
add %ariales to impro%e prediction or remo%e %ariales to simplify the regression
function" Stepwise regression pro%ides a partial automation of this procedure"
#n important property of the stepwise procedure is ased on the fact that a %ariale
may e indicated to e significant in an early stage0 and0 thus0 e entered in the
e;uation" #fter se%eral other %ariales are added to the regression e;uation0 howe%er0
the initial %ariale may e indicated to e insignificant" 4he comined effects of two
or more independent %ariales capture the same %ariance as a %ariale entered early
on in the stepwise process" 4his method is often referred to as forward inclusion with
ac,ward elimination"
4he algorithm used y StatPac is as follows5
1" 8irst0 enter into the regression e;uation all %ariales which the user wishes to force
into the e;uation"
2" Anter the predictor that produces the greatest decrease in the residual sum of
s;uares from all remaining predictors whose entry is not inhiited y the 8-to-enter"
StatPac For Windows User's Manual 0d,anced 0nalyses 111
3" $emo%e the predictor that ma,es the least increase in the residual sum of s;uares
from all 6non-forced7 predictors whose remo%al is not inhiited y the 8-to-remo%e
inhiiting rule"
'ote that step 2 is e9ecuted only when it is not possile to e9ecute step 3" !f neither
can e e9ecuted0 the stepping is complete"
4he following should e considered when setting 8-to-enter and 8-to-remo%e %alues
in the parameter tale5
1" # %ariale is remo%ed if the 8-%alue associated with that %ariale is less than the
8-to-remo%e %alue set in the parameter tale" Similarly0 a %ariale is added if the 8-
%alue associated with that %ariale would e greater than the 8-to-enter %alue set in
the parameter if that %ariale were entered in the current e;uation"
2" Care should e ta,en to ensure that the 8-to-remo%e e less than the 8-to-enterW
otherwise0 a %ariale would e entered and then remo%ed at alternate steps"
3" 4he default %alues for the 8-to-enter and 8-to-remo%e for many mainframe
pac,ages and StatPac are 3"0 and 3"90 respecti%ely0 which pro%ide useful starting
%alues"
3" 8orcing all %ariales in an e;uation will gi%e the usual 6non-stepwise7 multiple
regression results"
2" Setting the 8-to-remo%e %alue low yields the forward inclusion method"
-" 8or the first run on a data set0 it is common to set the 8-to-enter and 8-to-remo%e
%alues low to e9ecute a large numer of steps"
Residual 4utocorrelation Function Table
A9amining the autocorrelation of the residuals is often used in time-series analysis to
e%aluate how well the regression wor,ed" !t is a way of loo,ing at the Ogoodness-of-
fitO of the regression line" !f the residuals contain a pattern0 the regression did not do
as well as we might ha%e desired"
# residual autocorrelation function tale contains the correlation etween %alues that
occur at %arious time lags" 8or e9ample0 at time lag one0 you are loo,ing at the
correlation etween adHacent %aluesW at time lag two0 you are loo,ing at the
correlation etween e%ery other %alue0 etc" 4o select the residual autocorrelation
function plot0 type the option #C^J"
&'ample of a Residual 4utocorrelation Function Table
11) 0d,anced 0nalyses StatPac For Windows User's Manual
&'panding $tandard &rror
Jou may use the A* option to set the standard error limits of the residual
autocorrelation function to a fi9ed %alue or to e9pand with increasing time lags"
# study of sampling distriutions on autocorrelated time series was made y &artlett
in 193-" <e found that0 as one goes out further in time0 the standard error increases
with successi%e time lags" 6O4heoretical Specifications of Sampling Properties of
#utocorrelated 4ime SeriesO0 &artlett0 193-"7 !t is only in recent years that his
findings ha%e een accepted y the forecasting community"
When A*^J0 the residual autocorrelation function error limits will widen with each
successi%e time lag" !f A*^'0 the standard error limits will remain constant"
$ave Residuals
$esearchers often want to sa%e the residuals in a file for further study" !f further
analysis of the residuals shows a pattern0 the regression may not ha%e captured all the
%ariance it might ha%e0 and we may want to model the residuals to further e9plain the
%ariance"
Jou can sa%e the results in a file with the options command S$^J" 4he dependent
%ariales0 predicted %alues0 residuals and confidence or prediction inter%als will e
sa%ed0 and at the completion of the procedure you will e offered the opportunity to
merge the sa%ed data into the original data file" in the new file"
Force Constant to >ero
4he option CL^J can e used to calculate a regression e;uation with the constant
e;ual to Bero" !f this is done0 the regression line is forced through the origin" 'ote
that forcing the constant to Bero disales calculation of the r-s;uared0 coefficient of
multiple correlation and the standard error of estimate" 8urthermore0 confidence
inter%als0 which are calculated from the standard error of estimate0 cannot e
computed" 4he option CL^' results in a standard regression e;uation"
%ean $ubstitution
1ean sustitution is one method often used to reduce the prolem of missing
information" :ften0 multiple regression research is difficult ecause if one
independent %ariale is not ,nown0 it is necessary to e9clude the whole record from
the analysis" !t is possile that this can sustantially reduce the numer of records
that are included in the analysis" 1ean sustitution o%ercomes this prolem y
replacing any missing independent %ariale with the mean of that %ariale" While
this techni;ue has the possiility of slightly distorting the results0 it can ma,e it
possile to perform a regression with sustantial missing data"
$teps Limit
4he steps limit is simply the ma9imum numer of steps that can occur" Aach
inclusion and deletion of a %ariale is counted as one step" 4he purpose of the steps
limit is to limit computer time" 4he synta9 for the steps limit option is S.^n0 where n
is the ma9imum numer of steps allowed"
Predict Interactively
#fter performing a regression0 you may want to predict %alues for the dependent
%ariale" 4his is ,nown as interacti%e prediction" Select interacti%e prediction y
StatPac For Windows User's Manual 0d,anced 0nalyses 11!
entering the option P$^J" Jou will then e prompted to enter a %alue for each
independent %ariale0 and the computer will use the regression coefficients to predict
the dependent %ariale"
Labeling and $pacing Options
3tion Code Function
.aeling .& Sets the laeling for descripti%e statistics to print
the %ariale lael 6.&^A70 the %ariale name
6.&^'70 or the %ariale numer 6.&^C7"
Column Width CW Sets the minimum width of the columns 6in inches7"
Column Spacing CS Sets the spacing 6in inches7 etween the columns"
@ecimal Places @P Sets the numer of decimal digits that will e
shown"
.3GI: and PR3BI: Co((ands
Proit and logistic regression analyses e9amine the relationship etween a
dichotomous dependent %ariale 6ta,es on only two %alues7 and one or more
e9planatory %ariales 6also called independent or predictor %ariales7" When the
dichotomous %ariale 6dependent %ariale7 is coded as 0 or 10 its predicted %alue
from proit or logistic regression is the estimated proaility of it eing 1"
Proit and logistic regressions are often used to answer yesMno type ;uestions" 8or
e9ample5 a an,er wants to decide whether or not to ma,e a loan0 or a scientist wants
to predict whether the rat li%es or dies" &oth ;uestions are yesMno and could e coded
as Bero or one"
@eciding etween proit or logistic regression is a matter of choice" !n logistic
regression0 the estimated %alue of the dependent %ariale is ased on the cumulati%e
logistic distriution0 and in proit regression it is ased on the cumulati%e normal
distriution" 4he logistic distriution is scarcely distinguishale from the cumulati%e
normal distriution etween response rates of "01 and "990 and therefore0 the choice
of proit or logistic regression is usually made on the asis of which techni;ue the
user is most familiar with"
4he synta9 of the commands and options to run proit or logistic regression are
identical5
P$:&!4 [@ependent %ariale\ [!ndependent %ariale list\
.:F!4 [@ependent %ariale\ [!ndependent %ariale list\
8or e9ample0 a an,er might want to predict successful loan repayment 6?3^.:#'
P#J&#CE7 from pre%ious loan e9perience 6?1^A*PA$!A'CA70 numer of credit
cards 6?2^C$A@!4 C#$@S70 and an, alance 6?3^&#.#'CA7" 4he command to
run the regression could e specified in se%eral ways"
P$:&!4 .:#' P#J&#CE0 A*PA$!A'CA0 C$A@!4 C#$@S0
&#.#'CA
P$:&!4 ?30 ?1-?3 6'ote5 P$:&!4 may e are%iated as P$7
11* 0d,anced 0nalyses StatPac For Windows User's Manual
.:F!4 .:#' P#J&#CE ?1-?3
.: ?3 ?1 ?2 ?3 6'ote5 .:F!4 may e are%iated as .:7
!n each e9ample0 the dependent %ariale is specified first0 followed y the
independent %ariale list" 4he %ariale list may contain up to 200 independent
%ariales and can consist of %ariale names andMor numers" Aither a comma or a
space can e used to separate the %ariales from each other"
When using proit or logistic regression0 the dependent %ariale is always coded as 0
or 1" $egular multiple linear regression0 with the dependent %ariale coded as 0 or 10
is inappropriate for the following reasons5
1" Astimated proailities using multiple regression are not restricted to the inter%al
60017" >sing multiple linear regression0 it is ;uite possile to get an estimated
proaility of greater than one or less than Bero" !t would e difficult to interpret this
as an estimated proaility" >nfortunately0 it is ;uite common for 10` to 20` of the
estimated proailities to lie outside the unit inter%al when employing multiple
regression with a 60017 dependent %ariale"
2" Astimated proailities using multiple regression are e9ceptionally sensiti%e to the
oser%ed distriution of the dependent %ariale 6i"e"0 %ery small or %ery large mean
for the dependent %ariale7"
3" Standard multiple regression assumes that the effect of the independent %ariales
is constant o%er the entire range of the predicted dependent %ariale" Proit and
logistic regression0 on the other hand0 assume that the effects of the independent
%ariales %ary 6i"e"0 nonlinear multiple regression7"
!n summary0 there are two assumptions we ma,e when using proit or logistic
regression analysis5
1" the dependent %ariale of a record is assumed to e most fle9ile when its
estimated proaility is near one-half 6i"e"0 the effect of an independent %ariale is
e9pected to e highest when its estimate of proaility is one-half7"
!n cases when the outcome of the e%ent seems certain 6e"g" P["1 or P\"9 7 the
e9planatory %ariales ha%e a smaller impact on changing the proaility than the
cases where the outcome is less certain" !f the proaility of an e%ent is "90 we are in
a stage of diminishing return to increasing its proaility"
2" the effect of an independent %ariale depends on the estimated proaility"
Descriptive $tatistics
@escripti%e statistics will e printed as part of the proit or logistic regression output
if the option @S^J is specified"

StatPac For Windows User's Manual 0d,anced 0nalyses 11-
&'ample of Descriptive $tatistics Printout
4he e9ample is an analysis loo,ing at cancer remission data" 4he oHecti%e of the
analysis is to assess the proaility of complete cancer remission 6$A1!SS!:'7 on
3 patient characteristics 6CA..0 .!4<!>1 and 4A1PA$#4>$A7"
4he output re%eals that there were 9 cases with cancer remission 6@?^17 and 1(
cases without cancer remission 6@?^070 for a total of 2) cases" 8rom the descripti%e
statistics0 we can see that $A1!SS!:' appears associated with high mean %alues for
CA.. and .!4<!>10 and a low mean %alue for 4A1PA$#4>$A"
$imple Correlation %atri'
4he simple correlation matri9 can e re;uested with the option SC^J" 4he simple
correlation output can e used to e9amine the relationships etween the independent
%ariales"
&'ample of a $imple Correlation %atri' Printout
Regression Information
4he regression coefficients and their standard errors are automatically included in
each analysis" 4he output also includes the t statistic and its proaility" 4he t
statistic for an independent %ariale is its coefficient di%ided y its standard error"
11; 0d,anced 0nalyses StatPac For Windows User's Manual
&'ample of a Regression Information Printout
4he chi-s;uare statistic is used to measure the o%erall significance of the e;uation in
e9plaining the dependent %ariale" 4his statistic is e;ui%alent to the o%erall 8-ratio in
multiple regression and tests whether the set of independent %ariales as a group
contriutes significantly to the e9planation of the dependent %ariale"
Astimates of the regression coefficients are otained y ma9imiBing the log of the
li,elihood function using the iterati%e 'ewton-$aphson method of scoring"
Con%ergence is said to ha%e occurred if the change in the log of the li,elihood
function on successi%e iterations is less than or e;ual to the tolerance le%el set in the
parameter file" 4he tolerance le%el can e set etween "001 and "000000001"
Cange in Probability Table
4he change in proaility tale may e selected with the option P4^J" #s indicated
earlier0 the independent %ariale has its ma9imum effect when the estimated
proaility is one-half" >sing the change in proaility tale0 we can study how the
proaility changes when there is a change in the %alue of an independent %ariale"
&'ample of a Cange in Probability Table
4he tale re%eals how a one unit increase in each independent %ariale will affect the
proaility of the dependent %ariale"
!n the sample printout0 note that if the estimated proaility of cancer remission for
an indi%idual is "20 a one unit increase in the independent %ariale ?3 is e9pected to
increase the predicted proaility y "(9(12" 8or that same indi%idual0 an increase
of "1 in ?3 would e e9pected to increase the predicted %alue of $A1!SS!:' y "
(9(12 times "1 ^ "0(9(12"
!f the estimated proaility of cancer remission for an indi%idual is "90 a "1 increase
in ?3 is e9pected to increase the predicted proaility y only "039201 6"39201 times
StatPac For Windows User's Manual 0d,anced 0nalyses 11'
"17" 4he first column in the OChange in ProailityO tale is always the effect of the
independent %ariale e%aluated at the sample mean of the dependent %ariale 6"3333
for this e9ample7"
Classification Table
4he classification tale may e selected with the option C4^J" !t gi%es the fre;uency
distriution of the oser%ed %alue of the dependent %ariale 60 or 17 %ersus its
predicted %alue ased on the set of independent %ariales" !f the dependent %ariale
is well e9plained y the set of independent %ariales0 we e9pect5
1" 4he fre;uencies in the first row of the tale 6oser%ed %alue of @?^07 to e
clustered in the first few columns"
2" 4he fre;uencies in the last row of the tale 6oser%ed %alue of @?^17 to e
clustered in the last few columns"
&'ample of a Classification Table Printout
%ean $ubstitution
1ean sustitution is one method often used to reduce the prolem of missing
information" :ften0 regression analysis is difficult ecause if one independent
%ariale is not ,nown0 it is necessary to e9clude the whole record from the analysis"
!t is possile that this can sustantially reduce the numer of records that are
included in the analysis" 1ean sustitution o%ercomes this prolem y replacing any
missing independent %ariale with the mean of that %ariale" While this techni;ue
has the possiility of slightly distorting the results0 it can ma,e it possile to perform
a regression with sustantial missing data"
Convergence Tolerance
4he con%ergence tolerance is used to find the ma9imum log of the li,elihood
function" !t may e set using the option 4.^n0 where n is the con%ergence tolerance"
# good initial %alue to use is "0000001"
4he %alue of the con%ergence tolerance is %ery important" 4oo high a %alue does not
result in the ma9imum of the li,elihood function0 while too small a %alue results in
an iterati%e procedure which drifts aout the ma9imum" !f this is the case0 the
program will start hal%ing0 wor,ing towards the pre%ious 6higher7 %alue of the log of
the li,elihood function" # message will e printed as follows5
1)> 0d,anced 0nalyses StatPac For Windows User's Manual
Results are not based on last iteration but on a previous iteration wic ad a iger
value !or te log likeliood !unction. Convergence assumed a!ter x iterations
4he ao%e message will also e printed if the iterations donDt con%erge" 4his is
usually due to one 6or more7 of the following reasons5
1" Some of the e9planatory %ariales are highly correlated" A9amination of the
correlation matri9 in conHunction with collinearity diagnostics 6such as those found
in principal components and multicollinearity analyses7 will usually indicate a
%ariale which should ha%e een omitted or transformed"
2" 4he response surface is %ery flatW this is usually due to the %ariales as a group
eing poor predictors of the dependent %ariale" 4here is then no significant
ma9imum to find"
3" # %ariale may ha%e %ery little %ariaility and0 therefore0 e highly correlated with
the constant term"
3" 4he iteration may go too far and s,ip the ma9imum point" 4his is usually due to
setting the %alue too low" #lthough the message is printed0 it is not usually a prolem
since StatPac always sa%es the %alue of the regression coefficients at the ma9imum
%alue of the log li,elihood and attempts hal%ing towards the ma9imum point"
Iteration Limit
4he ma9imum numer of iterations can e set from 1 to 100 as a safeguard against a
flat surface where iterations might proceed indefinitely" With the con%ergence
tolerance set at 0"00000010 the numer of iterations re;uired for con%ergence usually
%aries from 3 to 12" Setting the ma9imum numer of iterations around 30 is
ade;uate" !t should e noted that the data is read from dis, with each iteration" 4he
amount of time to e9ecute one iteration is aout the same as the amount of time it
ta,es to run a multiple regression with the same numer of %ariales and cases"
$ave Probabilities
$esearchers often want to sa%e the proailities in a file for further study" When
S$^J0 you will e offered the opportunity to merge the predicted proailities into
the original data file at the completion of the analysis"
Predict Interactively
#fter performing a regression0 you may want to predict %alues for the dependent
%ariale" Select interacti%e prediction y entering the option P$^J" #t the
completion of the analysis0 you will then e prompted to enter a %alue for each
independent %ariale0 and the computer will use the regression coefficients and
cumulati%e normal distriution 6for proit7 or the cumulati%e logistic distriution 6for
logit7 to predict the proaility that the %alue of the dependent %ariale is e;ual to
one"
StatPac For Windows User's Manual 0d,anced 0nalyses 1)1
Labeling and $pacing Options
3tion Code Function
.aeling .& Sets the laeling for descripti%e statistics to print
the %ariale lael 6.&^A70 the %ariale name
6.&^'70 or the %ariale numer 6.&^C7"
Column Width CW Sets the minimum width of the columns 6in inches7"
Column Spacing CS Sets the spacing 6in inches7 etween the columns"
@ecimal Places @P Sets the numer of decimal digits that will e
shown"
PC0 Co((and
Principal components analysis 6PC#7 in%estigates relationships among %ariales
without designating some as independent and others as dependentW instead PC#
e9amines relationships within a single set of %ariales" 4he techni;ue of PC# is
primarily used to reduce the numer of dimensions" >sually0 most of the %ariation in
a large group of %ariales can e captured with only a few principal components" >p
to 200 %ariales can e analyBed"
4his techni;ue asically attempts to e9plain the %ariance-co%ariance structure of
%ariales y constructing a smaller set of orthogonal 6independent7 linear
cominations 6principal components7 of the original %ariales" 4he first principal
component 6PC7 is that weighted comination of response %ariales which accounts
for the ma9imum amount of total %ariation in the original %ariales" 4he second PC
is that weighted comination of response %ariales which0 among all cominations
orthogonal to the first0 accounts for the ma9imum amount of remaining %ariation"
4he synta9 to run a principal components analysis is5
PC# [?ariale list\
8or e9ample0 after conducting a lengthy sur%ey0 we might elie%e that se%eral of the
;uestions were actually measuring the same thing" Principal components could e
used to isolate those ;uestions that were measuring the same dimension" 4a,e the
following ;uestions from a larger twenty-fi%e ;uestion sur%ey5
11" What is your annual incomeY
12" What percent of your salary do you pay in ta9esY
13" <ow much discretionary income do you ha%eY
13" What is the mar,et %alue of your houseY
12" <ow much disaility insurance do you carryY
#ll of the ao%e ;uestions might e measuring a dimension related to income" !f a
principal components analysis e9tracted these %ariales into one component0 we
might try to shorten future sur%eys y as,ing fewer ;uestions aout income" 4he
command to run the principal components analysis would e5
1)& 0d,anced 0nalyses StatPac For Windows User's Manual
PC# ?1-?22
PC ?1-?22 6'ote5 PC# may e are%iated as PC7
'otice that all the ;uestions in the sur%ey were specified as part of the %ariale list" !t
is the Ho of PC# to e9tract the indi%idual components"
# component is the weighted comination of %ariales which e9plains the ma9imum
amount of remaining %ariation in the original %ariales 6orthogonal to the pre%ious
components7" 4hat is0 each component is mutually independent from all other
components" 1athematically0 the prolem is one of e9plaining the %ariance-
co%ariance structure of the %ariales through linear cominations of the %ariales"
Primary interest lies in the algeraic sign and magnitude of the principal component
coefficients 6loadings70 and in the total %ariation in the dependency structure
e9plained y a component"
Frouping of %ariales is ased on the magnitude of the loadings associated with each
principal component" .oadings elow "30 are usually disregarded for purposes of
interpretation" .oadings are comparale to standardiBed partial regression
coefficients" 4he sign and magnitude of each loading re%eals how the particular
%ariale is associated with that principal component" # loading may e interpreted
li,e a correlation coefficient in that it shows the strength and direction of the
relationship etween a gi%en %ariale and the principal component"
Fenerally0 during study design0 concepts or constructs are identified as part of the
study goals" ?ariales are de%eloped to answer the study goals" Principal components
analysis can e used to e%aluate how well each %ariale is associated with the
construct it was designed to measure" !n a well structured sur%ey0 each %ariale will
ha%e a high loading on only one construct 6the one it was designed to measure7"
When a %ariale has a high loading on more than one principal component0 the
%ariale did not do a good Ho of discriminating etween two or more constructs
Principal Components
Aither the correlation matri9 or co%ariance matri9 may e used for deri%ing principal
components" !f the responses are in similar units0 the co%ariance matri9 has a greater
statistical appeal" When the responses are in widely different units 6age in years0
weight in ,ilograms0 height in centimeters0 etc"7 the correlation matri9 should e
used" !n practice0 the use of the correlation matri9 is more common"
4he PC option may e set to one of four %alues5
# ^ Correlation matri9
& ^ Co%ariance matri9 with mean correction
C ^ Co%ariance matri9 without mean correction
@ ^ PC# not re;uested
StatPac For Windows User's Manual 0d,anced 0nalyses 1)1
&'ample of Principal Components Printout
!n the e9ample ao%e0 PC# was run on %ariales 2 to ) of the .ongley data" 4he
correlation matri9 was used 6PC^#7 ecause the %ariales were in widely different
units"
'ote that the first two principal components account for 9-"3` of the total %ariation
in the dependency structure of the si9 %ariales" 4he first PC has e;ually high
loadings on all %ariales e9cept %ariale 3 6siBe of the armed forces7" 4his
component can e interpreted as an economic performance indicator" !t is common
for the first PC to load e;ually on most %ariales" 4he second component has high
loadings on %ariale 3 6-"(07 and %ariale 3 6"-07 and the signs are different0 implying
that there is a high relationship etween siBe of the armed forces and unemployment"
4he fact that the signs are different implies that as siBe of the armed forces goes up0
unemployment goes down 6as e9pected7" 4he remaining four PCDs account for less
than 3` of the total %ariaility and are ignored"
8ollowing are some e9amples of the common uses of principal components analysis5
1" 4he most common use of principal components analysis is to deri%e a small
numer of linear cominations 6principal components7 from a set of %ariales that
retain as much of the information in the original %ariales as possile" :ften a small
numer of principal components can e used in place of the original %ariales for
plotting0 regression0 clustering0 etc"
2" Principal components analysis can also e %iewed as an attempt to unco%er
appro9imate linear dependencies among %ariales 6i"e"0 to understand the correlation
structure7" 4he multicollinearity diagnostics descried elow are ased on the
principal components"
3" !t is often impossile to measure certain theoretical concepts0 ut many 6highly
interrelated7 %ariales may e a%ailale to pro%ide a mathematical formula for the
theoretical concept" Principal components can e used to determine appropriate
weights associated with each of these %ariales to pro%ide an OoptimumO measure of
a theoretical concept0 such as mathematical aility" !n essence0 PC# otains
components which may e gi%en special meaning"
1)) 0d,anced 0nalyses StatPac For Windows User's Manual
3" &ecause the principal components are independent of each other0 they may help to
circum%ent the prolem of multicollinearity" 1ost of the %ariation in the %ariales is
accounted for y the first few principal components" 4he last few principal
components define dimensions of the regressor space that are not %ery prominent -
the components are so flimsy that they can e lown around wildly y small
perturations in the data" 4o get rid of the instaility of the estimates0 you throw
away the last few components" 4here are as many principal components as original
%ariales0 ut usually only a small numer of components are retained"
2" Principal components analysis is similar to factor analysis in that they oth
pro%ide analysis of the interdependence structure of a set of %ariales" !n factor
analysis0 it is assumed that each original %ariale is influenced y %arious factors"
Some are shared y other %ariales in the set 6common factors70 while others are not
shared y any other %ariale 6uni;ue factors7" !n PC#0 on the other hand0 no
assumptions aout the underlying structure of the %ariales are made" We define new
hypothetical %ariales that are e9act mathematical transformations of the original
%ariales0 ut that are independent of each other" 4hat is0 we see, that set of linear
cominations of the original %ariales that asor and account for the ma9imum
possile proportion of total %ariation in those %ariales"
4he first principal component is the single est summary of the total %arianceW the
second principal component is the est summary of the %ariance remaining after the
first principal component has een e9tracted" Suse;uent components are defined
similarly until all the %ariance in the data is e9hausted"
Descriptive $tatistics
@escripti%e statistics may e printed or suppressed using the @S^J or @S^' option
respecti%ely"
&'ample of Descriptive $tatistics Printout
$imple Correlation %atri'
4he simple correlation matri9 6SC^J7 is the easiest way of e9amining linear
dependencies etween the %ariales" <igh intercorrelations etween %ariales is a
warning sign that collinearity might e9ist"
&'ample of a $imple Correlation Printout
StatPac For Windows User's Manual 0d,anced 0nalyses 1)!
Collinearity Diagnostics
1ulticollinearity refers to the presence of highly intercorrelated predictor %ariales
in regression models0 and its effect is to in%alidate some of the asic assumptions
underlying their mathematical estimation" !t is not surprising that it is considered to
e one of the most se%ere prolem in multiple regression models and is often
referred to y social modelers as the Ofamiliar curseO" Collinearity diagnostics
measure how much regressors are related to other regressors and how this affects the
staility and %ariance of the regression estimates"
Signs of multicollinearity in a regression analysis include5
1" .arge standard errors on the regression coefficient0 so that estimates of the true
model parameters ecome unstale and low t-%alues pre%ail"
2" 4he parameter estimates %ary consideraly from sample to sample"
3" :ften there will e drastic changes in the regression estimates after only minor
data re%ision"
3" Conflicting conclusions will e reached from the usual tests of significance 6such
as the wrong sign for a parameter7"
2" A9treme correlations etween pairs of %ariales"
-" :mitting a %ariale from the e;uation results in smaller regression standard errors"
)" # good fit not pro%iding good forecasts"
We use the multicollinearity diagnostics5
1" 4o produce a set of condition indices that signal the presence of one or more near
dependencies among the %ariales" 6.inear dependency0 an e9treme form of
multicollinearity0 occurs when there is an e9act linear relationship among the
%ariales"7
2" 4o unco%er those %ariales that are in%ol%ed in particular near dependencies and to
assess the degree to which the estimated regression coefficients are eing degraded
y the presence of the near dependencies"
1)* 0d,anced 0nalyses StatPac For Windows User's Manual
!n practice0 if one independent %ariale has a high s;uared multiple correlation 6r-
s;uared7 with the other independent %ariales0 it is e9tremely unli,ely that the
independent %ariale in ;uestion contriutes significantly to the prediction e;uation"
When the r-s;uared is too high0 the %ariale is0 in essence0 redundant"
When the collinearity analysis is re;uested with the C@^J option0 the statistics
attriuted to &elsley0 Euh and Welsch 619(07 are printed 6namely the eigen%alues0
condition indices and the decomposition of the %ariances of the estimates with
respect to each eigen%alue7"
&'ample of Collinearity Diagnostics
'ote that %ariales 2030- and ) are highly correlated and the ?!8Ds for all %ariales
6e9cept %ariale 37 are greater than 10 with one of them eing greater than 1000"
A9amination of the condition inde9 column re%eals a dominating dependency
situation with high numers for se%eral indices" 8urther regressions on susets of the
independent %ariales are called for"
4he following steps are generally recommended in diagnosing multicollinearity5
1" !nspection of the correlation matri9 for high pairwise correlationsW this is not
sufficient0 howe%er0 since multicollinearity can e9ist with no pairwise correlations
eing high"
2" ?!8Ds greater than 10 are a sign of multicollinearity" 4he higher the %alue of ?!8Ds0
the more se%ere the prolem" !n the StatPac output0 any ?!8 greater than 999"99999
is set to the %alue 999"99999"
3" Condition indices of 30 to 100 6generally indicating moderate to strong
collinearities7 comined with at least 2 high numers 6say greater than 0"27 in a
O%ariance proportionO row are a sign of multicollinearity" 4he higher the condition
indices0 the more se%ere the multicollinearity prolem" 4hree cases can e
distinguished5
Case 15 :nly one near dependency present
4his occurs when only one condition inde9 is greater than 30" # %ariale is in%ol%ed
in0 and its estimated coefficient degraded y0 the single near dependency if it is one
of two or more %ariales in a row with O%ariance proportionO numers in e9cess of
some threshold %alue0 such as "2 "
StatPac For Windows User's Manual 0d,anced 0nalyses 1)-
Case 25 Competing dependencies
4his occurs with more than one condition inde9 of roughly the same magnitude and
greater than 30" <ere0 in%ol%ement is determined y aggregating the O%ariance
proportionO numers of each %ariale o%er the high condition inde9 rows" 4he
%ariales whose aggregate proportions e9ceed 0"2 are in%ol%ed in at least one of the
dependencies0 and therefore0 ha%e degraded coefficient estimates" 4he numer of
near dependencies present corresponds to the numer of competing indices"
Case 35 @ominating dependencies
@ominating dependencies e9ist when high condition indices 6o%er 307 coe9ist with
e%en larger condition indices" 4he dominating dependency can ecome the prime
determinant of the %ariance of a gi%en coefficient and oscure information aout the
simultaneous in%ol%ement in a wea,er dependency" !n this case0 other %ariales can
ha%e their Hoint in%ol%ement oscured y the dominating near dependency" With this
dominating near dependency remo%ed0 the oscured relationship may reappear" !n
this case0 additional analysis0 such as au9iliary regressions0 is warranted to
in%estigate the descripti%e relations among all of the %ariales potentially in%ol%ed"
Since the %ariance of any regression coefficient depends on regression residual error0
sample siBe0 and the e9tent of multicollinearity0 the following are suggested as
possiilities for increasing the precision of the regression coefficients5
1" Can the precision of measurement of any %ariale e impro%edY 4his has the
effect of reducing regression residual error"
2" Can the model specification e impro%edY <a%e we0 for e9ample0 omitted an
important %ariale or transformed the %ariales appropriately 6using logs0 reciprocal0
etc"7 to match theoryY
3" Can we increase the sample siBe0 therey decreasing mean s;uare residual errorY
3" Can we replace a %ariale with another less correlated with the current set of
independent %ariales0 ut as correlated with the dependent %arialeY
2" # group of %ariales 6highly intercorrelated7 may e aggregated 6or a%eraged70
using principal components or factor analysis to find appropriate weights" 4his is
especially true of %ariales measured in the same units0 such as income"
-" &ecause multicollinearity indicates that some independent %ariales con%ey little
information o%er that of the other %ariales0 one way to scale down %ariales is to
drop a redundant %ariale"
Include Intercept
# collinearity with the constant term occurs ecause some linear comination of two
or more %ariales is essentially constant" 4his situation can e detected y omitting
the intercept from the collinearity analysis 6set with the !C^' option70 and then
e9amining the standard de%iations or coefficients of %ariation 6standard errorMmean7
of the %ariales"
Variance Inflation Factors
?ariance inflation factors show the degree to which a regression coefficient will e
affected ecause of the %arialeDs redundancy with other independent %ariales" #s
the s;uared multiple correlation of any predictor %ariale with the other predictors
approaches unity0 the corresponding ?!8 ecomes infinite"
8or any predictor orthogonal 6independent7 to all other predictors0 the %ariance
inflation factor is 1"0" ?!8i thus pro%ides us with a measure of how many times
1); 0d,anced 0nalyses StatPac For Windows User's Manual
larger the %ariance of the ith regression coefficient will e for multicollinear data
than for orthogonal data 6where each ?!8 is 1"07" !f the ?!8Ds are not unusually larger
than 1"00 multicollinearity is not a prolem" #n ad%antage of ,nowing the ?!8 for
each %ariale is that it gi%es a tangile idea of how much of the %ariances of the
estimated coefficients are degraded y the multicollinearity" ?!8Ds may e printed
using the ?!^J option"
$ave $cores
$esearchers often want to create principal component scores for respondents" 4his
pro%ides an indication of how strongly an indi%idual loads on each component" 4he
data is first standardiBed and the principal component loadings are used as
coefficients for calculating the component score"
Jou can sa%e the component scores with the options command SS^J" #t the
completion of the analysis you will e gi%en the opportunity to merge to component
scores with the original data file""
%ean $ubstitution
1ean sustitution is one method often used to reduce the prolem of missing
information" >sually0 if one independent %ariale is not ,nown0 it is necessary to
e9clude the whole record from the analysis" !t is possile that this can sustantially
reduce the numer of records that are included in the analysis" 1ean sustitution
o%ercomes this prolem y replacing any missing %ariale with the mean of that
%ariale" While this techni;ue has the possiility of slightly distorting the results0 it
can ma,e it possile to perform a principal components analysis with sustantial
missing data"
Labeling and $pacing Options
3tion Code Function
.aeling .& Sets the laeling for descripti%e statistics to print
the %ariale lael 6.&^A70 the %ariale name
6.&^'70 or the %ariale numer 6.&^C7"
Column Width CW Sets the minimum width of the columns 6in inches7"
Column Spacing CS Sets the spacing 6in inches7 etween the columns"
@ecimal Places @P Sets the numer of decimal digits that will e
shown"
F0C:3R Co((and
8actor analysis is similar to principal components analysis" !t is another way of
e9amining the relationships etween %ariales" 8actor analysis differs from principal
components in that there are usually fewer factors than %ariales" >p to 200 %ariales
may e included"
StatPac contains two different methods for e9tracting factors from a set of %ariales5
%arima9 and powered-%ector" &oth methods e9tract factors that are independent
6orthogonal7 from other factors" 4his is ,nown as a simple structure analysis" 4he
program also contains an option to impro%e the simple structure y allowing the
factors to e correlated with each other" When factors are correlated0 it is ,nown as
an oli;ue reference structure analysis"
StatPac For Windows User's Manual 0d,anced 0nalyses 1)'
4he synta9 to run a factor analysis is5
8#C4:$ [?ariale list\
8# [?ariale list\ 6'ote5 8#C4:$ may e are%iated as 8#7
8actor analysis is essentially a way of e9amining the correlation matri9" While oth
techni;ues 6%arima9 and powered-%ector7 are ;uite different from each other in
methodology0 they ha%e the same first step0 which is to decide what %alues are to e
used for the communality estimates" 8or each %ariale0 the communality is defined as
the sum of the s;uares of all the factor loadings for that %ariale" # factor loading
itself can e thought of as the correlation of a %ariale with the factor" 4he
communalities are placed on the diagonal of the correlation matri9"
Initial Communality &stimates for te Diagonal
4here are three commonly used communalities5 units0 asolute row ma9imums and
s;uared multiple correlation coefficients" >nits is proaly the most commonly used
since it is always a %alue of one" 4hat is0 the %alue of one is placed on the diagonal of
the correlation matri9" 4he highest asolute row ma9imums refers to the highest
asolute correlation coefficient in each row" 4he s;uared multiple correlation
coefficients refers to the correlation of each %ariale with the remainder of the
%ariales" 4hat is0 the diagonal %ariale is regressed against all other %ariales0 and
the coefficient of multiple correlation is placed on the diagonal"
Jou can select the initial diagonal %alues y setting the @! option to one of three
%alues5
1 ^ >se units0 6i"e"0 17
2 ^ >se highest asolute row correlation
3 ^ >se s;uared multiple correlation coefficient
Type of $olution
4here are two different techni;ues to e9tract factors" 4he %arima9 solution 64J^?7
is most commonly used" 4he first step with the %arima9 techni;ue is ,nown as
Oprincipal factor analysisO" !t is the same as a principal components analysis e9cept
that the e9traction of principals is stopped y some predetermined criterion" When a
sufficient numer of principals has een e9tracted0 a rotational techni;ue called
O%arima9O is used to create the simple structure factor loadings"
4he powered-%ector techni;ue 64J^P7 uses an entirely different approach" 4his
approach is faster than the %arima9 techni;ue ecause it does not re;uire a principal
components analysis first" !nstead0 it uses a cluster techni;ue to e9tract factors
directly from the correlation matri9" #n additional techni;ue called Oweighted cross-
factorO rotation is often used with the powered-%ector solution to pro%ide a cleaner
separation among the factors"
1!> 0d,anced 0nalyses StatPac For Windows User's Manual
&'ample of a Factor 4nalysis Printout
Descriptive $tatistics
:ccasionally0 you may e interested in the means and %ariance for each of the
%ariales in the analysis" @escripti%e statistics may e printed or e9cluded from the
output y using the options @S^J and @S^'0 respecti%ely"
&'ample of a Descriptive $tatistics Printout
$imple Correlation %atri'
!t is often desirale to print the simple correlation matri9 when performing a factor
analysis 6SC^J7" !t can pro%ide a good initial understanding of the interrelationships
in the data"
StatPac For Windows User's Manual 0d,anced 0nalyses 1!1
&'ample of a $imple Correlation %atri' Printout
Principal Components 4nalysis
4he results of the principal components analysis may e printed 6PC^J7 or not
6PC^'7" 4his option only refers to printing the output" 4he remaining principal
components options must e set appropriately regardless of the PC setting"
Cross:Factor Rotation
Cross-factor rotation is often used in conHunction with the powered-%ector techni;ue
to impro%e upon the simple structure" !t usually pro%ides a OcleanerO structure0 that
is0 a clearer separation of the factors" Select cross-factor rotation with the option
C$^J"
Obli=ue $imple $tructure Factor Loadings
#fter performing either a %arima9 or powered-%ector solution0 you may want to
perform an oli;ue rotation" &oth the %arima9 and powered-%ector solutions ma,e an
aritrary assumption that factors are uni;ue and independent of one another" 4he
oli;ue rotation remo%es this restriction and allows factors to e correlated with each
other" 4he oli;ue simple structure factor loadings may e printed 6:S^J7 or
e9cluded 6:S^'7"
4he oli;ue rotation is often used to test the uni;ueness of factors" !f the resulting
factors ha%e low intercorrelations after an oli;ue rotation0 it is fairly certain that the
factors are orthogonal 6independent of each other7"
1!& 0d,anced 0nalyses StatPac For Windows User's Manual
&'ample of Obli=ue $imple $tructure Factor Loadings
Obli=ue Factor Correlation %atri'
4he correlation matri9 of the factors can e printed 6:C^J7 or e9cluded 6:C^'7" !t
represents relationships etween factors after the oli;ue rotation" !f the correlations
are low 6less than "370 we can e confident that the %arima9 or powered-%ector
solution produced uni;ue and unrelated factors"
&'ample of an Obli=ue Correlation %atri' Printout
Number of Factors
When the A*^10 StatPac will e9tract '8 factors from the data" 4his is often used to
test a specific hypothesis that has een de%eloped" 8or e9ample0 you might elie%e
that twenty items on a sur%ey are really measuring only two maHor factors" Jou could
test this hypothesis y using the option5
:P4!:'S A*^1 '8^2
!n this case0 only two components would e e9tracted" 4hey could then e e9amined
as to how well they Ohang togetherO" 4he only time you use the '8 option is to test a
specific hypothesis"
Percent of Total Variance to &'plain
When the A*^20 StatPac will continue to e9tract factors until it has accounted for P$
proportion of the %ariance"
8or e9ample0 to use the powered-%ector techni;ue and e9tract factors until 92 percent
of the %ariance has een accounted for0 enter the option5
:P4!:'S A*^2 P$^92
StatPac For Windows User's Manual 0d,anced 0nalyses 1!1
%inimum Variance Proportion for Principal Inclusion
When A*^30 StatPac will continue to e9tract components until the ne9t component
would not account for a minimum proportion of the total %ariance"
8or e9ample0 if you set 1P^20 the program will e9tract all the components that
account for at least fi%e percent of the total %ariance" #ny component that does not
account for fi%e percent of the %ariance will not e included in the analysis"
Varima' Rotational Factor 4ngle
4he %arima9 rotational techni;ue is one of the etter factoring methods" !t usually
pro%ides a clearer separation of factors than other methods" 4he techni;ue e9tracts
factors using normaliBed factor loadings during the iterations" 4hese factors are
assumed to e uni;ue 6orthogonal7 and not correlated with each other" 4he techni;ue
attempts to ma9imiBe the %ariance of the s;uared loadings for each factor" # factor
loading itself can e thought of as the correlation of a %ariale with the factor"
>sing this method0 the angle of rotation is calculated in each iteration" When the
angle is less than the %arima9 rotational factor angle 6$870 the process is completed"
!n other words0 each iteration is a rotation in an attempt to impro%e the simple
structure" When the rotational angle is less than the %alue of $80 the e9it criteria has
een achie%ed" 4he most often used %alue is one degree" 4he $8 option can e used
to set the angle to any %alue" 8or e9ample0 the following options command sets the
e9it criteria to one and a half degrees5
:P4!:'S $8^1"2
Convergence Tolerance for Principal Components
4he con%ergence tolerance is the way that the OresolutionO of the components is
controlled" !n other words0 it determines the point at which the program decides it
has finished e9tracting a component" Setting the con%ergence tolerance too low will
result in a %ery large numer of calculations and0 in the worst case0 may cause the
program to e9ceed the limit on the numer of iterations" Setting the %alue too high
would cause the program to prematurely elie%e it had e9tracted a component" #
good starting %alue for the con%ergence tolerance is 4.^"000001"
Convergence Tolerance for Obli=ue Rotation
Aach iteration in the oli;ue rotation impro%es the simple structure y successi%ely
decreasing amounts" 4he con%ergence tolerance 6:47 places a limit on the
con%ergence process0 and is used as the e9it criteria for oli;ue rotation" 4he
iterations will continue until additional rotations do not impro%e the simple structure
y more than the con%ergence tolerance %alue" While the con%ergence tolerance
could e any numer greater than Bero0 a typical %alue might e "000001" 4he
options command to set this %alue is5
:P4!:'S :4^"000001
1!) 0d,anced 0nalyses StatPac For Windows User's Manual
Iteration Limit
4he ma9imum numer of iterations for any of the factoring algorithms is included to
limit the time that the computer could e wor,ing on the prolem" Con%ergence
usually occurs in fewer than ten iterationsW howe%er0 as the con%ergence tolerance is
set to lower %alues0 it will re;uire more iterations to achie%e a solution" Fenerally0
the ma9imum numer of iterations is set to 100 6!4^1007" 4his seems to allow most
solutions0 and at the same time0 pre%ents unreasonale calculation times"
$ave $cores
$esearchers often want to create factor scores for respondents" 4his pro%ides an
indication of how strongly an indi%idual loads on each factor" 4he data is first
standardiBed and the factor loadings are used as coefficients for calculating the factor
scores" !t should e noted that the loadings will e those of last rotation re;uested
with the other options" 4hus0 if an oli;ue rotation was re;uested 6i"e"0 the last
rotation to e performed7 the sa%ed scores will e those otained from the oli;ue
rotation"
Jou can sa%e the factor scores with the options command SS^J" #t the completion
of the analysis0 you will e gi%en the opportunity to merge the sa%ed scores with the
original data file"
%ean $ubstitution
1issing data can ecome a prolem when there are few cases" !n the worst case0
missing data may ma,e it impossile to perform an analysis" 1ean sustitution is
one method often used to comat the prolem of missing data" When mean
sustitution is used 61S^J70 any data that is missing is replaced with the mean of
the %ariale"
Labeling and $pacing Options
3tion Code Function
.aeling .& Sets the laeling for descripti%e statistics to print
the %ariale lael 6.&^A70 the %ariale name
6.&^'70 or the %ariale numer 6.&^C7"
Column Width CW Sets the minimum width of the columns 6in inches7"
Column Spacing CS Sets the spacing 6in inches7 etween the columns"
@ecimal Places @P Sets the numer of decimal digits that will e
shown"
C.US:+R Co((and
4he oHecti%e of cluster analysis is to separate the oser%ations into different groups
6clusters7 so that the memers of any one group differ from one another as little as
possile0 whereas oser%ations across clusters tend to e dissimilar" 4he grouping
can e used to summariBe the data or as a asis for further analysis" !n discriminant
analysis0 the groups are already defined0 whereas in cluster analysis the purpose is to
define the groups"
StatPac For Windows User's Manual 0d,anced 0nalyses 1!!
4he synta9 of the command to run cluster analysis is5
C.>S4A$ [?ariale list\
#s an e9ample0 a researcher studying iris flowers wanted to ,now if the iris would
group into types ased on length and width of their sepals and petals" 4he four
clustering %ariales are5
?1 SAP#. .A'F4< length of sepal
?2 SAP#. W!@4< width of sepal
?3 PA4#. .A'F4< length of petal
?3 PA4#. W!@4< width of petal
4he command to run cluster analysis could e specified in se%eral ways5
C.>S4A$ SAP#. .A'F4<0 SAP#. W!@4<0
PA4#. .A'F4<0 PA4#. W!@4<
C.>S4A$ ?1 ?2 ?3 ?3
C.>S4A$ ?1-?3
C. ?1-?3 6'ote5 C.>S4A$ can e are%iated as C.7
!n the first e9ample0 a continuation line was used to e9tend the %ariale list" 4he
%ariale list can consist of %ariale laels andMor %ariale numers" Aither a comma
or a space can e used to separate the %ariales from each other"
C.>S4A$ pro%ides two types of cluster analysis5 agglomerati%e hierarchical cluster
analysis and non-hierarchical cluster analysis" 8or hierarchical methods0 the general
procedure is as follows5
1" &egin with as many clusters as there are oser%ations 6i"e"0 each cluster consists of
e9actly one oser%ation7"
2" Search for the most similar pair of clusters" 4his in%ol%es e%aluating a criterion
6distance7 function for each possile pair of clusters and choosing the pair of clusters
for which the %alue of the criterion function is the smallest" 4he criterion function is
constructed using the clustering %arialesW the actual formula for the criterion
function depends on the clustering algorithm used" .ael the chosen clusters as p and
;"
3" $educe the numer of clusters y one through the merger of clusters p and ;W the
new cluster is laeled ;"
3" Perform steps 2 and 3 until all the oser%ations are in one cluster" #t each stage0
the identity of the merged clusters as well as the %alue of the criterion function is
stored"
'on-hierarchical clustering methods egin with the numer of clusters gi%en" 4heir
primary use is to refine the clusters otained y hierarchical methods" 4he non-
hierarchical cluster analysis methods used y StatPac are con%ergent E-means
methods and generally follow the following se;uence of steps5
1" &egin with an initial partition of data units into clusters" 4here are se%eral different
initial partitions a%ailale in StatPac"
1!* 0d,anced 0nalyses StatPac For Windows User's Manual
2" 4a,e each data unit in se;uence and compute the distances to all cluster centroidsW
if the nearest centroid is not that of the data unitDs current cluster0 then reassign the
data unit and update the centroids of the losing and gaining clusters"
3" $epeat step 2 until con%ergence is achie%edW that is0 continue until a full cycle
through the data set fails to cause any changes in cluster memership"
Cluster analysis performed on small data sets 6a few hundred cases7 will run
relati%ely fast" <owe%er0 the time to run the analysis increases e9ponentially with the
numer of cases in the data file" When thousands of cases are in%ol%ed0 it may ta,e
se%eral hours to complete the analysis" 4herefore0 during preliminary analyses on
large data sets0 it may e desirale to use a SA.AC4 statement to limit the numer
records eing analyBed"
Type Of Clustering 4lgoritm
4here are si9 different clustering algorithms a%ailale in StatPac" 4he 4J option is
used to select the clustering method" #lgorithms 1-3 are agglomerati%e hierarchical
clustering algorithms while algorithms 3-- are non-hierarchical clustering
algorithms" Aach of the si9 algorithms are descried elow5
1inimum a%erage sum of s;uares cluster analysis 4J^1
With this algorithm0 the clusters merged at each stage are chosen so as to minimiBe
the a%erage contriution to the error sum of s;uares for each memer in the cluster"
4his ;uantity is also the %ariance in each cluster and is similar to a%erage lin,age in
that it tends to produce clusters of appro9imately e;ual %ariance" Conse;uently0 if the
clusters are all of appro9imately the same density0 then there will e a tendency for
large natural groups to appear as se%eral smaller clusters0 or for small natural groups
to merge into larger clusters"
WardDs method 4J^2
#t each stage0 this method minimiBes the within-cluster sum of s;uares o%er all
partitions due to the merger of clusters p and ;" 4his method tends to Hoin clusters
with a small numer of oser%ations and is iased towards producing clusters with
roughly the same numer of oser%ations"
Centroid method 4J^3
4his method minimiBes the s;uared Auclidian distance etween clusters at each
stage" 4he centroid method is not as sensiti%e to the presence of outliers0 ut does not
perform as well as the first two methods if there are no outliers"
!f there are no outliers0 one of the first two methods should e used" 4he first method
performs etter than WardDs method under certain types of errors 61illigan0 19(07"
4he three non-hierarchical clustering algorithms are all ased on the con%ergent E-
means method 6#ndererg0 19)37 and differ only in terms of their starting %alues"
Con%ergent E-means using minimum a%erage sum of s;uares centroids 4J^3
4his algorithm first runs the minimum a%erage sum of s;uares hierarchical cluster
analysis method and uses the centroids from this method as input to the con%ergent
E-means procedure" 4he distance measure used to allocate an oser%ation to a
cluster in the con%ergent E-means procedure is the Auclidian distance otained from
the clustering %ariales for that oser%ation"
Con%ergent E-means using Ward method centroids 4J^2
4his algorithm first runs the Ward hierarchical cluster analysis method and uses the
centroids from this method as input to the con%ergent E-means procedure" 4he
distance measure used to allocate an oser%ation to a cluster in the con%ergent E-
StatPac For Windows User's Manual 0d,anced 0nalyses 1!-
means procedure is the Auclidian distance otained from the clustering %ariales for
that oser%ation"
Con%ergent E-means using centroids from the centroid method 4J^-
4his algorithm first runs the centroid hierarchical cluster analysis method and uses
the centroids from this method as input to the con%ergent E-means procedure" 4he
distance measure used to allocate an oser%ation to a cluster in the con%ergent E-
means procedure is the Auclidian distance otained from the clustering %ariales for
that oser%ation"
'on-hierarchical methods generally perform etter than hierarchical methods if non-
random starting clusters are used" When random starting clusters are used 6for
e9ample0 the first p oser%ations are used as centroids for the p starting clusters70 the
non-hierarchical clustering methods perform rather poorly" 4he random start methods
were0 therefore0 not implemented in StatPac" E-means procedures appear more
roust than any hierarchical methods with respect to the presence of outliers0 error
perturations of distance measures and choice of distance metric" <owe%er0 non-
hierarchical methods re;uire the numer of clusters to e gi%en" 1any studies
recommend the following series of steps in running cluster analysis5
1" $un cluster analysis using one of the first two hierarchical cluster analysis
algorithms 6minimum a%erage sum of s;uares or Ward methods7"
2" $emo%e outliers from the data set" :utliers can e located y loo,ing at the
distance from the cluster centroids 6CC option70 or the hierarchical tree diagram 6one
oser%ation clusters that are late in merging with other clusters7" :utliers often
represent segments of the population that are under-represented and therefore0 should
not e discarded0 without e9amination"
3" @elete dormant clustering %ariales" 4hese can e located using the decomposition
of sum of s;uares 6@C option7"
3" @etermine the numer of clusters" 4his can e done using the criterion function
column in the decomposition of sum of s;uares 6@C option70 as well as the
hierarchical tree diagram 64@ option7"
2" :nce outliers are discarded0 dormant %ariales omitted and the numer of clusters
determined0 run one of the first two non-hierarchical methods 64J^3 or 27 se%eral
times0 %arying the numer of clusters"
Number of Clusters
!n the first cluster analysis run on a data set0 you should choose one of the first three
hierarchical clustering algorithms0 and set the numer of clusters e;ual to 99
6'C^997" 4his will print a hierarchical tree diagram and the decomposition of sum of
s;uares0 lea%ing the other options off 6i"e"0 4@^J0 @C^J0 CC^'0 C1^'7" 'ote that
the type of clustering option 64J7 should e 10 2 or 3 6one of the hierarchical
clustering algorithms7"
:nce you ha%e e9amined the hierarchical tree diagram and the decomposition of sum
of s;uares0 you would select the numer of clusters using the 'C option" Cluster
analysis is an e9ploratory techni;ue0 and you will proaly ha%e to rerun the cluster
analysis se%eral times0 %arying the numer of clusters as well as the clustering
algorithm and the set of clustering %ariales" !t is not uncommon to set the numer of
clusters to a few more than you suspect there are clusters0 in an attempt to disco%er
outliers" 'on-hierarchical clustering algorithms are more effecti%e in spotting
outliers y this method than their hierarchical counterparts"
1!; 0d,anced 0nalyses StatPac For Windows User's Manual
Descriptive $tatistics
@escripti%e statistics may e printed or suppressed using the @S^J or @S^' option0
respecti%ely"
&'ample of Descriptive $tatistics Printout
1ierarcical Tree Diagram
4he hierarchical tree diagram pro%ides the analyst with an effecti%e %isual
condensation of the clustering results" 4he hierarchical tree diagram is one of the
most commonly used methods of determining the numer of clusters" !t is also useful
in spotting outliers0 as these will appear as one-memer clusters that are Hoined later
in the clustering process"
4he numers at the top and ottom of the hierarchical tree diagram represent
e;ually-spaced %alues of the criterion function" !t gi%es a pictorial representation of
the criterion function information"
!f two or more clusters in a set of data are distinguished %ery well from each other0
all merges ut the last few 6where OtrueO clusters are Hoined7 will e clumped to the
left of the tree diagram ecause of the e9treme dissimilarity of the OtrueO clusters
6i"e"0 most of the criterion function is accounted for y these clusters7" 4o etter
understand the internal structure of these OtrueO clusters0 it may e necessary to rerun
cluster analysis separately on each of these OtrueO clusters"
StatPac For Windows User's Manual 0d,anced 0nalyses 1!'
&'ample of a 1ierarcical Tree Diagram
Cluster Centroids
4he cluster centroids are simply the means of each clustering %ariale for each
cluster" 4he cluster centroids are proaly the most useful multi%ariate
characteriBation of the clusters"
&'ample of a Cluster Centroids Printout
Decomposition of $um of $=uares
4his option comines two types of information5 criterion function information and
decomposition of sum of s;uares information"
4he criterion function is useful in determining the numer of clusters" !t is e9pressed0
at each clustering stage0 as a proportion of the %alue of the criterion function when
1*> 0d,anced 0nalyses StatPac For Windows User's Manual
all oser%ations are Hoined in one cluster 6the last stage in a hierarchical cluster
analysis7" 4he criterion function0 at a gi%en clustering stage0 is a measure of the
distance etween all oser%ations in all clusters" Conse;uently0 at the start 6when
there are as many clusters as oser%ations70 the %alue of the criterion function is Bero
6each cluster has Bero %ariance ecause it contains only 1 oser%ation7" #s clusters
are Hoined0 the %alue of the criterion function increases" 4he criterion function rises
slowly in the first stages0 as the most similar clusters are Hoined and there is %ery
little within cluster %ariaility" <owe%er0 as true distinct groups are Hoined0 the
within-cluster %ariaility increases and the criterion function rises sharply"
#s an e9ample0 suppose you are analyBing a data set with four clearly defined groups
6clusters7" 4he %alue of the criterion function should rise %ery slowly until you reach
three clusters0 in which case two OtrueO clusters are Hoined" 4his would e the clue as
to the numer of clusters 6i"e"0 the sharp rise in the criterion function when you reach
three clusters7"
# OrandomO %ariale 6%ariale not useful in separating clusters7 can ha%e a
detrimental effect in cluster analysis and should e eliminated" :ne way of
e%aluating the relationship etween a gi%en hierarchical classification0 and each of
the clustering %ariales0 is through the e9amination of the growth in une9plained sum
of s;uares0 as the clustering progresses through increasing le%els of aggregation"
#t the eginning of clustering0 each oser%ation is represented perfectly y the mean
%ector to which it elongs and there is no within cluster error" #t the highest le%el of
aggregation0 there is only one cluster and it contains e%ery oser%ation" 4he
proportion of une9plained sum of s;uares is0 therefore0 1"0" #t any stage etween
these two e9tremes0 within cluster error sum of s;uares is that portion of the total
%ariance une9plained y the current set of clusters"
4o locate OrandomO %ariales0 one compares the step y step growth in the proportion
of une9plained sum of s;uares for each clustering %ariale" 8or a few %ariales0 the
fractions may remain small up to the last few stages0 whereas0 for other %ariales0 the
fractions may get large at a fairly early stage" 4he former %ariales may e thought
of as eing dominant in the results0 while the latter are dormant" $epeating the
clustering with dormant %ariales eliminated should ha%e little effect on the results"
<owe%er0 deleting a dominant %ariale proaly will ha%e a mar,ed influence on the
clustering"
4his ,ind of analysis can e an especially useful de%ice for generating a
parsimonious set of %ariales0 to e used in suse;uent attempts to cluster the data" !t
should e noted that if the data set has %ery distinct clusters0 the une9plained sum of
s;uares will rise slowly0 e%en when a %ariale is dominant" !t is not until the siBe of
the clusters increases andMor OtrueO clusters are Hoined that the proportion of
une9plained sum of s;uares rises sharply"
!ndirectly0 the decomposition of sum of s;uares can also e used as an indicator of
the numer of true clusters" #s this option generates a line for each oser%ation0 the
numer of clustering %ariales OdecomposedO is restricted to what will fit on one
line" 4his option is only possile with hierarchical clustering algorithms 64J^10 20 or
37" 4he decomposition of sum of s;uares will remain the same0 regardless of the
numer of clusters chosen0 if you use the same data set and the same clustering
algorithm"
StatPac For Windows User's Manual 0d,anced 0nalyses 1*1
&'ample of 4 Decomposition of $um of $=uares Printout
Cluster %embersip and Distance to Cluster Centroids
4his option will list the memers of each cluster as well as the Auclidian distance of
each memer from its cluster centroid" 4his output pro%ides useful information on
how homogeneous the clusters are0 and pro%ides an aid in the detection of outliers"

1*& 0d,anced 0nalyses StatPac For Windows User's Manual
4n &'ample of a Cluster %embersip and Distance to
Centroids Printout
$tandardi3e Clustering Variables
StandardiBing the clustering %ariales consists of sutracting the %ariale mean0 and
di%iding y the %ariale standard de%iation" 4he data should e standardiBed if the
clustering %ariales are in widely different units 6age in years0 weight in ,ilograms0
height in centimeters0 etc"7 to a%oid gi%ing %ariales with higher %ariances more
weight in the clustering process" With the hierarchical clustering algorithms
especially0 standardiBing the clustering %ariales tends to reduce the effect of outliers
on the final clustering solution"
%ean $ubstitution
1ean sustitution is one method often used to reduce the prolem of missing
information" :ften0 cluster analysis is difficult ecause if one clustering %ariale is
not ,nown0 it is necessary to e9clude the whole record from the analysis" !t is
possile that this can sustantially reduce the numer of records that are included in
the analysis" 1ean sustitution o%ercomes this prolem y replacing any missing
clustering %ariale with the mean of that %ariale" While this techni;ue has the
possiility of slightly distorting the results0 it can ma,e it possile to perform a
cluster analysis with sustantial missing data" !f an oser%ation for which one or
more missing clustering %ariales was replaced y the mean shows up as an outlier0
then this oser%ation should e eliminated from future cluster analysis runs"
StatPac For Windows User's Manual 0d,anced 0nalyses 1*1
Iteration Limit
4he non-hierarchical methods re;uire that the ma9imum numer of iterations e
specified" 4he non-hierarchical clustering process will stop either when the
ma9imum numer of iterations has een reached0 or when an iteration has resulted in
no oser%ation eing mo%ed from one cluster to another" Since the non-hierarchical
clustering algorithms in StatPac start with hierarchical cluster centroids0 they will
rarely re;uire more than a few iterations" Setting the ma9imum numer of iterations
to ten should e sufficient in most cases" Should the iteration limit e reached0 the
iteration summary output should pro%ide guidance as to how much the iteration limit
should e increased"
$ave Cluster %embersip Variable
Cluster analysis is usually a first step for running other statistical techni;ues" 4he
ne9t step in the analysis often in%ol%es one of the following5
1" $un analysis within each of the clusters"
2" $un discriminant analysis on the clusters0 thus allowing one to get multi%ariate
statistics on the clusters as well as a plot of the first two canonical a9is"
4he S1 option allows you to sa%e the cluster memership %ariale for further
analysis of the clusters" #t the end of the analysis you will e gi%en the opportunity
to merge the cluster memership %ariale into the original data"
Labeling and $pacing Options
3tion Code Function
.aeling .& Sets the laeling for descripti%e statistics to print
the %ariale lael 6.&^A70 the %ariale name
6.&^'70 or the %ariale numer 6.&^C7"
Column Width CW Sets the minimum width of the columns 6in inches7"
Column Spacing CS Sets the spacing 6in inches7 etween the columns"
@ecimal Places @P Sets the numer of decimal digits that will e
shown"
$ISCRIMI707: Co((and
@iscriminant function analysis is a techni;ue for the multi%ariate study of group
differences" !t is similar to multiple regression in that oth in%ol%e a set of
independent %ariales and a dependent %ariale" !n multiple regression0 the
dependent %ariale is a continuous %ariale0 whereas in discriminant analysis0 the
dependent %ariale 6often called the grouping %ariale7 is categorical"
@iscriminant analysis can e seen as an e9tension of proit or logistic regression" !n
proit and logistic regression0 the dependent %ariale is numerically coded as 0 or 1W
in discriminant analysis the grouping %ariale may e numeric or alpha 6e"g"0 10 20 3
or #0 &0 C7" When there are only two groups0 many researchers use proit or logistic
regression and code the two groups as 0 and 1"
@iscriminant analysis is used to5
1" descrie0 summariBe and understand the differences etween groups"
1*) 0d,anced 0nalyses StatPac For Windows User's Manual
2" determine which set of independent %ariales est captures or characteriBes group
differences"
3" classify new suHects into groups or categories"
Canonical correlation analysis 6an option7 can e used to reduce the dimensionality
of the independent %ariales0 similar to principal components analysis" Canonical
analysis also ma,es it possile to determine how well the groups are separated0 using
two linear cominations of the independent %ariales in the discriminant e;uations"
4he synta9 of the command to run a stepwise discriminant analysis is5
@!SC$!1!'#'4 [@ependent %ariale\ [!ndependent %ariale list\
4he ma9imum numer of categories 6groups7 for the dependent %ariale is 23" >p to
200 independent %ariales may e specified"
#s an e9ample0 a researcher studying three types of iris flowers wanted to ,now if
the type of iris could e determined from the length and width of their sepals and
petals" 4he !$!S 4JPA %ariale 6?17 is coded 1^Setosa0 2^?eriscol and 3^?irginic"
'ote that this is a categorical %arialeW an iris is one type or another 6we normally
wonDt ha%e a mi9ed reed iris7"
We also ha%e four independent %ariales5 SAP#. .A'F4< 6?27 is the length of
sepal0 SAP#. W!@4< 6?37 is the width of sepal0 PA4#. .A'F4< 6?37 is the
length of petal0 and PA4#. W!@4< 6?27 is the width of petal"
4he command to run the discriminant analysis could e specified in se%eral different
ways5
@!SC$!1!'#'4 !$!S 4JPA0 SAP#. .A'F4<0 SAP#. W!@4<0
PA4#. .A'F4<0 PA4#. W!@4<
@!SC$!1!'#'4 ?1 ?2 ?3 ?3 ?2
@!SC$!1!'#'4 !$!S 4JPA ?2-?2
@! ?1-?2 6'ote5 @!SC$!1!'#'4 can e are%iated as @!7
!n each e9ample0 the dependent %ariale 6!$!S 4JPA7 was specified first0 followed
y the independent %ariale list" 4he %ariale list itself can consist of %ariale laels
andMor %ariale numers" Aither a comma or a space can e used to separate the
%ariales from each other"
4he dependent %ariale may e alpha or numeric" !f it is numeric0 it must e coded 1
through 23" !f it is alpha0 it must e coded #0 &0 C0 etc" !f the study design does not
contain %alue codes and laels for the dependent %ariale0 the program will use the
data itself to determine the %alue codes"
# discriminant function e;uation is used to otain the posterior proaility that an
oser%ation came from each of the groups" #n oser%ation is0 therefore0 classified0
y the discriminant analysis0 into the group with the highest posterior proaility as
estimated ao%e"
Descriptive $tatistics
4he mean and standard de%iations for all the independent %ariales can e printed
with the descripti%e statistics option 6@S^J7" 4he output contains the means and
StatPac For Windows User's Manual 0d,anced 0nalyses 1*!
standard de%iations for each of the independent %ariales" When @S^C0 the output
will contain descripti%e statistic controlled for each of the dependent %ariale groups"
&'ample of a Descriptive $tatistics Printout
$imple Correlation %atri'
4he within group correlation matri9 is otained y pooling the correlation matri9
from each of the groups 6SC^J7" !f two %ariales are highly correlated0 it is possile
that the matrices are not well conditioned0 and it might e eneficial to run the
discriminant analysis again without one of the %ariales" !f Wil,sD lamda does not
show a significant increase0 you might want to lea%e the %ariale out of the
discriminant analysis"
&'ample of a -itin .roup Correlation %atri' Printout
.roup Discriminant Function Coefficients
4he group discriminant function 6classification7 coefficients can e printed with the
C: option 6C:^J7" 4he output includes a constant and a coefficient for each
independent %ariale0 for each %alue of the grouping %ariale" Aach coefficient
pro%ides an estimate of the effect of that %ariale 6in the units of the raw score7 for
classifying an oser%ation into each group"
1** 0d,anced 0nalyses StatPac For Windows User's Manual
&'ample of .roup Discriminant Function Coefficients
Printout
Classification %atri'
4he classification matri9 may e selected with the option C1^J" !t gi%es the
fre;uency distriution of the oser%ed group %ersus its predicted group0 ased on the
set of independent %ariales in the discriminant function" 4his option also calculates
the percent correctly classified in each group0 as well as o%er all groups" !f the group
is well predicted y the set of independent %ariales0 we e9pect to find most
oser%ations falling on the diagonal of this matri9 6i"e"0 oser%ations in group i
would e classified as elonging to group i7" 4he classification matri9 also pro%ides
%aluale insight into which groups are well separated and which groups are harder to
separate"
&'ample of a Classification %atri'
List Incorrectly Classified Cases
4his listing may e selected with the option !C^J" 8or each case that was incorrectly
classified0 this option gi%es the case numer0 the group that case came from as well
as the predicted group ased on the independent %ariales in the discriminant
function" 4his listing can e used to chec, for errors in one or more of the
independent %ariales"
StatPac For Windows User's Manual 0d,anced 0nalyses 1*-
&'ample of Incorrectly Classified Cases Listing
Print &ac $tep
Jou can print the statistics for each step using the option PS^J" 4his may e
important when you want to study how the inclusion or deletion of a %ariale affects
other %ariales"
Wil,sD lamda is the ratio of the determinants of the within groups cross-product to
total cross-product matrices" !t has %alues etween 0 and 1" Wil,sD lamda is similar
to the coefficient of multiple determination 6r-s;uared7 in multiple regression0 e9cept
that it mo%es in the opposite direction" Where r-s;uared gets larger as the e;uation
impro%es0 Wil,sD lamda gets smaller as the e;uation impro%es" 4hus0 Wil,sD lamda
could e interpreted as the proportion of %ariance in the dependent %ariale that is
not e9plained y the discriminant function model" .arge %alues of Wil,sD lamda
indicate that the independent %ariales in the e;uation are not doing a good Ho of
predicting the dependent %ariale group" Small %alues of Wil,sD lamda indicate
good separation etween 6at least some7 groups"
4he o%erall 8-ratio measures whether the %ariales in the e;uation are useful in
classifying cases" 4ypically0 a proaility of "02 or less leads us to reHect the
hypothesis that the discriminant function does not impro%e our aility to classify
cases" 4he 8-to-enter %alue for any %ariale not in the e;uation tests whether adding
this %ariale in the e;uation would lead to a significant decrease in Wil,sD lamda0
while the 8-to-remo%e %alue for any %ariale in the e;uation tests whether this
%ariale would lead to a significant increase in Wil,sD lamda" 4hese %alues are used
to determine the independent %ariale to enter or delete in the ne9t step"
&'ample of te Print &ac $tep Output
1*; 0d,anced 0nalyses StatPac For Windows User's Manual
$ummary Table
# good way to get an o%er%iew of how the steps proceeded0 and what effect each
step had upon Wil,sD lamda0 is to print the summary tale" 4o print the summary
tale0 use the option S4^J"
&'ample of a $ummary Table
Canonical Variable 4nalysis
Canonical analysis can e used to reduce the dimensionality of the independent
%ariales0 and is similar to principal components"
4he first canonical %ariale is the linear comination of independent %ariales that
est summariBes the differences among the groups" 4he second canonical %ariale is
the ne9t est linear comination orthogonal to the first one0 and so on" Jou can print
the canonical %ariale analysis y entering the option C?^J" 4his option pro%ides
two tales"
4he first tale is a summary of the eigen%alues associated with each canonical
%ariale0 as well as the proportion of the Oetween-group %ariailityO accounted for
y each canonical %ariale"
&'ample of a Canonical Variable $ummary Table
4he second tale gi%es the coefficients of the canonical %ariales" 4his is similar to
the eigen%alue print-out in principal components" 4he numer of canonical %ariales
reported is the lesser of 6the numer of groups minus 17 and the numer of %ariales
entered in the discriminant function"
StatPac For Windows User's Manual 0d,anced 0nalyses 1*'
&'ample of a Canonical Variable Coefficients Table
Canonical Variables &valuated at .roup %eans
Jou can select to print a tale of the canonical %ariales0 e%aluated at the group
means using the option F1^J"
&'ample of Canonical Variables &valuated at .roup %eans
Printout
$ave Canonical Pair
$esearchers often want to sa%e the first two canonical %ariales for future analysis"
Jou can sa%e them with the options command SP^J" #t the completion of the
analysis0 you will e gi%en the opportunity to merge the canonical %ariale pair and
predicted group into the original data"
Prior Probabilities
Prior proailities are the initial %alues that will e placed on the diagonal of the
matri9" Prior proailities may e set to e;ual 6PP^A70 automatic 6PP^#70 or
indi%idual proailities may e specified"
When PP^A0 the %alues for the prior proailities will e e;ual to one di%ided y the
numer of categories 6so each category has an e;ual prior proaility7"
Setting the prior proailities option to automatic 6PP^#7 will assign prior
proailities to each category0 ased on the fre;uency of that category" 4he sum of
the prior proailities will e one"
4he other method of setting the prior proailities is to e9plicitly specify them"
When this method is used0 a prior proaility must e assigned to each category"
4hey do not need to sum to one" 4he following option would assign prior
proailities to three alpha categories" 'ote that commas are used to separate them
from each other"
:P4!:'S PP^6#^3"20 &^3")0 C^2"97
1-> 0d,anced 0nalyses StatPac For Windows User's Manual
Number of Variables to Force
4he aility to force %ariales into an e;uation is important for se%eral reasons5
1" # researcher often wishes to replicate the analysis of another study and0 therefore0
to force certain core %ariales into the e;uation0 letting stepwise discriminant
analysis choose from the remaining set"
2" Some %ariales may e cheaper or easier to measure0 and the user may want to see
whether the remaining %ariales add anything to the e;uation"
3" When independent %ariales are highly correlated0 one of them may e more
accurate than the rest0 and you may want to force this %ariale in the e;uation"
4he synta9 for the numer of %ariales to force in is 8:^n0 where n is the numer of
%ariales to force" 8or e9ample0 8:^3 will force the first 3 %ariales from the
independent %ariale list into the e;uation" #n option such as 8:^200 may e used
to perform a non-stepwise analysis 6all %ariales will e included in the analysis7"
Category Creation
4he actual categories 6dependent %ariale groups7 can e created either from the
study design %alue laels 6CC^.7 or from the data itself 6CC^@7" When the
categories are created from the laels0 the %alue laels themsel%es will e used to
define the dependent %ariale groups" #ny data that does not match up with a %alue
lael 6e"g"0 mis,eyed data7 will e counted as missing" When categories are created
from the data0 all data will e considered %alid0 whether or not there is a %alue lael
for it"
F to &nter 2 F to Remove
When faced with a large numer of possile e9planatory %ariales0 two opposed
criteria of selecting %ariales for a discriminant analysis are usually in%ol%ed5
1" 4o ma,e the e;uation useful for classification purposes0 we would li,e our model
to include as many of the independent %ariales as possile so that reliale group
classification can e determined"
2" &ecause of the costs in%ol%ed in otaining information on a large numer of
independent %ariales0 we would li,e the e;uation to include as few of the
independent %ariales as possile"
4he compromise etween these two e9tremes is generally called Oselecting the est
set of independent %arialesO" 4his in%ol%es multiple e9ecution of discriminant
analysis0 in an attempt to add %ariales to impro%e classification or remo%e %ariales
to simplify the classification e;uations" Stepwise discriminant analysis pro%ides a
partial automation of this procedure"
#n important property of the stepwise procedure is ased on the fact that a %ariale
may e indicated to e significant in an early stage and0 thus0 e entered in the
e;uation" #fter se%eral other %ariales are added to the e;uation0 howe%er0 the initial
%ariale may e indicated to e insignificant 6redundant70 and thus remo%ed from the
model" 4his method is often referred to as forward inclusion with ac,ward
elimination"
4he algorithm used y StatPac is as follows5
1" 8irst0 enter into the discriminant analysis all %ariales which the user wishes to
force into the e;uation"
StatPac For Windows User's Manual 0d,anced 0nalyses 1-1
2" Anter the predictor that produces the greatest decrease in Wil,sD lamda from all
the remaining predictors whose entry is not inhiited y the 8-to-enter"
3" $emo%e the predictor that ma,es the least increase in Wil,sD lamda from all 6non-
forced7 predictors whose remo%al is not inhiited y the 8-to-remo%e"
'ote that step 2 is e9ecuted only when it is not possile to e9ecute step 3" !f neither
can e e9ecuted0 the stepping is complete"
4he following should e considered when setting 8-to-enter and 8- to-remo%e %alues
in the parameter tale5
1" # %ariale is remo%ed if the 8-%alue associated with that %ariale is less than the
8-to-remo%e %alue set in the parameter tale" Similarly0 a %ariale is added if the 8-
%alue associated with that %ariale would e greater than the 8-to-enter %alue set in
the parameter tale0 if that %ariale were entered in the current e;uation"
2" Care should e ta,en to ensure that the 8-to-remo%e e less than the 8-to-enterW
otherwise0 a %ariale would e entered and then remo%ed at alternate steps"
3" 4he default %alues for the 8-to-enter and 8-to-remo%e for many mainframe
pac,ages0 and StatPac0 are 3"0 and 3"90 respecti%ely0 which pro%ide useful starting
%alues"
3" Setting the 8-to-remo%e %alue low yields the forward inclusion method"
2" 8or the first run on a data set0 it is common to set the 8-to-enter and 8-to-remo%e
%alues low0 to e9ecute a large numer of steps"
$teps Limit
4he steps limit is the ma9imum numer of steps that can occur" Aach inclusion and
deletion of a %ariale is counted as one step" 4he purpose of the steps limit option is
to limit computer time" 4he synta9 for the steps limit option is S.^n0 where n is the
ma9imum numer of steps allowed"
%ean $ubstitution
1ean sustitution is one method often used to reduce the prolem of missing
information" :ften0 discriminant analysis is difficult ecause if one independent
%ariale is not ,nown0 it is necessary to e9clude the whole record from the analysis"
!t is possile that this can sustantially reduce the numer of records that are
included in the analysis" 1ean sustitution o%ercomes this prolem y replacing any
missing independent %ariale with the mean of that %ariale" While this techni;ue
has the possiility of slightly distorting the results0 it can ma,e it possile to perform
a discriminant analysis with sustantial missing data" !f the %alue of the dependent
6grouping7 %ariale is missing0 the whole record is deleted from the analysis"
Predict Interactively
#fter performing a discriminant analysis0 you may want the posterior proailities
associated with each group0 for a new oser%ation0 or an oser%ation in your data for
which the %alue of the dependent %ariale was missing" 4his is ,nown as interacti%e
prediction"
Jou can select interacti%e prediction y entering the option P$^J" #t the end of the
analysis you will then e prompted to enter a %alue for each independent %ariale0
and the computer will use the discriminant function coefficients to estimate the
posterior proailities associated with each group" 4he oser%ation is then assigned
to the group with the highest posterior proaility" Jou can s,ip o%er any
independent %ariale y Hust pressing [enter\W the %alue of the group mean for that
independent %ariale will e used"
1-& 0d,anced 0nalyses StatPac For Windows User's Manual
07380 Co((and
4he analysis of %ariance procedure pro%ides a systematic way of studying %ariaility"
>sually0 we are interested in how much of the %ariaility of scores on the dependent
%ariale can e e9plained y the differences etween scores 6le%els7 on the
e9perimental %ariales 6factors7" StatPac may contain up to three factors and up to 90
le%els for each factor"
Type of Design
StatPac Fold contains ele%en different #':?# designs 6or models7" Choosing the
appropriate design for a particular e9periment re;uires careful e%aluation" !t is ;uite
possile to perform an inappropriate statistical procedure y choosing the wrong
model" Since StatPac has no way of ,nowing that the model is wrong0 it will produce
erroneous results" 4he following types of models are a%ailale5
1" :ne 8actor Completely $andomiBed @esign
2" $andomiBed Complete &loc, @esign
3" $andomiBed Complete &loc, @esign With Sampling
3" 4wo 8actor 8actorial in Completely $andomiBed @esign
2" 4wo 8actor 8actorial in $andomiBed Complete &loc, @esign
-" 4hree 8actor 8actorial in Completely $andomiBed @esign
)" 4hree 8actor 'ested @esign
(" Split-Plot With Completely $andomiBed @esign of 1ain Plots
9" Split-Plot With $andomiBed Complete &loc, @esign of 1ain Plot
10" Split-Plot With Su->nits #rranged in Strips
11" .atin S;uare @esign
4he numer relating to the type of design has no intrinsic meaning in and of itself" !t
is simply a numer used to specify which model you want StatPac to use for the
analysis"
%issing Data in 4NOV4 Designs
1any analysis of %ariance e9perimental designs in%ol%e assigning an e;ual numer
of cases to each cell" When all cells do not contain the same numer of cases0 the
model is said to e OunalancedO" >nalanced designs usually occur ecause of
differential attrition 6e"g"0 some of the crop dies0 respondents ecome una%ailale or
refuse to participate0 recording errors0 etc"7"
StatPac uses an unweighted means solution when there is not an e;ual numer of
cases in each cell" 4his in%ol%es the use of the harmonic mean to adHust the sums of
s;uares" !f there is an e;ual numer of oser%ations in each cell0 the unweighted
means solution is e;ui%alent to the usual least s;uares approach" 4he unweighted
means solution re;uires at least one case in e%ery cell" 4here may not e any cells
where all the data is missing"
4he unweighted means approach is an appro9imation techni;ue and does not
produce e9act results when the design is unalanced" #lthough the 8 statistics may
not e e9act0 researchers ha%e found that the 8-ratios are acceptale unless the design
is highly unalanced" #s a measure of departure from a alanced design0 use the ratio
of 'iM'H0 where 'i is the greatest numer of oser%ations in any cell and 'H is the
minimum" # ratio of 351 is tolerale0 ut a ratio of 1-51 should not e accepted" !n
StatPac For Windows User's Manual 0d,anced 0nalyses 1-1
these cases0 an e9act solution can e otained y creating appropriate dummy
%ariales and performing a regression analysis" 8or a detailed discussion0 see @"F"
Fosslee and <"." .ucas 6&iometrics0 ?olume 210 p" 112-1337"
Command $ynta' and te Data File $tructure
4he synta9 for the #':?# command is similar for all ele%en different models" 4he
only difference is in the numer of factors that are specified as part of the command"
4here are two general forms of the command5
#':?# 64ype7 [@ependent ?ariale\ 6[8act" 1\7 6[8act" 2\7 6[8act" 3\7
4his format is used when each record contains a single %alue for the dependent
%ariale" 4he type of design is specified first and must e enclosed in parentheses" !t
may e a numer etween one and ele%en" 4he dependent %ariale is specified ne9t"
8inally0 a %ariale is specified for each factor" Aach of these %ariales is also
enclosed in parentheses" !f a design only contains one 6or two7 factors0 only one 6or
two7 need e specified"
4he second form of the #':?# command is used when each record contains se%eral
%alues for the dependent %ariale 6one for each le%el of one of the factors7" !n this
case0 the dependent %ariale is not a single %ariale0 ut rather a %ariale list" Since
any one of the factors may e the dependent %ariale list0 the synta9 may ta,e on
three different forms5
#':?# 64ype7 6[8actor 1 %ar" list\7 6[8actor 2\7 6[8actor 3\7
#':?# 64ype7 6[8actor 1\7 6[8actor 2 %ar" list\7 6[8actor 3\7
#':?# 64ype7 6[8actor 1\7 6[8actor 2\7 6[8actor 3 %ar" list\7
Which form of the #':?# command you use depends upon how the data file is
arranged" 4he following three e9amples illustrate the different forms of the
command"
4he first e9ample is a completely randomiBed one-way design 64ype 17" 4here is
only one factor for this ,ind of model" #s stated ao%e0 there are two possile
formats for the command" 4hey are5
#':?# 617 [@ependent %ariale\ 6[8actor 1\7
#':?# 617 6[8actor 1 %ariale list\7
8or e9ample0 letDs say we are interested in studying the effect of training after one
hour0 two hours0 and three hours" 4here are two ways the data file might e
organiBed" !n the first format0 each record contains the score and the time of
measurement" !t would appear li,e this5
33 1 6record 1 - score at time 1 for case 17
33 2 6record 2 - score at time 2 for case 17
1-) 0d,anced 0nalyses StatPac For Windows User's Manual
22 3 6record 3 - score at time 3 for case 17
31 1 6record 3 - score at time 1 for case 27
22 2 6record 2 - score at time 2 for case 27
-3 3 6record - - score at time 3 for case 27
3) 1 6record ) - score at time 1 for case 37
29 2 6record ( - score at time 2 for case 37
-1 3 6record 9 - score at time 3 for case 37
!n this e9ample0 the dependent %ariale 6SC:$A7 is %ariale one and the factor
64!1A-PA$!:@7 is %ariale two" 4he %alues for %ariale two represent the le%els of
the %ariale 6i"e"0 what time the score was ta,en7" 4wo e9amples of the synta9 to run
a one-way #':?# using the ao%e data file would e5
#':?# 617 ?1 6?27
#':?# 617 SC:$A 64!1A-PA$!:@7
!n the other type of data file format0 each record contains the score for each hour of
training" With this format0 the ao%e data file would appear li,e this5
33 33 22 6rec 1 - score after each hour of training for case 17
31 22 -3 6rec 2 - score after each hour of training for case 27
3) 29 -1 6rec 3 - score after each hour of training for case 37
4his data file format differs from the pre%ious format0 ut the data is the same" 4he
dependent %ariale is no longer Hust held in a single %ariale" 4here is a dependent
%ariale for each le%el of the factor" ?ariale one is the score for time one 64!1A-170
%ariale two is the score for time two 64!1A-270 and %ariale three is the score for
time three 64!1A-37"
4hree e9amples of the synta9 to run a one-way analysis of %ariance for this type of
data file format are5
#' 617 6?1-?37 6'ote5 #':?# may e are%iated as #'7
#':?# 617 6?10?20?37
#':?# 617 64!1A-10 4!1A-20 4!1A-37
4he only difference etween the two data files is in the way in which they are coded"
4he actual data is the same in oth files0 and the results of the analysis of %ariance
will e identical"
4he second e9ample is two-way #':?# in a completely randomiBed design 64ype
37" # two-way analysis of %ariance is used to e9amine the effect that two independent
%ariales ha%e on the dependent %ariale" &ecause of the high cost of conducting
e9periments and the possiility of interaction effects0 researchers often use a two-
way design to get the most out of each e9periment"
8or e9ample0 letDs say we are studying the F$:W4< 6dependent %ariale7 of four
different hyrid SAA@S" We are also interested in whether any rand of
8A$4!.!LA$ wor,s etter than the others" !nstead of conducting two separate
StatPac For Windows User's Manual 0d,anced 0nalyses 1-!
e9periments0 we conduct only one and analyBe the results with a two-way #':?#"
4his has an added ad%antage ecause it will ta,e into account the interaction etween
fertiliBer and seed type"
4he first form of the command synta9 for the two-way #':?# is5
#':?# 637 [@ependent %ariale\ 6[8actor 1\7 6[8actor 2\7
Since there are two factors is this design0 the second form of the command could
specify either factor as the %ariale list5
#':?# 637 6[8actor 1 %ariale list\7 6[8actor 2\7
#':?# 637 6[8actor 1\7 6[8actor 2 %ariale list\7
'otice that the last two forms of the command are %ariations of the same synta9"
Since there are two factors0 they oth must e specified in the command synta9" 4he
actual synta9 depends upon the way the data file is structured"
4he first form of the command is used when there is a dependent %ariale and a
%ariale for each factor" # sample data file format for this e9perimental design might
loo, li,e this5
-) 1 # 6record 1 - yield this acre is -)
fertiliBer used is coded as 1
type of hyrid seed is coded as #7
23 2 # 6record 2 - yield this acre is 23
fertiliBer used is coded as 2
type of hyrid seed is coded as #7
3 # 6record 3 - yield this acre is missing - crop died
fertiliBer used is coded as 3
type of hyrid seed is coded as #7
22 1 & 6record 3 - yield this acre is 22
fertiliBer used is coded as 1
type of hyrid sees is coded as &7
-1 2 & 6record 2 - yield this acre is -1
fertiliBer used is coded as 2
type of hyrid seed is coded as &7
2) 3 & 6record - - yield this acre is 2)
fertiliBer used is coded as 3
type of hyrid seed is coded as &7
4wo commands to run a two-way #':?# with this data file are5
#':?# 637 ?1 6?27 6?37
#':?# 637 F$:W4< 68A$4!.!LA$7 6SAA@7
1-* 0d,anced 0nalyses StatPac For Windows User's Manual
4he data file could contain the same information formatted in another way" 8or
e9ample0 the following data file contains the same information as the pre%ious file
e9cept that the dependent %ariale 6F$:W4<7 is specified for each type of fertiliBer"
-) 23 # 6record 1 - growth for all 3 fertiliBers with seed type #7
22 -1 2) & 6record 2 - growth for all 3 fertiliBers with seed type &7
?ariale one is the growth for 8A$4!.!LA$-10 %ariale two is the growth for
8A$4!.!LA$-20 and %ariale three is the growth for 8A$4!.!LA$-3" ?ariale four
is the SAA@ type" 4hree commands to perform a two-way #':?# with this type of
data file format are5
#':?# 637 6?10 ?20 ?37 6?37
#':?# 637 6?1-?37 6?37
#':?# 637 68A$4!.LA$-10 8A$4!.!LA$-20 8A$4!.!LA$-37 6SAA@7
8or a final e9ample of data file formatting0 weDll loo, at a typical three-factor
factorial e9periment 64ype ^ -7" 4his model is similar to the pre%ious model e9cept
that three e9perimental factors are eing e9amined"
4here are now four possile data file formats corresponding to four forms of synta95
#':?# 6-7 [@ep" %ar"\ 6[8actor #\7 6[8actor &\7 6[8actor C\7
#':?# 6-7 6[8actor # %ariale list\7 6[8actor &\7 6[8actor C\7
#':?# 6-7 6[8actor #\7 6[8actor & %ariale list\7 6[8actor C\7
#':?# 6-7 6[8actor #\7 6[8actor &\7 6[8actor C %ariale list\7
# medical researcher was studying the pain-relie%ing properties of two different
drugs 6# and &7" !n addition to testing the drugs themsel%es0 she wanted to compare
high and low doses as well as the method of administration 6oral or intra%enously7"
4he dependent %ariale is a measure of pain $A.!A8 6on a scale of 0 to 970 factor #
is the @$>F type0 factor & is the @:SA and factor C is the 1A4<:@ of
administration"
!n the first data file format0 the dependent %ariale and each factor represent uni;ue
%ariales in the data file"
( # < : 6Pain relief ( - drug # - high dose - oral admin"7
- # . : 6Pain relief - - drug # - low dose - oral admin"7
9 # < ! 6Pain relief 9 - drug # - high dose - i%" admin"7
( # . ! 6Pain relief ( - drug # - low dose - i%" admin"7
2 & < : 6Pain relief 2 - drug & - high dose - oral admin"7
StatPac For Windows User's Manual 0d,anced 0nalyses 1--
3 & . : 6Pain relief 3 - drug & - low dose - oral admin"7
- & < ! 6Pain relief - - drug & - high dose - i%" admin"7
2 & . ! 6Pain relief 2 - drug & - low dose - i%" admin"7
4he commands to run the #':?# with this data file organiBation are5
#':?# 6-7 ?1 6?27 6?37 6?37
#':?# 6-7 $A.!A8 6@$>F7 6@:SA7 61A4<:@7
4he last three forms of the command are used when one of the factors is specified as
part of a %ariale list" 8or e9ample0 oth methods of administering the drug could e
contained in the same data record" 4he data file would appear li,e this5
# < ( 9 6@rug # - high dose - relief for oral = i% admin"7
# . - ( 6@rug # - low dose - relief for oral = i% admin"7
& < 2 - 6@rug & - high dose - relief for oral = i% admin"7
& . 3 2 6@rug & - low dose - relief for oral = i% admin"7
4he commands to run the #':?# with this data file format would e5
#':?# 6-7 6?17 6?27 6?30 ?37
#':?# 6-7 6@$>F7 6@:SA7 6:$#.0 !?7
!t is especially important to match the appropriate command synta9 with the format
of the data file" 4he %ersatility of StatPac to read se%eral different data file formats
ma,es it easy to analyBe most data sets" 4he est ad%ice is to plan the analysis efore
entering data"
Descriptive $tatistics
@escripti%e statistics for each cell may e printed or suppressed with the option
@S^J or @S^'0 respecti%ely" !n multi-factor e9periments it is often desirale to
print descripti%e statistics for each factor controlled for the other factors" 4o print
controlled descripti%e statistics0 use the option @S^C" 4he descripti%e statistics
printout will contain the count0 mean and uniased standard de%iation"
1-; 0d,anced 0nalyses StatPac For Windows User's Manual
&'ample of Descriptive $tatistics
4nova Table
4he #':?# tale is the heart of the analysis" 4he 8-test re%eals whether or not there
are significant differences etween the le%els of the e9perimental factor6s7" 4he
actual terms that appear in the #':?# tale depend on the type of design"
Fenerally0 e9periments in%ol%e assigning cases to groups on the asis of some
e9perimental condition and oser%ing the differences etween the groups on the
dependent %ariale" #s the differences etween the groups increase0 so will the 8-
ratio" 4he actual formula for a particular 8-test depends upon the #':?# design and
whether the factors are fi9ed or random"
# significant 8-ratio means that there is a significant difference etween the means
of the dependent %ariale for at least two groups" 8or e9ample0 in a completely
randomiBed two-factor factorial analysis 64ype ^ 370 there are three 8-ratios5 one for
the # factor0 one for the & factor and one for the #& interaction" 4heir interpretation
is as follows5
1" 4he 8-ratio for factor # tests whether the factor # %ariale has a significant effect
on the response of the dependent %ariale0 a%eraged o%er all le%els of the factor &
%ariale" # significance le%el less than "02 is generally considered significant"
2" 4he 8-ratio for factor & tests whether the factor & %ariale has a significant effect
on the response of the dependent %ariale0 a%eraged o%er all le%els of the factor #
%ariale"
3" 4he 8-ratio for interaction tests whether there is significant interaction etween the
factor # and factor & %ariales" !nteraction results from the failure of differences
StatPac For Windows User's Manual 0d,anced 0nalyses 1-'
etween responses at the different le%els of one of the %ariales to remain constant
o%er the different le%els of the other %ariale" !f the interaction term is significant0 the
8-test for factor # and & should e interpreted with care" 4he ne9t step is generally to
e9amine the means for all pairs of le%els of the two %ariales"
&'ample of an 4nova Table
Fi'ed and Random Factors
When conducting tests of significance in multi-factor designs0 you must specify
whether each of the factors is fi9ed or random" 4his will determine which of the
mean s;uares in the analysis of %ariance tale is used for the denominator of the 8-
ratio"
4he concept of whether a factor is fi9ed or random can e determined using the
following reasoning" #ssume a factor has a potential 6or population7 of P le%els
which may e ;uite large" 4he e9perimenter may group the P potential le%els into p
effecti%e le%els y either comining adHoining le%els or delierately selecting what
are considered to e representati%e le%els" While p is less than P0 the effecti%e le%els
still represent the entire potential 6or population7" Whene%er the selection of the p
le%els from the potential P le%els is determined y some systematic non-random
procedure0 the factor is fi9ed" !n the special case where the numer of le%els 6p7 of a
factor is e;ual to P 6no le%els were grouped70 the factor is also fi9ed"
A9amples of fi9ed factors include rates of application0 %arieties0 types of compound0
etc" With fi9ed factors0 we are generally interested in estimating fi9ed effects
associated with the specific le%els of the fi9ed factors"
!n contrast to this systematic selection procedure0 if p le%els of a factor included in
the e9periment represent a random sample from the potential P le%els0 the factor is
considered to e a random factor" 8or e9ample0 if a random sample of p of the P
potential hospitals is included in the e9periment0 the factor 6hospitals7 is a random
factor" !n most practical situations in which random factors are encountered0 p is
;uite small relati%e to P"
A9amples of random factors include people0 herds0 plants0 lots0 hospitals0 etc" With
random factors0 we are generally interested in estimating the %ariaility present in
these factors"
4he 810 82 and 83 options may e used to set a factor as fi9ed or random" 8or
e9ample0 to set factors 2 and 3 as random factors0 you would use the option5
:P4!:'S 82^$ 83^$
1;> 0d,anced 0nalyses StatPac For Windows User's Manual
4he formulas for the 8 tests depend upon the type of design and whether the factors
are fi9ed or random" !f a factor is inappropriately specified as random0 StatPac will
simply continue processing it as if it were random and will e unale to detect the
error"
Critical F Probability
4he analysis of %ariance y itself can re%eal that differences e9ist etween different
le%els of the e9perimental condition" 4hat is0 a significant 8-ratio indicates a
significant difference etween at least two of the le%els" !t does not actually tell
where the differences occur" 4he lsd t-tests etween all the cominations of means
re%eal where the actual difference6s7 is 6are7" 4he t-tests will only e performed if the
8-ratio is significant at the critical 8 proaility" 8or e9ample0 if the critical 8
proaility is e;ual to "02 6C8^"0270 the t-tests will e performed only if the 8-ratio
is less than or e;ual to "02"
4he t-tests will e performed for only those pairs of means that ha%e a significant 8-
ratio" 4a,e the e9ample where factor # has a significant 8-ratio and factor & does
not" 4he lsd t-tests will e performed etween all cominations of le%els of factor #0
while no t-tests will e performed etween the le%els of factor &"
Critical T Probability
!f an 8-ratio is significant at the critical 8 proaility0 StatPac will run through the
pair of cell means and compute the lsd t-statistic and proaility of t" We are usually
only interested in those cominations where the t-statistic is significant" 4he critical t
proaility allows the selecti%e printing of the t-statistics depending on the
proaility of t" 8or e9ample0 if the critical t proaility is set to "02 6C4^"0270 only
those t-%alues that ha%e proailities of "02 or less will e printed"
4he t statistic will re%eal differences etween the group means" !f any t is significant0
it will e printed" 4his procedure0 called the new lsd 6least significant difference7 t-
test0 is considered to e one of the most conser%ati%e post-hoc tests"
&'ample of a t:Test Printout
Category Creation
4he actual categories 6le%els for each factor7 can e created either from the study
design %alue laels 6CC^.7 or from the data itself 6CC^@7" When the categories are
created from the laels0 the %alue laels themsel%es will e used to define the le%els
for each factor" #ny data that does not match up with a %alue lael 6e"g"0 mispunched
StatPac For Windows User's Manual 0d,anced 0nalyses 1;1
data7 will e counted as missing" When categories are created from the data0 the data
itself will e used to define the le%els0 whether or not there is a matching %alue lael"
Print Codes
4he code for each le%el can e printed or suppressed with the PC^J and PC^'
options0 respecti%ely"
7rus/al:-allis Test
4he non-parametric e;ui%alent of an analysis of %ariance is the Erus,al-Wallis test"
4he data is ran,ed0 and the sum of the ran,s for each of the groups is used to
calculate the statistic" 4he proaility is determined using the chi-s;uare distriution
with the degrees of freedom e;ual to the numer of groups minus one"
Labeling and $pacing Options
3tion Code Function
.aeling .& Sets the laeling for descripti%e statistics to print
the %ariale lael 6.&^A70 the %ariale name
6.&^'70 or the %ariale numer 6.&^C7"
Column Width CW Sets the minimum width of the columns 6in inches7"
Column Spacing CS Sets the spacing 6in inches7 etween the columns"
@ecimal Places @P Sets the numer of decimal digits that will e
shown"
4nova &'amples
4he following pages gi%e a rief description of the ele%en analysis of %ariance
designs which StatPac can analyBe along with simple e9amples and the statistical
tests for each of these designs" !t is important to note that0 in many cases0 more than
one design may e appropriate for a gi%en data set"
5. -ne ,actor (ompletely Randomi>ed *esi/n
Synta95
#':?# 617 [@ependent %ariale\ 6[8actor #\7
#':?# 617 6[8actor # %ariale list\7
@iscussion5 4his is the simplest design and the easiest to carry out" 4he design
contains only one factor0 and can handle une;ual numers of oser%ations per le%el"
#n A9ample5 !n an attempt to study fat asorption in doughnuts0 23 doughnuts were
prepared 6si9 doughnuts from each of four ,inds of fats7" 4he dependent %ariale is
grams of fat asored0 and the factor %ariale is the type of fat" 4he factor contains
four le%els 6four types of fat were tested7" 4he researcher accidentally dropped one of
the doughnuts from the second type of fat0 so the second type of fat contains fi%e
oser%ations instead of si9"
1;& 0d,anced 0nalyses StatPac For Windows User's Manual
4he analysis of %ariance tale follows5
6. Randomi>ed (omplete 'lock *esi/n
Synta95
#':?# 627 [@ependent %ariale\ 6[8actor #\7 6[8actor &\7
#':?# 627 6[8actor # %ariale list\7 6[8actor &\7
#':?# 627 6[8actor #\7 6[8actor & %ariale list\7
'ote5 8actor # is always the e9perimental treatment
8actor & is always the replication or loc,
@iscussion5 4his design is easy to carry out" !t is essentially a one-way analysis of
%ariance with replications 6loc,s7" 4his design always contains e9actly one
oser%ation per cell" >nits assigned to the same loc, are as similar as possile in
responsi%eness0 thus increasing the precision of treatment comparisons y
eliminating loc,-to-loc, %ariation" &loc,s can represent time0 location or
e9perimental material" A9amples of loc,s include repeated testing o%er time0 litter-
mates0 and groups of e9perimental plots as similar as possile in terms of fertility0
drainage0 and liaility to attac, y insects"
#n A9ample5 # researcher wants to study the effects four seed treatments and a
control group 6a total of fi%e treatment le%els7 on the germination of soyean seeds"
4he factor %ariale is the type of treatment 61 to 27" 8i%e germination eds were
prepared for each le%el of treatment and 100 seeds factors were planted in each ed"
4hus0 the replications are the fi%e eds" 4he dependent %ariale is the numer of
plants in each ed which failed to germinate" 4here are two factors5 treatment and
replication"
4he analysis of %ariance tale follows5
StatPac For Windows User's Manual 0d,anced 0nalyses 1;1
9. Randomi>ed (omplete 'lock *esi/n With Samplin/
Synta95
#':?# 637 [@ep" %ar"\ 6[8actor #\7 6[8actor &\7 6[8actor C\7
#':?# 637 6[8actor # %ariale list\7 6[8actor &\7 6[8actor C\7
#':?# 637 6[8actor #\7 6[8actor & %ariale list\7 6[8actor C\7
#':?# 637 6[8actor #\7 6[8actor &\7 6[8actor C %ariale list\7
'ote5 8actor # is always the e9perimental treatment
8actor & is always the replicate or loc,
8actor C is always the sampling or determinations
@iscussion5 4his design is the same as the pre%ious design with more than one
oser%ation per e9perimental unit" A9periments often contain more than one
oser%ation per e9perimental unit when the researcher wishes to estimate the
reliaility of measurement" With this design0 the error term is ro,en down into
e9perimental error and sampling error" Sampling error measures the failure of
oser%ations made on any e9perimental unit to e precisely ali,e" A9perimental error
is usually e9pected to e larger than sampling error" !n other words0 %ariation among
e9perimental units is e9pected to e larger than %ariation among susamples of the
same unit"
#n A9ample5 4he oHecti%e of an e9periment was to study the effect of corn %ariety
on protein content" # field was di%ided into three similar plots" Aach plot was
sudi%ided into fourteen sections" 8ourteen different %arieties of corn were planted in
each plot 6one in each section7" #fter har%est0 two protein determinations were made
on each %ariety of corn in each plot" 4he dependent %ariale was the protein content"
8actor # was the type of corn and contained 13 le%els" 8actor & was the replication
6the three plots7" 8actor C was the two determinations"
4he analysis of %ariance tale follows5
:. Two0,actor ,actorial in (ompletely Randomi>ed *esi/n
Synta95
#':?# 637 [@ependent %ariale\ 6[8actor #\7 6[8actor &\7
#':?# 637 6[8actor # %ariale list\7 6[8actor &\7
#':?# 637 6[8actor #\7 6[8actor & %ariale list\7
1;) 0d,anced 0nalyses StatPac For Windows User's Manual
@iscussion5 When compared to a one-factor-at-a-time approach0 factorial designs
are superior ecause they enale interactions etween different factors to e
e9plored" !nstead of performing two e9periments 6one for each factor70 the researcher
can perform one e9periment to determine the effects of each factor and their
interaction" >nalanced designs are acceptale"
#n A9ample5 Si9ty ay male rats were randomly assigned to one of si9 feeding
treatments" 4he dependent %ariale is the weight gain of the rats" 4he feeding
treatments were a comination of two factors0 source and le%el of protein" 4hree of
the rats died efore the e9periment was completed" 4he si9 feeding treatments were a
comination of two factors5
8actor # 63 le%els75 Source of protein5 &eef0 Cereal0 Por,
8actor & 62 le%els75 .e%el of protein5 <igh0 .ow
4he analysis of %ariance tale follows5
?. Two0,actor ,actorial in Randomi>ed (omplete 'lock *esi/n
Synta95
#':?# 627 [@ep" %ar"\ 6[8actor #\7 6[8actor &\7 6[8actor C\7
#':?# 627 6[8actor # %ariale list\7 6[8actor &\7 6[8actor C\7
#':?# 627 6[8actor #\7 6[8actor & %ariale list\7 6[8actor C\7
#':?# 627 6[8actor #\7 6[8actor &\7 6[8actor C %ariale list\7
'ote5 8actor # is always an e9perimental treatment
8actor & is always an e9perimental treatment
8actor C is always the replicate or loc,
@iscussion5 4his #':?# design is the same as the pre%ious two-way factorial
design e9cept that replications ha%e een added" 4his design will always contain
e9actly one oser%ation per cell" !t should e noted that for small e9periments0 the
degrees of freedom for error may e ;uite small with this design"
#n A9ample5 $iofla%in content of collard lea%es can e determined y a chemical
techni;ue ,nown as fluorometric determination" #n e9periment was designed to
study this techni;ue" 8actor # is the siBe of leaf used to ma,e the determination 60"22
grams and 1"00 grams70 and factor & is the effect of the inclusion of a permanganate-
pero9ide clarification step in the chemical process" 4he procedure was replicated on
three successi%e days" 4here is one oser%ation for each cell of the design" 4he
dependent %ariale is apparent riofla%in concentration 6mg"Mgm"7 in collard lea%es"
StatPac For Windows User's Manual 0d,anced 0nalyses 1;!
4he analysis of %ariance tale follows5
@. Three0,actor ,actorial in (ompletely Randomi>ed *esi/n
Synta95
#':?# 6-7 [@ep" %ar"\ 6[8actor #\7 6[8actor &\7 6[8actor C\7
#':?# 6-7 6[8actor # %ariale list\7 6[8actor &\7 6[8actor C\7
#':?# 6-7 6[8actor #\7 6[8actor & %ariale list\7 6[8actor C\7
#':?# 6-7 6[8actor #\7 6[8actor &\7 6[8actor C %ariale list\7
'ote5 8actor # is always an e9perimental treatment
8actor & is always an e9perimental treatment
8actor C is always an e9perimental treatment
@iscussion5 4he three-way design is used when there are three factors to in%estigate"
4here are three main effects 6#0 & and C7 and four interaction effects 6#&0 #C0 &C
and #&C7" >nalanced designs are acceptale" !n the special case where there is only
one oser%ation per cell0 the error term ecomes e;ual to Bero" !n this case0 it is
usually assumed that the three-way interaction term is not significantly different
from the error term0 and the three-way interaction is used in place of the error term"
With small numers of le%els for the factors0 this can lea%e %ery few degrees of
freedom for the error 63-way interaction7 term"
#n A9ample5 # researcher was in%estigating the effect of %arious fertiliBers on the
growth of carrots" 4he three factors were nitrogen 6'70 potassium 6E7 and
phosphorous 6P7" 4hree le%els of concentration le%els were tested for each factor
6low0 medium0 and high7" 4his resulted in 2) different fertiliBer cominations" 4he
dependent %ariale is the weight of the carrot root 6in grams7 grown under each of
the fertiliBer conditions" 'ote that in the special case of one oser%ation per cell 6i"e"0
one carrot for each fertiliBer comination70 no error term appears in the #':?#
tale"
1;* 0d,anced 0nalyses StatPac For Windows User's Manual
4he analysis of %ariance tale is as follows5
A. Three0,actor #ested *esi/n
Synta95
#':?# 6)7 [@ep" %ar"\ 6[8actor #\7 6[8actor &\7 6[8actor C\7
#':?# 6)7 6[8actor # %ariale list\7 6[8actor &\7 6[8actor C\7
#':?# 6)7 6[8actor #\7 6[8actor & %ariale list\7 6[8actor C\7
#':?# 6)7 6[8actor #\7 6[8actor &\7 6[8actor C %ariale list\7
'ote5 8actor # is always the e9perimental unit
8actor & is always a su-unit of 8actor #
8actor C is always a su-unit of 8actor &
@iscussion5 When each sample is composed of susamples0 we ha%e a nested or
hierarchical design" 4he oHecti%e of this design is to estimate the %ariance
components associated with the %arious nested factors" >nalanced designs are
acceptale" !n the special case of e9actly one oser%ation per cell0 the error term is
Bero0 and it will not e printed"
#n A9ample5 #n in%estigator wanted to estimate calcium concentration in lea%es of
turnip plants" 8our plants were ta,en at random and three lea%es 6samples7 were
randomly selected from each plant" 4wo susamples were then ta,en from each leaf0
and calcium was determined y microchemical methods" 4he oHecti%es of the
e9periment were to estimate the %ariaility in concentration across plants0 etween
lea%es of the same plant0 and within susamples of the same leaf"
4he analysis of %ariance tale follows5
StatPac For Windows User's Manual 0d,anced 0nalyses 1;-
B. Split0lot With (ompletely Randomi>ed *esi/n of "ain lots
Synta95
#':?# 6(7 [@ep" %ar"\ 6[8actor #\7 6[8actor &\7 6[8actor C\7
#':?# 6(7 6[8actor # %ariale list\7 6[8actor &\7 6[8actor C\7
#':?# 6(7 6[8actor #\7 6[8actor & %ariale list\7 6[8actor C\7
#':?# 6(7 6[8actor #\7 6[8actor &\7 6[8actor C %ariale list\7
'ote5 8actor # is always an e9perimental treatment
8actor & is always an e9perimental treatment
8actor C is always the replicate or loc,
@iscussion5 4he term split-plot comes from agricultural e9perimentation" Split-plot
designs contain two treatment factors" 4he main plots are the e9perimental units for
one of the factors0 and the suplots are the e9perimental units for the other factor"
Split-plots are a repeated measure design"
#n A9ample5 !n this e9periment0 si9 suHects were di%ided into two groups
according to the method they were told to use for calirating dials" 4hree suHects
used method #1 to calirate the dials0 and three suHects used method #2" Aach
suHect was told to calirate four differently shaped dials 6&10 &20 &3 and &37" 4he
dependent %ariale is the accuracy of each caliration attempt" 8actor # is the
method of calirating dials0 and factor & is the shape of dials" 4he three suHects in
each group are the replicates" 4his design will always contain e9actly one
oser%ation per cell"
4he analysis of %ariance tale follows5
C. Split0lot With Randomi>ed (omplete 'lock *esi/n of "ain lots
Synta95
#':?# 697 [@ep" %ar"\ 6[8actor #\7 6[8actor &\7 6[8actor C\7
#':?# 697 6[8actor # %ariale list\7 6[8actor &\7 6[8actor C\7
#':?# 697 6[8actor #\7 6[8actor & %ariale list\7 6[8actor C\7
#':?# 697 6[8actor #\7 6[8actor &\7 6[8actor C %ariale list\7
1;; 0d,anced 0nalyses StatPac For Windows User's Manual
'ote5 8actor # is always an e9perimental treatment
8actor & is always an e9perimental treatment
8actor C is always the replicate or loc,
@iscussion5 4his design is preferale to the pre%ious design when homogeneous
loc,s of e9perimental units are a%ailale0 thus allowing a more accurate comparison
of treatments y eliminating intra-loc, %ariaility" Aach #& treatment comination
is replicated in each loc," 4here will always e e9actly one oser%ation per cell
with this design"
#n A9ample5 4his e9ample studies the effects of alfalfa %ariety and the date of
har%est on yields" Si9 plots 6replicates7 were used" 8actor # is alfalfa %ariety and
factor & is the date of har%est" 8actor C are the replicates 6si9 plots7"
4he analysis of %ariance tale follows5
5D. Split0lot With Sub0$nit Treatments Arran/ed in Strips
Synta95
#':?# 6107 [@ep" %ar"\ 6[8actor #\7 6[8actor &\7 6[8actor C\7
#':?# 6107 6[8actor # %ariale list\7 6[8actor &\7 6[8actor C\7
#':?# 6107 6[8actor #\7 6[8actor & %ariale list\7 6[8actor C\7
#':?# 6107 6[8actor #\7 6[8actor &\7 6[8actor C %ariale list\7
'ote5 8actor # is always an e9perimental treatment
8actor & is always an e9perimental treatment
8actor C is always the replicate or loc,
@iscussion5 !nstead of randomiBing the su-unit treatment independently within
each unit0 it is often necessary 6or desirale7 to ha%e the su-unit treatment arranged
in strips across each replication" 4his design has an ad%antage o%er the pre%ious
design ecause it allows the determination of e9perimental error 6error not
attriutale to either main factor7" 4he layout may e particularly con%enient for
some field e9periments" 4his design always contains e9actly one oser%ation per
cell"
StatPac For Windows User's Manual 0d,anced 0nalyses 1;'
4his design sacrifices precision on the main effects of # and & in order to pro%ide
higher precision on the interaction term which will generally e more accurately
determined than in either randomiBed loc,s or the simple split-plot design" 8or a 2
y 3 design0 the appropriate arrangement 6after randomiBation7 might e as shown
elow for 2 replications5
$eplication 1 $eplication 2
a3 a1 a2 a0 a3 a1 a3 a0 a2 a3
2 1
0 2
1 0
#n A9ample5 4he researcher used ten %arieties and three generations of corn seed to
study the effect of yield" 4he generations 6a0 and c7 appear in strips across loc,s as
well as the hyrid numer"
4he analysis of %ariance tale follows5
55. &atin S3uare *esi/n
Synta95
#':?# 6117 [@ep" %ar"\ 6[8actor #\7 6[8actor &\7 6[8actor C\7
#':?# 6117 6[8actor # %ariale list\7 6[8actor &\7 6[8actor C\7
#':?# 6117 6[8actor #\7 6[8actor & %ariale list\7 6[8actor C\7
#':?# 6117 6[8actor #\7 6[8actor &\7 6[8actor C %ariale list\7
'ote5 8actor # is always the row factor
8actor & is always the column factor
8actor C is always the treatment factor
@iscussion5 .atin s;uare designs are %ery efficient when a small numer of
treatments are eing tested ecause treatment comparisons are made more precise y
eliminating row and column effects" 4he asic characteristic of a .atin s;uare design
is that each treatment appears once in each row and once in each column" With small
numers of treatments0 there are few degrees of freedom for error" 4he limitation of
the .atin s;uare for a large numer of treatments is due to the re;uirement that there
1'> 0d,anced 0nalyses StatPac For Windows User's Manual
e the same numer of replications as treatments" 4hus0 the most generally used
.atin s;uares %ary from 3 y 3 to 10 y 10" .atin s;uare designs are also useful to
study se;uences of treatments andMor carry-o%er of treatments" 4his design will
always contain e9actly one oser%ation per cell"
#n A9ample5 4he field layout for 2 irrigation treatments 6#0 &0 C0 @ and A7 was as
follows5
Columns
1 2 3 3 2
$ow 1 A @ # & C
$ow 2 C A @ # &
$ow 3 # C & A @
$ow 3 @ & A C #
$ow 2 & # C @ A
4he analysis of %ariance tale follows5
$ummary of 4nova Designs
#no%a 4ype^1 :ne-8actor Completely $andomiBed @esign
8actor # - e9perimental treatment
&alanced or unalanced design
#no%a 4ype^2 $andomiBed Complete &loc, @esign
8actor # - e9perimental treatment
8actor & - replicates or loc,s
&alanced design only
#no%a 4ype^3 4wo-8actor 8actorial in Completely $andomiBed @esign
8actor # - e9perimental treatment
8actor & - replicates or loc,s
8actor C - sampling or determinations
&alanced design only
StatPac For Windows User's Manual 0d,anced 0nalyses 1'1
#no%a 4ype^3 4wo-8actor 8actorial in Completely $andomiBed @esign
8actor # - e9perimental treatment
8actor & - e9perimental treatment
&alanced and unalanced design
#no%a 4ype^2 4wo-8actor 8actorial in $andomiBed Complete &loc, @esign
8actor # - e9perimental treatment
8actor & - e9perimental treatment
8actor C - replicates or loc,s
&alanced design only
#no%a 4ype^- 4hree-8actor 8actorial in Completely $andomiBed @esign
8actor # - e9perimental treatment
8actor & - e9perimental treatment
8actor C - e9perimental treatment
&alanced or unalanced design
#no%a 4ype^) 4hree-8actor 'ested @esign
8actor # - e9perimental unit
8actor & - su-unit of factor #
8actor C - su-unit of factor &
&alanced or unalanced design
#no%a 4ype^( Split-Plot With Completely $andomiBed @esign of 1ain Plots
8actor # - e9perimental treatment
8actor & - e9perimental treatment
8actor C - replicates or loc,s
&alanced design only
#no%a 4ype^9 Split-Plot With $andomiBed Complete &loc, of 1ain Plots
8actor # - e9perimental treatment
8actor & - e9perimental treatment
8actor C - replicates or loc,s
&alanced design only
#no%a 4ype^10 Split-Plot With Su->nit 4reatments #rranged in Strips
8actor # - e9perimental treatment
8actor & - e9perimental treatment
8actor C - replicates or loc,s
&alanced design only
1'& 0d,anced 0nalyses StatPac For Windows User's Manual
#no%a 4ype^11 .atin S;uare @esign
8actor # - row factor
8actor & - column factor
8actor C - e9perimental treatment
&alanced design only
C0737IC0. Co((and
Canonical correlation analysis is a powerful multi%ariate statistical techni;ue to
study the intercorrelation structure of two sets of %ariales 6%ariale set 1 and
%ariale set 27" Aach OsetO of %ariales must contain at least two %ariales0 although
the numer of %ariales in each set does not need to e the same" StatPac defines set
1 as the set with the larger numer of %ariales0 and set 2 as the set with the smaller
numer of %ariales" 4his con%ention is used to speed up the e9ecution of the
analysis"
:ften 6ut not necessarily70 one set is regarded as a OdependentO set and the other set
is regarded as an OindependentO set" 8or e9ample0 uying eha%ior could e a
OdependentO %ariale set0 and %arious personality characteristics of the uyers could
e the OindependentO %ariale set" >sually0 the %ariales in each set represent two
distinct %ariale OdomainsO that are conceptually different and measured on the same
indi%iduals"
Canonical correlation analysis is related to many other statistical techni;ues"
Consider the following analogy" !f each set of %ariales were to contain only one
%ariale0 simple correlation analysis would e e;ui%alent to canonical correlation
analysis" !f one of the sets has one %ariale and the other set has two or more
%ariales0 then multiple regression analysis would e e;ui%alent to canonical
correlation analysis" Canonical correlation analysis can e seen as an e9tension of
multiple regression when a single dependent %ariale is replaced y a set of
dependent %ariales"
Canonical correlation analysis first calculates two new %ariales called the Ofirst
canonical %ariale pairO" :ne of the new %ariales is calculated from set 10 and the
other new %ariale is calculated from set 2" 4hese new %ariales are constructed
through linear cominations of the original %ariales so that the new canonical
%ariale from set 1 has ma9imum correlation with the new canonical %ariale from
set 2"
4he second canonical %ariale pair is created in a similar fashion" :ne canonical
%ariale is constructed from the first set of original %ariales and has ma9imum
correlation with the second canonical %ariale created from the second set of original
%ariales" 4his process is suHect to the constraint that the second canonical %ariale
pair is uncorrelated with the first canonical %ariale pair" !n essence0 the first
canonical pair 6one canonical %ariale from each set7 is chosen so that the correlation
etween the two sets of original %ariales is ma9imiBed" 4he second set of canonical
%ariales ma9imiBes the Oremaining correlationO etween the two sets of %ariales
6not pic,ed up y the first set of canonical %ariales7" 4he same philosophy applies
to suse;uent canonical %ariale pairs created"
4his concept of independence of each canonical %ariale pair is similar to that
in%ol%ed in calculating principal components" 4he difference lies in the way the
canonical %ariale pairs 6or weights assigned to the original %ariales of each of the
two sets7 are created" !n canonical correlation0 the weights for each pair of canonical
%ariales are calculated with the intent of ma9imiBing OremainingO correlation
etween the two sets of %ariales0 while in principal components the weights are
StatPac For Windows User's Manual 0d,anced 0nalyses 1'1
calculated with the intent of ma9imiBing the remaining Ocorrelation 6or %ariance7
structureO in one set of %ariales"
Canonical analysis pro%ides a powerful method of studying the correlation structure
etween two sets of %ariales" 8or e9ample0 assume we are interested in studying the
inter-correlation of %ariales from two different tests0 each containing 20 %ariales"
4he correlation matri9 would contain 300 different correlation coefficients to
e9amine" 4his would e a %ery large tas," 4he canonical correlation analysis
simplifies this tas, y5
1" @etermining the ma9imum correlation possile of any linear comination of the
original %ariales in each set"
2" @eri%ing two sets of weighting coefficients 6one for each of the two sets of
%ariales7 to arri%e at a new composite %ariale 6canonical %ariate7 representing each
set of %ariales" 4his pro%ides a structured way of e9amining the contriution of each
original %ariale 6from each set7" 1ore specifically0 this allows one to pinpoint
groups of %ariales from each set that are highly correlated" :ften0 these groups can
e gi%en theoretical meaning"
3" @eri%ing additional linear functions which ma9imiBe the remaining correlation
etween the two sets0 suHect to eing independent of the preceding set6s7 of linear
compounds"
3" 4esting the statistical significance of the correlation measures0 therey determining
the minimum numer of linear functions re;uired to account for the correlation
structure of the two sets"
2" #ssessing the o%erall e9tent of correlation etween the two sets of %ariales"
8or a detailed mathematical discussion of canonical correlation analysis 6as well as
the interpretation of the canonical correlation output of se%eral e9amples70 the user is
referred to the .ohnes and Cooley 619)17 oo, gi%en in the iliography"
4he synta9 of the command to run canonical correlation analysis is5
C#':'!C#. [?ariale list 1\ W!4< [?ariale list 2\
#s an e9ample0 a researcher wished to study the correlation etween 3 physiological
measurements WA!F<4 6?170 W#!S4 6?27 and P>.SA 6?37 with 3 e9ercise
%ariales C<!'S 6?370 S!4>PS 6?27 and I>1PS 6?-7"
4he command to run canonical correlation analysis could e specified in se%eral
ways5
C#':'!C#. WA!F<40 W#!S40 P>.SA W!4< C<!'S0 S!4>PS0 I>1PS
C#':'!C#. ?1 ?2 ?3 W!4< ?3 ?2 ?-
C#':'!C#. ?1-?3 W!4< ?3-?-
C# ?1-?3 W!4< ?3-?- 6'ote5 C#':'!C#. can e are%iated as C#7
4he %ariale list can consist of %ariale laels andMor %ariale numers" Aither a
comma or a space can e used to separate the %ariales from each other" 4he
,eyword W!4< is used to separate the two sets of %ariales"
1') 0d,anced 0nalyses StatPac For Windows User's Manual
Descriptive $tatistics
4he mean and standard de%iations for all %ariales in oth sets can e printed with
the descripti%e statistics option 6@S^J7"
&'ample of Descriptive $tatistics
$imple Correlation %atri'
4he simple correlation matri9 is printed with the SC^J option"
&'ample of a $imple Correlation %atri'
R:$=uared Table
4his option 6$S^J7 pro%ides the multiple correlation 6r-s;uared7 analysis of each
%ariale in each set0 regressed on all %ariales in the other set" 4he r-s;uared %alue
StatPac For Windows User's Manual 0d,anced 0nalyses 1'!
gi%en in the first row0 is the s;uared multiple correlation of the first %ariale in the
first set0 with the entire set of %ariales in the second set" 4he r-s;uared %alue in the
last row is the s;uared multiple correlation of the last %ariale in the second set0 with
the entire set of %ariales in the first set0 and so forth"
4his output is a useful supplement to canonical correlation analysis0 especially when
used in conHunction with the redundancy analysis output descried elow" 4he output
from this option allows one to measure whether certain %ariales are more correlated
than other %ariales 6within the same set7 to the other set as a whole"
&'ample of an R:$=uared Table
$tandardi3ed Coefficients
StandardiBed coefficients for all canonical %ariales in oth sets are printed with the
option $C^J" 4he standardiBed canonical %ariale coefficients are printed for the
first set of %ariales0 followed y those of the second set" 4hese are the weights
assigned to each original %ariale 6standardiBed y sutracting the mean and di%iding
y the standard de%iation7 to construct the new %ariales 6standardiBed canonical
%ariale pairs7 for each set"
&'ample of a $tandardi3ed Coefficients Table
Correlation of Canonical Pair "it Original Variables
4he canonical %ariale loadings are pro%ided for each set in a separate tale" 4hese
loadings are the correlation of the canonical %ariales with the original %ariales in
the set and are similar to factor loadings in factor analysis" 4he loadings
6correlations7 therefore indicate the relati%e contriution of each original %ariale 6in
1'* 0d,anced 0nalyses StatPac For Windows User's Manual
each set7 in constructing the new canonical %ariales" 4his is the most useful tale in
understanding the correlation structure of the two sets of %ariales0 and it pro%ides
insight into interpretation of the canonical %ariale pairs"
&'ample of Canonical Variable Loadings
Redundancy Table
Canonical redundancy analysis e9amines 17 how well the original %ariales can e
predicted from the canonical %ariales0 and 27 how much of the O%arianceO of the two
sets is in common 6i"e"0 how much of the O%arianceO in one set can e accounted for
y the other set7" !f $4^J0 a redundancy tale is printed for each of the 2 sets of
%ariales" Aach tale pro%ides two statistics for each canonical %ariale"
4he statistic gi%en in the first column represents the proportion of the O%arianceO in
the set of %ariales eing analyBed that is accounted for y each canonical %ariale in
that set" Since all canonical %ariales are independent0 the total figure 6last row7
presents a measure of how well the canonical %ariales ha%e een ale to account for
the O%arianceO in the original %ariales" !t should e noted that0 for the second set of
%ariales0 this total figure will always e 1 since there are as many new %ariales as
original %ariales and the new %ariales are independent"
4he statistic in the second column gi%es the proportion of the O%arianceO in the set
that is e9plained y each canonical %ariale in the other set" 4his statistic is usually
referred to as the Oredundancy of a set gi%en the otherO0 and measures the e9tent of
o%erlap etween the two sets with respect to that canonical %ariale pair" # small
redundancy %alue indicates that practically no o%erlap across sets is present in that
particular pair of canonical %ariales" 4he total figure 6last row of the second
column7 pro%ides an o%erall measure of the e9tent to which one set is a good
predictor of the other 6ased on the canonical %ariale pairs constructed7" 4he
redundancy measure is important ecause a %ery large canonical coefficient could e
the result of a %ery large Bero-order correlation of Hust one %ariale of one set with
Hust one %ariale of the other set0 and the remainder of the %ariales in the two sets
could e essentially unin%ol%ed" !n this case0 the canonical correlation for that pair of
canonical %ariales would e high ut the redundancy for that pair of canonical
%ariales would e low" 4he redundancy criteria would therefore e a etter measure
of the e9tent of o%erlap in the two OsetsO than the measure pro%ided y the canonical
correlation associated with that canonical correlation pair"
StatPac For Windows User's Manual 0d,anced 0nalyses 1'-
&'ample of a Redundancy Table
RaoBs F:$tatistic Table
?arious statistics0 including $aoDs 8-statistic0 are included in this tale" !t pro%ides
information to e%aluate the e9tent of the correlation etween the two sets of
%ariales0 the numer of canonical %ariale pairs that are re;uired to represent this
correlation0 and how successful the canonical %ariales ha%e een in summariBing
the interdependence of the two sets of %ariales"
>ntil recently0 $aoDs 8-statistic tale was %irtually the only tool a researcher had to
e%aluate the ao%e criteria" 1ore recently0 howe%er0 researchers ha%e come to realiBe
that these statistics can e misleading in the asence of the redundancy analysis
tale" 4he statistics in this tale0 comined with the redundancy tale statistics0
pro%ide a more powerful approach to studying the performance of the canonical
correlation analysis"
4he canonical correlation gi%en in the first row of this tale 6second column7 is the
correlation etween the first pair of canonical %ariales 6i"e"0 the correlation of the
first new %ariale created from the first set of original %ariales with that of the first
new %ariale created from the second set of %ariales7" &y construction0 this is the
ma9imum correlation that can e otained etween any linear comination of the
first set of %ariales and any linear cominations of %ariales in the second set" 4he
canonical correlation gi%en in the second row of this tale is the correlation etween
the second pair of canonical %ariales0 and so forth"
4he ma9imum numer of canonical %ariale pairs that can e constructed is e;ual to
the numer of %ariales in the second set" $ememer that0 y construction0 the ith
canonical %ariale pair is independent of all the canonical %ariale pairs efore it0
thus implying that the second canonical %ariale pair represents two new %ariales
that are ma9imally correlated0 suHect to the condition that they are not pic,ing out
any of the correlation structure that was already pic,ed up y a pre%ious canonical
%ariale pair"
4he third column 6canonical r-s;uared7 is simply the s;uare of the canonical
correlation and represents the amount of %ariance in one canonical %ariate that is
1'; 0d,anced 0nalyses StatPac For Windows User's Manual
accounted for y its canonical %ariale counterpart in the other set" &y definition0 the
canonical r-s;uare gi%en in the first row should e greater than the r-s;uare %alue
otained y regressing only one %ariale from a set 6say the first7 with all the
%ariales from the other set 6the second set7" 4his can e %erified with the r-s;uared
tale 6option $S7" Should any of the %alues in the r-s;uared tale e close to the first
canonical r-s;uare0 it is doutful that the other %ariales in that set are adding much
to the correlation with the other set"
4he fourth column pro%ides $aoDs 8-statistic to test how many canonical %ariale
pairs are needed to ade;uately represent the correlation structure of the two sets of
%ariales" Some software uses &artlettDs chi-s;uare statistic to test the hypothesis"
StatPac pro%ides $aoDs 8-statistic0 as it is a more accurate test0 especially with a
small sample siBe"
4he fifth and si9th columns gi%e the degrees of freedom associated with this 8-
statistic0 while the se%enth column gi%es the significance le%el 6proaility %alue7
associated with the 8-statistic" 4he proaility %alue in the first row pro%ides a test of
whether the canonical %ariales ha%e accounted for a significant amount of the
correlation structure etween the two sets of %ariales 6i"e"0 at least the first canonical
correlation is significantly different from Bero7" 4he proaility %alue gi%en in the
second row tests whether all the canonical correlations 6e9cept the first7 are
significantly different from Bero" 4he proaility %alue in the third row tests whether
all canonical correlations 6e9cept the first two7 are significantly different from Bero0
and so forth" StatPac pro%ides output on all canonical %ariale pairs possileW it is up
to the user to determine 6ased on magnitude of the canonical correlations as well as
the significance le%el of the 8-statistics7 how many of these pairs are rele%ant" 4he
last column pro%ides Wil,Ds lamda as each of the canonical %ariales is addedW this
criterion is used in calculating the 8-statistic"
&'ample of a RaoBs F:$tatistic Table
%ean $ubstitution
1ean sustitution is one method often used to reduce the prolem of missing
information" Sometimes0 canonical correlation analysis is difficult ecause if one
%ariale is not ,nown0 the whole record must e e9cluded from the analysis" 4his
could sustantially reduce the numer of records that are included in the analysis0
especially when there are many %ariales in the analysis" 1ean sustitution
o%ercomes this prolem y replacing any missing %ariale with the mean of that
%ariale"
$ave Canonical Pair
$esearchers often want to sa%e the first two canonical %ariales for future analysis"
Jou can sa%e them with the options command SP^J" #t the conclusion of the
analysis you will e gi%en the opportunity to merge the new %ariales into the
original data"
StatPac For Windows User's Manual 0d,anced 0nalyses 1''
Labeling and $pacing Options
3tion Code Function
.aeling .& Sets the laeling for descripti%e statistics to print
the %ariale lael 6.&^A70 the %ariale name
6.&^'70 or the %ariale numer 6.&^C7"
Column Width CW Sets the minimum width of the columns 6in inches7"
Column Spacing CS Sets the spacing 6in inches7 etween the columns"
@ecimal Places @P Sets the numer of decimal digits that will e
shown"
M0P Co((and
Perceptual mapping refers to a road range of mar,et research techni;ues to study
consumer perceptions of products 6OrandsO7 in a class ased on the product
attriutes" 4o achie%e this oHecti%e0 an attempt is made to reduce the dimensionality
of the productMattriute spaceW plots 6perceptual maps7 are then used to graphically
display consumer perceptions of OrandsO in a category"
1ar,eting researchers use perceptual mapping to identify new opportunities and
mar,eting strategies" :ne of its primary application is to analyBe the effecti%eness of
mar,eting campaigns designed to modify peopleDs perceptions of a product"
4he four most fre;uently used attriute-ased statistical tools for perceptual mapping
are discriminant analysis0 principal components analysis0 factor analysis and
correspondence analysis"
4he 1#P command uses the correspondence analysis approach to perceptual
mapping" Correspondence analysis is an e9ploratory statistical techni;ue for
e9amining multi%ariate categorical data 6usually in the form of a anners tale7 and
graphically displaying oth the rows and columns of the tale in the same
multidimensional space" 4he oHect of correspondence analysis is to graphically
summariBe the correlations among row and column categories"
!n mar,eting applications0 columns are usually rands0 and rows are image attriutes"
<owe%er0 since the row and column categories are treated e;ually0 the a9es of the
anners tale could e swapped and the results would e the same" Correspondence
analysis produces perceptual maps showing how consumers percei%e %arious rands
in relation to a set of image attriutes" &rands with similar image profiles appear
closer together on the map"
Correspondence analysis is synonymous to the following techni;ues5 dual scaling0
method of reciprocal a%erages0 optimal scaling0 pic,-any scaling0 canonical analysis
of contingency tales0 categorical discriminant analysis0 homogeneity analysis0
;uantification of ;ualitati%e data"
Correspondence analysis starts with the usual anners 6crosstas7 tale" 4he tale
always contains one row %ariale and one column %ariale" 4hese are referred to as
the acti%e %ariales"
4he analysis egins y calculating the usual 6contingency tale7 chi-s;uare statistic0
or more specifically0 the chi-s;uare statistic di%ided y sample siBe 6PearsonDs mean-
s;uared contingency coefficient7" 4his ;uantity is often referred to as total inertia" #
)>> 0d,anced 0nalyses StatPac For Windows User's Manual
large chi-s;uare statistic implies association etween rows and columns 6i"e"0 lac, of
independence etween rows and columns7"
4he purpose of correspondence analysis is to plot the nature of this association in a
reduced dimensionality" !t is similar to principal components in that new components
6or factors7 are e9tracted0 each eing independent of each other" !f the first few
components account for most of the Oassociation in the taleO0 we ha%e een
successful in reducing the dimensionality of the rows and columns"
4he difference etween principal components and correspondence analysis is the
O%ariailityO we are trying to e9plain" !n principal components analysis0 we are trying
to e9plain the OcorrelationO or Oco%arianceO structure of a set of %ariales0 while in
correspondence analysis we are trying to e9plain the OassociationO etween rows and
columns of a tale of fre;uencies"
4he decomposition of the chi-s;uare proceeds y calculating two factors or %ectors
6one for the column le%els and the other for the row le%els7" 4hese factors are
e9tracted such that the association etween them is ma9imiBed 6i"e"0 e9plains as
much of the chi-s;uare statistic as possile7" 'e9t0 a second pair of factors is
e9tracted" 4heir association is ma9imiBed to e9plain as much of the remaining chi-
s;uare statistic 6suHect to the constraint that this second factor pair is uncorrelated
with the first factor pair7" 4he same philosophy applies to suse;uent factor pairs
created"
4his concept of independence of each factor pair is similar to the calculation of
principal components" 4he difference lies in the way the factor pairs 6or weights
assigned to the le%els of each row and column7 are created" !n correspondence
analysis0 the weights for each factor pair are calculated with the intent of ma9imiBing
OremainingO association etween row and column le%els0 while in principal
components the weights are calculated with the intent of ma9imiBing the remaining
Ocorrelation 6or %ariance7 structureO in the %ariales"
4he synta9 of the command to run correspondence analysis is5
1#P [#cti%e row %ariale\ &J [#cti%e column %ariale\
4he only restriction on the data is that oth %ariales must e categorical 6alpha or
numeric70 and there must e at least three categories on each a9is" <owe%er0 since the
row and column categories are treated e;ually0 oth can e either oHects 6rands7 or
attriutes"
# simple e9ample might e to map the relationship etween purchasing @AC!S!:'
6?17 and !'C:1A 6?27" 4he command might e e9pressed in many ways5
1#P !'C:1A &J @AC!S!:'
1#P @AC!S!:' &J !'C:1A
1#P ?1 &J ?2
1# ?2 &J ?1 6'ote5 1#P may e are%iated as 1#7
Passive Variables
StatPac can perform multiple correspondence analysis" 4his means that passi%e rows
and columns 6often referred to a supplemental rows and columns7 can e added to
the perceptual maps" 4hese are not included in the actual analysis0 ut rather0 are
superimposed upon the perceptual map of the acti%e %ariales" Passi%e rows and
StatPac For Windows User's Manual 0d,anced 0nalyses )>1
columns are re;uested y adding them to the 1ap command" 4o include passi%e
%ariales0 the synta9 for the 1ap command ecomes5
1#P [#cti%e row %ariale\[Passi%e row %ariales\ &J [#cti%e column
%ariale\[Passi%e column %ariales\
Passi%e rows and columns are often used as reference points for acti%e points in the
plot" 8or e9ample0 if the acti%e columns was rands0 an e9ample of a passi%e column
point could e a hypothetical rand or a rand from a pre%ious similar study"
$tac/ing Variables
Correspondence analysis always uses one acti%e row %ariale and one acti%e column
%ariale 6each containing at least three categories7" !t is often desirale0 howe%er0 to
perform correspondence analysis on contingency tales that contain more than two
dimensions" Stac,ing %ariales allows you to comine two or more %ariales into a
single %ariale" 4he Stac, command may e used to create a new %ariale that
represents all possile cominations of two or more other %ariales"
4he following e9ample would create a single %ariale called @A1:F$#P<!CS0
and it would e used as the acti%e column %ariale" 4he numer of categories in the
new stac,ed %ariale will e the product of the numer of categories in each of the
indi%idual %ariales"
S4#CE @A1:F$#P<!CS ^ #FA SA*
1#P @A1:F$#P<!CS &J &$#'@
!f #FA had fi%e categories and SA* had two categories0 the resultant column
%ariale 6@A1:F$#P<!CS7 would contain ten categories" 4his would co%er all the
possile cominations of categories" Stac,ing %ariales should e used carefully
ecause of the potential for a huge numer of rows or columns" 4he ma9imum
numer of rows or columns is 120"
CountAPercent Table
Correspondence analysis always egins with a anners tale" 4he anner tale itself
is called the countMpercent tale" !t may e printed with the CP^J option or
suppressed with the CP^' option" 4he options to control the appearance of the
CountMPercent tale are identical the options for the &anner command"
!n the following e9ample0 the acti%e row is Party #ffiliation and the acti%e column is
#ttitude on the 'ew Fo%ernment Proposal" #nnual !ncome is a passi%e row0 and
.ieralMConser%ati%e is a passi%e column"
)>& 0d,anced 0nalyses StatPac For Windows User's Manual
&'ample of a CountAPercent Table
Design $ummary for 4bbreviated Labeling on %ap
Perceptual maps can easily ecome o%erly cluttered0 it is sometimes necessary to
are%iate the %alue laels with Hust a numer" 4he design summary will contain the
Oplot numerO for each row and column %ariale 6i"e"0 a numeric are%iation that
can e used when creating large perceptual maps7" 4he #&^J option may e used to
are%iate the map so it uses numers instead of %alue laels" # design summary will
then e printed that prints the %alue laels for all acti%e and passi%e rows and
columns" 4his feature is only important when there are many rows and columns in
the anners tale"
StatPac For Windows User's Manual 0d,anced 0nalyses )>1
&'ample of a Design $ummary
Correspondence 4nalysis &igenvalue $ummary
4he correspondence analysis eigen%alue summary tale is always included in the
output" Aach non-tri%ial eigen%alue represents a dimension 6factor pair7" 4he
ma9imum numer of eigen%alues for any contingency tale is one less than the
minimum of the numer of rows and the numer of columns in the contingency
tale" 4he sum of all eigen%alues e;uals the chi-s;uare statistic of independence
di%ided y sample siBe 6total inertia7"
4he eigen%ectors of the non-tri%ial eigen%alues define the coordinates of the factor
pairs" !f the first few eigen%alues are large relati%e to the remaining eigen%alues0 it is
then possile to display the association etween rows and columns in a one or two-
dimensional tale" 4he eigen%alue tale allows us to determine how much
OinformationO is lost y ignoring all dimensions e9cept for the first 6or first and
second7" 4he first two dimensions should account for nearly 100` of the total row
and column association 6i"e"0 they completely e9plain all the association etween the
rows and columns7"
&'ample of Correspondence 4nalysis &igenvalue $ummary
Table
$ummary of Ro" and Column Points
4he correspondence analysis summary of row and column points tale presents
useful insight into the nature of the association etween rows and columns0 and is
)>) 0d,anced 0nalyses StatPac For Windows User's Manual
printed for each analysis" 4his tale pro%ides information on the first two factor pairs
6i"e"0 the first 2 dimensions7 only"
&'ample of $ummary of Ro" and Column Points Table
4he first column 6Coordinate7 gi%es the factor scores for the first dimension" 4hese
are the coordinates that are used to plot the first dimension or a9is" &y definition0
these coordinates are calculated to account for as much of the association in the
contingency tale as possile" $ow and column le%els with coordinates close to Bero
do not account for any of the association e9plained y the first dimensionW they may
howe%er e important in the second dimension or a9is"
4he first correlation 6Corr"7 column gi%es the correlation of each row and column
with the first dimension" # high %alue implies that the particular row 6column7 is
important in descriing the first dimension"
4he first contriution 6Contr"7 column gi%es the row and column contriution to the
association Opic,ed-upO y the first dimension 6e9pressed as a percentage7" # row or
column with a high marginal has a larger contriution than a row or column with a
low marginal" !t is important to note the difference etween the concepts measured
y the Corr. and Contr. columns" Corr. simply measures the correlation of the rows
and columns with the first dimension" !t is therefore useful in defining the first
dimension" Contr.0 on the other hand0 pro%ides a measure of how useful a particular
row or column is in e9plaining the contingency tale association for the first
dimension" # row or column may e highly correlated with the first dimension ut
e9plain %ery little of the association etween rows and columns"
4he Contr" column is useful in locating outliers" When a row or column has a %ery
large asolute contriution and a large coordinate0 it can e considered an outlier and
has a maHor role in determining the first andMor second coordinates" 4hought should
e gi%en to redefining this outlier point as a passi%e 6supplementary7 point and
performing the analysis again without this point0 therey eliminating that pointDs
influence in the creation of the first few a9is" 4he point can e superimposed on the
a9is calculated for the remaining points"
StatPac For Windows User's Manual 0d,anced 0nalyses )>!
4he second column of coordinates gi%es the factor scores for the second dimension"
4hese are the coordinates that are used to plot the second dimension or a9is" &y
definition0 these coordinates are calculated to account for as much of the association
in the contingency tale not accounted for y the first dimension" 4he second Corr"
column gi%es the correlation of each row and column le%el with the second
dimension" # high %alue implies that the particular row 6column7 is important in
descriing the second dimension" 4he second Contr" column is the rowDs 6and
columnDs7 contriution to the association Opic,ed-upO y the second dimension
6e9pressed as a percentage7" !f a row or column has low contriution on oth the first
and second dimension0 this can e due to one or more of the following reasons5
1" 4here is no association etween that row 6column7 and the le%els of columns
6rows7"
2" 4he third 6and higher7 dimensions account for a significant portion of the
association in the contingency tale and cannot e ignored"
3" 4he row or column marginal is small and therefore has only a small effect on the
chi-s;uare statistic"
Carroll:.reen:$affer $caling of Coordinates
4he option CF^J re;uests that the Carroll-Freen-Shaffer scaling of coordinates e
used" !f CF^'0 the usual O8rench schoolO correspondence analysis coordinates are
calculated"
4hese O8rench schoolO coordinates do not allow one to compare distances etween
column and row points ut rather only distance etween column points or etween
row points" Carroll0 Freen and Shaffer claim that their method of scaling of
coordinates allow one to compare oth within and across group 6rowMcolumn7
distances" !f eigen%alues are almost e;ual0 the CFS and O8rench schoolO plots loo,
almost the same0 ut if the first eigen%alue is consideraly greater than the second0
the plots can loo, %ery different"
Plots
4he correspondence analysis plots show the relationship etween a row and all
columns or etween a column and all rows" When using the O8rench schoolO
techni;ue 6CF^'70 distances etween a row and a column point cannot e
interpreted" When using the Carroll-Freen-Schaffer coordinates0 distances etween a
row and a column point can e e9amined"
8our types of maps can e created with the P. option"
#" two-dimension row-column plot
&" one-dimension row-column plot
C" two-dimension row plot
@" two-dimension column plot
8or e9ample0 the following option would create a two-dimension row-column plot0 a
two-dimension row plot0 and a two-dimension column plot"
:P4!:'S P.^#C@
)>* 0d,anced 0nalyses StatPac For Windows User's Manual
4he two-dimension row-column plot will show oth row and column %ariales using
the first two dimensions" !f the first two eigen%alues 6dimensions7 account for a large
portion of the total chi-s;uare0 then this plot pro%ides a useful summary of the
association etween row and column points"
&'ample of a T"o:Dimension Ro":Column %ap
!n general0 the more the row and column points are spread out0 the higher the
association and hence the higher the chi-s;uared statistic" Columns and rows
represented y points in the plot relati%ely far from the origin account for relati%ely
large portions of the lac, of independence in the contingency tale" $ows positioned
close together in the map ha%e similar profiles across the columns" #nalogously0
columns positioned close together in the plot e9hiit similar profiles across the rows"
4he two-dimension row plot is especially useful when there are a lot of row and
column points to plot andMor one wishes to e9amine the distance etween row points
only"
4he two-dimension column plot is especially useful when there are a lot of row and
column points to plot andMor one wishes to e9amine the distance etween column
points only"
4he one-dimension row-column plot is especially useful when the first dimension
e9plains most of the association in the tale" !n this case the %alue of the first
eigen%alue would e close to PearsonDs mean-s;uare contingency coefficient"
StatPac For Windows User's Manual 0d,anced 0nalyses )>-
0d,anced 0nalyses Bi"lio%rahy
4he following iliography is recommended for more detailed information on the
ad%anced analyses module of StatPac for Windows5
Re/ression Analysis
@raper '"$" and <" Smith - #pplied $egression #nalysis0 2nd Ad"0 'ew Jor,0 Iohn
Wiley and Sons0 !nc"0 619(17"
<enderson0 <"?" and P"8" ?elleman0 619(17 - &uilding 1ultiple $egression 1odels
!nteracti%ely" &iometrics0 ?ol" 3)0 pp" 391-311"
Ienrich0 $"!" - Stepwise $egression in Statistical 1ethods for @igital Computers0
edited y Eurt Anstein0 #nthony $alston0 <erert S" Wiff0 619))7"
.ewis0 C"@" - !ndustrial and &usiness 8orecasting 1ethods" &oston0 &uterworth
Scientific0 619(27"
robit and &o/istic Re/ression Analysis
Funderson0 1"0 619)37 - $etention of 4rainees - # Study with @ichotomous
@ependent ?ariales" Iournal of Aconometrics0 ?ol" 20 pp" )9-93"
4oin0 I" - 4he #pplication of 1ulti%ariate Proit #nalysis to Aconomic Sur%ey
@ata" Cowles 8oundation @iscussion Paper 'o" 10 @ecemer 619227"
Wal,er0 S"<" and @uncan0 @"&"0 619-)7 - Astimation of the Proaility of an A%ent as
a 8unction of Se%eral !ndependent ?ariales" &iometri,a0 ?ol" 230 pp" 1-)-1)9"
Principal Components0 8actor and 1ulticollinearity #nalysis
#fifi0 #"#" and #Ben0 S"P" - Statistical #nalysis5 # Computer :riented #pproach"
'ew Jor,0 #cademic Press0 !nc" 619)27"
&elsley0 @"#"0 Euh0 A" and Welsch0 $"A - $egression @iagnostics5 !dentifying
!nfluential @ata and Sources of Collinearity" 'ew Jor,0 Iohn Wiley and Sons0 !nc"
619(07"
<oc,ing0 $"$" and Pendleton0 :"I"0 619(37 - 4he $egression @ilemma"
Communications in Statistics0 ?ol" #120 pp" 39)-22)"
Eim0 Iae-:n and C"W" 1ueller - 8actor #nalysis5 Statistical 1ethods and Practical
!ssues" California0 Sage Pulications0 !nc" 619)(7"
Eramer0 C"J"0 619)(7 - #n :%er%iew of 1ulti%ariate #nalysis" Iournal of @airy
Science0 ?ol" -10 pp" (3(-(23"
?eldman0 @"I" - 8ortran Programming for the &eha%ioral Sciences" 'ew Jor,0 <olt0
$inehart and Winston0 !nc" 619-)7"
(luster Analysis
#ndererg0 1"$"- Cluster #nalysis for #pplications" 'ew Jor,0 #cademic Press
619)37"
)>; 0d,anced 0nalyses StatPac For Windows User's Manual
1illigan0 F"W"0 619(07 - #n A9amination of the Affect of Si9 4ypes of Arror
Perturation on 8ifteen Clustering #lgorithms" Psychometri,a0 ?ol" 320 pp" 322-332"
Pung0 F" and Stewart0 @"W"0 619(37 - Cluster #nalysis in 1ar,eting $esearch5
$e%iew and Suggestions for #pplications" Iournal of 1ar,eting $esearch0 ?ol" 20
61ay70 pp" 133-13("
Spath0 <" - Cluster #nalysis #lgorithms" Chichester0 Angland0 Allis <orwood 619(07"
Analysis of =ariance
Cochran0 W"F" and F"1" Co9 - A9perimental @esigns0 2nd Adition0 Wiley &oo,s0
6192)7"
8inney0 @"I" - A9perimental @esign and its Statistical &asis0 4he >ni%ersity of
Chicago Press0 619227"
Cuenouille0 1"<" - 4he @esign and #nalysis of A9periments0 Charles Friffin and
Co" .td"0 619237"
Snedecor0 F"W" and W" F" Cochran - Statistical 1ethods" Si9th Adition0 4he !owa
State Press0 619-)7"
Steel0 $"F"@" and I"<" 4orrie - Principles and Procedures of Statistics0 1cFraw-<ill
&oo, Company0 !nc"0 619-07"
Winer0 &"I" - Statistical Principles in A9perimental @esign0 1cFraw-<ill &oo,
Company0 !nc"0 619-27"
(anonical (orrelation Analysis
Cooley0 W"W" and .ohnes0 P"$" - 1ulti%ariate @ata #nalysis 6Chapter -7" 'ew Jor,0
Iohn Wiley and Sons 619)17"
Freen0 P"A"0 <alert0 1"<" and $oinson0 P"I"0 619--7 - Canonical #nalysis5 #n
A9position and !llustrati%e #pplication" Iournal of 1ar,eting $esearch0 ?ol" 30 pp"
32-39"
(orrespondance Analysis
Carroll-Freen-Shaffer0 619(-7 - Iournal of 1ar,eting $esearch0 ?ol" 230 pp" 2)1-2(0"
@illion0 William $"0 8rederic,0 @onald F"0 4angpanichdee0 ?anchai 619(27 - # 'ote
on #ccounting for Sources of ?ariation in Perceptual 1aps" Iournal of 1ar,eting
$esearch0 ?ol" 19 6#ugust70 pp" 302-311"
8o90 $ichard I"0 619((7 - Perceptual 1apping >sing the &asic Structure 1atri9
@ecomposition" Iournal of the #cademy of 1ar,eting Science0 ?ol" 1-0 pp" 3)-29"
Freenacre0 1"I"0 - 4heory and #pplications of Correspondance #nalysis" 'ew Jor,0
#cademic Press 619(37"
Freenacre0 1"I" 619(97 - Iournal of 1ar,eting $esearch0 ?ol" 2-0 pp" 32(-3-("
StatPac For Windows User's Manual 0d,anced 0nalyses )>'
Utilities
Utility Pro%ra(s
Se%en utility programs are pro%ided to gi%e greater control and more %ersatility o%er
studies and data files 4hey can e run from the #nalysis0 >tilities menu"
4he !mport and A9port program will allow you to read files created y other
software or write files that can e read y other software" Se%eral formats are
supported5 #ccess0 A9cel0 d&ase0 8o9Pro0 all prior %ersions of StatPac0 all prior
%ersions of StatPac Fold0 .otus0 comma delimited0 ta delimited0 multiple record
files0 !nternet response files0 and plain-te9t e-mail"
4he 1erge program is used to merge %ariales from different studies and data files
or to rearrange the se;uence of %ariales in a file" !t can merge data from up to fi%e
indi%idual data files" !t can also e used to concatenate 6Hoin7 data files using the
same codeoo,"
4he #ggregate program is used to create a true or compositional aggregate study and
data file" #ggregate files are useful for summariBing sugroups of data"
4he Codeoo, program is used to ;uic,ly create a codeoo,0 or to chec, a codeoo,
and data file for errors" 4he Chec, program is used when you suspect that there is a
prolem in the codeoo, or data file" !f a specific procedure wonDt run0 this program
can sometimes pro%ide a solution" # common use of this program is when you are
planning to use a data file created from a source other than StatPac0 and you want to
ma,e sure that your study design matches the data file"
4he Sampling program is used to generate a random numer tale0 create a random
digit dialing tale for telephone studies0 and to select a random sample from a data
file"
4he Compare @ata 8iles program is used to compare two data files for differences" !t
is used to chec, the accuracy of data entry when a doule entry system has een
used"
4he Statistics Calculator is used to calculate distriutions0 proailities and other
statistics from proportions and summary data"
I(ort and +2ort
StatPac can import and e9port information to other software" Select >tilities0 and
then select import or e9port" !mport means you want to con%ert a non-StatPac file
into StatPac for Windows format" A9port means you want to con%ert a StatPac for
Windows file to a different format" When importing or e9porting data0 the original
file6s7 will remain intact and a new file6s7 will e created"
When importing0 select the type of file and name of the file to e imported" !f you are
importing from pre%ious %ersions of StatPac0 it will e assumed that the
codeoo,Mstudy name and the data file name are the same" 4he names for the StatPac
for Windows codeoo, and data may e different"
Aach of the import and e9port file formats is e9plained elow"
StatPac and Prior 8ersions of StatPac Gold
Prior %ersions of StatPac and StatPac Fold used a Ocodeoo,O file or Ostudy designO
files to store %ariale format and laels information" StatPac for Windows stores all
)1& Inde2 StatPac For Windows User's Manual
this information in a codeoo, file" &ecause older %ersions of StatPac ha%e limited
laeling space0 some laels may e truncated when e9porting to an older %ersion of
StatPac"
4he import program assumes that the data file name is the same as the study file
name for the pre%ious %ersion" 4hus0 the O'ame of the 8ile to !mportO will indirectly
also specify the data file name" 8or e9ample0 if the file to import is S>$?AJ"AL00
the program will try to import a data file called S>$?AJ"@#4 from the same folder"
!f the data file does not e9ist0 only the codeoo, will e imported" StatPac for
Windows stores data in the same format as prior %ersions of StatPac 6fi9ed format
se;uential #SC!!7" 4herefore0 if there is not a matching data file name0 you can
simply copy the old data file to the folder where you imported the codeoo, and use
it without modification"
0ccessC +2celC Parado2C dBaseC and .otus
StatPac can import or e9port to a %ariety common data aseMwor,sheet formats" 4he
appropriate e9tension will e used when you select the type of data ase to e
imported or e9ported" When importing to StatPac0 the import procedure will create a
new StatPac codeoo, and data file" @o not create a StatPac codeoo, efore doing
the import or it will e o%erwritten y the import procedure"
When importing from .otus to StatPac0 the default %ariale names are the wor,sheet
column letters 6e"g" Column #0 Column &0 etc"7" !f your wor,sheet contains loc,ed
column headings0 they will e used as %ariale names for those columns" 4he column
headings may e loc,ed in .otus y using the MWor,sheet 4itles <oriBontal
command" !f the column titles are not loc,ed0 they will e written as the first record
in the StatPac data file 6an undesirale situation7" #lso0 e sure your wor,sheet does
not contain any empty rows or di%iding lines etween the titles and the first row of
data"
$IF Files
@!8 files were originally de%eloped to pro%ide a uni%ersal method of transferring
data files from one program to another" >nfortunately0 many program de%elopers
decided to add their own special features to the @!8 file" 4he result was that that
Ouni%ersalO compatiility of @!8 files ecame marginal"
Co((a $eli(ited and :a" $eli(ited Files
StatPac can import and e9port comma and ta delimited files" 4here are many
software pac,ages that can interchange data in this format" # comma delimited file is
a se;uential #SC!! file where the %ariales are separated from each other y commas
6rather than each %ariale using a fi9ed numer of characters7" !n a ta delimited file0
the separator is a ta character" 4a delimited imports and e9ports are generally more
reliale than comma delimited files"
When importing0 StatPac creates a new codeoo, ased on the field widths re;uired
to hold the data" !f a codeoo, already e9ists0 you may use it instead of creating a
new codeoo," !f a data file already e9ists0 youDll e offered the option of appending
to the e9isting data file or deleting it" Selecting append will add the newly imported
data to the end of the e9isting data file"
1any software pac,ages write ;uotation mar,s around alpha fields0 while others do
not" When importing a comma delimited file0 all ;uotation mar,s will automatically
e eliminated0 since StatPac does not use ;uotes" When e9porting to a comma
delimited file0 any field containing a comma will always e enclosed in ;uotes" 4he
StatPac For Windows User's Manual Utilities )11
StatPac"ini file contains a setting #uote6lpa@ields" When #uote6lpa@ields410 all
alpha fields will e ;uoted when e9porting to comma delimited" When set to Bero0
only fields containing a comma will e enclosed in ;uotes"
1any software pac,ages can read or write a header record in comma and ta
delimited files" # header record is usually the first record in the data file" !t contains
the names of the %ariales instead of actual data" !f you are importing a comma or ta
delimited file and donDt ,now if there is a header record0 load the file into your word
processor and loo, at it" !t the first line in the file is the names of the %ariales0 there
is a header record" !f the first record loo,s Hust li,e the other records0 itDs data0 and
not a header record"
When e9porting to a ta or comma delimited file0 StatPac will gi%e the option to
con%ert the raw data to the %alue laels" 8or e9ample" if the first %ariale were
gender and coded 1^1ale and 2^8emale0 a normal e9port would write a 1 or 2 for
the %ariale" !f the Hxpand ,o ,ext option is selected0 it would write 1ale or 8emale
to each data record instead of the raw data"
When e9porting to a ta or comma delimited file 6or A9cel70 with the intention of
eing ale to import the file into SPSS0 StatPac will gi%e the option to also create a
SPSS synta9 file" 4his file is a te9t file with the same name as the e9ported file
e9cept it will ha%e a "sps e9tension" !n SPSS0 first import the data" 4hen load the "sps
file into 'otepad or another te9t editor" Copy the contents of the file into the SPSS
synta9 editor and clic, play" 4his will create the %ariale and %alue laels in SPSS"
When using this feature0 StatPac may modify 6are%iate7 the %ariale names0 laels
and %alue laels in order to fit the limited space offered y SPSS"
4he ta delimited import utility can e used to import a te9t file for ?eratim &laster
open-ended response coding" 8or e9ample0 you might ha%e used 1icrosoft Word to
enter %eratim comments into a "t9t file" Aach personDs comments were entered as a
paragraph 6i"e"0 a continuous string of te9t ending with a carriage return7" 4his file
can e imported as a ta delimited file" Since there are actually no tas in the file0
StatPac will correctly import the te9t into a codeoo, and data file containing a
single %ariale" 4he %ariale will e an alpha type and will e as long as necessary to
hold the open-ended comments"
A9ported ta delimited files may use a "t9t or "ts% 6ta separated %ariales7 e9tension"
A9ported comma delimited files may use a "t9t or "cs% 6comma separated %ariales7
e9tensions
When e9porting to a ta or comma delimited file0 ,eep in mind that many programs
6A9cel0 #ccess0 etc"7 limit the numer of columns to 222 6while StatPac can ha%e as
many as 200007" !f your codeoo, has more than 222 %ariales0 an e9port to an
#ccess file is preferred ecause it will split the data into multiple tales as necessary"
:therwise0 youNll ha%e to use the Write command to create a series of codeoo,s and
data files 6each containing 222 or fewer %ariales7 and then e9port each one
indi%idually to a delimited file"
Files Containin% Multile $ata Records er Case
1any researchers want to use data that is in card-image format on a mainframe
computer" #lso0 many data entry ser%ices are capale of only punching data in card-
image format" While it is relati%ely easy to download data from a mainframe0 it often
comes in (0-column format" !f there is only one record per case0 this data can e read
y StatPac without performing an import" <owe%er0 when there is more than one
Ocard imageO 6i"e"0 record7 per case0 it ecomes necessary to concatenate 6Hoin7 the
Ocard-imageO records together to produce a StatPac readale file"
)1) Inde2 StatPac For Windows User's Manual
!mporting a multiple record file that loo,s li,e this"""
Card 1 Case 1
Card 2 Case 1
Card 3 Case 1
Card 1 Case 2
Card 2 Case 2
Card 3 Case 2
etc"
will ecome a StatPac file that loo,s li,e this"""
Card 1 Case 1 Card 2 Case 1 Card 3 Case 1
Card 1 Case 2 Card 2 Case 2 Card 3 Case 2
etc"
StatPac re;uires that a data record e a continuous stream of characters terminated
with a carriage return and linefeed" 4his program will read a file in multiple record
format and create a new data file with one record per case" 4he filename should ha%e
a "t9t e9tension"
StatPac assumes that there are (0 characters in each record of the multiple record
file" !f the Ocard-imageO record length is less than (00 StatPac will pad the records
with spaces efore comining them
Jou will need to specify how many records there are for each case" !f the
downloaded data file has 3 records per case0 you will answer 3 6e%en if the third
Ocard-imageO record is only partially used7"
Internet Files
4he preferred method of performing !nternet sur%eys is to store the responses in a
file on the ser%er" When using the method0 responses are stored in #SC!! 6"asc7 te9t
format" When youDre ready to perform an analysis0 download the file to your local
computer using an 84P program or #uto 4ransfer" !f you use a different 84P
program0 e sure to set it to downloaded the file as an #SC!! 6not inary7 file"
!f you use #uto 4ransfer0 the downloaded file will automatically e imported into
StatPac" !f you manually download the file0 you will need to use this import utility to
con%ert the "asc file to StatPac data"
@ownloaded !nternet response files are not automatically deleted from your ser%er"
4herefore0 each time you download the responses0 it will e the entire set of
responses since the eginning of the sur%ey" StatPac will offer you the choice of
deleting the e9isting data file or appending to the end of it" Since the downloaded file
is usually the entire data set0 you would normally want to replace the e9isting data
file with the newly downloaded data"
+(ail Sur,eys
&ecause of the %ariety of Amail programs0 it is not possile to descrie the e9act
steps you must ta,e to import a returned Amail sur%ey" Aach Amail program operates
a little differently0 and you will need to e9periment with your program"
StatPac pro%ides import capailities for CF! and plain te9t Amail sur%eys" CF!
Amail would e produced y a sur%ey placed on a we site that used StatPacDs email
StatPac For Windows User's Manual Utilities )1!
method of capturing responses" # plain-te9t sur%ey would e produced y a sur%ey
that was simply part of the te9t in the ody of an Amail"
Select e-mail as the import type and use the rowse utton to select the file to e
imported" >sually0 this would e a "m9 file 6i"e"0 a mailo9 in :utloo, A9press or
Audora where the e-mails were filtered to" >se the rowse utton to select the
e9isting StatPac codeoo, and specify the name of the data file" !f the data file does
not e9ist0 it will e created y the import procedure" !f it does e9ist0 the new data will
e appended to the end of the e9isting data file" 8inally0 select 4e9t as the Amail type
and clic, :E" StatPac will ad%ise you if any errors were encountered during the
import" !f so0 the notepad will appear on the menu ar" Clic, 'otepad on your menu
ar to see a description of the errors"
$etting Defaults for te &mail Import
#n e-mail consist of two parts" 4he first part is the e-mail header and the second part
is the contents 6or ody7 of the e-mail" 4he header contains many lines that are often
hidden y e-mail readers0 ut can e seen y loading an e-mail into the notepad"
StatPac must e ale to properly identify where the header starts and stops in order to
,now where the e-mail ody egins" 4he settings in the StatPac"ini file may e
adHusted to e compatile with your e-mail reader or language"
4he StartAmail<eader and AndAmail<eader settings should e set to the te9t that
egins and ends the header section" 4he StartAmail<eader parameter should e the
te9t that egins the header section0 and the AndAmail<eader parameter should e set
to the last Amail header line" !f you are manually copying and pasting incoming e-
mails to mailo9 file0 it may e important to change these settings" 4he default
%alues for these parameters are5
StartAmail<eader ^ $eturn-Path5
AndAmail<eader ^ *->!@.5
:ther e-mail parameters may also e set in the StatPac"ini file" StartAmail8ield and
AndAmail8ield can e used to change the rac,ets from U and V to other characters"
4he AmailPrefi9 parameter tells StatPac what line contains the nameMe-mail address
of the respondent" 4he Amail?ar'ame is the name of the StatPac codeoo, %ariale
that will automatically capture the respondentDs e-mail address in a plain-te9t e-mail0
and the Amail@ate8ield parameter is used to get the date of the e-mail in order to
more precisely report which e-mails contained errors" &y modifying these
parameters0 StatPac can e made to wor, with any e-mail reader or language"
Mer%in% $ata Files
4here are two asic ways that data files can e merged" 4he first is called
concatenation0 and it is used to merge two or more data files that contain the same
%ariales in the same order" 4he second type of merge lets you Hoin data containing
different %ariales" Select >tilities0 1erge0 and then the type of merge you want to
perform"
)1* Inde2 StatPac For Windows User's Manual
Concatenate $ata Files
1any times0 se%eral data entry operators will simultaneously enter data into a data
file on their own machines" When all the data files ha%e een entered0 they can e
merged into one large file y concatenating 6Hoining7 the data files"
8or e9ample0 letDs say you ha%e three months of data in three separate files
6I#'"@#40 8A&"@#4 and 1#$"@#47" 4he following @:S command would create
a new file called C>#$4A$1"@#4 which contained all three months of data" Jou
could then run your analysis on all the data for the first ;uarter"
4he concatenation-style merge assumes that the codeoo,6s7 for all the data files are
e9actly the same" 4he 1erge program will let you concatenate any numer of data
files into a new 6larger7 data file" Jou can type the data file names or use the rowse
utton to select data files" :nly one data file name should appear per line"
@o not confuse concatenating files with the 1A$FA utility program" !f all your data
files reference identical study information 6contain the same %ariales in the same
order70 use concatenation to merge your data into one file" !f your data files0
howe%er0 contain different %ariales0 use the 1A$FA utility program"
StatPac For Windows User's Manual Utilities )1-
Mer%e 8aria"les and $ata
4he merge program allows you to e9tract selected %ariales from up to fi%e studies
and create an entirely new study that will e sa%ed on dis," !f data files ha%e already
een entered for any of the studies0 they can also e restructured to match the new
study format"
@o not confuse the function of this program with data file concatenation" !f two data
files ha%e identical formats 6i"e"0 they contain the same %ariales in the same order70
the data files should e merged with the concatenation program"
4he restructure and merge program can e used to reorganiBe a single study 6and
data file7 or to comine se%eral studies 6and their associated data files7" !t allows
complete %ersatility with regard to which %ariales are selected from each of the
studies and the order of the %ariales"
4he program will as, for the name6s7 of the codeoo,s0 data files0 and common
%ariales that will e utiliBed" 8or each specified codeoo,0 also enter the name of
the associated data file 6if one e9ists7" !f no data file is specified for a particular
study0 the program will use lan,s for all %ariales re;uested from that study"
#lso select the common %ariale in each of the studies" 4his refers to a %ariale that
can e used to match up the records from each data file 6e"g"0 OC#SA !@O7" !f there is
not a common %ariale0 it is imperati%e that the data files contain the same numer of
records and in the same order" 4hat is0 record one from data file one should represent
the same respondent 6case7 as record one from data file two"
!f a data record is missing in any of the data files0 it could cause data from one file to
e matched with the wrong data from another file" 4herefore0 it is always a good idea
to ha%e a common %ariale in each of the data files 6and associated study
information7 that represents a uni;ue case identification numer" All data files must
be sorted by this variable before runnin/ this pro/ram" !f one of the data files is
missing a particular record0 lan,s will e merged into the output file"
Clic, :E to continue" 4he study numers and names will e displayed0 and the
program will re;uest the format for the new study" 4he format statement defines the
structure of the new codeoo,"
)1; Inde2 StatPac For Windows User's Manual
4he general format for creating a new file structure is5
6[Study numer\7 [?ariales\ or [?ariale range\
#n e9ample of a format statement is5
617 1-30(03 637 2-) 627 9 13 617 12
4his statement indicates that the new study format should contain %ariales in the
following order5
8rom study 1 - %ariales 10 20 30 ( and 3
8rom study 3 - %ariales 20 30 30 20 - and )
8rom study 2 - %ariales 9 and 13
8rom study 1 - %ariale 12
'otice that the study numer is enclosed in parentheses with no spaces" !ndi%idual
%ariales may e separated y either commas or spaces" # range of %ariales is
specified y a dash 6minus sign7 with no spaces on either side of the dash" !f the
format statement re;uires more than one line0 Hust continue typing and word-wrap
will correctly rea, the line
?ariales may e specified in any order" 4he study numers will e displayed at the
top of the screen and are assigned y the computer simply for con%enience when
specifying the new study format" 4he indi%idual %ariale numers for each codeoo,
can e determined y e9amining the ?ariale 'ames windows
4he new study format will e chec,ed for %alidity efore processing egins" !f errors
are found0 you will e as,ed to re-enter the format" 4he new study and data file 6if
specified7 will e written"
StatPac For Windows User's Manual Utilities )1'
0%%re%ate
4he aggregate utility program creates a new study and data file that consist of
aggregate statistics for sugroups of the original data" #ny descripti%e statistic may
e included in the aggregate files" 4he program allows the creation of oth
compositional and true aggregate files"
8or e9ample0 letDs say weD%e distriuted a ;uestionnaire to 200 people in each of 20
communities" #fter performing some preliminary analyses0 we want to compare the
communities on a numer of the inter%al or ratio-type ;uestions" We could0 of
course0 use the !8-4<A' SA.AC4 and W$!4A commands to create sufiles for each
of the communities and then perform descripti%e statistics analyses on each of the
sufiles" :%iously0 this would e a %ery time consuming procedure" 4he aggregate
utility program pro%ides a much more efficient way to deri%e this information"
&y using the aggregate program0 we could create a new codeoo, and data file that
Hust contain the descripti%e statistics we desire" Aach record in the new aggregate file
would represent one community" 4he record would contain the descripti%e statistics
for the community as a whole 6and not the raw data from the original file7" Since
there are 20 communities0 the aggregate file would contain 20 records" 4his type of
aggregate file is called a true aggregate file" !t is made up of Hust the aggregate
statistics and does not contain the original data collected" #fter creating a true
aggregate file0 the .!S4 command could e used to print a summary of the
descripti%e statistic for the communities"
4he other type of aggregate file is referred to as a compositional file" >sing the same
e9ample as ao%e0 letDs say we want to compare each case in our original file to the
descripti%e statistic for the community" 8or e9ample0 we might want to compare the
indi%idualDs age with the mean age in that personDs community" !n other words0 we
want each record in the aggregate data file to contain oth the original raw data and
the descripti%e statistic for the community as a whole" 4he numer of records in the
compositional aggregate file will contain the same numer of records as the original
raw data file" <owe%er0 the aggregate file will contain more %ariales 6the original
%ariales plus the aggregate statistics7"
When creating either a true or compositional aggregate file0 a new study information
file will also e automatically created to match the new aggregate data file"
'efore runnin/ the a//re/ate pro/ram% the data file must be sorted by the
variable that contains the /roup code. 8or e9ample0 if you plan to create an
aggregate file y community0 the data file must e sorted y community efore
running the aggregate utility program" 4he sort order is not important0 howe%er0 it is
important that all cases from the same community fall together in the file" 4he
aggregate program will accommodate a minimum of 1000 indi%idual groups"
4o sort the file0 you might use the following procedure5
S4>@J F:?4
S:$4 6#7 C:11>'!4J
S#?A
""
4hen run the #ggregate program" !t will as, for the codeoo, name0 data file and the
%ariale containing the group code" 4his refers to the codeoo, and data file that
already e9ist 6not the new aggregate files7" 4he %ariale containing the group code is
the same %ariale that was used to sort the data file efore running this program" !n
)&> Inde2 StatPac For Windows User's Manual
this e9ample0 it is the OcommunityO %ariale" Jou must also select the type of
aggregate file to e created0 either compositional or true"
Clic, :E to continue" 'ow you can select the %ariale6s7 for which you want to
calculate aggregate statistics" Select the desired %ariale" 4hen clic, on the statistics
you want for that %ariale" Aach time you clic, on a statistic0 an aggregate statement
will e created in the #ggregate Statement window" Aach aggregate statement will
create one new aggregate %ariale"
StatPac For Windows User's Manual Utilities )&1
When performing a compositional aggregate procedure0 the new aggregate %ariales
will e added to the end of each data record" !f the study and data file contain 10
%ariales0 and you type two aggregate statements0 the new aggregate %ariales would
e added as %ariales 11 and 12"
When performing a true aggregate procedure0 the first %ariale in the aggregate file
will always e the group code 6that is0 the %ariale used to determine the groups7"
Aach aggregate statement will produce a statistic that is added as the ne9t %ariale in
the file" 4he first aggregate statement would create %ariale two0 the ne9t %ariale
three0 and so forth"
#ggregate statistics can only e calculated for numeric-type %ariales" 4here is one
e9ception to this rule5 !f the %ariale used to split the data file into groups is alpha0
you may still calculate the numer of %alid cases" !n our e9ample0 if community were
coded alpha0 it would e acceptale to as, for the numer of %alid cases 6statistic 1)7
for this %ariale"
Aach aggregate statement you enter will create a new %ariale in the aggregate file"
#fter entering all the aggregate statements0 clic, :E" # new codeoo, will e
created" 4he new %ariale laels in this study will include oth the original laels and
the types of statistics" #fter the new study has een created0 the program will
perform all the aggregate calculations and write the new data file"
&ecause many calculations are in%ol%ed in creating an aggregate file0 the program
may ta,e some time to finish" !t will display a message informing you of successful
completion"
!f any statistic cannot e calculated0 or if there are an insufficient numer of columns
to hold the aggregate statistic0 the output file will contain spaces for that %ariale"
8or e9ample0 if you re;uested the mode0 and the group was multi-modal0 the
aggregate statistic would e stored as lan,s"
)&& Inde2 StatPac For Windows User's Manual
Code"oo#
4here are two utility programs for codeoo,s" 4he Cuic, Codeoo, Creation utility
creates an entire codeoo, using a single 8:$4$#'-li,e statement" 4he Chec,
Codeoo, = @ata utility is used to %erify the integrity of the codeoo, and to fi9
errors in the file"
@uic# Code"oo# Creation
4he fastest way to create a codeoo, is to use the Cuic, Codeoo, Creation
program" <owe%er0 this will create a OareonesO codeoo, consisting of only the
format for each %ariale" !n most cases0 youNll want to use the Frid or ?ariale @etail
window to create a new codeoo,"
Select #nalysis0 >tilities0 Codeoo,0 Cuic, Codeoo, Creation" Jou will need to
enter a file name for the new codeoo, and a !ormat statement" 4his is essentially a
data definition statement and is similar to a 8:$4$#' style format statement"
4he 8ormat Statement defines the numer and type of %ariales that will e in the
new study" It is the combination of all the individual variable formats. >sing the
format statement can sa%e considerale time if %ariale and %alue laels are not
re;uired0 or if you plan to use a fi9ed format data file from another source"
4he synta9 for each component of a format statement is5
['o" of ?ars"\ [?ar" 4ype\ ['o" of Cols\ " [@ecimals\
<No. of Vars.> is the numer of consecuti%e %ariales that use the format defined y
the ne9t three parameters" !f this component of the format statement is omitted0 the
default is one"
<Var. Type> is always # or ' and refers to whether the %ariale6s7 are alpha or
numeric" StatPac automatically left Hustifies alpha %ariales and right Hustifies
numeric %ariales"
<No. of Cols> is the field width allocated for the %ariales6s7" 4his is the total field
width for the %ariale6s7 and it must e large enough to hold a plus or minus sign and
a decimal point if necessary"
StatPac For Windows User's Manual Utilities )&1
. <Decimals> is the numer of significant decimal places that the %ariale6s7 will
contain" 4his component of the format statement is optional and may e omitted" !f
8decimals9 is not specified0 the data will e stored e9actly as entered 6with or
without a decimal point7"
&'amples of Format $tatements
1'2 creates 1 numeric %ariale using 2 columns
'2 creates 1 numeric %ariale using 2 columns
12'3 creates 12 numeric %ariales each using 3
columns
'2"2 creates 1 numeric %ariale using 2 columns
the format of the %ariale will e //"//
)'2"0 creates ) numeric %ariales each using 2
columnsW the format of the %ariales will e
// 6always rounded to an integer7
#1 creates 1 alpha %ariale using 1 column
2#32 creates 2 alpha %ariales each using 32
columns
2'3 2#1 3')"2 creates a study with 10 %ariales"
1-2 are numeric each using 3 columns0
--) are alpha using 1 column each0
(-10 are numeric using ) columns each
with 2 significant decimal places
Chec# Code"oo# and $ata
4his utility program will %erify the integrity of a codeoo, and data file" !f errors are
found the program will attempt to fi9 them" !f you ha%e created a codeoo, to match
a foreign data file 6one created y a program other than StatPac70 use this program to
ma,e sure that the data record lengths match the codeoo, you created"
Select the codeoo, and data file to e chec,ed and clic, :E" !f the program
corrects any errors0 they will e listed in the notepad"
)&) Inde2 StatPac For Windows User's Manual
Sa(lin%
4he Sampling program is used to generate a random numer tale0 create a random
digit dialing tale for telephone studies0 and to select a random sample from a data
file"
Rando( 7u("er :a"le
When planning to conduct a sur%ey0 choosing the sample is Hust as important as the
sur%ey itself" !f the sample is incorrectly chosen0 any results are li,ely to e distorted"
4hat is0 the characteristics of the sample will not represent the characteristics of the
population"
:ne of the est ways to choose a sample is to use a random sampling techni;ue" !f
the sample is randomly chosen from the population0 it will represent the population"
4hat is0 characteristics of the sample are li,ely to e found in similar proportions in
the population"
4he classical method of selecting the sample is to gi%e each case in the population a
numer and then randomly select numers until the sample siBe is achie%ed" 4he
second function of this program is to print a random numer tale"
StatPac For Windows User's Manual Utilities )&!
Jou should first select whether the numers should e selected with or without
replacement" When replacement is used0 a numer may e selected more than once
6selection does not eliminate it from eing a%ailale for future selection7" When
random numers are selected without replacement0 the selection of a numer
eliminates it from the pool of a%ailale numers" 4he algorithm used for selection
without replacement will display the random numers in se;uential order"
Anter the numer of random numers you want to e printed" 4his relates to the
sample siBe determined with the Statistics Calculator" &e sure to add a sufficient
numer to the ideal sample siBe to accommodate a pilot test and replacement of
nonresponders 6if part of your study design7"
Anter the smallest allowale random numer and the largest allowale random
numers" 4ypically0 the lowest %alue would e one and the highest %alue would e
e;ual to the numer of cases in the population"
Anter the name of the StatPac codeoo, and data file to store the random numers
and clic, :E" # StatPac codeoo, and data file will e created that contains one
%ariale called O$#'@:1O" 8inally0 the random numers will e displayed in a
compressed format in the 'otepad" Jou do not need to sa%e them with 'otepad since
they are already stored in a StatPac data file"
Rando( $i%it $ialin% :a"le
4elephone sur%eys sometimes use random digit dialing to secure the sample" While
this method will result in many non-wor,ing or non-%oice numers0 it will produce a
random sample of people who ha%e telephones" Since local prefi9 codes are set 6i"e"0
predefined y the phone company70 only the last four digits of a phone numer can
)&* Inde2 StatPac For Windows User's Manual
e randomly selected" 4he random numer method of creating a telephone file
allows you to specify a series of local prefi9 codes and the numer of random
telephone numers you want created for each prefi9 code"
4here is an important consideration to ,eep in mind when creating a random digit
file" 1any of the random numers will not e useful" 8or e9ample0 a numer may
e non-e9istent0 a usiness office0 or a fa9 or computer line" 4here are se%eral
algorithms for ma9imiBing the numer of home phone numers0 howe%er0 these
techni;ues ha%e generally produced poor results and are not included in StatPac"
4herefore0 it is usually a good idea to select more phone numers than you actually
need"
4he random numer utility program allows you to specify any numer of prefi9es
and to specify how many numers you want from each prefi9" 8or local sur%eys0 the
prefi9 will e three digits 6the local e9change7W for long distance sur%eys0 the prefi9
will e se%en digits 6i"e"0 1 ] three digits for the area code ] three digits for the local
e9change7"
!n the .ocal A9change e9amples on the screen display0 20 numers would e created
with a 929 prefi9 and 32 numers would e created with a 9() prefi9" 8or the .ong
@istance e9amples0 22 numers would e created that egin with 1--12-922 and 20
numers would e created that egin with 1-(0)-92)"
#fter you ha%e finished typing the prefi9es and ;uantities0 clic, :E to create the
phone numer file" # StatPac codeoo, and data file will e created that contains one
%ariale O4A.AP<:'AX'>1&A$O" 8inally0 the random numers will e displayed
StatPac For Windows User's Manual Utilities )&-
in a compressed format in the 'otepad" Jou do not need to sa%e them with 'otepad
since they are already stored in a StatPac data file"
4he actual techni;ue used to create the file is called random numer selection
without replacement" 4his means that as a phone numer is selected0 it will e
eliminated from the pool of a%ailale numers for the ne9t selection" 4his eliminates
the possiility of selecting the same numer 6with the same prefi97 twice"
@epending on the numer of prefi9es and the ;uantities from each prefi90 the actual
creation of the file may ta,e a little while" Please e patientW the program will inform
you when the sample selection has een completed"
Select Rando( Records fro( $ata File
With this utility0 you can select a specified numer of random records from a data
file and write them to a new data file" !f you ha%e a %ery large data ase and a long
procedure file0 you might use this utility to create a shorter data file0 and perform a
test run of the procedure file on it"
Anter for the name of the e9isting data file0 the new data file0 and the numer of
records to e selected and written to the new data file"
Jou can also create a data file of the reHected 6not selected7 records" 4he file name
for the reHected data records will e the same as the selected records file e9cept that it
will ha%e a O-$eHectedO suffi9 at the end of the file name"
4o e%o,e this feature0 you need to change a setting in the System @efaults 8ile"
Select 8ile\:pen\System @efaults 8ile" Select Adit\8ind and search for5
Create$eHected8ile ^ 0
Change it to5
Create$eHected8ile ^ 1
Clic, the Sa%e !con 6dis,ette7" Select 8ile\Close
4he reHected records file will then e created along with the selected records file"
)&; Inde2 StatPac For Windows User's Manual
Create 8aria"le for Wei%htin%
4his utility will create a weighting %ariale that can e used with the W4 option in
order to adHust the data to conform to ,nown population parameters" >p to ten
%ariales may e weighted simultaneously" 4he mathematical techni;ue is ,nown y
se%eral names5 rim weigting0 iterative proportional !itting0 biproportional !itting0
matrix raking0 and matrix scaling" #ll refer to the same general process of creating
weights that adHust the data so selected demographic %ariales conform to actual
,nown %alues in the population"
#fter conducting a sur%ey0 you might perform a fre;uency analysis of the gender
%ariale and find that your sample isnNt e9actly the same as the gender distriution in
the population" 4here may e numerous reasons for the difference0 ut any analyses
you perform will reflect the sampling error"
8irst try to understand the reason your sample is different from the population" 4he
difference may simply e attriutale to sampling error or it may e ecause of some
hidden error in your sampling techni;ue" #fter that0 you can use this utility to create
a set of weights that will compensate for the error in sampling" :ne or more
%ariales may e adHusted"
4his utility will create a new weighting %ariale and add it to the codeoo, and data
file so that it can e referenced with the W4 option in your procedures"
When there is only one demographic %ariale that needs to e adHusted0 weights are
easily calculated y hand as the desired percent di%ided y the oser%ed percent"
<owe%er0 when more than one demographic %ariale needs adHustment 6and they are
done se;uentially70 suse;uent weighting adHustments will modify pre%ious
adHustments and itNs nearly impossile to ma,e your sample match the population"
$im weighting lets you ma,e all the adHustments simultaneously so the end result
will e an adHusted sample that e9actly reflects the ,nown population parameters"
4o use this utility0 you only need to ,now the population parameters for the %ariales
you will e weighting" 4hat is0 the percent in the population for each response
category 6%alue lael7"
When you start the utility program0 you will e as,ed to select the codeoo,0 data
file0 and the %ariales you will use for weighting" >se the rowse utton to select the
codeoo, and the name of the data file will e filled in automatically" Jou can select
one or more weighting %ariales" <old the control ,ey to ma,e multiple selections if
you want to weight y more than one %ariale"
StatPac For Windows User's Manual Utilities )&'

#fter clic,ing :E0 StatPac will read the data and calculate the oser%ed fre;uency
for each %alue lael of the selected %ariale6s7" 4hese will e shown in parentheses
adHacent to the %alue lael" Jou can then enter the desired fre;uency 6percent7 for
each of the %alue laels" 4he desired fre;uency is the population parameter" Anter a
Q@AS!$A@ `R for each %alue lael" #fter weighting0 a fre;uency analysis with the
W4 option will show the desired percents instead of the oser%ed percents and all
other %ariales will e adHusted accordingly"
)1> Inde2 StatPac For Windows User's Manual
4his procedure will create a weighting %ariale and add it to the end of the codeoo,
and data file" Jou can gi%e the new weighting %ariale any name you want" 4he
default name is Case)eigt" !f the %ariale already e9ists in the codeoo, and data0
it will e replaced with the new %alues calculated y this utility program" !f it doesnNt
e9ist0 it will ecome the last %ariale in the study"
8or any gi%en %ariale0 the desired percents you enter must sum to e9actly 100
percent" 1issing data will e assigned a weight of Bero" 4his means that if any of the
weighting %ariales contain missing data0 the weighted sample siBe will e reduced
y the numer of missing cases" $espondents often refuse to answer some
demographic ;uestions" !f you ,now the incidence in the population that refuses0 you
can add a %alue lael to the codeoo, [lan,\^$efused for that %ariale" !f you
donNt ,now0 then you ha%e to accept the reduced sample siBe"
When you clic, the Calculate utton0 StatPac will calculate %alues for the weighting
%ariale and add them to the codeoo, and data file" 4o use the weighting %ariale0
you can either add the W4^6CaseWeight7 option to each procedure" !f youNre
running a series of procedures as a atch0 you can add W4^6CaseWeight7_ 6with the
e9clamation point7 to Hust the first procedure eing run and the W4 option will e
applied to all the procedures in the atch"
# word of caution" Weighting with the W4 option counts respondentsN answers ased
on their weight" Someody with a weight of 2 will ha%e twice the influence on the
StatPac For Windows User's Manual Utilities )11
results as a person with a weight of 1" !f your sample is mar,edly different from the
population0 weighting may introduce undesirale errors into the results y down-
playing the influence of some respondents and up-playing others" &e careful"
Co(are $ata Files
1any data entry operators use a doule entry method of data %erification" @ata is
entered into one data file and the same data is re-entered into another data file" 4he
two data files are then compared for differences"
4he purpose of this utility program is to identify possile errors in the dataW it does
not ha%e any editing features"
Anter the name of the StatPac codeoo, and the names of the two data files to e
compared" 4he data files should contain the same numer of records in the same
order"
>pon completion0 the total numer of errors will e reported" !f differences are
found0 the record numers and which %ariales are different will e shown in the
'otepad" >se the notepad to print the errors listing
Con,ersions
StatPac supports only two data types0 alpha and numeric" 4his can ma,e it difficult to
wor, with dates and currency %ariales" 4hese utilities simplify the tas, of wor,ing
with date and currency %ariales"
4he con%ersion utilities read an e9isting codeoo, and data file0 and create a new
codeoo, and data file with a new con%erted %ariale" 4he original date or currency
%ariale is not modified and will remain Qas isR in the codeoo, and data" !nstead0 a
new %ariale 6the con%erted field7 is created and added to the end of the codeoo,
and data"
)1& Inde2 StatPac For Windows User's Manual
$ate Con,ersions
4he most common functions with dates are sorting and selecting" 4ypically0 a user
would create an alpha %ariale for a date %ariale ecause it contains non-numeric
characters such as slashes or dashes" $egardless of the format0 sorting y date or
selecting the records etween two dates can e difficult unless the date can e readily
con%erted to a numeric eight-column 6'(7 %ariale in the format JJJJ11@@"
4he first function will ta,e one or more date %ariales in any format and create new
'( %ariale6s7 in JJJJ11@@ format" 4he new '( %ariale6s7 can e used with
the Sort command to sort a file y date" !t can also e used with the Select command
to select a range of dates"
4he second function will calculate the numer of days etween two dates" 4he two
dates can e any date format and the new %ariale 6numer of days7 will e an '2
format" 4he asolute %alue of the difference etween the two dates will e calculated
and added to the end of the new codeoo, and data file"
4he third function will create an Anglish te9t %ersion of a date in Q@ 1on0 JJJJR
format 6e"g"0 2 :ct 20027" 4he purpose is to ma,e it possile for the user to
suse;uently use the .ist command to create an easily readale listing of the data"
StatPac For Windows User's Manual Utilities )11
Currency Con,ersion
4he currency con%ersion utility is useful for adding or remo%ing the Z or e symols0
interpreting a E or 1 suffi90 and remo%ing commas from currency fields"
When conducting internet sur%eys 6where the respondent is entering their own
response7 currency fields can create prolems" Jou can re;uire numeric input ut
that is often frustrating for respondents who want to enter something li,e 20E or
101 or Z220000" !f you elie%e respondents will want to enter anything other than a
numer0 you can specify the field as alpha in the codeoo, 6which will accept any
input from the respondent7" #fter the sur%ey is closed0 use this utility to con%ert the
data to a numeric field"
4he CurrencySymol setting in the defaults 6StatPac"ini7 file can e set to your
countryNs currency symol" When con%erting the alpha field to a numer0 commas
will e remo%ed0 the letter E will multiple the %alue times a thousand0 and the letter
1 will multiple the %alue times a million"
$ichoto(ous Multile Resonse Con,ersion
4he dichotomous multiple response con%ersion utility is useful when you ha%e
imported data from an e9ternal source that coded multiple response %ariales in a
dichotomous format"
)1) Inde2 StatPac For Windows User's Manual
8or e9ample0 data in the e9ternal file might e coded as ones and lan,s0 where a
one means the respondent selected the attriute and lan, means they didnDt"
#ssume the ;uestion was +)at are your !avorite colors(+ !mported data might loo,
li,e this5

?1 ?2 ?3 ?3
$espondent :range &lue Jellow $ed
1 1 1
2 1 1
3 1 1

#fter importing0 you could write a procedure to con%ert the data to the multiple
response format used y StatPac" !t would loo, li,e this5

.aels ?1^What are your fa%orite colorsY
.aels ?2^What are your fa%orite colorsY
.aels ?3^What are your fa%orite colorsY
.aels ?3^What are your fa%orite colorsY
.aels ?1-?3 61^:range762^&lue763^Jellow763^$ed7
$ecode ?2 61^27
$ecode ?3 61^37
$ecode ?3 61^37
8re;uencies ?1-?3
:ptions 1$^J
""

4his will wor, fine although it is cumersome" When there are ten or more %ariales
in the multiple response group0 it ecomes more difficult ecause the imported
%ariales are li,ely coded as '10 while the StatPac %ariales need to e coded as '2"
4wo methods are incorporated into StatPac to deal with imported data that use
dichotomous multiple response"
4he first method is in the fre;uencies program itself" 4he 1*^Code option can e
added to the fre;uency program to tell StatPac that the %ariales are dichotomous"
4hen OCodeO is the single character %alue that indicates the item is selected" !n the
ao%e e9ample0 the data was coded as ones and lan,s0 so 1* would e set to 1" !f
the data had een coded as J and '0 then 1* would e set to J"

8re;uencies ?1-?3
:ptions 1$^J 1*^1
""

>sing this method does not actually change the data file" StatPac Hust reads the data
differently for the fre;uencies procedure" #n e9clamation mar, cannot e used to
permanently set the 1* option" !t must e e9plicitly specified in each procedure
where you want to use it"
StatPac For Windows User's Manual Utilities )1!
4he other method is to actually con%ert the data file to the format used y StatPac for
multiple response" !f you plan to do anners or other procedures that utiliBe the
dichotomous multiple response %ariales0 then it is est to permanently alter the data"
#fter con%ersion0 the ao%e data set would loo, li,e this5

?1 ?2 ?3 ?3
$espondent :range &lue Jellow $ed
1 2 3
2 1 3
3 2 3

4he con%ersion utility lets you select se%eral sets of %ariales that are dichotomous
multiple response0 howe%er they are done one at a time" 4he first screen lets you
select the codeoo, and data file0 and specify a name for the new 6con%erted7
codeoo, and data file" #fter selecting the codeoo,0 the %ariale names will appear
so they can e selected"


)1* Inde2 StatPac For Windows User's Manual
#fter selecting the %ariales that ma,e up the first multiple response group0 clic, the
plus utton to add them to the con%ersion list"
4he second screen lets you set the code and laeling for the selected group of
%ariales"


4he code is the dichotomous %alue that indicates the item is selected"
Since the imported data doesnDt ha%e a single %ariale name for the group of
%ariales0 StatPac names them 1$XFroupX#0 1$XFroupX&0 etc" #fter the
con%ersion0 the con%erted %ariales in the group will e named using the X9
con%ention 6e"g"0 1$XFroupX#X10 1$XFroupX#X20 1$XFroupX#X30 and
1$XFroupX#X37" 4hus0 you might want to change the %ariale name to something
more meaningful0 8or e9ample0 if you changed the name to Color0 the con%erted
%ariales would e named ColorX10 ColorX20 ColorX30 and ColorX3"
Similarly0 the %ariale lael might e changed to the actual ;uestion" #ll the
con%erted %ariales will use that %ariale lael" Jou could change O?ultiple
Response Iroup 6M $1-$>O to O)at are your !avorite colors(O
#fter you are satisfied with the con%ersion laeling0 clic, the Con%ert utton" 4his
will return you to the first screen where you can select an additional set of multiple
response %ariales and clic, the plus utton to add them to the con%ersion"
StatPac For Windows User's Manual Utilities )1-
#fter you ha%e finished selecting all the groups of multiple response %ariales0 clic,
:E to perform the con%ersion" 4he new codeoo, and new data file will then
contain the multiple response %ariales in StatPac format"
)1; Inde2 StatPac For Windows User's Manual
Statistics Calculator
Statistics Calculator Menu
Statistics (alculator is an easy-to-use program designed to perform a series of asic
statistical procedures related to distriutions and proailities" 1ost of the
procedures are called in!erential ecause data from a sample is used to infer to a
population"
4he menu ar of Statistic (alculator contains si9 types of operations that can e
performed y the software"
@istriutions Counts Percents
1eans Correlation Sampling
4he *istributions menu item is the electronic e;ui%alent of proaility tales"
#lgorithms are included for the B0 t0 80 and chi-s;uare distriutions" 4his selection
may e used to find proailities and critical %alues for the four statistics"
4he (ounts menu item contains routines to analyBe a contingency tale of counts0
compute 8isherDs e9act proaility for two-y-two tales0 use the inomial
distriution to predict the proaility of a specified outcome0 and the poisson
distriution to test the li,elihood of oser%ing a specified numer of e%ents"
4he ercents menu item is used to compare two percents" #lgorithms are included
to compare proportions drawn from one or two samples" 4here is also a menu option
to calculate confidence inter%als around a percent"
4he "eans menu item is used to calculate a mean and standard de%iation of a
sample0 compare two means to each other0 calculate a confidence inter%al around a
mean0 compare a sample mean to a population mean0 compare two standard
de%iations to each other0 and compare three or more standard de%iations"
4he (orrelation menu item is used to calculate correlation and simple linear
regression statistics for paired data" #lgorithms are included for ordinal and inter%al
data"
4he Samplin/ menu item is used to determine the re;uired sample siBe for a study"
4he software can e used for prolems in%ol%ing percents and means"
$istri"utions Menu
4he *istributions menu selection is used to calculate critical %alues and
proailities for %arious distriutions" 4he most common distriutions are the z
6normal7 distriution0 t distriution0 @ distriution0 and the chi-s;uare distriution"
Within the last 20 years0 computers ha%e made it easy to calculate e9act proailities
for the %arious statistics" Prior to that0 researchers made e9tensi%e use of oo,s
containing proaility tales"
7or(al distri"ution
4he normal distriution is the most well-,nown distriution and is often referred to
as the z distriution or the ell shaped cur%e" !t is used when the sample siBe is
greater than 30" When the sample siBe is less than 300 the t distriution is used
instead of the normal distriution"
4he menu offers three choices5 17 proaility of a B %alue0 27 critical B for a gi%en
proaility0 and 37 proaility of a defined range"
Probability of a 3 Value
When you ha%e a B 6standardiBed7 %alue for a %ariale0 you can determine the
proaility of that %alue" 4he software is the electronic e;ui%alent of a normal
distriution proaility tale" When you enter a z %alue0 the area under the normal
cur%e will e calculated" 4he area not under the cur%e is referred to as the reNection
region" !t is also called a two-tailed proaility ecause oth tails of the distriution
are e9cluded" 4he Statistics (alculator reports the two-tailed proaility for the B
%alue" # one-tailed proaility is used when your research ;uestion is concerned with
only half of the distriution" !ts %alue is e9actly half the two-tailed proaility"
+1ample
B-%alue5 1"9-
-----------------------------------------
4wo-tailed proaility ^ "0200
Critical 3 for a .iven Probability
4his menu selection is used to determine the critical z %alue for a gi%en proaility"
+1ample
# large company designed a pre-employment sur%ey to e administered to
perspecti%e employees" &aseline data was estalished y administering the sur%ey to
all current employees" 4hey now want to use the instrument to identify Ho
applicants who ha%e %ery high or %ery low scores" 1anagement has decided they
want to identify people who score in the upper and lower 3` when compared to the
norm" <ow many standard de%iations away from the mean is re;uired to define the
upper and lower 3` of the scoresY
4he total area of reHection is -`" 4his includes 3` who scored %ery high and 3`
who scored %ery low" 4hus0 the two-tailed proaility is "0-" 4he B %alue re;uired to
reHect -` of the area under the cur%e is 1"((1" 4hus0 new applicants who score
higher or lower than 1"((1 standard de%iations away from the mean are the people to
e identified"
))> Inde2 StatPac For Windows User's Manual
4wo tailed proaility5 "0-
---------------------------------
B-%alue ^ 1"((1
Probability of a Defined Range
Enowing the mean and standard de%iation of a sample allows you to estalish the
area under the cur%e for any gi%en range" 4his menu selection will calculate the
proaility that the mean of a new sample would fall etween two specified %alues
6i"e"0 etween the limits of a defined range7"
+1ample
# manufacturer may find that the emission le%el from a de%ice is 22"9 units with a
standard de%iation of 2")" 4he law limits the ma9imum emission le%el to 2("0 units"
4he manufacturer may want to ,now what percent of the new de%ices coming off the
assemly line will need to e reHected ecause they e9ceed the legal limit"
Sample mean ^ 22"9
>niased standard de%iation ^ 2")
.ower limit of the range ^ 0
>pper limit of the range ^ 2("0
----------------------------------------------------------------
Proaility of a %alue falling within the range ^ ")(1)
Proaility of a %alue falling outside the range ^ "21(3
4he area under the cur%e is the sum of the area defined y the lower limit plus the
area defined y the upper limit"
4he area under the normal cur%e is the proaility that additional samples would fall
etween the lower and upper limits" !n this case0 the area ao%e the upper limit is the
reHection area 621"(3` of the product would e reHected7"
: distri"ution
1athematicians used to thin, that all distriutions followed the ell shaped cur%e" !n
the early 1900Ds0 an !rish chemist named Fosset0 disco%ered that distriutions were
much flatter than the ell shaped cur%e when wor,ing with small sample siBes" !n
fact0 the smaller the sample0 the flatter the distriution" 4he t distriution is used
instead of the normal distriution when the sample siBe is small" #s the sample siBe
approaches thirty0 the t distriution appro9imates the normal distriution" 4hus0 the t
distriution is generally used instead of the B distriution0 ecause it is correct for
oth large and small sample siBes0 where the B distriution is only correct for large
samples"
4he menu offers three choices5 17 proaility of a t %alue0 27 critical t %alue for a
gi%en proaility0 and 37 proaility of a defined range"
StatPac For Windows User's Manual Statistics Calculator ))1
Probability of a t Value
!f you ha%e a t %alue and the degrees of freedom associated with the %alue0 you can
use this program to calculate the two-tailed proaility of t" !t is the e;ui%alent of
computeriBed tale of t %alues"
+1ample
t-%alue5 2"22(
df5 10
------------------------------------
4wo-tailed proaility ^ "020
Critical t Value for a .iven Probability
4his program is the opposite of the pre%ious program" !t is used if you want to ,now
what critical t %alue is re;uired to achie%e a gi%en proaility"
+1ample
4wo-tailed proaility5 "020
@egrees of freedom5 10
-----------------------------------
t-%alue ^ 2"22(
Probability of a Defined Range
Enowing the mean and standard de%iation of a sample allows you to estalish the
area under the cur%e for any gi%en range" Jou can use this program to calculate the
proaility that the mean of a new sample would fall etween two %alues"
+1ample
# company did a sur%ey of 20 people who used its product" 4he mean a%erage age
of the sample was 22"3 years and the uniased standard de%iation was 3"1 years" 4he
company now wants to ad%ertise in a magaBine that has a primary readership of
people who are etween 1( and 230 so they need to ,now what percent of its
potential customers are etween 1( and 23 years of ageY
Sample mean5 22"3
>niased standard de%iation5 3"1
Sample siBe ^ 20
.ower limit of the range ^ 1(
>pper limit of the range ^ 23
----------------------------------------------------------------
Proaility of a %alue falling within the range ^ "-0(
Proaility of a %alue falling outside the range ^ "392
&ecause of the small sample siBe0 the t distriution is used instead of the B
distriution" 4he area under the cur%e represents the proportion of customers in the
population e9pected to e etween 1( and 23 years of age" !n this e9ample0 we
))& Inde2 StatPac For Windows User's Manual
would predict that -0"(` of the its customers would e e9pected to e etween 1(
and 23 years of age0 and 39"2` would e outside of the range" 4he company
decided not to ad%ertise"
F distri"ution
4he @-ratio is used to compare %ariances of two or more samples or populations"
Since it is a ratio 6i"e"0 a fraction70 there are degrees of freedom for the numerator and
denominator" 4his menu selection may e use to calculate the proaility of an @
-ratio or to determine the critical %alue of @ for a gi%en proaility" 4hese menu
selections are the computer e;ui%alent of an @ tale"
Probability of a F:Ratio
!f you ha%e a @-ratio and the degrees of freedom associated with the numerator and
denominator0 you can use this program to calculate the proaility"
+1ample
8-ratio5 2"))3
'umerator degrees of freedom5 20
@enominator degrees of freedom5 10
----------------------------------------------
4wo-tailed proaility ^ "0200
Critical F for a .iven Probability
!f you ,now the critical alpha le%el and the degrees of freedom associated with the
numerator and denominator0 you can use this program to calculate the 8-ratio"
+1ample
4wo-tailed proaility ^ "0200
'umerator degrees of freedom5 20
@enominator degrees of freedom5 10
-----------------------------------------------
8-ratio5 2"))3
Chi9s4uare distri"ution
4he chi-s;uare statistic is used to compare the oser%ed fre;uencies in a tale to the
e9pected fre;uencies" 4his menu selection may e use to calculate the proaility of
a chi-s;uare statistic or to determine the critical %alue of chi-s;uare for a gi%en
proaility" 4his menu selection is the computer e;ui%alent of an chi-s;uare tale"
Probability of a Ci:$=uare $tatistic
!f you ha%e a chi-s;uare %alue and the degrees of freedom associated with the %alue0
you can use this program to calculate the proaility of the chi-s;uare statistic" !t is
the e;ui%alent of computeriBed tale of chi-s;uare %alues"
+1ample
StatPac For Windows User's Manual Statistics Calculator ))1
Chi-s;uare %alue5 1("30)
@egrees of freedom5 10
------------------------------------
Proaility ^ "020
Critical Ci:$=uare for a .iven Probability
!f you ha%e the critical alpha le%el and the degrees of freedom0 you can use this
program to calculate the proaility of the chi-s;uare statistic" !t is the e;ui%alent of
computeriBed tale of chi-s;uare %alues"
+1ample
Proaility ^ "0200
@egrees of freedom5 10
------------------------------------
Chi-s;uare %alue5 1("30)
Counts Menu
4he (ounts menu selection has four tests that can e performed for simple
fre;uency data" 4he chi-s;uare test is used to analyBe a contingency tale consisting
of rows and columns to determine if the oser%ed cell fre;uencies differ significantly
from the e9pected fre;uencies" 8isherDs e9act test is similar to the chi-s;uare test
e9cept it is used only for tales with e9actly two rows and two columns" 4he
inomial test is used to calculate the proaility of two mutually e9clusi%e outcomes"
4he poisson distriution e%ents test is used to descrie the numer of e%ents that will
occur in a specific period of time"
Chi9s4uare test
4he chi-s;uare is one of the most popular statistics ecause it is easy to calculate and
interpret" 4here are two ,inds of chi-s;uare tests" 4he first is called a one-way
analysis0 and the second is called a two-way analysis" 4he purpose of oth is to
determine whether the oser%ed fre;uencies 6counts7 mar,edly differ from the
fre;uencies that we would e9pect y chance"
4he oser%ed cell fre;uencies are organiBed in rows and columns li,e a spreadsheet"
4his tale of oser%ed cell fre;uencies is called a contingency tale0 and the chi-
s;uare test if part of a contingency table analysis"
4he chi-s;uare statistic is the sum of the contriutions from each of the indi%idual
cells" A%ery cell in a tale contriutes something to the o%erall chi-s;uare statistic" !f
a gi%en cell differs mar,edly from the e9pected fre;uency0 then the contriution of
that cell to the o%erall chi-s;uare is large" !f a cell is close to the e9pected fre;uency
for that cell0 then the contriution of that cell to the o%erall chi-s;uare is low" # large
chi-s;uare statistic indicates that somewhere in the tale0 the oser%ed fre;uencies
differ mar,edly from the e9pected fre;uencies" !t does not tell which cell 6or cells7
are causing the high chi-s;uare"""only that they are there" When a chi-s;uare is high0
you must %isually e9amine the tale to determine which cell6s7 are responsile"
When there are e9actly two rows and two columns0 the chi-s;uare statistic ecomes
inaccurate0 and JateDs correction for continuity is often applied"
))) Inde2 StatPac For Windows User's Manual
!f there is only one column or one row 6a one-way chi-s;uare test70 the degrees of
freedom is the numer of cells minus one" 8or a two way chi-s;uare0 the degrees of
freedom is the numer or rows minus one times the numer of columns minus one"
>sing the chi-s;uare statistic and its associated degrees of freedom0 the software
reports the proaility that the differences etween the oser%ed and e9pected
fre;uencies occurred y chance" Fenerally0 a proaility of "02 or less is considered
to e a significant difference"
# standard spreadsheet interface is used to enter the counts for each cell" #fter
youD%e finished entering the data0 the program will print the chi-s;uare0 degrees of
freedom and proaility of chance"
>se caution when interpreting the chi-s;uare statistic if any of the cell fre;uencies
are less than fi%e" #lso0 use caution when the total for all cells is less than 20"
+1ample
# drug manufacturing company conducted a sur%ey of customers" 4he research
;uestion is5 !s there a significant relationship etween pac,aging preference 6siBe of
the ottle purchased7 and economic statusY 4here were four pac,aging siBes5 small0
medium0 large0 and Humo" Aconomic status was5 lower0 middle0 and upper" 4he
following data was collected"
lower middle upper
small 23 22 1(
medium 23 2( 19
large 1( 2) 29
Humo 1- 21 33
------------------------------------------------
Chi-s;uare statistic ^ 9")33
@egrees of freedom ^ -
Proaility of chance ^ "1329
Fisher's +2act :est
4he chi-s;uare statistic ecomes inaccurate when used to analyBe contingency tales
that contain e9actly two rows and two columns0 and that contain less than 20 cases"
8isherDs e9act proaility is not plagued y inaccuracies due to small 'Ds" 4herefore0
it should e used for two-y-two contingency tales that contain fewer than 20 cases"
+1ample
<ere are the results of a recent pulic opinion poll ro,en down y gender" What is
the e9act proaility that the difference etween the oser%ed and e9pected
fre;uencies occurred y chanceY
1ale 8emale
8a%or 30 32
:pposed)0 2(
-------------------------------------------
8isherDs e9act proaility ^ "0239
StatPac For Windows User's Manual Statistics Calculator ))!
Bino(ial :est
4he inomial distriution is used for calculating the proaility of dichotomous
outcomes in which the two choices are mutually e9clusi%e" 4he program re;uires
that you enter the numer of trials0 proaility of the desired outcome on each trial0
and the numer of times the desired outcome was oser%ed"
+1ample
!f we were to flip a coin one hundred times0 and it came up heads se%enty times0
what is the proaility of this happeningY
'umer of trials5 100
Proaility of success on each trial 60-175 "2
'umer of successes5 )0
---------------------------------------------------------
Proaility of )0 or more successes [ "0001
Poisson $istri"ution +,ents :est
4he poisson distriution0 li,e the inomial distriution0 is used to determine the
proaility of an oser%ed fre;uency" !t is used to descrie the numer of e%ents that
will occur in a specific period of time or in a specific area or %olume" Jou need to
enter the oser%ed and e9pected fre;uencies"
+1ample
Pre%ious research on a particular assemly line has shown that they ha%e an a%erage
daily defect rate of 39 products" 4hus0 the e9pected numer of defecti%e products
e9pected on any day is 39" 4he day after implementing a new ;uality control
program0 they found only 22 defects" What is the proaility of seeing 22 or fewer
defects on any dayY
:ser%ed fre;uency5 22
A9pected fre;uency5 39
---------------------------------------------------
Proaility of 22 or fewer e%ents ^ "022-
Percents Menu
Percents are understood y nearly e%eryone0 and therefore0 they are the most popular
statistics cited in research" $esearchers are often interested in comparing two
percentages to determine whether there is a significant difference etween them"
Choosin% the Proer :est
4here are two ,inds of t-tests etween percents" Which test you use depends upon
whether youDre comparing percentages from one or two samples"
))* Inde2 StatPac For Windows User's Manual
A%ery percentage can e e9pressed as a fraction" &y loo,ing at the denominator of
the fraction we can determine whether to use a one-sample or two-sample t-test
etween percents" !f the denominators used to calculate the two percentages
represent the same people0 we use a one-sample t-test etween percents to compare
the two percents" !f the denominators represent different people0 we use the two-
sample t-test etween percents"
8or e9ample suppose you did a sur%ey of 200 people" Jour sur%ey as,ed0
)ere you satis!ied wit te program(
KKK Des KKK No KKK GonJt know
:f the 200 people0 (0 said yes0 100 said no0 and 20 didnDt ,now" Jou could
summariBe the responses as5
Jes (0M200 ^ "3 ^ 30`
'o 100M200 ^ "2 ^ 20`
@onDt ,now 20M200 ^ "1 ^ 10`
!s there a significant difference etween the percent saying yes 630`7 and the
percent saying no 620`7Y :%iously0 there is a differenceW ut how sure are we that
the difference didnDt Hust happen y chanceY !n other words0 how reliale is the
differenceY
'otice that the denominator used to calculate the percent of yes responses 62007
represents the same people as the denominator used to calculate the percent of no
responses 62007" 4herefore0 we use a one-sample t-test etween proportions" 4he
,ey is that the denominators represent the same people 6not that they are the same
numer7"
#fter you completed your sur%ey0 another group of researchers tried to replicate your
study" 4hey also used a sample siBe of 2000 and as,ed the identical ;uestion" :f the
200 people in their sur%ey0 -0 said yes0 100 said no0 and 30 didnDt ,now" 4hey
summariBed their results as5
Jes -0M200 ^ "3 ^ 30`
'o 100M200 ^ "2 ^ 20`
@onDt ,now 30M200 ^ "2 ^ 20`
!s there a significant difference etween the percent who said yes in your sur%ey
630`7 and the percent that said yes in their sur%ey 630`7Y 8or your sur%ey the
percent that said yes was calculated as (0M2000 and in their sur%ey it was -0M200" 4o
compare the yes responses etween the two sur%eys0 we would use a two-sample t-
test etween percents" A%en though oth denominators were 2000 they do not
represent the same 200 people"
+1amples that would use a one0sample t0test
Which proposal would you %ote forY
XXX Proposal # XXX Proposal &
Which product do you li,e etterY
XXX 'ame &rand XXX &rand *
StatPac For Windows User's Manual Statistics Calculator ))-
Which candidate would you %ote forY
XXX Iohnson XXX Smith XXX #nderson
When there are more than two choices0 you can do the t-test etween any two of
them" !n this e9ample0 there are three possile cominations5 IohnsonMSmith0
IohnsonM#nderson0 and SmithM#nderson" 4hus0 you could actually perform three
separate t-tests"""one for each pair of candidates" !f this was your analysis plan0 you
would also use &onferroniDs theorem to adHust the critical alpha le%el ecause the
plan in%ol%ed multiple tests of the same type and family"
+1amples that would use a two0sample t0test
# pre%ious study found that 39` of the pulic elie%ed in gun control" Jour study
found the 33` elie%ed in gun control" #re the eliefs of your sample different than
those of the pre%ious studyY
4he results of a magaBine readership study showed that 1)` of the women and 11`
of the men recalled seeing your ad in the last issue" !s there a significant difference
etween men and womenY
!n a rand awareness study0 22` of the respondents from the Western region had
heard of your product" <owe%er0 only 1(` of the respondents from the Aastern
region had heard of your product" !s there a significant difference in product
awareness etween the Aastern and Western regionsY
3ne Sa(le t9:est "etween Percents
4his test can e performed to determine whether respondents are more li,ely to
prefer one alternati%e or another"
+1ample
4he research ;uestion is5 !s there a significant difference etween the percent of
people who say they would %ote for candidate # and the percent of people who say
they will %ote for candidate &Y 4he null hypothesis is5 4here is no significant
difference etween the percent of people who say they will %ote for candidate # or
candidate &" 4he results of the sur%ey were5
Plan to %ote for candidate # ^ 32"2`
Plan to %ote for candidate & ^ 22"3`
Sample siBe ^ 10)
4he sum of the two percents does not ha%e to e e;ual to 100 6there may e
candidates C and @0 and people that ha%e no opinion7" >se a one-sample t-test
ecause oth percentages came from a single sample"
>se a two-tailed proaility ecause the null hypothesis does not state the direction
of the difference" !f the hypothesis is that one particular choice has a greater
percentage0 use a one-tailed test 6di%ide the two-tailed proaility y two7"
)); Inde2 StatPac For Windows User's Manual
Anter the first percent5 32"2
Anter the second percent5 22"3
Anter the sample siBe5 10)
-----------------------------------------
t-%alue ^ 1"(0(
@egrees of freedom ^ 10-
4wo-tailed proaility ^ "0)3
Jou might ma,e a statement in a report li,e this5 # one-sample t-test etween
proportions was performed to determine whether there was a significant difference
etween the percent choosing candidate # and candidate &" 4he t-statistic was not
significant at the "02 critical alpha le%el0 t610-7^1"(0(0 p^"0)3" 4herefore0 we fail to
reHect the null hypothesis and conclude that the difference was not significant"
4wo Sample t-4est etween Percents
4his test can e used to compare percentages drawn from two independent samples"
!t can also e used to compare two sugroups from a single sample"
+1ample
#fter conducting a sur%ey of customers0 you want to compare the attriutes of men
and women" A%en though all respondents were part of the same sur%ey0 the men and
women are treated as two samples" 4he percent of men with a particular attriute is
calculated using the total numer of men as the denominator for the fraction" #nd
the percent of women with the attriute is calculate using the total numer of women
as the denominator" Since the denominators for the two fractions represent different
people0 a two-sample t-test etween percents is appropriate"
4he research ;uestion is5 !s there a significant difference etween the proportion of
men ha%ing the attriute and the proportion of women ha%ing the attriuteY 4he null
hypothesis is5 4here is no significant difference etween the proportion of men
ha%ing the attriute and the proportion of women ha%ing the attriute" 4he results of
the sur%ey were5
(- men were sur%eyed and 22 of them 622"-`7 had the attriute"
39 women were sur%eyed and 19 of them 63("(`7 had the attriute"
Anter the first percent5 22"-
Anter the sample siBe for the first percent5 (-
Anter the second percent5 3("(
Anter the sample siBe for the second percent5 39
-------------------------------------------------------------
t-%alue ^ 1"-03
@egrees of freedom ^ 133
4wo-tailed proaility ^ "111
Jou might ma,e a statement in a report li,e this5 # two-sample t-test etween
proportions was performed to determine whether there was a significant difference
StatPac For Windows User's Manual Statistics Calculator ))'
etween men and women with respect to the percent who had the attriute" 4he t-
statistic was not significant at the "02 critical alpha le%el0 t61337^1"-030 p^"111"
4herefore0 we fail to reHect the null hypothesis and conclude that the difference
etween men and women was not significant"
Another e1ample
Suppose inter%iews were conducted at two different shopping centers" 4his two
sample t-test etween percents could e used to determine if the responses from the
two shopping centers were different"
4he research ;uestion is5 !s there a significant difference etween shopping centers #
and & with respect to the percent that say they would uy product *Y 4he null
hypothesis is5 4here is no significant difference etween shopping centers # and &
with respect to the percent of people that say they would uy product *" # two-tailed
proaility will e used ecause the hypothesis does not state the direction of the
difference" 4he results of the sur%ey were5
(9 people were inter%iewed as shopping center # and 2) of them 6-3"0`7 said they
would uy product *"
92 people were inter%iewed as shopping center & and 21 of them 622"3`7 said they
would uy product *"
Anter the first percent5 -3"0
Anter the sample siBe for the first percent5 (9
Anter the second percent5 22"3
Anter the sample siBe for the second percent5 92
-------------------------------------------------------------
t-%alue ^ 1"1)9
@egrees of freedom ^ 1)9
4wo-tailed proaility ^ "230
Jou might write a paragraph in a report li,e this5 # two-sample t-test etween
proportions was performed to determine whether there was a significant difference
etween the two shopping centers with respect to the percent who said they would
uy product *" 4he t-statistic was not significant at the "02 critical alpha le%el0
t61)97^1"1)90 p^"230" 4herefore0 we fail to reHect the null hypothesis and conclude
that the difference in responses etween the two shopping centers was not
significant"
Confidence Inter,als around a Percent
Confidence inter%als are used to determine how much latitude there is in the range of
a percent if we were to ta,e repeated samples from the population"
+1ample
!n a study of 120 customers0 you find that -0 percent ha%e a college degree" Jour
est estimate of the percent who ha%e a college degree in the population of
customers is also -0 percent" <owe%er0 since it is Hust an estimate0 we estalish
confidence inter%als around the estimate as a way of showing how reliale the
estimate is"
)!> Inde2 StatPac For Windows User's Manual
Confidence inter%als can e estalished for any error rate you are willing to accept"
!f0 for e9ample0 you choose the 92` confidence inter%al0 you would e9pect that in
fi%e percent of the samples drawn from the population0 the percent who had a college
degree would fall outside of the inter%al"
What are the 92` confidence inter%als around this percentY !n the following
e9ample0 note that no %alue is entered for the population siBe" When the population
is %ery large compared to the sample siBe 6as in most research70 it is not necessary to
enter a population siBe" !f0 howe%er0 the sample represents more than ten percent of
the population0 the formulas incorporate a finite population correction adHustment"
4hus0 you only need to enter the population siBe when the sample siBe e9ceeds ten
percent of the population siBe"
Anter the percent5 -0
Anter the sample siBe5 120
Anter the population siBe5 6left lan,7
Anter the desired confidence inter%al 6`75 92
----------------------------------------------------------
Standard error of the proportion ^ "030
@egrees of freedom ^ 139
92` confidence inter%al ^ -0"0`

)"9`
Confidence inter%al range ^ 22"1` to -)"9`
4herefore0 our est estimate of the population proportion with 2` error is -0`


)"9`" Stated differently0 if we predict that the proportion in the population who ha%e
a college degree is etween 22"1` and -)"9`0 our prediction would e wrong for
2` of the samples that we draw from the population"
Means Menu
$esearchers usually use the results from a sample to ma,e inferential statements
aout the population" When the data is inter%al or ratio scaled0 it usually descried in
terms of central tendency and %ariaility" 1eans and standard de%iations are usually
reported in all research"
Mean and Standard $e,iation of a Sa(le
4his menu selection will let you enter data for a %ariale and calculate the mean0
uniased standard de%iation0 standard error of the mean0 and median" @ata is entered
using a standard spreadsheet interface" 8inite population correction is incorporated
into the calculation of the standard error of the mean0 so the population siBe should
e specified whene%er the sample siBe is greater than ten percent of the population
siBe"
+1ample
# sample of ten was randomly chosen from a large population" 4he ten scores were5
20 22 23 32 31 33 3) 21 32 32
StatPac For Windows User's Manual Statistics Calculator )!1
----------------------------------------------------
1ean ^ 39"0
>niased standard de%iation ^ 11"-
Standard error of the mean ^ 3")
1edian ^ 32"0
Matched Pairs t9:est "etween Means
4he matched pairs t-test is used in situations where two measurements are ta,en for
each respondent" !t is often used in e9periments where there are efore-treatment
and after-treatment measurements" 4he t-test is used to determine if there is a
reliale difference etween the mean of the efore-treatment and the mean of the
after treatment measurements"
Pretreatment Posttreatment
Iohnny -------------------- Iohnny
1artha -------------------- 1artha
Ienny ---------------------- Ienny
Sometimes0 in %ery sophisticated 6i"e"0 e9pensi%e7 e9periments0 two groups of
suHects are indi%idually matched on one or more demographic characteristics" :ne
group is e9posed to a treatment 6e9perimental group7 and the other is not 6control
group7"
A9perimental Control
Iohnny -------------------------- 8red
1artha -------------------------- Sharon
Ienny ---------------------------- .inda
4he t-test wor,s with small or large 'Ds ecause it automatically ta,es into account
the numer of cases in calculating the proaility le%el" 4he magnitude of the t-
statistic depends on the numer of cases 6suHects7" 4he t-statistic in conHunction with
the degrees of freedom are used to calculate the proaility that the difference
etween the means happened y chance" !f the proaility is less than the critical
alpha le%el0 then we say that a significant difference e9ists etween the two means"
+1ample
# e9ample of a matched-pairs t-test might loo, li,e this5
Pretest Posttest
( 31
13 3)
22 32
22 2(
)!& Inde2 StatPac For Windows User's Manual
29 20
31 3)
32 39
3( 22
32 3-
22 -9
-----------------------------------------------------------
?ar"15 1ean ^ 29"2 >niased S@ ^ 13"2
?ar" 25 1ean ^ 30") >niased S@ ^ 13"0
t-statistic ^ 2"-9
@egrees of freedom ^ 9
4wo-tailed proaility ^ "022
Jou might ma,e a statement in a report li,e this5 4he mean pretest score was 29"2
and the mean posttest score was 30")" # matched-pairs t-test was performed to
determine if the difference was significant" 4he t-statistic was significant at the "02
critical alpha le%el0 t697^2"-90 p^"022" 4herefore0 we reHect the null hypothesis and
conclude that posttest scores were significantly higher than pretest scores"
Indeendent Grous t9:est "etween Means
4his menu selection is used to determine if there is a difference etween two means
ta,en from different samples" !f you ,now the mean0 standard de%iation and siBe of
oth samples0 this program may e used to determine if there is a reliale difference
etween the means"
:ne measurement is ta,en for each respondent" 4wo groups are formed y splitting
the data ased on some other %ariale" 4he groups may contain a different numer of
cases" 4here is not a one-to-one correspondence etween the groups"
Score Se9 1ales 8emales
22 1 22 2)
2) 8 -----ecomes----\ 19 1)
1) 8 21
19 1
21 8
Sometimes the two groups are formed ecause the data was collected from two
different sources"
School # Scores School & Scores
222 32)
392 232
StatPac For Windows User's Manual Statistics Calculator )!1
2(2 -00
223
220
4here are actually two different formulas to calculate the t-statistic for independent
groups" 4he t-statistics calculated y oth formulas will e similar ut not identical"
Which formula you choose depends on whether the %ariances of the two groups are
e;ual or une;ual" !n actual practice0 most researchers assume that the %ariances are
une;ual ecause it is the most conser%ati%e approach and is least li,ely to produce a
4ype ! error" 4hus0 the formula used in Statistics (alculator assumes une;ual
%ariances"
+1ample
4wo new product formulas were de%eloped and tested" # twenty-point scale was
used to measure the le%el of product appro%al" Si9 suHects tested the first formula"
4hey ga%e it a mean rating of 12"3 with a standard de%iation of 1"3" 'ine suHects
tested the second formula0 and they ga%e it a mean rating of 13"0 with a standard
de%iation of 1")" 4he ;uestion we might as, is whether the oser%ed difference
etween the two formulas is reliale"
1ean of the first group5 12"3
>niased standard de%iation of the first group5 1"3
Sample siBe of the first group5 -
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
1ean of the second group5 13"0
>niased standard de%iation of the second group5 1")
Sample siBe of the second group5 9
-------------------------------------------------------------------
t %alue ^ 2"03
@egrees of freedom ^ 13
4wo-tailed proaility ^ "0-3
Jou might ma,e a statement in a report li,e this5 #n independent groups t-test was
performed to compare the mean ratings etween the two formulas" 4he t-statistic was
not significant at the "02 critical alpha le%el0 t6137^2"030 p^"0-3" 4herefore0 we fail
to reHect the null hypothesis and conclude that there was no significant difference
etween the ratings for the two formulas"
Confidence Inter,al around a Mean
Jou can calculate confidence inter%als around a mean if you ,now the sample siBe
and standard de%iation"
4he standard error of the mean is estimated from the standard de%iation and the
sample siBe" !t is used to estalish the confidence inter%al 6the range within which we
would e9pect the mean to fall in repeated samples ta,en from the population7" 4he
)!) Inde2 StatPac For Windows User's Manual
standard error of the mean is an estimate of the standard de%iation of those repeated
samples"
4he formula for the standard error of the mean pro%ides an accurate estimate when
the sample siBe is %ery small compared to the siBe of the population" !n mar,eting
research0 this is usually the case since the populations are ;uite large" 4hus0 in most
situations the population siBe may e left lan, ecause the population is %ery large
compared to the sample" <owe%er0 when the sample is more than ten percent of the
population0 the population siBe should e specified so that the finite population
correction factor can e used to adHust the estimate of the standard error of the mean"
+1ample
Suppose that an organiBation has 20000 memers" Prior to their memership renewal
dri%e0 )2 memers were randomly selected and sur%eyed to find out their priorities
for the coming year" 4he mean a%erage age of the sample was 23"1 and the uniased
standard de%iation was 3"2 years" What is the 90` confidence inter%al around the
meanY 'ote that the population siBe can e left lan, ecause the sample siBe of )2
is less than ten percent of the population siBe"
1ean5 23"1
>niased standard de%iation5 3"2
Sample siBe5 )2
Population siBe5 6left lan, -or- 20007
@esired confidence inter%al 6`75 90
-------------------------------------------------
Standard error of the mean ^ "3(2
@egrees of freedom ^ )3
90` confidence inter%al ^ 23"1

"(
Confidence inter%al range ^ 22"3 - 23"9
Co(are a Sa(le Mean to a Poulation Mean
:ccasionally0 the mean of the population is ,nown 6perhaps from a pre%ious census7"
#fter drawing a sample from the population0 it might e helpful to compare the mean
of your sample to the mean of the population" !f the means are not significantly
different from each other0 you could ma,e a strong argument that your sample
pro%ides an ade;uate representation of the population" !f0 howe%er0 the mean of your
sample is significantly different than the population0 something may ha%e gone
wrong during the sampling process"
+1ample
#fter selecting a random sample of 1( people from a %ery large population0 you want
to determine if the a%erage age of the sample is representati%e of the a%erage age of
the population" 8rom pre%ious research0 you ,now that the mean age of the
population is 32"0" 8or your sample0 the mean age was 2("0 and the uniased
standard de%iation was 3"2" !s the mean age of your sample significantly different
from the mean age in the populationY
StatPac For Windows User's Manual Statistics Calculator )!!
Sample mean ^ 2(
>niased standard de%iation ^ 3"2
Sample siBe ^ 1(
Population siBe ^ 6left lan,7
1ean of the population ^ 32
---------------------------------------
Standard error of the mean ^ ")23
t %alue ^ 2"303
@egrees of freedom ^ 1)
4wo-tailed proaility ^ "0001
4he two-tailed proaility of the t-statistic is %ery small" 4hus0 we would conclude
that the mean age of our sample is significantly less than the mean age of the
population" 4his could e a serious prolem ecause it suggests that some ,ind of
age ias was inad%ertently introduced into the sampling process" !t would e prudent
for the researcher to in%estigate the prolem further"
Co(are :wo Standard $e,iations
4he 8-ratio is used to compare %ariances" !n its simplest form0 it is the %ariance of
one group di%ided y the %ariance of another group" When used in this way0 the
larger %ariance 6y con%ention7 is the numerator and the smaller is the denominator"
Since the groups might ha%e a different sample siBes0 the numerator and the
denominator ha%e their own degrees of freedom"
+1ample
4wo samples were ta,en from the population" :ne sample had 22 suHects and the
standard de%iation 3"2 on some ,ey %ariale" 4he other sample had 12 suHects and
had a standard de%iation of -"3 on the same ,ey %ariale" !s there a significant
difference etween the %ariances of the two samplesY
8irst standard de%iation5 3"2
8irst sample siBe5 22
Second standard de%iation5 -"3
Second sample siBe5 12
-----------------------------------------
8-ratio ^ 2"023
@egrees of freedom ^ 11 and 23
Proaility that the difference was due to chance ^ "0)2
Co(are :hree or (ore Means
#nalysis of %ariance 6#':?#7 is used when testing for differences etween three or
more means"
)!* Inde2 StatPac For Windows User's Manual
!n an #':?#0 the 8-ratio is used to compare the %ariance etween the groups to the
%ariance within the groups" 8or e9ample0 suppose we ha%e two groups of data" !n
the est of all possile worlds0 all the people in group one would ha%e %ery similar
scores" 4hat is0 the group is cohesi%e0 and there would e %ery little %ariaility in
scores within the group" #ll the people in group two would also ha%e similar scores
6although different than group one7" #gain0 there is %ery little %ariaility within the
group" &oth groups ha%e %ery little %ariaility within their group0 howe%er0 there
might e sustantial %ariaility etween the groups" 4he ratio of the etween groups
%ariaility 6numerator7 to the within groups %ariaility 6denominator7 is the 8-ratio"
4he larger the 8-ratio0 the more certain we are that there is a difference etween the
groups"
!f the proaility of the 8-ratio is less than or e;ual to your critical alpha le%el0 it
means that there is a significant difference etween at least two of groups" 4he 8-
ratio does not tell which group6s7 are different from the others"""Hust that there is a
difference"
#fter finding a significant 8-ratio0 we do Opost-hocO 6after the fact7 tests on the factor
to e9amine the differences etween le%els" 4here are a wide %ariety of post-hoc
tests0 ut one of the most common is to do a series of special t-tests etween all the
cominations of le%els for that factor" 8or the post-hoc tests0 use the same critical
alpha le%el that you used to test for the significance of the 8-ratio"
+1ample
# company has offices in four cities with sales representati%es in each office" #t
each location0 the a%erage numer of sales per salesperson was calculated" 4he
company wants to ,now if there are significant differences etween the four offices
with respect to the a%erage numer of sales per sales representati%e"
Froup 1ean S@ '
1 3"29 1"3( )
2 3"90 1"32 10
3 )"20 1"3( -
3 -"00 1"-0 (
-----------------------------------------------------------------------------------
Source df SS 1S 8 p
-----------------------------------------------------------------------------------
8actor 3 -2"( 20"9 9")( "0002
Arror 2) 2)"( 2"13
4otal 30 120"-
Post-hoc t-tests
Froup Froup t-%alue df p
1 2 2"23 12 "0312
1 3 2"1) 11 "0003
1 3 3"2( 13 "0033
2 3 3"33 13 "0030
StatPac For Windows User's Manual Statistics Calculator )!-
2 3 1"29 1- "1322
3 3 1"09 12 "0019
Correlation Menu
Correlation is a measure of association etween two %ariales" 4he %ariales are not
designated as dependent or independent" 4he two most popular correlation
coefficients are5 SpearmanDs correlation coefficient rho and PearsonDs product-
moment correlation coefficient"
When calculating a correlation coefficient for ordinal data0 select SpearmanDs
techni;ue" 8or inter%al or ratio-type data0 use PearsonDs techni;ue"
4he %alue of a correlation coefficient can %ary from minus one to plus one" # minus
one indicates a perfect negati%e correlation0 while a plus one indicates a perfect
positi%e correlation" # correlation of Bero means there is no relationship etween the
two %ariales" When there is a negati%e correlation etween two %ariales0 as the
%alue of one %ariale increases0 the %alue of the other %ariale decreases0 and %ise
%ersa" !n other words0 for a negati%e correlation0 the %ariales wor, opposite each
other" When there is a positi%e correlation etween two %ariales0 as the %alue of one
%ariale increases0 the %alue of the other %ariale also increases" 4he %ariales mo%e
together"
4he standard error of a correlation coefficient is used to determine the confidence
inter%als around a true correlation of Bero" !f your correlation coefficient falls
outside of this range0 then it is significantly different than Bero" 4he standard error
can e calculated for inter%al or ratio-type data 6i"e"0 only for PearsonDs product-
moment correlation7"
4he significance 6proaility7 of the correlation coefficient is determined from the t-
statistic" 4he proaility of the t-statistic indicates whether the oser%ed correlation
coefficient occurred y chance if the true correlation is Bero" !n other words0 it as,s
if the correlation is significantly different than Bero" When the t-statistic is calculated
for SpearmanDs ran,-difference correlation coefficient0 there must e at least 30 cases
efore the t-distriution can e used to determine the proaility" !f there are fewer
than 30 cases0 you must refer to a special tale to find the proaility of the
correlation coefficient"
+1ample
# company wanted to ,now if there is a significant relationship etween the total
numer of salespeople and the total numer of sales" 4hey collect data for fi%e
months"
?ar" 1 ?ar" 2
20) -90)
1(0 2991
220 -(10
202 -223
190 -190
--------------------------------
)!; Inde2 StatPac For Windows User's Manual
Correlation coefficient ^ "921
Standard error of the coefficient ^ ""0-(
t-test for the significance of the coefficient ^ 3"100
@egrees of freedom ^ 3
4wo-tailed proaility ^ "02-3
Another +1ample
$espondents to a sur%ey were as,ed to Hudge the ;uality of a product on a four-point
.i,ert scale 6e9cellent0 good0 fair0 poor7" 4hey were also as,ed to Hudge the
reputation of the company that made the product on a three-point scale 6good0 fair0
poor7" !s there a significant relationship etween respondents perceptions of the
company and their perceptions of ;uality of the productY
Since oth %ariales are ordinal0 SpearmanDs method is chosen" 4he first %ariale is
the rating for the ;uality the product" $esponses are coded as 3^e9cellent0 3^good0
2^fair0 and 1^poor" 4he second %ariale is the percei%ed reputation of the company
and is coded 3^good0 2^fair0 and 1^poor"
?ar" 1 ?ar" 2
3 3
2 2
1 2
3 3
3 3
1 1
2 1
-------------------------------------------
Correlation coefficient rho ^ "(30
t-test for the significance of the coefficient ^ 3"332
'umer of data pairs ^ )
Proaility must e determined from a tale ecause of the small sample siBe"
Re%ression
Simple regression is used to e9amine the relationship etween one dependent and
one independent %ariale" #fter performing an analysis0 the regression statistics can
e used to predict the dependent %ariale when the independent %ariale is ,nown"
$egression goes eyond correlation y adding prediction capailities"
People use regression on an intuiti%e le%el e%ery day" !n usiness0 a well-dressed
man is thought to e financially successful" # mother ,nows that more sugar in her
childrenDs diet results in higher energy le%els" 4he ease of wa,ing up in the morning
often depends on how late you went to ed the night efore" Cuantitati%e regression
adds precision y de%eloping a mathematical formula that can e used for predicti%e
purposes"
StatPac For Windows User's Manual Statistics Calculator )!'
8or e9ample0 a medical researcher might want to use ody weight 6independent
%ariale7 to predict the most appropriate dose for a new drug 6dependent %ariale7"
4he purpose of running the regression is to find a formula that fits the relationship
etween the two %ariales" 4hen you can use that formula to predict %alues for the
dependent %ariale when only the independent %ariale is ,nown" # doctor could
prescrie the proper dose ased on a personDs ody weight"
4he regression line 6,nown as the least s&uares line7 is a plot of the e9pected %alue
of the dependent %ariale for all %alues of the independent %ariale" 4echnically0 it is
the line that OminimiBes the s;uared residualsO" 4he regression line is the one that
est fits the data on a scatterplot"
>sing the regression e;uation0 the dependent %ariale may e predicted from the
independent %ariale" 4he slope of the regression line 67 is defined as the rise
di%ided y the run" 4he y intercept 6a7 is the point on the y a9is where the regression
line would intercept the y a9is" 4he slope and y intercept are incorporated into the
regression e;uation" 4he intercept is usually called the constant0 and the slope is
referred to as the coefficient" Since the regression model is usually not a perfect
predictor0 there is also an error term in the e;uation"
!n the regression e;uation0 y is always the dependent %ariale and 9 is always the
independent %ariale" <ere are three e;ui%alent ways to mathematically descrie a
linear regression model"
y ^ intercept ] 6slope 97 ] error
y ^ constant ] 6coefficient 97 ] error
y ^ a ] 9 ] e
4he significance of the slope of the regression line is determined from the t-statistic"
!t is the proaility that the oser%ed correlation coefficient occurred y chance if the
true correlation is Bero" Some researchers prefer to report the 8-ratio instead of the t-
statistic" 4he 8-ratio is e;ual to the t-statistic s;uared"
4he t-statistic for the significance of the slope is essentially a test to determine if the
regression model 6e;uation7 is usale" !f the slope is significantly different than
Bero0 then we can use the regression model to predict the dependent %ariale for any
%alue of the independent %ariale"
:n the other hand0 ta,e an e9ample where the slope is Bero" !t has no prediction
aility ecause for e%ery %alue of the independent %ariale0 the prediction for the
dependent %ariale would e the same" Enowing the %alue of the independent
%ariale would not impro%e our aility to predict the dependent %ariale" 4hus0 if the
slope is not significantly different than Bero0 donDt use the model to ma,e predictions"
4he coefficient of determination 6r-s;uared7 is the s;uare of the correlation
coefficient" !ts %alue may %ary from Bero to one" !t has the ad%antage o%er the
correlation coefficient in that it may e interpreted directly as the proportion of
%ariance in the dependent %ariale that can e accounted for y the regression
e;uation" 8or e9ample0 an r-s;uared %alue of "39 means that 39` of the %ariance in
the dependent %ariale can e e9plained y the regression e;uation" 4he other 21`
is une9plained"
4he standard error of the estimate for regression measures the amount of %ariaility
in the points around the regression line" !t is the standard de%iation of the data points
as they are distriuted around the regression line" 4he standard error of the estimate
can e used to de%elop confidence inter%als around a prediction"
+1ample
)*> Inde2 StatPac For Windows User's Manual
# company wants to ,now if there is a significant relationship etween its
ad%ertising e9penditures and its sales %olume" 4he independent %ariale is
ad%ertising udget and the dependent %ariale is sales %olume" # lag time of one
month will e used ecause sales are e9pected to lag ehind actual ad%ertising
e9penditures" @ata was collected for a si9 month period" #ll figures are in thousands
of dollars" !s there a significant relationship etween ad%ertising udget and sales
%olumeY
!? @?
3"2 2)"1
-"1 30"3
3"9 22"0
2") 29")
)"3 30"1
2"9 2("(
--------------------------------------------------
1odel5 y ^ 10"0)9 ] 63")00 97 ] error
Standard error of the estimate ^ 2"2-(
t-test for the significance of the slope ^ 3"092
@egrees of freedom ^ 3
4wo-tailed proaility ^ "0139
r-s;uared ^ "(0)
Jou might ma,e a statement in a report li,e this5 # simple linear regression was
performed on si9 months of data to determine if there was a significant relationship
etween ad%ertising e9penditures and sales %olume" 4he t-statistic for the slope was
significant at the "02 critical alpha le%el0 t637^3"100 p^"012" 4hus0 we reHect the null
hypothesis and conclude that there was a positi%e significant relationship etween
ad%ertising e9penditures and sales %olume" 8urthermore0 (0")` of the %ariaility in
sales %olume could e e9plained y ad%ertising e9penditures"
Sa(lin% Menu
4he formula to determine sample siBe depends upon whether the intended
comparisons in%ol%e means or percents"
Sa(le Si?e for Percents
4his menu selection is used to determine the re;uired siBe of a sample for research
;uestions in%ol%ing percents"
8our ;uestions must e answered to determine the sample siBe5
StatPac For Windows User's Manual Statistics Calculator )*1
1" &est estimate of the population siBe5 Jou do not need to ,now the e9act siBe of the
population" Simply ma,e your est estimate" #n inaccurate population siBe will not
seriously affect the formula computations" !f the population is %ery large0 this item
may e left lan,"
2" &est estimate of the rate in the population 6`75 1a,e your est estimate of what
the actual percent of the sur%ey characteristic is" 4his is ased on the null hypothesis"
8or e9ample0 if the null hypothesis is Olondes donDt ha%e more funO0 then what is
your est estimate of the percent of londes that do ha%e more funY !f you simply do
not ,now0 then enter 20 6for fifty percent7"
3" 1a9imum acceptale difference 6`75 4his is the ma9imum percent difference that
you are willing to accept etween the true population rate and the sample rate"
4ypically0 in social science research0 you would e willing to accept a difference of 2
percent" 4hat is0 if your sur%ey finds that 22 percent of the sample has a certain
characteristic0 the actual rate in the population may e etween 20 and 30 percent"
3" @esired confidence le%el 6`75 <ow confident must you e that the true population
rate falls within the acceptale difference 6specified in the pre%ious ;uestion7Y 4his
is the same as the confidence that you want to ha%e in your findings" !f you want 92
percent confidence 6typical for social science research70 you should enter 92" 4his
means that if you too, a hundred samples from the population0 fi%e of those samples
would ha%e a rate that e9ceeded the difference you specified in the pre%ious
;uestion"
+1ample
# pulishing wants to ,now what percent of the population might e interested in a
new magaBine on ma,ing the most of your retirement" Secondary data 6that is
se%eral years old7 indicates that 22` of the population is retired" 4hey are willing to
accept an error rate of 2` and they want to e 92` certain that their finding does not
differ from the true rate y more than 2`" What is the re;uired sample siBeY
&est estimate of the population siBe5 6left lan,7
&est estimate of the rate in the population 6`75 22
1a9imum acceptale difference 6`75 2
@esired confidence le%el 6`75 92
-------------------------------------------------------------
$e;uired sample siBe ^ 2-3
Sa(le Si?e for Means
4his menu selection is used to determine the re;uired siBe of a sample for research
;uestions in%ol%ing means"
4hree ;uestions must e answered to determine the sample siBe5
1" Standard de%iation of the population5 !t is rare that a researcher ,nows the e9act
standard de%iation of the population" 4ypically0 the standard de%iation of the
population is estimated a7 from the results of a pre%ious sur%ey0 7 from a pilot study0
c7 from secondary data0 or d7 or the Hudgment of the researcher"
)*& Inde2 StatPac For Windows User's Manual
2" 1a9imum acceptale difference5 4his is the ma9imum amount of error that you
are willing to accept" 4hat is0 it is the ma9imum difference that the sample mean can
de%iate from the true population mean efore you call the difference significant"
3" @esired confidence le%el 6`75 4he confidence le%el is your le%el of certainty that
the sample mean does not differ from the true population mean y more than the
ma9imum acceptale difference" 4ypically0 social science research uses a 92`
confidence le%el"
+1ample
# fast food company wants to determine the a%erage numer of times that fast food
users %isit fast food restaurants per wee," 4hey ha%e decided that their estimate
needs to e accurate within plus or minus one-tenth of a %isit0 and they want to e
92` sure that their estimate does differ from true numer of %isits y more than one-
tenth of a %isit" Pre%ious research has shown that the standard de%iation is ") %isits"
What is the re;uired sample siBeY
Population standard de%iation5 ")
1a9imum acceptale difference5 "1
@esired confidence inter%al 6`75 92
--------------------------------------------
$e;uired sample siBe ^ 1((
StatPac For Windows User's Manual Statistics Calculator )*1
w
)*) Inde2 StatPac For Windows User's Manual
Inde2
;
(0-column format 313
0
add to an e9isting data file -2
agglomerati%e hierarchical cluster analysis 32-
aggregate 121G220 121G220 121G220 2320 33(0 3110
320G220 320G220 320G220 320G220 320G220 320G
220 320G220 320G22
analysis commands 1)-0 20-0 23)
analysis of %ariance 3)3
#nalysis of %ariance 3)30 3)20 3(0G(30 3(0G(30 3)30
3(0G(20 3(0G(20 3(0G(20 3(0G(20 3(3G910 3(3G
910 3(3G910 3(3G(-0 3(0G(30 3(3G910 3(3G910
3()G910 3090 32-
#'@ operator 212
#':?# 3)3
#':?# tale 3)9
#SC!! file -(0 313
#uto #d%ance 32
autocorrelation 3230 333
#utomatic form creation 200 22
#utomatic 1ean $ow 29)
#utomatic Page 4itle 292
#utomatic $ecord #d%ance 2-G2)0 -30 -)
#utomatic 4otal $ow 2910 29)
#utomatic %ariale creation 22
#?A$#FA command 223G220 223G220 223G220 223G
220 223G220 223G220 223G22
B
&ac,ing up -
ac,up 30 -0 193G920 193G920 193G920 193G920 193G920
193G920 193G920 1990 209
anners 1)30 203G30 2030 20-0 232G320 232G3)0 232G
3)0 23)0 2(1G920 2(1G9)0 2(3G()0 2(3G()0 2(3G
(-0 2(3G(-0 2(3G(-0 2(9G9)0 2(9G9)0 2(1G(30
2(9G930 2(9G930 23)0 293G9)0 2(1G(30 2(1G(30
300G3020 300G3020 300G3020 302G30 302G30 302G
30 3030 33-
&#''A$S Command 2320 2(10 2(2G(-0 2(2G(-0 2(2G
(-0 2(2G(-0 2(2G(-0 2(2G(-0 2(20 2(90 2900 29-
atch 10 )0 110 1)90 1(2G(-0 1(2G(-0 1(2G(-0 1(2G(-0
1(9G900 1(9G900 1(9G900 1(9G900 231G320 231G
320 1(90 1(2G(-0 2310 331
eta weights 32)
&inomial 4est 333G3-0 3330 33-
&o9-Co9 transformations 319
ranching 9G100 9G100 9G100 9G100 9G100 9G100 330 220
))G)(0 ))G11(0 ))G11(0 ))G11(0 ))G11(0 (20 1020
11(0 12-G2)0 12-G2)
&$A#E@:W' Command 302
C
canonical correlation 393
canonical correlation analysis 3-2
canonical redundancy analysis 39)
canonical %ariale 3-9
Caps :nly 32
card-image 313G120 313G120 313
Carroll-Freen-Shaffer scaling 30-
Category Creation 2-00 2)-0 2(30 30(0 3)10 3(1
central tendency 2)0 2990 3010 321
cgi mail 20 ))
change in proaility 339
change the %alue laels 203G-0 203G-0 203G-0 20-0 21-
Chec, Codeoo, and @ata 323
chi-s;uare 220 22-0 2)2G)90 2)2G)90 2)2G)90 2)2G)90
2))G)90 2))G)90 2))G)90 293G920 293G920 293G
920 293G920 293G920 3390 3(20 3990 3010 3030
30-G)0 30-G)0 30-G)0 30-G)0 30-G)0 30-0 339G300
339G300 339G300 339G300 339G300 339G300 339G
300 333G330 333G320 333G320 333G320 333G320
333G32
chi-s;uare statistic 339
classification matri9 3-)
classification tale 330
cluster analysis 322
cluster centroids 3-0
cluster memership 3-3
clustering algorithms 32)
codeoo, 10 -G(0 -G(0 -G90 -G120 -G90 -G(0 9G120 9G120
9G120 100 9G120 29G300 29G300 29G300 300 32G310
32G320 290 3-G320 3-G310 3-G310 320 32G220 32G
3-0 32G210 32G220 32G310 32G320 39G220 39G220
230 290 -20 -9G)10 -90 )3G)-0 )3G)-0 )3G11(0 )3G
11(0 )3G11(0 ))G)(0 (3G(20 (3G(20 ((G(90 910
1010 11(G200 11(G200 1200 12-0 1290 1310 133G310
133G310 133G390 ((0 (3G(20 133G3-0 133G3-0 13)0
1390 1-30 1--0 1)3G)30 1)3G)30 1)3G)30 1)3G)30
1)3G)30 1)30 1))0 1(30 193G2020 193G2020 193G
2020 133G3-0 193G2020 1200 2090 2130 212G1-0
2120 2200 2(3G(-0 2(3G(-0 2(3G(-0 2(30 2(-0 2920
311G130 311G130 311G200 311G130 311G130 311G
120 31-G200 31-G200 31-G230 31-G230 1)3G)30
3220 3230 32-G2)0 32-G2)0 32-G2)0 32)G290 32)G
290 32)G330 331G330 331G330 332G330 311G200
3320 33-G3(0 33-0 33(
Codeoo, .iraries 3)
codeoo, name (30 1)30 1920 320
coding session 2-)0 2-9
coefficient of determination 321
coefficient of multiple correlation 32)
coefficient of multiple determination 32-
CohenDs Eappa 2)(
collinearity diagnostics 33-
column marginal disparities 2(0
Comma @elimited 100 120 1-20 3110 313G130 313G130
313G130 313G12
Comment .ine 1)20 232
comments 1320 1)-0 1900 2110 2290 2320 2-(0 2)1G)30
2)10 2)30 313
communalities 320
Compact @ata 8ile --G-)0 --G-)0 --G-)0 -)
Compare @ata 8iles 3120 332
comple9 :$ statements 212
compositional aggregate 3110 320G220 320G220 3200
322
Compression 2030 2()
C:1P>4A command 1930 2200 2220 2230 22)G2(0
22)G2(0 22)G2(0 22)G2(0 22)G2(0 23-
concatenation 31-G1)0 31-G1(0 31-G1(0 31-G1(0 31-G
1(
confidence inter%als 3230 332
Confidence inter%als 2(0 22-0 3030 321G230 321G230
321G230 321G230 3230 32)0 3320 3320 3390 3200
3230 32(0 3-0
Contingency Coefficient 2)(0 3010 30)
contingency tale 2)(0 3010 303G)0 303G)0 303G)0 303G
)0 3390 333
Continuation .ine 1)20 20)0 2130 2320 32-
continuity 333
con%ergence tolerance 3300 323
C:$$A.#4A Command 313
correlation matri9 313G1-0 313G1-0 313G120 313G120
313G1-0 31-0 32(G290 32(G290 32(G290 32(G290
33(0 3310 333G330 333G320 3330 332G3)0 332G3)0
332G3)0 33)0 3200 321G230 333G330 3230 3--0
393G920 393G920 393G920 393G92
correspondence analysis 300
C:>'4 command 223G220 223G220 223G220 222
co%ariance matri9 333
CramerDs ? 2))
create a form 310 20G210 200 210 23
create a new %ariale 213G1-0 213G1-0 213G1-0 213G1-0
212G1-0 2220 2220 2300 23-0 2(20 3020 322
Create 'ew @ata 8ile -2
criterion function 3-1
CronachDs alpha 190 312G1-0 312G1-0 312G1-0 31-
cross-factor rotation 322
C$:SS4#&S Command 2)3
cumulati%e percents 222G2-0 222G2-0 222G2-
cur%e fitting 31)G1(0 31)G1(0 31)G1(0 31)G1(0 31)0
31(
$
@#4# command 1)30 19)0 200
data entry control parameters 300 320 --
data entry form -0 90 290 320 320 220 1920 2010 212G1-0
212G1-
data file 10 -G(0 -G(0 -G(0 -G(0 -G(0 100 120 300 320 390
32G3-0 32G3-0 32G3)0 32G3)0 32G200 390 -1G-30
-1G-30 -1G-(0 -1G-20 -1G-20 -30 --G-90 --G)20
--G-90 -)G-90 )20 )3G)20 )3G)20 )30 )20 (20 1200
1230 1-3G--0 1-3G--0 1-3G-20 1-3G-20 1--0 1)3G
)30 1)3G)30 1)3G)30 1)3G)30 1)30 1910 193G2020
193G2020 193G2020 193G2010 20(G110 20(G110
20(G110 2110 2120 21(G190 21(G190 21(G190 21(G
190 22-0 232G330 232G320 232G320 232G320 232G
320 2300 2330 23(0 2220 2-00 2-)0 2))0 2(20 2(9G
900 2(9G900 2(9G900 2(9G900 2(90 302G(0 3020
30)G90 30)G90 30)G100 30)G100 309G100 3100 3120
3220 3320 3310 3390 3220 32)0 3)3G)(0 3)3G)(0
3)3G))0 3)3G))0 311G230 311G200 311G120 311G
330 311G2(0 31)G2-0 322G2-0 32-G330 32)G290
3)3G)(0 331G330 33-G3(0 33-0 33(
@ata 8ile 8ormat -(0 3)2G)(0 3)2G)(0 3)2G))0 3)2G))
data file name -20 1)30 19)0 312G130 312G130 312G130
312G130 3120 31)
data input fields 390 21G220 21G220 210 220 2)
@ata !nput Settings 2-G2)0 2-G2)0 2-G2)0 2-G2)0 -30
--G-)0 --G-)0 --G-)0 --G-)0 -)
data manager 10 9G100 9G100 9G100 9G100 390 210 -1G-20
-1G-20 -1G-20 -1G-20 -10 -20 --G-)0 --G-)0 --0
-)
data trimming 3230 332
deugging 1)20 232
decimal format 31
decomposition of sum of s;uares 3-0
degrees of freedom 2(0 2)20 2)90 2920 3(20 3(2G(-0
3(2G(-0 3(2G(-0 3(2G(-0 3900 3990 332G320 332G
320 332G320 332G320 332G320 339G230 339G210
339G210 339G2-0 339G210 339G230 3220 323G2-0
323G2-0 323G2-0 3290 3-1
@elete # $ecord --0 -)
delete all the %ariales on a form 20
@elete &utton 3(0 (00 2)0
@ASC$!P4!?A Command 2390 299
dichotomous 190 2290 33-0 30(0 333G3(0 333G320 33(0
33-
dichotomous dependent %ariale 33-
@!8 8iles 313
@!88A$A'CA command 23)G3(
@isale S,ips 2)0 -)
)** Inde2 StatPac For Windows User's Manual
discriminant function analysis 3-3
discriminant function coefficients 3--
@>11J command 239G300 239G300 239G300 239G300
239G30
@ummy %ariales -90 239G300 239G300 239G300 239G
300 3)3
@uplicate # 8ield -2
@uplicate &utton 3(0 32
@uplicating ?ariales 3(
+
ecology 1)9
ecology option 1)9
eigen%alue summary tale 303
eigen%alues 3-9
A.SA ,eyword 22)
A-1ail Sur%eys )10 312
Antropy 2)(
A;uiweighting 2(0
e9clude missing data 211
e9ecution time )
e9ploratory research 120 1)
e9port 100 120 12(0 311G130 311G130 311G130 311G130
311G13
F
8ield Placement 22G230 22G230 22G230 22G23
field width 31G320 31G320 31G320 320 320 3-0 1030 1330
1220 2020 213G120 213G130 213G1-0 212G1-0 212G
1-0 212G1-0 21-0 2220 323
file names 10 10G120 10G120 10G120 10G120 100 290 920
1-00 1)3G)30 31)
final coding 2-)G)10 2-)G)10 2-)G-90 2-9G)10 2-9G)10
2)0G)1
8ind @ialog window 2(0 -30 1)(G)90 1)(G)90 1)(G)90
1)(G)9
8ind 'e9t 2(0 -30 1)(
8ind $ecords -3G-20 -3G-20 -3G-20 -3G-20 -3G-2
8ind 4e9t -20 1)(
finite population correction factor 2(0 22-0 2(20 3030
322
8isherDs A9act 4est 333G320 333G320 333G320 333G320
332
fi9ed factors 3(0
8i9ed format -(0 3130 323
font name 210 10)0 109
font siBe 210 10)0 109
8::4':4A command 203
force %ariales 3330 3)1
forcing the constant to Bero 323
8ormat Statement 31G320 31G320 31G320 310 320 32G3-0
32G3-0 320 310 31(G190 31(G190 31(G190 31(G190
31(G190 3230 31(G190 323G230 323
8-ratio 32)0 3-(0 3)9
8$AC>A'C!AS Command 2220 2--G-)0 2--G-)0 2--G
-)0 2--
G
Famma 2)(
gloal options 1)9G(00 1)9G(00 1)9G(00 1)9G(00 1)9G
(0
goal definition 12
goals and oHecti%es 12
FoodmanDs interaction analysis 2)9
goodness-of-fit 321
Fraphics 30 ))0 9(0 1230 1230 1--0 1(-0 1(9
Frid 3-G310 3-G310 3-G300 3)G310 3)G310 320 (30 (90
323
5
<A#@!'F command 202G30 202G30 202G30 202G30
203G3
<!@A 12(0 1)(0 2-3G-30 2-3G-30 2-3G-30 2-3G-30
2-3G-30 2()G((0 2()G((0 2()G((0 2()G((0 2()G
((
hierarchical tree diagram 329
hypothesis 120 1(0 20G210 20G210 200 23G2-0 23G2-0
23G2-0 20G210 23G2-0 3090 32)0 3230 3-(0 3990
33(G200 33(G200 33(G200 33(G200 33(G200 323G
230 3230 3230 3-1G-20 3-1G-20 3-1G-20 3-1G-2
I
!8-4<A' 1910 2100 22-G310 22-G310 22-G2(0 22-G310
22-G2(0 230G310 230G310 2390 2--0 3020 320
import 10 310 -9G)10 -90 )20 )-G)90 )-G)90 )(0 1230
1-30 311G120 311G120 311G1-0 311G120 311G13
increase the field width of a %ariale 212
!ndependent Froups 230 2-0 309G100 309G120 309G120
309G120 310G120 311G120 323G230 323G230 323G
230 323G230 323G23
inferential 3390 321
!nsert &utton 3(
!nstallation 2G30 2G30 2G30 2G30 20 (90 92
!nteraction #nalysis 2)9
interacti%e 10 1(20 3220 3320 3310 3)2
interacti%e prediction 3220 3320 331
internet 10 3G30 3G30 9G110 9G110 9G100 9G100 290 320 310
)10 )-G11(0 )-G11(0 ))G)90 ))G)90 (3G(90 (3G(90
1010 10(0 11(G200 11(G200 1300 133G3)0 133G3)0
13)0 1200 1-3G--0 1-3G--0 1-3G-20 1-3G-20 3110
3120 333
internet sur%eys 90 ))
!nternet Sur%eys 90 320 )10 ))G11(0 ))G11(0 (3G(20 (3G
(20 1200 13)0 312
in%erted matri9 329
iterations 331
StatPac For Windows User's Manual Inde2 )*-
D
Hoin words 2-9
/
EendallDs 4au Statistics 2)(
,eyword &J 2)30 2(10 30-
Eeyword <elp 192
Eeyword !nde9 191
,eywords .: and <! 219
Eolmogoro%-Smirno% 302
Erus,al-Wallis test 3(2
Eurtosis 302
.
.#&A.S command 203G-0 203G-0 203G-0 203G20 202G
-0 2120 2-30 2(2G((0 2(2G((0 2(2G((0 2(2G()0
290
.#F command 23-G3)0 23-G3)
least s;uares line 322
lepto,urtic 3020 309
.A4 command 212G1-0 212G1-0 212
liaility (G90 3(3
lirary 3)G3(0 3)G3(0 3)0 31
linear regression e;uation 31(
.!S4 command 2110 2290 23(G200 23(G200 23(G200
23(0 2200 3200 333
log of the li,elihood function 339
logistic regression 33-
.otus 3110 313
M
1ann-Whitney > 312G13
manually change records -3
matri9 in%ersion 329
ma9imum numer of columns 31
1ean 190 230 2)G2(0 2)G2(0 2)G2(0 2)G2(0 2)G2(0 31G
320 31G320 31G320 31G320 320 33G320 330 320 19(0
213G120 2130 220G210 220G210 220G210 220G210
2210 223G220 223G220 223G220 223G220 2320 233G
320 233G320 233G320 233G320 2320 2-2G--0 2-2G
--0 2-20 2(3G(20 2(3G(20 2(3G(20 2(3G(20 2(30
2900 233G320 2900 29)0 300G3020 300G3030 300G
3020 300G3020 300G3020 30-0 3090 3130 322G230
322G230 322G230 2-2G--0 32-0 332G3)0 332G3)0
2900 3320 33)G3(0 33(0 3300 3330 33(G390 33(G390
300G3020 2900 3220 3-10 3-30 3-20 3)2G)30 3)2G
)30 322G230 3)2G)30 3)(0 3(00 392G9-0 392G9-0
392G9-0 392G9-0 399G3010 399G3010 399G3010
3010 30)0 3200 339G320 339G320 339G300 339G320
339G320 3320 321G2)0 321G2)0 321G2)0 321G2)0
3-3
mean asolute percent error 322
mean percent error 322
mean s;uared error 322
mean sustitution 3320 3300 3390 3220 3-30 3)20 399
1edian 2)0 2120 300G3010 300G3010 300G3020 300G
3010 300G3010 3210 321
1A$FA command 2020 2-)
1erge Procedure 8iles 1(3
1erging @ata 8iles 31-
meso,urtic 302
methods of research 1-
minimum percent 2)0
missing data 320 320 -2G--0 -2G--0 -2G-)0 --G-)0 --G
-)0 -)0 2110 2190 2220 2230 22(0 23(0 2230 2-30
2110 2-30 2)30 2(-0 29-G9)0 29-0 2990 3320 3300
3390 3220 3-30 3)2G)30 3)2G)30 3)30 331
1ode selection 1(2
1o%e ?ariales 3(
multicollinearity 33-
multiple correlation 39-
multiple regression 322
multiple regression e;uation 32-
multiple response 220 300 320 3(0 32G320 32G330 32G320
32G320 31G320 220 )3G)30 )3G)30 )30 (3G(20 (30
1200 133G330 1330 13-G3)0 13-G3)0 139G300 139G
300 13)0 2020 2290 220G220 2220 22)G290 22)G-10
22)G2(0 22)G2(0 22)G290 2-10 2-)0 2((G900 2((G
900 2((G(90 2900 29)0 333G3(0 333G3(
7
' A;uals option 293
net category 2)2
networ, 2G30 2G30 2G30 3
'AW command 213G130 213G130 213G130 213G130 2130
222G230 222G230 222G230 222G230 222G230 2220
2(2
'o @elay 1(-
non-hierarchical cluster analysis 32-
non-missing 2110 223G2-0 223G2-0 223G2-0 223G220
223G2-0 22(0 2-30 301
non-parametric 3120 3(2
normal distriution 2)0 2)90 3020 312G130 312G130 312G
130 33-0 3310 330G310 330G310 330G310 331
normaliBe 191G920 191G920 1910 232G3-0 232G3-0 232G
3-0 232G3-
':$1#.!LA command 232G3-0 232G3-0 232G3-0
232G3-0 232G3-
'th record selection 211
null hypothesis 120 20G210 20G210 200 22G2-0 22G2-0
22G2-0 22G2-0 22G2-0 33(G200 33(G200 33(G200
33(G200 33(G200 323G230 323G230 3230 3230 3-1G
-20 3-1G-20 3-1G-20 3-1
numer of days etween two dates 2230 333
)*; Inde2 StatPac For Windows User's Manual
3
oli;ue reference structure analysis 320
oli;ue rotation 322
:dds ratio 2)(G)90 2)(G)90 2)(G)90 2)(0 2)9
-ne Analysis 1)-0 1930 2-0G-10 2-0G-10 2-0G-10 2-0G
-10 2-30 300
:ne ?ariale Per Page 23
one-analysis 2-00 2-20 300G3010 300G3010 300G3010
300G3010 300
open-ended responses 310 2290 2--G-)0 2--G-)0 2-)0
2)0
:P4!:'S command 20-G)0 20-0 23)0 2(20 3030 3320
3390 323G220 323G220 323G220 3)00 300
:$ operator 212
order of ,eywords 193
ordinary least s;uares 31)
:utlier 331
outlier adHustment 323
outliers 323
:utput selection 1(-
P
page heading 930 9)0 1)-0 1930 202G30 202G30 202G30
29-
Page ?iew 23
paper orientation 1)9
parametric 210 2(3G(30 2(3G(30 2(30 3120 3(2
partial correlation matri9 32(
passi%e %ariales 302
Pause utton 1-90 1(-
percentage ase 20)0 22)0 2()0 30(
perceptual mapping 300
permanently change an option 20-
Phi 2))
Piping ))0 11(G190 11(G190 11(G190 11(G190 12)
platy,urtic 302
Poisson @istriution 3390 3330 33-
population 1-G1)0 1-G1)0 1-G1)0 1-G1(0 1-G1(0 2)G2(0
2)G2(0 2)G2(0 1-G1)0 1(2G(30 1(20 1(30 22-0 2(20
290G910 290G910 290G910 302G30 3020 2900 3020
3120 31(0 32(0 3(00 322G2-0 322G2-0 322G2-0
322G2-0 322G2-0 329G320 329G320 3390 3320 320G
210 320G210 320G210 320G210 320G210 323G220
323G2-0 323G2-0 323G220 323G2-0 3-2
posterior proaility 3-2
powered-%ector 3390 320
pre-coding 2-)G)00 2-)G)00 2-)G)10 2-)G)10 2-)0
2-(G)10 2)1
prediction inter%als 3230 332
principal components analysis 332
principal factor analysis 320
print a codeoo, 39
Print a Procedure 8ile 1(3
prior proailities 3)0
proaility of a defined range 330G320 330G320 330G310
330G32
proaility of a B %alue 330
proaility of an 8 -ratio 333
proit regression 33-
procedure 1G90 -G(0 -G(0 -G(0 )G(0 9G100 9G100 90 11G
120 9G100 120 200 220 310 --0 )10 )-0 ((G(90 ((G(90
(90 1)1G(20 1)1G(20 1)1G(20 1)1G(20 1)1G(20
190G910 190G910 191G990 1910 193G2020 193G2030
193G990 193G2110 201G30 201G100 202G100 202G
110 20-G100 213G1-0 213G120 213G1-0 213G1-0
21-0 2200 223G310 222G2(0 222G2(0 222G310 222G
2)0 2290 231G320 231G3-0 2320 2330 23-0 231G330
231G330 193G2020 2310 23)G3(0 23)G3(0 23)G3(0
23)G3(0 2210 2-00 2-20 2-30 2--0 2230 2--G-)0
2-)0 2)30 2230 2)30 2(20 2((0 290G920 290G920
2920 29-G9(0 29-0 201G100 29)0 31)0 23)G3(0 3290
3300 332G330 332G330 332G330 3320 3300 32-G2)0
32-G2)0 32)0 3)10 3)30 3(0G(10 332G330 3(0G(10
3(20 311G130 311G130 3110 3130 31-0 320G220
320G220 320G220 3220 32(0 3310 332
procedure file 1G90 -G(0 9G100 90 120 ((0 1)1G)30 1)1G
)30 1)1G)30 1)30 1)2G)90 1)2G)90 1)2G)90 1)2G
(30 1(3G(30 1(3G(30 1)2G)90 1930 19-0 1990 202G
30 2020 203G20 2020 2230 231G330 2310 2320 23)0
2)30 32(
Procedure6s7 4o $un 1(2
Processing time )
@
Cuartiles 303
Cuic, Codeoo, 3-0 310 323
;uotation mar,s 210G110 210G110 210G110 210G110 2130
22)0 2310 313
R
random digit dialing tale 3120 322G2-0 32-
$andom error 19G200 19G200 19G20
random factors 3(0
random numer tale 3120 322
random sample 1)0 3(00 3120 322G2-0 32-0 322
$aoDs 8-statistic 39(
$AC:@A command 2020 2120 21(G190 21(G190 21(0
2-3
$ecord #d%ance 2-0 -30 -)
$ecord 'umer -3G--0 -3G-30 -3G-30 -3G--0 --0 -(0
1-90 19-0 20(G110 20(0 2110 2330 23(G390 23(G390
23(0 2)10 2)3
redundancy criteria 39(
$egression 2-0 23-0 239G300 239G300 239G300 239G300
2330 2)(0 3120 31)G1(0 31)G1(0 31)G1(0 320G290
320G290 320G2)0 3290 331G3)0 331G3)0 331G310
33(G300 330G310 3310 333G330 333G330 3330 33-G
3)0 33-G3)0 33-G390 33(G390 33(G390 3-30 3-(0
StatPac For Windows User's Manual Inde2 )*'
3)30 3930 30(0 3390 329G-10 329G-00 329G-00
329G-0
regression coefficients 32)0 33(
regression e;uation 322
regression line 322
relational operators 211G120 211G120 211G120 211G120
22(G310 230G310 230G310 230G31
$eliaility 190 3120 31-0 3(3
$A1 command 232
$emo%ing 30 23)0 333
$eplace @ialog window 2(0 1)9
reser%ed words 2330 311
residual 3220 331
$esidual #nalysis 2)9
residual autocorrelation 323
response categories 21G220 21G220 21G220 21G220 320
10(0 22-0 2-30 2--0 2)0G)20 2)0G)20 2)0G)20 2)20
2()
$esults Aditor 1(-0 1(9
$ich 4e9t 8ormat 30 110 320 210 1(-
roust regression 320
r-s;uared 3210 32-
$S>1 command 231G32
rules go%erning %ariale names 32
$un a Procedure 8ile 1(30 1(3
$un utton 1(3G(20 1(3G(20 1(3G(20 1(3G(2
$>' command 231
S
Sample SiBe for 1eans 3-2
Sample SiBe for Percents 3-1
Sampling methods 1)
S#?A command 193G920 1930 19)G990 19)G990 19)G
990 19)G990 2020 2090 2120 22)
Script 2G30 2G30 90 11G120 110 ))G)(0 ))G11(0 ))G11(0
(1G(20 (2G910 9(0 10-G110 1130 11-0 1190 120G2(0
1300 133G330 13-G3(0 130G200 133G200 133G200
1220 120G2-0 120G2-
Search 1ethod -2
seasonality 23)G390 23)G390 23)G390 23)G39
select a specific %ariale 2)
SA.AC4 command 1)20 1930 20(G110 20(G110 20(G110
20(G110 2320 239G200 2200 2--0 333
select non-lan, records 211
Send A-1ail 1-2
Send A-1ail !n%itations 90 120 1130 1-30 1-20 1-9
serial numer (
simple structure analysis 339
S,ewness 302
S,ip codes 300 33G320 330 390 330 220 2)0 -)
slope of regression line 322
small ' 2990 32)
SomersD d 2)(
S:$4 command 19(0 232G330 232G330 333
Sounde9 -2
Space etween Columns 23
S4#CE command 21-G1(0 21-G1(0 21-G1(0 21-G1)0
302
stac,ing %ariales 302
standard de%iation 2)G2(0 2)0 2320 2--0 2(30 300G3020
3000 3020 30-0 313G120 313G120 3220 32)0 3310
3-30 3)(0 39-0 339G310 339G320 3390 331G320 3320
321G220 321G2-0 323G2-0 3-00 3-2
Standard Arror 2(0 22-0 2)90 2(3G(20 2(3G(20 2(3G(20
2(3G(20 3030 3090 313G120 313G120 3120 3220 3230
32)0 3310 3320 33(0 33(0 321G220 3210 323G2-0
323G2-0 323G2-0 323G220 32(G290 32(G290 32(G
290 32(0 3-0G-1
standard error of estimate 322
standard error of the multiple estimate 32)
standardiBed coefficients 39-
standardiBed residual 2)90 3230 331
Starting Columns 3(
Starting Page 'umer 1(2G(-0 1(20 1(-0 190
Statistics Calculator 3120 32-0 339G300 339G300 3300
323
StatPac"!ni file 10 20 110 130 300 3-0 13-0 1390 1210 1-9G
)00 20-0 2130 3130 31-
stu 2030 2--0 2(1G(-0 2(1G(30 2(1G(30 2(3G()0 2(-0
2(9G900 2(9G900 29-G990 29-G9(0 29-G9(0 29-G
9(0 3030 30(0 313
S4>@J command 1)3G)30 1)3G)30 1)3G)30 1(30 19-G
2000 19-G990 19-G2000 202
study design 10 9G100 90 100 290 330 3-G3)0 3-G3)0 3-G
3)0 390 2)0 22G1)00 -10 --0 -90 (20 2010 213G120
213G120 2-00 2)-0 2(20 2(-0 2(90 2920 30)G(0
30)G(0 3330 3-20 3)10 3(10 311G120 311G120 32-
Style files (9
sufile 19(G2000 19(G2000 19(G2000 2090 2310 2330 233
sugroup 302G(0 302G)0 302G(
S>1 command 1330 223G2-0 2230 22-
supplemental heading 2-20 293
Support 20 3G20 3G20 (0 )G(0 ))
Systematic error 20
:
4a @elimited 12G130 1130 12-G2)0 12-G2)0 1(90 3110
313G130 313G130 313G13
4ale of Contents 1(9
4echnical support 20 )G(
telephone inter%iews 1-
template 9G100 9G100 100 32G390 39G200 39G200 200 -1G
-20 -1G-20 -20 -(0 1(-
4est mode 1--0 1(2
three-way crossta 2)3
4!4.A command 203
tolerance le%el 339
total inertia 301
4:4#. ,eyword 2(-0 29-G9)0 29-G9)0 29-G9)
transform an e9isting %ariale 220
)-> Inde2 StatPac For Windows User's Manual
trend 230 23)G390 23)G390 23)G39
troule-shoot a procedure 23(
true aggregate 3200 322
t-test 230 2-0 22-0 2930 309G120 309G120 309G120 3(10
33)G390 33)G200 33)G390 322G230 322G230 3230
3290 3-1
44AS4 Command 309G100 309G100 309G10
two-tailed proaility 220 22-0 2)90 330G320 330G320
330G330 3330 33(G390 33(G200 33(G200 323G230
3230 323G2-0 323G2-0 32-0 3290 3-1
two-way crosstas 2)3
types of %ariales 30
U
unalanced 3)3
unweighted means 3)3
>pdating 20 1-2
>tility Programs 3110 323
8
? 'umers 1)-0 200
%alid codes 300 330 390 33G330 33G330 330 22
?alidity 9G100 9G100 1(0 -(0 133G390 133G390 319
?alue .ael <!@A 2-30 2()
?alue laels 300 32G330 32G330 32G330 33G330 3(G390
3(G390 3(0 390 310 32G330 32G330 23G220 23G220
23G220 23G220 )30 (3G11(0 (3G11(0 10(0 1200
12(G330 12(G320 13)0 203G-0 203G20 203G-0 203G
-0 212G1)0 212G1)0 2300 23(0 223G220 223G220
223G220 223G220 22)G-00 22)G-10 22)0 229G-10
229G-10 2-30 2--0 2)-0 2(1G(20 2(1G(20 2(1G(20
2(1G(20 2(3G(90 2(3G(-0 2(2G(90 2((G(90 2920
29(0 302G(0 302G(0 302G(0 302G(0 3)10 3(10 3030
3130 323
?alue .aels !ndent 23
%ariaility 200 2)0 322G230 322G230 32)0 3320 3310 3330
3-10 3-90 3)30 3(00 3()0 3(90 3010 3210 32)0 3-0G
-10 3-0G-10 3-0G-10 3-0G-1
?ariale @etail 3-0 39G320 39G320 300 390 20G210 20G
210 22G2)0 2)0 -30 -(0 1))G)(0 1))G)(0 1))0 323
?ariale 8ormat 300 3-G3(0 3(0 320 3-0 2220 22)0 312
?ariale .ael !ndent 23G230 23G23
?ariale .ist 30G320 300 320 390 20G210 20G210 220 2)0
-30 -(0 1)1G)20 1)1G)20 1)1G)20 1)1G)20 1)20
1)-G))0 1)1G)20 1)-G))0 1)-G))0 19)G9(0 19)G
9(0 19)G9(0 19)G9(0 200G2020 200G2020 200G2020
2020 2030 21-G1(0 21-G1(0 223G220 223G2-0 232G
330 223G220 232G3)0 232G3)0 23(0 23(0 2230 22(0
2-10 2-20 2)30 2(10 2(20 2((G(90 2((G(90 29)G9(0
29)0 299G3010 299G3010 2990 3010 302G-0 3020
309G110 309G110 309G110 309G110 3130 31)0 322G
2-0 3330 33-0 332G330 332G330 3200 32-0 3-20 3)10
3)3G)-0 3)3G)(0 3))0 3(2G(30 3(20 3(3G900 3(3G
900 393
?ariale .ist window 320 220 -(0 1)20 1)-G))0 1)1G)20
1)-G))0 1)-G))0 202
%ariale name 300 31G320 310 3(0 320 330 2)0 )-0 (30
1--0 1(20 2030 213G1-0 213G1-0 21(0 222G230 2220
2220 23(0 2330 222G230 222G230 222G230 222G230
2--0 2(10 2(20 29(0 3030 30(0 3130 31-0 3220 33-0
3320 3390 3220 3-30 3(20 300
?ariale 'umers 390 220 -(0 )30 23-0 23(0 22(0 2(90
32-0 32-0 3-20 3930 319
?ariale Separation 23
?ariale 4e9t 8ormatting 200 22
%ariale type 300 212
?ariance 2)0 2)90 3020 3210 32-0 32(0 3330 3320 332G330
332G330 332G3(0 332G3(0 3210 323G230 323G230
32)0 3-10 3-(0 3)30 3)20 3(0G(20 3(0G(20 3(30
3(3G910 3)30 3930 39)0 3990 3010 3090 32-0 3-0
%ariance inflation factors 33(
%ariance-co%ariance matri9 32(
%arima9 3390 3200 323
?eratim &laster 2-)G-90 2-)G-90 2-)G-90 2-)0 2-90
2)10 313
%eratim response 220 2-)
%iew mode 23
W
warranty (
we site 20 9G110 9G110 ))G(30 ))G)90 (90 1200 1220
1-20 1-90 312
WA!F<4 command 233G320 233G320 233G320 233G320
290
weighted cross-factor rotation 320
weighting 1)9G(30 1)9G(30 2310 233G330 233G330 233G
330 2330 2330 2900 2930 393
Wilco9on test 312
Wil,Ds lamda 399
Wil,sD lamda 3-(
word processor 30 20 110 31G320 31G320 310 310 390 1(-0
2-90 313
W$!4A command 1920 19)G2010 19)G2010 2090 21-0
2320 313
E
JateDs Correction 2)90 2920 333
JuleDs C and Jules J 2)(
G
Bero %alues 223
Boom factor 1)9
StatPac For Windows User's Manual Inde2 )-1

Anda mungkin juga menyukai