67 lines
1.7 KiB
Python
67 lines
1.7 KiB
Python
"""Spector and Mazzeo (1980) - Program Effectiveness Data"""
|
|
from statsmodels.datasets import utils as du
|
|
|
|
__docformat__ = 'restructuredtext'
|
|
|
|
COPYRIGHT = """Used with express permission of the original author, who
|
|
retains all rights. """
|
|
TITLE = __doc__
|
|
SOURCE = """
|
|
http://pages.stern.nyu.edu/~wgreene/Text/econometricanalysis.htm
|
|
|
|
The raw data was downloaded from Bill Greene's Econometric Analysis web site,
|
|
though permission was obtained from the original researcher, Dr. Lee Spector,
|
|
Professor of Economics, Ball State University."""
|
|
|
|
DESCRSHORT = """Experimental data on the effectiveness of the personalized
|
|
system of instruction (PSI) program"""
|
|
|
|
DESCRLONG = DESCRSHORT
|
|
|
|
NOTE = """::
|
|
|
|
Number of Observations - 32
|
|
|
|
Number of Variables - 4
|
|
|
|
Variable name definitions::
|
|
|
|
Grade - binary variable indicating whether or not a student's grade
|
|
improved. 1 indicates an improvement.
|
|
TUCE - Test score on economics test
|
|
PSI - participation in program
|
|
GPA - Student's grade point average
|
|
"""
|
|
|
|
|
|
def load():
|
|
"""
|
|
Load the Spector dataset and returns a Dataset class instance.
|
|
|
|
Returns
|
|
-------
|
|
Dataset
|
|
See DATASET_PROPOSAL.txt for more information.
|
|
"""
|
|
return load_pandas()
|
|
|
|
|
|
def load_pandas():
|
|
"""
|
|
Load the Spector dataset and returns a Dataset class instance.
|
|
|
|
Returns
|
|
-------
|
|
Dataset
|
|
See DATASET_PROPOSAL.txt for more information.
|
|
"""
|
|
data = _get_data()
|
|
return du.process_pandas(data, endog_idx=3)
|
|
|
|
|
|
def _get_data():
|
|
data = du.load_csv(__file__, 'spector.csv', sep=r'\s')
|
|
data = du.strip_column_names(data)
|
|
data = data.iloc[:, [1, 2, 3, 4]]
|
|
return data.astype(float)
|