/notify_user/pymodules/python2.7/lib/python/statsmodels-0.5.0-py2.7-linux-x86_64.egg/statsmodels/datasets/strikes/data.py
Python | 70 lines | 64 code | 2 blank | 4 comment | 0 complexity | e93512f6314502ae898034480cbb2510 MD5 | raw file
#! /usr/bin/env python
"""U.S. Strike Duration Data"""

__docformat__ = 'restructuredtext'

# Descriptive metadata for the dataset. These are plain module-level strings;
# TITLE mirrors the module docstring so the two cannot drift apart.
COPYRIGHT = """This is public domain."""
TITLE = __doc__

# Provenance of the data. The article title in the citation is enclosed in a
# balanced pair of double quotes.
SOURCE = """
This is a subset of the data used in Kennan (1985). It was originally
published by the Bureau of Labor Statistics.
::
Kennan, J. 1985. "The duration of contract strikes in US manufacturing."
`Journal of Econometrics` 28.1, 5-28.
"""

# One-paragraph and extended descriptions of the dataset.
DESCRSHORT = """Contains data on the length of strikes in US manufacturing and
unanticipated industrial production."""
DESCRLONG = """Contains data on the length of strikes in US manufacturing and
unanticipated industrial production. The data is a subset of the data originally
used by Kennan. The data here is data for the months of June only to avoid
seasonal issues."""

# Suggested notes: observation/variable counts and variable definitions.
NOTE = """
Number of observations - 62
Number of variables - 2
Variable name definitions::
duration - duration of the strike in days
iprod - unanticipated industrial production
"""
- from numpy import recfromtxt, column_stack, array
- from statsmodels.datasets import utils as du
- from os.path import dirname, abspath
def load():
    """
    Read the strikes data and wrap it with ``du.process_recarray``.

    The record array produced by ``_get_data`` is handed over with
    ``endog_idx=0`` and ``dtype=float``.

    Returns
    -------
    Dataset instance:
        See DATASET_PROPOSAL.txt for more information.
    """
    return du.process_recarray(_get_data(), endog_idx=0, dtype=float)
def load_pandas():
    """
    Read the strikes data and wrap it with ``du.process_recarray_pandas``.

    The record array produced by ``_get_data`` is handed over with
    ``endog_idx=0`` and ``dtype=float``.

    Returns
    -------
    Dataset instance:
        See DATASET_PROPOSAL.txt for more information.
    """
    return du.process_recarray_pandas(_get_data(), endog_idx=0, dtype=float)
def _get_data():
    """
    Parse ``strikes.csv``, located next to this module, into a record array.

    Returns
    -------
    data : recarray
        The CSV contents as returned by ``numpy.recfromtxt`` with
        ``names=True`` (field names come from the header row) and
        ``dtype=float``.
    """
    filepath = dirname(abspath(__file__))
    # Use a context manager so the file handle is closed as soon as parsing
    # finishes, rather than being left open until garbage collection.
    with open(filepath + '/strikes.csv', 'rb') as csv_file:
        data = recfromtxt(csv_file, delimiter=",", names=True, dtype=float)
    return data