statsintro_python/ISP/Exercise_Solutions/S2_python.py at master · datapython/statsintro_python

History

52 lines (38 loc) · 1.36 KB

Raw

''' Solution to Exercise "Data Input" '''

# author: Thomas Haslwanter, date: Oct-2015

import numpy as np

import matplotlib.pyplot as plt

import pandas as pd

import urllib

import io

import zipfile

def getDataDobson(url, inFile):

'''Extract data from a zipped-archive'''

# get the zip-archive

GLM_archive = urllib.request.urlopen(url).read()

# make the archive available as a byte-stream

zipdata = io.BytesIO()

zipdata.write(GLM_archive)

# extract the requested file from the archive, as a pandas XLS-file

myzipfile = zipfile.ZipFile(zipdata)

xlsfile = myzipfile.open(inFile)

# read the xls-file into Python, using Pandas, and return the extracted data

xls = pd.ExcelFile(xlsfile)

df = xls.parse('Sheet1', skiprows=2)

return df

if __name__ == '__main__':

# 1.1 Numpy --------------------

# Read in a CSV file, and show the top:

inFile1 = 'swim100m.csv'

data = pd.read_csv(inFile1)

print(data.head())

# Read in an excel file, and show the bottom

inFile2 = 'Table 2.8 Waist loss.xls'

xls = pd.ExcelFile(inFile2)

data = xls.parse('Sheet1', skiprows=2)

print(data.tail())

# Read in a zipped data-file from the WWW

url = r'http://cdn.crcpress.com/downloads/C9500/GLM_data.zip'

inFile = r'GLM_data/Table 2.8 Waist loss.xls'

df = getDataDobson(url, inFile)

print(df.tail())

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

S2_python.py

Latest commit

History

S2_python.py

File metadata and controls