import numpy as np
from nose.tools import assert_equal
from nose.tools import assert_not_equal
import pandas as pd


# swap cases
def swap_cases(s):
    '''Return ``s`` with the case of each character flipped.

       arg: string
       return: string (cases swapped)

       Characters without a case (digits, punctuation) come back unchanged.

       Staff's solution contains one line of code.
    '''
    ### BEGIN SOLUTION
    # Anything not reported as lowercase goes through lower(); only
    # lowercase characters are upper-cased.
    return "".join(ch.lower() if not ch.islower() else ch.upper() for ch in s)
    ### END SOLUTION


# Visible checks: mixed case, digits/punctuation passthrough, empty string,
# and that an all-uppercase input is actually changed.
assert swap_cases('ABcDef') == 'abCdEF'
assert swap_cases('hl4434*9889DdfF') == 'HL4434*9889dDFf'
assert swap_cases('') == ''
assert_not_equal(swap_cases('ABC'), 'ABC')
### BEGIN HIDDEN TESTS
# Hidden checks: single character, input with no letters at all, and one
# long repeated mixed-case/punctuation string.
assert swap_cases('H') == 'h'
assert swap_cases('***(((())))') == '***(((())))'
assert_not_equal(swap_cases('Hello'), 'Hello')
assert swap_cases('DSFAsflaskdflsakflas***(((())))DSFAsflaskdflsakflas***(((())))DSFAsflaskdflsakflas***(((())))DSFAsflaskdflsakflas***(((())))DSFAsflaskdflsakflas***(((())))DSFAsflaskdflsakflas***(((())))DSFAsflaskdflsakflas***(((())))DSFAsflaskdflsakflas***(((())))DSFAsflaskdflsakflas***(((())))DSFAsflaskdflsakflas***(((())))DSFAsflaskdflsakflas***(((())))') == 'dsfaSFLASKDFLSAKFLAS***(((())))dsfaSFLASKDFLSAKFLAS***(((())))dsfaSFLASKDFLSAKFLAS***(((())))dsfaSFLASKDFLSAKFLAS***(((())))dsfaSFLASKDFLSAKFLAS***(((())))dsfaSFLASKDFLSAKFLAS***(((())))dsfaSFLASKDFLSAKFLAS***(((())))dsfaSFLASKDFLSAKFLAS***(((())))dsfaSFLASKDFLSAKFLAS***(((())))dsfaSFLASKDFLSAKFLAS***(((())))dsfaSFLASKDFLSAKFLAS***(((())))'
### END HIDDEN TESTS


def sum_of_sqs_of_pos_even_elms_of_list(_list):
    '''Sum the squares of the elements that are both even and greater than 0.

       args: list
       return: int (0 when no element qualifies)

       Elements that are odd, zero, negative, or leave a non-zero remainder
       modulo 2 (e.g. 2.4) are skipped.

       Staff's solution contains one line of code.
    '''
    ### BEGIN SOLUTION
    return sum(value ** 2 for value in _list if value % 2 == 0 and value > 0)
    ### END SOLUTION

# Visible checks: only positive even values contribute their square; odd
# values, negatives and non-integral floats are ignored.
assert sum_of_sqs_of_pos_even_elms_of_list([2,4]) == 20
assert sum_of_sqs_of_pos_even_elms_of_list([2,4,3,6,7,4,3]) == 72
assert sum_of_sqs_of_pos_even_elms_of_list([-6,4,2,2.4,204.2]) == 20
### BEGIN HIDDEN TESTS
# Hidden checks: nothing qualifies (lone float; zeros/odd/negative), then a
# plain mixed list.
assert sum_of_sqs_of_pos_even_elms_of_list([5.8]) == 0
assert sum_of_sqs_of_pos_even_elms_of_list([0,0,1,-2]) == 0
assert sum_of_sqs_of_pos_even_elms_of_list([4,5,6,3,2]) == 56
### END HIDDEN TESTS


def extract_2nd_last_row(arr):
    '''Return the second-to-last row of ``arr``.

       arg: ndarray
       You can assume that ndarray has at least 2 rows.

       return: ndarray

       Staff's solution contains one line of code.
    '''
    ### BEGIN SOLUTION
    # Index -2 on the first axis, full slice on the second.
    return arr[-2, slice(None)]
    ### END SOLUTION


# Visible check: with three rows, the second-to-last row is the middle one.
arr2 = np.array([[5,52,2],[6,43,2], [1,2,4]])
assert (extract_2nd_last_row(arr2) == np.array([6,43,2])).all()


def get_zeroth_and_first_rows(a):
    '''
    Build an array made only of copies of row 0 and row 1 of ``a``.

    arg: ndarray of shape (n,m) where n and m are at least 2.

    return ndarray of shape ((n*m), m)

    Staff's solution contains one line of code.

    '''

    ### BEGIN SOLUTION
    # Each element's remainder mod 2 (0 or 1), flattened in row-major order,
    # is used as a row index: one output row per input element.
    return a[np.asarray(a % 2).reshape(-1)]
    ### END SOLUTION


# Shape check: a (40, 60) input has 2400 elements, so 2400 rows of width 60.
arr3 = np.ones((40,60), dtype=np.int16)
assert_equal(get_zeroth_and_first_rows(arr3).shape, (2400, 60))

# Row-by-row check: odd elements select row 1 ([2,2,2]), even elements
# select row 0 ([1,1,1]).
arr1 = np.array([[1,1,1],[2,2,2],[3,3,3]])
assert (get_zeroth_and_first_rows(arr1) == np.array([[2, 2, 2],
                                                     [2, 2, 2],
                                                     [2, 2, 2],
                                                     [1, 1, 1],
                                                     [1, 1, 1],
                                                     [1, 1, 1],
                                                     [2, 2, 2],
                                                     [2, 2, 2],
                                                     [2, 2, 2]])).all()

# Mixed parities: the first two elements (1, 23) are odd, the other seven even.
arr2 = np.array([[1,23,4],[4,2,4],[40,0,0]])
assert (get_zeroth_and_first_rows(arr2) == np.array([[ 4,  2,  4],
       [ 4,  2,  4],
       [ 1, 23,  4],
       [ 1, 23,  4],
       [ 1, 23,  4],
       [ 1, 23,  4],
       [ 1, 23,  4],
       [ 1, 23,  4],
       [ 1, 23,  4]])).all()
### BEGIN HIDDEN TESTS
# All-zero (5, 4) input: every element selects row 0, giving 20 zero rows.
arrh1 = np.zeros((5,4), dtype=np.int16)
assert (get_zeroth_and_first_rows(arrh1) == np.array([[0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0],
                                                   [0, 0, 0, 0]])).all()


### END HIDDEN TESTS


def mean_and_dev_students(marks):
    '''
    Compute the mean and the standard deviation of each row of ``marks``.

    args: ndarray
    return: tuple of ndarrays (mean_arr, std_arr)

    Staff's solution contains one line of code.
    '''
    ### BEGIN SOLUTION
    # axis=1 reduces across columns, leaving one value per row.
    return tuple(stat(marks, axis=1) for stat in (np.mean, np.std))
    ### END SOLUTION


# Visible checks: row means are exact; row standard deviations are bracketed
# between a lower and an upper bound instead of compared for equality.
arr1 = np.array([[2,3,4],[3,42,3]])
assert (mean_and_dev_students(arr1)[0] == (np.array([ 3., 16.]))).all()
assert (mean_and_dev_students(arr1)[1] >= (np.array([ 0.8, 18.]))).all() # Floating point equality could be problematic. More on that in a computer systems course :) 
# Upper bound for the second row is 18.5 (the value is about 18.38); the
# previous bound of 185 made this check almost meaningless.
assert (mean_and_dev_students(arr1)[1] <= np.array([ 0.85, 18.5])).all()
### BEGIN HIDDEN TESTS
# Hidden checks: same bracketing approach for both the means and the
# standard deviations of a second array.
arr2 = np.array([[24,33,4],[43,442,34]])
assert (mean_and_dev_students(arr2)[0] >= (np.array([ 20., 173.]))).all()
assert (mean_and_dev_students(arr2)[0] <= (np.array([ 20.5, 173.5]))).all()

assert (mean_and_dev_students(arr2)[1] >= (np.array([ 12., 190. ]))).all()
assert (mean_and_dev_students(arr2)[1] <= (np.array([ 12.5, 190.5 ]))).all()

### END HIDDEN TESTS


def mean_and_dev_exams(marks):
    '''
    Compute the mean and the standard deviation of each column of ``marks``.

    args: ndarray
    return: tuple of ndarrays (mean_arr, std_arr)

    Staff's solution contains one line of code.
    '''
    ### BEGIN SOLUTION
    # axis=0 reduces across rows, leaving one value per column.
    return tuple(stat(marks, axis=0) for stat in (np.mean, np.std))
    ### END SOLUTION


# Visible checks: per-column mean and standard deviation of a two-row array.
arr1 = np.array([[2,3,4],[3,42,3]])
assert (mean_and_dev_exams(arr1)[0] == (np.array([ 2.5, 22.5,  3.5]))).all()
assert (mean_and_dev_exams(arr1)[1] == (np.array([ 0.5, 19.5,  0.5]))).all()
### BEGIN HIDDEN TESTS
# Hidden checks: same statistics on a second two-row array.
arr2 = np.array([[24,33,4],[43,442,34]])
assert (mean_and_dev_exams(arr2)[0] == (np.array([ 33.5, 237.5,  19.]))).all()
assert (mean_and_dev_exams(arr2)[1] == (np.array([  9.5, 204.5,  15. ]))).all()

### END HIDDEN TESTS


def cumulative_avg(marks):
    '''
    Return the total and the standard deviation over all entries of ``marks``.

    NOTE: despite the function name, the first element of the result is the
    sum of every entry (``np.sum``), not the mean.

    args: ndarray
    return: tuple (total, std_dev)

    Staff's solution contains one line of code.
    '''
    ### BEGIN SOLUTION
    # No axis argument: both reductions run over the whole array.
    return tuple(reduce_all(marks) for reduce_all in (np.sum, np.std))
    ### END SOLUTION


# Visible checks: the integer total is compared exactly; the standard
# deviation is a non-terminating float, so it is compared with a tolerance
# rather than with ==.
arr1 = np.array([[2,3,4],[3,42,3]])
assert cumulative_avg(arr1)[0] == 57
assert np.isclose(cumulative_avg(arr1)[1], 14.545904349105742)
### BEGIN HIDDEN TESTS
# Hidden checks: same comparison strategy on a second array.
arr2 = np.array([[24,33,4],[43,442,34]])
assert cumulative_avg(arr2)[0] == 580
assert np.isclose(cumulative_avg(arr2)[1], 154.91036834964348)
### END HIDDEN TESTS


def encode(arr):
    '''Turn a single row of integer values into a 0/1 indicator matrix.

       args: ndarray of shape (1,m)
       returns: ndarray of shape (m, y). Figuring out y is part of this problem.

       Staff's solution has 7-8  lines of code.
       '''
    ### BEGIN SOLUTION
    # One output row per input entry; columns run from 0 up to the largest
    # value present in arr.
    _, n_entries = arr.shape
    n_values = np.max(arr) + 1

    # Start from an all-zero float matrix.
    indicator = np.zeros((n_entries, n_values))

    # Integer-array indexing: row i is paired with column arr[0, i]. The
    # (n_entries,) row index broadcasts against the (1, n_entries) arr.
    indicator[np.arange(n_entries), arr] = 1

    return indicator
    ### END SOLUTION


# Visible check: row i of the result has its single 1 in column arr1[0, i].
arr1 = np.array([1, 4, 3, 2]).reshape(1,-1)
assert (encode(arr1) == np.array([[0., 1., 0., 0., 0.],
                                  [0., 0., 0., 0., 1.],
                                  [0., 0., 0., 1., 0.],
                                  [0., 0., 1., 0., 0.]])).all()


# Visible check: a permutation of 0..7 yields an 8x8 permutation matrix.
arr2 = np.array([7,4,2,3,1,5,6,0]).reshape(1,-1)
assert (encode(arr2) == np.array([[0., 0., 0., 0., 0., 0., 0., 1.],
                                 [0., 0., 0., 0., 1., 0., 0., 0.],
                                 [0., 0., 1., 0., 0., 0., 0., 0.],
                                 [0., 0., 0., 1., 0., 0., 0., 0.],
                                 [0., 1., 0., 0., 0., 0., 0., 0.],
                                 [0., 0., 0., 0., 0., 1., 0., 0.],
                                 [0., 0., 0., 0., 0., 0., 1., 0.],
                                 [1., 0., 0., 0., 0., 0., 0., 0.]])).all()


### BEGIN HIDDEN TESTS
# Hidden check: the column count follows the largest value (10 -> 11
# columns), not the number of entries.
arr2 = np.array([10, 4, 3, 2]).reshape(1,-1)
assert (encode(arr2) == np.array([[0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 1.],
                                 [0., 0., 0., 0., 1., 0., 0., 0., 0., 0., 0.],
                                 [0., 0., 0., 1., 0., 0., 0., 0., 0., 0., 0.],
                                 [0., 0., 1., 0., 0., 0., 0., 0., 0., 0., 0.]])).all()


# Hidden shape check on a large input.
# NOTE(review): the result is a 10000 x 10000 float64 array (~800 MB).
arr3 = np.arange(10000).reshape(1,-1)
assert_equal(encode(arr3).shape, (10000,10000))

### END HIDDEN TESTS


def to_df(arr):
    '''
    Wrap ``arr`` in a DataFrame whose columns are labelled
    "Final exam 1", "Final exam 2", ... (one label per column of ``arr``).

    arg: ndarray of shape (m,n)
    return: tuple (df, ndarray) -- the DataFrame and its ``.values``

    Staff's solution contains 4 lines of code.
    '''

    ### BEGIN SOLUTION
    exam_numbers = range(1, arr.shape[1] + 1)
    headers = ["Final exam " + label for label in map(str, exam_numbers)]
    frame = pd.DataFrame(arr, columns=headers)
    return frame, frame.values
    ### END SOLUTION


# Visible checks: column labels are 1-based, and the returned ndarray matches
# the input values.
arr1 = np.array([50, 40, 43, 20]).reshape(1,-1)
assert list(to_df(arr1)[0].columns) == ['Final exam 1', 'Final exam 2', 'Final exam 3', 'Final exam 4']
assert (to_df(arr1)[1] == arr1).all()
### BEGIN HIDDEN TESTS
# Hidden checks: a multi-row input, then a 20-column input whose labels go
# past a single digit.
arr2 = np.array([[1,1],[2,2],[3,2],[4,2],[5,2]])
assert list(to_df(arr2)[0].columns) == ['Final exam 1', 'Final exam 2']
assert (to_df(arr2)[1] == arr2).all()

arr3 = np.ones((10,20))
assert (to_df(arr3)[0].columns == ['Final exam 1', 'Final exam 2', 'Final exam 3', 'Final exam 4',
       'Final exam 5', 'Final exam 6', 'Final exam 7', 'Final exam 8',
       'Final exam 9', 'Final exam 10', 'Final exam 11', 'Final exam 12',
       'Final exam 13', 'Final exam 14', 'Final exam 15', 'Final exam 16',
       'Final exam 17', 'Final exam 18', 'Final exam 19', 'Final exam 20']).all()
### END HIDDEN TESTS


def count_rows(df):
    '''
    Return how many rows ``df`` has.

    args: dataframe
    return: int

    Staff's solution contains one line of code.
    '''
    ### BEGIN SOLUTION
    # A DataFrame's length is the length of its row index.
    return len(df.index)
    ### END SOLUTION


# Visible check: a (4, 3) array becomes a 4-row DataFrame.
df1 = to_df(np.ones((4,3)))[0]
assert count_rows(df1) == 4
### BEGIN HIDDEN TESTS
# Hidden checks: larger row counts.
df1 = to_df(np.ones((1114,3)))[0]
assert count_rows(df1) == 1114

# NOTE(review): np.ones((11414, 4343)) is roughly 400 MB of float64 data.
df1 = to_df(np.ones((11414,4343)))[0]
assert count_rows(df1) == 11414

### END HIDDEN TESTS

# Useful Points:

# Question 1

# Question 2

# Question 3

# Question 4

# `Questions 5, 6 and 7 are based on the following information`:

# Question 5:

# Question 6:

# Question 7

# Question 8

# Question 9

# Question 10

# Useful Points:

# Question 1

# Question 2

# Question 3

# Question 4

# Questions 5, 6 and 7 are based on the following information:

# Question 5:

# Question 6:

# Question 7

# Question 8

# Question 9

# Question 10

# `Questions 5, 6 and 7 are based on the following information`: