# Carefully modify the two string variables below. Ensure there are no typos.
# The sanity check further down in this file prints a warning for as long as
# student_mail still contains the template placeholder "firstname".

student_id = "12345678" # set this to your student ID

student_mail = "firstname.lastname@student.manchester.ac.uk" # your email address

import warnings
warnings.simplefilter(action='ignore', category=FutureWarning)
warnings.simplefilter(action='ignore', category=DeprecationWarning)

import numpy as np
import pandas as pd

# Placeholder: rebind to a callable. The sanity checks further down call it as
# h_best(x, X, Y) with a 1-D array x, a 2-D array X and a 2-D array Y, and
# expect a result that is not None.
h_best = None

# TODO: Provide your solution code here that defines the function `h_best`

# Placeholder: rebind to a callable. The sanity checks call it as
# best_err(X, Y) and expect a result that is not None.
best_err = None

# TODO: Provide your solution code here that defines the function `best_err`

# Placeholders: the sanity checks require both names to be NumPy arrays.
X_1c, Y_1c = None, None

# TODO: Provide your solution code here that defines the arrays X_1c and Y_1c

# Placeholders: the sanity checks require both names to be NumPy arrays.
X_1d, Y_1d = None, None

# TODO: Provide your solution code here that defines the arrays X_1d and Y_1d

# Placeholder: rebind to a callable that accepts a keyword argument `k`; the
# sanity checks call it as my_knn(x, X, k=2) and expect a non-None result.
my_knn = None

# TODO: Provide your solution code here that defines the function `my_knn`

# Placeholder: rebind to a callable taking four positional arguments; the
# sanity checks call it as my_knn_predict(x, X, 2, x) and expect a non-None
# result.
# NOTE(review): in that call the third argument is the integer 2 and the fourth
# is the query array again - confirm the intended parameter order against the
# problem statement.
my_knn_predict = None

# TODO: Provide your solution code here that defines the function `my_knn_predict`

# do not change code in this cell
# Load the star-classification table, turn the sentinel value -9999 into NaN,
# and drop every row that contains a missing value.
astro = pd.read_csv("_datasets/star_classification.csv")
astro.replace(-9999, np.nan, inplace=True)  # -9999 -> NaN so dropna() removes those rows
astro.dropna(inplace=True)
astro.head()  # result is discarded when run as a script; presumably a notebook preview

# do not change code in this cell
# Select six columns of `astro` as features and the "class" column as target,
# then hold out 20% of the rows as a test set. The split is shuffled with a
# fixed random_state so it is reproducible.
X = astro[["u", "g", "r", "i", "z", "redshift"]]
y = astro["class"]

from sklearn.model_selection import train_test_split
X_train, X_test, y_train, y_test = train_test_split( 
    X, y, 
    test_size=0.2,
    shuffle=True,
    random_state=3383 
)

# Placeholder: the sanity checks further down require a pandas Series here.
astro_scores = None

# TODO: Provide your solution code here that defines `astro_scores`

# Placeholder: the sanity checks further down require an object exposing
# callable `fit` and `predict` attributes.
astro_pipe = None

# TODO: Provide your solution code here that defines `astro_pipe`

# Sanity check: student_mail must look like an e-mail address and must no
# longer contain the template placeholder "firstname". Only prints a status
# line; it never raises.
try:
    import re
    assert re.match(r'^[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\.[a-zA-Z]{2,}$', student_mail) and 'firstname' not in student_mail
    print("OKAY - student_mail appears to be valid")
except Exception:
    # `Exception` rather than a bare `except:` so that KeyboardInterrupt and
    # SystemExit still propagate instead of being reported as a warning.
    print("WARN - student_mail could not be verified")

# Sanity check: h_best has been rebound to something callable.
try:
    assert callable(h_best)
    print("OKAY - h_best should be a function")
except Exception:
    # `Exception` rather than a bare `except:` so interrupts still propagate.
    print("FAIL - h_best should be a function")

import numpy as np

# Small fixtures used by this and the following function checks: four 3-D
# inputs (rows 0 and 2 are identical), four 2-D outputs, and one query point.
# NOTE: this rebinds X, replacing the feature table assigned to X earlier in
# the file.
X = np.array([[1,2,3],[2,-3,4],[1,2,3],[2,2,2]])
Y = np.array([[1,2],[1,2],[3,4],[1,2]])
x = np.array([1,2,3])

# Sanity check: h_best runs on the fixtures and returns something other than
# None. The returned value itself is not validated here.
try:
    val = h_best(x, X, Y)
    assert val is not None
    print("OKAY - h_best returns a value")
except Exception:
    # Any error raised inside the student's function is reported as a failure;
    # a user interrupt of a long-running call is no longer swallowed.
    print("FAIL - h_best does not return a value")

# Sanity check: best_err has been rebound to something callable.
try:
    assert callable(best_err)
    print("OKAY - best_err should be a function")
except Exception:
    # `Exception` rather than a bare `except:` so interrupts still propagate.
    print("FAIL - best_err should be a function")

# Sanity check: best_err runs on the fixture arrays X and Y and returns
# something other than None. The returned value itself is not validated here.
try:
    val = best_err(X, Y)
    assert val is not None
    print("OKAY - best_err returns a value")
except Exception:
    print("FAIL - best_err does not return a value")

# Sanity check: the input arrays for 1c and 1d are NumPy arrays.
# isinstance() is used instead of comparing type() so ndarray subclasses are
# accepted as well.
try:
    assert isinstance(X_1c, np.ndarray)
    assert isinstance(X_1d, np.ndarray)
    print("OKAY - X_1c, X_1d should be NumPy arrays")
except Exception:
    # `Exception` rather than a bare `except:` so interrupts still propagate.
    print("FAIL - X_1c, X_1d should be NumPy arrays")

# Sanity check: the output arrays for 1c and 1d are NumPy arrays.
try:
    assert isinstance(Y_1c, np.ndarray)
    assert isinstance(Y_1d, np.ndarray)
    # Message fixed: it previously named Y_1d twice instead of Y_1c and Y_1d.
    print("OKAY - Y_1c, Y_1d should be NumPy arrays")
except Exception:
    print("FAIL - Y_1c, Y_1d should be NumPy arrays")

# Sanity check: my_knn has been rebound to something callable.
try:
    assert callable(my_knn)
    print("OKAY - my_knn should be a function")
except Exception:
    # `Exception` rather than a bare `except:` so interrupts still propagate.
    print("FAIL - my_knn should be a function")

# Sanity check: my_knn accepts the keyword argument k, runs on the fixtures
# and returns something other than None. The value itself is not validated.
try:
    val = my_knn(x, X, k=2)
    assert val is not None
    print("OKAY - my_knn returns a value")
except Exception:
    print("FAIL - my_knn does not return a value")

# Sanity check: my_knn_predict has been rebound to something callable.
# This now runs before the call check, in the same order as the checks for
# h_best, best_err and my_knn.
try:
    assert callable(my_knn_predict)
    print("OKAY - my_knn_predict should be a function")
except Exception:
    # `Exception` rather than a bare `except:` so interrupts still propagate.
    print("FAIL - my_knn_predict should be a function")

# Sanity check: my_knn_predict runs with four positional arguments and returns
# something other than None. The value itself is not validated.
# NOTE(review): the third argument is the integer 2 and the fourth is the query
# array again - confirm this matches the intended parameter order.
try:
    val = my_knn_predict(x, X, 2, x)
    assert val is not None
    print("OKAY - my_knn_predict returns a value")
except Exception:
    print("FAIL - my_knn_predict does not return a value")

# Sanity check: astro_scores is a pandas Series. isinstance() is used instead
# of comparing type() so Series subclasses are accepted as well.
try:
    assert isinstance(astro_scores, pd.Series)
    print("OKAY - astro_scores should be a pandas series")
except Exception:
    # `Exception` rather than a bare `except:` so interrupts still propagate.
    print("FAIL - astro_scores should be a pandas series")

# Sanity check: astro_pipe exposes callable `fit` and `predict` attributes.
# A missing attribute (e.g. astro_pipe is still None) raises AttributeError,
# which is reported as a failure.
try:
    assert callable(astro_pipe.fit) and callable(astro_pipe.predict)
    print("OKAY - astro_pipe should provide fit and predict methods")
except Exception:
    print("FAIL - astro_pipe should provide fit and predict methods")

# Coursework 2

# Note on independent work

# Start of test

# Problem 1a

# Problem 1b

# Problem 1c

# Problem 1d

# Problem 2a

# Problem 2b

# Problem 3a

# Problem 3b

# End of test