numpy交叉验证集的简单构建

num_folds = 5
k_choices = [1, 3, 5, 8, 10, 12, 15, 20, 50, 100]
# k_choices = [1, 5]

x_train_folds = []
y_train_folds = []

# x_train_folds = np.array(np.split(x_train, num_folds))
# y_train_folds = np.array(np.split(y_train, num_folds))
x_train_folds = np.array(np.split(x_test, num_folds))
y_train_folds = np.array(np.split(y_test, num_folds))

k_to_accuracies = {}
for k in k_choices:
    curr_acc = []
    for i in np.arange(num_folds):
        indx = np.array([j for j in range(num_folds) if j != i])
        X_test_n = x_train_folds[i]
        y_test_n = y_train_folds[i].reshape(-1,)
        x_train_folds[indx]
        x_train_n = np.concatenate(x_train_folds[indx], axis=0)
        y_train_n = np.concatenate(y_train_folds[indx], axis=None)

        classifier = KNearestNeighbor()
        classifier.train(x_train_n, y_train_n)
        dists = classifier.compute_distances_two_loops(X_test_n)
        y_test_n_pred = classifier.predict_labels(dists, k)
        num_correct = np.sum(y_test_n_pred == y_test_n)
        accuracy = float(num_correct) / len(y_test_n)
        curr_acc.append(accuracy)
    k_to_accuracies[k] = curr_acc

 

上一篇:大数据-数据分析-numpy库-数组创建方式、数组的数据类型


下一篇:Numpy的安装和创建