1. Vybrať optimálnu hodnotu k
2. Vypočítať vzdialenosť medzi testovacím bodom a trénovacími bodmi
3. Nájsť k najbližších susedov
4. Rozhodnúť hlasovaním (klasifikácia) alebo priemerom (regresia)

import numpy as np
from typing import List

def euclidean_distance(point1: np.ndarray, point2: np.ndarray) -> float:
    """
    Compute the Euclidean distance between two points.

    Args:
        point1: First point
        point2: Second point

    Returns:
        distance: float - Euclidean distance

    Raises:
        ValueError: If the two points do not have the same shape.

    Example:
        For the points [1, 2] and [4, 6] the result is 5.0.
    """
    first = np.asarray(point1, dtype=float)
    second = np.asarray(point2, dtype=float)

    if first.shape != second.shape:
        # Fail loudly instead of letting NumPy broadcast mismatched points
        # into a number that looks plausible but is meaningless.
        raise ValueError(
            f"points must have the same shape, got {first.shape} and {second.shape}"
        )

    # Square root of the summed squared coordinate differences; float()
    # converts the NumPy scalar into the plain Python float promised above.
    return float(np.sqrt(np.sum((first - second) ** 2)))

def get_k_nearest_neighbors(training_data: np.ndarray,
                            training_labels: List[str],
                            test_point: np.ndarray,
                            k: int) -> List[str]:
    """
    Return the labels of the k nearest neighbors.

    Neighbors are ordered from nearest to farthest by Euclidean distance.
    Training points at exactly the same distance keep their original
    training order, so the result is deterministic.

    Args:
        training_data: Array of training points, one point per row
        training_labels: Labels for training points
        test_point: Point to classify
        k: Number of neighbors

    Returns:
        neighbors: List[str] - Labels of k nearest points (fewer than k
            when there are fewer than k training points)

    Raises:
        ValueError: If k is smaller than 1, or if the number of labels does
            not match the number of training points.

    Example:
        For the assignment dataset, test point [4.0, 4.5] and k=3 the
        result is ['A', 'A', 'B'].
    """
    if k < 1:
        raise ValueError(f"k must be a positive integer, got {k}")

    points = np.asarray(training_data, dtype=float)
    if len(points) != len(training_labels):
        raise ValueError(
            "training_data and training_labels must have the same length, "
            f"got {len(points)} and {len(training_labels)}"
        )
    if len(points) == 0:
        # Nothing to search through.
        return []

    target = np.asarray(test_point, dtype=float)

    # Distance from the test point to every training row in one vectorised step.
    distances = np.sqrt(np.sum((points - target) ** 2, axis=1))

    # A stable sort keeps equally distant points in training order.
    nearest = np.argsort(distances, kind="stable")[:k]

    return [training_labels[index] for index in nearest]

def knn_predict(training_data: np.ndarray,
                training_labels: List[str],
                test_point: np.ndarray,
                k: int) -> str:
    """
    Predict the class of a test point using kNN.

    The k training points closest to the test point (Euclidean distance)
    each cast one vote for their label and the label with the most votes
    wins. When several labels share the highest vote count, the one whose
    first voter is nearest to the test point is returned.

    Args:
        training_data: Array of training points, one point per row
        training_labels: Labels for training points
        test_point: Point to classify
        k: Number of neighbors

    Returns:
        prediction: str - Predicted class label

    Raises:
        ValueError: If k is smaller than 1, if there are no training points,
            or if the number of labels does not match the number of
            training points.

    Example:
        For the assignment dataset, test point [4.0, 4.5] and k=3 the
        result is 'A'.
    """
    if k < 1:
        raise ValueError(f"k must be a positive integer, got {k}")

    points = np.asarray(training_data, dtype=float)
    if len(points) != len(training_labels):
        raise ValueError(
            "training_data and training_labels must have the same length, "
            f"got {len(points)} and {len(training_labels)}"
        )
    if len(points) == 0:
        raise ValueError("cannot predict without any training points")

    target = np.asarray(test_point, dtype=float)

    # Rank the training rows by distance; the stable sort keeps equally
    # distant points in training order so the prediction is reproducible.
    distances = np.sqrt(np.sum((points - target) ** 2, axis=1))
    nearest = np.argsort(distances, kind="stable")[:k]

    # Tally votes nearest-first. Dicts preserve insertion order and max()
    # returns the first maximal key, which implements the tie-break
    # described in the docstring.
    votes = {}
    for index in nearest:
        label = training_labels[index]
        votes[label] = votes.get(label, 0) + 1

    return max(votes, key=votes.get)

def select_best_k(training_data: np.ndarray,
                  training_labels: List[str],
                  validation_data: np.ndarray,
                  validation_labels: List[str],
                  candidate_k_values: List[int]) -> int:
    """
    Select the best k based on validation accuracy.

    Every validation point is classified by a kNN majority vote (Euclidean
    distance) for each candidate k, and the k that classifies the most
    validation points correctly is returned. When several candidates reach
    the same accuracy, the one that appears first in candidate_k_values
    is kept.

    Args:
        training_data: Array of training points, one point per row
        training_labels: Labels for training points
        validation_data: Array of validation points, one point per row
        validation_labels: Correct labels for validation points
        candidate_k_values: Candidate values of k to test

    Returns:
        best_k: int - Selected value of k, or -1 when there are no
            candidates or no validation points to score them on

    Raises:
        ValueError: If a candidate k is smaller than 1, if there are no
            training points, or if a label list does not match the length
            of its data array.

    Example:
        For the assignment dataset and candidates [1, 3, 5] the result is 1.
    """
    train = np.asarray(training_data, dtype=float)
    valid = np.asarray(validation_data, dtype=float)

    if len(train) != len(training_labels):
        raise ValueError(
            "training_data and training_labels must have the same length, "
            f"got {len(train)} and {len(training_labels)}"
        )
    if len(valid) != len(validation_labels):
        raise ValueError(
            "validation_data and validation_labels must have the same length, "
            f"got {len(valid)} and {len(validation_labels)}"
        )

    if len(candidate_k_values) == 0 or len(valid) == 0:
        # Nothing to compare: keep the "no selection" sentinel.
        return -1
    if len(train) == 0:
        raise ValueError("cannot evaluate k without any training points")

    # Rank the training rows once per validation point. The k nearest
    # neighbors for any k are a prefix of this ranking, so every candidate
    # reuses it. The stable sort keeps equally distant points in training
    # order, which makes the votes reproducible.
    rankings = [
        np.argsort(np.sqrt(np.sum((train - point) ** 2, axis=1)), kind="stable")
        for point in valid
    ]

    best_k = -1
    best_correct = -1

    for k in candidate_k_values:
        if k < 1:
            raise ValueError(f"k must be a positive integer, got {k}")

        correct = 0
        for ranking, truth in zip(rankings, validation_labels):
            # Majority vote, tallied nearest-first so that a tie goes to the
            # label whose first voter is closest to the validation point.
            votes = {}
            for index in ranking[:k]:
                label = training_labels[index]
                votes[label] = votes.get(label, 0) + 1
            if max(votes, key=votes.get) == truth:
                correct += 1

        # All candidates share the same denominator, so comparing the counts
        # of correct predictions is equivalent to comparing accuracies.
        # The strict ">" keeps the earliest candidate on ties.
        if correct > best_correct:
            best_k = k
            best_correct = correct

    return best_k

# Training set: six 2-D points. The first three rows carry label 'A' and
# the last three carry label 'B' (see training_labels).
training_labels = ["A"] * 3 + ["B"] * 3
training_data = np.array(
    [
        [1.0, 2.0], [2.0, 3.0], [3.0, 3.5],
        [6.0, 6.0], [7.0, 7.0], [8.0, 6.5],
    ]
)

# Validation set used to compare candidate k values; the labels are the
# correct classes of the corresponding rows.
validation_labels = ["A", "B", "A", "B"]
validation_data = np.array(
    [
        [2.5, 2.5], [6.5, 6.5],
        [3.5, 3.0], [7.5, 6.0],
    ]
)

# Single query point for Parts 2 and 3, and the k values tried in Part 4.
candidate_k_values = [1, 3, 5]
test_point = np.array([4.0, 4.5])

# Part 1 check: distance between two fixed points.
test_point1 = np.array([1.0, 2.0])
test_point2 = np.array([4.0, 6.0])
distance_result = euclidean_distance(test_point1, test_point2)
# Each report is one print call; the trailing "" argument produces the
# blank separator line after the report.
print(
    "Part 1 - Euclidean Distance:",
    f"Input points: {test_point1}, {test_point2}",
    f"Your result: {distance_result}",
    "Expected: 5.0",
    "",
    sep="\n",
)

# Part 2 check: labels of the three training points nearest to test_point.
neighbors_result = get_k_nearest_neighbors(training_data, training_labels, test_point, 3)
print(
    "Part 2 - k Nearest Neighbors:",
    f"Test point: {test_point}, k: 3",
    f"Your result: {neighbors_result}",
    "Expected: ['A', 'A', 'B']",
    "",
    sep="\n",
)

# Part 3 check: predicted class of test_point with k = 3.
prediction_result = knn_predict(training_data, training_labels, test_point, 3)
print(
    "Part 3 - kNN Prediction:",
    f"Test point: {test_point}, k: 3",
    f"Your result: {prediction_result}",
    "Expected: A",
    "",
    sep="\n",
)

# Part 4 check: k chosen from candidate_k_values using the validation set.
best_k_result = select_best_k(
    training_data, training_labels,
    validation_data, validation_labels,
    candidate_k_values,
)
print(
    "Part 4 - Select Best k:",
    f"Candidate k values: {candidate_k_values}",
    f"Your result: {best_k_result}",
    "Expected: 1",
    "",
    sep="\n",
)

K-Nearest Neighbors (kNN) - Student Assignment

Prehľad postupu výpočtu algoritmu kNN

Setup - Required Imports

Part 1: Calculate Euclidean Distance (2 points)

Part 2: Find the `k` Nearest Neighbors (2 points)

Part 3: Voting for Classification (2 points)

Part 4: Select the Optimal Value of `k` (2 points)

Testing Dataset

Test your implementation

K-Nearest Neighbors (kNN) - Student Assignment

Prehľad postupu výpočtu algoritmu kNN

Setup - Required Imports

Part 1: Calculate Euclidean Distance (2 points)

Part 2: Find the `k` Nearest Neighbors (2 points)

Part 3: Voting for Classification (2 points)

Part 4: Select the Optimal Value of `k` (2 points)

Testing Dataset

Test your implementation

Part 2: Find the `k` Nearest Neighbors (2 points)

Part 4: Select the Optimal Value of `k` (2 points)