Added kNearestNeighbour and refactored Vector to a package level above and added a constructor
This commit is contained in:
parent
5264853c8e
commit
54cfe2dece
@ -1,4 +1,4 @@
|
|||||||
package machine_learning.perceptron;
|
package machine_learning;
|
||||||
|
|
||||||
import java.util.*;
|
import java.util.*;
|
||||||
import java.util.stream.Collectors;
|
import java.util.stream.Collectors;
|
||||||
@ -10,12 +10,16 @@ public class Vector
|
|||||||
|
|
||||||
public Vector(int dim)
|
public Vector(int dim)
|
||||||
{
|
{
|
||||||
this.values = new ArrayList<>();
|
this(IntStream.range(0, dim)
|
||||||
|
.mapToDouble(i -> 0d)
|
||||||
for (int i = 0; i < dim; i++)
|
.toArray());
|
||||||
{
|
|
||||||
this.values.add(0d);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
public Vector(double... value)
|
||||||
|
{
|
||||||
|
this(Arrays.stream(value)
|
||||||
|
.boxed()
|
||||||
|
.collect(Collectors.toList()));
|
||||||
}
|
}
|
||||||
|
|
||||||
public Vector(List<Double> values)
|
public Vector(List<Double> values)
|
||||||
@ -66,6 +70,14 @@ public class Vector
|
|||||||
.sum());
|
.sum());
|
||||||
}
|
}
|
||||||
|
|
||||||
|
public double distance(Vector b)
|
||||||
|
{
|
||||||
|
return Math.sqrt(IntStream.range(0,
|
||||||
|
this.dimension())
|
||||||
|
.mapToDouble(i -> (this.get(i) - b.get(i)) * (this.get(i) - b.get(i)))
|
||||||
|
.sum());
|
||||||
|
}
|
||||||
|
|
||||||
public Vector divide(double div)
|
public Vector divide(double div)
|
||||||
{
|
{
|
||||||
var divided = new ArrayList<Double>();
|
var divided = new ArrayList<Double>();
|
7
src/machine_learning/nearest_neighbour/DataClass.java
Normal file
7
src/machine_learning/nearest_neighbour/DataClass.java
Normal file
@ -0,0 +1,7 @@
|
|||||||
|
package machine_learning.nearest_neighbour;
|
||||||
|
|
||||||
|
public enum DataClass
|
||||||
|
{
|
||||||
|
POSITIVE,
|
||||||
|
NEGATIVE
|
||||||
|
}
|
8
src/machine_learning/nearest_neighbour/Distance.java
Normal file
8
src/machine_learning/nearest_neighbour/Distance.java
Normal file
@ -0,0 +1,8 @@
|
|||||||
|
package machine_learning.nearest_neighbour;
|
||||||
|
|
||||||
|
import machine_learning.Vector;
|
||||||
|
|
||||||
|
public interface Distance
|
||||||
|
{
|
||||||
|
double distance(Vector a, Vector b);
|
||||||
|
}
|
@ -0,0 +1,67 @@
|
|||||||
|
package machine_learning.nearest_neighbour;
|
||||||
|
|
||||||
|
import machine_learning.Vector;
|
||||||
|
|
||||||
|
import java.util.List;
|
||||||
|
import java.util.Map;
|
||||||
|
import java.util.Random;
|
||||||
|
import java.util.stream.Collectors;
|
||||||
|
import java.util.stream.Stream;
|
||||||
|
|
||||||
|
public class KNearestNeighbour
|
||||||
|
{
|
||||||
|
private Distance distance;
|
||||||
|
|
||||||
|
private int k;
|
||||||
|
|
||||||
|
public KNearestNeighbour(Distance distance)
|
||||||
|
{
|
||||||
|
this(distance, 1);
|
||||||
|
}
|
||||||
|
|
||||||
|
public KNearestNeighbour(Distance distance, int k)
|
||||||
|
{
|
||||||
|
this.distance = distance;
|
||||||
|
this.k = k;
|
||||||
|
}
|
||||||
|
|
||||||
|
public DataClass kNearestNeighbour(List<Vector> positives, List<Vector> negatives, Vector toClassify)
|
||||||
|
{
|
||||||
|
var nearestNeighbours = this.nearestNeighbours(
|
||||||
|
Stream.concat(positives.stream(), negatives.stream())
|
||||||
|
.collect(Collectors.toList()),
|
||||||
|
toClassify
|
||||||
|
);
|
||||||
|
|
||||||
|
var positivesWithNearestNeighboursAmount = nearestNeighbours.stream()
|
||||||
|
.filter(positives::contains)
|
||||||
|
.count();
|
||||||
|
|
||||||
|
var negativesWithNearestNeighboursAmount = nearestNeighbours.stream()
|
||||||
|
.filter(negatives::contains)
|
||||||
|
.count();
|
||||||
|
|
||||||
|
if (positivesWithNearestNeighboursAmount > negativesWithNearestNeighboursAmount)
|
||||||
|
{
|
||||||
|
return DataClass.POSITIVE;
|
||||||
|
}
|
||||||
|
else if (positivesWithNearestNeighboursAmount < negativesWithNearestNeighboursAmount)
|
||||||
|
{
|
||||||
|
return DataClass.NEGATIVE;
|
||||||
|
}
|
||||||
|
|
||||||
|
return new Random().nextBoolean() ? DataClass.POSITIVE : DataClass.NEGATIVE;
|
||||||
|
}
|
||||||
|
|
||||||
|
private List<Vector> nearestNeighbours(List<Vector> vectors, Vector vector)
|
||||||
|
{
|
||||||
|
var nearestNeighbours = vectors.stream()
|
||||||
|
.map(v -> Map.entry(this.distance.distance(v, vector), v))
|
||||||
|
.sorted((e1, e2) -> e1.getKey() >= e2.getKey() ? (e1.getKey().equals(e2.getKey()) ? 0 : 1) : -1)
|
||||||
|
.map(Map.Entry::getValue)
|
||||||
|
.collect(Collectors.toList());
|
||||||
|
|
||||||
|
return nearestNeighbours.subList(0, this.k);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
@ -1,5 +1,7 @@
|
|||||||
package machine_learning.perceptron;
|
package machine_learning.perceptron;
|
||||||
|
|
||||||
|
import machine_learning.Vector;
|
||||||
|
|
||||||
import java.util.List;
|
import java.util.List;
|
||||||
|
|
||||||
public class Perceptron
|
public class Perceptron
|
||||||
|
@ -1,9 +1,7 @@
|
|||||||
package machine_learning.perceptron;
|
package machine_learning;
|
||||||
|
|
||||||
import org.junit.jupiter.api.Test;
|
import org.junit.jupiter.api.Test;
|
||||||
|
|
||||||
import java.util.List;
|
|
||||||
|
|
||||||
import static org.junit.jupiter.api.Assertions.*;
|
import static org.junit.jupiter.api.Assertions.*;
|
||||||
|
|
||||||
class VectorTest
|
class VectorTest
|
||||||
@ -14,7 +12,7 @@ class VectorTest
|
|||||||
{
|
{
|
||||||
var v = new Vector(3);
|
var v = new Vector(3);
|
||||||
|
|
||||||
var expected = new Vector(List.of(0d, 0d, 0d));
|
var expected = new Vector(0d, 0d, 0d);
|
||||||
|
|
||||||
assertEquals(3, v.dimension());
|
assertEquals(3, v.dimension());
|
||||||
assertEquals(expected, v);
|
assertEquals(expected, v);
|
||||||
@ -23,11 +21,11 @@ class VectorTest
|
|||||||
@Test
|
@Test
|
||||||
void shouldReturnCorrectVectorWhenAdding()
|
void shouldReturnCorrectVectorWhenAdding()
|
||||||
{
|
{
|
||||||
var v1 = new Vector(List.of(1d, 2d));
|
var v1 = new Vector(1d, 2d);
|
||||||
var v2 = new Vector(List.of(3d, 4d));
|
var v2 = new Vector(3d, 4d);
|
||||||
|
|
||||||
var result = v1.add(v2);
|
var result = v1.add(v2);
|
||||||
var expected = new Vector(List.of(4d, 6d));
|
var expected = new Vector(4d, 6d);
|
||||||
|
|
||||||
assertEquals(expected, result);
|
assertEquals(expected, result);
|
||||||
}
|
}
|
||||||
@ -35,11 +33,11 @@ class VectorTest
|
|||||||
@Test
|
@Test
|
||||||
void shouldReturnCorrectVectorWhenSubtracting()
|
void shouldReturnCorrectVectorWhenSubtracting()
|
||||||
{
|
{
|
||||||
var v1 = new Vector(List.of(1d, 2d));
|
var v1 = new Vector(1d, 2d);
|
||||||
var v2 = new Vector(List.of(3d, 4d));
|
var v2 = new Vector(3d, 4d);
|
||||||
|
|
||||||
var result = v1.subtract(v2);
|
var result = v1.subtract(v2);
|
||||||
var expected = new Vector(List.of(-2d, -2d));
|
var expected = new Vector(-2d, -2d);
|
||||||
|
|
||||||
assertEquals(expected, result);
|
assertEquals(expected, result);
|
||||||
}
|
}
|
||||||
@ -47,8 +45,8 @@ class VectorTest
|
|||||||
@Test
|
@Test
|
||||||
void shouldReturnCorrectVectorWhenScalarMultiplying()
|
void shouldReturnCorrectVectorWhenScalarMultiplying()
|
||||||
{
|
{
|
||||||
var v1 = new Vector(List.of(1d, 2d));
|
var v1 = new Vector(1d, 2d);
|
||||||
var v2 = new Vector(List.of(3d, 4d));
|
var v2 = new Vector(3d, 4d);
|
||||||
|
|
||||||
var result = v1.scalar(v2);
|
var result = v1.scalar(v2);
|
||||||
var expected = 11d;
|
var expected = 11d;
|
||||||
@ -59,7 +57,7 @@ class VectorTest
|
|||||||
@Test
|
@Test
|
||||||
void shouldReturnCorrectVectorWhenEuclid()
|
void shouldReturnCorrectVectorWhenEuclid()
|
||||||
{
|
{
|
||||||
var v1 = new Vector(List.of(1d, 2d));
|
var v1 = new Vector(1d, 2d);
|
||||||
|
|
||||||
var result = v1.euclid();
|
var result = v1.euclid();
|
||||||
var expected = Math.sqrt(5);
|
var expected = Math.sqrt(5);
|
||||||
@ -67,14 +65,26 @@ class VectorTest
|
|||||||
assertEquals(expected, result);
|
assertEquals(expected, result);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
void shouldReturnCorrectDistance()
|
||||||
|
{
|
||||||
|
var v1 = new Vector(1d, 2d);
|
||||||
|
var v2 = new Vector(3d, 4d);
|
||||||
|
|
||||||
|
var result = v1.distance(v2);
|
||||||
|
var expected = Math.sqrt(8);
|
||||||
|
|
||||||
|
assertEquals(expected, result);
|
||||||
|
}
|
||||||
|
|
||||||
@Test
|
@Test
|
||||||
void shouldReturnCorrectVectorWhenDividing()
|
void shouldReturnCorrectVectorWhenDividing()
|
||||||
{
|
{
|
||||||
var v1 = new Vector(List.of(1d, 2d));
|
var v1 = new Vector(1d, 2d);
|
||||||
var div = 2d;
|
var div = 2d;
|
||||||
|
|
||||||
var result = v1.divide(div);
|
var result = v1.divide(div);
|
||||||
var expected = new Vector(List.of(0.5d, 1d));
|
var expected = new Vector(0.5d, 1d);
|
||||||
|
|
||||||
assertEquals(expected, result);
|
assertEquals(expected, result);
|
||||||
}
|
}
|
@ -0,0 +1,62 @@
|
|||||||
|
package machine_learning.nearest_neighbour;
|
||||||
|
|
||||||
|
import machine_learning.Vector;
|
||||||
|
import org.junit.jupiter.api.BeforeAll;
|
||||||
|
import org.junit.jupiter.api.Test;
|
||||||
|
import org.junit.jupiter.api.TestInstance;
|
||||||
|
|
||||||
|
import java.util.ArrayList;
|
||||||
|
import java.util.Arrays;
|
||||||
|
import java.util.List;
|
||||||
|
import java.util.stream.Stream;
|
||||||
|
|
||||||
|
import static org.junit.jupiter.api.Assertions.*;
|
||||||
|
|
||||||
|
@TestInstance(TestInstance.Lifecycle.PER_CLASS)
|
||||||
|
class KNearestNeighbourTest
|
||||||
|
{
|
||||||
|
List<Vector> positives;
|
||||||
|
List<Vector> negatives;
|
||||||
|
|
||||||
|
@BeforeAll
|
||||||
|
void initLearnData()
|
||||||
|
{
|
||||||
|
this.positives = new ArrayList<>(List.of(
|
||||||
|
new Vector(8d, 4d),
|
||||||
|
new Vector(8d, 6d),
|
||||||
|
new Vector(9d, 2d),
|
||||||
|
new Vector(9d, 5d))
|
||||||
|
);
|
||||||
|
|
||||||
|
this.negatives = new ArrayList<>(List.of(
|
||||||
|
new Vector(6d, 1d),
|
||||||
|
new Vector(7d, 3d),
|
||||||
|
new Vector(8d, 2d),
|
||||||
|
new Vector(9d, 0d))
|
||||||
|
);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void shouldReturnCorrectClassForVectorWithKEquals3()
|
||||||
|
{
|
||||||
|
var kNearestNeighbour = new KNearestNeighbour((a ,b) -> Math.abs(a.get(0) - b.get(0)) + Math.abs(a.get(1) - b.get(1)), 3);
|
||||||
|
var vector = new Vector(8, 3.5);
|
||||||
|
|
||||||
|
var actualClass = kNearestNeighbour.kNearestNeighbour(this.positives, this.negatives, vector);
|
||||||
|
var expectedClass = DataClass.NEGATIVE;
|
||||||
|
|
||||||
|
assertEquals(expectedClass, actualClass);
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void shouldReturnCorrectClassForVectorWithKEquals5()
|
||||||
|
{
|
||||||
|
var kNearestNeighbour = new KNearestNeighbour((a ,b) -> Math.abs(a.get(0) - b.get(0)) + Math.abs(a.get(1) - b.get(1)), 5);
|
||||||
|
var vector = new Vector(8, 3.5);
|
||||||
|
|
||||||
|
var actualClass = kNearestNeighbour.kNearestNeighbour(this.positives, this.negatives, vector);
|
||||||
|
var expectedClass = DataClass.POSITIVE;
|
||||||
|
|
||||||
|
assertEquals(expectedClass, actualClass);
|
||||||
|
}
|
||||||
|
}
|
Loading…
Reference in New Issue
Block a user