- Notifications
You must be signed in to change notification settings - Fork 19.9k
/
Copy pathReservoirSampling.java
55 lines (48 loc) · 1.64 KB
/
ReservoirSampling.java
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
package com.thealgorithms.randomized;

import java.util.ArrayList;
import java.util.List;
import java.util.Objects;
import java.util.Random;
/**
 * Reservoir Sampling Algorithm (Algorithm R).
 *
 * <p>Keeps a "reservoir" of {@code k} elements while making a single pass over the
 * input. The first {@code k} elements fill the reservoir; every later element at
 * index {@code i} replaces a randomly chosen reservoir slot with probability
 * {@code k / (i + 1)}.
 *
 * <p>Use Case:
 * <ul>
 *   <li>Efficient for selecting k random items from a stream of unknown size</li>
 *   <li>Used in streaming systems, big data, and memory-limited environments</li>
 * </ul>
 *
 * <p>Time Complexity: O(n)<br>
 * Space Complexity: O(k)
 *
 * @author Michael Alexander Montoya (@cureprotocols)
 * @see <a href="https://en.wikipedia.org/wiki/Reservoir_sampling">Reservoir Sampling - Wikipedia</a>
 */
public final class ReservoirSampling {

    // Prevent instantiation of utility class
    private ReservoirSampling() {
        throw new UnsupportedOperationException("Utility class");
    }

    /**
     * Selects k random elements from a stream using reservoir sampling.
     *
     * <p>Uses a freshly created {@link Random} as the source of randomness, so results
     * differ between calls. Use {@link #sample(int[], int, Random)} for reproducible output.
     *
     * @param stream The input stream as an array of integers.
     * @param sampleSize The number of elements to sample.
     * @return A new mutable list containing k randomly selected elements.
     * @throws NullPointerException if {@code stream} is {@code null}.
     * @throws IllegalArgumentException if {@code sampleSize} is negative or exceeds
     *         {@code stream.length}.
     */
    public static List<Integer> sample(int[] stream, int sampleSize) {
        return sample(stream, sampleSize, new Random());
    }

    /**
     * Selects k random elements from a stream using reservoir sampling, drawing
     * randomness from the supplied generator.
     *
     * @param stream The input stream as an array of integers.
     * @param sampleSize The number of elements to sample.
     * @param random The random number generator to draw replacement indices from;
     *        pass a seeded instance for reproducible results.
     * @return A new mutable list containing k selected elements.
     * @throws NullPointerException if {@code stream} or {@code random} is {@code null}.
     * @throws IllegalArgumentException if {@code sampleSize} is negative or exceeds
     *         {@code stream.length}.
     */
    public static List<Integer> sample(int[] stream, int sampleSize, Random random) {
        Objects.requireNonNull(stream, "stream must not be null");
        Objects.requireNonNull(random, "random must not be null");
        if (sampleSize < 0) {
            throw new IllegalArgumentException("Sample size cannot be negative.");
        }
        if (sampleSize > stream.length) {
            throw new IllegalArgumentException("Sample size cannot exceed stream size.");
        }

        List<Integer> reservoir = new ArrayList<>(sampleSize);

        // Phase 1: the first sampleSize elements fill the reservoir unconditionally.
        for (int i = 0; i < sampleSize; i++) {
            reservoir.add(stream[i]);
        }

        // Phase 2: element i picks a slot j uniformly from [0, i]; it is kept only
        // when j lands inside the reservoir, i.e. with probability sampleSize / (i + 1).
        for (int i = sampleSize; i < stream.length; i++) {
            int j = random.nextInt(i + 1);
            if (j < sampleSize) {
                reservoir.set(j, stream[i]);
            }
        }
        return reservoir;
    }
}