-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathdatasets.py
More file actions
71 lines (54 loc) · 1.41 KB
/
datasets.py
File metadata and controls
71 lines (54 loc) · 1.41 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
import numpy as np
from sklearn import datasets
N_SAMPLES = 1500
np.random.seed(0)
def circles():
"""Concentric circles
Returns:
ndarray (1500x2): data
"""
data, _ = datasets.make_circles(n_samples=N_SAMPLES, factor=.5, noise=.05)
return data
def moons():
"""Half-moons
Returns:
ndarray (1500x2): data
"""
data, _ = datasets.make_moons(n_samples=N_SAMPLES, noise=.05)
return data
def blobs():
"""Blobs, all with the same variance
Returns:
ndarray (1500x2): data
"""
data, _ = datasets.make_blobs(n_samples=N_SAMPLES, random_state=17)
return data
def random():
"""Randomly-generated data
Returns:
ndarray (1500x2): data
"""
data = np.random.rand(N_SAMPLES, 2)
return data
def anisotropic():
"""Skewed blobs
Returns:
ndarray (1500x2): data
"""
data, _ = datasets.make_blobs(n_samples=N_SAMPLES, random_state=17)
transform = [[0.6, -0.3], [-0.4, 0.8]]
data = np.dot(data, transform)
return data
def varied_variances():
"""Blobs with different variances
Returns:
ndarray (1500x2): data
"""
data, _ = datasets.make_blobs(n_samples=N_SAMPLES, cluster_std=[1.0, 2.5, 0.5], random_state=17)
return data
def iris():
"""The Iris Dataset
Returns:
dict: dataset and feature names
"""
return datasets.load_iris()