why?
data
| dataset | x | y | |
|---|---|---|---|
| 0 | A | 55.384600 | 97.179500 |
| 1 | A | 51.538500 | 96.025600 |
| 2 | A | 46.153800 | 94.487200 |
| 3 | A | 42.820500 | 91.410300 |
| 4 | A | 40.769200 | 88.333300 |
| ... | ... | ... | ... |
| 1841 | M | 33.674442 | 26.090490 |
| 1842 | M | 75.627255 | 37.128752 |
| 1843 | M | 40.610125 | 89.136240 |
| 1844 | M | 39.114366 | 96.481751 |
| 1845 | M | 34.583829 | 89.588902 |
1846 rows × 3 columns
len(data['dataset'].unique())
13
data['dataset'].unique()
array(['A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I', 'J', 'K', 'L', 'M'],
dtype=object)
data.groupby('dataset')["x"].mean()
dataset A 54.263273 B 54.266100 C 54.261442 D 54.269927 E 54.260150 F 54.267341 G 54.268805 H 54.260303 I 54.267320 J 54.268730 K 54.265882 L 54.267849 M 54.266916 Name: x, dtype: float64
data.groupby('dataset')["y"].mean()
dataset A 47.832253 B 47.834721 C 47.830252 D 47.836988 E 47.839717 F 47.839545 G 47.835450 H 47.839829 I 47.837717 J 47.830823 K 47.831496 L 47.835896 M 47.831602 Name: y, dtype: float64
d = {}
d['mean x'] = data.groupby('dataset')["x"].mean().tolist()
d['mean y'] = data.groupby('dataset')["y"].mean().tolist()
d['sd x'] = data.groupby('dataset')["x"].std().tolist()
d['sd y'] = data.groupby('dataset')["y"].std().tolist()
df = pd.DataFrame(data=d)
df.index.name = "data sets"
df
| mean x | mean y | sd x | sd y | |
|---|---|---|---|---|
| data sets | ||||
| 0 | 54.263273 | 47.832253 | 16.765142 | 26.935403 |
| 1 | 54.266100 | 47.834721 | 16.769825 | 26.939743 |
| 2 | 54.261442 | 47.830252 | 16.765898 | 26.939876 |
| 3 | 54.269927 | 47.836988 | 16.769959 | 26.937684 |
| 4 | 54.260150 | 47.839717 | 16.769958 | 26.930002 |
| 5 | 54.267341 | 47.839545 | 16.768959 | 26.930275 |
| 6 | 54.268805 | 47.835450 | 16.766704 | 26.939998 |
| 7 | 54.260303 | 47.839829 | 16.767735 | 26.930192 |
| 8 | 54.267320 | 47.837717 | 16.760013 | 26.930036 |
| 9 | 54.268730 | 47.830823 | 16.769239 | 26.935727 |
| 10 | 54.265882 | 47.831496 | 16.768853 | 26.938608 |
| 11 | 54.267849 | 47.835896 | 16.766759 | 26.936105 |
| 12 | 54.266916 | 47.831602 | 16.770000 | 26.937902 |
sr = 22050
T = .1
t = np.linspace(0, T, int(T*sr), endpoint=False)
x = data[data['dataset'] == "A"]["x"].multiply(10).sample(n=100, random_state=1).tolist()
e = []
for a in x:
e.append(0.5*np.sin(2*np.pi*a*t))
sound1 = np.array(e)
ipd.Audio(sound1.flatten(), rate=sr)
sr = 22050
T = .1
t = np.linspace(0, T, int(T*sr), endpoint=False)
x = data[data['dataset'] == "B"]["x"].multiply(10).sample(n=100, random_state=1).tolist()
e = []
for a in x:
e.append(0.5*np.sin(2*np.pi*a*t))
sound2 = np.array(e)
ipd.Audio(sound2.flatten(), rate=sr)
fig
fig
