import pandas as pd from sklearn.preprocessing import StandardScaler from sklearn.decomposition import PCA from sklearn.datasets import make_moons from sklearn.manifold import TSNE import matplotlib.pyplot as plt df = pd.read_csv("decathlon.txt", sep='\t') clean = df.drop(["Points", "Rank", "Competition"], axis="columns") mat = clean.to_numpy() scaler = StandardScaler() normalized = scaler.fit_transform(mat) pca = PCA(n_components=2) pca.fit(normalized) print(pca.explained_variance_ratio_) reduction = pca.transform(normalized) print(reduction) #plt.scatter(x=reduction[:,0], y=reduction[:,1], c=df["Rank"]) #plt.show() components = pca.components_ print(components) #plt.scatter(x=components[0], y=components[1]) #plt.show() print("===============================================") X, y = make_moons(n_samples=200, noise=0.1) #plt.scatter(X[:,0], X[:,1]) #plt.show() scaled = scaler.fit_transform(X) X_embedded = TSNE(n_components=1).fit_transform(X) print(X_embedded)