532f4 PCA sklearn ipynb - Notebook by Ashish Jaiswal (asheeshcric)

Learn practical skills, build real-world projects, and advance your career

Updated 5 years ago

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import random as rd

from sklearn.decomposition import PCA
from sklearn import preprocessing

Creating a sample dataset

# Feature labels used as the row index: 'gene1' through 'gene100'
genes = [f'gene{n}' for n in range(1, 101)]

# Sample labels used as the columns: 'wt1'..'wt5' followed by 'ko1'..'ko5'
wt = [f'wt{n}' for n in range(1, 6)]
ko = [f'ko{n}' for n in range(1, 6)]

# Empty table (no values supplied yet): one row per gene, one column per
# sample, with the 'wt' columns placed before the 'ko' columns
data = pd.DataFrame(index=genes, columns=wt + ko)