HBD(mol), float(MW(mol)), logP(mol),float(TPSA(mol)),num_rotatable_bonds(mol),num_heavy_atoms(mol),smiles...)
# Use the "CHEMBL_ID" column as the row index; inplace=True mutates
# `dataframe` directly instead of returning a new frame.
dataframe.set_index("CHEMBL_ID",inplace=True)
PCA分析:PCA(主成分分析,Principal Component Analysis)是一种常用的数据降维方法
#PCA分析
pca1=PCA(dataframe.drop(['smiles...#运用随机森林模型,并为其选择有用数据
# Build the modelling table: all rows, only the "smiles" and "activity" columns.
model=dataframe.loc[:,["smiles", "activity"]]
# Iterated below as (desc_name, function) pairs.
# NOTE(review): presumably RDKit's Descriptors.descList — confirm against the imports.
desc_list = Descriptors.descList
# NOTE(review): the start of this statement is elided ("...") in the source, so
# the assignment target and input column cannot be seen. The surviving lambda
# maps x to -log10(x / 1e9); presumably converting an nM activity to a
# p-scale value (e.g. pIC50) — verify units against the data source.
model...lambda x : -1.0 * np.log10(x / 1.0e9))
# For each descriptor, collect its value for every SMILES string in the table.
# NOTE(review): indentation was lost in this file; the nesting described here
# is inferred from statement order — restore it before running.
for desc_name, function in desc_list:
# Fresh accumulator for the current descriptor.
values = []
# NOTE(review): the loop header contains an elision ("..."); it iterates over
# model["smiles"], presumably binding each entry to `smiles`.
for smiles...in model["smiles"]:
# Parse the SMILES string into a molecule object.
# NOTE(review): if nested as inferred, every molecule is re-parsed once per
# descriptor; parsing once up front would avoid the repeated work.
# NOTE(review): no handling for a SMILES string that fails to parse — confirm
# what MolFromSmiles returns in that case and whether `function` tolerates it.
mol = MolFromSmiles(smiles)
# Apply the current descriptor function to the molecule and record the result.
values.append(function(mol))
# NOTE(review): `values` is never stored anywhere in the visible code; this
# line may be a truncated assignment such as a new column on `model`, or just
# a notebook display of the frame — confirm against the original notebook.
model