In [ ]:
# Import Libraries
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn.impute import KNNImputer
from sklearn.preprocessing import LabelEncoder, OneHotEncoder, TargetEncoder
In [337]:
# load data
final_data = pd.read_csv('gdsc_dataset.csv')
In [338]:
# Overview data
print(final_data.info())
<class 'pandas.core.frame.DataFrame'> RangeIndex: 242036 entries, 0 to 242035 Data columns (total 22 columns): # Column Non-Null Count Dtype --- ------ -------------- ----- 0 COSMIC_ID 242036 non-null int64 1 CELL_LINE_NAME 242036 non-null object 2 TCGA_DESC 240969 non-null object 3 DRUG_ID 242036 non-null int64 4 DRUG_NAME 242036 non-null object 5 PATHWAY_NAME 242036 non-null object 6 MIN_CONC 242036 non-null float64 7 MAX_CONC 242036 non-null float64 8 LN_IC50 242036 non-null float64 9 AUC 242036 non-null float64 10 RMSE 242036 non-null float64 11 Z_SCORE 242036 non-null float64 12 Whole Exome Sequencing (WES) 232670 non-null object 13 Gene Expression 232670 non-null object 14 Methylation 232670 non-null object 15 Drug Response 232670 non-null object 16 GDSC Tissue descriptor 1 232670 non-null object 17 GDSC Tissue descriptor 2 232670 non-null object 18 CANCER_TYPE 190589 non-null object 19 MSI 229683 non-null object 20 Growth Properties 232670 non-null object 21 TARGET 214881 non-null object dtypes: float64(6), int64(2), object(14) memory usage: 40.6+ MB None
In [339]:
# Statistical information of numeric features
numeric_cols = ['MIN_CONC','MAX_CONC','LN_IC50', 'AUC', 'RMSE', 'Z_SCORE']
final_data[numeric_cols].describe()
Out[339]:
MIN_CONC | MAX_CONC | LN_IC50 | AUC | RMSE | Z_SCORE | |
---|---|---|---|---|---|---|
count | 242036.000000 | 242036.000000 | 242036.000000 | 242036.000000 | 242036.000000 | 2.420360e+05 |
mean | 0.023143 | 23.462279 | 2.817079 | 0.882592 | 0.082779 | 7.312962e-10 |
std | 0.158738 | 158.622810 | 2.762229 | 0.146998 | 0.042695 | 9.993925e-01 |
min | 0.000010 | 0.010000 | -8.747724 | 0.006282 | 0.003274 | -8.254501e+00 |
25% | 0.003002 | 3.000000 | 1.508018 | 0.849449 | 0.051107 | -6.568485e-01 |
50% | 0.010005 | 10.000000 | 3.236731 | 0.944196 | 0.076083 | 1.058000e-02 |
75% | 0.010005 | 10.000000 | 4.700110 | 0.974934 | 0.106105 | 6.560362e-01 |
max | 2.001054 | 2000.000000 | 13.820189 | 0.998904 | 0.299984 | 7.978776e+00 |
In [340]:
# Check for outliers through graphs
for column in numeric_cols:
plt.figure(figsize=(5, 5))
sns.histplot(x=column, data=final_data, alpha=0.2, bins = 50)
plt.title(column)
plt.show()
In [341]:
# MAX and MIN concentration top lining: check 2000 for MAX and 2 for MIN
print(final_data['MAX_CONC'].value_counts())
print(final_data['MIN_CONC'].value_counts())
# No outliers to drop
MAX_CONC 10.000000 142075 1.000000 22188 2.000000 13576 3.000000 13575 5.000000 10618 20.000000 7077 30.000000 6874 0.100000 5013 4.000000 3129 0.010000 2800 100.000000 1788 0.020000 1686 2000.000000 1467 0.500000 1383 0.250000 1185 0.012500 967 2.500000 962 0.800000 942 32.000000 743 121.000000 735 640.000000 732 40.000000 731 6.000000 715 8.000000 468 50.000000 370 0.200000 225 0.316256 12 Name: count, dtype: int64 MIN_CONC 0.010005 128564 0.001001 23120 0.002001 14619 0.003002 14198 0.005003 12855 0.020011 7684 0.030016 6825 0.000100 5499 0.004002 5396 0.000010 2918 0.000250 2572 0.100053 1788 0.000020 1693 0.009766 1548 2.001054 1467 0.000500 1395 0.008004 1036 0.007813 972 0.000800 942 0.000013 916 0.002501 892 0.015625 744 0.121064 735 0.640337 732 0.040021 731 0.000977 389 0.050026 370 0.004883 315 0.003906 306 0.000200 225 0.000098 219 0.019531 126 0.009491 94 0.000012 51 0.029297 49 0.001953 48 0.006003 1 0.005859 1 0.000195 1 Name: count, dtype: int64
In [342]:
# Statistical information and unique values of categorical features
# Check need of one - hot encoding; especially for cell line name and drug name
final_data.select_dtypes(include= 'object').describe().transpose()
Out[342]:
count | unique | top | freq | |
---|---|---|---|---|
CELL_LINE_NAME | 242036 | 969 | PC-14 | 295 |
TCGA_DESC | 240969 | 32 | UNCLASSIFIED | 45691 |
DRUG_NAME | 242036 | 286 | Ulixertinib | 1698 |
PATHWAY_NAME | 242036 | 24 | Unclassified | 24979 |
Whole Exome Sequencing (WES) | 232670 | 1 | Y | 232670 |
Gene Expression | 232670 | 2 | Y | 227886 |
Methylation | 232670 | 2 | Y | 225082 |
Drug Response | 232670 | 2 | Y | 231244 |
GDSC Tissue descriptor 1 | 232670 | 19 | lung_NSCLC | 26977 |
GDSC Tissue descriptor 2 | 232670 | 54 | lung_NSCLC_adenocarcinoma | 16112 |
CANCER_TYPE | 190589 | 31 | LUAD | 15483 |
MSI | 229683 | 2 | MSS/MSI-L | 214105 |
Growth Properties | 232670 | 3 | Adherent | 168431 |
TARGET | 214881 | 185 | PARP1, PARP2 | 4714 |
In [343]:
# Overview unique values of categorical columns
cat_cols = final_data.select_dtypes(include='object').columns
for col in cat_cols:
print(f"\nTop values for '{col}':")
print(final_data[col].value_counts().head(10))
Top values for 'CELL_LINE_NAME': CELL_LINE_NAME PC-14 295 SW620 295 HT-29 295 U-2-OS 294 MHH-ES-1 294 C32 294 A375 294 HCC70 284 MDA-MB-157 284 EFM-19 284 Name: count, dtype: int64 Top values for 'TCGA_DESC': TCGA_DESC UNCLASSIFIED 45691 LUAD 15653 SCLC 13570 BRCA 13106 SKCM 12637 COREAD 12538 HNSC 9358 ESCA 9126 GBM 8384 OV 8166 Name: count, dtype: int64 Top values for 'DRUG_NAME': DRUG_NAME Ulixertinib 1698 Oxaliplatin 1684 Fulvestrant 1680 Selumetinib 1666 Dactinomycin 1659 Docetaxel 1637 GSK343 1634 Uprosertib 1634 Acetalax 1434 MG-132 969 Name: count, dtype: int64 Top values for 'PATHWAY_NAME': PATHWAY_NAME Unclassified 24979 PI3K/MTOR signaling 22724 Other 21402 DNA replication 17650 Other, kinases 17277 ERK MAPK signaling 13350 Genome integrity 12221 Cell cycle 11620 Apoptosis regulation 10828 Chromatin histone methylation 10612 Name: count, dtype: int64 Top values for 'Whole Exome Sequencing (WES)': Whole Exome Sequencing (WES) Y 232670 Name: count, dtype: int64 Top values for 'Gene Expression': Gene Expression Y 227886 N 4784 Name: count, dtype: int64 Top values for 'Methylation': Methylation Y 225082 N 7588 Name: count, dtype: int64 Top values for 'Drug Response': Drug Response Y 231244 N 1426 Name: count, dtype: int64 Top values for 'GDSC Tissue descriptor 1': GDSC Tissue descriptor 1 lung_NSCLC 26977 urogenital_system 25707 leukemia 20484 aero_dig_tract 18583 lymphoma 16747 lung_SCLC 13750 breast 13388 nervous_system 12894 skin 12636 large_intestine 12438 Name: count, dtype: int64 Top values for 'GDSC Tissue descriptor 2': GDSC Tissue descriptor 2 lung_NSCLC_adenocarcinoma 16112 lung_small_cell_carcinoma 13750 breast 13388 large_intestine 12438 melanoma 12097 glioma 11822 ovary 10434 head and neck 9457 oesophagus 9126 B_cell_lymphoma 7978 Name: count, dtype: int64 Top values for 'CANCER_TYPE': CANCER_TYPE LUAD 15483 SCLC 13750 BRCA 13106 COAD/READ 12438 SKCM 12097 HNSC 9178 ESCA 9126 GBM 8384 OV 8166 DLBC 7978 Name: count, dtype: int64 Top values for 'MSI': MSI MSS/MSI-L 214105 MSI-H 15578 Name: count, dtype: int64 Top values for 'Growth Properties': Growth Properties Adherent 168431 Suspension 56814 Semi-Adherent 7425 Name: count, dtype: int64 Top values for 'TARGET': TARGET PARP1, PARP2 4714 MEK1, MEK2 4547 TOP1 4325 EGFR 3836 TNKS1, TNKS2 3699 AKT1, AKT2, AKT3 3308 DOT1L 2873 IGF1R, IR 2872 BRAF 2859 ATR 2803 Name: count, dtype: int64
In [344]:
# Check if Drug Id and drug name values match
print(final_data['DRUG_ID'].nunique())
# Numbers are not same
# Check if COSMIC ID and cell line name values match
print(final_data['COSMIC_ID'].nunique())
# unique values are same: 979
295 969
In [345]:
# Figuring out which drug names have multiple IDs
drug_map = final_data[['DRUG_ID','DRUG_NAME']]
id_per_name = final_data.groupby('DRUG_NAME')['DRUG_ID'].nunique()
duplicates = id_per_name[id_per_name > 1]
print(f"Drug names linked to multiple IDs: {len(duplicates)}")
print(duplicates)
print()
# Get the pairs that aren't 1-to-1
conflicting_pairs = drug_map.drop_duplicates()
conflicting = conflicting_pairs[conflicting_pairs['DRUG_NAME'].isin(duplicates.index)]
conflicting_sorted = conflicting.sort_values('DRUG_NAME')
print(conflicting_sorted)
print()
Drug names linked to multiple IDs: 9 DRUG_NAME Acetalax 2 Dactinomycin 2 Docetaxel 2 Fulvestrant 2 GSK343 2 Oxaliplatin 2 Selumetinib 2 Ulixertinib 2 Uprosertib 2 Name: DRUG_ID, dtype: int64 DRUG_ID DRUG_NAME 145052 1804 Acetalax 144335 1803 Acetalax 180104 1911 Dactinomycin 148637 1811 Dactinomycin 153655 1819 Docetaxel 3212 1007 Docetaxel 69109 1200 Fulvestrant 152221 1816 Fulvestrant 207847 2037 GSK343 117542 1627 GSK343 145769 1806 Oxaliplatin 55178 1089 Oxaliplatin 133166 1736 Selumetinib 42959 1062 Selumetinib 215011 2047 Ulixertinib 177231 1908 Ulixertinib 90529 1553 Uprosertib 218768 2106 Uprosertib
In [346]:
# Keep one DRUG_ID per DRUG_NAME (e.g., the smallest)
remapping_dict = { 1804:1803, 1911:1811, 1819:1007, 1200:1816, 2037:1627, 1806:1089, 1736:1062, 2047:1908, 1553:2106 }
final_data['DRUG_ID'] = final_data['DRUG_ID'].replace(remapping_dict)
# Check if Drug Id and drug name values match
print(final_data['DRUG_ID'].nunique())
# Numbers are same
# Will be using Drug ID instead of Drug Name
final_data.drop(columns = 'DRUG_ID')
286
Out[346]:
COSMIC_ID | CELL_LINE_NAME | TCGA_DESC | DRUG_NAME | PATHWAY_NAME | MIN_CONC | MAX_CONC | LN_IC50 | AUC | RMSE | ... | Whole Exome Sequencing (WES) | Gene Expression | Methylation | Drug Response | GDSC Tissue descriptor 1 | GDSC Tissue descriptor 2 | CANCER_TYPE | MSI | Growth Properties | TARGET | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | 683667 | PFSK-1 | MB | Camptothecin | DNA replication | 0.000100 | 0.1 | -1.463887 | 0.930220 | 0.089052 | ... | Y | Y | Y | Y | nervous_system | medulloblastoma | MB | MSS/MSI-L | Adherent | TOP1 |
1 | 684052 | A673 | UNCLASSIFIED | Camptothecin | DNA replication | 0.000100 | 0.1 | -4.869455 | 0.614970 | 0.111351 | ... | Y | Y | Y | Y | soft_tissue | rhabdomyosarcoma | NaN | MSS/MSI-L | Adherent | TOP1 |
2 | 684057 | ES5 | UNCLASSIFIED | Camptothecin | DNA replication | 0.000100 | 0.1 | -3.360586 | 0.791072 | 0.142855 | ... | Y | Y | Y | Y | bone | ewings_sarcoma | NaN | MSS/MSI-L | Adherent | TOP1 |
3 | 684059 | ES7 | UNCLASSIFIED | Camptothecin | DNA replication | 0.000100 | 0.1 | -5.044940 | 0.592660 | 0.135539 | ... | Y | Y | Y | Y | bone | ewings_sarcoma | NaN | MSS/MSI-L | Adherent | TOP1 |
4 | 684062 | EW-11 | UNCLASSIFIED | Camptothecin | DNA replication | 0.000100 | 0.1 | -3.741991 | 0.734047 | 0.128059 | ... | Y | Y | Y | Y | bone | ewings_sarcoma | NaN | MSS/MSI-L | Adherent | TOP1 |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
242031 | 1659928 | SNU-175 | COREAD | N-acetyl cysteine | Metabolism | 2.001054 | 2000.0 | 10.127082 | 0.976746 | 0.074498 | ... | Y | Y | Y | Y | large_intestine | large_intestine | COAD/READ | MSI-H | Suspension | Metabolism |
242032 | 1660034 | SNU-407 | COREAD | N-acetyl cysteine | Metabolism | 2.001054 | 2000.0 | 8.576377 | 0.913378 | 0.057821 | ... | Y | Y | Y | Y | large_intestine | large_intestine | COAD/READ | MSI-H | Adherent | Metabolism |
242033 | 1660035 | SNU-61 | COREAD | N-acetyl cysteine | Metabolism | 2.001054 | 2000.0 | 10.519636 | 0.975001 | 0.058090 | ... | Y | Y | Y | Y | large_intestine | large_intestine | COAD/READ | MSS/MSI-L | Adherent | Metabolism |
242034 | 1674021 | SNU-C5 | COREAD | N-acetyl cysteine | Metabolism | 2.001054 | 2000.0 | 10.694579 | 0.969969 | 0.101013 | ... | Y | Y | Y | Y | large_intestine | large_intestine | COAD/READ | MSI-H | Adherent | Metabolism |
242035 | 1789883 | DiFi | COREAD | N-acetyl cysteine | Metabolism | 2.001054 | 2000.0 | 10.034825 | 0.966988 | 0.089057 | ... | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | Metabolism |
242036 rows × 21 columns
In [347]:
# Check for missing values
print(final_data.isnull().sum())
COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1067 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 9366 Gene Expression 9366 Methylation 9366 Drug Response 9366 GDSC Tissue descriptor 1 9366 GDSC Tissue descriptor 2 9366 CANCER_TYPE 51447 MSI 12353 Growth Properties 9366 TARGET 27155 dtype: int64
In [348]:
# Check for missing values
def check_missing_values_by_drug(df):
missing_values = {}
for drug in df['DRUG_NAME'].unique():
drug_data = df[df['DRUG_NAME'] == drug]
missing_values[drug] =drug_data.isnull().sum()
return missing_values
drug_missing_values = check_missing_values_by_drug(final_data)
for drug, missing_counts in drug_missing_values.items():
print(f"\nMissing values for {drug}:")
print(missing_counts)
print(f"Total missing values: {missing_counts.sum()}")
print("-" * 50)
Missing values for Camptothecin: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 205 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 537 -------------------------------------------------- Missing values for Vinblastine: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 24 Gene Expression 24 Methylation 24 Drug Response 24 GDSC Tissue descriptor 1 24 GDSC Tissue descriptor 2 24 CANCER_TYPE 158 MSI 28 Growth Properties 24 TARGET 0 dtype: int64 Total missing values: 355 -------------------------------------------------- Missing values for Cisplatin: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 159 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 364 -------------------------------------------------- Missing values for Cytarabine: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 159 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 364 -------------------------------------------------- Missing values for Docetaxel: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 65 Gene Expression 65 Methylation 65 Drug Response 65 GDSC Tissue descriptor 1 65 GDSC Tissue descriptor 2 65 CANCER_TYPE 352 MSI 84 Growth Properties 65 TARGET 0 dtype: int64 Total missing values: 897 -------------------------------------------------- Missing values for Methotrexate: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 36 Gene Expression 36 Methylation 36 Drug Response 36 GDSC Tissue descriptor 1 36 GDSC Tissue descriptor 2 36 CANCER_TYPE 176 MSI 49 Growth Properties 36 TARGET 0 dtype: int64 Total missing values: 483 -------------------------------------------------- Missing values for Tretinoin: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 14 Gene Expression 14 Methylation 14 Drug Response 14 GDSC Tissue descriptor 1 14 GDSC Tissue descriptor 2 14 CANCER_TYPE 47 MSI 24 Growth Properties 14 TARGET 0 dtype: int64 Total missing values: 174 -------------------------------------------------- Missing values for Gefitinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Navitoclax: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Vorinostat: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Nilotinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 203 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 535 -------------------------------------------------- Missing values for Refametinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 200 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 524 -------------------------------------------------- Missing values for Temsirolimus: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 193 MSI 50 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 515 -------------------------------------------------- Missing values for Olaparib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Veliparib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 200 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 524 -------------------------------------------------- Missing values for Bosutinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 200 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 524 -------------------------------------------------- Missing values for Lenalidomide: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 200 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 524 -------------------------------------------------- Missing values for Axitinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for AZD7762: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for GW441756: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 203 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 535 -------------------------------------------------- Missing values for Lestaurtinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 200 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 524 -------------------------------------------------- Missing values for SB216763: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 203 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 535 -------------------------------------------------- Missing values for Tanespimycin: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 200 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 524 -------------------------------------------------- Missing values for Motesanib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 200 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 524 -------------------------------------------------- Missing values for KU-55933: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 203 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 535 -------------------------------------------------- Missing values for Elesclomol: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 14 Gene Expression 14 Methylation 14 Drug Response 14 GDSC Tissue descriptor 1 14 GDSC Tissue descriptor 2 14 CANCER_TYPE 47 MSI 24 Growth Properties 14 TARGET 0 dtype: int64 Total missing values: 174 -------------------------------------------------- Missing values for Afatinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Vismodegib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 200 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 524 -------------------------------------------------- Missing values for Staurosporine: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 205 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 537 -------------------------------------------------- Missing values for PLX-4720: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 203 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 535 -------------------------------------------------- Missing values for BX795: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 14 Gene Expression 14 Methylation 14 Drug Response 14 GDSC Tissue descriptor 1 14 GDSC Tissue descriptor 2 14 CANCER_TYPE 47 MSI 24 Growth Properties 14 TARGET 0 dtype: int64 Total missing values: 174 -------------------------------------------------- Missing values for NU7441: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 202 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 534 -------------------------------------------------- Missing values for SL0101: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 14 Gene Expression 14 Methylation 14 Drug Response 14 GDSC Tissue descriptor 1 14 GDSC Tissue descriptor 2 14 CANCER_TYPE 47 MSI 24 Growth Properties 14 TARGET 0 dtype: int64 Total missing values: 174 -------------------------------------------------- Missing values for Doramapimod: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 203 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 535 -------------------------------------------------- Missing values for JNK Inhibitor VIII: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 202 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 534 -------------------------------------------------- Missing values for Wee1 Inhibitor: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Nutlin-3a (-): COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Mirin: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 188 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 479 -------------------------------------------------- Missing values for PD173074: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for ZM447439: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 202 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 534 -------------------------------------------------- Missing values for Alisertib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 201 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 533 -------------------------------------------------- Missing values for RO-3306: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 203 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 535 -------------------------------------------------- Missing values for MK-2206: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Palbociclib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Dactolisib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Pictilisib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for AZD8055: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 157 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 362 -------------------------------------------------- Missing values for PD0325901: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 205 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 537 -------------------------------------------------- Missing values for SB590885: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 202 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 534 -------------------------------------------------- Missing values for Selumetinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 64 Gene Expression 64 Methylation 64 Drug Response 64 GDSC Tissue descriptor 1 64 GDSC Tissue descriptor 2 64 CANCER_TYPE 355 MSI 83 Growth Properties 64 TARGET 0 dtype: int64 Total missing values: 892 -------------------------------------------------- Missing values for CCT007093: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 200 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 532 -------------------------------------------------- Missing values for Obatoclax Mesylate: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 30 Gene Expression 30 Methylation 30 Drug Response 30 GDSC Tissue descriptor 1 30 GDSC Tissue descriptor 2 30 CANCER_TYPE 170 MSI 35 Growth Properties 30 TARGET 0 dtype: int64 Total missing values: 416 -------------------------------------------------- Missing values for EHT-1864: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 202 MSI 52 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 533 -------------------------------------------------- Missing values for Avagacestat: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for 5-Fluorouracil: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Dasatinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 203 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 535 -------------------------------------------------- Missing values for Paclitaxel: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Crizotinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 203 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 535 -------------------------------------------------- Missing values for Rapamycin: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 200 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 524 -------------------------------------------------- Missing values for Sorafenib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for BI-2536: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 196 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 520 -------------------------------------------------- Missing values for Irinotecan: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Oxaliplatin: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 65 Gene Expression 65 Methylation 65 Drug Response 65 GDSC Tissue descriptor 1 65 GDSC Tissue descriptor 2 65 CANCER_TYPE 359 MSI 84 Growth Properties 65 TARGET 0 dtype: int64 Total missing values: 904 -------------------------------------------------- Missing values for BMS-536924: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for GSK1904529A: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Tozasertib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 14 Gene Expression 14 Methylation 14 Drug Response 14 GDSC Tissue descriptor 1 14 GDSC Tissue descriptor 2 14 CANCER_TYPE 48 MSI 25 Growth Properties 14 TARGET 0 dtype: int64 Total missing values: 176 -------------------------------------------------- Missing values for PF-4708671: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 14 Gene Expression 14 Methylation 14 Drug Response 14 GDSC Tissue descriptor 1 14 GDSC Tissue descriptor 2 14 CANCER_TYPE 48 MSI 25 Growth Properties 14 TARGET 0 dtype: int64 Total missing values: 176 -------------------------------------------------- Missing values for PRIMA-1MET: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 188 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 479 -------------------------------------------------- Missing values for Serdemetan: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 199 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 523 -------------------------------------------------- Missing values for TW 37: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 12 Gene Expression 12 Methylation 12 Drug Response 12 GDSC Tissue descriptor 1 12 GDSC Tissue descriptor 2 12 CANCER_TYPE 81 MSI 13 Growth Properties 12 TARGET 0 dtype: int64 Total missing values: 179 -------------------------------------------------- Missing values for Erlotinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 203 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 535 -------------------------------------------------- Missing values for CCT-018159: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 14 Gene Expression 14 Methylation 14 Drug Response 14 GDSC Tissue descriptor 1 14 GDSC Tissue descriptor 2 14 CANCER_TYPE 47 MSI 24 Growth Properties 14 TARGET 0 dtype: int64 Total missing values: 174 -------------------------------------------------- Missing values for Rucaparib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 200 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 524 -------------------------------------------------- Missing values for Niraparib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 188 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 479 -------------------------------------------------- Missing values for MK-1775: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Dinaciclib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 189 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 480 -------------------------------------------------- Missing values for Gemcitabine: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 202 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 534 -------------------------------------------------- Missing values for Bortezomib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for GSK269962A: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 14 Gene Expression 14 Methylation 14 Drug Response 14 GDSC Tissue descriptor 1 14 GDSC Tissue descriptor 2 14 CANCER_TYPE 48 MSI 25 Growth Properties 14 TARGET 0 dtype: int64 Total missing values: 176 -------------------------------------------------- Missing values for SB505124: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 15 Gene Expression 15 Methylation 15 Drug Response 15 GDSC Tissue descriptor 1 15 GDSC Tissue descriptor 2 15 CANCER_TYPE 48 MSI 25 Growth Properties 15 TARGET 0 dtype: int64 Total missing values: 183 -------------------------------------------------- Missing values for Tamoxifen: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 203 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 535 -------------------------------------------------- Missing values for Fulvestrant: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 65 Gene Expression 65 Methylation 65 Drug Response 65 GDSC Tissue descriptor 1 65 GDSC Tissue descriptor 2 65 CANCER_TYPE 359 MSI 84 Growth Properties 65 TARGET 0 dtype: int64 Total missing values: 904 -------------------------------------------------- Missing values for EPZ004777: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for YK-4-279: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Piperlongumine: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 14 Gene Expression 14 Methylation 14 Drug Response 14 GDSC Tissue descriptor 1 14 GDSC Tissue descriptor 2 14 CANCER_TYPE 47 MSI 24 Growth Properties 14 TARGET 0 dtype: int64 Total missing values: 174 -------------------------------------------------- Missing values for Daporinad: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 127 MSI 37 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 352 -------------------------------------------------- Missing values for BMS-345541: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 187 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 478 -------------------------------------------------- Missing values for AZ960: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 186 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 477 -------------------------------------------------- Missing values for Talazoparib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 203 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 535 -------------------------------------------------- Missing values for XAV939: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 187 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 478 -------------------------------------------------- Missing values for Trametinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Dabrafenib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 202 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 534 -------------------------------------------------- Missing values for Temozolomide: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Bleomycin (50 uM): COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 24 Gene Expression 24 Methylation 24 Drug Response 24 GDSC Tissue descriptor 1 24 GDSC Tissue descriptor 2 24 CANCER_TYPE 155 MSI 28 Growth Properties 24 TARGET 0 dtype: int64 Total missing values: 352 -------------------------------------------------- Missing values for AZD5438: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for IAP_5620: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for AZD2014: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for AZD1208: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 154 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 367 -------------------------------------------------- Missing values for AZD1332: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for SN-38: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 203 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 535 -------------------------------------------------- Missing values for Bicalutamide: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 14 Gene Expression 14 Methylation 14 Drug Response 14 GDSC Tissue descriptor 1 14 GDSC Tissue descriptor 2 14 CANCER_TYPE 47 MSI 24 Growth Properties 14 TARGET 0 dtype: int64 Total missing values: 174 -------------------------------------------------- Missing values for Ruxolitinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 35 Gene Expression 35 Methylation 35 Drug Response 35 GDSC Tissue descriptor 1 35 GDSC Tissue descriptor 2 35 CANCER_TYPE 189 MSI 49 Growth Properties 35 TARGET 0 dtype: int64 Total missing values: 488 -------------------------------------------------- Missing values for Linsitinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Epirubicin: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Cyclophosphamide: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Pevonedistat: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Sapitinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Uprosertib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 58 Gene Expression 58 Methylation 58 Drug Response 58 GDSC Tissue descriptor 1 58 GDSC Tissue descriptor 2 58 CANCER_TYPE 344 MSI 76 Growth Properties 58 TARGET 0 dtype: int64 Total missing values: 832 -------------------------------------------------- Missing values for LCL161: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 187 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 478 -------------------------------------------------- Missing values for Lapatinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Luminespib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 203 MSI 52 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 534 -------------------------------------------------- Missing values for Alpelisib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Taselisib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 52 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 535 -------------------------------------------------- Missing values for EPZ5676: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 203 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 535 -------------------------------------------------- Missing values for SCH772984: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for IWP-2: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 188 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 479 -------------------------------------------------- Missing values for Leflunomide: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 188 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 479 -------------------------------------------------- Missing values for GSK2801: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for Bromosporine: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 154 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 367 -------------------------------------------------- Missing values for SGC-CBP30: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 154 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 367 -------------------------------------------------- Missing values for GSK-LSD1: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 154 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 367 -------------------------------------------------- Missing values for BDOCA000347a: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for BDF00022089a: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for BDILV000379a: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for Entinostat: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 189 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 480 -------------------------------------------------- Missing values for OSI-027: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for LGK974: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for VE-822: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 189 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 480 -------------------------------------------------- Missing values for WZ4003: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 189 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 480 -------------------------------------------------- Missing values for CZC24832: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 189 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 480 -------------------------------------------------- Missing values for AZD5582: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 33 Gene Expression 33 Methylation 33 Drug Response 33 GDSC Tissue descriptor 1 33 GDSC Tissue descriptor 2 33 CANCER_TYPE 185 MSI 47 Growth Properties 33 TARGET 0 dtype: int64 Total missing values: 468 -------------------------------------------------- Missing values for GSK2606414: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 185 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 476 -------------------------------------------------- Missing values for PFI3: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 189 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 480 -------------------------------------------------- Missing values for PCI-34051: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 189 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 480 -------------------------------------------------- Missing values for Wnt-C59: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 189 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 480 -------------------------------------------------- Missing values for I-BET-762: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 188 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 479 -------------------------------------------------- Missing values for RVX-208: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 188 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 479 -------------------------------------------------- Missing values for OTX015: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 189 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 480 -------------------------------------------------- Missing values for GSK343: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 59 Gene Expression 59 Methylation 59 Drug Response 59 GDSC Tissue descriptor 1 59 GDSC Tissue descriptor 2 59 CANCER_TYPE 346 MSI 77 Growth Properties 59 TARGET 0 dtype: int64 Total missing values: 842 -------------------------------------------------- Missing values for ML323: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 188 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 479 -------------------------------------------------- Missing values for Entospletinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 189 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 480 -------------------------------------------------- Missing values for PRT062607: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 189 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 480 -------------------------------------------------- Missing values for Ribociclib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for AGI-6780: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 189 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 480 -------------------------------------------------- Missing values for Picolinici-acid: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 189 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 480 -------------------------------------------------- Missing values for AZD5153: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for CDK9_5576: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 154 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 367 -------------------------------------------------- Missing values for CDK9_5038: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 154 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 367 -------------------------------------------------- Missing values for Eg5_9814: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 153 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 366 -------------------------------------------------- Missing values for ERK_2440: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for ERK_6604: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for IRAK4_4710: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for JAK1_8709: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for AZD5991: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 152 MSI 30 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 357 -------------------------------------------------- Missing values for PAK_5339: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for TAF1_5496: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 154 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 367 -------------------------------------------------- Missing values for ULK1_4989: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 154 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 367 -------------------------------------------------- Missing values for VSP34_8731: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for IGF1R_3801: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for JAK_8517: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for GSK2256098C: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for GSK2276186C: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for GSK2110183B: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for GSK626616AC: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for GSK3337463A: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for GSK2830371A: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for LMB_AB1: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for LMB_AB2: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for LMB_AB3: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for AZD4547: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Ibrutinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 189 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 480 -------------------------------------------------- Missing values for Zoledronate: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for Acetalax: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 52 Gene Expression 52 Methylation 52 Drug Response 52 GDSC Tissue descriptor 1 52 GDSC Tissue descriptor 2 52 CANCER_TYPE 310 MSI 62 Growth Properties 52 TARGET 1434 dtype: int64 Total missing values: 2170 -------------------------------------------------- Missing values for Topotecan: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for Teniposide: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for Mitoxantrone: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for Dactinomycin: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 65 Gene Expression 65 Methylation 65 Drug Response 65 GDSC Tissue descriptor 1 65 GDSC Tissue descriptor 2 65 CANCER_TYPE 357 MSI 84 Growth Properties 65 TARGET 0 dtype: int64 Total missing values: 902 -------------------------------------------------- Missing values for Bleomycin: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for Fludarabine: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for Nelarabine: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 716 dtype: int64 Total missing values: 1084 -------------------------------------------------- Missing values for Dacarbazine: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for Romidepsin: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for 123829: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for 765771: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for 123138: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for Podophyllotoxin bromide: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for 50869: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for Dihydrorotenone: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 715 dtype: int64 Total missing values: 1083 -------------------------------------------------- Missing values for 720427: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for 667880: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for Gallibiscoquinazole: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for L-Oxonoreleagnine: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for 729189: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for 741909: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for 743380: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for Elephantin: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for 150412: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for Sinularin: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for 615590: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for 630600: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for LMP744: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 0 dtype: int64 Total missing values: 368 -------------------------------------------------- Missing values for 776928: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 154 MSI 31 Growth Properties 26 TARGET 716 dtype: int64 Total missing values: 1083 -------------------------------------------------- Missing values for Schweinfurthin A: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 716 dtype: int64 Total missing values: 1084 -------------------------------------------------- Missing values for BEN: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 26 Gene Expression 26 Methylation 26 Drug Response 26 GDSC Tissue descriptor 1 26 GDSC Tissue descriptor 2 26 CANCER_TYPE 155 MSI 31 Growth Properties 26 TARGET 717 dtype: int64 Total missing values: 1085 -------------------------------------------------- Missing values for Sabutoclax: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 188 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 479 -------------------------------------------------- Missing values for LY2109761: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 188 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 479 -------------------------------------------------- Missing values for OF-1: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 189 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 480 -------------------------------------------------- Missing values for MN-64: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 189 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 480 -------------------------------------------------- Missing values for KRAS (G12C) Inhibitor-12: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 34 Gene Expression 34 Methylation 34 Drug Response 34 GDSC Tissue descriptor 1 34 GDSC Tissue descriptor 2 34 CANCER_TYPE 189 MSI 48 Growth Properties 34 TARGET 0 dtype: int64 Total missing values: 480 -------------------------------------------------- Missing values for MG-132: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 205 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 537 -------------------------------------------------- Missing values for BDP-00009066: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 159 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 364 -------------------------------------------------- Missing values for Buparlisib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Ulixertinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 7 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 64 Gene Expression 64 Methylation 64 Drug Response 64 GDSC Tissue descriptor 1 64 GDSC Tissue descriptor 2 64 CANCER_TYPE 361 MSI 82 Growth Properties 64 TARGET 0 dtype: int64 Total missing values: 898 -------------------------------------------------- Missing values for Venetoclax: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for ABT737: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Afuresertib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 203 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 535 -------------------------------------------------- Missing values for AGI-5198: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for AZD3759: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for AZD5363: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for AZD6738: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for AZD8186: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Osimertinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 203 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 535 -------------------------------------------------- Missing values for Cediranib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Ipatasertib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for GDC0810: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for GNE-317: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 202 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 526 -------------------------------------------------- Missing values for GSK2578215A: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for I-BRD9: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Telomerase Inhibitor IX: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for MIRA-1: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for NVP-ADW742: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for P22077: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Savolitinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for UMI-77: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 159 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 364 -------------------------------------------------- Missing values for WIKI4: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for Sepantronium bromide: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for MIM1: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 159 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 364 -------------------------------------------------- Missing values for WEHI-539: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 204 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 536 -------------------------------------------------- Missing values for BPD-00008900: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 159 MSI 29 Growth Properties 25 TARGET 743 dtype: int64 Total missing values: 1107 -------------------------------------------------- Missing values for N25720-51-A1: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 159 MSI 29 Growth Properties 25 TARGET 742 dtype: int64 Total missing values: 1106 -------------------------------------------------- Missing values for N27922-53-1: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 159 MSI 29 Growth Properties 25 TARGET 743 dtype: int64 Total missing values: 1107 -------------------------------------------------- Missing values for N30652-18-1: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 159 MSI 29 Growth Properties 25 TARGET 743 dtype: int64 Total missing values: 1107 -------------------------------------------------- Missing values for N29087-69-1: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 159 MSI 29 Growth Properties 25 TARGET 743 dtype: int64 Total missing values: 1107 -------------------------------------------------- Missing values for HKMTI-1-005: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 157 MSI 29 Growth Properties 25 TARGET 741 dtype: int64 Total missing values: 1103 -------------------------------------------------- Missing values for ICL-SIRT078: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 157 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 362 -------------------------------------------------- Missing values for UNC0638: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 157 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 362 -------------------------------------------------- Missing values for AGK2: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 3 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 37 Gene Expression 37 Methylation 37 Drug Response 37 GDSC Tissue descriptor 1 37 GDSC Tissue descriptor 2 37 CANCER_TYPE 197 MSI 48 Growth Properties 37 TARGET 0 dtype: int64 Total missing values: 507 -------------------------------------------------- Missing values for Foretinib: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 202 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 534 -------------------------------------------------- Missing values for BIBR-1532: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 202 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 534 -------------------------------------------------- Missing values for Pyridostatin: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 202 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 534 -------------------------------------------------- Missing values for AMG-319: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 200 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 532 -------------------------------------------------- Missing values for MK-8776: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 202 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 534 -------------------------------------------------- Missing values for Vinorelbine: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 201 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 525 -------------------------------------------------- Missing values for Mycophenolic acid: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 24 Gene Expression 24 Methylation 24 Drug Response 24 GDSC Tissue descriptor 1 24 GDSC Tissue descriptor 2 24 CANCER_TYPE 156 MSI 28 Growth Properties 24 TARGET 737 dtype: int64 Total missing values: 1090 -------------------------------------------------- Missing values for Remodelin: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 12 Gene Expression 12 Methylation 12 Drug Response 12 GDSC Tissue descriptor 1 12 GDSC Tissue descriptor 2 12 CANCER_TYPE 76 MSI 15 Growth Properties 12 TARGET 370 dtype: int64 Total missing values: 545 -------------------------------------------------- Missing values for VX-11e: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 201 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 525 -------------------------------------------------- Missing values for LJI308: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 201 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 525 -------------------------------------------------- Missing values for AZ6102: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 201 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 525 -------------------------------------------------- Missing values for GSK591: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 201 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 525 -------------------------------------------------- Missing values for VE821: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 199 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 523 -------------------------------------------------- Missing values for VTP-A: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 24 Gene Expression 24 Methylation 24 Drug Response 24 GDSC Tissue descriptor 1 24 GDSC Tissue descriptor 2 24 CANCER_TYPE 156 MSI 28 Growth Properties 24 TARGET 737 dtype: int64 Total missing values: 1090 -------------------------------------------------- Missing values for VTP-B: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 24 Gene Expression 24 Methylation 24 Drug Response 24 GDSC Tissue descriptor 1 24 GDSC Tissue descriptor 2 24 CANCER_TYPE 156 MSI 28 Growth Properties 24 TARGET 737 dtype: int64 Total missing values: 1090 -------------------------------------------------- Missing values for PBD-288: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 159 MSI 29 Growth Properties 25 TARGET 741 dtype: int64 Total missing values: 1105 -------------------------------------------------- Missing values for POMHEX: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 159 MSI 29 Growth Properties 25 TARGET 741 dtype: int64 Total missing values: 1105 -------------------------------------------------- Missing values for CT7033-2: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 159 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 364 -------------------------------------------------- Missing values for GSK-LSD1-2HCl : COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 157 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 362 -------------------------------------------------- Missing values for 5-azacytidine: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 158 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 363 -------------------------------------------------- Missing values for A-366: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 159 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 364 -------------------------------------------------- Missing values for CPI-637: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 159 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 364 -------------------------------------------------- Missing values for UNC0379: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 159 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 364 -------------------------------------------------- Missing values for AZD6482: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 14 Gene Expression 14 Methylation 14 Drug Response 14 GDSC Tissue descriptor 1 14 GDSC Tissue descriptor 2 14 CANCER_TYPE 48 MSI 25 Growth Properties 14 TARGET 0 dtype: int64 Total missing values: 176 -------------------------------------------------- Missing values for AT13148: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 200 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 524 -------------------------------------------------- Missing values for BMS-754807: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 200 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 524 -------------------------------------------------- Missing values for JQ1: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 38 Gene Expression 38 Methylation 38 Drug Response 38 GDSC Tissue descriptor 1 38 GDSC Tissue descriptor 2 38 CANCER_TYPE 200 MSI 52 Growth Properties 38 TARGET 0 dtype: int64 Total missing values: 524 -------------------------------------------------- Missing values for PFI-1: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 200 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 532 -------------------------------------------------- Missing values for IOX2: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 14 Gene Expression 14 Methylation 14 Drug Response 14 GDSC Tissue descriptor 1 14 GDSC Tissue descriptor 2 14 CANCER_TYPE 47 MSI 24 Growth Properties 14 TARGET 0 dtype: int64 Total missing values: 174 -------------------------------------------------- Missing values for CHIR-99021: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 5 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 14 Gene Expression 14 Methylation 14 Drug Response 14 GDSC Tissue descriptor 1 14 GDSC Tissue descriptor 2 14 CANCER_TYPE 47 MSI 24 Growth Properties 14 TARGET 0 dtype: int64 Total missing values: 174 -------------------------------------------------- Missing values for SGC0946: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 6 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 39 Gene Expression 39 Methylation 39 Drug Response 39 GDSC Tissue descriptor 1 39 GDSC Tissue descriptor 2 39 CANCER_TYPE 200 MSI 53 Growth Properties 39 TARGET 0 dtype: int64 Total missing values: 532 -------------------------------------------------- Missing values for GSK2830371: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 24 Gene Expression 24 Methylation 24 Drug Response 24 GDSC Tissue descriptor 1 24 GDSC Tissue descriptor 2 24 CANCER_TYPE 155 MSI 28 Growth Properties 24 TARGET 0 dtype: int64 Total missing values: 352 -------------------------------------------------- Missing values for THR-101: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 24 Gene Expression 24 Methylation 24 Drug Response 24 GDSC Tissue descriptor 1 24 GDSC Tissue descriptor 2 24 CANCER_TYPE 155 MSI 28 Growth Properties 24 TARGET 0 dtype: int64 Total missing values: 352 -------------------------------------------------- Missing values for THR-102: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 24 Gene Expression 24 Methylation 24 Drug Response 24 GDSC Tissue descriptor 1 24 GDSC Tissue descriptor 2 24 CANCER_TYPE 155 MSI 28 Growth Properties 24 TARGET 0 dtype: int64 Total missing values: 352 -------------------------------------------------- Missing values for THR-103: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 24 Gene Expression 24 Methylation 24 Drug Response 24 GDSC Tissue descriptor 1 24 GDSC Tissue descriptor 2 24 CANCER_TYPE 155 MSI 28 Growth Properties 24 TARGET 0 dtype: int64 Total missing values: 352 -------------------------------------------------- Missing values for ascorbate (vitamin C): COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 157 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 362 -------------------------------------------------- Missing values for glutathione: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 157 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 362 -------------------------------------------------- Missing values for alpha-lipoic acid: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 155 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 360 -------------------------------------------------- Missing values for N-acetyl cysteine: COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 1 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 25 Gene Expression 25 Methylation 25 Drug Response 25 GDSC Tissue descriptor 1 25 GDSC Tissue descriptor 2 25 CANCER_TYPE 155 MSI 29 Growth Properties 25 TARGET 0 dtype: int64 Total missing values: 360 --------------------------------------------------
Different drugs have different patterns of null data Will be approaching missing values by drugs and by categories
GDSC tissue descriptor / Cancer type / TGCA desc: use related tissue information (mode) within each drug subset
TARGET / PATHWAY_NAME : fill in with unknown
WES / Gene Expression / Methylation: will attempt to impute based on tissue type, then use KNN imputer
MSI, Growth Properties : use mode within each drug subset also
Use KNN imputer, which fills in missing values utilizing KNN algorithm
In [349]:
def handling_null(df):
knn_imputer = KNNImputer(n_neighbors = 5) # Instantiate object
for drug in df['DRUG_NAME'].unique():
drug_data = df[df['DRUG_NAME'] == drug].copy() # Since creating multiple seperate drug datasets use .copy()
# Descriptor information filling
desc_cols = ['TCGA_DESC', 'GDSC Tissue descriptor 1', 'GDSC Tissue descriptor 2', 'CANCER_TYPE']
for col in desc_cols:
if drug_data[col].isnull().any(): # if there are any null values
for other_col in [c for c in desc_cols if c != col]: # Other columns in desc_cols
grouped = drug_data.groupby(other_col)[col] # Group by other columns
modes = grouped.transform(lambda x: x.mode()[0] if not x.mode().empty else 'Unknown') # Return the first mode value if mode is not empty
drug_data[col] = drug_data[col].fillna(modes)
# If still null, use overall mode
drug_data[col] = drug_data[col].fillna(drug_data[col].mode()[0] if not drug_data[col].mode().empty else 'Unknown')
# Target and pathway filling
tp_cols = ['TARGET', 'PATHWAY_NAME']
for col in tp_cols:
if drug_data[col].isnull().all():
drug_data[col] = 'Unknown for this drug'
#else:
#known_target = drug_data[col].dropna().iloc[0]
#drug_data[col] = drug_data[col].fillna(known_target)
# MSI and Growth properties
msi_gp_cols = ['MSI', 'Growth Properties']
for col in msi_gp_cols:
if drug_data[col].isnull().any():
# Group by primary tissue description
drug_data[col] = drug_data.groupby('GDSC Tissue descriptor 1')[col].transform(
lambda x: x.fillna(x.mode()[0] if not x.mode().empty else 'Unknown')
)
# Genomic Features
genomic_cols = ['Whole Exome Sequencing (WES)', 'Gene Expression', 'Methylation', 'Drug Response']
for col in genomic_cols:
if drug_data[col].isnull().any():
# Group by primary tissue description
drug_data[col] = drug_data.groupby('GDSC Tissue descriptor 1')[col].transform(
lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan)
)
# If still null use knn imputer
if drug_data[col].isnull().any():
feature_data = pd.get_dummies(drug_data[col], prefix=col) # One hot encoding
imputed_data = knn_imputer.fit_transform(feature_data)
imputed_df = pd.DataFrame(imputed_data, columns=feature_data.columns, index=feature_data.index)
drug_data[col] = imputed_df.idxmax(axis=1).str.split('_').str[1]
df.loc[df['DRUG_NAME'] == drug] = drug_data
return df
cleaned_data = handling_null(final_data)
/var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan) /var/folders/gn/8692wbbn2jqbdbljkddblglm0000gn/T/ipykernel_77083/1356287288.py:47: FutureWarning: Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)` lambda x: x.fillna(x.mode()[0] if not x.mode().empty else np.nan)
In [350]:
# Check for missing values again
print(cleaned_data.isnull().sum())
COSMIC_ID 0 CELL_LINE_NAME 0 TCGA_DESC 0 DRUG_ID 0 DRUG_NAME 0 PATHWAY_NAME 0 MIN_CONC 0 MAX_CONC 0 LN_IC50 0 AUC 0 RMSE 0 Z_SCORE 0 Whole Exome Sequencing (WES) 0 Gene Expression 0 Methylation 0 Drug Response 0 GDSC Tissue descriptor 1 0 GDSC Tissue descriptor 2 0 CANCER_TYPE 0 MSI 0 Growth Properties 0 TARGET 0 dtype: int64
In [351]:
# Check unique values of features
print(cleaned_data.info())
print(cleaned_data.nunique())
<class 'pandas.core.frame.DataFrame'> RangeIndex: 242036 entries, 0 to 242035 Data columns (total 22 columns): # Column Non-Null Count Dtype --- ------ -------------- ----- 0 COSMIC_ID 242036 non-null int64 1 CELL_LINE_NAME 242036 non-null object 2 TCGA_DESC 242036 non-null object 3 DRUG_ID 242036 non-null int64 4 DRUG_NAME 242036 non-null object 5 PATHWAY_NAME 242036 non-null object 6 MIN_CONC 242036 non-null float64 7 MAX_CONC 242036 non-null float64 8 LN_IC50 242036 non-null float64 9 AUC 242036 non-null float64 10 RMSE 242036 non-null float64 11 Z_SCORE 242036 non-null float64 12 Whole Exome Sequencing (WES) 242036 non-null object 13 Gene Expression 242036 non-null object 14 Methylation 242036 non-null object 15 Drug Response 242036 non-null object 16 GDSC Tissue descriptor 1 242036 non-null object 17 GDSC Tissue descriptor 2 242036 non-null object 18 CANCER_TYPE 242036 non-null object 19 MSI 242036 non-null object 20 Growth Properties 242036 non-null object 21 TARGET 242036 non-null object dtypes: float64(6), int64(2), object(14) memory usage: 40.6+ MB None COSMIC_ID 969 CELL_LINE_NAME 969 TCGA_DESC 32 DRUG_ID 286 DRUG_NAME 286 PATHWAY_NAME 24 MIN_CONC 39 MAX_CONC 27 LN_IC50 237097 AUC 142587 RMSE 118662 Z_SCORE 233614 Whole Exome Sequencing (WES) 1 Gene Expression 2 Methylation 2 Drug Response 2 GDSC Tissue descriptor 1 20 GDSC Tissue descriptor 2 55 CANCER_TYPE 32 MSI 3 Growth Properties 4 TARGET 186 dtype: int64
In [366]:
# Encode categorical features
def encoding_features(df, target = 'LN_IC50'):
# For binary features
binary = [col for col in df.columns if df[col].nunique() == 2]
for feature in binary:
df[feature] = (df[feature] == df[feature].unique()[0]).astype(int) # Creates boolean series consisting of 1 and 0
# For features with small counts of unique value (low-cardinality), use one hot encoder
onehot_encoder = OneHotEncoder(sparse_output=False, handle_unknown='ignore') # sparse=False returns as np array
msi_encoded = onehot_encoder.fit_transform(df[['MSI']])
msi_columns = onehot_encoder.get_feature_names_out(['MSI']) # renames the columns
msi_onehot = pd.DataFrame(msi_encoded, columns=msi_columns, index=df.index)
gp_encoded = onehot_encoder.fit_transform(df[['Growth Properties']])
gp_columns = onehot_encoder.get_feature_names_out(['Growth Properties'])
gp_onehot = pd.DataFrame(gp_encoded, columns=gp_columns, index=df.index)
# For high cardinality features
high_feature = ['TCGA_DESC', 'DRUG_NAME', 'GDSC Tissue descriptor 1', 'GDSC Tissue descriptor 2',
'CANCER_TYPE', 'TARGET', 'PATHWAY_NAME']
target_encoder = TargetEncoder()
df_high_encoded = target_encoder.fit_transform(df[high_feature], df[target])
df_high_encoded = pd.DataFrame(df_high_encoded, columns=high_feature, index=df.index)
# Label encoding for drug ID, cosmic id, and cell line name
label_feature = ['DRUG_ID','COSMIC_ID','CELL_LINE_NAME']
df_label_encoded = pd.DataFrame(index=df.index)
for col in label_feature:
le = LabelEncoder()
df_label_encoded[col] = le.fit_transform(df[col])
# Combine all encoded features
df_encoded = pd.concat([df[binary],msi_onehot, gp_onehot, df_high_encoded, df_label_encoded], axis = 1)
return df_encoded
encoded = encoding_features(cleaned_data)
In [371]:
encoded['LN_IC50']=cleaned_data['LN_IC50']
encoded['AUC']=cleaned_data['AUC']
encoded['Z_SCORE']=cleaned_data['Z_SCORE']
print(encoded.columns)
print(len(encoded.columns))
print()
print(cleaned_data.columns)
print(len(cleaned_data.columns))
Index(['Gene Expression', 'Methylation', 'Drug Response', 'MSI_MSI-H', 'MSI_MSS/MSI-L', 'MSI_Unknown', 'Growth Properties_Adherent', 'Growth Properties_Semi-Adherent', 'Growth Properties_Suspension', 'Growth Properties_Unknown', 'TCGA_DESC', 'DRUG_NAME', 'GDSC Tissue descriptor 1', 'GDSC Tissue descriptor 2', 'CANCER_TYPE', 'TARGET', 'PATHWAY_NAME', 'DRUG_ID', 'COSMIC_ID', 'CELL_LINE_NAME', 'LN_IC50', 'AUC', 'Z_SCORE'], dtype='object') 23 Index(['COSMIC_ID', 'CELL_LINE_NAME', 'TCGA_DESC', 'DRUG_ID', 'DRUG_NAME', 'PATHWAY_NAME', 'MIN_CONC', 'MAX_CONC', 'LN_IC50', 'AUC', 'RMSE', 'Z_SCORE', 'Whole Exome Sequencing (WES)', 'Gene Expression', 'Methylation', 'Drug Response', 'GDSC Tissue descriptor 1', 'GDSC Tissue descriptor 2', 'CANCER_TYPE', 'MSI', 'Growth Properties', 'TARGET'], dtype='object') 22
In [375]:
# Correlation Analysis of encoded
plt.figure(figsize=(20, 16))
correlation_matrix = encoded.corr()
sns.heatmap(correlation_matrix, annot=True)
plt.title('Correlation Heatmap of Encoded Features')
plt.tight_layout()
plt.show()
In [373]:
# Features to select with correlation
features = ['Z_SCORE', 'AUC', 'PATHWAY_NAME', 'TARGET', 'DRUG_NAME', 'GDSC Tissue descriptor 1',
'GDSC Tissue descriptor 2', 'CANCER_TYPE', 'TCGA_DESC', 'Growth Properties_Adherent']
In [374]:
# Dataframe to csv
encoded.to_csv('modeling_data.csv', index=False)