-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathexplore_dataset.R
23 lines (18 loc) · 940 Bytes
/
explore_dataset.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
# Explore the Ki database and extract the 5-HT2A receptor-ligand records.
#
# Steps:
#   1. Read Data/KiDatabase.csv.
#   2. Print the ten most frequent values of the Name column.
#   3. Keep the rows whose Name is "5-HT2A" and whose SMILES is non-empty,
#      restricted to a fixed set of columns.
#   4. Write the unique SMILES strings to Focal_SMILES.csv and the filtered
#      table to HT2A_kiDB.csv (both in the working directory set below).

# NOTE(review): this is a relative path, so it only resolves when the script
# is started from the directory that contains Desktop/ (presumably the user's
# home directory -- confirm). Kept as-is because the input and output
# locations below depend on it.
setwd("Desktop/Molecular_autoencoder/")

kiDB.raw <- read.csv("Data/KiDatabase.csv")

# Top 10 receptors by count.
# head() is used instead of [1:10] so that a database with fewer than ten
# distinct names does not get padded with NA entries.
head(sort(table(kiDB.raw$Name), decreasing = TRUE), 10)

# Subset to 5-HT2A - ligand pairings.
# which() drops NA comparison results; indexing a data frame with a logical
# vector that contains NA would otherwise insert rows made up entirely of NA.
HT2A.subset <- kiDB.raw[which(kiDB.raw$Name == "5-HT2A"), ]

# Discard records without a SMILES string and keep only the columns of
# interest (again NA-safe via which()).
HT2A.subset <- HT2A.subset[
  which(HT2A.subset$SMILES != ""),
  c(
    "Ligand.ID",
    "Ligand.Name",
    "SMILES",
    "Hotligand",
    "species",
    "source",
    "ki.Note",
    "ki.Val"
  )
]

# Quick visual check of the filtered table.
head(HT2A.subset)

# Distinct SMILES strings among the 5-HT2A records.
SMILES <- unique(HT2A.subset[, "SMILES"])

# write.csv() defaults are kept on purpose (row names are written as the
# first column) so the layout of the output files stays unchanged.
write.csv(SMILES, file = "Focal_SMILES.csv")
write.csv(HT2A.subset, file = "HT2A_kiDB.csv")