-
Notifications
You must be signed in to change notification settings - Fork 2
/
GESimulatePredictD10K30C.R
87 lines (50 loc) · 1.58 KB
/
GESimulatePredictD10K30C.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
### This simulation Checks if the model can predict well with 10 Dimensions
### Also CHECK THE TIME REQUIRED FOR THE MODEL
source('importDP.R')
### Remove The Past
rm(list = ls())
#################################### SIMULATED DATA PROPERTIES ####################################################
## Number of points
N.test = 100
N.train =100
N = N.test
## Number of Clusters
F = 3
## Distribution of the points within three clusters
p.dist = c(0.4,0.3,0.3)
## Total Number of features D
D = 10
## Total Percentage of irrelevant feature
prob.noise.feature = 0.6
## Total Percentage of censoring
prob.censoring = 0.10
## Overlap between Cluster of molecular Data of the relevant features
prob.overlap = 0.01
## Percentage of Noise/Overlap in Time Data
prob.noise = 0.1
############################# PARAMETERS for GIBB's SAMPLING ####
iter = 100
iter.burnin = 60
iter.thin =5
k =3
########################### Initialize the functions ############
source('simulateDPMM.R')
simulateDPMM()
source('initializeDPMM.R')
initializeDPMM()
######### Ground Truth ##############################
source('SIMgroundtruth.R')
SIMgroundtruth()
########### Train the Model #########################################
source('burninDPMM.R')
burninDPMM()
source('gibbsDPMM.R')
gibbsDPMM()
########## Analyze the fit ##########################################
source('SIManalyzeDPMM.R')
SIManalyzeDPMM()
######## Predict on New Data Set #####################################
source('predictCLASS.R')
predictCLASS(Y.new, time.new)
source('predictchineseAFTtime.R')
predictchineseAFTtime(Y.new)