## -----------------------------------------------------------------------------
set.seed(1)

## ----echo=TRUE, eval=TRUE, message=FALSE, warning=FALSE-----------------------
library(ordinalClust)

## -----------------------------------------------------------------------------
m=7
nr=10000
mu=5
pi=0.5

probaBOS=rep(0,m)
for (im in 1:m) probaBOS[im]=pejSim(im,m,mu,pi)
M <- sample(1:m,nr,prob = probaBOS, replace=TRUE)

## ----fig.width = 5, warning=FALSE, eval=TRUE, message=FALSE, tidy=TRUE, dev='png', echo=FALSE, fig.show='hold', fig.align='center'----
library(ggplot2)
library(ordinalClust)
m=7
nr=10000

probaBOS=rep(0,m)
for (im in 1:m) probaBOS[im]=pejSim(im,m,5,0.5)
M <- sample(1:m,nr,prob = probaBOS, replace=TRUE)
M <- as.data.frame(M)
cbPalette <- c("#560303", "#a30606", "#ceac18", "#e0e00d", "#f7f313", "#9bf713", "#0de037")
plot1 <- ggplot(data = M, aes(x = M,fill=factor(M))) +
  geom_histogram() +
  ylim(0, nr) +
  ggtitle("ordinal data with m=7 \n mu=5 and pi=0.5") +
  theme(plot.title = element_text(vjust = -20,hjust = 0.5,size = 16)) +
  scale_x_continuous(breaks=1:7, labels=c(1:7), limits=c(0,8)) +
  scale_fill_manual(values=cbPalette)

plot1

## ----echo=TRUE, eval=FALSE, message=FALSE, warning=FALSE----------------------
# set.seed(0)
# 
# library(ordinalClust)
# data("dataqol")
# 
# # loading the ordinal data
# M <- as.matrix(dataqol[,2:29])
# 
# m = 4
# 
# krow = 3
# 
# nbSEM=100
# nbSEMburn=90
# nbindmini=2
# init = "randomBurnin"
# percentRandomB = c(30)
# 
# object <- bosclust(x=M,kr=krow, m=m, nbSEM=nbSEM,
#     nbSEMburn=nbSEMburn, nbindmini=nbindmini,
#     percentRandomB=percentRandomB, init=init)
# 

## ----echo=TRUE, eval=FALSE, message=FALSE, warning=FALSE----------------------
# 
# plot(object)
# 

## ----echo=FALSE, out.width = "75%", out.extra='style="display: block;margin: auto;"', fig.cap=""----
library(knitr)    # For knitting document and include_graphics function

include_graphics("figures/clust.png")

## ----echo=TRUE, eval=FALSE, message=FALSE, warning=FALSE----------------------
# 
# set.seed(0)
# 
# library(ordinalClust)
# 
# # loading the real dataset
# data("dataqol")
# 
# # loading the ordinal data
# M <- as.matrix(dataqol[,2:29])
# 
# 
# # defining different number of categories:
# m=4
# 
# 
# # defining number of row and column clusters
# krow = 3
# kcol = 3
# 
# # configuration for the inference
# nbSEM=100
# nbSEMburn=90
# nbindmini=2
# init = "randomBurnin"
# percentRandomB = c(30, 30)
# 
# # Co-clustering execution
# object <- boscoclust(x = M,kr = krow, kc = kcol, m = m,
#                     nbSEM = nbSEM, nbSEMburn = nbSEMburn,
#                     nbindmini = nbindmini, init = init,
#                     percentRandomB = percentRandomB)
# 
# 
# 

## ----echo=TRUE, eval=FALSE, message=FALSE, warning=FALSE----------------------
# 
# plot(object)
# 

## ----echo=FALSE, out.width = "75%", out.extra='style="display: block;margin: auto;"', fig.cap=""----
library(knitr)    # For knitting document and include_graphics function

include_graphics("figures/coclust.png")

## ----echo=TRUE, message=FALSE, warning=FALSE----------------------------------
set.seed(1)

library(ordinalClust)
# loading the real dataset
data("dataqol.classif")


# loading the ordinal data
M <- as.matrix(dataqol.classif[,2:29])


# creating the classes values
y <- as.vector(dataqol.classif$death)


# sampling datasets for training and to predict
nb.sample <- ceiling(nrow(M)*7/10)
sample.train <- sample(1:nrow(M), nb.sample, replace=FALSE)

M.train <- M[sample.train,]
M.validation <- M[-sample.train,]
nb.missing.validation <- length(which(M.validation==0))


y.train <- y[sample.train]
y.validation <- y[-sample.train]

# number of classes to predict
kr <- 2

# configuration for SEM algorithm
nbSEM=200
nbSEMburn=175
nbindmini=2
init="randomBurnin"
percentRandomB = c(50, 50)


# different kc to test with cross-validation
kcol <- c(0,1,2,3)
m <- 4


# matrix that contains the predictions for all different kc
preds <- matrix(0,nrow=length(kcol),ncol=nrow(M.validation))

for(kc in 1:length(kcol)){
  res <- bosclassif(x=M.train, y=y.train, 
                    kr=kr, kc=kcol[kc], m=m, 
                    nbSEM=nbSEM, nbSEMburn=nbSEMburn, 
                    nbindmini=nbindmini, init=init, percentRandomB=percentRandomB)

  new.prediction <- predict(res, M.validation)
  preds[kc,] <- new.prediction@zr_topredict
  
}

preds = as.data.frame(preds)
row.names <- c()
for(kc in kcol){
  name= paste0("kc=",kc)
  row.names <- c(row.names,name)
}
rownames(preds)=row.names


## ----echo=TRUE, message=FALSE, warning=FALSE----------------------------------

library(caret)

actual <- y.validation -1

specificities <- rep(0,length(kcol))
sensitivities <- rep(0,length(kcol))

for(i in 1:length(kcol)){
  prediction <- unlist(as.vector(preds[i,])) -1
  u <- union(prediction, actual)
  conf_matrix<-table(factor(prediction, u),factor(actual, u))
  sensitivities[i] <- recall(conf_matrix)
  specificities[i] <- specificity(conf_matrix)
}

sensitivities
specificities


## ----echo=TRUE, eval=FALSE, message=FALSE, warning=FALSE----------------------
# set.seed(0)
# 
# library(ordinalClust)
# 
# # loading the real dataset
# data("dataqol")
# 
# # loading the ordinal data
# M <- as.matrix(dataqol[,2:31])
# 
# 
# # defining different number of categories:
# m=c(4,7)
# 
# 
# # defining number of row and column clusters
# krow = 3
# kcol = c(3,1)
# 
# # configuration for the inference
# nbSEM=50
# nbSEMburn=40
# nbindmini=2
# init='random'
# 
# d.list <- c(1,29)
# 
# # Co-clustering execution
# object <- boscoclust(x=M,kr=krow,kc=kcol,m=m, idx_list=d.list,
#                     nbSEM=nbSEM,nbSEMburn=nbSEMburn,
#                      nbindmini=nbindmini, init=init)
# 

