====== Clustering with relational constraint based on a dictionary ====== March 10, 2018 **!!! ward method (not implemented yet) - to be replaced by average**


# Clustering with relational constraint based on a dictionary

key <- function(i,j) 
  if(i0)&&(i!=j)) { dij <- get(key(i,j),envir=hD)
        if(dij < dd[[a]]) {dd[[a]] <- dij; ind[[a]] <- j}}}
    pq <- which.min(dd)
    if((length(pq)==0)|is.null(pq)) break
    dpq <- dd[[pq]]
  # join the closest pair of clusters
    p<-active[pq]; q <- ind[pq]; 
    if(is.infinite(q)){
      cat("several components\n")
      dpq <- h[k-1]*1.1; p <- active[1]
      for(q in active[2:length(active)]){
        if(node[p]==0) m[k,1] <- -p else m[k,1] <- node[p]
        if(node[q]==0) m[k,2] <- -q else m[k,2] <- node[q]
        w[p] <- w[q]+w[p]; node[[k]] <- k; h[k] <- dpq
        p <- k; k <- k+1 
      }
      break
    }
    h[k] <- dpq 
    if(node[p]==0) m[k,1] <- -p else m[k,1] <- node[p]
    if(node[q]==0) m[k,2] <- -q else m[k,2] <- node[q]
    active <- setdiff(active,q)
    Rop <- setdiff(Ro[[p]],q); Rip <- setdiff(Ri[[p]],q) 
    Roq <- setdiff(Ro[[q]],p); Riq <- setdiff(Ri[[q]],p)
    Sq <- setdiff(union(Roq,Riq),0)
    S <- setdiff(union(union(Rop,Rip),Sq),0)
    for(s in Riq) if(s>0) Ro[[s]] <- setdiff(Ro[[s]],q)
    r <- p; Ror <- 0; Rir <- Rip
    if(tol) Ror <- Rop else
      for(s in Rop) if(s>0) Ri[[s]] <- setdiff(Ri[[s]],p) 
    Ror <- union(Ror,Roq)
    for(s in Roq) if(s>0) Ri[[s]] <- setdiff(union(Ri[[s]],r),q)
    if(nos){
      Rir <- union(Rir,Riq)
      for(s in Riq) if(s>0) Ro[[s]] <- union(Ro[[s]],r)
    }
    Ro[[r]] <- Ror; Ri[[r]] <- Rir; Ro[[q]] <- 0; Ri[[q]] <- 0
  # determine dissimilarities to the new cluster
    for(s in S){
      if(method=="max") assign(key(p,s),max(
         get0(key(p,s),envir=hD,inherits=FALSE,ifnotfound=0),
         get0(key(q,s),envir=hD,inherits=FALSE,ifnotfound=0)),envir=hD) else
      if(method=="min") assign(key(p,s),min(
         get0(key(p,s),envir=hD,inherits=FALSE,ifnotfound=Inf),
         get0(key(q,s),envir=hD,inherits=FALSE,ifnotfound=Inf)),envir=hD) else
      if(method=="ward") { ww <- w[p]+w[q]+w[s]
        D[idx(p,s)] <- ((w[q]+w[s])*D[idx(q,s)] + (w[p]+w[s])*D[idx(p,s)] - w[s]*dpq)/ww
      } else {cat('unknown method','\n'); return(NULL)}
    }
    for(s in union(Sq,p)) {ky <- key(q,s) 
      if(exists(ky,envir=hD,inherits=FALSE)) remove(list=ky,envir=hD,inherits=FALSE)}
    w[p] <- w[q]+w[p]; node[[p]] <- k
  }
  hc <- list(merge=m,height=h,order=orDendro(numLm),labels=attr(hD,"Labels"),
    method="cluRelH",call=NULL,dist.method=method,leaders=NULL)
  class(hc) <- "hclust"
  print(paste("Finished:",Sys.time()))
  return(hc)
}


> source("C:\\Users\\batagelj\\work\\R\\RelCon\\relConH.R")
> # Create initial weights - dissimilarities
> # n is number of nodes
> Ri <- sRi; Ro <- sRo; D <- sD
> n <- nrow(D); np <- n+1; hD <- new.env()
> for(i in 1:length(R)) for(j in R[[i]])  assign(key(i,j),D[i,j],envir=hD)
> attr(hD,"Size") <- n; attr(hD,"Labels") <- names(R)
> res <- relConH(strategy="tolerant")
Clustering with relational constraint based on a dictionary
by Vladimir Batagelj, March 2018
Method: max   Strategy: tolerant 
[1] "Started: 2018-03-12 04:20:40"
[1] "Finished: 2018-03-12 04:20:40"
> plot(res,hang=-1,main="Some types ... example",sub="dict: tolerant / maximum")

{{pro:pics:sttolmaxh.png}} ====== ====== \\ [[pro:relc|Back to Relational constraints]]