change specific word color in wordcloud

前端 未结 1 1975
感情败类
感情败类 2021-02-05 10:23

I would like to build a word cloud with R (I have done so with the package wordcloud) and then color specific words a certain color. Currently the behavior of

相关标签:
1条回答
  • 2021-02-05 11:15

    EDIT: As described in the comments, the feature described below has now been added to the wordcloud library.


    My approach was to take the R function's code and customize it. It required changing only a few lines, and can now take either a single color or a vector of colors of the same length as words.

    library(wordcloud)
    
    colored.wordcloud <- function(words,freq,scale=c(4,.5),min.freq=3,max.words=Inf,random.order=TRUE,random.color=FALSE,
            rot.per=.1,colors="black",ordered.colors=FALSE,use.r.layout=FALSE,...) { 
        tails <- "g|j|p|q|y"
        last <- 1
        nc<- length(colors)
    
        if (ordered.colors) {
            if (length(colors) != 1 && length(colors) != length(words)) {
                stop(paste("Length of colors does not match length of words",
                           "vector"))
            }
        }
    
        overlap <- function(x1, y1, sw1, sh1) {
            if(!use.r.layout)
                return(.overlap(x1,y1,sw1,sh1,boxes))
            s <- 0
            if (length(boxes) == 0) 
                return(FALSE)
            for (i in c(last,1:length(boxes))) {
                bnds <- boxes[[i]]
                x2 <- bnds[1]
                y2 <- bnds[2]
                sw2 <- bnds[3]
                sh2 <- bnds[4]
                if (x1 < x2) 
                    overlap <- x1 + sw1 > x2-s
                else 
                    overlap <- x2 + sw2 > x1-s
    
                if (y1 < y2) 
                    overlap <- overlap && (y1 + sh1 > y2-s)
                else 
                    overlap <- overlap && (y2 + sh2 > y1-s)
                if(overlap){
                    last <<- i
                    return(TRUE)
                }
            }
            FALSE
        }
    
        ord <- rank(-freq, ties.method = "random")
        words <- words[ord<=max.words]
        freq <- freq[ord<=max.words]
        if (ordered.colors) {
            colors <- colors[ord<=max.words]
        }
    
        if(random.order)
            ord <- sample.int(length(words))
        else
            ord <- order(freq,decreasing=TRUE)
        words <- words[ord]
        freq <- freq[ord]
        words <- words[freq>=min.freq]
        freq <- freq[freq>=min.freq]
        if (ordered.colors) {
            colors <- colors[ord][freq>=min.freq]
        }
    
        thetaStep <- .1
        rStep <- .05
        plot.new()
        op <- par("mar")
        par(mar=c(0,0,0,0))
        plot.window(c(0,1),c(0,1),asp=1)
        normedFreq <- freq/max(freq)
        size <- (scale[1]-scale[2])*normedFreq + scale[2]
        boxes <- list()
    
    
    
        for(i in 1:length(words)){
            rotWord <- runif(1)<rot.per
            r <-0
            theta <- runif(1,0,2*pi)
            x1<-.5
            y1<-.5
            wid <- strwidth(words[i],cex=size[i],...)
            ht <- strheight(words[i],cex=size[i],...)
            #mind your ps and qs
            if(grepl(tails,words[i]))
                ht <- ht + ht*.2
            if(rotWord){
                tmp <- ht
                ht <- wid
                wid <- tmp  
            }
            isOverlaped <- TRUE
            while(isOverlaped){
                if(!overlap(x1-.5*wid,y1-.5*ht,wid,ht) &&
                        x1-.5*wid>0 && y1-.5*ht>0 &&
                        x1+.5*wid<1 && y1+.5*ht<1){
            if (!random.color) {
                    if (ordered.colors) {
                        cc <- colors[i]
                    }
                    else {
                        cc <- ceiling(nc*normedFreq[i])
                        cc <- colors[cc]
                    }
            } else {
             cc <- colors[sample(1:nc,1)]
            }
                    text(x1,y1,words[i],cex=size[i],offset=0,srt=rotWord*90,
                            col=cc,...)
                    #rect(x1-.5*wid,y1-.5*ht,x1+.5*wid,y1+.5*ht)
                    boxes[[length(boxes)+1]] <- c(x1-.5*wid,y1-.5*ht,wid,ht)
                    isOverlaped <- FALSE
                }else{
                    if(r>sqrt(.5)){
                        warning(paste(words[i],
                                        "could not be fit on page. It will not be plotted."))
                        isOverlaped <- FALSE
                    }
                    theta <- theta+thetaStep
                    r <- r + rStep*thetaStep/(2*pi)
                    x1 <- .5+r*cos(theta)
                    y1 <- .5+r*sin(theta)
                }
            }
        }
        par(mar=op)
        invisible()
    }
    

    Some code to try it out:

    colors = c("blue", "red", "orange", "green")
    colored.wordcloud(colors, c(10, 5, 3, 9), colors=colors)
    
    0 讨论(0)
提交回复
热议问题