# Build a word -> line-number index for a text.
#
# Args:
#   lines: character vector, one element per line of text.
#
# Returns:
#   A named list with one element per distinct token, ordered by token name.
#   Each element is the ascending vector of line numbers (indices into
#   `lines`) on which that token occurs as a whole token. Tokens are the
#   pieces left after splitting each line on runs of non-word characters
#   (the regex "\\W+"); matching is case-sensitive.
index_words_by_line <- function(lines) {
  # Tokenise every line exactly once instead of re-scanning the whole text
  # for each distinct word.
  tokens <- strsplit(lines, "\\W+")
  words <- unlist(tokens)

  # Line number for every token, aligned with `words`.
  line_no <- rep(seq_along(lines), lengths(tokens))

  # strsplit() yields a leading "" when a line starts with a non-word
  # character; an empty token is not a word, so drop it.
  keep <- nzchar(words)

  # Group line numbers by token. A token repeated on one line contributes
  # that line several times, hence unique(). lapply() (not sapply()) keeps
  # the result a list even when all hit vectors have the same length.
  lapply(split(line_no[keep], words[keep]), unique)
}

# Source text to index, fetched over the network (one element per line).
f <- 'http://www.gnu.org/licenses/gpl.txt'
l <- readLines(f)

# Top-level expression: the resulting index is auto-printed when run as a script.
index_words_by_line(l)