-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathcoding_program_basis.R
27 lines (26 loc) · 1 KB
/
coding_program_basis.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
library(data.table)
library(dplyr)
library(stringr)
# Load the pre-computed n-gram tables and combine orders 2-5 into a single
# lookup table keyed on W_n_1.
# NOTE(review): load() restores objects under the names they were saved with;
# this script presumes each file provides S_aggreg_<n>_grams.dt - confirm.
load(file = "S_aggreg_1_grams.RData")
load(file = "S_aggreg_2_grams.RData")
load(file = "S_aggreg_3_grams.RData")
load(file = "S_aggreg_4_grams.RData")

# Stack orders 4, 3 and 2, then drop the per-order tables.
# The 1-gram table stays separate; it is used on its own further down.
S_aggreg_grams.dt <- rbind(
  S_aggreg_4_grams.dt,
  S_aggreg_3_grams.dt,
  S_aggreg_2_grams.dt
)
rm(S_aggreg_4_grams.dt, S_aggreg_3_grams.dt, S_aggreg_2_grams.dt)

# Report the size of the combined table in GiB. Dividing an object_size value
# by hand keeps its class, so the result would be printed labelled "bytes";
# format() applies the same 1024^3 divisor and prints the matching unit.
format(object.size(S_aggreg_grams.dt), units = "GB", digits = 2L)

# The 5-gram table is loaded only after the lower-order tables were removed
# (presumably to limit peak memory - confirm), then appended and dropped.
load(file = "S_aggreg_5_grams.RData")
S_aggreg_grams.dt <- rbind(S_aggreg_grams.dt, S_aggreg_5_grams.dt)
rm(S_aggreg_5_grams.dt)

# Key on W_n_1 so the table can be joined on that column.
setkey(S_aggreg_grams.dt, W_n_1)
# Build the lookup keys for a phrase: its last 4, 3, 2 and 1 words, longest
# first. Each step is wrapped in () so its value is printed as the script runs.

# Lower-case `text` and split it into words.
# Trimming and splitting on runs of whitespace keeps leading, trailing or
# repeated spaces from producing empty "" tokens (and thus malformed keys).
# Returns a character vector; character(0) for empty or blank input.
split_words <- function(text) {
  unlist(strsplit(trimws(tolower(text)), "\\s+"))
}

# Input phrase.
(aa <- "I'll dust them off and be on my")
(bb <- split_words(aa))
# Start positions of the last 4..1 words. `:` binds tighter than `-`, so this
# is length(bb) - c(3, 2, 1, 0).
(cc <- as.list(length(bb) - 3:0))
# Drop start positions before the first word (phrases shorter than 4 words).
(dd <- Filter(function(x) x > 0, cc))
# Index range from each start position through the last word.
(ee <- lapply(dd, seq, length(bb)))
# The words in each range ...
(ff <- lapply(ee, function(x) bb[x]))
# ... joined by single spaces into one key string per range.
(gg <- lapply(ff, paste, collapse = " "))
# Look up every context key in the keyed n-gram table, pool the hits with the
# 1-gram table, and keep the five rows with the highest S.

# One keyed join per context key, keeping columns 2:3 of the n-gram table.
# NOTE(review): columns 2:3 are presumably the candidate word and its score S -
# confirm against the table layout.
# Iterating over gg itself (rather than 1:length(gg)) is safe when gg is empty.
(hh <- lapply(gg, function(ngram_key) {
  S_aggreg_grams.dt[list(ngram_key), 2:3]
}))
(ii <- do.call("rbind", hh))
# Append the 1-gram table so there are candidates even with no n-gram hit.
(jj <- rbind(ii, S_aggreg_1_grams.dt))
# Drop rows without a score (keys with no match come back with NA in S).
(kk <- na.omit(jj, cols = "S"))
# NOTE(review): the same candidate can appear once per n-gram order, so the
# top rows may contain duplicates - confirm whether they should be collapsed.
# head() returns fewer rows when fewer than five exist; [1:5] would pad the
# result with all-NA rows.
(ll <- head(kk[order(-S)], 5))