-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathpreprocessing.r
105 lines (78 loc) · 2.37 KB
/
preprocessing.r
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
#Preprocessing supplement, good for data discovery:
#rm(list=ls(all=TRUE))
library(knitr)
library(data.table)
library(dplyr)
library(rmarkdown)
library(xts)
library(plyr)
library(dplyr)
library(pander)
library(descr)
library(ztable)
library(knitr)
library(readxl)
library(ggplot2)
library(lubridate)
library(zoo)
#library(likert)
library(reshape2)
library(RColorBrewer)
library(reshape2)
#library(scales)
library(grid)
library(gtable)
library(gridExtra)
library(haven)
library(cba)
library(blockcluster)
library(sampling)
library(splitstackshape)
library(imputeTS)
library(tidyr)
library(cluster)
library(fpc)
library(factoextra)
library(readr)
# Load the tab-delimited avatar export into Avatars_Version_01.
# NOTE(review): the path is an absolute Windows path under one user's profile;
# it must be adjusted before the script can run on another machine.
Avatars_Version_01 <- read_delim(
  "C:/Users/Boura/Box Sync/CBMI-ADAM/CBMI Data Request/Tetrad/06 28 Avatars_Version 01.txt",
  delim = "\t",
  escape_double = FALSE,
  trim_ws = TRUE
)
# View() opens a data viewer window, so only call it when a user is present;
# batch runs (e.g. Rscript) skip it instead of failing or blocking.
if (interactive()) {
  View(Avatars_Version_01)
}
# Create a continuous variable out of the discrete data: HEIGHT
# Each row receives its own uniform random draw from the numeric range named
# by its HEIGHT label; the result is stored in the new column HEIGHT_CT.
set.seed(1234) # fixed seed so the simulated values are reproducible
Avatars_Version_01$HEIGHT_CT <- 0
# seq_len() yields an empty sequence for a zero-row table (1:0 would not).
for (i in seq_len(nrow(Avatars_Version_01))) {
  # Assign to row i only: assigning to the whole column here would overwrite
  # every row with the most recent draw, leaving one value repeated throughout.
  if (Avatars_Version_01$HEIGHT[i] == "176-185") {
    Avatars_Version_01$HEIGHT_CT[i] <- runif(1, min = 176, max = 185)
  } else if (Avatars_Version_01$HEIGHT[i] == "161-168") {
    Avatars_Version_01$HEIGHT_CT[i] <- runif(1, min = 161, max = 168)
  } else if (Avatars_Version_01$HEIGHT[i] == "150-160") {
    Avatars_Version_01$HEIGHT_CT[i] <- runif(1, min = 150, max = 160)
  } else {
    # Catch-all: any label not listed above is drawn from 169-176.
    # NOTE(review): this range touches the 176-185 bin at 176 - confirm the
    # intended upper bound for the remaining category.
    Avatars_Version_01$HEIGHT_CT[i] <- runif(1, min = 169, max = 176)
  }
}
# Create a continuous variable out of the discrete data: WEIGHT
# Each row receives its own uniform random draw from the numeric range named
# by its WEIGHT label; the result is stored in the new column WEIGHT_CT.
Avatars_Version_01$WEIGHT_CT <- 0
# seq_len() yields an empty sequence for a zero-row table (1:0 would not).
for (i in seq_len(nrow(Avatars_Version_01))) {
  # Assign to row i only: assigning to the whole column here would overwrite
  # every row with the most recent draw, leaving one value repeated throughout.
  if (Avatars_Version_01$WEIGHT[i] == "55-64") {
    Avatars_Version_01$WEIGHT_CT[i] <- runif(1, min = 55, max = 64)
  } else if (Avatars_Version_01$WEIGHT[i] == "65-160") {
    Avatars_Version_01$WEIGHT_CT[i] <- runif(1, min = 65, max = 160)
  } else {
    # Catch-all: any label not listed above is drawn from 40-54.
    Avatars_Version_01$WEIGHT_CT[i] <- runif(1, min = 40, max = 54)
  }
}
# Create a continuous variable out of the discrete data: AGE
# Each row receives its own uniform random draw from the numeric range named
# by its AGE label; the result is stored in the new column AGE_CT.
Avatars_Version_01$AGE_CT <- 0
# seq_len() yields an empty sequence for a zero-row table, whereas 1:nrow()
# would iterate over c(1, 0) and fail inside the if() condition.
for (i in seq_len(nrow(Avatars_Version_01))) {
  if (Avatars_Version_01$AGE[i] == "18-24") {
    Avatars_Version_01$AGE_CT[i] <- runif(1, min = 18, max = 24)
  } else if (Avatars_Version_01$AGE[i] == "25-44") {
    Avatars_Version_01$AGE_CT[i] <- runif(1, min = 25, max = 44)
  } else if (Avatars_Version_01$AGE[i] == "45-64") {
    Avatars_Version_01$AGE_CT[i] <- runif(1, min = 45, max = 64)
  } else {
    # Catch-all: any label not listed above is drawn from 65-95.
    Avatars_Version_01$AGE_CT[i] <- runif(1, min = 65, max = 95)
  }
}