Skip to content

Commit 84280ef

Browse files
committed
checked
1 parent e09f17b commit 84280ef

File tree

1 file changed

+24
-46
lines changed

1 file changed

+24
-46
lines changed

R/prepare_recode.rmd

Lines changed: 24 additions & 46 deletions
Original file line numberDiff line numberDiff line change
@@ -17,18 +17,22 @@ library(osfr) # to download method codes
1717
```{r}
1818
readRDS("processed_data/TRACEmerged.RDS")->merged.data
1919
20-
# data<-readRDS("processed_data/TRACErecoded.RDS") # contains only included, recoded, data
20+
nrow(merged.data)
21+
# data<-readRDS("processed_data/TRACErecoded.RDS") # contains only included, recoded, data
2122
#data <- read.csv("processed_data/TRACEmerged.csv", sep = ";", dec = c(",", ".")) # Data
2223
23-
osf_retrieve_file("a6dmj") %>% osf_download(path = "data", conflicts="overwrite") # search 3
24+
osf_retrieve_file("25et8") %>% osf_download(path = "data", conflicts="overwrite") # search 3
2425
method <- read_excel("data/TRACE_method_codes.xlsx", sheet = "codes")
2526
# method <- read.csv("TRACE_method_codes.csv", sep = ";", na.strings = c(" ", "-"), dec = c(",", ".")) # Method codes
2627
27-
method %>% select(!notes) %>% filter(is.na(.)) # check, should be no missing.
28+
# method %>% select(!notes) %>% filter_all(any_vars( is.na(.))) %>% View() ## 11/2/23 wel msisings voor delay vars?
29+
# check, should be no missing.
30+
2831
# Select relevant colums dataset
2932
method %>% select(task, measure, type, phase, valence, recode, recode.for.ext, cuectx) -> method
3033
# Create reference var as character
3134
merged.data1<-merged.data %>% mutate(reference = as.character(paste(author, year, sep=" "))) %>% select(-c(author, year)) # Merge year & author & dropvars.
35+
nrow(merged.data1)
3236
```
3337

3438

@@ -39,7 +43,7 @@ merged.data1 %>% filter(decision == 1) %>% select(-decision) %>% droplevels() ->
3943
```
4044

4145

42-
## Add method codes to data
46+
## Add method codes to data and confirm merge was correct
4347
NB the combination of task and measure indicates which method is used to measure behavior. Those values are combined into a new variable ..
4448
```{r}
4549
merged.inclusions %>% mutate(measureID = as.factor(paste(task, measure, sep="."))) -> merged.inclusions.A
@@ -60,7 +64,7 @@ left_join(merged.inclusions.A ,method1, by="measureID", suffix = c(".d", ".m"))-
6064

6165
# Recoding Subject variables
6266

63-
## Age: set age groups
67+
## recode Age: set age groups
6468

6569
subject:
6670
(0=humanmixed(Civiel&Military); 1=ActiveDutyMilitary; 2=Veteran; 12=ActiveDutyMilitary & Veteran; 3=Civilian; 4=Rat; 5=Mice)
@@ -123,35 +127,27 @@ merged.inclusions.B %>% mutate(
123127
)-> merged.inclusions.recoded
124128
```
125129

126-
127-
no missing values after recoding age in included papers
128-
```{r eval=FALSE, include=FALSE}
129-
merged.inclusions.recoded %>% select(subject, age.PTSD, age.PTSD2, age.PTSD.cat,
130-
age.HC, age.HC2, age.HC.cat) %>% filter(is.na(.))
131-
```
132-
133-
130+
Confirm correct recoding of 'old adult'
134131
```{r eval=FALSE, include=FALSE}
135-
merged.inclusions.recoded %>% filter(age.PTSD2 > 65)%>% View()
136-
merged.inclusions.recoded %>% filter(age.HC2 > 65) %>% View()
132+
merged.inclusions.recoded %>% filter(age.PTSD2 > 65) %>% View()
133+
merged.inclusions.recoded %>% filter(age.HC2 > 65) %>% View()
137134
```
138135

136+
Remove redundant 'age' variables
139137
```{r}
140138
merged.inclusions.recoded %>% select(!c(age.PTSD, age.PTSD2, age.HC, age.HC2))-> merged.inclusions.recoded2
141139
```
142140

143141

144-
## Day/Night rhytem
145-
142+
## recode Day/Night rhytem
146143
```{r}
147144
merged.inclusions.recoded2 %>% mutate(rhythm = ifelse(subject %in% c("0", "1", "2", "12", "3"),"active", rhythm)) -> merged.inclusions.recoded3
148145
merged.inclusions.recoded3$rhythm <- recode(merged.inclusions.recoded3$rhythm, 'dark' = 'active', 'light' = 'inactive')
149-
# for checking
150-
merged.inclusions.recoded3 %>% filter(is.na(rhythm)) # good
146+
merged.inclusions.recoded3 %>% filter(is.na(rhythm)) # to confirm no NA values
151147
```
152148

153149

154-
## Time since trauma
150+
## recode Time since trauma
155151
```{r}
156152
merged.inclusions.recoded3 %>%
157153
mutate(
@@ -224,43 +220,37 @@ time.pseudo = case_when(
224220
merged.inclusions.recoded5 %>% select(-c(time.year, time.month, time.day, time.year2, time.month2, time.day2, time.year3, time.month3, time.day3, time.year4, time.month4, time.day4, time.recoded)) -> merged.inclusions.recoded6
225221
```
226222

223+
227224
## Subject: new Human-Animal variable
228225
```{r}
229226
merged.inclusions.recoded6 %>% mutate(subject.cat = ifelse(subject %in% c("0", "1", "2", "12", "3"), "Human", "Animal")) ->merged.inclusions.recoded7
230227
```
231228

232-
## recode control type
229+
230+
## recode Control type
233231
```{r}
234232
merged.inclusions.recoded7$control.type = recode(merged.inclusions.recoded7$control.type, "Handled" = "UnExp")
235233
```
236234

237235

238-
239-
240-
## Check missing values
236+
## Confirm no missing values
241237
```{r}
242238
which(is.na(merged.inclusions.recoded7$subject.cat))
243239
```
244240

245-
246241
```{r}
247242
which(is.na(merged.inclusions.recoded7$PMID))
248243
```
249244

250-
251245
```{r}
252246
which(is.na(merged.inclusions.recoded7$comparison))
253247
```
254248

255249

256250
## recode measure, PTSD type and population
257251
```{r}
258-
259252
# df4$subject.cat
260-
261253
# df4.1 %>% select(subject.cat, measure.d, measure2, ptsd.type, ptsd.type2, population, population2) %>% View()
262-
263-
264254
merged.inclusions.recoded7 %>% mutate(
265255
measure2 = case_when(
266256
# measure
@@ -306,20 +296,16 @@ merged.inclusions.recoded7 %>% mutate(
306296
```
307297

308298

309-
310-
311-
## set variable types
299+
## Set variable types
312300
313-
all are current character
301+
NB all are current character
314302
```{r variable types}
315303
names(merged.inclusions.recoded7A)
316304
317305
string_names <- c("author", "year",
318306
"PMID",
319307
"shocks.num", "shocks.amp",
320-
321308
"idPTSD", "idHC",
322-
323309
"outcomePTSD", "outcomeHC",
324310
"ptsd.measure",
325311
"task", "measure"
@@ -330,10 +316,8 @@ factor_names <-c( #"decision",
330316
"sex.PTSD", "sex.HC",
331317
"ptsd.type", 'control.type', 'population',
332318
"rhythm",
333-
334319
"comparison",
335320
"res.sus.split", "age.PTSD.cat", "age.HC.cat",
336-
337321
# and recoded factors
338322
"ptsd.type2", "population2","task.d", "measure.d", "measure2", "type", "phase", "valence", "cuectx"
339323
)
@@ -343,13 +327,10 @@ numeric_names <- c("nPTSD", "nHC", "meanPTSD", "sdPTSD", "semPTSD", "meanHC", "s
343327
# For checking -> ok!
344328
# merged.data.recoded2 %>% mutate_at(.vars=numeric_names, as.numeric) %>% filter(decision == 1) %>% select(numeric_names) %>% is.na() %>% View()
345329
346-
347-
348330
merged.inclusions.recoded7A %>%
349331
mutate_at(.vars=numeric_names, as.numeric) %>%
350332
mutate_at(.vars=factor_names, factor) ->merged.inclusions.recoded8
351333
352-
353334
# for checking
354335
# cbind(merged.data.recoded3$nHC,merged.data.recoded4$nHC)
355336
# unique(merged.inclusions.recoded8$author) %>% data.frame() %>%head()
@@ -395,10 +376,7 @@ merged.inclusions.recoded9$idHC %>% unique()
395376
```
396377

397378

398-
399-
400-
401-
## new variables for phase & valence (no longer used)
379+
## new variables for phase & valence (no longer used) -> can be deleated later
402380
```{r eval=FALSE, include=FALSE}
403381
merged.inclusions.recoded9 %>% mutate(
404382
@@ -434,7 +412,7 @@ Valence_Grouped = factor(Valence_Grouped)
434412
435413
```
436414

437-
415+
## Save recoded dataset
438416
```{r save}
439417
saveRDS(merged.inclusions.recoded9, "processed_data/TRACErecoded.RDS")
440418
# write.csv2(merged.inclusions.recoded8, "processed_data/TRACErecoded.csv", fileEncoding = "UTF-8") # writes spec characters weird

0 commit comments

Comments
 (0)