Hi GM, thank you for the reply. While reading it and preparing the reprex, I noticed some errors in my code.
This is the data:
|
id |
c0011 |
c0019 |
c2059 |
c6000 |
c4444 |
c4419 |
c4459 |
c4460 |
date |
| 1 |
1 |
NA |
NA |
NA |
NA |
NA |
NA |
NA |
NA |
2020 |
| 2 |
1 |
NA |
NA |
NA |
NA |
NA |
NA |
NA |
NA |
2020 |
| 3 |
1 |
NA |
NA |
NA |
NA |
NA |
NA |
NA |
NA |
2020 |
| 4 |
1 |
NA |
NA |
NA |
NA |
NA |
NA |
NA |
NA |
2020 |
| 5 |
1 |
33989 |
NA |
NA |
NA |
NA |
NA |
NA |
NA |
2021 |
| 6 |
1 |
1653 |
NA |
NA |
NA |
NA |
NA |
NA |
NA |
2021 |
| 7 |
1 |
799 |
NA |
NA |
NA |
NA |
NA |
NA |
NA |
2021 |
| 8 |
1 |
22383 |
NA |
NA |
NA |
NA |
NA |
NA |
NA |
2021 |
| 9 |
2 |
4011 |
2139 |
1639 |
233 |
991470 |
746901 |
217421 |
27148 |
2020 |
| 10 |
2 |
17621 |
8520 |
8273 |
828 |
991470 |
746901 |
217421 |
27148 |
2020 |
| 11 |
2 |
77525 |
33805 |
40138 |
3582 |
991470 |
746901 |
217421 |
27148 |
2020 |
| 12 |
2 |
69884 |
25737 |
38496 |
5651 |
991470 |
746901 |
217421 |
27148 |
2020 |
| 13 |
2 |
NA |
NA |
NA |
NA |
906534 |
679373 |
202449 |
24712 |
2021 |
| 14 |
2 |
NA |
NA |
NA |
NA |
906534 |
679373 |
202449 |
24712 |
2021 |
| 15 |
2 |
NA |
NA |
NA |
NA |
906534 |
679373 |
202449 |
24712 |
2021 |
| 16 |
2 |
NA |
NA |
NA |
NA |
906534 |
679373 |
202449 |
24712 |
2021 |
| 17 |
3 |
42365 |
14853 |
23338 |
4174 |
1012683 |
339358 |
563151 |
110174 |
2020 |
| 18 |
3 |
22188 |
8707 |
12032 |
1449 |
1012683 |
339358 |
563151 |
110174 |
2020 |
| 19 |
3 |
54738 |
21094 |
29265 |
4379 |
1012683 |
339358 |
563151 |
110174 |
2020 |
| 20 |
3 |
44200 |
17345 |
23968 |
2887 |
1012683 |
339358 |
563151 |
110174 |
2020 |
| 21 |
3 |
7685 |
2520 |
4380 |
785 |
1012683 |
339358 |
563151 |
110174 |
2020 |
| 22 |
3 |
9612 |
3174 |
5358 |
1080 |
1012683 |
339358 |
563151 |
110174 |
2020 |
| 23 |
3 |
8669 |
2999 |
4868 |
802 |
1012683 |
339358 |
563151 |
110174 |
2020 |
| 24 |
3 |
NA |
NA |
NA |
NA |
375736 |
124121 |
209384 |
42231 |
2021 |
| 25 |
3 |
NA |
NA |
NA |
NA |
375736 |
124121 |
209384 |
42231 |
2021 |
| 26 |
3 |
NA |
NA |
NA |
NA |
375736 |
124121 |
209384 |
42231 |
2021 |
| 27 |
3 |
NA |
NA |
NA |
NA |
375736 |
124121 |
209384 |
42231 |
2021 |
| 28 |
3 |
NA |
NA |
NA |
NA |
375736 |
124121 |
209384 |
42231 |
2021 |
| 29 |
3 |
NA |
NA |
NA |
NA |
375736 |
124121 |
209384 |
42231 |
2021 |
| 30 |
3 |
11465 |
5127 |
5430 |
908 |
375736 |
124121 |
209384 |
42231 |
2021 |
and the code:
# Self-contained reprex: impute the missing client counts with missForest.
#
# The earlier version of this script failed for three reasons:
#   * `df <-` had no right-hand side, so R parsed the next statement as
#     `df <- names(df) <- c(...)`; `df` then resolved to the base function
#     stats::df, which produced the "names() applied to a non-vector" and
#     "object of type 'closure' is not subsettable" errors.
#   * missForest was never attached ("could not find function").
#   * `xtrue = df` passed the incomplete, differently-shaped data frame,
#     whereas `xtrue` is meant to be the complete data matrix.

library(missForest)

# The xlsx import is replaced by the posted table so the example runs
# without the file. Column names are the ones shown in the table header.
na8 <- rep(NA, 8)
df <- data.frame(
  id = rep(c(1, 2, 3), times = c(8, 8, 14)),
  c0011 = c(
    rep(NA, 4), 33989, 1653, 799, 22383,
    4011, 17621, 77525, 69884, rep(NA, 4),
    42365, 22188, 54738, 44200, 7685, 9612, 8669,
    rep(NA, 6), 11465
  ),
  c0019 = c(
    na8, 2139, 8520, 33805, 25737, rep(NA, 4),
    14853, 8707, 21094, 17345, 2520, 3174, 2999,
    rep(NA, 6), 5127
  ),
  c2059 = c(
    na8, 1639, 8273, 40138, 38496, rep(NA, 4),
    23338, 12032, 29265, 23968, 4380, 5358, 4868,
    rep(NA, 6), 5430
  ),
  c6000 = c(
    na8, 233, 828, 3582, 5651, rep(NA, 4),
    4174, 1449, 4379, 2887, 785, 1080, 802,
    rep(NA, 6), 908
  ),
  c4444 = c(na8, rep(c(991470, 906534, 1012683, 375736), times = c(4, 4, 7, 7))),
  c4419 = c(na8, rep(c(746901, 679373, 339358, 124121), times = c(4, 4, 7, 7))),
  c4459 = c(na8, rep(c(217421, 202449, 563151, 209384), times = c(4, 4, 7, 7))),
  c4460 = c(na8, rep(c(27148, 24712, 110174, 42231), times = c(4, 4, 7, 7))),
  date = rep(
    c(2020, 2021, 2020, 2021, 2020, 2021),
    times = c(4, 4, 4, 4, 7, 7)
  )
)

# relabel (the table header shows c2059/c6000; the script uses c0059/c0060)
names(df) <- c(
  "id", "c0011", "c0019", "c0059", "c0060",
  "c4444", "c4419", "c4459", "c4460", "date"
)

# convert id and date to factor and others to integer with lapply
df[c(1, 10)] <- lapply(df[c(1, 10)], as.factor)
df[2:9] <- lapply(df[2:9], as.integer)

# drop the first four rows (every count is NA there) and the factor vars
dfmis <- df[-(1:4), -c(1, 10)]

# check: report the class of each remaining column
vapply(dfmis, function(col) class(col)[1L], character(1))

# impute; `xtrue` is omitted because no complete reference data exists
imp <- missForest(dfmis)