Newer
Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
# Take *_var parameters apart
take_var_params <- function(dim_params) {
# Take *_var parameters apart
var_params_ind <- grep('_var$', names(dim_params))
var_params <- dim_params[var_params_ind]
# Check all *_var are NULL or vectors of character strings, and
# that they all have a matching dimension param.
i <- 1
for (var_param in var_params) {
if (!is.character(var_param)) {
stop("All '*_var' parameters must be character strings.")
} else if (!any(grepl(paste0('^', strsplit(names(var_params)[i],
'_var$')[[1]][1], '$'),
names(dim_params)))) {
stop(paste0("All '*_var' parameters must be associated to a dimension parameter. Found parameter '",
names(var_params)[i], "' but no parameter '",
strsplit(names(var_params)[i], '_var$')[[1]][1], "'."))
}
i <- i + 1
}
# Make the keys of 'var_params' to be the name of
# the corresponding dimension.
if (length(var_params) < 1) {
var_params <- NULL
} else {
names(var_params) <- gsub('_var$', '', names(var_params))
}
return(var_params)
}
# Take *_reorder parameters apart
take_var_reorder <- function(dim_params) {
# Take *_reorder parameters apart
dim_reorder_params_ind <- grep('_reorder$', names(dim_params))
dim_reorder_params <- dim_params[dim_reorder_params_ind]
# Make the keys of 'dim_reorder_params' to be the name of
# the corresponding dimension.
if (length(dim_reorder_params) < 1) {
dim_reorder_params <- NULL
} else {
names(dim_reorder_params) <- gsub('_reorder$', '', names(dim_reorder_params))
}
return(dim_reorder_params)
}
# Take *_depends parameters apart
take_var_depends <- function(dim_params) {
depends_params_ind <- grep('_depends$', names(dim_params))
depends_params <- dim_params[depends_params_ind]
# Check all *_depends are NULL or vectors of character strings, and
# that they all have a matching dimension param.
i <- 1
for (depends_param in depends_params) {
if (!is.character(depends_param) || (length(depends_param) > 1)) {
stop("All '*_depends' parameters must be single character strings.")
} else if (!any(grepl(paste0('^', strsplit(names(depends_params)[i],
'_depends$')[[1]][1], '$'),
names(dim_params)))) {
stop(paste0("All '*_depends' parameters must be associated to a dimension parameter. Found parameter '",
names(depends_params)[i], "' but no parameter '",
strsplit(names(depends_params)[i], '_depends$')[[1]][1], "'."))
}
i <- i + 1
}
# Make the keys of 'depends_params' to be the name of
# the corresponding dimension.
if (length(depends_params) < 1) {
depends_params <- NULL
} else {
names(depends_params) <- gsub('_depends$', '', names(depends_params))
}
return(depends_params)
}
# Take *_across parameters apart
take_var_across <- function(dim_params) {
across_params_ind <- grep('_across$', names(dim_params))
across_params <- dim_params[across_params_ind]
# Check all *_across are NULL or vectors of character strings, and
# that they all have a matching dimension param.
i <- 1
for (across_param in across_params) {
if (!is.character(across_param) || (length(across_param) > 1)) {
stop("All '*_across' parameters must be single character strings.")
} else if (!any(grepl(paste0('^', strsplit(names(across_params)[i],
'_across$')[[1]][1], '$'),
names(dim_params)))) {
stop(paste0("All '*_across' parameters must be associated to a dimension parameter. Found parameter '",
names(across_params)[i], "' but no parameter '",
strsplit(names(across_params)[i], '_across$')[[1]][1], "'."))
}
i <- i + 1
}
# Make the keys of 'across_params' to be the name of
# the corresponding dimension.
if (length(across_params) < 1) {
across_params <- NULL
} else {
names(across_params) <- gsub('_across$', '', names(across_params))
}
return(across_params)
}
# Leave alone the dimension parameters in the variable dim_params
rebuild_dim_params <- function(dim_params, merge_across_dims,
inner_dims_across_files) {
var_params_ind <- grep('_var$', names(dim_params))
dim_reorder_params_ind <- grep('_reorder$', names(dim_params))
tolerance_params_ind <- grep('_tolerance$', names(dim_params))
depends_params_ind <- grep('_depends$', names(dim_params))
across_params_ind <- grep('_across$', names(dim_params))
# Leave alone the dimension parameters in the variable dim_params
if (length(c(var_params_ind, dim_reorder_params_ind, tolerance_params_ind,
depends_params_ind, across_params_ind)) > 0) {
dim_params <- dim_params[-c(var_params_ind, dim_reorder_params_ind,
tolerance_params_ind, depends_params_ind,
across_params_ind)]
# Reallocating pairs of across file and inner dimensions if they have
# to be merged. They are put one next to the other to ease merge later.
if (merge_across_dims) {
for (inner_dim_across in names(inner_dims_across_files)) {
inner_dim_pos <- which(names(dim_params) == inner_dim_across)
file_dim_pos <- which(names(dim_params) == inner_dims_across_files[[inner_dim_across]])
new_pos <- inner_dim_pos
if (file_dim_pos < inner_dim_pos) {
new_pos <- new_pos - 1
}
dim_params_to_move <- dim_params[c(inner_dim_pos, file_dim_pos)]
dim_params <- dim_params[-c(inner_dim_pos, file_dim_pos)]
new_dim_params <- list()
if (new_pos > 1) {
new_dim_params <- c(new_dim_params, dim_params[1:(new_pos - 1)])
}
new_dim_params <- c(new_dim_params, dim_params_to_move)
if (length(dim_params) >= new_pos) {
new_dim_params <- c(new_dim_params, dim_params[new_pos:length(dim_params)])
}
dim_params <- new_dim_params
}
}
}
dim_names <- names(dim_params)
if (is.null(dim_names)) {
stop("At least one pattern dim must be specified.")
}
return(dim_params)
}
# Look for chunked dims
look_for_chunks <- function(dim_params, dim_names) {
chunks <- vector('list', length(dim_names))
names(chunks) <- dim_names
for (dim_name in dim_names) {
if (!is.null(attr(dim_params[[dim_name]], 'chunk'))) {
chunks[[dim_name]] <- attr(dim_params[[dim_name]], 'chunk')
attributes(dim_params[[dim_name]]) <- attributes(dim_params[[dim_name]])[-which(names(attributes(dim_params[[dim_name]])) == 'chunk')]
} else {
chunks[[dim_name]] <- c(chunk = 1, n_chunks = 1)
}
}
return(chunks)
}
# This is a helper function to compute the chunk indices to take once the total
# number of indices for a dimension has been discovered.
chunk_indices <- function(n_indices, chunk, n_chunks, dim_name) {
if (n_chunks > n_indices) {
stop("Requested to divide dimension '", dim_name, "' of length ",
n_indices, " in ", n_chunks, " chunks, which is not possible.")
}
chunk_sizes <- rep(floor(n_indices / n_chunks), n_chunks)
chunks_to_extend <- n_indices - chunk_sizes[1] * n_chunks
if (chunks_to_extend > 0) {
chunk_sizes[1:chunks_to_extend] <- chunk_sizes[1:chunks_to_extend] + 1
}
chunk_size <- chunk_sizes[chunk]
offset <- 0
if (chunk > 1) {
offset <- sum(chunk_sizes[1:(chunk - 1)])
}
indices <- 1:chunk_sizes[chunk] + offset
array(indices, dim = setNames(length(indices), dim_name))
}