7e92c2caeadb1cf42ac9c026bf1dc586c82e1668
1 /*****************************************************************************
2 * RRDtool 1.2.23 Copyright by Tobi Oetiker, 1997-2007
3 *****************************************************************************
4 * rrd_fetch.c read data from an rrd to use for further processing
5 *****************************************************************************
6 * $Id$
7 * $Log$
8 * Revision 1.8 2004/05/18 18:53:03 oetiker
9 * big spell checking patch -- slif@bellsouth.net
10 *
11 * Revision 1.7 2003/11/11 19:46:21 oetiker
12 * replaced time_value with rrd_time_value as MacOS X introduced a struct of that name in their standard headers
13 *
14 * Revision 1.6 2003/01/16 23:27:54 oetiker
15 * fix border condition in rra selection of rrd_fetch
16 * -- Stanislav Sinyagin <ssinyagin@yahoo.com>
17 *
18 * Revision 1.5 2002/06/23 22:29:40 alex
19 * Added "step=1800" and such to "DEF"
20 * Cleaned some of the signed vs. unsigned problems
21 *
22 * Revision 1.4 2002/02/01 20:34:49 oetiker
23 * fixed version number and date/time
24 *
25 * Revision 1.3 2001/12/24 06:51:49 alex
26 * A patch of size 44Kbytes... in short:
27 *
28 * Found and repaired the off-by-one error in rrd_fetch_fn().
29 * As a result I had to remove the hacks in rrd_fetch_fn(),
30 * rrd_tool.c, vdef_calc(), data_calc(), data_proc() and
31 * reduce_data(). There may be other places which I didn't
32 * find so be careful.
33 *
34 * Enhanced debugging in rrd_fetch_fn(), it shows the RRA selection
35 * process.
36 *
37 * Added the ability to print VDEF timestamps. At the moment it
38 * is a hack, I needed it now to fix the off-by-one error.
39 * If the format string is "%c" (and nothing else!), the time
40 * will be printed by both ctime() and as a long int.
41 *
42 * Moved some code around (slightly altering it) from rrd_graph()
43 * initializing now in rrd_graph_init()
44 * options parsing now in rrd_graph_options()
45 * script parsing now in rrd_graph_script()
46 *
47 * Revision 1.2 2001/12/17 12:48:43 oetiker
48 * fix overflow error ...
49 *
50 * Revision 1.1.1.1 2001/02/25 22:25:05 oetiker
51 * checkin
52 *
53 *****************************************************************************/
55 #include "rrd_tool.h"
57 #include "rrd_is_thread_safe.h"
58 /*#define DEBUG*/
60 int
61 rrd_fetch(int argc,
62 char **argv,
63 time_t *start,
64 time_t *end, /* which time frame do you want ?
65 * will be changed to represent reality */
66 unsigned long *step, /* which stepsize do you want?
67 * will be changed to represent reality */
68 unsigned long *ds_cnt, /* number of data sources in file */
69 char ***ds_namv, /* names of data sources */
70 rrd_value_t **data) /* two dimensional array containing the data */
71 {
74 long step_tmp =1;
75 time_t start_tmp=0, end_tmp=0;
76 const char *cf;
78 struct rrd_time_value start_tv, end_tv;
79 char *parsetime_error = NULL;
80 optind = 0; opterr = 0; /* initialize getopt */
82 /* init start and end time */
83 parsetime("end-24h", &start_tv);
84 parsetime("now", &end_tv);
86 while (1){
87 static struct option long_options[] =
88 {
89 {"resolution", required_argument, 0, 'r'},
90 {"start", required_argument, 0, 's'},
91 {"end", required_argument, 0, 'e'},
92 {0,0,0,0}
93 };
94 int option_index = 0;
95 int opt;
96 opt = getopt_long(argc, argv, "r:s:e:",
97 long_options, &option_index);
99 if (opt == EOF)
100 break;
102 switch(opt) {
103 case 's':
104 if ((parsetime_error = parsetime(optarg, &start_tv))) {
105 rrd_set_error( "start time: %s", parsetime_error );
106 return -1;
107 }
108 break;
109 case 'e':
110 if ((parsetime_error = parsetime(optarg, &end_tv))) {
111 rrd_set_error( "end time: %s", parsetime_error );
112 return -1;
113 }
114 break;
115 case 'r':
116 step_tmp = atol(optarg);
117 break;
118 case '?':
119 rrd_set_error("unknown option '-%c'",optopt);
120 return(-1);
121 }
122 }
125 if (proc_start_end(&start_tv,&end_tv,&start_tmp,&end_tmp) == -1){
126 return -1;
127 }
130 if (start_tmp < 3600*24*365*10){
131 rrd_set_error("the first entry to fetch should be after 1980");
132 return(-1);
133 }
135 if (end_tmp < start_tmp) {
136 rrd_set_error("start (%ld) should be less than end (%ld)", start_tmp, end_tmp);
137 return(-1);
138 }
140 *start = start_tmp;
141 *end = end_tmp;
143 if (step_tmp < 1) {
144 rrd_set_error("step must be >= 1 second");
145 return -1;
146 }
147 *step = step_tmp;
149 if (optind + 1 >= argc){
150 rrd_set_error("not enough arguments");
151 return -1;
152 }
154 cf = argv[optind+1];
156 if (rrd_fetch_r(argv[optind],cf,start,end,step,ds_cnt,ds_namv,data) == -1)
157 return(-1);
158 return (0);
159 }
161 int
162 rrd_fetch_r(
163 const char *filename, /* name of the rrd */
164 const char *cf, /* which consolidation function ?*/
165 time_t *start,
166 time_t *end, /* which time frame do you want ?
167 * will be changed to represent reality */
168 unsigned long *step, /* which stepsize do you want?
169 * will be changed to represent reality */
170 unsigned long *ds_cnt, /* number of data sources in file */
171 char ***ds_namv, /* names of data_sources */
172 rrd_value_t **data) /* two dimensional array containing the data */
173 {
174 enum cf_en cf_idx;
176 if ((int)(cf_idx=cf_conv(cf)) == -1 ){
177 return -1;
178 }
180 return (rrd_fetch_fn(filename,cf_idx,start,end,step,ds_cnt,ds_namv,data));
181 }
183 int
184 rrd_fetch_fn(
185 const char *filename, /* name of the rrd */
186 enum cf_en cf_idx, /* which consolidation function ?*/
187 time_t *start,
188 time_t *end, /* which time frame do you want ?
189 * will be changed to represent reality */
190 unsigned long *step, /* which stepsize do you want?
191 * will be changed to represent reality */
192 unsigned long *ds_cnt, /* number of data sources in file */
193 char ***ds_namv, /* names of data_sources */
194 rrd_value_t **data) /* two dimensional array containing the data */
195 {
196 long i,ii;
197 FILE *in_file;
198 time_t cal_start,cal_end, rra_start_time,rra_end_time;
199 long best_full_rra=0, best_part_rra=0, chosen_rra=0, rra_pointer=0;
200 long best_full_step_diff=0, best_part_step_diff=0, tmp_step_diff=0, tmp_match=0, best_match=0;
201 long full_match, rra_base;
202 long start_offset, end_offset;
203 int first_full = 1;
204 int first_part = 1;
205 rrd_t rrd;
206 rrd_value_t *data_ptr;
207 unsigned long rows;
208 long rrd_head_size;
210 #ifdef DEBUG
211 fprintf(stderr,"Entered rrd_fetch_fn() searching for the best match\n");
212 fprintf(stderr,"Looking for: start %10lu end %10lu step %5lu\n",
213 *start,*end,*step);
214 #endif
216 if(rrd_open(filename,&in_file,&rrd, RRD_READONLY)==-1)
217 return(-1);
219 rrd_head_size = ftell(in_file);
221 /* when was the really last update of this file ? */
223 if (((*ds_namv) = (char **) malloc(rrd.stat_head->ds_cnt * sizeof(char*)))==NULL){
224 rrd_set_error("malloc fetch ds_namv array");
225 rrd_free(&rrd);
226 fclose(in_file);
227 return(-1);
228 }
230 for(i=0;(unsigned long)i<rrd.stat_head->ds_cnt;i++){
231 if ((((*ds_namv)[i]) = malloc(sizeof(char) * DS_NAM_SIZE))==NULL){
232 rrd_set_error("malloc fetch ds_namv entry");
233 rrd_free(&rrd);
234 free(*ds_namv);
235 fclose(in_file);
236 return(-1);
237 }
238 strncpy((*ds_namv)[i],rrd.ds_def[i].ds_nam,DS_NAM_SIZE-1);
239 (*ds_namv)[i][DS_NAM_SIZE-1]='\0';
241 }
243 /* find the rra which best matches the requirements */
244 for(i=0;(unsigned)i<rrd.stat_head->rra_cnt;i++){
245 if(cf_conv(rrd.rra_def[i].cf_nam) == cf_idx){
247 cal_end = (rrd.live_head->last_up - (rrd.live_head->last_up
248 % (rrd.rra_def[i].pdp_cnt
249 * rrd.stat_head->pdp_step)));
250 cal_start = (cal_end
251 - (rrd.rra_def[i].pdp_cnt
252 * rrd.rra_def[i].row_cnt
253 * rrd.stat_head->pdp_step));
255 full_match = *end -*start;
256 #ifdef DEBUG
257 fprintf(stderr,"Considering: start %10lu end %10lu step %5lu ",
258 cal_start,cal_end,
259 rrd.stat_head->pdp_step * rrd.rra_def[i].pdp_cnt);
260 #endif
261 /* we need step difference in either full or partial case */
262 tmp_step_diff = labs(*step - (rrd.stat_head->pdp_step
263 * rrd.rra_def[i].pdp_cnt));
264 /* best full match */
265 if(cal_end >= *end
266 && cal_start <= *start){
267 if (first_full || (tmp_step_diff < best_full_step_diff)){
268 first_full=0;
269 best_full_step_diff = tmp_step_diff;
270 best_full_rra=i;
271 #ifdef DEBUG
272 fprintf(stderr,"best full match so far\n");
273 #endif
274 } else {
275 #ifdef DEBUG
276 fprintf(stderr,"full match, not best\n");
277 #endif
278 }
280 } else {
281 /* best partial match */
282 tmp_match = full_match;
283 if (cal_start>*start)
284 tmp_match -= (cal_start-*start);
285 if (cal_end<*end)
286 tmp_match -= (*end-cal_end);
287 if (first_part ||
288 (best_match < tmp_match) ||
289 (best_match == tmp_match &&
290 tmp_step_diff < best_part_step_diff)){
291 #ifdef DEBUG
292 fprintf(stderr,"best partial so far\n");
293 #endif
294 first_part=0;
295 best_match = tmp_match;
296 best_part_step_diff = tmp_step_diff;
297 best_part_rra =i;
298 } else {
299 #ifdef DEBUG
300 fprintf(stderr,"partial match, not best\n");
301 #endif
302 }
303 }
304 }
305 }
307 /* lets see how the matching went. */
308 if (first_full==0)
309 chosen_rra = best_full_rra;
310 else if (first_part==0)
311 chosen_rra = best_part_rra;
312 else {
313 rrd_set_error("the RRD does not contain an RRA matching the chosen CF");
314 rrd_free(&rrd);
315 fclose(in_file);
316 return(-1);
317 }
319 /* set the wish parameters to their real values */
320 *step = rrd.stat_head->pdp_step * rrd.rra_def[chosen_rra].pdp_cnt;
321 *start -= (*start % *step);
322 *end += (*step - *end % *step);
323 rows = (*end - *start) / *step + 1;
325 #ifdef DEBUG
326 fprintf(stderr,"We found: start %10lu end %10lu step %5lu rows %lu\n",
327 *start,*end,*step,rows);
328 #endif
330 /* Start and end are now multiples of the step size. The amount of
331 ** steps we want is (end-start)/step and *not* an extra one.
332 ** Reasoning: if step is s and we want to graph from t to t+s,
333 ** we need exactly ((t+s)-t)/s rows. The row to collect from the
334 ** database is the one with time stamp (t+s) which means t to t+s.
335 */
336 *ds_cnt = rrd.stat_head->ds_cnt;
337 if (((*data) = malloc(*ds_cnt * rows * sizeof(rrd_value_t)))==NULL){
338 rrd_set_error("malloc fetch data area");
339 for (i=0;(unsigned long)i<*ds_cnt;i++)
340 free((*ds_namv)[i]);
341 free(*ds_namv);
342 rrd_free(&rrd);
343 fclose(in_file);
344 return(-1);
345 }
347 data_ptr=(*data);
349 /* find base address of rra */
350 rra_base=ftell(in_file);
351 for(i=0;i<chosen_rra;i++)
352 rra_base += ( *ds_cnt
353 * rrd.rra_def[i].row_cnt
354 * sizeof(rrd_value_t));
356 /* find start and end offset */
357 rra_end_time = (rrd.live_head->last_up
358 - (rrd.live_head->last_up % *step));
359 rra_start_time = (rra_end_time
360 - ( *step * (rrd.rra_def[chosen_rra].row_cnt-1)));
361 /* here's an error by one if we don't be careful */
362 start_offset =(long)(*start + *step - rra_start_time) / (long)*step;
363 end_offset = (long)(rra_end_time - *end ) / (long)*step;
364 #ifdef DEBUG
365 fprintf(stderr,"rra_start %lu, rra_end %lu, start_off %li, end_off %li\n",
366 rra_start_time,rra_end_time,start_offset,end_offset);
367 #endif
369 /* fill the gap at the start if needs be */
371 if (start_offset <= 0)
372 rra_pointer = rrd.rra_ptr[chosen_rra].cur_row+1;
373 else
374 rra_pointer = rrd.rra_ptr[chosen_rra].cur_row+1+start_offset;
376 if(fseek(in_file,(rra_base
377 + (rra_pointer
378 * *ds_cnt
379 * sizeof(rrd_value_t))),SEEK_SET) != 0){
380 rrd_set_error("seek error in RRA");
381 for (i=0;(unsigned)i<*ds_cnt;i++)
382 free((*ds_namv)[i]);
383 free(*ds_namv);
384 rrd_free(&rrd);
385 free(*data);
386 *data = NULL;
387 fclose(in_file);
388 return(-1);
390 }
391 #ifdef DEBUG
392 fprintf(stderr,"First Seek: rra_base %lu rra_pointer %lu\n",
393 rra_base, rra_pointer);
394 #endif
395 /* step trough the array */
397 for (i=start_offset;
398 i< (signed)rrd.rra_def[chosen_rra].row_cnt - end_offset;
399 i++){
400 /* no valid data yet */
401 if (i<0) {
402 #ifdef DEBUG
403 fprintf(stderr,"pre fetch %li -- ",i);
404 #endif
405 for(ii=0;(unsigned)ii<*ds_cnt;ii++){
406 *(data_ptr++) = DNAN;
407 #ifdef DEBUG
408 fprintf(stderr,"%10.2f ",*(data_ptr-1));
409 #endif
410 }
411 }
412 /* past the valid data area */
413 else if (i >= (signed)rrd.rra_def[chosen_rra].row_cnt) {
414 #ifdef DEBUG
415 fprintf(stderr,"post fetch %li -- ",i);
416 #endif
417 for(ii=0;(unsigned)ii<*ds_cnt;ii++){
418 *(data_ptr++) = DNAN;
419 #ifdef DEBUG
420 fprintf(stderr,"%10.2f ",*(data_ptr-1));
421 #endif
422 }
423 } else {
424 /* OK we are inside the valid area but the pointer has to
425 * be wrapped*/
426 if (rra_pointer >= (signed)rrd.rra_def[chosen_rra].row_cnt) {
427 rra_pointer -= rrd.rra_def[chosen_rra].row_cnt;
428 if(fseek(in_file,(rra_base+rra_pointer
429 * *ds_cnt
430 * sizeof(rrd_value_t)),SEEK_SET) != 0){
431 rrd_set_error("wrap seek in RRA did fail");
432 for (ii=0;(unsigned)ii<*ds_cnt;ii++)
433 free((*ds_namv)[ii]);
434 free(*ds_namv);
435 rrd_free(&rrd);
436 free(*data);
437 *data = NULL;
438 fclose(in_file);
439 return(-1);
440 }
441 #ifdef DEBUG
442 fprintf(stderr,"wrap seek ...\n");
443 #endif
444 }
446 if(fread(data_ptr,
447 sizeof(rrd_value_t),
448 *ds_cnt,in_file) != rrd.stat_head->ds_cnt){
449 rrd_set_error("fetching cdp from rra");
450 for (ii=0;(unsigned)ii<*ds_cnt;ii++)
451 free((*ds_namv)[ii]);
452 free(*ds_namv);
453 rrd_free(&rrd);
454 free(*data);
455 *data = NULL;
456 fclose(in_file);
457 return(-1);
458 }
459 #ifdef POSIX_FADVISE
460 /* don't pollute the buffer cache with data read from the file. We do this while reading to
461 keep damage minimal */
462 if (0 != posix_fadvise(fileno(in_file), rrd_head_size, ftell(in_file), POSIX_FADV_DONTNEED)) {
463 rrd_set_error("setting POSIX_FADV_DONTNEED on '%s': %s",file_name, rrd_strerror(errno));
464 fclose(in_file);
465 return(-1);
466 }
467 #endif
469 #ifdef DEBUG
470 fprintf(stderr,"post fetch %li -- ",i);
471 for(ii=0;ii<*ds_cnt;ii++)
472 fprintf(stderr,"%10.2f ",*(data_ptr+ii));
473 #endif
474 data_ptr += *ds_cnt;
475 rra_pointer ++;
476 }
477 #ifdef DEBUG
478 fprintf(stderr,"\n");
479 #endif
481 }
482 rrd_free(&rrd);
483 #ifdef POSIX_FADVISE
484 /* and just to be sure we drop everything except the header at the end */
485 if (0 != posix_fadvise(fileno(in_file), rrd_head_size, 0, POSIX_FADV_DONTNEED)) {
486 rrd_set_error("setting POSIX_FADV_DONTNEED on '%s': %s",file_name, rrd_strerror(errno));
487 fclose(in_file);
488 return(-1);
489 }
490 #endif
491 fclose(in_file);
492 return(0);
493 }