diff options
author | Thomas White <taw@physics.org> | 2020-06-23 17:57:37 +0200 |
---|---|---|
committer | Thomas White <taw@physics.org> | 2020-07-29 18:53:44 +0200 |
commit | bed1e11f220c315e1a01b917abf200e927a1621a (patch) | |
tree | 5fca620942d0588b13d27e421cfa999d1c10075b /libcrystfel | |
parent | 83f4aece3488f72496aad2ed2d9d559a06271557 (diff) |
Path part of event expansion
Diffstat (limited to 'libcrystfel')
-rw-r--r-- | libcrystfel/src/image-hdf5.c | 217 |
1 files changed, 214 insertions, 3 deletions
diff --git a/libcrystfel/src/image-hdf5.c b/libcrystfel/src/image-hdf5.c index a59154fc..82968575 100644 --- a/libcrystfel/src/image-hdf5.c +++ b/libcrystfel/src/image-hdf5.c @@ -1131,10 +1131,221 @@ ImageFeatureList *image_hdf5_read_peaks_hdf5(const DataTemplate *dtempl, } -struct event_list *image_hdf5_expand_frames(const DataTemplate *dtempl, - const char *filename) +/* This could be extended, later, to include patterns other than just + * a literal string (no placeholders) and just %. However, pattern + * matching is in general not that easy. */ +static char *matches_pattern(const char *name, const char *pattern, + const char *ev_str_old) { - struct event_list *master_el; + if ( strcmp(pattern, "%") == 0 ) { + char *nstr = malloc(strlen(ev_str_old)+strlen(name)+2); + if ( nstr == NULL ) { + ERROR("Couldn't allocate memory\n"); + return NULL; + } + strcpy(nstr, ev_str_old); + strcat(nstr, "/"); + strcat(nstr, name); + return nstr; + } else { + if ( strcmp(name, pattern) == 0 ) { + return strdup(ev_str_old); + } else { + return NULL; + } + } +} + + +/* Private structure, just to avoid passing char *** around */ +struct ev_list +{ + char **events; + int n_events; + int max_events; +}; + + +static void add_to_list(struct ev_list *list, char *ev_str) +{ + if ( list->n_events == list->max_events ) { + char **new_events = realloc(list->events, + (list->max_events+128)*sizeof(char *)); + if ( new_events == NULL ) return; + list->max_events += 128; + list->events = new_events; + } + + list->events[list->n_events++] = ev_str; +} + + +static int rec_expand_paths(hid_t gh, struct ev_list *list, + const char *ev_str, + char **pattern_bits, int n_pattern_bits) +{ + int i; + H5G_info_t group_info; + + if ( H5Gget_info(gh, &group_info) < 0 ) { + ERROR("Couldn't get group info\n"); + return 1; + } + + for ( i=0; i<group_info.nlinks; i++ ) { + + ssize_t size; + char *name; + H5O_info_t obj_info; + char *ev_str_new; + + size = H5Lget_name_by_idx(gh, ".", H5_INDEX_NAME, + H5_ITER_INC, i, NULL, 0, + H5P_DEFAULT); + if ( (size < 0) || (size > 20000) ) { + ERROR("Couldn't get link name\n"); + return 1; + } + + name = malloc(size+1); + if ( name == NULL ) { + ERROR("Couldn't allocate memory\n"); + return 1; + } + + if ( H5Lget_name_by_idx(gh, ".", H5_INDEX_NAME, + H5_ITER_INC, i, name, size+1, + H5P_DEFAULT) < 0 ) + { + ERROR("Couldn't get name\n"); + return 1; + } + + ev_str_new = matches_pattern(name, pattern_bits[0], + ev_str); + if ( ev_str_new == NULL ) { + free(name); + continue; + } + + if ( H5Oget_info_by_idx(gh, ".", H5_INDEX_NAME, + H5_ITER_INC, i, &obj_info, 0) ) + { + ERROR("Couldn't get info\n"); + free(name); + free(ev_str_new); + return 1; + } + + if ( obj_info.type == H5O_TYPE_GROUP ) { + + hid_t child_gh; + + if ( n_pattern_bits == 0 ) { + ERROR("Pattern doesn't match file" + " (too short)\n"); + free(name); + free(ev_str_new); + return 1; + } + + child_gh = H5Gopen1(gh, name); + if ( child_gh < 0 ) { + ERROR("Couldn't open '%s'\n", name); + free(name); + free(ev_str_new); + return 1; + } + + if ( rec_expand_paths(child_gh, list, + ev_str_new, + &pattern_bits[1], + n_pattern_bits - 1) ) + { + free(name); + free(ev_str_new); + return 1; + } + + free(ev_str_new); + H5Gclose(child_gh); + + } else if ( obj_info.type == H5O_TYPE_DATASET ) { + + if ( n_pattern_bits != 1 ) { + ERROR("Pattern doesn't match file" + " (too long by %i)\n", + n_pattern_bits); + free(name); + free(ev_str_new); + return 1; + } + + add_to_list(list, ev_str_new); + + } + + free(name); + + } + + return 0; +} + + +static char **expand_paths(hid_t fh, char *pattern, int *n_evs) +{ + int n_sep; + size_t len; + char **pattern_bits; + struct ev_list list; + int i; + char *start; + + if ( pattern == NULL ) return NULL; + if ( pattern[0] != '/' ) return NULL; + + /* Chop up the pattern into path bits */ + len = strlen(pattern); + n_sep = 0; + for ( i=0; i<len; i++ ) { + if ( pattern[i] == '/' ) n_sep++; + } + + pattern_bits = malloc(n_sep*sizeof(char *)); + if ( pattern_bits == NULL ) return NULL; + + start = pattern+1; + for ( i=0; i<n_sep; i++ ) { + char *sep = strchr(start, '/'); + assert(sep != NULL); + pattern_bits[i] = strndup(start, sep-start); + if ( pattern_bits[i] == NULL ) return NULL; + start = sep+1; + } + + list.n_events = 0; + list.max_events = 0; + list.events = NULL; + + rec_expand_paths(fh, &list, "", pattern_bits, n_sep); + + for ( i=0; i<n_sep; i++ ) { + free(pattern_bits[i]); + } + free(pattern_bits); + + *n_evs = list.n_events; + return list.events; +} + + +char **image_hdf5_expand_frames(const DataTemplate *dtempl, + const char *filename, + int *pn_frames) +{ + char **frames = NULL; + int n_frames; hid_t fh; fh = H5Fopen(filename, H5F_ACC_RDONLY, H5P_DEFAULT); |