-rw-r--r-- | src/load/load_asn.c | 173 | ||||
-rw-r--r-- | src/load/load_asn.h | 24 | ||||
-rw-r--r-- | src/load/load_features.c | 167 | ||||
-rw-r--r-- | src/load/load_features.h | 12 |
4 files changed, 376 insertions, 0 deletions
diff --git a/src/load/load_asn.h b/src/load/load_asn.h new file mode 100644 index 0000000..a7d54db --- a/dev/null +++ b/src/load/load_asn.h @@ -0,0 +1,24 @@ +#ifndef LOAD_ASN_H +#define LOAD_ASN_H + +#include <hdf5.h> + +/* + * Load the features and other meta-data pulled from Entrez via eFetch + * as ASN.1. + * + * Test: gi|453644 + * + * Retrieving the ASN.1 file via eFetch for gi|453644 worked smoothly; + * however, the hierarchy of the ASN.1 is difficult to align with other + * data by GI. This is because the returned Bioseq-set lacks + * identifiers and gi|453644 appears as a Bioseq member of the + * set. It is positioned on the same hierarchical level as gi|453643. + * The containing set includes the PUB records. By comparison, the XML + * files returned via the same process list gi|453644 at the top + * of the hierarchy, above the PUB records. This output appears to + * be more consistent with the perspective requested in the input. + */ +void load_asn (hid_t file_id, const char* file_name); + +#endif // LOAD_ASN_H |