Skip to content

Commit 285c371

Browse files
committed
update to use htsFile in synced reader
1 parent c705bec commit 285c371

File tree

4 files changed

+127
-12
lines changed

4 files changed

+127
-12
lines changed

htslib/synced_bcf_reader.h

+20
Original file line numberDiff line numberDiff line change
@@ -233,10 +233,30 @@ void bcf_sr_destroy_threads(bcf_srs_t *files);
233233
*
234234
* See also the bcf_srs_t data structure for parameters controlling
235235
* the reader's logic.
236+
* Invokes bcf_sr_add_hreader with opened file
236237
*/
237238
HTSLIB_EXPORT
238239
int bcf_sr_add_reader(bcf_srs_t *readers, const char *fname);
239240

241+
/**
242+
* bcf_sr_add_hreader() - open new reader using htsfile
243+
* @readers: holder of the open readers
244+
* @file_ptr: htsfile already opened
245+
* @autoclose: close file along with reader or not, 1 - close, 0 - do not close
246+
* @fname: file name of @file_ptr
247+
*
248+
* Returns 1 if the call succeeded, or 0 on error.
249+
*
250+
* See also the bcf_srs_t data structure for parameters controlling
251+
* the reader's logic.
252+
* If fname is NULL, uses file_ptr->fn for fname
253+
* With fname as NULL, index file must be present in default location with
254+
* default name, as file_ptr->fn doesn't contain index information
255+
*/
256+
HTSLIB_EXPORT
257+
int bcf_sr_add_hreader(bcf_srs_t *readers, htsFile *file_ptr, int autoclose,
258+
const char *fname);
259+
240260
HTSLIB_EXPORT
241261
void bcf_sr_remove_reader(bcf_srs_t *files, int i);
242262

synced_bcf_reader.c

+44-8
Original file line numberDiff line numberDiff line change
@@ -69,6 +69,7 @@ typedef struct
6969
{
7070
sr_sort_t sort;
7171
int regions_overlap, targets_overlap;
72+
int *closefile; // close htsfile with sync reader close or not
7273
}
7374
aux_t;
7475

@@ -251,13 +252,28 @@ void bcf_sr_destroy_threads(bcf_srs_t *files) {
251252
int bcf_sr_add_reader(bcf_srs_t *files, const char *fname)
252253
{
253254
char fmode[5];
255+
int ret = 0;
256+
254257
strcpy(fmode, "r");
255258
vcf_open_mode(fmode+1, fname, NULL);
256259
htsFile* file_ptr = hts_open(fname, fmode);
257260
if ( ! file_ptr ) {
258261
files->errnum = open_failed;
259262
return 0;
260263
}
264+
if (!(ret = bcf_sr_add_hreader(files, file_ptr, 1, fname))) {
265+
hts_close(file_ptr); //failed, close the file
266+
}
267+
return ret;
268+
}
269+
270+
int bcf_sr_add_hreader(bcf_srs_t *files, htsFile *file_ptr, int autoclose, const char *fname)
271+
{
272+
aux_t *auxdata = NULL;
273+
if ( ! file_ptr ) {
274+
files->errnum = open_failed;
275+
return 0;
276+
}
261277

262278
files->has_line = (int*) realloc(files->has_line, sizeof(int)*(files->nreaders+1));
263279
files->has_line[files->nreaders] = 0;
@@ -274,7 +290,7 @@ int bcf_sr_add_reader(bcf_srs_t *files, const char *fname)
274290
BGZF *bgzf = hts_get_bgzfp(reader->file);
275291
if ( bgzf && bgzf_check_EOF(bgzf) == 0 ) {
276292
files->errnum = no_eof;
277-
hts_log_warning("No BGZF EOF marker; file '%s' may be truncated", fname);
293+
hts_log_warning("No BGZF EOF marker; file '%s' may be truncated", file_ptr->fn);
278294
}
279295
if (files->p)
280296
bgzf_thread_pool(bgzf, files->p->pool, files->p->qsize);
@@ -290,7 +306,7 @@ int bcf_sr_add_reader(bcf_srs_t *files, const char *fname)
290306
return 0;
291307
}
292308

293-
reader->tbx_idx = tbx_index_load(fname);
309+
reader->tbx_idx = tbx_index_load(fname ? fname : file_ptr->fn);
294310
if ( !reader->tbx_idx )
295311
{
296312
files->errnum = idx_load_failed;
@@ -309,7 +325,7 @@ int bcf_sr_add_reader(bcf_srs_t *files, const char *fname)
309325

310326
reader->header = bcf_hdr_read(reader->file);
311327

312-
reader->bcf_idx = bcf_index_load(fname);
328+
reader->bcf_idx = bcf_index_load(fname ? fname : file_ptr->fn);
313329
if ( !reader->bcf_idx )
314330
{
315331
files->errnum = idx_load_failed;
@@ -362,7 +378,7 @@ int bcf_sr_add_reader(bcf_srs_t *files, const char *fname)
362378
return 0;
363379
}
364380

365-
reader->fname = strdup(fname);
381+
reader->fname = strdup(fname ? fname : file_ptr->fn);
366382
if ( files->apply_filters )
367383
reader->filter_ids = init_filters(reader->header, files->apply_filters, &reader->nfilter_ids);
368384

@@ -413,6 +429,18 @@ int bcf_sr_add_reader(bcf_srs_t *files, const char *fname)
413429
}
414430
}
415431

432+
if ((auxdata = BCF_SR_AUX(files))) {
433+
//store closure status for htsfile
434+
int *tmp = realloc(auxdata->closefile, sizeof(int) * files->nreaders);
435+
if (!tmp) {
436+
hts_log_error("Failed to allocate memory");
437+
return 0;
438+
}
439+
tmp[files->nreaders - 1] = autoclose;
440+
auxdata->closefile = tmp;
441+
}
442+
443+
416444
return 1;
417445
}
418446

@@ -426,13 +454,15 @@ bcf_srs_t *bcf_sr_init(void)
426454
return files;
427455
}
428456

429-
static void bcf_sr_destroy1(bcf_sr_t *reader)
457+
static void bcf_sr_destroy1(bcf_sr_t *reader, int closefile)
430458
{
431459
free(reader->fname);
432460
if ( reader->tbx_idx ) tbx_destroy(reader->tbx_idx);
433461
if ( reader->bcf_idx ) hts_idx_destroy(reader->bcf_idx);
434462
bcf_hdr_destroy(reader->header);
435-
hts_close(reader->file);
463+
if (closefile) {
464+
hts_close(reader->file);
465+
}
436466
if ( reader->itr ) tbx_itr_destroy(reader->itr);
437467
int j;
438468
for (j=0; j<reader->mbuffer; j++)
@@ -445,8 +475,10 @@ static void bcf_sr_destroy1(bcf_sr_t *reader)
445475
void bcf_sr_destroy(bcf_srs_t *files)
446476
{
447477
int i;
478+
int *autoclose = BCF_SR_AUX(files)->closefile;
479+
448480
for (i=0; i<files->nreaders; i++)
449-
bcf_sr_destroy1(&files->readers[i]);
481+
bcf_sr_destroy1(&files->readers[i], autoclose[i]);
450482
free(files->has_line);
451483
free(files->readers);
452484
for (i=0; i<files->n_smpl; i++) free(files->samples[i]);
@@ -456,19 +488,23 @@ void bcf_sr_destroy(bcf_srs_t *files)
456488
if (files->tmps.m) free(files->tmps.s);
457489
if (files->n_threads) bcf_sr_destroy_threads(files);
458490
bcf_sr_sort_destroy(&BCF_SR_AUX(files)->sort);
491+
free(autoclose);
459492
free(files->aux);
460493
free(files);
461494
}
462495

463496
void bcf_sr_remove_reader(bcf_srs_t *files, int i)
464497
{
465498
assert( !files->samples ); // not ready for this yet
499+
int *autoclose = BCF_SR_AUX(files)->closefile;
500+
466501
bcf_sr_sort_remove_reader(files, &BCF_SR_AUX(files)->sort, i);
467-
bcf_sr_destroy1(&files->readers[i]);
502+
bcf_sr_destroy1(&files->readers[i], autoclose[i]);
468503
if ( i+1 < files->nreaders )
469504
{
470505
memmove(&files->readers[i], &files->readers[i+1], (files->nreaders-i-1)*sizeof(bcf_sr_t));
471506
memmove(&files->has_line[i], &files->has_line[i+1], (files->nreaders-i-1)*sizeof(int));
507+
memmove(&autoclose[i], &autoclose[i+1], (files->nreaders-i-1)*sizeof(int));
472508
}
473509
files->nreaders--;
474510
}

test/test-bcf-sr.c

+34-4
Original file line numberDiff line numberDiff line change
@@ -133,13 +133,15 @@ int main(int argc, char *argv[])
133133
{"targets",required_argument,NULL,'t'},
134134
{"no-index",no_argument,NULL,1000},
135135
{"args",no_argument,NULL,1001},
136+
{"usefptr",no_argument,NULL,'u'},
136137
{NULL,0,NULL,0}
137138
};
138139

139-
int c, pair = 0, use_index = 1, use_fofn = 1;
140+
int c, pair = 0, use_index = 1, use_fofn = 1, usefptr = 0;
140141
enum htsExactFormat out_fmt = text_format; // for original pos + alleles
141142
const char *out_fn = NULL, *regions = NULL, *targets = NULL;
142-
while ((c = getopt_long(argc, argv, "o:O:p:r:t:h", loptions, NULL)) >= 0)
143+
htsFile **htsfp = NULL;
144+
while ((c = getopt_long(argc, argv, "o:O:p:r:t:hu", loptions, NULL)) >= 0)
143145
{
144146
switch (c)
145147
{
@@ -179,6 +181,9 @@ int main(int argc, char *argv[])
179181
case 1001:
180182
use_fofn = 0;
181183
break;
184+
case 'u':
185+
usefptr = 1; //use htsfile interface instead of fname i/f
186+
break;
182187
case 'h':
183188
usage(EXIT_SUCCESS);
184189
default: usage(EXIT_FAILURE);
@@ -218,8 +223,29 @@ int main(int argc, char *argv[])
218223
error("Failed to set targets\n");
219224
}
220225

221-
for (i=0; i<nvcf; i++)
222-
if ( !bcf_sr_add_reader(sr,vcfs[i]) ) error("Failed to open %s: %s\n", vcfs[i],bcf_sr_strerror(sr->errnum));
226+
if (usefptr && !(htsfp = malloc(sizeof(htsFile*) * nvcf))) {
227+
error("Failed to allocate memory\n");
228+
}
229+
230+
for (i=0; i<nvcf; i++) {
231+
if (!usefptr) {
232+
if ( !bcf_sr_add_reader(sr,vcfs[i]) ) {
233+
error("Failed to open %s: %s\n", vcfs[i],
234+
bcf_sr_strerror(sr->errnum));
235+
}
236+
} else { //use htsfile i/f
237+
if (!(htsfp[i] = hts_open(vcfs[i], "r"))) {
238+
error("Failed to open %s: %s\n", vcfs[i],
239+
bcf_sr_strerror(sr->errnum));
240+
}
241+
/*with name, index can be anywhere, named as anything
242+
w/o name it has to be along with file with default naming*/
243+
if ( !bcf_sr_add_hreader(sr, htsfp[i], 1, vcfs[i]) ) {
244+
error("Failed to add reader %s: %s\n", vcfs[i],
245+
bcf_sr_strerror(sr->errnum));
246+
}
247+
}
248+
}
223249

224250
if (!sr->readers || sr->nreaders < 1)
225251
error("No readers set, even though one was added\n");
@@ -264,6 +290,10 @@ int main(int argc, char *argv[])
264290
free(vcfs[i]);
265291
free(vcfs);
266292
}
293+
if (usefptr) {
294+
//files are closed along with sr destroy
295+
free(htsfp);
296+
}
267297

268298
return 0;
269299
}

test/test.pl

+29
Original file line numberDiff line numberDiff line change
@@ -56,6 +56,7 @@
5656
run_test('test_bcf_sr_sort',$opts);
5757
run_test('test_bcf_sr_no_index',$opts);
5858
run_test('test_bcf_sr_range', $opts);
59+
run_test('test_bcf_sr_hreader', $opts);
5960
run_test('test_command',$opts,cmd=>'test-bcf-translate -',out=>'test-bcf-translate.out');
6061
run_test('test_convert_padded_header',$opts);
6162
run_test('test_rebgzip',$opts);
@@ -1345,6 +1346,34 @@ sub test_bcf_sr_range {
13451346
}
13461347
}
13471348

1349+
sub test_bcf_sr_hreader {
1350+
#uses input file from test_bcf_sr_sort / test-bcf-sr.pl
1351+
#invokes bcf sync reader with hread method
1352+
my ($opts, %args) = @_;
1353+
my $test = "test_bcf_sr_hreader";
1354+
my $fail = 0;
1355+
my $cmd = "$$opts{path}/test-bcf-sr -p all $$opts{tmp}/list.txt -o $$opts{tmp}/file.out";
1356+
my $cmd_header = "$$opts{path}/test-bcf-sr -p all $$opts{tmp}/list.txt -o $$opts{tmp}/filenew.out -u";
1357+
my $cmd_diff = "diff $$opts{tmp}/filenew.out $$opts{tmp}/file.out";
1358+
1359+
my ($ret, $out) = _cmd($cmd);
1360+
if ($ret != 0) {
1361+
failed($opts, $test, "Failed to create reference output\n");
1362+
return;
1363+
}
1364+
($ret, $out) = _cmd($cmd_header);
1365+
if ($ret != 0) {
1366+
failed($opts, $test, "Failed to create output\n");
1367+
return;
1368+
}
1369+
($ret, $out) = _cmd($cmd_diff);
1370+
if ($ret != 0) {
1371+
failed($opts, $test, "Output differs to reference output\n");
1372+
return;
1373+
}
1374+
passed($opts, $test);
1375+
}
1376+
13481377
sub test_command
13491378
{
13501379
my ($opts, %args) = @_;

0 commit comments

Comments
 (0)