@@ -198,7 +198,7 @@ int run_scaffolding(char *fai, char *agp, char *link_file, cov_norm_t *cov_norm,
198
198
fprintf (stderr , "[I::%s] RAM limit: %.3fGB\n" , __func__ , (double ) rss_limit / GB );
199
199
fprintf (stderr , "[I::%s] RAM required: %.3fGB\n" , __func__ , (double ) rss_intra / GB );
200
200
re = ENOMEM_ERR ;
201
- goto scaff_done ;
201
+ goto scaff_failed_0 ;
202
202
}
203
203
rss_limit -= rss_intra ;
204
204
fprintf (stderr , "[I::%s] starting norm estimation...\n" , __func__ );
@@ -213,9 +213,8 @@ int run_scaffolding(char *fai, char *agp, char *link_file, cov_norm_t *cov_norm,
213
213
norm_t * norm = calc_norms (intra_link_mat , d_min_cell , d_mass_frac );
214
214
if (norm == 0 ) {
215
215
fprintf (stderr , "[W::%s] No enough bands for norm calculation... End of scaffolding round.\n" , __func__ );
216
- intra_link_mat_destroy (intra_link_mat );
217
216
re = ENOBND_ERR ;
218
- goto scaff_done ;
217
+ goto scaff_failed_1 ;
219
218
}
220
219
221
220
rss_inter = no_mem_check ? 0 : estimate_inter_link_mat_init_rss (dict , resolution , norm -> r );
@@ -225,7 +224,7 @@ int run_scaffolding(char *fai, char *agp, char *link_file, cov_norm_t *cov_norm,
225
224
fprintf (stderr , "[I::%s] RAM limit: %.3fGB\n" , __func__ , (double ) rss_limit / GB );
226
225
fprintf (stderr , "[I::%s] RAM required: %.3fGB\n" , __func__ , (double ) rss_inter / GB );
227
226
re = ENOMEM_ERR ;
228
- goto scaff_done ;
227
+ goto scaff_failed_1 ;
229
228
}
230
229
rss_limit -= rss_inter ;
231
230
fprintf (stderr , "[I::%s] starting link estimation...\n" , __func__ );
@@ -242,8 +241,7 @@ int run_scaffolding(char *fai, char *agp, char *link_file, cov_norm_t *cov_norm,
242
241
double la ;
243
242
re = inter_link_norms (inter_link_mat , norm , 1 , max_noise_ratio , & la );
244
243
if (re ) {
245
- inter_link_mat_destroy (inter_link_mat );
246
- goto scaff_done ;
244
+ goto scaff_failed_2 ;
247
245
}
248
246
249
247
int8_t * directs = 0 ;
@@ -310,7 +308,7 @@ int run_scaffolding(char *fai, char *agp, char *link_file, cov_norm_t *cov_norm,
310
308
311
309
asm_dict_t * d = make_asm_dict_from_graph (g , g -> sdict );
312
310
// write scaffolds to AGP file
313
- FILE * agp_out ;
311
+ FILE * agp_out = NULL ;
314
312
if (out ) {
315
313
char * agp_out_name = (char * ) malloc (strlen (out ) + 5 );
316
314
sprintf (agp_out_name , "%s.agp" , out );
@@ -321,19 +319,23 @@ int run_scaffolding(char *fai, char *agp, char *link_file, cov_norm_t *cov_norm,
321
319
}
322
320
if (agp_out == NULL ) {
323
321
fprintf (stderr , "[E::%s] fail to open file to write\n" , __func__ );
324
- return 0 ;
322
+ re = 1 ;
323
+ } else {
324
+ write_asm_dict_to_agp (d , agp_out );
325
+ fclose (agp_out );
325
326
}
326
- write_asm_dict_to_agp (d , agp_out );
327
- fclose (agp_out );
328
-
327
+
329
328
asm_destroy (d );
329
+ graph_destroy (g );
330
330
331
- intra_link_mat_destroy ( intra_link_mat );
331
+ scaff_failed_2 :
332
332
inter_link_mat_destroy (inter_link_mat );
333
+
334
+ scaff_failed_1 :
333
335
norm_destroy (norm );
334
- graph_destroy ( g );
335
-
336
- scaff_done :
336
+ intra_link_mat_destroy ( intra_link_mat );
337
+
338
+ scaff_failed_0 :
337
339
asm_destroy (dict );
338
340
sd_destroy (sdict );
339
341
@@ -446,7 +448,7 @@ static void print_asm_stats(uint64_t *n_stats, uint32_t *l_stats, int all)
446
448
#endif
447
449
}
448
450
449
- int run_yahs (char * fai , char * agp , char * link_file , uint32_t ml , uint8_t mq , uint32_t wd , char * out , int * resolutions , int nr , int rr , re_cuts_t * re_cuts , int8_t * telo_ends , uint32_t d_min_cell , double d_mass_frac , int no_contig_ec , int no_scaffold_ec , int no_mem_check )
451
+ int run_yahs (char * fai , char * agp , char * link_file , uint32_t ml , uint8_t mq , char * out , int * resolutions , int nr , int rr , re_cuts_t * re_cuts , int8_t * telo_ends , uint32_t d_min_cell , double d_mass_frac , int no_contig_ec , int no_scaffold_ec , int no_mem_check )
450
452
{
451
453
int ec_round , resolution , re , r , rn , rc , ex ;
452
454
uint64_t n50 ;
@@ -468,8 +470,6 @@ int run_yahs(char *fai, char *agp, char *link_file, uint32_t ml, uint8_t mq, uin
468
470
out_fn = (char * ) malloc (strlen (out ) + 35 );
469
471
out_agp = (char * ) malloc (strlen (out ) + 35 );
470
472
out_agp_break = (char * ) malloc (strlen (out ) + 35 );
471
-
472
- cov_norm = cov_norm_from_file (link_file , sdict , wd );
473
473
474
474
if (no_contig_ec == 0 ) {
475
475
#ifdef DEBUG
@@ -521,6 +521,8 @@ int run_yahs(char *fai, char *agp, char *link_file, uint32_t ml, uint8_t mq, uin
521
521
print_asm_stats (n_stats , l_stats , 1 );
522
522
asm_destroy (dict );
523
523
524
+ cov_norm = cov_norm_from_file (link_file , sdict );
525
+
524
526
r = rc = 0 ;
525
527
rn = rr ;
526
528
ex = max_extra_try ;
@@ -696,22 +698,27 @@ static void print_help(FILE *fp_help, int is_long_help)
696
698
fprintf (fp_help , " -e STR restriction enzyme cutting sites [none]\n" );
697
699
fprintf (fp_help , " -l INT minimum length of a contig to scaffold [0]\n" );
698
700
fprintf (fp_help , " -q INT minimum mapping quality [10]\n" );
701
+ fprintf (fp_help , "\n" );
702
+ fprintf (fp_help , " --no-contig-ec do not do contig error correction\n" );
703
+ fprintf (fp_help , " --no-scaffold-ec do not do scaffold error correction\n" );
704
+ fprintf (fp_help , " --no-mem-check do not do memory check at runtime\n" );
705
+ fprintf (fp_help , " --file-type STR input file type BED|BAM|PA5|BIN, file name extension is ignored if set\n" );
706
+ fprintf (fp_help , " --read-length read length (required for PA5 format input) [150]\n" );
707
+ fprintf (fp_help , " --telo-motif STR telomeric sequence motif\n" );
699
708
if (is_long_help ) {
709
+ fprintf (fp_help , "\n" );
700
710
fprintf (fp_help , " --D-min-cells INT minimum number of cells to calculate the distance threshold [30]\n" );
701
711
fprintf (fp_help , " --D-mass-frac FLOAT fraction of HiC signals to calculate the distance threshold [0.99]\n" );
712
+ fprintf (fp_help , "\n" );
702
713
fprintf (fp_help , " --seq-ctype STR AGP output sequence component type [%s]\n" , agp_component_type_val (DEFAULT_AGP_SEQ_COMPONENT_TYPE ));
703
714
fprintf (fp_help , " --gap-ctype STR AGP output gap component type [%s]\n" , agp_component_type_val (DEFAULT_AGP_GAP_COMPONENT_TYPE ));
704
715
fprintf (fp_help , " --gap-link STR AGP output gap linkage evidence [%s]\n" , agp_linkage_evidence_val (DEFAULT_AGP_LINKAGE_EVIDENCE ));
705
716
fprintf (fp_help , " --gap-size INT AGP output gap size between sequence component [%d]\n" , DEFAULT_AGP_GAP_SIZE );
717
+ fprintf (fp_help , "\n" );
706
718
fprintf (fp_help , " --convert-to-binary make a binary ouput file from the input and exit\n" );
707
719
fprintf (fp_help , " --print-telo-motifs print telomeric motifs in the database and exit\n" );
708
720
}
709
- fprintf (fp_help , " --no-contig-ec do not do contig error correction\n" );
710
- fprintf (fp_help , " --no-scaffold-ec do not do scaffold error correction\n" );
711
- fprintf (fp_help , " --no-mem-check do not do memory check at runtime\n" );
712
- fprintf (fp_help , " --file-type STR input file type BED|BAM|PA5|BIN, file name extension is ignored if set\n" );
713
- fprintf (fp_help , " --read-length read length (required for PA5 format input) [150]\n" );
714
- fprintf (fp_help , " --telo-motif STR telomeric sequence motif\n" );
721
+ fprintf (fp_help , "\n" );
715
722
fprintf (fp_help , " -o STR prefix of output files [yahs.out]\n" );
716
723
fprintf (fp_help , " -v INT verbose level [%d]\n" , VERBOSE );
717
724
fprintf (fp_help , " -? print long help with extra option list\n" );
@@ -754,7 +761,6 @@ int main(int argc, char *argv[])
754
761
int * resolutions , nr , rr , mq , ml , rl ;
755
762
int no_contig_ec , no_scaffold_ec , no_mem_check , d_min_cell , print_telomotifs , convert_binary ;
756
763
int8_t * telo_ends ;
757
- uint32_t wd ;
758
764
double q_drop , d_mass_frac ;
759
765
enum fileTypes f_type ;
760
766
@@ -770,7 +776,6 @@ int main(int argc, char *argv[])
770
776
ml = 0 ;
771
777
rl = 150 ;
772
778
ecstr = 0 ;
773
- wd = 1000 ;
774
779
q_drop = 0.1 ;
775
780
d_min_cell = 30 ;
776
781
d_mass_frac = 0.99 ;
@@ -1032,17 +1037,17 @@ int main(int argc, char *argv[])
1032
1037
link_bin_file = malloc (strlen (out ) + 5 );
1033
1038
sprintf (link_bin_file , "%s.bin" , out );
1034
1039
fprintf (stderr , "[I::%s] dump hic links (BAM) to binary file %s\n" , __func__ , link_bin_file );
1035
- dump_links_from_bam_file (link_file , fai , ml , 0 , wd , q_drop , link_bin_file );
1040
+ dump_links_from_bam_file (link_file , fai , ml , 0 , q_drop , link_bin_file );
1036
1041
} else if (f_type == BED ) {
1037
1042
link_bin_file = malloc (strlen (out ) + 5 );
1038
1043
sprintf (link_bin_file , "%s.bin" , out );
1039
1044
fprintf (stderr , "[I::%s] dump hic links (BED) to binary file %s\n" , __func__ , link_bin_file );
1040
- dump_links_from_bed_file (link_file , fai , ml , 0 , wd , q_drop , link_bin_file );
1045
+ dump_links_from_bed_file (link_file , fai , ml , 0 , q_drop , link_bin_file );
1041
1046
} else if (f_type == PA5 ) {
1042
1047
link_bin_file = malloc (strlen (out ) + 5 );
1043
1048
sprintf (link_bin_file , "%s.bin" , out );
1044
1049
fprintf (stderr , "[I::%s] dump hic links (PA5) to binary file %s\n" , __func__ , link_bin_file );
1045
- dump_links_from_pa5_file (link_file , fai , ml , 0 , rl , wd , q_drop , link_bin_file );
1050
+ dump_links_from_pa5_file (link_file , fai , ml , 0 , rl , q_drop , link_bin_file );
1046
1051
} else if (f_type == BIN ) {
1047
1052
if (convert_binary ) {
1048
1053
fprintf (stderr , "[E::%s] Input is already in BIN format\n" , __func__ );
@@ -1083,7 +1088,7 @@ int main(int argc, char *argv[])
1083
1088
1084
1089
if (convert_binary ) goto final_clean ;
1085
1090
1086
- ret = run_yahs (fai , agp , link_bin_file , ml , mq8 , wd , out , resolutions , nr , rr , re_cuts , telo_ends , d_min_cell , d_mass_frac , no_contig_ec , no_scaffold_ec , no_mem_check );
1091
+ ret = run_yahs (fai , agp , link_bin_file , ml , mq8 , out , resolutions , nr , rr , re_cuts , telo_ends , d_min_cell , d_mass_frac , no_contig_ec , no_scaffold_ec , no_mem_check );
1087
1092
1088
1093
if (ret == 0 ) {
1089
1094
agp_final = (char * ) malloc (strlen (out ) + 35 );
0 commit comments