-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathConvertBam.cpp
More file actions
103 lines (90 loc) · 2.76 KB
/
ConvertBam.cpp
File metadata and controls
103 lines (90 loc) · 2.76 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
#include <stdio.h>
#include <htslib/sam.h>
using namespace std;
#include <string>
#include <sstream>
int main(int argc, char *argv[]) {
if (argc < 2) {
fprintf(stderr, "Usage: %s <bam_file>\n", argv[0]);
return 1;
}
const char *bam_filename = argv[1];
// Open BAM file for reading
samFile *bam_file = hts_open(bam_filename, "r");
if (bam_file == NULL) {
fprintf(stderr, "Error opening BAM file %s\n", bam_filename);
return 1;
}
// Initialize bam header and alignment record
bam_hdr_t *bam_header = sam_hdr_read(bam_file);
bam1_t *alignment = bam_init1();
string prevChrom="";
string prevCigar="";
int prevPos=-1;
int prevScore=-1;
int prevFlag=-1;
int prevMapQV=-1;
// Read and process each alignment
while (sam_read1(bam_file, bam_header, alignment) >= 0) {
// Skip secondary alignments
if (alignment->core.flag & BAM_FSECONDARY) continue;
// Extract information
int32_t tid = alignment->core.tid;
if (tid == -1) { continue;}
int32_t pos = alignment->core.pos + 1; // 1-based position
uint32_t mapq = alignment->core.qual;
int flag=(int) alignment->core.flag;
uint8_t *as_aux = bam_aux_get(alignment, "AS");
int32_t score = 0;
if (as_aux) {
score = bam_aux2i(as_aux);
} else {
fprintf(stderr, "Warning: AS tag not found for this alignment.\n");
}
uint32_t *cigar = bam_get_cigar(alignment);
int n_cigar = alignment->core.n_cigar;
string cigarStr;
stringstream strm;
for (int i = 0; i < n_cigar; ++i) {
char cigar_op = bam_cigar_opchr(bam_cigar_op(cigar[i]));
int cigar_len = bam_cigar_oplen(cigar[i]);
strm << cigar_len << cigar_op;
}
cigarStr = strm.str();
// Retrieve chromosome name
string chrom_name(bam_header->target_name[tid]);
// Print extracted information
if (prevChrom != chrom_name) {
printf("%s\t%d\t%d\t%s\t%d\t%d\n", chrom_name.c_str(), pos, mapq, cigarStr.c_str(), score, flag);
}
else if (prevPos != pos) {
printf("%d\t%d\t%s\t%d\t%d\n", pos, mapq, cigarStr.c_str(), score, flag);
}
else if (prevMapQV != mapq) {
printf("%d\t%s\t%d\t%d\n", mapq, cigarStr.c_str(), score, flag);
}
else if (prevCigar != cigarStr) {
printf("%s\t%d\t%d\n", cigarStr.c_str(), score, flag);
}
else if (prevScore != score) {
printf("%d\t%d\n", score, flag);
}
else if (prevFlag != flag) {
printf("%d\n", flag);
}
else {
printf("\n");
}
prevChrom = chrom_name;
prevPos = pos;
prevScore = score;
prevMapQV=mapq;
prevCigar=cigarStr;
prevFlag=flag;
}
// Clean up
bam_destroy1(alignment);
bam_hdr_destroy(bam_header);
sam_close(bam_file);
return 0;
}