Skip to content

Commit d77e5a0

Browse files
committed
Do not rename reverse complemented sequences
1 parent 2e8a134 commit d77e5a0

File tree

6 files changed

+17
-17
lines changed

6 files changed

+17
-17
lines changed

src/cfeintact/aligned_sequence.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -39,7 +39,7 @@ def coordinate_mapping(self):
3939

4040
def reverse(self):
4141
newthis = SeqRecord(Seq.reverse_complement(self.this.seq),
42-
id=(self.this.id or "*Unknown*") + "[REVERSE_COMPLEMENT]",
42+
id=self.this.id,
4343
name=self.this.name
4444
)
4545

tests/expected-results-edgy/errors.json

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1195,7 +1195,7 @@
11951195
"orf": null
11961196
}
11971197
],
1198-
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.REVERSECOMPLEMENTED[REVERSE_COMPLEMENT]": [],
1198+
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.REVERSECOMPLEMENTED": [],
11991199
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.REVERSED": [
12001200
{
12011201
"qseqid": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.REVERSED",
@@ -1420,7 +1420,7 @@
14201420
"orf": null
14211421
}
14221422
],
1423-
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-XS[REVERSE_COMPLEMENT]": [
1423+
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-XS": [
14241424
{
14251425
"qseqid": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-XS",
14261426
"error": "UnknownNucleotide",
@@ -1664,15 +1664,15 @@
16641664
"orf": null
16651665
}
16661666
],
1667-
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-BAD-SYMBOLS[REVERSE_COMPLEMENT]": [
1667+
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-BAD-SYMBOLS": [
16681668
{
16691669
"qseqid": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-BAD-SYMBOLS",
16701670
"error": "UnknownNucleotide",
16711671
"message": "Sequence contains invalid nucleotides: >1>#>@> (start: 45, end: 51).",
16721672
"orf": null
16731673
}
16741674
],
1675-
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-DASHES[REVERSE_COMPLEMENT]": [
1675+
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-DASHES": [
16761676
{
16771677
"qseqid": "Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-DASHES",
16781678
"error": "UnknownNucleotide",

tests/expected-results-edgy/holistic.json

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -103,7 +103,7 @@
103103
"orfs_end": 8368,
104104
"blast_n_conseqs": 0
105105
},
106-
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.REVERSECOMPLEMENTED[REVERSE_COMPLEMENT]": {
106+
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.REVERSECOMPLEMENTED": {
107107
"intact": true,
108108
"qlen": 9718,
109109
"hypermutation_probablility": 0.0,
@@ -129,7 +129,7 @@
129129
"orfs_end": 8368,
130130
"blast_n_conseqs": 0
131131
},
132-
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-XS[REVERSE_COMPLEMENT]": {
132+
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-XS": {
133133
"intact": false,
134134
"qlen": 9711,
135135
"hypermutation_probablility": 0.0,
@@ -155,7 +155,7 @@
155155
"orfs_end": 8368,
156156
"blast_n_conseqs": 0
157157
},
158-
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-BAD-SYMBOLS[REVERSE_COMPLEMENT]": {
158+
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-BAD-SYMBOLS": {
159159
"intact": false,
160160
"qlen": 9711,
161161
"hypermutation_probablility": 0.0,
@@ -168,7 +168,7 @@
168168
"orfs_end": 8793,
169169
"blast_n_conseqs": 3
170170
},
171-
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-DASHES[REVERSE_COMPLEMENT]": {
171+
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-DASHES": {
172172
"intact": false,
173173
"qlen": 9711,
174174
"hypermutation_probablility": 0.0,

tests/expected-results-edgy/intact.fasta

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -324,7 +324,7 @@ CTGGGGAGTGGCGAGCCCTCAGATCCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGG
324324
TCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTG
325325
CTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGT
326326
GACTCTGGTAACTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCA
327-
>Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.REVERSECOMPLEMENTED[REVERSE_COMPLEMENT] <unknown description>
327+
>Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.REVERSECOMPLEMENTED <unknown description>
328328
TGGAAGGGCTAATTCACTCCCAACGAAGACAAGATATCCTTGATCTGTGGATCTACCACA
329329
CACAAGGCTACTTCCCTGATTAGCAGAACTACACACCAGGGCCAGGGATCAGATATCCAC
330330
TGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGAGAAGTTAGAAGAAGCCA

tests/expected-results-edgy/nonintact.fasta

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -332,7 +332,7 @@ CCCAGTAGGTAAGGTACGTCCGAGTGTCCCACATTGTTCGACCACAAGAGAGGAAACAAC
332332
CGAAGAAGATTGAAGAGACCGAGTTGACCATGATCGAACATCGTGGTAGGTTTCCAGTCA
333333
CCTATAGACTAGGGACCGGGACCACACATCAAGACGATTAGTCCCTTCATCGGAACACAC
334334
ACCATCTAGGTGTCTAGTTCCTATAGAACAGAAGCAACCCTCACTTAATCGGGAAGGT
335-
>Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-XS[REVERSE_COMPLEMENT] <unknown description>
335+
>Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-XS <unknown description>
336336
TGGAAGGGCTAATTCACTCCCAACGAAGACAAGATATCCTTGATCTGTGGATCTACCACA
337337
CACAAGGCTACTTCCCTGATTAGCAGAACTACACACCAGGGCCAGGGATCAGATATCCAC
338338
TGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGAGAAGTTAGAAGAAGCCA
@@ -497,7 +497,7 @@ CTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGT
497497
GACTCTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCA
498498
>small-sequence-with-xs <unknown description>
499499
ATCTCTAGAGTC
500-
>Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-BAD-SYMBOLS[REVERSE_COMPLEMENT] <unknown description>
500+
>Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-BAD-SYMBOLS <unknown description>
501501
TGGAAGGGCTAATTCACTCCCAACGAAGACAAGATATCCTTGATCTGTGGATCTACCACA
502502
CACAAGGCTACTTCCCTGATTAGCAGAACTACACACCAGGGCCAGGGATCAGATATCCAC
503503
TGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGAGAAGTTAGAAGAAGCCA
@@ -660,7 +660,7 @@ CTGGGGAGTGGCGAGCCCTCAGATCCTGCATATAAGCAGCTGCTTTTTGCCTGTACTGGG
660660
TCTCTCTGGTTAGACCAGATCTGAGCCTGGGAGCTCTCTGGCTAACTAGGGAACCCACTG
661661
CTTAAGCCTCAATAAAGCTTGCCTTGAGTGCTTCAAGTAGTGTGTGCCCGTCTGTTGTGT
662662
GACTCTAGAGATCCCTCAGACCCTTTTAGTCAGTGTGGAAAATCTCTAGCA
663-
>Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-DASHES[REVERSE_COMPLEMENT] <unknown description>
663+
>Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-DASHES <unknown description>
664664
TGGAAGGGCTAATTCACTCCCAACGAAGACAAGATATCCTTGATCTGTGGATCTACCACA
665665
CACAAGGCTACTTCCCTGATTAGCAGAACTACACACCAGGGCCAGGGATCAGATATCCAC
666666
TGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGAGAAGTTAGAAGAAGCCA

tests/expected-results-edgy/orfs.json

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1335,7 +1335,7 @@
13351335
"subtype_nucleotides": "TTTTTTAGGGAAAATTTGGCCTTCCAACAAGGGAAGGCCGGGGAATTTTCCTCAGAGCAGACCAGAGCCAACAGCCCCACCAGCAGAAAACTGGGGGATGGGGGAAGAGATAACGGGGGAAGAGATAACCTCCTTACCGAAGCAGGAGCAGAAAGACAAGGAACATCCTCCTCCTTTAGTTTCCCTCAAATCACTCTTTGGCAACGACCCCTTGTCACAGTAAAAATAGGAGGACAGCTGAAAGAAGCTCTATTAGATACAGGAGCAGATGATACAGTATTAGAAGATATAAATTTGCCAGGAAAATGGAAACCAAAAATGATAGGGGGAATTGGAGGTTTTATCAAGGTAAAGCAATATGATCAGATACTTATAGAAATCTGTGGAAAAAAGGCTATAGGTACAGTATTAGTAGGACCTACACCTGTCAACATAATTGGACGAAATATGTTGACTCAGATTGGTTGTACTTTAAATTTCCCAATTAGTCCTATTGACACTGTACCAGTAACATTAAAGCCAGGAATGGATGGACCAAAGGTTAAACAGTGGCCATTGACAGAAGAAAAAATAAAAGCATTAACAGAAATTTGTAAAGAGATGGAAGAGGAAGGAAAAATCTCAAAAATTGGGCCTGAAAATCCATACAATACTCCAGTATTTGCTATAAAGAAAAAGGACAGCACCAAATGGAGGAAATTAGTAGATTTCAGAGAGCTCAATAAAAGAACTCAGGACTTTTGGGAAGTTCAATTAGGAATACCGCATCCAGCAGGTTTAAAAAAGAAAAAATCAGTAACAGTACTAGATGTGGGAGATGCATATTTTTCAGTTCCTTTAGATGAAAGCTTTAGAAAGTATACTGCATTCACCATACCTAGTATAAACAATGAGACACCAGGAATCAGATATCAGTACAATGTGCTGCCACAGGGATGGAAAGGATCACCGGCAATATTCCAGAGTAGCATGACAAAAATCTTAGAGCCCTTTAGAATAAAAAATCCAGAAATGGTTATCTATCAATACAAGGATGACTTGTATGTAGGATCTGATTTAGAAATAGGGCAGCACAGAACAAAAATAGAGGAGCTAAGAGCTCATCTATTGAGCTGGGGATTTACTACACCAGACAAAAAGCATCAGAAGGAACCTCCATTCCTTTGGATGGGATATGAACTCCATCCTGACAGATGGACAGTCCAGCCTATAGAACTGCCAGAAAAAGACAGCTGGACTGTCAATGATATACAGAAATTAGTGGGAAAACTAAATTGGGCAAGTCAAATTTATGCAGGGATTAAGGTAAAGCAACTGTGTAAACTCCTCAGGGGAGCTAAAGCACTAACAGACATAGTACCACTGACTGAAGAAGCAGAATTAGAGTTGGCAGAGAACAGGGAGATTCTAAAAACCCCTGTGCATGGAGTATATTATGACCCATCAAAAGACTTAGTAGCAGAAGTACAGAAACAAGGGCAGGACCAATGGACATATCAAATTTATCAAGAGCCATTTAAAAATCTAAAAACAGGAAAATATGCCAGAAGAGGGTCTGCTCACACTAATGATGTAAGACAATTAACAGAAGTGGTGCAAAAAGTAGCCACAGAAAGCATAGTAATATGGGGAAAGACCCCTAAATTTAGACTACCCATACAAAGAGAAACATGGGAAACATGGTGGATGGAGTATTGGCAGGCTACCTGGATTCCTGAATGGGAGTTTGTTAATACCCCTCCTCTAGTAAAATTATGGTACCAATTAGAAAAAGACCCCATAGTAGGAGCAGAGACTTTCTATGTAGATGGGGCAGCTAGTAGGGAGACTAAGCTAGGAAAAGCAGGGTATGTCACTGACAGAGGAAGACAAAAGGTAGTTTCCCTAACTGAGACAACAAATCAAAAGACTGAATTACATGCGATCCATTTAGCCTTGCAGGATTCAGGATCAGAAGTAAATATAGTAACAGACTCACAATATGCATTAGGAATCATTCAGGCACAACCAGACAGGAGTGAATCAGAAGTAGTCAACCAAATAATAGAGGAGCTAATAAAAAAGGAGAAAGTCTACCTGTCATGGGTACCAGCACACAAGGGGATTGGAGGAAATGAACAAGTAGATAAATTAGTCAGTTCAGGAATCAGGAAGGTGCTATTTTTAGATGGGATAGATAAGGCTCAAGAAGAACATGAAAGATATCACAGCAATTGGAGAACAATGGCTAGTGATTTTAATTTGCCACCTATAGTAGCAAAGGAAATAGTAACCAACTGTGATAAATGTCAACTAAAAGGGGAAGCTATGCATGGACAAGTAGACTGTAGTCCAGGGATATGGCAATTAGATTGCACACATCTAGAAGGAAAAGTCATCCTGGTAGCAGTCCACGTGGCCAGTGGATATATAGAAGCAGAAGTTATCCCAGCAGAAACAGGACAGGAGACAGCATACTTTCTGCTAAAACTAGCAGGAAGATGGCCAGTAAAAGTAATACACACAGACAACGGTAGCAATTTCACCAGCGCTGCAGTTAAAGCAGCCTGTTGGTGGGCCAATGTCCAACAGGAATTTGGGATCCCCTACAATCCCCAAAGTCAAGGAGTAGTAGAATCTATGAATAAGGAATTAAAGAAAATCATAGGGCAGGTAAGAGAGCAAGCTGAACACCTTAAAACAGCAGTACAAATGGCAGTATTCATTCACAATTTTAAAAGAAAAGGGGGGATTGGGGGGTACAGTGCAGGGGAAAGAATAATAGACATAATAGCAACAGACATACAAACTAAAGAATTACAAAAACAAATTACAAAAATTCAAAATTTTCGGGTTTATTACAGGGACAGCAGAGACCCAATTTGGAAAGGACCAGCAAAACTACTCTGGAAAGGTGAAGGGGCAGTAGTAATACAAGACAATAGTGATATAAAAGTAGTACCAAGAAGAAAAGCAAAGATCATTAGGGATTATGGAAAACAGATGGCAGGTGATGATTGTGTGGCAGGTAGACAGGATGAGGATTAG"
13361336
}
13371337
],
1338-
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.REVERSECOMPLEMENTED[REVERSE_COMPLEMENT]": [
1338+
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.REVERSECOMPLEMENTED": [
13391339
{
13401340
"name": "gag",
13411341
"start": 789,
@@ -1669,7 +1669,7 @@
16691669
"subtype_nucleotides": "ATGGGAAGTAAGTGGTCAAAAAGTAGCATAGTGGGATGGCCTCAGGTCAGGGAAAAAATAAAGCAAACTCCTCCAGCAACAGAAGGAGTAGGAGCAGTATCTCAAGATCTAGATAAACATGGAGCAATAACAAGTAGTAATATAGATAATGCTGATTGTGTCTGGCTGAGAGCACAAGAGGACGAGGAGGTAGGCTTTCCAGTCATGCCGCAGGTACCTCTAAGACCAATGACTTATAAGGGAGCTTTTGATCTTAGCTTCTTTTTAAAAGAAAAGGGGGGACTGGATGGGCTAATTTACTCCAAGAAAAGACAAGAGATCCTTGACTTATGGGTCTATAATACACAAGGCTTCTTCCCTGATTGGCAAAACTACACACCAGGGCCAGGGATCAGATTCCCACTGTGTTTTGGATGGTGCTTCAAGCTAGTACCAGTTGACCAAAGAGAAGTAGAGGAGGACAACAAAGGAGAAAACAACTGCCTGTTACACCCCATGAGCCAGCATGGAATAGAGGACGAAGAAAGAGAAGTGCTGATGTGGAAGTTTGACAGTGCCCTAGCACGAAAACACGTAGCCCGAGAACAGCATCCAGAGTACTATAAAGACTGCTGA"
16701670
}
16711671
],
1672-
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-XS[REVERSE_COMPLEMENT]": [
1672+
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-XS": [
16731673
{
16741674
"name": "gag",
16751675
"start": 789,
@@ -2003,7 +2003,7 @@
20032003
"subtype_nucleotides": "ATGGCAGGAAGAAGCGGAAGCACCGACGAGGAACTCCTCAGAGCAGTAAGGATCATCAAAATCCTATACCAAAGCA"
20042004
}
20052005
],
2006-
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-BAD-SYMBOLS[REVERSE_COMPLEMENT]": [
2006+
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-BAD-SYMBOLS": [
20072007
{
20082008
"name": "gag",
20092009
"start": 789,
@@ -2170,7 +2170,7 @@
21702170
"subtype_nucleotides": "ATGGGTGGCAAGTGGTCAAAAAGTAGTGTGATTGGATGGCCTACTGTAAGGGAAAGAATGAGACGAGCTGAGCCAGCAGCAGATAGGGTGGGAGCAGCATCTCGAGACCTGGAAAAACATGGAGCAATCACAAGTAGCAATACAGCAGCTACCAATGCTGCTTGTGCCTGGCTAGAAGCACAAGAGGAGGAGGAGGTGGGTTTTCCAGTCACACCTCAGGTACCTTTAAGACCAATGACTTACAAGGCAGCTGTAGATCTTAGCCACTTTTTAAAAGAAAAGGGGGGACTGGAAGGGCTAATTCACTCCCAAAGAAGACAAGATATCCTTGATCTGTGGATCTACCACACACAAGGCTACTTCCCTGATTGGCAGAACTACACACCAGGGCCAGGGGTCAGATATCCACTGACCTTTGGATGGTGCTACAAGCTAGTACCAGTTGAGCCAGATAAGATAGAAGAGGCCAATAAAGGAGAGAACACCAGCTTGTTACACCCTGTGAGCCTGCATGGGATGGATGACCCGGAGAGAGAAGTGTTAGAGTGGAGGTTTGACAGCCGCCTAGCATTTCATCACGTGGCCCGAGAGCTGCATCCGGAGTACTTCAAGAACTGCTGA"
21712171
}
21722172
],
2173-
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-DASHES[REVERSE_COMPLEMENT]": [
2173+
"Ref.B.FR.83.HXB2_LAI_IIIB_BRU.K03455.CfE.BUT.WITH-DASHES": [
21742174
{
21752175
"name": "gag",
21762176
"start": 789,

0 commit comments

Comments
 (0)