Skip to content

Commit 368ef70

Browse files
committed
lint
1 parent 2367cd4 commit 368ef70

File tree

1 file changed

+13
-11
lines changed

1 file changed

+13
-11
lines changed

bin/parse_chromosomes.py

Lines changed: 13 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -13,6 +13,7 @@
1313
"([MDCLXVI]+[a-z]?)"
1414
]
1515

16+
1617
class ChromosomeParser:
1718
def __init__(self, gff) -> None:
1819
self.species = ''
@@ -22,21 +23,21 @@ def __init__(self, gff) -> None:
2223
self.sequence_regions = []
2324
self.chr_candidates = []
2425
self._parse(gff)
25-
26+
2627
@property
def regex(self) -> str:
    """Return the complete chromosome-name pattern.

    The value is the ``prefix``, ``pattern`` and ``suffix`` attributes
    concatenated in that order, with nothing inserted between them.
    """
    return f"{self.prefix}{self.pattern}{self.suffix}"
29-
30+
3031
def __repr__(self) -> str:
    """Return the species name and the regex joined by a tab.

    Empty components are left out, so an instance without a species
    renders as the bare regex and one with neither renders as ``""``.
    """
    parts = [text for text in (self.species, self.regex) if text]
    return "\t".join(parts)
32-
33+
3334
def _parse(self, gff) -> None:
    """Collect sequence-region identifiers from a GFF file.

    Sets three attributes on the instance:

    * ``species`` -- the base name of ``gff`` without its extension.
    * ``sequence_regions`` -- the first field after every
      ``##sequence-region`` pragma, in file order.
    * ``chr_candidates`` -- the subset of ``sequence_regions`` whose
      identifier contains a ``.`` or an ``_``.

    Args:
        gff: Path of the GFF file to read.
    """
    self.species, _ = os.path.splitext(os.path.basename(gff))

    regions = []
    with open(gff, 'rt') as f:
        # Stream the file: only the pragma lines are of interest, so there
        # is no need to hold every feature line in memory.
        for line in f:
            if not line.startswith("##sequence-region"):
                continue
            # Split on any whitespace so tab-delimited pragmas work and the
            # identifier never keeps a trailing newline.
            fields = line.split()
            # A pragma with no identifier carries no information; skip it
            # instead of failing with IndexError.
            if len(fields) > 1:
                regions.append(fields[1])

    self.sequence_regions = regions
    # Intersecting the set with a string compares against its characters.
    self.chr_candidates = [r for r in regions if {".", "_"}.intersection(r)]
39-
40+
4041
def generate_regex(self) -> None:
4142
self.has_suffix()
4243
prefix_pool = self._iter_prefix_pool()
@@ -60,7 +61,7 @@ def generate_regex(self) -> None:
6061
max_match = len_match
6162
self.prefix = prefix
6263
self.pattern = pattern
63-
64+
6465
def has_suffix(self) -> bool:
6566
"""
6667
Assume any sequence_region with a version number "_v#" is a likely candidate for a chromosome.
@@ -72,24 +73,25 @@ def has_suffix(self) -> bool:
7273
self.suffix = re.search(r"_v\d+", with_suffix[0]).group()
7374
return True
7475
return False
75-
76+
7677
def _iter_prefix_pool(self):
    """Yield every entry that ``common_prefixes`` returns for ``chr_candidates``.

    Entries are produced one at a time, in the order ``common_prefixes``
    returns them.
    """
    # A disabled earlier variant also offered the text before the first "_"
    # of the first candidate (plus "_") paired with 1 as an extra entry.
    for entry in common_prefixes(self.chr_candidates):
        yield entry
82-
83+
8384
def correct_prefix(self):
    """Replace ``prefix`` with the spelling used by the first matching candidate.

    ``regex`` is compiled case-insensitively with a trailing ``$`` and
    tried against each entry of ``chr_candidates``. From the first entry
    that matches, the text before its first ``_`` or ``.`` is taken, the
    character that follows that text is appended, and the result is stored
    in ``prefix``.

    If any step raises (for example no candidate matches), ``prefix`` is
    left as it was and ``species`` is printed instead.
    """
    try:
        matcher = re.compile(r"{}$".format(self.regex), re.IGNORECASE)
        hits = [name for name in self.chr_candidates if matcher.match(name)]
        first_hit = hits[0]
        stem = re.split(r"_|\.", first_hit)[0]
        # Text that follows the stem; its first character is the separator.
        remainder = first_hit.split(stem)[1]
        self.prefix = stem + remainder[0]
    except Exception:
        print(self.species)
9293

94+
9395
def common_prefixes(li):
9496
prefixes = []
9597
for first_letter, prefix_batch in groupby(sorted(li), key=itemgetter(0)):
@@ -104,7 +106,7 @@ def common_prefixes(li):
104106
prefixes.append((''.join(prefix), threshold))
105107
break
106108
threshold = count
107-
prefix.append(char)
109+
prefix.append(char)
108110
return sorted(prefixes, key=itemgetter(1))
109111

110112

0 commit comments

Comments
 (0)