diff --git a/Cargo.lock b/Cargo.lock index d84574f0..a6a4339e 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -5423,6 +5423,7 @@ dependencies = [ "pyo3", "pyo3-log", "rand", + "rayon", "sequila-core", "tokio", "tracing", diff --git a/Cargo.toml b/Cargo.toml index 47d326b7..220c08be 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -15,6 +15,7 @@ datafusion-python = { git = "https://github.com/apache/datafusion-python.git", r pyo3 = { version = "0.22"} pyo3-log = "0.11.0" sequila-core = { git = "https://github.com/biodatageeks/sequila-native.git", rev = "43453dca320cc25a02f440850e3b947b813785c3" } +rayon = "1.8" datafusion = { version = "43.0.0"} arrow = "53.3.0" diff --git a/Zapis_genomow_decoded.md b/Zapis_genomow_decoded.md new file mode 100644 index 00000000..87e82aed --- /dev/null +++ b/Zapis_genomow_decoded.md @@ -0,0 +1,21 @@ +# Jak to działa? + +Na przykładzie tej sekwencji (poniżej cała jedna sekwencja): +```` py + +@SRR9130495.1 D00236:723:HG32CBCX2:1:1108:1330:1935/1 +NCAATACAAAAGCAATATGGGAGAAGCTACCTACCATGCTTAAAAACGCCAATGAGCAGNGATTTGTCANCNNNNNNNNCNNNNNNNNTNNTANNANNCTC ++ +#4BDFDFFHGHGGJJJHIIIIGGIIJGJJGIIIIBHIJJJIIJIJJIJDHIGGGIJJJI#-@AEHGEFF#,########,########+##++##+##+2< + +```` + +## Zgodnie z linijkami kolejno + +1. '@identyfikator sekwencji' małpa symbolizuje początek rekordu --> dalej jest ciąg znaków a xxx.1 to liczba porządkowa +2. sekwencja genetyczna DNA czyli zapisane geny gdzie N - niepewny odczyt +3. '+' separator "jakości" czyli po tym są wyniki +4. jakość odczytu (Czyli ten Phred Score) dla każdego nukleotydu (genu) w postaci znaków ASCII + +W tabeli wynikowej jeden wiersz odpowiada jednej sekwencji + diff --git a/benchmark/src/base_seq_quality.py b/benchmark/src/base_seq_quality.py new file mode 100644 index 00000000..bd62b526 --- /dev/null +++ b/benchmark/src/base_seq_quality.py @@ -0,0 +1,12 @@ +import polars_bio as pb +import pandas + +path = "example.fastq" + +print('Odczytan zawartość pliku', path) +fastq = pb.read_fastq(path).collect().head() +print(fastq) + +print('Base sequence quality dla pliku', path) +test = pb.cacl_base_seq_quality(path, target_partitions=4, output_type='pandas.DataFrame') +print(test.head()) \ No newline at end of file diff --git a/benchmark/src/base_seq_quality_report.py b/benchmark/src/base_seq_quality_report.py new file mode 100644 index 00000000..108399fa --- /dev/null +++ b/benchmark/src/base_seq_quality_report.py @@ -0,0 +1,136 @@ +import sys +from pathlib import Path + +import numpy as np +import pandas as pd +import plotly.graph_objects as go +import polars_bio as pb + + +def main(): + script_dir = Path(__file__).parent + fastq = script_dir / "example.fastq" + out_html = script_dir / "report_full.html" + + if not fastq.exists(): + print(f"Nie znaleziono pliku: {fastq}", file=sys.stderr) + sys.exit(1) + print(f"Parsuję FASTQ: {fastq}") + + df = pb.cacl_base_seq_quality(str(fastq), output_type='pandas.DataFrame') + print(df.columns) + print(df[['min', 'q1', 'median', 'q3', 'max']].apply(len)) + print(f"Policzono statystyki: {df.shape[0]} pozycji") + + traces = [] + + for _, r in df.iterrows(): + traces.append(go.Scatter( + x=[r["min"], r["max"]], + y=[r["position"], r["position"]], + mode="lines", + line=dict(color="gray", width=2), + showlegend=False, + hoverinfo="skip" + )) + + customdata = df[['min', 'q1', 'median', 'q3', 'max']].to_numpy() + + traces.append(go.Bar( + x=df["q3"] - df["q1"], + y=df["position"], + base=df["q1"], + orientation="h", + marker_color="rgba(0,100,80,0.6)", + marker_line=dict(color="rgba(0,100,80,1)", width=2), + width=0.6, + showlegend=False, + customdata=customdata, + hovertemplate=( + "Position: %{y}
" + "Min: %{customdata[0]}
" + "Q1: %{customdata[1]}
" + "Median: %{customdata[2]}
" + "Q3: %{customdata[3]}
" + "Max: %{customdata[4]}
" + ) + )) + + traces.append(go.Scatter( + x=df["median"], + y=df["position"], + mode="markers", + marker=dict( + color="white", + symbol="line-ns-open", + size=16, + line=dict(width=2) + ), + showlegend=False, + hoverinfo="skip" + )) + + traces.append(go.Scatter( + x=df["median"], + y=df["position"], + mode="lines+markers", + line=dict(color="red", width=2), + marker=dict(size=4), + name="Median", + hoverinfo="skip" + )) + + height = max(600, df.shape[0] * 60 + 200) + + fig = go.Figure(traces) + fig.update_yaxes( + autorange="reversed", + title="Position in read (bp)", + dtick=1, + range=[0, 100] + ) + fig.update_xaxes( + title="Phred score", + dtick=2 + ) + fig.update_layout( + title="Phred Score per Base Position", + template="plotly_white", + height=height, + margin=dict(l=80, r=20, t=60, b=60) + ) + + plot_html = fig.to_html(full_html=False, include_plotlyjs='cdn') + + table_html = df.to_html(classes="table table-striped", index=False) + + html = f""" + + + + + FastQC-like report + + + + +

Phred Score per Base Position

+
+ {plot_html} +
+

Statistics Table

+
+ {table_html} +
+ + +""" + out_html.write_text(html, encoding='utf-8') + print(f" Wygenerowano pełny raport: {out_html}") + +if __name__ == "__main__": + main() diff --git a/benchmark/src/example.fastq b/benchmark/src/example.fastq new file mode 100755 index 00000000..4b357e52 --- /dev/null +++ b/benchmark/src/example.fastq @@ -0,0 +1,800 @@ +@SRR9130495.1 D00236:723:HG32CBCX2:1:1108:1330:1935/1 +NCAATACAAAAGCAATATGGGAGAAGCTACCTACCATGCTTAAAAACGCCAATGAGCAGNGATTTGTCANCNNNNNNNNCNNNNNNNNTNNTANNANNCTC ++ +#4BDFDFFHGHGGJJJHIIIIGGIIJGJJGIIIIBHIJJJIIJIJJIJDHIGGGIJJJI#-@AEHGEFF#,########,########+##++##+##+2< +@SRR9130495.2 D00236:723:HG32CBCX2:1:1108:1472:1938/1 +NGTCAAAGATAAGATCAAAAGGCACTGGCTTACCTGATTAAGAAATTGTGTAGTCCAACATCAAAATACNTNTNNNNNAGAGNCANGNCAAGCNNANNAAT ++ +#1=DDDDD>DHFH@EFHHGHGGFGIIIGIGGGGIIGIIDDCHIIIIIID@FEGGGIIIIICHIIIIIIG#-#-#####,,;;#,5#,#,,85@A:AB@8>@:@A@9(:((+(834 +@SRR9130495.6 D00236:723:HG32CBCX2:1:1108:2392:1965/1 +CGATAAAGGACTTTCAGTCAACCAACTAGATAATGACCACTGGGCACCCATTCATTATGCATGCTGGTAAATAAATTATTCTGTTCAGGAACATTGAACTC ++ +CC@DDDBDFFHHHJJIJJIIJIJJJIIIHGIGGHCGGIGHHAACC??A< +@SRR9130495.11 D00236:723:HG32CBCX2:1:1108:4089:1977/1 +CATTCCAACCAGCCGCTTAAAGTTTCTAAAAGAAGCTGGTCATGGAACCCAGAAGGAGGAGATACCTGAGGAGGAATTAGCAGAGGATGTTGAAGAGATTG ++ +CCCFFFDFHHHHHJIJJJJIIJJJJJJJJJJJIIGJJJIGHGIJJIJJIJJIIFHGHIJJGHEHHFCEFFDEDDBDDDDDDDDDDDBACDDDDDDDDDDDD +@SRR9130495.12 D00236:723:HG32CBCX2:1:1108:6197:1936/1 +NCTTAAAGGCAAGGTGCTCGGCTTCCGCTATCAAGACCTCCGACAGAAAATCCGGCCTGNGGCTAAAGANCNNNNNNNNANNNNNNNNCNNGGNNCNNGGC ++ +#1BDFDEFGHHHHIJJJJJJIJJJJJJJJJJIJJIGIJJIJJJIJJJJHIJJHHHFFDC#,;?BBDDDD#,########+########+##++##+##++8 +@SRR9130495.13 D00236:723:HG32CBCX2:1:1108:6415:1939/1 +NTGTGTATGGGGATGAGGAAGGATATTAATATGTTCTATTTGAGATTTAGGGATTACATTTGTTTTTGCNCNCNNNNNTTTTNTCNTCATTTGNNGTNAAT ++ +#1:ADDDFHGGHFGGBHIGGIIJJEIIIJJIJIJJJFGJIIHGHGDGHJGHIHIIIIJJIIHFHIIJJJ#-#-#####,,;?#,;#,8?DDEE##,+#+2< +@SRR9130495.14 D00236:723:HG32CBCX2:1:1108:6361:1952/1 +TCAGATCTTATTTTAATAGTTGACTTTACCTCTTCTTTGACTTCCTCTTCCTCGGTCTCAGTAGATATAGATGGTACCTTGGGCTTATGCCATGAGATCTG ++ +CCCFFFFFHHHHDHIIIIJJJJJJJJJJHIIIJJJJJJJIHJHJII>GHIEGHIIIIJJJIJJIHHIJJJIJIGHIJJGJJHFHHFFDCFFEDCEDCCDEC +@SRR9130495.15 D00236:723:HG32CBCX2:1:1108:6263:1960/1 +CAATATCTGACTGAATGGGCCCATTTTCATAATATTCTGAAACTGTTCATACATGTCTCGCAATGTAAACTGACCTGAAATGCAATACAAAAAAATTCAGA ++ +CCCFFFFFHHGHGGGIIIIJJIJIJJIIIIIIIIEIHGGIEGGHGIJJIJJJCECGHIIIJJJJJIFGHIIHGIIJJHHGEFHDFFFFFCCCDDBBCCDCA +@SRR9130495.16 D00236:723:HG32CBCX2:1:1108:6338:1988/1 +AGACACTAAAATGCCATGTATGAGACTACATAGACATACCAATTTACAACACAAACACATGAAATATACATGAGAAAACATTAACTTACTTCCAGTTGGGA ++ +C@CFFDDDHGHHHIIIIHJJIIHIHGIJJJJJIJJJIJIIHEHIIJJJJJJIJJIIIIIJJDHIJIJGIJIJJIJJHHGGHFFFFFFFEEEDCCC@ACCBA +@SRR9130495.17 D00236:723:HG32CBCX2:1:1108:6742:1944/1 +NGAAACACTCTTTTTCTGGAATTTGCAAGTGGAGATTTCAGCCGCTTTGTGGTCAATGGTAGAAAAGGAAATATNTNCATATAAAAACTAGACAGAATGAT ++ +#1BDFDFFHGHGHJJJJJJJJHIJHHIJIIJJIJJGIJJIJIIJJGIJIHIJJJIIJJJHIEIIJJJJIHDEFH#,#,5=ADEEEDCDDDDDDDCDD5@CD +@SRR9130495.18 D00236:723:HG32CBCX2:1:1108:7076:1942/1 +NGTCTAAGAATGAAGTGCTTATGGTCAACATAGGCTCCCTGTCGACAGGAGGAAGAGTTAGTGCAGTCAAGGCTNANTTGGGCAAAATTGTTTNNACCAAT ++ +#1:B:BDDHHFFHIEGGIGIDEHGEEGIGHIIIFACHIGIGCFGEHIGGHHGHGH@DCGGIDEIIIIFFHHAEE#,#,5=@BBC@BCCCCCCC##,+8?BC +@SRR9130495.19 D00236:723:HG32CBCX2:1:1108:7440:1957/1 +CACCTGATGTCCCACAGTCCTCATAGACACTAGCACTGACTGCTGGCCATCGTCTCAGCCAGATGATGTTGACCTGCTAGCTTTTCAATTAAATTATTAAA ++ ++=144=DD>D4CCD?E@AECFFIIIIEI?E+??;3EBDECEIBEECDIEIIADDDDEIDCDCA;=A@CECE7ACD=(;;A@DA@A@A:ADAAAD>AADBB> +@SRR9130495.20 D00236:723:HG32CBCX2:1:1108:7363:1977/1 +ACTCATAGAGTTGAAGATTCCCTTTCATAGAGCAGGTTTGAAACACTCTTTCTGGAGTATCTGGATGTGGACATTTGGAGCGCTTTGATGCCTACGGTGGA ++ +CCCFFDDDFHHHHJJJIJJJJHHIIHGIJIJJJIGGHGIJIJJIIIJJJJJIJIGBFDHIIJIJGIJIGGCHGGIJHIIHHHFECDECEEDCDDCBD9?B? +@SRR9130495.21 D00236:723:HG32CBCX2:1:1108:7298:1979/1 +AACCGTCGCCAGGTACCATCCCAGAGAACTCTGTCTTCCTTACTTATAGCCAAGTTGCCGGCAGATCACAGCTGCATGCTTATCGGTCCATCCGTCATCGC ++ +BCCDDDFFGGFGFJIBBHHIJJIIHHIIIGJIIHIIJJJIIEIGHJIIJJJJIIHHGIJFGHGFDDCEECDDDDDDDDDDEDDDDDDDBDEDDDCCC +@SRR9130495.23 D00236:723:HG32CBCX2:1:1108:7307:1995/1 +TAATTTGGTATATGTCTTTTTAAAGGCATTTTTATTAGATATTTCCTTAATTTACATTTCAAATGTTATCCCCAAAGCCCCCTATAATCTACCCCTGCCTT ++ +;?7DD?;DBFHHFIA;A@AABBB@B?2<58+:?<<9<@: +@SRR9130495.25 D00236:723:HG32CBCX2:1:1108:7870:1955/1 +CTATCCCGTCGGGTGACTGTTTCCTGCTTTGCAGTTATTCAGTGGCAGAGCGTGGCGCTCTAATTTCTGCTTTCCTCTTTCCTGCAGATTGTGTGCTACAT ++ +CCCFFFDFFHHFHBHGJIIIHGIIIJJIJIIIIJHIIIIEIJJIIJJJJIJIJIJDFEDDDCEEEEEEDDDDDDDDCDDDCDDDDDDDCDDDCDDDDDDDD +@SRR9130495.26 D00236:723:HG32CBCX2:1:1108:8157:1994/1 +GAAGTGCTCTTCGTTACTACTTAAATCCCCCTGGGCATGTTTCATTATTTTACAATTTGTGCAGAACCCTATCCAAACACACATGGAGTACAAATGACTTC ++ +CCCFFDDDDHHDHHIGIIBIHHHJJJ@FGGA?@CCCCCC@CCCDD +@SRR9130495.27 D00236:723:HG32CBCX2:1:1108:8703:1937/1 +NATAAAAAAATAACATCCTTTCCTCCTAATAGCTTAATTATTTGAAAAAAAATATTTTCNAATCACATGNANNNNNNNNTNNNNNNNNTCTTTNNTNNCCT ++ +#1=DFDDDHHHHHIIJJJJJFIJJJIGIEGIIJJJHHIJJJJJIIJIIIIIJEHEHHHA#,;??AEDDC#,########,########++8??##+##(+2 +@SRR9130495.28 D00236:723:HG32CBCX2:1:1108:8702:1991/1 +CTCAGAGATTAAAAATGAATAACGCCTGCCGGCCAATGAGCGGACTCACAGTCCCTGTTTGTTTGTAAGCTAGGTGATTTTCAATCCACAGGGCAGGCTGA ++ +@@@DFDFFGGDHFGIIBGEHJIIIBGIIIJJIIJIJIIFGGEGIJJJHGGHHHDCFFDDDEDEDDDDDCDDDCBDDACDEDEDDDDCCCCDGII@GIFGFE???BFBBEHIGGIEEHIHIGGHHGIHA3?CH;?@CB@DCCEDEDD3 +@SRR9130495.34 D00236:723:HG32CBCX2:1:1108:10535:1962/1 +AATACAGAAAAGTTAAGAGCCAGCCCCAGGCGGATTGGATGAATAGGTTGCATCTCTTTCTTGCTTATATCAAATGCCTCTTGGCAGGCTCCTTGGGAATT ++ +???BD:A:3=?B:;?;;CA;;;A3-5>5-5:(::@8/2?8?9>>3(83(+ +@SRR9130495.35 D00236:723:HG32CBCX2:1:1108:11147:1968/1 +GCTGCCTTCTCCCCTCAAGGATGCAGTGGAAGTGTCAACCTGGAGAAGATGCTACACGATGCAGGAGGTGAACTCGGCCCTCAGTAAAATCCAGCTGGTGG ++ +CCCFFFDFHHHGHJFEGIHEGHIGIIGCCGGGIIJJIJJGGGGHCGIF>DGHIIIEHHGIIJJDBGHFHFCCFFFDDCDDDDBDDDCCDEDA:CACD@CDD +@SRR9130495.36 D00236:723:HG32CBCX2:1:1108:11124:1986/1 +GACAGGGTTTCACCATGTTAGCCAGGACGGTCTTGATCTCCTGACCTCGTGATCCGCCTGTCTCGGCCTCCCAAAGTCCTGGGATTACAGGCGTGAGCCAC ++ +CCCFFFFBFFFHGGHGHIHIIGIJFJJJIJHIIIFGHGGIIGEGHIH@@FGGIJIIGGIHIEEHEEFFDDCCCCBDDACCDCDBAACCDDDBDDDDBDDCC +@SRR9130495.37 D00236:723:HG32CBCX2:1:1108:11773:1947/1 +TACCTGCCTCTGCCTCTCGAGTGCTGGGATGAAAGATGTGCACACCCCCACCACCACCACCACCACTGCCTGGCNCNGTTTTTGATTTCTTATTCTCCAGA ++ +CCCFFFFFHGHHHJIJIJIIEHIJJIJJIJJIHIHJJIGFIIIIJBHHGFF>HGIJIEHHHFGDEEEEEECC?B#,#,,5?@HF1CGBGHCDDFF7=DEG.?AAC?3@EED;6@;>(-;@AC?31(,5?(4::A>AC +@SRR9130495.46 D00236:723:HG32CBCX2:1:1108:14226:1948/1 +AACCTGCACCCAGAATGGCAGGAGGTCCTGGTGGCCCAGGGGGTCCTGGTGGTCCAGGAACACCAGGTCTCCCANANCCAGGTGGCCCAGGCAGGCCTGGA ++ +??1D1BDDHFHHBBHGGGAFG)AF1:?CEGD@BGAFDGIGGB'5;CE77?=???>>CC3#+#++228>>28((2(>ACC?CCDDCCD@ +@SRR9130495.48 D00236:723:HG32CBCX2:1:1108:15049:1993/1 +TGACCAAGAACTCACAGAGATCCCCCCCCCCAGGGCTAAGATTAAAGGCATGTGCCACTGCCACTGGATAGATATTATCTTTTATTTTACCTGACTGGTTG ++ +@CCFFDDDHDFHGJJJJIJGIHHHIIJJIJFE=(5;?@>@A@;@C>CAB=@<:@C@CA:>CC3:>CB<@@?344>>@@A>CDC>ACDD:>4>>>ACD?CC( +@SRR9130495.49 D00236:723:HG32CBCX2:1:1108:15487:1951/1 +ACGGAGGGTGGGGCTGGGTGATTGTGGTTGTCTCCTTCTTCACCCAGTTCCTCTCTTACGGATCCCCGTTAGCTNTNGGGGTCTTGTATGTAGAATGGCTG ++ +BCCFD@DFDFHHGDGIIICGHIIJJIJGHIIJIIJJJIJIJIJEHIGHHHHHHHFFFFFFDDCDDCD@DDDDD:#+#+2<@8GHIIIEHGACFHIIGGIBHIIHHC??BDC@BBCECDCE63>@@CACCDD@ +@SRR9130495.51 D00236:723:HG32CBCX2:1:1108:15923:1957/1 +CCGCAACTGCCATGGAGCCACAGCCTGGTCCGTAATAGATGCAAAGCTTCTCAATAGTCAGGGGCGTGGTTTCGCGCAGCTTGGAGGCCAGCAACAGGCAG ++ +CCCFFFFFHFHHHIIFIIIGIIFIIGJIIJJIFHGHIIIIIJIIFIJIIIJJJJJJJGGIGJFFH@?BBBDBCDDDDDDDDDDDDDDDDDDDDDDDDDDD? +@SRR9130495.52 D00236:723:HG32CBCX2:1:1108:15793:1968/1 +GTTTTTCCACAGACCTCTGATCTCTTACATTCGAAAGTTCTACTACTATGATCCTCAGGAAGAGGTGTACCTGTCCCTAAAGGAAGCGCAGCTCATTTCCA ++ +BB@FFFFFFFHGDGFHJJJJIFIIGGG@FIIIGIBGGDHIIIJCHIIJJDHIIJJJIIIGIIJJFHHIJCHGDHIIHHHHHFFFFFDDDDDDCDDDDEDDE +@SRR9130495.53 D00236:723:HG32CBCX2:1:1108:16082:1968/1 +GAAACTTGTTTGTGACGTGTGTATTCAACTAACAGAGTTGAACCTTTCTTTTTACAGAGCAGCTTTGAAACACGCTTTTTGTAGAATCAGATCGGAAGAGC ++ +@<@ADDDECBFFHIFEGDG;EEHHB@FHGHIIGGEHGGHGGEGEGICGCEFFDB@D>AE>ADC@CBBFGIIJJJJIHHIJJGH?DGGHCFHHIJJEEIIJAHIJJFG=FGGGIFHHIIDHGEHIHHHHGHGEB;?CDCECEEDD +@SRR9130495.55 D00236:723:HG32CBCX2:1:1108:16048:2000/1 +AGGACAGGAAGGACGCTTTGAGATATGATTTCACAGGCGACAGTGAGAGAAAACCAATGTCTTTAATGCATTTCTCTGCAGCATGTGACAAACTTTCAACA ++ +CCCFFFFDFHGHHIIJJJJIFGGIJJIIIIJIJIHJIIJIHGIJJIJGGIIJIJJHHHHEDCDFFFEEEDDEDEEDDDDDDDDDDCDEDDCDDDDDDCCD@ +@SRR9130495.56 D00236:723:HG32CBCX2:1:1108:16580:1970/1 +GCCTGTACTCCCAGCTACTTGGGAGGCTGAGACAGGAGAATCACTTGAACCCAGGAGGTGGAGGTTGCAGTGAGCCAAGACCGGGCTATTGCACTAGATCG ++ +@@@FFD?DBFFHHIIEHCIJIFIJHEDCH@GGEBFHHIJJIIIIIJJJJJIFHFHF@G-6@AAEDFFF>AEC@@A?;=?BCD6/<@>BAAC>:@C:CDDA? +@SRR9130495.57 D00236:723:HG32CBCX2:1:1108:16594:1971/1 +TCCTCTGACTTTGACACTAGTGTTGACCTTGCATGAGGAGATGTTCTCCATTTGGACTAACCTGATGTACACAGACGTTACACTTATCACAGAATACCATA ++ +CCCFFDDFFHFHFHIJIJJIHIIIJJJJJIJJJJIIIIHIGIIJJJIGIIJJIIJEHIIJIJJJIGIJJJEIHJJIIHHEFFFFFFCCEEEEDCDDDDDDC +@SRR9130495.58 D00236:723:HG32CBCX2:1:1108:16808:1998/1 +ACCAATTTTCCCCTCCCCTTCCTCCCTCCCTCCCAGCCCCCTTCCTCTCTCTACCTCCTGTTATTGTTTTGTTCCTTGTTCTATGTAGGATTGAAGCATCT ++ +@@@FFDDFHDFHGIJJJJIIGGDFHI>DGC;DHI9??FHIJIIHG>>3>;ACCCC9:@>@:>AA +@SRR9130495.59 D00236:723:HG32CBCX2:1:1108:17428:1967/1 +TGCATGGTGCTGAAAGCTTTGTTGCAGCTTTTCTTGGGATTGCTTAGCTGCTCCGGGTCGATCCACTTGCAGATGAGCTCTTGCTTGATGCACTGCTGCCG ++ +?<A3>A>>AAAA?3 +@SRR9130495.60 D00236:723:HG32CBCX2:1:1108:17508:1988/1 +TTGTTCAGAAAAAAGTATCTTGAAACCAAAAGAACTGGGATCTTGTTAAATGCAGATTCTGTTCATTAGGTATAGGTATGCAGTCTTACAAAATGAGGTAG ++ +CCCFFEFFHHHHHJJJJJJJJJJJJJJJJJGIJJJJJJJIIJJJJJJJJIJJIJJJJJJJJJJJIJJIIIEHHBHGHHEFFFFFEEEEDEEDDCDCDDCDC +@SRR9130495.61 D00236:723:HG32CBCX2:1:1108:18425:1951/1 +CCACTTAATAAATCACCTATCAAGTTGAATTATTTGTGCAAAGGCACTAGGCTGAATAGAGACCACTCAGTAGCNTNTTTTTAATCTTGCTAAGAAAGAAT ++ +CCCFFDDFHFHHGJIIJJJJJJHGHEHHHIIJIJJIJGJIHIJHEFDHGHIFIJJGHIJJJFIGGIHIIIJIII#-#-5@DFFEEEDEEEDEDDACDCCBC +@SRR9130495.62 D00236:723:HG32CBCX2:1:1108:18468:1964/1 +CTATTGACTTTTATTAGAAAGGGTCTTGTTGCATAGGTAGGTCTTTAACAACCATCTCTTAAAGGGCTGGGATTGCCAGAGTAGGCCAACACGCCCAGCTA ++ +CCCFFFFFGGHHGIGIJIJJIIIJJJJIJJIJJJJIIJDGEHGIIJJJIJJJHIJJIGFHGIJGEGIJJJIIHHHHHHFFFFFEDEEDDDDDDDBDDBBD@ +@SRR9130495.63 D00236:723:HG32CBCX2:1:1108:18615:1941/1 +NAGCCGAGAGGCGCCGGCTCACCTGCCTGGGTCCCGGCCTTTCTCCTGCAGTGCCAGGGATTCACCTGANGNCNNNNNNTCTNCTAGGCAAGCNNATNCTT ++ +#1:DDFDDHHHHHIIJIIFGJJIEFHHIHHIIIJJIEHFFEEEEEEE?DFF;5:AAB9>29(#+#++8++4>>:@>AA:@1<@@A(:4? +@SRR9130495.72 D00236:723:HG32CBCX2:1:1108:1440:2047/1 +GCTGGTGCAGGACACCAGAATCCGCTCGATCATGCTCCCTAGAGAGGAGGGGCACAGTGAGTACACATAAGCACATGTACACACACACCCAGGACCCAAAG ++ +CCCFFFDEHHGHHHIIIIIIIIJJIJJJGEGHIJIJJJJIIJGHIIJJJIDFEDFFFFEEEEDEDDDDDDDDDDDDDEEEEDDDDDDDDDDDDDDDDDDDA +@SRR9130495.73 D00236:723:HG32CBCX2:1:1108:1468:2080/1 +ACTGTCTTTTTTTTAAAACAGGTGATTGCCCGTTGATTGTTCAGTTTGCTGCTAATGATGCAAGACTTTTATCTGATGCTGCCCTGCTAGTCTGTCCCTAT ++ +CCCFFDDEHFFDHIEIIJHGCGFHCIIHIIIHH@FGGIHIGHIJJIJGIIIJBHIGEIHGHHGGHFFFFFFEEEEDEDDDDDDDDDDDCDDDEDDDDDDDD +@SRR9130495.74 D00236:723:HG32CBCX2:1:1108:1333:2084/1 +ATGAGCACACAAGGGATGATCAGATTGATGGTGTAGAAGAGTGGCTTGCGCTTGATGATGAAGTCATAGGTCACGTCCACATAGCTGGGGTCCTGTGGGTT ++ +CCCFFFFFHHHHHJIJHDIIHHHIIJIIJJJJJIJJIIJIJJJIBDGIJJJJIJJJJGIIIJIAHEEHEFFFFF>EDCDDDDDCDDCDDDDDDDDDCDDDD +@SRR9130495.75 D00236:723:HG32CBCX2:1:1108:1447:2137/1 +TCCACTTGTACAAAAAATTACAAAAATTAGCTGGGCATGGTGGCACACACCTGTAGTCCCAGCTACTCGGGAGGCTGAAGTGGCAGGATCACTTGAGGCAG ++ +CCCFFEFFHFHGHJJJJIJJJJIIDIEHJIIJJJIGJJJHGJIIDHIDGIJIJJIGHIJJJJJHHHFEEBDCDBBDDDDDDDDDDDDDDDDDDDDDCDDD@ +@SRR9130495.76 D00236:723:HG32CBCX2:1:1108:1499:2151/1 +GAGAAAAAGCATCCCTTTAATAAGGCCGCCCCGGTTCCAAATCAATCCTGGCATTGCAGGAGGCAAGGGGGAAACACAGCCACGAAATTGGATTAGCTCTT ++ +CCCFFFFFGGHHHJIIJHIEIJJIIIIJIIGJJIHJIJJIGIJJJIIJJHHHHHFFFFFFDCDBDDDDDDDDDDDCDDDBDBDDBBDDDDDCDDDDCDDCD +@SRR9130495.77 D00236:723:HG32CBCX2:1:1108:1280:2166/1 +GCCTTCTTCCCAGCAGCAATATGGCTCTTTCTTCAGCTCTTATCAGTCACATCCATCAACGAGTGGCTTTTAAAAGGGTATGTTTAAACCTTTTGACGGGA ++ +CCCFFDEFHHHGGJIJJIJIJEIJJJJJIFGIIIIIIIJIIGIJJGIIBHIJJJJIJIEH>CG;CHCHGHICHFFFFFFDDC;@CCEEDDCDDCCDDDDDB +@SRR9130495.78 D00236:723:HG32CBCX2:1:1108:1458:2216/1 +TTTCTTTCCACACATCCCACCTAACACCCAAACTAAGCACTCAGTGCTTGGAATCTCCCCACCCATTCCCTCACCCCTGCTCTTCCATCATTTCCTCCAGC ++ +CCCFFFFFHHHHHIDHIIJJJJHIIJFHIJIJIGIJHGIIIIGJEHIGIIJCGEEHJJJJJJJDHEHHGFFFFFDCDDDDDDDDDDDECCDDEEEDDDDDD +@SRR9130495.79 D00236:723:HG32CBCX2:1:1108:1634:2001/1 +TGTGCATTTCTCATTTTTCACGATTTTCAGTGATTTCGTCATTTTTCAAGTCGTCAAGTGGATGTTTATGATTTTCCATGATTTTCAGTTTTCTTGCCATA ++ +CCCFFFFFHHHHGJJJJJJJJIJHGIJJJJIIIIJJIGIIJJJIJJJIIFIIJJJJJIJJJIJIIIIIIJIJGJJJJFHHGGHGFFFFCEFFDEEDEEDDD +@SRR9130495.80 D00236:723:HG32CBCX2:1:1108:1566:2120/1 +GGACGAAGTAAGGGAGGAGCAACTGACAACATTCATCTTGTCTGTCTCCTCCACGTCCCGAGGTACAAGGCGGATGTCATTCTTACTAATTTTTTTCTTCT ++ +CCCFFFFFHHHHHIIJJJJIJJJIJJJJJJJIFIJJJIJIJIJIIJJIJIJJJJIJJIIJHHFFEEEEEDDDDDDDCDEDEDEEDDDEDDEECDDDDDDDD +@SRR9130495.81 D00236:723:HG32CBCX2:1:1108:1863:2047/1 +AAATTCGGACCCCTTGGGTGGAATATTCCTTACGAATTCAATGAGACAGATCTAAGAATCAGTGTGCAGCAACTCCACATGTTCCTGGACCAGTATGAGGT ++ +@BCFFFFFHHFHHHIJIJGIIIJIJJJJIIJJIIIIJJJJGIJJJIJJIEGIIGIJIJJJEGHHHGEEHFFFFDEEEDDDDEEEDDDDDDDBBCDDCCCCC +@SRR9130495.82 D00236:723:HG32CBCX2:1:1108:1844:2145/1 +TAACTCTCTGCCTGCGATGTCCCTACCTTCCAGAATGGTGCCATGACAACGGTGTCAACTACAAGATCGGAGAGAAGTGGGATCGGCAGGGAGAAAATGGC ++ +@CCFFFFFHHGHHJJJJJJJIJJJJJIJIIIHIIIJIIJJJJIJIIJIJJJJJJJJJIJJIIJEHHGHHFDFDDDDDCDCDDDDDDDDDDD?>BDDDDDDD +@SRR9130495.83 D00236:723:HG32CBCX2:1:1108:1772:2188/1 +GAGGTAGGGGTGTGTGTGAATGGGTGAGTGTGTGCCTATGCTTGTATGCCATATGAGAGAAAATGCAGCATTTAAAATCAGTGGTTAACGGCCAGCACAGT ++ +B@BFDFDDHHDDHHGIGIJIJGIJ:CFHHIGGIJJIEHGIIIJIIIFHGIJBHIJJJJJJCHHIHHHHHGFDFFFFEEEECEEDDDDDDDDDDBDDDDDCA +@SRR9130495.84 D00236:723:HG32CBCX2:1:1108:2103:2085/1 +TACAAATGTGCCAGGCACTCTTCTAAGTCCTCACATGCATGAAGTTATACAACTCTACAACAAACCTAGGAATATAAACTGAGGGCAGGGACCCCCAGCAA ++ +CCCFFFFFHHHHHJIJIJJJJJJJJJJJJIJJJJJJIJJJIJJJFHIJJJJIIJJJJJIJIIHIICHHIJJJIIIJJHHHFHHFDDDDDBDDDDDBDDDDD +@SRR9130495.85 D00236:723:HG32CBCX2:1:1108:2067:2091/1 +ACCAGCCCTGCTGCCACCCAGCCCACGTCCCGCGCGCCACCCATGCTGCTGCCTCGGAGCTGCAGGGAGCCGGGGAGCCAGGGCCACACGCAGGTGCAGCT ++ +?@@D?A:BF8DDFFFFFFFFAECBF@GFECAEFIIIIIIFBE?DBBD;@CCCCBBBBBB@B::AABBBBBB7>BBB>@BB?B>B>BB?/?A?BCCCBDDDD>@ +@SRR9130495.87 D00236:723:HG32CBCX2:1:1108:2387:2038/1 +GGCTAACCACTGCCTTGTCAAGTTGTGTAGAGTGAGATTCAGGGGTGTTGAAGTAATGTCCTTGTTACTTGCTGTAGGGCATCTGTTTTCTGTGTATCCCA ++ +CCCFFDDDDHGHGJEIGHHIJIHGGIIHGIIIIIEGBEHGGHIGGAFHIJJJJJJJJIDGHIIGIJJJIIHGFHEHFDFEDCEECDCDDACCCAACDFCCC +@SRR9130495.88 D00236:723:HG32CBCX2:1:1108:2285:2075/1 +CTGAAAGCTGAGCGTGAGCGTGGTATCACTATTGACATCTCCCTGTGGAAATTCGAGACCAGCAAATACTATGTGACCATCATTGATGCCCCAGGACACAG ++ +?;@DDBDDDFFD>ACGED@D8@):E*::??FFC@;FEF>E;CC=CC=@DDD>?;>A>A>A;AB3;A(;@:??DFBCB4<CCD@=BB@-(4812>>> +@SRR9130495.93 D00236:723:HG32CBCX2:1:1108:2748:2098/1 +CATCATCTTTTTTTTTTTTTTCTCCTGAAAACTGTCTAGTAGTTTGATATATTTTGTCCGAGGTTATTTCAAGTGTTTTTTTTTTTTTTTTTAAAACGGTG ++ +@@@DDDDDHHHHHIIFEHIIH8))7)7CEF9).)7;;>B@>9BD;;(6(55>DDDCBCC@/8-084@CC>C(((+4>?CBBBBBBBBBBB>&23:A(5?(( +@SRR9130495.94 D00236:723:HG32CBCX2:1:1108:2733:2156/1 +GACTGAGAAGAACAGAAAGGGAGAGAGAGGCCAATGGAAATACATGAGAAGGGAGAGAGGGAGAGAGAGGGAGGGAGGGAGGGAAGGAGGGGGAGAGGGAG ++ +CCCFFFEFGHHHHJJGIIIJJHIIHHIIJJJJJIJIIHGJJJGIJJJJJJJJJHGGHHIHHHFDFCDCDDD>BDDBDDDDDDD>BDD?BDDDDBDBDBD@D?ABD@BD?BBDDDC +@SRR9130495.96 D00236:723:HG32CBCX2:1:1108:2818:2076/1 +ACACTTCATGGCAACCTGGCTTAGATTCTTCAAAATTTCTGATCCTATACCAAAGCCTCTGTAATCACTCATCACGAAGAAGTCTTCAAGATACAGTAACT ++ +CCCFFFDDHGHHHJJJJIIJIIHIJHGCHIFEGGJJJJIJIGIIJJJIIJCEHIIIIJIBGHGGIIJIIBFGGGGHHGHFFFFDEEDECEDDDDCD>CCDE +@SRR9130495.97 D00236:723:HG32CBCX2:1:1108:2848:2112/1 +AACCTCTTCTCTTTGTCTTTCTCTTTATCCTTCTCCCTCTTGCCAGGACTGGACTCGCTGGTGATGGTGACGACGCTGGTGGGTAAGGTCTGCGCCCGACT ++ +@@BFFFFEHGHHGIJDEHIJIIIIIIJIFHIIIJEIDHIIIIJJIIIGIEIIJJIIIJFEHFHIIIGIIJIFBEDDBD>=?BB@CACCCAACDDBDBB5;6@;ACBCCCC?@AA>C>?<<<9)?FHFCAG=GFFG>FGGEGHIEEBEDEFC>C@::=BB@BCACCC@CA3:(8@C<8?CC +@SRR9130495.100 D00236:723:HG32CBCX2:1:1108:3014:2117/1 +CCCTCCTGAAAAGGTCCAGCTCCAAAGCCTGACCCGTAGCTGCAGAGAAGAAAGCTTTTCCTCTAAAGGCTGAGGAAAAGATGAAAAATCACTGCTAGAAC ++ +CCCFFFFFHHHHGIJIJJJJJJJJJJJJJJJIJJJIJJIJJJJIJGIDHHIIIJJIJJJJJIJJJHHHHHFFFFDEEEEDDDDDDDDDDDDDDDDDDDDDD +@SRR9130495.101 D00236:723:HG32CBCX2:1:1108:3316:2011/1 +GCAGAGCTGAATGGGCAAGCCCAGGACCCTTTTCAGACATTCTGCTGGCCTTTGGAAAGTGTACTCCTGTTGTATTTGATTACTTTTAGAGGACAGTACAT ++ +CCCFFDDFHHHGHJJJJIJFGIGHJGIJIIIIIHIIGIIJIIIIJJJIIIIJIIIGIJGIJJJJIIJJJEEEE?ECFFFFFFCCEDEEEDDDDDDDDEDCD +@SRR9130495.102 D00236:723:HG32CBCX2:1:1108:3264:2036/1 +GGGTGCTGGAGATAGCCCACGTACACTCCTTCTTGCTGGGGTACTTGTCAGGCCAGTTGGGGCTGGTGATGGTGCCACTGGTGGATGTCACCTTGTGTTCA ++ +=@<=B+AD>BFDFIIDEDGEIGFIIIIIICDFGFFGIII;D?F>?*/9BF>DAF;CFFGI>/:=?>7@BAA:;@5=A5>@=,98?:>@(;:4>ABAB?ABD +@SRR9130495.103 D00236:723:HG32CBCX2:1:1108:3400:2065/1 +TCTGTCTGTCACCAGGTTGGAGTGCAGTGGTAGGATCATGGCTCACTGCAGCCTCGTCCTCTTGGGTTCAAGCAATCCTCCTGCCTCAGCCTCCCAGGTAG ++ +@@BDFFFFHHHGHIJJFHEG@GHHIIAFD@HGGGEHIJJJGIJJGGGIHFDAHHHHJFCGGGHGJI;CHFCEDDFFFCEDEEDDDDDDDD<C +@SRR9130495.104 D00236:723:HG32CBCX2:1:1108:3468:2219/1 +TGCACTTCGTTCTCTTAATGAAACCCTTTGACTTAACCATGACTCCGCTCTGCTCTTGAGTTTGCAAGTGTGTGCGAGTGCCCGAGAGACAGTTTTTTTTT ++ +CCCFFEFFHHHHHJIJIIJJIIJJJIIJJIHIHJJJJJFHFHIIJIJJJJIJIJJJJJGGIIJJJGDIJJJIHHHGFFDDEEEDDDDDDDCCDCEDDDDDD +@SRR9130495.105 D00236:723:HG32CBCX2:1:1108:3722:2006/1 +TCCATAGTTTCGCAGAAGACTTGGAAGGATGTTGATGTATATGCAGGTCCATTATCAGTTTTTAAATTAGATGGTTTTCCCCAAGCTGCCCATGCGTCTAA ++ +CCCFFFDDHHHHHJJIJJIIHGHIGIIDFHHIIIHHIJJIJJIJIJJJJJJIIJJIJG=DHHJJIJIIIJJJJJIGHGHHFFBFDDEEEDDDDDDBBDDDD +@SRR9130495.106 D00236:723:HG32CBCX2:1:1108:3517:2148/1 +CTCTGTTCTGTTCCATTGATCTATATCTCTGTTTTGGTACCAGTACCATGCTGTTTTGGTTACTGTAGCCTTGTAGTATAGTTTGAAGTCAGGTAACGTGA ++ +CCCFFEBFHHHHFGGGIEEHIIJIJJIJJIIJIJJHIIJIIJJIIFHGIIIIJJJJJJFIJIJJJJGIIJIJCHIJIJHGJIJHHHHHHFFFFFFEEDECA +@SRR9130495.107 D00236:723:HG32CBCX2:1:1108:3927:2234/1 +CTGTGCTCTATGTACACGCCCATCTGTTTGCCTGACTACCACAAGCCGCTACCACCGTGCCGTTCCGTGTGCGAGCGCGCCAAGGCCGGCTGCTCGCCGCT ++ +@C@FFFFFHHHHHJJJJGIIJIJJIJEHIIGHGJJIJJJJJJIIGHHIJIJIGHJIIJIHHGFFDEDE?BBDDBDCDDDBDDDDBDD>BDBDDDDBDDDB< +@SRR9130495.108 D00236:723:HG32CBCX2:1:1108:4124:2011/1 +GACTCAGAGCCAGGGCCCGGGAACAGAGATGACTCGAAGGCTAGGGCTCCAGCCAGACTTACCGGCACACGTACACCTCTAGGGGTGGCAGGGTGCTGGGT ++ +CCCFFDDEGGGHHIJIIIJIIIIJIHHJJIJIIJIJIGGIIGIIHIGGIGHBHGHFEFFEECEDDDDDDDDBDDDDDCBACCDDDDDDBDDDDDDDDCD?9 +@SRR9130495.109 D00236:723:HG32CBCX2:1:1108:4130:2090/1 +TTCTATTTCTATAAACTGGCCTATTTTGGGTATTTCATATATATGGAAATATATAATTTGATTTTTTTGTTCTCTTAGCTGTATGTTTTCAGGATTCTTTC ++ +@BBFDFFFHHGHHIJJJJJJJIIIJJJJIJJJIJJJJIJJIIIJJJIJJJJIJIIJJJJJJJJJIHJIJJHHHHHHFFFFFFEEEDECEEDDDDDCDDEDD +@SRR9130495.110 D00236:723:HG32CBCX2:1:1108:4176:2091/1 +AAATTGAAAGTAAATGTATACTGTAGTCCCACGCACGAGTGAATAAAGGGGTGTCTAAAAGGAGTGTGTTCTCTTCCAGGCTGCATCTCTCGGTACTCAGC ++ +;8;ABD?+AA=ADBHIGBHE?ACCCCC +@SRR9130495.111 D00236:723:HG32CBCX2:1:1108:4108:2121/1 +ATGCGGAAGTAGGCAAAAATGATGTGCTAGACTACAAGAATTCCTTTTACAGAAAGTAACAAATACAGAGCCAAGAAAGTTTTTGTTAATTATCACGGTGT ++ +@@@ADADA@AD>FIIBBBFGIBGHJDCIGEGGGHHHIJIIJJJJGHIIEHHEGHJIHGGGIFAGGGGIIG>=CHHFD?@;CCEDDDDCDD>>ACDCB@8<5 +@SRR9130495.112 D00236:723:HG32CBCX2:1:1108:4384:2110/1 +ACACAGGCAGCAATGATGTCTTTACTTCTTTATTTTTTTCGACTTCATCTACAGAGCTTAGCACAGCCATTGGAACAAAATTGGAGCTCAGTGCACAGTTA ++ +@@@FDEFDDFF3CCF?FHCH@DEEGEFHIIFGBGGGDGIHAFBGDDHHIBAGGDGHE@CHAHBFFFFBDD +@SRR9130495.115 D00236:723:HG32CBCX2:1:1108:4445:2247/1 +TCTGTATTCTGTGTCATCTGCCATTCCTTGACTCCCTGCGCCCTTCAGCCCACAGGAAACGTGTGGATGACACACGAGGAGATGGAGTCTCTGACGGCAGC ++ +CCCFFDDDHHHHGJJJJIJJJJBHHJJIIGIIJJJIIGIFIJJIIIIGIJJIIIJIJCHIIJJJIHHFHEFFFFDDDDDBDDCDDCDCDDDDCCCDBBDDB +@SRR9130495.116 D00236:723:HG32CBCX2:1:1108:4698:2005/1 +GAGGGAAGGAGGGAGGGAAAGAAGAAGGGAGAGAGGGAGGAAGGCAGGACTGTCGATGCAAGTACCTCGCTTCCTTGTTCTTAACTCATTTGATTCTTGCT ++ +C@BFFFFFGHHGHIIIJJIBGGDHC@FEGDHIIIHGEHHEGCGIHHHFFFFDEEDDDEDDDDCDCCCDDDDDDDDDDDDDEDCCCDDDCDDDED:CCDDDD +@SRR9130495.117 D00236:723:HG32CBCX2:1:1108:4588:2182/1 +CTGGGGTGCAGTGGTGCAATCATAGCTCACTGCAGCCTCAATTTCCTAGGCTTAAGCATTTCTTCCACCTCAACTTCCCAAGTAGCCAGGATTACAAGCAC ++ +CCCFFADDFFHHGGHHGIIJIJJJJJJHIIJIJJIFIJJEIIJIJIGIJIJJJJJJIJJJIIHIIJHIIFFHGHHFFFFFEDEECCCCBDBDDDDDDCDBC +@SRR9130495.118 D00236:723:HG32CBCX2:1:1108:4964:2029/1 +CCCCGTCTCTACTGAAACACACACACACACACACACACACACACACACACAATTAGCCAGGCGTGGCAGCGTCTGCCTGTAGTCCCAGCTACTCAGGAGGC ++ +;8=:DDDDFFFAFIIFFBEIIEFIFIFIEFFFIIBEGEF?BF<4;A@EE/?;AB>7;7;>@?>B?''5<@;@?;0((4:@>34@@>:4<@>BAB@(948&+ +@SRR9130495.119 D00236:723:HG32CBCX2:1:1108:4831:2078/1 +GCGAAGAAAACTGAAAAAGGTGGAAAATTTAGAAATGTCCACTGTAGGACGTGGAATATGGCAAGAAAACTGAAAATCATGGAAAATGAGAAACATCCACT ++ +CCCFFFFFGFHHFFHGIHDICFHIGGIDHIIJJJJIIIIIGIGHGIJJJJJJJJJJJIJJJIJJIHHHHHFFFFFEEEEEEEDDDDDDDDDDDDDDDDCDD +@SRR9130495.120 D00236:723:HG32CBCX2:1:1108:4877:2117/1 +GCATAATGTTGCCACTGCACTCCAGCTGGGACGACAAAGACTGTCTCTAAAAAAGTAATAAATAAATAAAAGTTTGAAATGCATTGTCCTAGGTTTTAGTC ++ +CCCFFDEFHHHHHIIJJJJJIJIIIGIJJJJJJIIJIJJJIJJJJJJJJJJJJJIIHHGHHHHHFDFFFFFEEEEEEDDDDDCEEDEEDDDDDCDDDDDDD +@SRR9130495.121 D00236:723:HG32CBCX2:1:1108:4918:2158/1 +AAACATGTCAATGGCCAAAAAAAACAGACAATCAAAAAATGGACAAATATATGAACAGACATTTCTCACAAGAGGACATACAAATGGCCAGCAAATATATA ++ +CCCFFFFDHHGHHIIJIJJJIIIJJJJJJJIJJIJJJIIJJJJIJJIJJIHGFHHHHFFFFFEFEEEEEDDDDDDDDCDDDDDDDCCBCDDDDDDDDEEEE +@SRR9130495.122 D00236:723:HG32CBCX2:1:1108:4939:2211/1 +CCTGGTCTCAGCATTCCTCACACGTCATAGCGAGGCCCATGGCTGTAGAAATCCCACCATTCTCTTCTCCCCAGGCCTGGCATCCGTAGAAGCCTACAGCT ++ +@CCFFFFFHHHHDHIDIHIJIJJJJJIGGEGIJIIGIIIJJJGGIJJJJIGGHGIIIJJGHHHHHFFFFEFDEDDDDDDBDDDDDDDDD?CDDDDDDDDAC +@SRR9130495.123 D00236:723:HG32CBCX2:1:1108:5169:2188/1 +TCTGACCCCATGTCCTCAGGCCAGAACCCGGGAGCCTGTCAGAAAAGGTCTCTCACCTAGAGTCCATGCTCTGGAAGCTCCAGGAGGACCTGCAGAGGGTG ++ +??@DD?DFHDFHFIIIIGFHEGGDFFHIBHGIAFIGGIIIFI@CHE@FGH@CDGGIFHEEFCCED@DEEEECCCCCCCCCCCCCCBB8ABC?ACAAABBBB +@SRR9130495.124 D00236:723:HG32CBCX2:1:1108:5192:2231/1 +ACTCTCCTGGCCCACGAGAGAGTCCACACAGGAGAGAAACCTTACCAGTGTCATGAGTGCGGCAAGAACTTTAGTCAGAAATCCTACCTTCAAAGCCATCA ++ +CCCFFFFFHFHHGJJGEFGHGIIEIIFJJJIHGIJIIJIIIJIIGIEHHIGIHIJIIJIIBDFDDDDDDDDDCDDDCCDDDDDDDCDDCDDDDDCDDDDDA +@SRR9130495.125 D00236:723:HG32CBCX2:1:1108:5408:2041/1 +TGTGTGCATCCTCATGTGTCCTTGATAAGTGGTGTGATAAATGAAGGCTTTGCCACATTCCTTACACATGTAGGGCTTCTCTCCAGTGTGAGTCCTCTCAT ++ +@@@DDDEBFHHHHIIIHIFHIDHIIIJHHJIHEGFIIHIJJIIJJEIJGHHIEIEGIIJIJJJGIGHGJJIIGIGIHJEHHHHHFFEFFFCC@CEEDDDDE +@SRR9130495.126 D00236:723:HG32CBCX2:1:1108:5351:2057/1 +CTCTATATATTTTAACAAATGCATAATGTCATGTGTTTACCATTACAGTAGGATAAAGAACAGTCTCATTGCCTTAAAAAGTTCCCTAACATTTTAATTGT ++ +CCCFFDEDFHHHHJIJIIJJJIJJJHJJJJIJIIIHHIJIJIJJJJIIHIJJIIJJJJJIJJJJJJIJIJIJIIJJJJJJJGGIGHHFHFFFFFFFEEEEE +@SRR9130495.127 D00236:723:HG32CBCX2:1:1108:5475:2108/1 +AGCCCAGAAGGCTGGACACACCTCCCCCTCACCCCATCCCGCTCCCCAATCAACCCAGTCCTCAAGAAGCACACTGTGGCTGCTTGCTCTCTTGCCCCCCT ++ +CCCFFDFFHGHGHJJIJJJIGIIIHIGIIJIIJJJIJJJHGIJIJIIIJHHGHHFFEDEEEECCDDDDDDDDDDDDDDDDDDDDDDDDDDCCDCDDDDDDB +@SRR9130495.128 D00236:723:HG32CBCX2:1:1108:5542:2138/1 +TGGCTAGCTACTGCTGCTGCTGCATCAAAGCCCAAATATTCACTGGCATCAGCTGTTTTGTTCTTTAGCATATTAGTAAAGTGCTCATTTAGAGACATCTT ++ +@CCFFFFFHHHHGJIJJIJJJIJJJJJJJJJJJJJJIGGIJJJJJHJJJJJJJJJHIEIIJJJIIJJJIJIIJJJJHHHHHHHF@DFFFFEDEEEEDDCDD +@SRR9130495.129 D00236:723:HG32CBCX2:1:1108:5707:2147/1 +CCAGCATCACTCATGGAACCGGAGGCACTAAGGCCCCTCGGGAGACGCTGAGCAGGTGGGTAGAGGCATACTTCTGGGAGATGGCATCAAGAGCCAGTCAA ++ +CC@FFDDFFDHG>FFFHGGIJIEIIIHIGIGHBHCEHGGGFH@FHGIHHFBFDEEDDEDDDDBDC?BBDCDDDDDC:?A?BDDDCCDC>ACDDDBDDACCC +@SRR9130495.130 D00236:723:HG32CBCX2:1:1108:5614:2168/1 +AAACCATGTCTCTACTAAAACTACAAAAATTAGCTGGGCAACATGGTGGGTGCCTGTATCCCAGCTACCTGGGAGGGTGAGGCACGAGAATCACTTGAACC ++ +CCCFFFFFHHHHHIJJJJIJGJIJJJIJJJJIJJJJJIJJJJIJJHIIHJIJJJJJJJJJJJJJJJJGHFHHF@DDDDDDDDDDDDDDDBDDDDDDDDDDD +@SRR9130495.131 D00236:723:HG32CBCX2:1:1108:5985:2027/1 +GCGGCAGCGGCCGCGATGGAAGAACTTACGGCGTTCGTCTCCAAGTCTTTTGACCAGAAAGTGAAGGAGAAGAAGGAGGCCATCACGTACCGGGAGGTGCT ++ +CCCFFFDDHHDGHFIJFHFFHHBFGHGEIJJJFFDDDDDDDDDDD@CCDCDDDDDAAACACDC@CCDBBBDBD@ +@SRR9130495.132 D00236:723:HG32CBCX2:1:1108:5816:2071/1 +TTTACATATAAGAACCTGATGACCTTTTGTTTTTGTCCAGGAGAGTCCTTCTTGTCTACGAAATGCAGCTATCACAGCAGCTGGACTTGTTTCCTGAATGC ++ +C@CFFDDAFFFHHHHHHGFIHJIJFHHHCAAEHIGHJGCCGHIHEHJJJEHGIIIFIGBBAEHGIJIGIIHHEHHHFFFFEECCABCDCCCCACDDACDA: +@SRR9130495.133 D00236:723:HG32CBCX2:1:1108:5835:2081/1 +CCAGGGCTCCAAGGGGCTGGTTACGAAGTGTCTCCTGCTGCATGAGGTCCCCACGGGAGAGATTGTGGTCCGCCTTGACCTGCAGTTGTTTGATGAGCCGT ++ +@CCDDDFFHHHGHGJGJFHIEHIGCGHIGJGIIIJJJJJJJJJIIIEIJFGIJJIJGCCDDBDDCDDDBDDDDCDDDDDDDD>BACDDDEDDCBD +@SRR9130495.134 D00236:723:HG32CBCX2:1:1108:5841:2101/1 +GGGCATGGTGGCATGCGCCTGTAGTCCCAGCTATTCGGGAAGCTGAGGCAGGAAAATCTCTTGAACCCAGGAGGCGGAGGTTGCAGTGAGCCAAGCTTGCA ++ +@CCF?BDDHFHGHIIIIIIIIIGHGHHIIIFIIIIIGGFGGIIIIEFGGEGHCD>CGGFHHHGGHFFFCDDADDDDDDDBDBCDCCCCA@CCCCBDDDDDD +@SRR9130495.135 D00236:723:HG32CBCX2:1:1108:6165:2044/1 +TTTATACCATTTTTTTTTTTAGCATATATCCTTGTACTTTATAGGAATTATTTGCTTTATTCTCTTGTGACTTGTAAATTGATGTACTTAATTAAATCTTT ++ +@@CBAB;DHFFHHIGIIGGHGFF@?BGB@8=FHEGHIGD=@CGHIA;@EHFHGHBFFFCBD;>(>@A@C>>;>CA;;35>@3;>5>,;3>:;(:@:>:@@C +@SRR9130495.136 D00236:723:HG32CBCX2:1:1108:6059:2069/1 +CTATGACCGCTATGTTGCCATCTGTAGCCCACTGCTTTATAACACTGTAATGTCCCACAAGGTCTGTTCCATAATGATGGCTGTGGTATACTCACTGGGCT ++ +CCBFFDBEHHHHFEGIIGHGIIIJIIHIJIFIJJJJJJJJJJIIJJIJJJJIIHHIJIIIFIHIJFIGIIIHGGHHHHFFFFDEEEEEDEFEDDDCDDDBC +@SRR9130495.137 D00236:723:HG32CBCX2:1:1108:6161:2181/1 +ATGAAGCAACAACCTTATAGGCATTTTAACTCATAGGTTTTAAAACTTAAGGTTATTTTCATAGGAGTCCCTTTTAGCAGAAATGCTCACCACAGGACCAG ++ +@@CGGDD@4???BDHCH@GH<=FHGEGGGIGCEG@E7ACH@:77?C@A@CBAA???2FFFIGIIGIIIIFDADBDDDDDDDBBBBBBCDD@CDDDD?BDDDDDDCDDBDDDBDDDCCCCCBBCCCDCCCCDDAC>ABDDDCDDDDA@C +@SRR9130495.144 D00236:723:HG32CBCX2:1:1108:6837:2146/1 +CCTGTTATTTTAGTTGTTAAAGGTGGCATTCTGTTCTTGTGGCTGTCTTCTTTTAGGTTTGTTGAGGGATTACCTTCTTGTTTTTTCTAGGGCATTGTTCC ++ +BCCFDDFDHFDHFGIIIIJIGIIJJIDGHIJIIJJJJJJGFIIIHFHHIJJJIGDGIGHGHIJICHGGEHGCHGFEHFHHFDDDDDDDDDDDC?CDDDDCC +@SRR9130495.145 D00236:723:HG32CBCX2:1:1108:6804:2189/1 +TGAATCTCTCTTGGCCTCCTCCCCTCTCATGTCCCCTCCTCCCTCCTCTCCACTTACTCCTCCTCCTCCCCTCCCTCCTCCCAGATGGTTCTGTGTCTTTT ++ +CCCFFEFFHHGHHJJJIJJIJJJJIJJJJJIJIFIJIGIIGGJIJJIIIIIGIIJIJIJGIIIJIJJHHHFDFFDCDCCDDDCDBCCDCDDD@ACCCDDDD +@SRR9130495.146 D00236:723:HG32CBCX2:1:1108:6940:2229/1 +CTTAATGCCACTATCACCACTTCCTTCAAGAGTGAGGGAGAGGAAGAGGAGGAAGAGGAGGAGGAAGAAGAGGAGGAGGAGGAAGAGGAGGGTGAAGGGGA ++ +@@@DBDDEFHHHHGIJIEGGIGECHIFIIJGFHHACCF?D:DFF;?FHH9DFCGGHFG@CA?AB?DD>?A@BDDBB=?B5@BBFCAA@A;;5?BB9;=>;BB?1>A?ABDCC +@SRR9130495.149 D00236:723:HG32CBCX2:1:1108:7167:2101/1 +TTTCATGTTTTAGGTCTTGTAAGCAAGATTTTTCCTGTTGAAAAACTGGTTGAAGAAGCCATCCAATGTGCAGAAAAAATTGCCAGCAATTCTAAAATCGT ++ +?@?DB?DDHHGDHIHHGBIECFDHHE>C7?BB7;@A(5==;88323>CDC9B +@SRR9130495.152 D00236:723:HG32CBCX2:1:1108:7449:2110/1 +GGCTTCAGGAGCTTCAGAAGTTAAGAGCTGCAAAAAAGAAGAAAAAGGATCGGCCAAGTAAAGACTGTTCCAAGTTGGACATGCTTGCTAGAAATTTCCAG ++ +CCCFFDFEHGHHGJIIBEEHHIIIHHIGGJIIJIIGIIGGHIIIJIGGGGGGGIIJJHHFHHGFFFFFEEEEEEEDDDDDDDCDDEDDDDDDDDDDDDEDC +@SRR9130495.153 D00236:723:HG32CBCX2:1:1108:7499:2197/1 +TTCTCATAGTTCAGCTTCCACTTGCGGTAGCTTGTTCCACTTGCGGAACATGTGGTGTTTGGTTTTTTGTACCTGCACTAGTTTGCTGAGAAAGATCGGAA ++ +@@@DDDDEHHFFHABECCAFHHHFDGIHJIIEFGHIIGIGEHEBGG0AEDHGFFFGIDG@EH=ADEBADDE@CCCBCACDDDEEDDCCCBCCC@CC>AB@@ +@SRR9130495.154 D00236:723:HG32CBCX2:1:1108:7309:2205/1 +GGAGGCTGAGGCAGGAGAATCGCTTGGACCCGGGAGGTGTAGGTTGCAGTGAGCCAAGATTGCGCCACTGCACTCCAGCCTGGGTGACAAAGTGAGATATT ++ +BC@FFFDFDHHGFIGIIIJIJJJJJIJJJIIJJJIIIHHIJIJJJIJHHHHGHFFFEBAEECEDDB:@CDDDDCDDDDDDDDDBCBDCDCDDDCDBDCC?ACDD34>C@BD<>>:CB<>@BA8 +@SRR9130495.156 D00236:723:HG32CBCX2:1:1108:7518:2119/1 +TTATCAAAGAGGCCCAAGAGAAACCACTTGTCTGACTTCTACCATATGAGTTTAGAATAAGATGATGGCTGCCTATGAGGAAGCAGGCCCTCAACAGATAC ++ +@@@DDBD4CFFAAHII=G9FDHG;?F@;EEBEFCF>BGBGDBECC@BBBBBBBCCABC@CC +@SRR9130495.157 D00236:723:HG32CBCX2:1:1108:7577:2169/1 +AGTTACTTAATATACCTTAGCCGAAACTTCTGCACTGATTTCCTCCTGTGTTTCAGCCAGCCGCTTTTTGGCAAGTTCGGTTCTCCGATCACACTCTGCAA ++ +@@@DDDFFFFHGHIICGHFH@FGGHGHHJGIHJIJIJGIIIBDHCBGGHEHIJJIGIIIBGIEIGGHHCEBDFEDECD?@DDDDDDDDDDBCCDDDDDDC> +@SRR9130495.158 D00236:723:HG32CBCX2:1:1108:7659:2196/1 +TTCTGATTTTTGCTGCAGCTTCTGCTTATAATCATATGGCCAGTTGTGCTTGTCAGAGTAATGGTGAAGTCCACAAAACAAATTTCCACATCGGCAGTCAA ++ +CCCFDDDDHDFHFGIFCHIII9FHHIGGHHIJJJJIJJEHGEGIIJJJJJJJJDHGI:DFGIIGHGJGCGHGIJJGIIHGHGFFECB@CEC@B@BDD?CCD +@SRR9130495.159 D00236:723:HG32CBCX2:1:1108:7733:2213/1 +GGCCAGATGTTTCTGTAAAGATTGAATTAGATCCCCAGGGAGAGGCAGCACAAAGTGCAAATGAATCAAAAACTGAGTAGAATATTGTAGAGTGCCAATTA ++ +@<@DDA+AFFHHHIIFBHC@@F>@>CC: +@SRR9130495.160 D00236:723:HG32CBCX2:1:1108:7590:2217/1 +GGGGCTGGGCCCACCTGGGACAGAGGGCCACATGTAGAGGCAGCGCTCCCCCGTCTTGAGCTGATCTTTGCAGTCGAATAGCATGAGGTTGGCCCAAGCGA ++ +CC@FFDDDGHHDHIJDGIIACBDDBBBDDD@ +@SRR9130495.161 D00236:723:HG32CBCX2:1:1108:7735:2228/1 +GCAGCACTGTCTGAGTATGGGAGCAAAGCCTAATCTGGCTTGCCCGGCCTCTCACCTCTGTGGCGCTCTGCATCATGGTGCTTCTTGTCATCTTTTATTGC ++ +?@;DDDDDFCFFHIHHGBHIBH?FHIBDEHB@GEIHIEHGHAFFHGEEH<@CC@C@CCA +@SRR9130495.162 D00236:723:HG32CBCX2:1:1108:7898:2065/1 +GTTGGCTTCCCCCTCCCCTCTCCCGTGAGCTGAAAAGCAACAAGGGCTCCACCAGCCTGCAAAATAAGACTTGGGGGGGGGGGGGCAGGGATTGCTTTTTT ++ +@@@FDDDDHHFHFIJIFHIIJJJDHFGIGIGJAFHIDG>@GGFHGGHJIGCHIIGEEHFGF@CFEECC>;>CCABBD<99B@BD99&)&&+9(3(4>(+:0 +@SRR9130495.163 D00236:723:HG32CBCX2:1:1108:7872:2066/1 +CACGCTGGATGAGTTCCTGTTCAGCGACCTGCAGGCGCTGGAAGTGCTGTTGCTCTACAATAACCACATTGTGGTGGTGGACCGGAATGCCTTTGAGGACA ++ +CCCFFFFFGHGGHJJJJJJJJJJIJJJJJJHJJJJJIJJIJJJIGIJJIJJJJIHHHHHHFFDFFEDDEEEEDDDDBDDDDDDDDDDDDDDDDDDDDDDDD +@SRR9130495.164 D00236:723:HG32CBCX2:1:1108:7826:2191/1 +ATCTCTGGACCCAAACTGGAGGGTGACATTAAAGTTCCCAGGGTGGATTTGAAGGGCCCAGAAGTGGACATTTCTGCTCCCAAGGTCAATATTGATGGGAA ++ +CCCFFEFFGHHGHIHHIIJIIIJJIJIGIIJIHIGIJJJJIJJBFGGIJJIJJJJJIJIHFHHFFF@EEDEEFEEDDDDDDDDDBACDDF@CDEDEDDBDD +@SRR9130495.165 D00236:723:HG32CBCX2:1:1108:7791:2195/1 +GGAGAACAGCGTGTAGAGCACTCACAGTCTGCTGCCTTCAGGTGTGGGAGGCACTGCTCACACTGATCTTCTTCCCGGTGTGTGTGGTGTTTGCCTGGATG ++ +CCCFFDEFFGHHHJDIIJJIFJJJJJIJJJGIJJIIJIIIJIJIIGEGHHJJJJJIIFIJJJHHHHFHFFDDFFEDC>9;?BBDDD?CDDDDDDDCC?BDC +@SRR9130495.166 D00236:723:HG32CBCX2:1:1108:7767:2199/1 +GACTAGCCTGGCCAACATGGCAAAACCCAGTCTCTATTAAAAATACAAAAATTAGCTGGGCATGGTGGTGCACGCCTGTAGTCCCAGCTATTCAAGAGGCT ++ +@@@DDDFFFHHFBHBHBDEHHGGGHIIJIIHIHJIEEEIGHEIHIIGHIIHHGJIEHGI?G@CDHI=CA?BDFFACDCCDFCC32??A +@SRR9130495.167 D00236:723:HG32CBCX2:1:1108:7824:2210/1 +GCACCACCGTGCCTGGCTAATTTTTATATATTTAGTAGAGATTGGGTTTCACTGTGTTGGCCAGGCTGATCTTGAACTCTGGACCTCAGGTGATCCTCCCG ++ +@@@FFDDFDFAHHJJIJIIGHHHHHIIJIIDGG>GHHIGGCGHGIEHGGH>FFHJJJHDGBGHJCGGGHFEHHHHFFFFFECDECEDDDCDDDDCCDDCDD +@SRR9130495.168 D00236:723:HG32CBCX2:1:1108:8205:2084/1 +CTTAGCCGCTGGTGATGCTAAGGGCATGGTCAAAGTGTGGCAGCTGAGCACAGCCTTCACAGAACAAGGGCCCCGGGAGGTGGAGGACTTGGATCAGCTAG ++ +CCCFFDEDFFHHHJEGIDHHIIIIJJJIJGIJJJGHJIJIJJJIIIJIGGIIGIJJIGHIIJGEFHGBEFDDDBDDD;>B2<@BBDBBCCCCDDDDDDDDD +@SRR9130495.169 D00236:723:HG32CBCX2:1:1108:8202:2124/1 +GAGACTCTTGCACACATACCGGGGAGCTGGCTCACCCTGGCCCCTCCATCCTGTCAGACTGAAGAGAACAAGTGTCTTAATTTGGGTTTTTCTTATTATTA ++ +CCCFFEFDHFHGHGJIIIJJIJJJIIIGIJJJJFIJJHGIJGHIIJJEEEHFGFFEFECCEEEEDDDDCCAD>CCDDDDCCD?@@A=?8=?=BA93>CA??B@A????8CD(8&8?()(+224@?@>35 +@SRR9130495.179 D00236:723:HG32CBCX2:1:1108:8868:2131/1 +GTACATTGTATCTTTGTTCTCATTAGTTTCAGAGAAATTATTGATTTCTGCCTTTATTTCATTATTTACCCAAGAGTGATTTGGAAGCAGGTTGTTCAGTT ++ +<;;B?D>DFC:DBF@AEDHHAHHGH:A:AC4?BFFEDA?ABD@ACCD:> +@SRR9130495.183 D00236:723:HG32CBCX2:1:1108:9106:2031/1 +CTAGAAATCCTGGATTTTCAGCACAATAACTTAGCCAGGCTCTGGAAACGCGCAAACCCCGGTGGTCCCGTTAATTTCCTGAAGGGGCTGTCTCACCTCCA ++ +C@CFFDFFGGHHFJHIIJGIHCCEHHIGIFIIHIJJFIGJIGIJJIIJHIFGIJIJFFHHFDAD@BCCBDDDDBCC@CDDCCDDAEFC'8;&+)+((&28&&&+((&)&&++((++8((2(((25(&&&(++(0&&&(+((+4(+ +@SRR9130495.186 D00236:723:HG32CBCX2:1:1108:9230:2213/1 +ACTTAGTGCAGTACCCACTATTCCCGCTCAGGCTCCGAATAGTAGATAGAGGGTTCCGATATCTTTGTGATTGGTTGAGAATAATCAACGATTAATGAACA ++ +CCCFFFFEHGFFHFIICIIFIJHHGBHHGIGJJIJGGHIGFHIGIIJJJIIGJCFIJI@EFDFEDFFCCEEEEDDDBDDDDDDDECCDD@BDDDCDDDCDC +@SRR9130495.187 D00236:723:HG32CBCX2:1:1108:9264:2024/1 +AACATAAGGTTTCTCATAAAACAAAGAAAAATGTCAATTCAGTTGTGAATTCATATTGATACCTGGAACTCTCCTGCTAGACCACCTCTAAAGGCCCAGGG ++ +CCCFFFFFHHHGHIJJIDJIJJJDHIIJJJJIJJJJJJJIJJGCHIIJJJJJJJJJJIHJJJJJJGIJJIJIJIIIIJJHHHHGFFFFFECEEDDDDBBBB +@SRR9130495.188 D00236:723:HG32CBCX2:1:1108:9293:2034/1 +GTGGGGAGGTTTGGGAGTGAGCAGCACACCCCAGTTAGACTCCTGTTGGGTTTCATAGGAGCTGGCTGCTGAATGTAAGAGTGCAGGCTACCCCGGGACTT ++ +@@@FDA;1DAFHFIIFBGIGHGADHIGIIIIIIIIHBFEHIIIIIIIIHIACEEEHHBD@CDECECCBBCCACCCCEECCCCCCCCBBBCCCB?9>>>>BC +@SRR9130495.189 D00236:723:HG32CBCX2:1:1108:9484:2048/1 +ATGTAGAGAGAGGGAAAAAAGGAGAGAGAGAAGGATAAAGAGAAGGATGCACAAGAAGACCAAAATACCTGATCATGTAGGGGAGAGCCTCTGGGAGAAGG ++ +@@@DFDDDCDDFHICFHHDGIIHHCHCFFDGHHDCGIJIH@FFHFHGIIGIJIGIGF@CEBDFF@EECDCCCCCCDDEEEDDDDDDDDDDCDDCD<@BDCB +@SRR9130495.190 D00236:723:HG32CBCX2:1:1108:9388:2219/1 +AGCTGCTGCGAGATGGTGGCTTGCATCTCCTTGGACGGCCGCTTGTTCTCCTTGAAGATGGCAATCAGCGTGCGGCGCTGCAGGTCTGTGAACACGAGGCG ++ +B?>3=?>;@DF@>CACC>;>@A>',,88>>-09599(+8>C95>>>00 +@SRR9130495.191 D00236:723:HG32CBCX2:1:1108:9404:2245/1 +TCCGGCTGGTACCTTCATAACTACAGTAATAGAAGACATTGAGTGCCTCCACCGCAGCTGGCCCTCTCTGTTTGTAGCCAAAGATCAGATCTATCCATTCA ++ +CCCFFFFFHHHHHJJIJIIJEIIJJJJJIJJJIJJJIJIIIIIJJJIJJIIJJJJEIJJIHIGHHHFFFFFFDEEEEEDDDDDDDDDDDDDEDCDDDCDCC +@SRR9130495.192 D00236:723:HG32CBCX2:1:1108:9632:2134/1 +ATAGTGGCTGCTGATGGATGTGCTCTATGCAAGGGAGGTGCTCACTATTTCTGTTCGTCAATTTGTAACCCACGGGAGGAAAGGGAACAAAGAGTGAACAA ++ +CCCFFFFFHHHGAEFFHIICHGIJHGFIIIHIJDGIJJIIIEGIJJIIFHEGHGIICHIIFIJJJJIIJJHHHFFDBDD?BDDDDBDBDDBCDD:@CCCCD +@SRR9130495.193 D00236:723:HG32CBCX2:1:1108:9647:2175/1 +AATACCAGCCCAAGACTTTGGGAGAAGGGAAGAAAACAAAGTAAAATAACTTACCACTTTGGCCCAGTCCGAGAACAAGTGAAAATACCCAGGCTGCCCCA ++ +CCCFFFDFGHHFHIIJJGIIIJDIIJIJJJJIIHIIIIJJJHCFHHFHIJJJJJJGIHJJJIJJHGHHHFFFDDDDDCD>CCDDDDDDCDDDBDDDDDDDD +@SRR9130495.194 D00236:723:HG32CBCX2:1:1108:9552:2194/1 +CCATGCCGACACAGGTAGATGGTACGGGGCTGCACGTGGATGTTCATCAGGTAGTATACAATTCGGCTCTGGATGTGGTCCTGCACTCTGTTCACCAAGAA ++ +@@CFFFFFGHGHHJJJIJJJJIJJJIGHFEGGIFIJIJIIIIIJJIIJJIHHHHHHHFFFFFFFDCDDDC@@ACDDCDDDDDDDDDDDDCDDD@CCDDDDD +@SRR9130495.195 D00236:723:HG32CBCX2:1:1108:9620:2235/1 +CCAATGATGGCCAACTAGGCCATCTTCTACTATGTACGCAGCTAGAGGCACGAGCGCTGGGGGTACCGATTAGTTCATATTGGTGTTCCACCTATAGGGTT ++ +===BD?DBAABD8AC3?F?D9C6'5;:>7<<>8:(',&22>(((:>3>+:(+28(43>@B(>:>A((32 +@SRR9130495.196 D00236:723:HG32CBCX2:1:1108:9908:2124/1 +TCTTGTGAAGAAGATGCTGTTGGAAGCCTCTAAGAAGCCCGAACTGAATGCTCTTATAAACAATACCAGAGGAATTATTTTTTACAGTGTCCCTCACCATG ++ +CCCFFFFFHGDFGIIJJIJJIGGJJIIJJIIJHIIIIJJJJI>HHIFIJIJIJJIIHIHIJJJJIHIHHHGFDEFFEEEEEEDDDDDFDEDCCDCDDDDDD +@SRR9130495.197 D00236:723:HG32CBCX2:1:1108:9923:2206/1 +TGGGGCTGTGAACCGAAGTCTGCTCCTTTGCGTGAGCCACCCCTGCAGCCCCTCCCACAGTTCCTGAGGAGCCTTTAGTCCTCGTCCTTTCTCAGCTGTAT ++ +@BCFFDAFHHHHHIIIIHIIJIIJIIJJJIIIJJIGGIIIJJFGGGGGEIIIGFHHEFFFEECCCC@CB@BDDDCDDCCDCCDDABBBCDDCC@CCDCCCD +@SRR9130495.198 D00236:723:HG32CBCX2:1:1108:10131:2036/1 +ATGTGCTCAAAGGCTGGGTGGACCTTACCTCCAGTAAACCCCACGTTGTGAAGAAATCCATCAAGTACCTGGAACAAGGAACTCAAGACACCAAAGATGTG ++ +@CCFFFDDFFBHDHIIIBFEGFGHGHGDFHFGIJJIIHDGEGHIJHFHIIIIJJJJJIIIFHHHFHFFFFFFBAEAACBBCADDDDDDDDADBABCCC>AA +@SRR9130495.199 D00236:723:HG32CBCX2:1:1108:10246:2089/1 +GCCCTGGGATTGTCCCTCTGGGCACAGGGAGTCCTGGGGTTGTCCCTCTGAGTAGTTCTGTTGGGAGAGGAGGCCCTGGGATTGTCCCTCTGGGTACAGGG ++ +CCCFFBDDHHHFHJIIIJJJJIIIIIFIIEHGIGJIJDHJIJIIJJFJIJ@FFCHJJJBEGEHHHDFDCD@DBB;=?A?@BDDDCACDDDDD@?CCCCDCB +@SRR9130495.200 D00236:723:HG32CBCX2:1:1108:10051:2156/1 +ATGGAGGATGGCACCCTGCAGGCTGGCCCAGGAGGTGCCAGTGGGCCTCGTGCCCTGGAAATAAATAAAATGATTTCTTTTTGGAGGAATGCTCATAAACG ++ +@@CDFFDFGFHFFIJGGIICCDDADDB diff --git a/benchmark/src/min_example.fastq b/benchmark/src/min_example.fastq new file mode 100644 index 00000000..f4ef5f68 --- /dev/null +++ b/benchmark/src/min_example.fastq @@ -0,0 +1,12 @@ +@SRR9130495.1 D00236:723:HG32CBCX2:1:1108:1330:1935/1 +NCAATA ++ +#4BDFD +@SRR9130495.2 D00236:723:HG32CBCX2:1:1108:1472:1938/1 +NGTCAA ++ +#1=DDD +@SRR9130495.3 D00236:723:HG32CBCX2:1:1108:1728:1948/1 +GTTTTC ++ +@@@DDD \ No newline at end of file diff --git a/benchmark/src/report_full.html b/benchmark/src/report_full.html new file mode 100644 index 00000000..50276b40 --- /dev/null +++ b/benchmark/src/report_full.html @@ -0,0 +1,948 @@ + + + + + + FastQC-like report + + + + +

Phred Score per Base Position

+
+
+
+
+

Statistics Table

+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
positionminmaxmedianq1q3sample_count
02.034.033.031.0034.00200
110.034.034.031.0034.00200
216.034.034.031.0034.00200
319.037.037.035.0037.00200
416.037.037.035.0037.00200
510.037.035.035.0037.00200
610.037.035.035.0037.00200
710.037.036.035.0037.00200
827.039.039.037.0039.00200
919.039.039.037.0039.00200
1019.039.039.037.0039.00200
1118.039.039.037.0039.00200
1219.039.039.037.0039.00200
1325.041.040.038.0041.00200
1427.041.040.038.0041.00200
1518.041.040.038.0041.00200
1610.041.040.038.0041.00200
1727.041.040.038.0041.00200
1816.041.040.038.0041.00200
1910.041.040.038.0041.00200
2023.041.040.038.0041.00200
218.041.040.038.0040.00200
228.041.040.038.0041.00200
238.041.040.038.0041.00200
2410.041.040.038.0041.00200
258.041.040.038.0041.00200
2610.041.040.038.0040.00200
2710.041.040.038.0041.00200
2816.041.040.038.0041.00200
2923.041.040.038.0041.00200
308.041.040.038.0040.00200
318.041.040.038.0041.00200
329.041.040.038.0041.00200
337.041.040.038.0041.00200
3418.041.040.037.7541.00200
3517.041.040.038.0041.00200
367.041.040.038.0040.00200
378.041.040.038.0040.00200
386.041.040.037.7541.00200
396.041.040.038.0040.00200
4014.041.040.037.7540.00200
418.041.040.037.0041.00200
426.041.040.037.0040.00200
438.041.040.038.0040.00200
446.041.040.037.0041.00200
458.041.040.036.0041.00200
467.041.039.537.0041.00200
475.041.039.037.0041.00200
487.041.040.036.0041.00200
498.041.039.036.0040.00200
5010.041.039.035.7541.00200
517.041.039.036.0041.00200
527.041.039.037.0040.00200
535.041.039.037.0040.25200
545.041.039.536.0041.00200
556.041.039.036.0040.00200
565.041.039.036.0040.00200
575.041.039.036.0040.00200
585.041.038.035.0040.00200
592.041.038.035.0040.00200
607.041.038.035.0040.00200
617.041.038.034.7540.00200
625.041.038.034.7540.00200
637.041.038.035.0040.00200
645.041.037.035.0040.00200
655.041.037.035.0039.00200
666.041.037.035.0039.00200
676.041.036.534.0039.00200
687.041.036.034.0039.00200
692.041.036.034.0039.00200
707.041.035.034.0038.00200
712.041.035.033.0038.00200
722.041.035.033.0037.00200
732.041.035.033.0037.00200
742.041.035.032.0037.00200
752.041.035.030.7537.00200
762.041.035.030.7537.00200
772.041.035.030.0036.00200
782.041.035.031.0036.00200
797.041.035.031.7536.00200
802.041.035.032.0036.00200
812.041.035.033.0036.00200
822.041.035.033.0035.25200
832.040.035.033.0035.00200
842.041.035.033.0035.00200
852.040.035.032.7535.00200
862.040.035.033.0035.00200
872.040.035.032.0035.00200
885.039.035.033.0035.00200
892.039.035.033.0035.00200
902.039.034.533.0035.00200
915.040.035.032.0035.00200
925.039.035.032.0035.00200
932.039.034.032.0035.00200
942.040.034.032.0035.00200
957.037.034.032.0035.00200
962.038.034.032.0035.00200
972.038.034.031.0035.00200
987.040.034.032.0035.00200
995.038.034.032.0035.00200
1007.037.034.031.0035.00200
+
+ + diff --git a/docs/notebooks/.ipynb_checkpoints/best_sequence_quality-checkpoint.ipynb b/docs/notebooks/.ipynb_checkpoints/best_sequence_quality-checkpoint.ipynb new file mode 100644 index 00000000..01334167 --- /dev/null +++ b/docs/notebooks/.ipynb_checkpoints/best_sequence_quality-checkpoint.ipynb @@ -0,0 +1,637 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "fa5e0b95", + "metadata": {}, + "source": [ + "\n", + "# Analiza jakości sekwencji bazowej z pliku FASTQ\n", + "\n", + "Ten notebook przedstawia przykładowe użycie funkcji `cacl_base_seq_quality` z biblioteki `polars_bio` do analizy jakości bazowej sekwencji DNA.\n" + ] + }, + { + "cell_type": "markdown", + "id": "51f25988", + "metadata": {}, + "source": [ + "## Importowanie bibliotek" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "id": "aaa6c4e7", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/Users/karolzebala/Desktop/studia/Semestr 2/tbd/proj2/tbd_proj_2/lib/python3.13/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n", + " from .autonotebook import tqdm as notebook_tqdm\n", + "INFO:polars_bio:Creating BioSessionContext\n" + ] + } + ], + "source": [ + "\n", + "import polars_bio as pb" + ] + }, + { + "cell_type": "markdown", + "id": "aa0c3d8b", + "metadata": {}, + "source": [ + "## Wczytanie przykładowego pliku FASTQ" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "250d8dd1", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Odczytano zawartość pliku example.fastq\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "200rows [00:00, 81728.45rows/s]" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "shape: (200, 4)\n", + "┌────────────────┬───────────────────────────┬──────────────────────────┬──────────────────────────┐\n", + "│ name ┆ description ┆ sequence ┆ quality_scores │\n", + "│ --- ┆ --- ┆ --- ┆ --- │\n", + "│ str ┆ str ┆ str ┆ str │\n", + "╞════════════════╪═══════════════════════════╪══════════════════════════╪══════════════════════════╡\n", + "│ SRR9130495.1 ┆ D00236:723:HG32CBCX2:1:11 ┆ NCAATACAAAAGCAATATGGGAGA ┆ #4BDFDFFHGHGGJJJHIIIIGGI │\n", + "│ ┆ 08:13… ┆ AGCTAC… ┆ IJGJJG… │\n", + "│ SRR9130495.2 ┆ D00236:723:HG32CBCX2:1:11 ┆ NGTCAAAGATAAGATCAAAAGGCA ┆ #1=DDDDD>DHFH@EFHHGHGGFG │\n", + "│ ┆ 08:14… ┆ CTGGCT… ┆ IIIGIG… │\n", + "│ SRR9130495.3 ┆ D00236:723:HG32CBCX2:1:11 ┆ GTTTTCCTCTGGTTATTTCTAGGT ┆ @@@DDDFFHHHFHBHIIGJIJIIJ │\n", + "│ ┆ 08:17… ┆ ACACTG… ┆ IIIEHG… │\n", + "│ SRR9130495.4 ┆ D00236:723:HG32CBCX2:1:11 ┆ GGGAGGCGCCCCGACCGGCCAGGG ┆ CCCFFFFFHHHHGHIIIGIIJIII │\n", + "│ ┆ 08:16… ┆ CGTGAG… ┆ JJGHFF… │\n", + "│ SRR9130495.5 ┆ D00236:723:HG32CBCX2:1:11 ┆ CACTCCGCCACTACAGCAGTCCCC ┆ ++=A1A:1ADA<;FFDC?;CG\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
positionminmaxmedianq1q3sample_count
002.034.033.031.034.0200
1110.034.034.031.034.0200
2216.034.034.031.034.0200
3319.037.037.035.037.0200
4416.037.037.035.037.0200
........................
96962.038.034.032.035.0200
97972.038.034.031.035.0200
98987.040.034.032.035.0200
99995.038.034.032.035.0200
1001007.037.034.031.035.0200
\n", + "

101 rows × 7 columns

\n", + "" + ], + "text/plain": [ + " position min max median q1 q3 sample_count\n", + "0 0 2.0 34.0 33.0 31.0 34.0 200\n", + "1 1 10.0 34.0 34.0 31.0 34.0 200\n", + "2 2 16.0 34.0 34.0 31.0 34.0 200\n", + "3 3 19.0 37.0 37.0 35.0 37.0 200\n", + "4 4 16.0 37.0 37.0 35.0 37.0 200\n", + ".. ... ... ... ... ... ... ...\n", + "96 96 2.0 38.0 34.0 32.0 35.0 200\n", + "97 97 2.0 38.0 34.0 31.0 35.0 200\n", + "98 98 7.0 40.0 34.0 32.0 35.0 200\n", + "99 99 5.0 38.0 34.0 32.0 35.0 200\n", + "100 100 7.0 37.0 34.0 31.0 35.0 200\n", + "\n", + "[101 rows x 7 columns]" + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "pb.cacl_base_seq_quality(path, output_type='pandas.DataFrame')" + ] + }, + { + "cell_type": "markdown", + "id": "74720ec0", + "metadata": {}, + "source": [ + "Mozna równiez zmieniać liczbę wątków" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "218aad32", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
positionminmaxmedianq1q3sample_count
002.034.033.031.034.0200
1110.034.034.031.034.0200
2216.034.034.031.034.0200
3319.037.037.035.037.0200
4416.037.037.035.037.0200
........................
96962.038.034.032.035.0200
97972.038.034.031.035.0200
98987.040.034.032.035.0200
99995.038.034.032.035.0200
1001007.037.034.031.035.0200
\n", + "

101 rows × 7 columns

\n", + "
" + ], + "text/plain": [ + " position min max median q1 q3 sample_count\n", + "0 0 2.0 34.0 33.0 31.0 34.0 200\n", + "1 1 10.0 34.0 34.0 31.0 34.0 200\n", + "2 2 16.0 34.0 34.0 31.0 34.0 200\n", + "3 3 19.0 37.0 37.0 35.0 37.0 200\n", + "4 4 16.0 37.0 37.0 35.0 37.0 200\n", + ".. ... ... ... ... ... ... ...\n", + "96 96 2.0 38.0 34.0 32.0 35.0 200\n", + "97 97 2.0 38.0 34.0 31.0 35.0 200\n", + "98 98 7.0 40.0 34.0 32.0 35.0 200\n", + "99 99 5.0 38.0 34.0 32.0 35.0 200\n", + "100 100 7.0 37.0 34.0 31.0 35.0 200\n", + "\n", + "[101 rows x 7 columns]" + ] + }, + "execution_count": 11, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "pb.cacl_base_seq_quality(path, target_partitions=4, output_type='pandas.DataFrame')" + ] + }, + { + "cell_type": "markdown", + "id": "d86ea6c9", + "metadata": {}, + "source": [ + "Notebook zakończony pomyślnie. Możesz teraz przeanalizować wyniki powyżej lub przeprowadzić testy. " + ] + }, + { + "cell_type": "markdown", + "id": "3378e751", + "metadata": {}, + "source": [ + "## Aby przeprowadzić dedykowane testy funkcji należy:\n", + "Przejśc do katalogu z testami a następnie wykonać komendę:\n", + "```bash\n", + "pythest test_quality_op.py\n", + "```\n", + "\n" + ] + }, + { + "cell_type": "markdown", + "id": "8d90199b", + "metadata": {}, + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.13.3" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/docs/notebooks/best_sequence_quality.ipynb b/docs/notebooks/best_sequence_quality.ipynb new file mode 100644 index 00000000..5107d30d --- /dev/null +++ b/docs/notebooks/best_sequence_quality.ipynb @@ -0,0 +1,643 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "fa5e0b95", + "metadata": {}, + "source": [ + "\n", + "# Analiza jakości sekwencji bazowej z pliku FASTQ\n", + "\n", + "Ten notebook przedstawia przykładowe użycie funkcji `cacl_base_seq_quality` z biblioteki `polars_bio` do analizy jakości bazowej sekwencji DNA.\n" + ] + }, + { + "cell_type": "markdown", + "id": "51f25988", + "metadata": {}, + "source": [ + "## Importowanie bibliotek" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "id": "aaa6c4e7", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/Users/karolzebala/Desktop/studia/Semestr 2/tbd/proj2/tbd_proj_2/lib/python3.13/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n", + " from .autonotebook import tqdm as notebook_tqdm\n", + "INFO:polars_bio:Creating BioSessionContext\n" + ] + } + ], + "source": [ + "\n", + "import polars_bio as pb" + ] + }, + { + "cell_type": "markdown", + "id": "aa0c3d8b", + "metadata": {}, + "source": [ + "## Wczytanie przykładowego pliku FASTQ" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "250d8dd1", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Odczytano zawartość pliku example.fastq\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "200rows [00:00, 81728.45rows/s]" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "shape: (200, 4)\n", + "┌────────────────┬───────────────────────────┬──────────────────────────┬──────────────────────────┐\n", + "│ name ┆ description ┆ sequence ┆ quality_scores │\n", + "│ --- ┆ --- ┆ --- ┆ --- │\n", + "│ str ┆ str ┆ str ┆ str │\n", + "╞════════════════╪═══════════════════════════╪══════════════════════════╪══════════════════════════╡\n", + "│ SRR9130495.1 ┆ D00236:723:HG32CBCX2:1:11 ┆ NCAATACAAAAGCAATATGGGAGA ┆ #4BDFDFFHGHGGJJJHIIIIGGI │\n", + "│ ┆ 08:13… ┆ AGCTAC… ┆ IJGJJG… │\n", + "│ SRR9130495.2 ┆ D00236:723:HG32CBCX2:1:11 ┆ NGTCAAAGATAAGATCAAAAGGCA ┆ #1=DDDDD>DHFH@EFHHGHGGFG │\n", + "│ ┆ 08:14… ┆ CTGGCT… ┆ IIIGIG… │\n", + "│ SRR9130495.3 ┆ D00236:723:HG32CBCX2:1:11 ┆ GTTTTCCTCTGGTTATTTCTAGGT ┆ @@@DDDFFHHHFHBHIIGJIJIIJ │\n", + "│ ┆ 08:17… ┆ ACACTG… ┆ IIIEHG… │\n", + "│ SRR9130495.4 ┆ D00236:723:HG32CBCX2:1:11 ┆ GGGAGGCGCCCCGACCGGCCAGGG ┆ CCCFFFFFHHHHGHIIIGIIJIII │\n", + "│ ┆ 08:16… ┆ CGTGAG… ┆ JJGHFF… │\n", + "│ SRR9130495.5 ┆ D00236:723:HG32CBCX2:1:11 ┆ CACTCCGCCACTACAGCAGTCCCC ┆ ++=A1A:1ADA<;FFDC?;CG\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
positionminmaxmedianq1q3sample_count
002.034.033.031.034.0200
1110.034.034.031.034.0200
2216.034.034.031.034.0200
3319.037.037.035.037.0200
4416.037.037.035.037.0200
........................
96962.038.034.032.035.0200
97972.038.034.031.035.0200
98987.040.034.032.035.0200
99995.038.034.032.035.0200
1001007.037.034.031.035.0200
\n", + "

101 rows × 7 columns

\n", + "" + ], + "text/plain": [ + " position min max median q1 q3 sample_count\n", + "0 0 2.0 34.0 33.0 31.0 34.0 200\n", + "1 1 10.0 34.0 34.0 31.0 34.0 200\n", + "2 2 16.0 34.0 34.0 31.0 34.0 200\n", + "3 3 19.0 37.0 37.0 35.0 37.0 200\n", + "4 4 16.0 37.0 37.0 35.0 37.0 200\n", + ".. ... ... ... ... ... ... ...\n", + "96 96 2.0 38.0 34.0 32.0 35.0 200\n", + "97 97 2.0 38.0 34.0 31.0 35.0 200\n", + "98 98 7.0 40.0 34.0 32.0 35.0 200\n", + "99 99 5.0 38.0 34.0 32.0 35.0 200\n", + "100 100 7.0 37.0 34.0 31.0 35.0 200\n", + "\n", + "[101 rows x 7 columns]" + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "pb.cacl_base_seq_quality(path, output_type='pandas.DataFrame')" + ] + }, + { + "cell_type": "markdown", + "id": "74720ec0", + "metadata": {}, + "source": [ + "Mozna równiez zmieniać liczbę wątków" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "218aad32", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
positionminmaxmedianq1q3sample_count
002.034.033.031.034.0200
1110.034.034.031.034.0200
2216.034.034.031.034.0200
3319.037.037.035.037.0200
4416.037.037.035.037.0200
........................
96962.038.034.032.035.0200
97972.038.034.031.035.0200
98987.040.034.032.035.0200
99995.038.034.032.035.0200
1001007.037.034.031.035.0200
\n", + "

101 rows × 7 columns

\n", + "
" + ], + "text/plain": [ + " position min max median q1 q3 sample_count\n", + "0 0 2.0 34.0 33.0 31.0 34.0 200\n", + "1 1 10.0 34.0 34.0 31.0 34.0 200\n", + "2 2 16.0 34.0 34.0 31.0 34.0 200\n", + "3 3 19.0 37.0 37.0 35.0 37.0 200\n", + "4 4 16.0 37.0 37.0 35.0 37.0 200\n", + ".. ... ... ... ... ... ... ...\n", + "96 96 2.0 38.0 34.0 32.0 35.0 200\n", + "97 97 2.0 38.0 34.0 31.0 35.0 200\n", + "98 98 7.0 40.0 34.0 32.0 35.0 200\n", + "99 99 5.0 38.0 34.0 32.0 35.0 200\n", + "100 100 7.0 37.0 34.0 31.0 35.0 200\n", + "\n", + "[101 rows x 7 columns]" + ] + }, + "execution_count": 11, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "pb.cacl_base_seq_quality(path, target_partitions=4, output_type='pandas.DataFrame')" + ] + }, + { + "cell_type": "markdown", + "id": "d86ea6c9", + "metadata": {}, + "source": [ + "Notebook zakończony pomyślnie. Możesz teraz przeanalizować wyniki powyżej lub przeprowadzić testy. " + ] + }, + { + "cell_type": "markdown", + "id": "3378e751", + "metadata": {}, + "source": [ + "## Aby przeprowadzić dedykowane testy funkcji należy:\n", + "Przejśc do katalogu z testami a następnie wykonać komendę:\n", + "```bash\n", + "pythest test_quality_op.py\n", + "```\n", + "\n" + ] + }, + { + "cell_type": "markdown", + "id": "8d90199b", + "metadata": {}, + "source": [ + "## Wizualizacja \n", + "Aby stworzyć plik html nalezy przejsc do katalogu benchmark/src i uruchomić\n", + "```bash\n", + "pytest base_seq_quality_report.py\n", + "```\n" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.13.3" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/docs/notebooks/example.fastq b/docs/notebooks/example.fastq new file mode 100755 index 00000000..4b357e52 --- /dev/null +++ b/docs/notebooks/example.fastq @@ -0,0 +1,800 @@ +@SRR9130495.1 D00236:723:HG32CBCX2:1:1108:1330:1935/1 +NCAATACAAAAGCAATATGGGAGAAGCTACCTACCATGCTTAAAAACGCCAATGAGCAGNGATTTGTCANCNNNNNNNNCNNNNNNNNTNNTANNANNCTC ++ +#4BDFDFFHGHGGJJJHIIIIGGIIJGJJGIIIIBHIJJJIIJIJJIJDHIGGGIJJJI#-@AEHGEFF#,########,########+##++##+##+2< +@SRR9130495.2 D00236:723:HG32CBCX2:1:1108:1472:1938/1 +NGTCAAAGATAAGATCAAAAGGCACTGGCTTACCTGATTAAGAAATTGTGTAGTCCAACATCAAAATACNTNTNNNNNAGAGNCANGNCAAGCNNANNAAT ++ +#1=DDDDD>DHFH@EFHHGHGGFGIIIGIGGGGIIGIIDDCHIIIIIID@FEGGGIIIIICHIIIIIIG#-#-#####,,;;#,5#,#,,85@A:AB@8>@:@A@9(:((+(834 +@SRR9130495.6 D00236:723:HG32CBCX2:1:1108:2392:1965/1 +CGATAAAGGACTTTCAGTCAACCAACTAGATAATGACCACTGGGCACCCATTCATTATGCATGCTGGTAAATAAATTATTCTGTTCAGGAACATTGAACTC ++ +CC@DDDBDFFHHHJJIJJIIJIJJJIIIHGIGGHCGGIGHHAACC??A< +@SRR9130495.11 D00236:723:HG32CBCX2:1:1108:4089:1977/1 +CATTCCAACCAGCCGCTTAAAGTTTCTAAAAGAAGCTGGTCATGGAACCCAGAAGGAGGAGATACCTGAGGAGGAATTAGCAGAGGATGTTGAAGAGATTG ++ +CCCFFFDFHHHHHJIJJJJIIJJJJJJJJJJJIIGJJJIGHGIJJIJJIJJIIFHGHIJJGHEHHFCEFFDEDDBDDDDDDDDDDDBACDDDDDDDDDDDD +@SRR9130495.12 D00236:723:HG32CBCX2:1:1108:6197:1936/1 +NCTTAAAGGCAAGGTGCTCGGCTTCCGCTATCAAGACCTCCGACAGAAAATCCGGCCTGNGGCTAAAGANCNNNNNNNNANNNNNNNNCNNGGNNCNNGGC ++ +#1BDFDEFGHHHHIJJJJJJIJJJJJJJJJJIJJIGIJJIJJJIJJJJHIJJHHHFFDC#,;?BBDDDD#,########+########+##++##+##++8 +@SRR9130495.13 D00236:723:HG32CBCX2:1:1108:6415:1939/1 +NTGTGTATGGGGATGAGGAAGGATATTAATATGTTCTATTTGAGATTTAGGGATTACATTTGTTTTTGCNCNCNNNNNTTTTNTCNTCATTTGNNGTNAAT ++ +#1:ADDDFHGGHFGGBHIGGIIJJEIIIJJIJIJJJFGJIIHGHGDGHJGHIHIIIIJJIIHFHIIJJJ#-#-#####,,;?#,;#,8?DDEE##,+#+2< +@SRR9130495.14 D00236:723:HG32CBCX2:1:1108:6361:1952/1 +TCAGATCTTATTTTAATAGTTGACTTTACCTCTTCTTTGACTTCCTCTTCCTCGGTCTCAGTAGATATAGATGGTACCTTGGGCTTATGCCATGAGATCTG ++ +CCCFFFFFHHHHDHIIIIJJJJJJJJJJHIIIJJJJJJJIHJHJII>GHIEGHIIIIJJJIJJIHHIJJJIJIGHIJJGJJHFHHFFDCFFEDCEDCCDEC +@SRR9130495.15 D00236:723:HG32CBCX2:1:1108:6263:1960/1 +CAATATCTGACTGAATGGGCCCATTTTCATAATATTCTGAAACTGTTCATACATGTCTCGCAATGTAAACTGACCTGAAATGCAATACAAAAAAATTCAGA ++ +CCCFFFFFHHGHGGGIIIIJJIJIJJIIIIIIIIEIHGGIEGGHGIJJIJJJCECGHIIIJJJJJIFGHIIHGIIJJHHGEFHDFFFFFCCCDDBBCCDCA +@SRR9130495.16 D00236:723:HG32CBCX2:1:1108:6338:1988/1 +AGACACTAAAATGCCATGTATGAGACTACATAGACATACCAATTTACAACACAAACACATGAAATATACATGAGAAAACATTAACTTACTTCCAGTTGGGA ++ +C@CFFDDDHGHHHIIIIHJJIIHIHGIJJJJJIJJJIJIIHEHIIJJJJJJIJJIIIIIJJDHIJIJGIJIJJIJJHHGGHFFFFFFFEEEDCCC@ACCBA +@SRR9130495.17 D00236:723:HG32CBCX2:1:1108:6742:1944/1 +NGAAACACTCTTTTTCTGGAATTTGCAAGTGGAGATTTCAGCCGCTTTGTGGTCAATGGTAGAAAAGGAAATATNTNCATATAAAAACTAGACAGAATGAT ++ +#1BDFDFFHGHGHJJJJJJJJHIJHHIJIIJJIJJGIJJIJIIJJGIJIHIJJJIIJJJHIEIIJJJJIHDEFH#,#,5=ADEEEDCDDDDDDDCDD5@CD +@SRR9130495.18 D00236:723:HG32CBCX2:1:1108:7076:1942/1 +NGTCTAAGAATGAAGTGCTTATGGTCAACATAGGCTCCCTGTCGACAGGAGGAAGAGTTAGTGCAGTCAAGGCTNANTTGGGCAAAATTGTTTNNACCAAT ++ +#1:B:BDDHHFFHIEGGIGIDEHGEEGIGHIIIFACHIGIGCFGEHIGGHHGHGH@DCGGIDEIIIIFFHHAEE#,#,5=@BBC@BCCCCCCC##,+8?BC +@SRR9130495.19 D00236:723:HG32CBCX2:1:1108:7440:1957/1 +CACCTGATGTCCCACAGTCCTCATAGACACTAGCACTGACTGCTGGCCATCGTCTCAGCCAGATGATGTTGACCTGCTAGCTTTTCAATTAAATTATTAAA ++ ++=144=DD>D4CCD?E@AECFFIIIIEI?E+??;3EBDECEIBEECDIEIIADDDDEIDCDCA;=A@CECE7ACD=(;;A@DA@A@A:ADAAAD>AADBB> +@SRR9130495.20 D00236:723:HG32CBCX2:1:1108:7363:1977/1 +ACTCATAGAGTTGAAGATTCCCTTTCATAGAGCAGGTTTGAAACACTCTTTCTGGAGTATCTGGATGTGGACATTTGGAGCGCTTTGATGCCTACGGTGGA ++ +CCCFFDDDFHHHHJJJIJJJJHHIIHGIJIJJJIGGHGIJIJJIIIJJJJJIJIGBFDHIIJIJGIJIGGCHGGIJHIIHHHFECDECEEDCDDCBD9?B? +@SRR9130495.21 D00236:723:HG32CBCX2:1:1108:7298:1979/1 +AACCGTCGCCAGGTACCATCCCAGAGAACTCTGTCTTCCTTACTTATAGCCAAGTTGCCGGCAGATCACAGCTGCATGCTTATCGGTCCATCCGTCATCGC ++ +BCCDDDFFGGFGFJIBBHHIJJIIHHIIIGJIIHIIJJJIIEIGHJIIJJJJIIHHGIJFGHGFDDCEECDDDDDDDDDDEDDDDDDDBDEDDDCCC +@SRR9130495.23 D00236:723:HG32CBCX2:1:1108:7307:1995/1 +TAATTTGGTATATGTCTTTTTAAAGGCATTTTTATTAGATATTTCCTTAATTTACATTTCAAATGTTATCCCCAAAGCCCCCTATAATCTACCCCTGCCTT ++ +;?7DD?;DBFHHFIA;A@AABBB@B?2<58+:?<<9<@: +@SRR9130495.25 D00236:723:HG32CBCX2:1:1108:7870:1955/1 +CTATCCCGTCGGGTGACTGTTTCCTGCTTTGCAGTTATTCAGTGGCAGAGCGTGGCGCTCTAATTTCTGCTTTCCTCTTTCCTGCAGATTGTGTGCTACAT ++ +CCCFFFDFFHHFHBHGJIIIHGIIIJJIJIIIIJHIIIIEIJJIIJJJJIJIJIJDFEDDDCEEEEEEDDDDDDDDCDDDCDDDDDDDCDDDCDDDDDDDD +@SRR9130495.26 D00236:723:HG32CBCX2:1:1108:8157:1994/1 +GAAGTGCTCTTCGTTACTACTTAAATCCCCCTGGGCATGTTTCATTATTTTACAATTTGTGCAGAACCCTATCCAAACACACATGGAGTACAAATGACTTC ++ +CCCFFDDDDHHDHHIGIIBIHHHJJJ@FGGA?@CCCCCC@CCCDD +@SRR9130495.27 D00236:723:HG32CBCX2:1:1108:8703:1937/1 +NATAAAAAAATAACATCCTTTCCTCCTAATAGCTTAATTATTTGAAAAAAAATATTTTCNAATCACATGNANNNNNNNNTNNNNNNNNTCTTTNNTNNCCT ++ +#1=DFDDDHHHHHIIJJJJJFIJJJIGIEGIIJJJHHIJJJJJIIJIIIIIJEHEHHHA#,;??AEDDC#,########,########++8??##+##(+2 +@SRR9130495.28 D00236:723:HG32CBCX2:1:1108:8702:1991/1 +CTCAGAGATTAAAAATGAATAACGCCTGCCGGCCAATGAGCGGACTCACAGTCCCTGTTTGTTTGTAAGCTAGGTGATTTTCAATCCACAGGGCAGGCTGA ++ +@@@DFDFFGGDHFGIIBGEHJIIIBGIIIJJIIJIJIIFGGEGIJJJHGGHHHDCFFDDDEDEDDDDDCDDDCBDDACDEDEDDDDCCCCDGII@GIFGFE???BFBBEHIGGIEEHIHIGGHHGIHA3?CH;?@CB@DCCEDEDD3 +@SRR9130495.34 D00236:723:HG32CBCX2:1:1108:10535:1962/1 +AATACAGAAAAGTTAAGAGCCAGCCCCAGGCGGATTGGATGAATAGGTTGCATCTCTTTCTTGCTTATATCAAATGCCTCTTGGCAGGCTCCTTGGGAATT ++ +???BD:A:3=?B:;?;;CA;;;A3-5>5-5:(::@8/2?8?9>>3(83(+ +@SRR9130495.35 D00236:723:HG32CBCX2:1:1108:11147:1968/1 +GCTGCCTTCTCCCCTCAAGGATGCAGTGGAAGTGTCAACCTGGAGAAGATGCTACACGATGCAGGAGGTGAACTCGGCCCTCAGTAAAATCCAGCTGGTGG ++ +CCCFFFDFHHHGHJFEGIHEGHIGIIGCCGGGIIJJIJJGGGGHCGIF>DGHIIIEHHGIIJJDBGHFHFCCFFFDDCDDDDBDDDCCDEDA:CACD@CDD +@SRR9130495.36 D00236:723:HG32CBCX2:1:1108:11124:1986/1 +GACAGGGTTTCACCATGTTAGCCAGGACGGTCTTGATCTCCTGACCTCGTGATCCGCCTGTCTCGGCCTCCCAAAGTCCTGGGATTACAGGCGTGAGCCAC ++ +CCCFFFFBFFFHGGHGHIHIIGIJFJJJIJHIIIFGHGGIIGEGHIH@@FGGIJIIGGIHIEEHEEFFDDCCCCBDDACCDCDBAACCDDDBDDDDBDDCC +@SRR9130495.37 D00236:723:HG32CBCX2:1:1108:11773:1947/1 +TACCTGCCTCTGCCTCTCGAGTGCTGGGATGAAAGATGTGCACACCCCCACCACCACCACCACCACTGCCTGGCNCNGTTTTTGATTTCTTATTCTCCAGA ++ +CCCFFFFFHGHHHJIJIJIIEHIJJIJJIJJIHIHJJIGFIIIIJBHHGFF>HGIJIEHHHFGDEEEEEECC?B#,#,,5?@HF1CGBGHCDDFF7=DEG.?AAC?3@EED;6@;>(-;@AC?31(,5?(4::A>AC +@SRR9130495.46 D00236:723:HG32CBCX2:1:1108:14226:1948/1 +AACCTGCACCCAGAATGGCAGGAGGTCCTGGTGGCCCAGGGGGTCCTGGTGGTCCAGGAACACCAGGTCTCCCANANCCAGGTGGCCCAGGCAGGCCTGGA ++ +??1D1BDDHFHHBBHGGGAFG)AF1:?CEGD@BGAFDGIGGB'5;CE77?=???>>CC3#+#++228>>28((2(>ACC?CCDDCCD@ +@SRR9130495.48 D00236:723:HG32CBCX2:1:1108:15049:1993/1 +TGACCAAGAACTCACAGAGATCCCCCCCCCCAGGGCTAAGATTAAAGGCATGTGCCACTGCCACTGGATAGATATTATCTTTTATTTTACCTGACTGGTTG ++ +@CCFFDDDHDFHGJJJJIJGIHHHIIJJIJFE=(5;?@>@A@;@C>CAB=@<:@C@CA:>CC3:>CB<@@?344>>@@A>CDC>ACDD:>4>>>ACD?CC( +@SRR9130495.49 D00236:723:HG32CBCX2:1:1108:15487:1951/1 +ACGGAGGGTGGGGCTGGGTGATTGTGGTTGTCTCCTTCTTCACCCAGTTCCTCTCTTACGGATCCCCGTTAGCTNTNGGGGTCTTGTATGTAGAATGGCTG ++ +BCCFD@DFDFHHGDGIIICGHIIJJIJGHIIJIIJJJIJIJIJEHIGHHHHHHHFFFFFFDDCDDCD@DDDDD:#+#+2<@8GHIIIEHGACFHIIGGIBHIIHHC??BDC@BBCECDCE63>@@CACCDD@ +@SRR9130495.51 D00236:723:HG32CBCX2:1:1108:15923:1957/1 +CCGCAACTGCCATGGAGCCACAGCCTGGTCCGTAATAGATGCAAAGCTTCTCAATAGTCAGGGGCGTGGTTTCGCGCAGCTTGGAGGCCAGCAACAGGCAG ++ +CCCFFFFFHFHHHIIFIIIGIIFIIGJIIJJIFHGHIIIIIJIIFIJIIIJJJJJJJGGIGJFFH@?BBBDBCDDDDDDDDDDDDDDDDDDDDDDDDDDD? +@SRR9130495.52 D00236:723:HG32CBCX2:1:1108:15793:1968/1 +GTTTTTCCACAGACCTCTGATCTCTTACATTCGAAAGTTCTACTACTATGATCCTCAGGAAGAGGTGTACCTGTCCCTAAAGGAAGCGCAGCTCATTTCCA ++ +BB@FFFFFFFHGDGFHJJJJIFIIGGG@FIIIGIBGGDHIIIJCHIIJJDHIIJJJIIIGIIJJFHHIJCHGDHIIHHHHHFFFFFDDDDDDCDDDDEDDE +@SRR9130495.53 D00236:723:HG32CBCX2:1:1108:16082:1968/1 +GAAACTTGTTTGTGACGTGTGTATTCAACTAACAGAGTTGAACCTTTCTTTTTACAGAGCAGCTTTGAAACACGCTTTTTGTAGAATCAGATCGGAAGAGC ++ +@<@ADDDECBFFHIFEGDG;EEHHB@FHGHIIGGEHGGHGGEGEGICGCEFFDB@D>AE>ADC@CBBFGIIJJJJIHHIJJGH?DGGHCFHHIJJEEIIJAHIJJFG=FGGGIFHHIIDHGEHIHHHHGHGEB;?CDCECEEDD +@SRR9130495.55 D00236:723:HG32CBCX2:1:1108:16048:2000/1 +AGGACAGGAAGGACGCTTTGAGATATGATTTCACAGGCGACAGTGAGAGAAAACCAATGTCTTTAATGCATTTCTCTGCAGCATGTGACAAACTTTCAACA ++ +CCCFFFFDFHGHHIIJJJJIFGGIJJIIIIJIJIHJIIJIHGIJJIJGGIIJIJJHHHHEDCDFFFEEEDDEDEEDDDDDDDDDDCDEDDCDDDDDDCCD@ +@SRR9130495.56 D00236:723:HG32CBCX2:1:1108:16580:1970/1 +GCCTGTACTCCCAGCTACTTGGGAGGCTGAGACAGGAGAATCACTTGAACCCAGGAGGTGGAGGTTGCAGTGAGCCAAGACCGGGCTATTGCACTAGATCG ++ +@@@FFD?DBFFHHIIEHCIJIFIJHEDCH@GGEBFHHIJJIIIIIJJJJJIFHFHF@G-6@AAEDFFF>AEC@@A?;=?BCD6/<@>BAAC>:@C:CDDA? +@SRR9130495.57 D00236:723:HG32CBCX2:1:1108:16594:1971/1 +TCCTCTGACTTTGACACTAGTGTTGACCTTGCATGAGGAGATGTTCTCCATTTGGACTAACCTGATGTACACAGACGTTACACTTATCACAGAATACCATA ++ +CCCFFDDFFHFHFHIJIJJIHIIIJJJJJIJJJJIIIIHIGIIJJJIGIIJJIIJEHIIJIJJJIGIJJJEIHJJIIHHEFFFFFFCCEEEEDCDDDDDDC +@SRR9130495.58 D00236:723:HG32CBCX2:1:1108:16808:1998/1 +ACCAATTTTCCCCTCCCCTTCCTCCCTCCCTCCCAGCCCCCTTCCTCTCTCTACCTCCTGTTATTGTTTTGTTCCTTGTTCTATGTAGGATTGAAGCATCT ++ +@@@FFDDFHDFHGIJJJJIIGGDFHI>DGC;DHI9??FHIJIIHG>>3>;ACCCC9:@>@:>AA +@SRR9130495.59 D00236:723:HG32CBCX2:1:1108:17428:1967/1 +TGCATGGTGCTGAAAGCTTTGTTGCAGCTTTTCTTGGGATTGCTTAGCTGCTCCGGGTCGATCCACTTGCAGATGAGCTCTTGCTTGATGCACTGCTGCCG ++ +?<A3>A>>AAAA?3 +@SRR9130495.60 D00236:723:HG32CBCX2:1:1108:17508:1988/1 +TTGTTCAGAAAAAAGTATCTTGAAACCAAAAGAACTGGGATCTTGTTAAATGCAGATTCTGTTCATTAGGTATAGGTATGCAGTCTTACAAAATGAGGTAG ++ +CCCFFEFFHHHHHJJJJJJJJJJJJJJJJJGIJJJJJJJIIJJJJJJJJIJJIJJJJJJJJJJJIJJIIIEHHBHGHHEFFFFFEEEEDEEDDCDCDDCDC +@SRR9130495.61 D00236:723:HG32CBCX2:1:1108:18425:1951/1 +CCACTTAATAAATCACCTATCAAGTTGAATTATTTGTGCAAAGGCACTAGGCTGAATAGAGACCACTCAGTAGCNTNTTTTTAATCTTGCTAAGAAAGAAT ++ +CCCFFDDFHFHHGJIIJJJJJJHGHEHHHIIJIJJIJGJIHIJHEFDHGHIFIJJGHIJJJFIGGIHIIIJIII#-#-5@DFFEEEDEEEDEDDACDCCBC +@SRR9130495.62 D00236:723:HG32CBCX2:1:1108:18468:1964/1 +CTATTGACTTTTATTAGAAAGGGTCTTGTTGCATAGGTAGGTCTTTAACAACCATCTCTTAAAGGGCTGGGATTGCCAGAGTAGGCCAACACGCCCAGCTA ++ +CCCFFFFFGGHHGIGIJIJJIIIJJJJIJJIJJJJIIJDGEHGIIJJJIJJJHIJJIGFHGIJGEGIJJJIIHHHHHHFFFFFEDEEDDDDDDDBDDBBD@ +@SRR9130495.63 D00236:723:HG32CBCX2:1:1108:18615:1941/1 +NAGCCGAGAGGCGCCGGCTCACCTGCCTGGGTCCCGGCCTTTCTCCTGCAGTGCCAGGGATTCACCTGANGNCNNNNNNTCTNCTAGGCAAGCNNATNCTT ++ +#1:DDFDDHHHHHIIJIIFGJJIEFHHIHHIIIJJIEHFFEEEEEEE?DFF;5:AAB9>29(#+#++8++4>>:@>AA:@1<@@A(:4? +@SRR9130495.72 D00236:723:HG32CBCX2:1:1108:1440:2047/1 +GCTGGTGCAGGACACCAGAATCCGCTCGATCATGCTCCCTAGAGAGGAGGGGCACAGTGAGTACACATAAGCACATGTACACACACACCCAGGACCCAAAG ++ +CCCFFFDEHHGHHHIIIIIIIIJJIJJJGEGHIJIJJJJIIJGHIIJJJIDFEDFFFFEEEEDEDDDDDDDDDDDDDEEEEDDDDDDDDDDDDDDDDDDDA +@SRR9130495.73 D00236:723:HG32CBCX2:1:1108:1468:2080/1 +ACTGTCTTTTTTTTAAAACAGGTGATTGCCCGTTGATTGTTCAGTTTGCTGCTAATGATGCAAGACTTTTATCTGATGCTGCCCTGCTAGTCTGTCCCTAT ++ +CCCFFDDEHFFDHIEIIJHGCGFHCIIHIIIHH@FGGIHIGHIJJIJGIIIJBHIGEIHGHHGGHFFFFFFEEEEDEDDDDDDDDDDDCDDDEDDDDDDDD +@SRR9130495.74 D00236:723:HG32CBCX2:1:1108:1333:2084/1 +ATGAGCACACAAGGGATGATCAGATTGATGGTGTAGAAGAGTGGCTTGCGCTTGATGATGAAGTCATAGGTCACGTCCACATAGCTGGGGTCCTGTGGGTT ++ +CCCFFFFFHHHHHJIJHDIIHHHIIJIIJJJJJIJJIIJIJJJIBDGIJJJJIJJJJGIIIJIAHEEHEFFFFF>EDCDDDDDCDDCDDDDDDDDDCDDDD +@SRR9130495.75 D00236:723:HG32CBCX2:1:1108:1447:2137/1 +TCCACTTGTACAAAAAATTACAAAAATTAGCTGGGCATGGTGGCACACACCTGTAGTCCCAGCTACTCGGGAGGCTGAAGTGGCAGGATCACTTGAGGCAG ++ +CCCFFEFFHFHGHJJJJIJJJJIIDIEHJIIJJJIGJJJHGJIIDHIDGIJIJJIGHIJJJJJHHHFEEBDCDBBDDDDDDDDDDDDDDDDDDDDDCDDD@ +@SRR9130495.76 D00236:723:HG32CBCX2:1:1108:1499:2151/1 +GAGAAAAAGCATCCCTTTAATAAGGCCGCCCCGGTTCCAAATCAATCCTGGCATTGCAGGAGGCAAGGGGGAAACACAGCCACGAAATTGGATTAGCTCTT ++ +CCCFFFFFGGHHHJIIJHIEIJJIIIIJIIGJJIHJIJJIGIJJJIIJJHHHHHFFFFFFDCDBDDDDDDDDDDDCDDDBDBDDBBDDDDDCDDDDCDDCD +@SRR9130495.77 D00236:723:HG32CBCX2:1:1108:1280:2166/1 +GCCTTCTTCCCAGCAGCAATATGGCTCTTTCTTCAGCTCTTATCAGTCACATCCATCAACGAGTGGCTTTTAAAAGGGTATGTTTAAACCTTTTGACGGGA ++ +CCCFFDEFHHHGGJIJJIJIJEIJJJJJIFGIIIIIIIJIIGIJJGIIBHIJJJJIJIEH>CG;CHCHGHICHFFFFFFDDC;@CCEEDDCDDCCDDDDDB +@SRR9130495.78 D00236:723:HG32CBCX2:1:1108:1458:2216/1 +TTTCTTTCCACACATCCCACCTAACACCCAAACTAAGCACTCAGTGCTTGGAATCTCCCCACCCATTCCCTCACCCCTGCTCTTCCATCATTTCCTCCAGC ++ +CCCFFFFFHHHHHIDHIIJJJJHIIJFHIJIJIGIJHGIIIIGJEHIGIIJCGEEHJJJJJJJDHEHHGFFFFFDCDDDDDDDDDDDECCDDEEEDDDDDD +@SRR9130495.79 D00236:723:HG32CBCX2:1:1108:1634:2001/1 +TGTGCATTTCTCATTTTTCACGATTTTCAGTGATTTCGTCATTTTTCAAGTCGTCAAGTGGATGTTTATGATTTTCCATGATTTTCAGTTTTCTTGCCATA ++ +CCCFFFFFHHHHGJJJJJJJJIJHGIJJJJIIIIJJIGIIJJJIJJJIIFIIJJJJJIJJJIJIIIIIIJIJGJJJJFHHGGHGFFFFCEFFDEEDEEDDD +@SRR9130495.80 D00236:723:HG32CBCX2:1:1108:1566:2120/1 +GGACGAAGTAAGGGAGGAGCAACTGACAACATTCATCTTGTCTGTCTCCTCCACGTCCCGAGGTACAAGGCGGATGTCATTCTTACTAATTTTTTTCTTCT ++ +CCCFFFFFHHHHHIIJJJJIJJJIJJJJJJJIFIJJJIJIJIJIIJJIJIJJJJIJJIIJHHFFEEEEEDDDDDDDCDEDEDEEDDDEDDEECDDDDDDDD +@SRR9130495.81 D00236:723:HG32CBCX2:1:1108:1863:2047/1 +AAATTCGGACCCCTTGGGTGGAATATTCCTTACGAATTCAATGAGACAGATCTAAGAATCAGTGTGCAGCAACTCCACATGTTCCTGGACCAGTATGAGGT ++ +@BCFFFFFHHFHHHIJIJGIIIJIJJJJIIJJIIIIJJJJGIJJJIJJIEGIIGIJIJJJEGHHHGEEHFFFFDEEEDDDDEEEDDDDDDDBBCDDCCCCC +@SRR9130495.82 D00236:723:HG32CBCX2:1:1108:1844:2145/1 +TAACTCTCTGCCTGCGATGTCCCTACCTTCCAGAATGGTGCCATGACAACGGTGTCAACTACAAGATCGGAGAGAAGTGGGATCGGCAGGGAGAAAATGGC ++ +@CCFFFFFHHGHHJJJJJJJIJJJJJIJIIIHIIIJIIJJJJIJIIJIJJJJJJJJJIJJIIJEHHGHHFDFDDDDDCDCDDDDDDDDDDD?>BDDDDDDD +@SRR9130495.83 D00236:723:HG32CBCX2:1:1108:1772:2188/1 +GAGGTAGGGGTGTGTGTGAATGGGTGAGTGTGTGCCTATGCTTGTATGCCATATGAGAGAAAATGCAGCATTTAAAATCAGTGGTTAACGGCCAGCACAGT ++ +B@BFDFDDHHDDHHGIGIJIJGIJ:CFHHIGGIJJIEHGIIIJIIIFHGIJBHIJJJJJJCHHIHHHHHGFDFFFFEEEECEEDDDDDDDDDDBDDDDDCA +@SRR9130495.84 D00236:723:HG32CBCX2:1:1108:2103:2085/1 +TACAAATGTGCCAGGCACTCTTCTAAGTCCTCACATGCATGAAGTTATACAACTCTACAACAAACCTAGGAATATAAACTGAGGGCAGGGACCCCCAGCAA ++ +CCCFFFFFHHHHHJIJIJJJJJJJJJJJJIJJJJJJIJJJIJJJFHIJJJJIIJJJJJIJIIHIICHHIJJJIIIJJHHHFHHFDDDDDBDDDDDBDDDDD +@SRR9130495.85 D00236:723:HG32CBCX2:1:1108:2067:2091/1 +ACCAGCCCTGCTGCCACCCAGCCCACGTCCCGCGCGCCACCCATGCTGCTGCCTCGGAGCTGCAGGGAGCCGGGGAGCCAGGGCCACACGCAGGTGCAGCT ++ +?@@D?A:BF8DDFFFFFFFFAECBF@GFECAEFIIIIIIFBE?DBBD;@CCCCBBBBBB@B::AABBBBBB7>BBB>@BB?B>B>BB?/?A?BCCCBDDDD>@ +@SRR9130495.87 D00236:723:HG32CBCX2:1:1108:2387:2038/1 +GGCTAACCACTGCCTTGTCAAGTTGTGTAGAGTGAGATTCAGGGGTGTTGAAGTAATGTCCTTGTTACTTGCTGTAGGGCATCTGTTTTCTGTGTATCCCA ++ +CCCFFDDDDHGHGJEIGHHIJIHGGIIHGIIIIIEGBEHGGHIGGAFHIJJJJJJJJIDGHIIGIJJJIIHGFHEHFDFEDCEECDCDDACCCAACDFCCC +@SRR9130495.88 D00236:723:HG32CBCX2:1:1108:2285:2075/1 +CTGAAAGCTGAGCGTGAGCGTGGTATCACTATTGACATCTCCCTGTGGAAATTCGAGACCAGCAAATACTATGTGACCATCATTGATGCCCCAGGACACAG ++ +?;@DDBDDDFFD>ACGED@D8@):E*::??FFC@;FEF>E;CC=CC=@DDD>?;>A>A>A;AB3;A(;@:??DFBCB4<CCD@=BB@-(4812>>> +@SRR9130495.93 D00236:723:HG32CBCX2:1:1108:2748:2098/1 +CATCATCTTTTTTTTTTTTTTCTCCTGAAAACTGTCTAGTAGTTTGATATATTTTGTCCGAGGTTATTTCAAGTGTTTTTTTTTTTTTTTTTAAAACGGTG ++ +@@@DDDDDHHHHHIIFEHIIH8))7)7CEF9).)7;;>B@>9BD;;(6(55>DDDCBCC@/8-084@CC>C(((+4>?CBBBBBBBBBBB>&23:A(5?(( +@SRR9130495.94 D00236:723:HG32CBCX2:1:1108:2733:2156/1 +GACTGAGAAGAACAGAAAGGGAGAGAGAGGCCAATGGAAATACATGAGAAGGGAGAGAGGGAGAGAGAGGGAGGGAGGGAGGGAAGGAGGGGGAGAGGGAG ++ +CCCFFFEFGHHHHJJGIIIJJHIIHHIIJJJJJIJIIHGJJJGIJJJJJJJJJHGGHHIHHHFDFCDCDDD>BDDBDDDDDDD>BDD?BDDDDBDBDBD@D?ABD@BD?BBDDDC +@SRR9130495.96 D00236:723:HG32CBCX2:1:1108:2818:2076/1 +ACACTTCATGGCAACCTGGCTTAGATTCTTCAAAATTTCTGATCCTATACCAAAGCCTCTGTAATCACTCATCACGAAGAAGTCTTCAAGATACAGTAACT ++ +CCCFFFDDHGHHHJJJJIIJIIHIJHGCHIFEGGJJJJIJIGIIJJJIIJCEHIIIIJIBGHGGIIJIIBFGGGGHHGHFFFFDEEDECEDDDDCD>CCDE +@SRR9130495.97 D00236:723:HG32CBCX2:1:1108:2848:2112/1 +AACCTCTTCTCTTTGTCTTTCTCTTTATCCTTCTCCCTCTTGCCAGGACTGGACTCGCTGGTGATGGTGACGACGCTGGTGGGTAAGGTCTGCGCCCGACT ++ +@@BFFFFEHGHHGIJDEHIJIIIIIIJIFHIIIJEIDHIIIIJJIIIGIEIIJJIIIJFEHFHIIIGIIJIFBEDDBD>=?BB@CACCCAACDDBDBB5;6@;ACBCCCC?@AA>C>?<<<9)?FHFCAG=GFFG>FGGEGHIEEBEDEFC>C@::=BB@BCACCC@CA3:(8@C<8?CC +@SRR9130495.100 D00236:723:HG32CBCX2:1:1108:3014:2117/1 +CCCTCCTGAAAAGGTCCAGCTCCAAAGCCTGACCCGTAGCTGCAGAGAAGAAAGCTTTTCCTCTAAAGGCTGAGGAAAAGATGAAAAATCACTGCTAGAAC ++ +CCCFFFFFHHHHGIJIJJJJJJJJJJJJJJJIJJJIJJIJJJJIJGIDHHIIIJJIJJJJJIJJJHHHHHFFFFDEEEEDDDDDDDDDDDDDDDDDDDDDD +@SRR9130495.101 D00236:723:HG32CBCX2:1:1108:3316:2011/1 +GCAGAGCTGAATGGGCAAGCCCAGGACCCTTTTCAGACATTCTGCTGGCCTTTGGAAAGTGTACTCCTGTTGTATTTGATTACTTTTAGAGGACAGTACAT ++ +CCCFFDDFHHHGHJJJJIJFGIGHJGIJIIIIIHIIGIIJIIIIJJJIIIIJIIIGIJGIJJJJIIJJJEEEE?ECFFFFFFCCEDEEEDDDDDDDDEDCD +@SRR9130495.102 D00236:723:HG32CBCX2:1:1108:3264:2036/1 +GGGTGCTGGAGATAGCCCACGTACACTCCTTCTTGCTGGGGTACTTGTCAGGCCAGTTGGGGCTGGTGATGGTGCCACTGGTGGATGTCACCTTGTGTTCA ++ +=@<=B+AD>BFDFIIDEDGEIGFIIIIIICDFGFFGIII;D?F>?*/9BF>DAF;CFFGI>/:=?>7@BAA:;@5=A5>@=,98?:>@(;:4>ABAB?ABD +@SRR9130495.103 D00236:723:HG32CBCX2:1:1108:3400:2065/1 +TCTGTCTGTCACCAGGTTGGAGTGCAGTGGTAGGATCATGGCTCACTGCAGCCTCGTCCTCTTGGGTTCAAGCAATCCTCCTGCCTCAGCCTCCCAGGTAG ++ +@@BDFFFFHHHGHIJJFHEG@GHHIIAFD@HGGGEHIJJJGIJJGGGIHFDAHHHHJFCGGGHGJI;CHFCEDDFFFCEDEEDDDDDDDD<C +@SRR9130495.104 D00236:723:HG32CBCX2:1:1108:3468:2219/1 +TGCACTTCGTTCTCTTAATGAAACCCTTTGACTTAACCATGACTCCGCTCTGCTCTTGAGTTTGCAAGTGTGTGCGAGTGCCCGAGAGACAGTTTTTTTTT ++ +CCCFFEFFHHHHHJIJIIJJIIJJJIIJJIHIHJJJJJFHFHIIJIJJJJIJIJJJJJGGIIJJJGDIJJJIHHHGFFDDEEEDDDDDDDCCDCEDDDDDD +@SRR9130495.105 D00236:723:HG32CBCX2:1:1108:3722:2006/1 +TCCATAGTTTCGCAGAAGACTTGGAAGGATGTTGATGTATATGCAGGTCCATTATCAGTTTTTAAATTAGATGGTTTTCCCCAAGCTGCCCATGCGTCTAA ++ +CCCFFFDDHHHHHJJIJJIIHGHIGIIDFHHIIIHHIJJIJJIJIJJJJJJIIJJIJG=DHHJJIJIIIJJJJJIGHGHHFFBFDDEEEDDDDDDBBDDDD +@SRR9130495.106 D00236:723:HG32CBCX2:1:1108:3517:2148/1 +CTCTGTTCTGTTCCATTGATCTATATCTCTGTTTTGGTACCAGTACCATGCTGTTTTGGTTACTGTAGCCTTGTAGTATAGTTTGAAGTCAGGTAACGTGA ++ +CCCFFEBFHHHHFGGGIEEHIIJIJJIJJIIJIJJHIIJIIJJIIFHGIIIIJJJJJJFIJIJJJJGIIJIJCHIJIJHGJIJHHHHHHFFFFFFEEDECA +@SRR9130495.107 D00236:723:HG32CBCX2:1:1108:3927:2234/1 +CTGTGCTCTATGTACACGCCCATCTGTTTGCCTGACTACCACAAGCCGCTACCACCGTGCCGTTCCGTGTGCGAGCGCGCCAAGGCCGGCTGCTCGCCGCT ++ +@C@FFFFFHHHHHJJJJGIIJIJJIJEHIIGHGJJIJJJJJJIIGHHIJIJIGHJIIJIHHGFFDEDE?BBDDBDCDDDBDDDDBDD>BDBDDDDBDDDB< +@SRR9130495.108 D00236:723:HG32CBCX2:1:1108:4124:2011/1 +GACTCAGAGCCAGGGCCCGGGAACAGAGATGACTCGAAGGCTAGGGCTCCAGCCAGACTTACCGGCACACGTACACCTCTAGGGGTGGCAGGGTGCTGGGT ++ +CCCFFDDEGGGHHIJIIIJIIIIJIHHJJIJIIJIJIGGIIGIIHIGGIGHBHGHFEFFEECEDDDDDDDDBDDDDDCBACCDDDDDDBDDDDDDDDCD?9 +@SRR9130495.109 D00236:723:HG32CBCX2:1:1108:4130:2090/1 +TTCTATTTCTATAAACTGGCCTATTTTGGGTATTTCATATATATGGAAATATATAATTTGATTTTTTTGTTCTCTTAGCTGTATGTTTTCAGGATTCTTTC ++ +@BBFDFFFHHGHHIJJJJJJJIIIJJJJIJJJIJJJJIJJIIIJJJIJJJJIJIIJJJJJJJJJIHJIJJHHHHHHFFFFFFEEEDECEEDDDDDCDDEDD +@SRR9130495.110 D00236:723:HG32CBCX2:1:1108:4176:2091/1 +AAATTGAAAGTAAATGTATACTGTAGTCCCACGCACGAGTGAATAAAGGGGTGTCTAAAAGGAGTGTGTTCTCTTCCAGGCTGCATCTCTCGGTACTCAGC ++ +;8;ABD?+AA=ADBHIGBHE?ACCCCC +@SRR9130495.111 D00236:723:HG32CBCX2:1:1108:4108:2121/1 +ATGCGGAAGTAGGCAAAAATGATGTGCTAGACTACAAGAATTCCTTTTACAGAAAGTAACAAATACAGAGCCAAGAAAGTTTTTGTTAATTATCACGGTGT ++ +@@@ADADA@AD>FIIBBBFGIBGHJDCIGEGGGHHHIJIIJJJJGHIIEHHEGHJIHGGGIFAGGGGIIG>=CHHFD?@;CCEDDDDCDD>>ACDCB@8<5 +@SRR9130495.112 D00236:723:HG32CBCX2:1:1108:4384:2110/1 +ACACAGGCAGCAATGATGTCTTTACTTCTTTATTTTTTTCGACTTCATCTACAGAGCTTAGCACAGCCATTGGAACAAAATTGGAGCTCAGTGCACAGTTA ++ +@@@FDEFDDFF3CCF?FHCH@DEEGEFHIIFGBGGGDGIHAFBGDDHHIBAGGDGHE@CHAHBFFFFBDD +@SRR9130495.115 D00236:723:HG32CBCX2:1:1108:4445:2247/1 +TCTGTATTCTGTGTCATCTGCCATTCCTTGACTCCCTGCGCCCTTCAGCCCACAGGAAACGTGTGGATGACACACGAGGAGATGGAGTCTCTGACGGCAGC ++ +CCCFFDDDHHHHGJJJJIJJJJBHHJJIIGIIJJJIIGIFIJJIIIIGIJJIIIJIJCHIIJJJIHHFHEFFFFDDDDDBDDCDDCDCDDDDCCCDBBDDB +@SRR9130495.116 D00236:723:HG32CBCX2:1:1108:4698:2005/1 +GAGGGAAGGAGGGAGGGAAAGAAGAAGGGAGAGAGGGAGGAAGGCAGGACTGTCGATGCAAGTACCTCGCTTCCTTGTTCTTAACTCATTTGATTCTTGCT ++ +C@BFFFFFGHHGHIIIJJIBGGDHC@FEGDHIIIHGEHHEGCGIHHHFFFFDEEDDDEDDDDCDCCCDDDDDDDDDDDDDEDCCCDDDCDDDED:CCDDDD +@SRR9130495.117 D00236:723:HG32CBCX2:1:1108:4588:2182/1 +CTGGGGTGCAGTGGTGCAATCATAGCTCACTGCAGCCTCAATTTCCTAGGCTTAAGCATTTCTTCCACCTCAACTTCCCAAGTAGCCAGGATTACAAGCAC ++ +CCCFFADDFFHHGGHHGIIJIJJJJJJHIIJIJJIFIJJEIIJIJIGIJIJJJJJJIJJJIIHIIJHIIFFHGHHFFFFFEDEECCCCBDBDDDDDDCDBC +@SRR9130495.118 D00236:723:HG32CBCX2:1:1108:4964:2029/1 +CCCCGTCTCTACTGAAACACACACACACACACACACACACACACACACACAATTAGCCAGGCGTGGCAGCGTCTGCCTGTAGTCCCAGCTACTCAGGAGGC ++ +;8=:DDDDFFFAFIIFFBEIIEFIFIFIEFFFIIBEGEF?BF<4;A@EE/?;AB>7;7;>@?>B?''5<@;@?;0((4:@>34@@>:4<@>BAB@(948&+ +@SRR9130495.119 D00236:723:HG32CBCX2:1:1108:4831:2078/1 +GCGAAGAAAACTGAAAAAGGTGGAAAATTTAGAAATGTCCACTGTAGGACGTGGAATATGGCAAGAAAACTGAAAATCATGGAAAATGAGAAACATCCACT ++ +CCCFFFFFGFHHFFHGIHDICFHIGGIDHIIJJJJIIIIIGIGHGIJJJJJJJJJJJIJJJIJJIHHHHHFFFFFEEEEEEEDDDDDDDDDDDDDDDDCDD +@SRR9130495.120 D00236:723:HG32CBCX2:1:1108:4877:2117/1 +GCATAATGTTGCCACTGCACTCCAGCTGGGACGACAAAGACTGTCTCTAAAAAAGTAATAAATAAATAAAAGTTTGAAATGCATTGTCCTAGGTTTTAGTC ++ +CCCFFDEFHHHHHIIJJJJJIJIIIGIJJJJJJIIJIJJJIJJJJJJJJJJJJJIIHHGHHHHHFDFFFFFEEEEEEDDDDDCEEDEEDDDDDCDDDDDDD +@SRR9130495.121 D00236:723:HG32CBCX2:1:1108:4918:2158/1 +AAACATGTCAATGGCCAAAAAAAACAGACAATCAAAAAATGGACAAATATATGAACAGACATTTCTCACAAGAGGACATACAAATGGCCAGCAAATATATA ++ +CCCFFFFDHHGHHIIJIJJJIIIJJJJJJJIJJIJJJIIJJJJIJJIJJIHGFHHHHFFFFFEFEEEEEDDDDDDDDCDDDDDDDCCBCDDDDDDDDEEEE +@SRR9130495.122 D00236:723:HG32CBCX2:1:1108:4939:2211/1 +CCTGGTCTCAGCATTCCTCACACGTCATAGCGAGGCCCATGGCTGTAGAAATCCCACCATTCTCTTCTCCCCAGGCCTGGCATCCGTAGAAGCCTACAGCT ++ +@CCFFFFFHHHHDHIDIHIJIJJJJJIGGEGIJIIGIIIJJJGGIJJJJIGGHGIIIJJGHHHHHFFFFEFDEDDDDDDBDDDDDDDDD?CDDDDDDDDAC +@SRR9130495.123 D00236:723:HG32CBCX2:1:1108:5169:2188/1 +TCTGACCCCATGTCCTCAGGCCAGAACCCGGGAGCCTGTCAGAAAAGGTCTCTCACCTAGAGTCCATGCTCTGGAAGCTCCAGGAGGACCTGCAGAGGGTG ++ +??@DD?DFHDFHFIIIIGFHEGGDFFHIBHGIAFIGGIIIFI@CHE@FGH@CDGGIFHEEFCCED@DEEEECCCCCCCCCCCCCCBB8ABC?ACAAABBBB +@SRR9130495.124 D00236:723:HG32CBCX2:1:1108:5192:2231/1 +ACTCTCCTGGCCCACGAGAGAGTCCACACAGGAGAGAAACCTTACCAGTGTCATGAGTGCGGCAAGAACTTTAGTCAGAAATCCTACCTTCAAAGCCATCA ++ +CCCFFFFFHFHHGJJGEFGHGIIEIIFJJJIHGIJIIJIIIJIIGIEHHIGIHIJIIJIIBDFDDDDDDDDDCDDDCCDDDDDDDCDDCDDDDDCDDDDDA +@SRR9130495.125 D00236:723:HG32CBCX2:1:1108:5408:2041/1 +TGTGTGCATCCTCATGTGTCCTTGATAAGTGGTGTGATAAATGAAGGCTTTGCCACATTCCTTACACATGTAGGGCTTCTCTCCAGTGTGAGTCCTCTCAT ++ +@@@DDDEBFHHHHIIIHIFHIDHIIIJHHJIHEGFIIHIJJIIJJEIJGHHIEIEGIIJIJJJGIGHGJJIIGIGIHJEHHHHHFFEFFFCC@CEEDDDDE +@SRR9130495.126 D00236:723:HG32CBCX2:1:1108:5351:2057/1 +CTCTATATATTTTAACAAATGCATAATGTCATGTGTTTACCATTACAGTAGGATAAAGAACAGTCTCATTGCCTTAAAAAGTTCCCTAACATTTTAATTGT ++ +CCCFFDEDFHHHHJIJIIJJJIJJJHJJJJIJIIIHHIJIJIJJJJIIHIJJIIJJJJJIJJJJJJIJIJIJIIJJJJJJJGGIGHHFHFFFFFFFEEEEE +@SRR9130495.127 D00236:723:HG32CBCX2:1:1108:5475:2108/1 +AGCCCAGAAGGCTGGACACACCTCCCCCTCACCCCATCCCGCTCCCCAATCAACCCAGTCCTCAAGAAGCACACTGTGGCTGCTTGCTCTCTTGCCCCCCT ++ +CCCFFDFFHGHGHJJIJJJIGIIIHIGIIJIIJJJIJJJHGIJIJIIIJHHGHHFFEDEEEECCDDDDDDDDDDDDDDDDDDDDDDDDDDCCDCDDDDDDB +@SRR9130495.128 D00236:723:HG32CBCX2:1:1108:5542:2138/1 +TGGCTAGCTACTGCTGCTGCTGCATCAAAGCCCAAATATTCACTGGCATCAGCTGTTTTGTTCTTTAGCATATTAGTAAAGTGCTCATTTAGAGACATCTT ++ +@CCFFFFFHHHHGJIJJIJJJIJJJJJJJJJJJJJJIGGIJJJJJHJJJJJJJJJHIEIIJJJIIJJJIJIIJJJJHHHHHHHF@DFFFFEDEEEEDDCDD +@SRR9130495.129 D00236:723:HG32CBCX2:1:1108:5707:2147/1 +CCAGCATCACTCATGGAACCGGAGGCACTAAGGCCCCTCGGGAGACGCTGAGCAGGTGGGTAGAGGCATACTTCTGGGAGATGGCATCAAGAGCCAGTCAA ++ +CC@FFDDFFDHG>FFFHGGIJIEIIIHIGIGHBHCEHGGGFH@FHGIHHFBFDEEDDEDDDDBDC?BBDCDDDDDC:?A?BDDDCCDC>ACDDDBDDACCC +@SRR9130495.130 D00236:723:HG32CBCX2:1:1108:5614:2168/1 +AAACCATGTCTCTACTAAAACTACAAAAATTAGCTGGGCAACATGGTGGGTGCCTGTATCCCAGCTACCTGGGAGGGTGAGGCACGAGAATCACTTGAACC ++ +CCCFFFFFHHHHHIJJJJIJGJIJJJIJJJJIJJJJJIJJJJIJJHIIHJIJJJJJJJJJJJJJJJJGHFHHF@DDDDDDDDDDDDDDDBDDDDDDDDDDD +@SRR9130495.131 D00236:723:HG32CBCX2:1:1108:5985:2027/1 +GCGGCAGCGGCCGCGATGGAAGAACTTACGGCGTTCGTCTCCAAGTCTTTTGACCAGAAAGTGAAGGAGAAGAAGGAGGCCATCACGTACCGGGAGGTGCT ++ +CCCFFFDDHHDGHFIJFHFFHHBFGHGEIJJJFFDDDDDDDDDDD@CCDCDDDDDAAACACDC@CCDBBBDBD@ +@SRR9130495.132 D00236:723:HG32CBCX2:1:1108:5816:2071/1 +TTTACATATAAGAACCTGATGACCTTTTGTTTTTGTCCAGGAGAGTCCTTCTTGTCTACGAAATGCAGCTATCACAGCAGCTGGACTTGTTTCCTGAATGC ++ +C@CFFDDAFFFHHHHHHGFIHJIJFHHHCAAEHIGHJGCCGHIHEHJJJEHGIIIFIGBBAEHGIJIGIIHHEHHHFFFFEECCABCDCCCCACDDACDA: +@SRR9130495.133 D00236:723:HG32CBCX2:1:1108:5835:2081/1 +CCAGGGCTCCAAGGGGCTGGTTACGAAGTGTCTCCTGCTGCATGAGGTCCCCACGGGAGAGATTGTGGTCCGCCTTGACCTGCAGTTGTTTGATGAGCCGT ++ +@CCDDDFFHHHGHGJGJFHIEHIGCGHIGJGIIIJJJJJJJJJIIIEIJFGIJJIJGCCDDBDDCDDDBDDDDCDDDDDDDD>BACDDDEDDCBD +@SRR9130495.134 D00236:723:HG32CBCX2:1:1108:5841:2101/1 +GGGCATGGTGGCATGCGCCTGTAGTCCCAGCTATTCGGGAAGCTGAGGCAGGAAAATCTCTTGAACCCAGGAGGCGGAGGTTGCAGTGAGCCAAGCTTGCA ++ +@CCF?BDDHFHGHIIIIIIIIIGHGHHIIIFIIIIIGGFGGIIIIEFGGEGHCD>CGGFHHHGGHFFFCDDADDDDDDDBDBCDCCCCA@CCCCBDDDDDD +@SRR9130495.135 D00236:723:HG32CBCX2:1:1108:6165:2044/1 +TTTATACCATTTTTTTTTTTAGCATATATCCTTGTACTTTATAGGAATTATTTGCTTTATTCTCTTGTGACTTGTAAATTGATGTACTTAATTAAATCTTT ++ +@@CBAB;DHFFHHIGIIGGHGFF@?BGB@8=FHEGHIGD=@CGHIA;@EHFHGHBFFFCBD;>(>@A@C>>;>CA;;35>@3;>5>,;3>:;(:@:>:@@C +@SRR9130495.136 D00236:723:HG32CBCX2:1:1108:6059:2069/1 +CTATGACCGCTATGTTGCCATCTGTAGCCCACTGCTTTATAACACTGTAATGTCCCACAAGGTCTGTTCCATAATGATGGCTGTGGTATACTCACTGGGCT ++ +CCBFFDBEHHHHFEGIIGHGIIIJIIHIJIFIJJJJJJJJJJIIJJIJJJJIIHHIJIIIFIHIJFIGIIIHGGHHHHFFFFDEEEEEDEFEDDDCDDDBC +@SRR9130495.137 D00236:723:HG32CBCX2:1:1108:6161:2181/1 +ATGAAGCAACAACCTTATAGGCATTTTAACTCATAGGTTTTAAAACTTAAGGTTATTTTCATAGGAGTCCCTTTTAGCAGAAATGCTCACCACAGGACCAG ++ +@@CGGDD@4???BDHCH@GH<=FHGEGGGIGCEG@E7ACH@:77?C@A@CBAA???2
FFFIGIIGIIIIFDADBDDDDDDDBBBBBBCDD@CDDDD?BDDDDDDCDDBDDDBDDDCCCCCBBCCCDCCCCDDAC>ABDDDCDDDDA@C +@SRR9130495.144 D00236:723:HG32CBCX2:1:1108:6837:2146/1 +CCTGTTATTTTAGTTGTTAAAGGTGGCATTCTGTTCTTGTGGCTGTCTTCTTTTAGGTTTGTTGAGGGATTACCTTCTTGTTTTTTCTAGGGCATTGTTCC ++ +BCCFDDFDHFDHFGIIIIJIGIIJJIDGHIJIIJJJJJJGFIIIHFHHIJJJIGDGIGHGHIJICHGGEHGCHGFEHFHHFDDDDDDDDDDDC?CDDDDCC +@SRR9130495.145 D00236:723:HG32CBCX2:1:1108:6804:2189/1 +TGAATCTCTCTTGGCCTCCTCCCCTCTCATGTCCCCTCCTCCCTCCTCTCCACTTACTCCTCCTCCTCCCCTCCCTCCTCCCAGATGGTTCTGTGTCTTTT ++ +CCCFFEFFHHGHHJJJIJJIJJJJIJJJJJIJIFIJIGIIGGJIJJIIIIIGIIJIJIJGIIIJIJJHHHFDFFDCDCCDDDCDBCCDCDDD@ACCCDDDD +@SRR9130495.146 D00236:723:HG32CBCX2:1:1108:6940:2229/1 +CTTAATGCCACTATCACCACTTCCTTCAAGAGTGAGGGAGAGGAAGAGGAGGAAGAGGAGGAGGAAGAAGAGGAGGAGGAGGAAGAGGAGGGTGAAGGGGA ++ +@@@DBDDEFHHHHGIJIEGGIGECHIFIIJGFHHACCF?D:DFF;?FHH9DFCGGHFG@CA?AB?DD>?A@BDDBB=?B5@BBFCAA@A;;5?BB9;=>;BB?1>A?ABDCC +@SRR9130495.149 D00236:723:HG32CBCX2:1:1108:7167:2101/1 +TTTCATGTTTTAGGTCTTGTAAGCAAGATTTTTCCTGTTGAAAAACTGGTTGAAGAAGCCATCCAATGTGCAGAAAAAATTGCCAGCAATTCTAAAATCGT ++ +?@?DB?DDHHGDHIHHGBIECFDHHE>C7?BB7;@A(5==;88323>CDC9B +@SRR9130495.152 D00236:723:HG32CBCX2:1:1108:7449:2110/1 +GGCTTCAGGAGCTTCAGAAGTTAAGAGCTGCAAAAAAGAAGAAAAAGGATCGGCCAAGTAAAGACTGTTCCAAGTTGGACATGCTTGCTAGAAATTTCCAG ++ +CCCFFDFEHGHHGJIIBEEHHIIIHHIGGJIIJIIGIIGGHIIIJIGGGGGGGIIJJHHFHHGFFFFFEEEEEEEDDDDDDDCDDEDDDDDDDDDDDDEDC +@SRR9130495.153 D00236:723:HG32CBCX2:1:1108:7499:2197/1 +TTCTCATAGTTCAGCTTCCACTTGCGGTAGCTTGTTCCACTTGCGGAACATGTGGTGTTTGGTTTTTTGTACCTGCACTAGTTTGCTGAGAAAGATCGGAA ++ +@@@DDDDEHHFFHABECCAFHHHFDGIHJIIEFGHIIGIGEHEBGG0AEDHGFFFGIDG@EH=ADEBADDE@CCCBCACDDDEEDDCCCBCCC@CC>AB@@ +@SRR9130495.154 D00236:723:HG32CBCX2:1:1108:7309:2205/1 +GGAGGCTGAGGCAGGAGAATCGCTTGGACCCGGGAGGTGTAGGTTGCAGTGAGCCAAGATTGCGCCACTGCACTCCAGCCTGGGTGACAAAGTGAGATATT ++ +BC@FFFDFDHHGFIGIIIJIJJJJJIJJJIIJJJIIIHHIJIJJJIJHHHHGHFFFEBAEECEDDB:@CDDDDCDDDDDDDDDBCBDCDCDDDCDBDCC?ACDD34>C@BD<>>:CB<>@BA8 +@SRR9130495.156 D00236:723:HG32CBCX2:1:1108:7518:2119/1 +TTATCAAAGAGGCCCAAGAGAAACCACTTGTCTGACTTCTACCATATGAGTTTAGAATAAGATGATGGCTGCCTATGAGGAAGCAGGCCCTCAACAGATAC ++ +@@@DDBD4CFFAAHII=G9FDHG;?F@;EEBEFCF>BGBGDBECC@BBBBBBBCCABC@CC +@SRR9130495.157 D00236:723:HG32CBCX2:1:1108:7577:2169/1 +AGTTACTTAATATACCTTAGCCGAAACTTCTGCACTGATTTCCTCCTGTGTTTCAGCCAGCCGCTTTTTGGCAAGTTCGGTTCTCCGATCACACTCTGCAA ++ +@@@DDDFFFFHGHIICGHFH@FGGHGHHJGIHJIJIJGIIIBDHCBGGHEHIJJIGIIIBGIEIGGHHCEBDFEDECD?@DDDDDDDDDDBCCDDDDDDC> +@SRR9130495.158 D00236:723:HG32CBCX2:1:1108:7659:2196/1 +TTCTGATTTTTGCTGCAGCTTCTGCTTATAATCATATGGCCAGTTGTGCTTGTCAGAGTAATGGTGAAGTCCACAAAACAAATTTCCACATCGGCAGTCAA ++ +CCCFDDDDHDFHFGIFCHIII9FHHIGGHHIJJJJIJJEHGEGIIJJJJJJJJDHGI:DFGIIGHGJGCGHGIJJGIIHGHGFFECB@CEC@B@BDD?CCD +@SRR9130495.159 D00236:723:HG32CBCX2:1:1108:7733:2213/1 +GGCCAGATGTTTCTGTAAAGATTGAATTAGATCCCCAGGGAGAGGCAGCACAAAGTGCAAATGAATCAAAAACTGAGTAGAATATTGTAGAGTGCCAATTA ++ +@<@DDA+AFFHHHIIFBHC@@F>@>CC: +@SRR9130495.160 D00236:723:HG32CBCX2:1:1108:7590:2217/1 +GGGGCTGGGCCCACCTGGGACAGAGGGCCACATGTAGAGGCAGCGCTCCCCCGTCTTGAGCTGATCTTTGCAGTCGAATAGCATGAGGTTGGCCCAAGCGA ++ +CC@FFDDDGHHDHIJDGIIACBDDBBBDDD@ +@SRR9130495.161 D00236:723:HG32CBCX2:1:1108:7735:2228/1 +GCAGCACTGTCTGAGTATGGGAGCAAAGCCTAATCTGGCTTGCCCGGCCTCTCACCTCTGTGGCGCTCTGCATCATGGTGCTTCTTGTCATCTTTTATTGC ++ +?@;DDDDDFCFFHIHHGBHIBH?FHIBDEHB@GEIHIEHGHAFFHGEEH<@CC@C@CCA +@SRR9130495.162 D00236:723:HG32CBCX2:1:1108:7898:2065/1 +GTTGGCTTCCCCCTCCCCTCTCCCGTGAGCTGAAAAGCAACAAGGGCTCCACCAGCCTGCAAAATAAGACTTGGGGGGGGGGGGGCAGGGATTGCTTTTTT ++ +@@@FDDDDHHFHFIJIFHIIJJJDHFGIGIGJAFHIDG>@GGFHGGHJIGCHIIGEEHFGF@CFEECC>;>CCABBD<99B@BD99&)&&+9(3(4>(+:0 +@SRR9130495.163 D00236:723:HG32CBCX2:1:1108:7872:2066/1 +CACGCTGGATGAGTTCCTGTTCAGCGACCTGCAGGCGCTGGAAGTGCTGTTGCTCTACAATAACCACATTGTGGTGGTGGACCGGAATGCCTTTGAGGACA ++ +CCCFFFFFGHGGHJJJJJJJJJJIJJJJJJHJJJJJIJJIJJJIGIJJIJJJJIHHHHHHFFDFFEDDEEEEDDDDBDDDDDDDDDDDDDDDDDDDDDDDD +@SRR9130495.164 D00236:723:HG32CBCX2:1:1108:7826:2191/1 +ATCTCTGGACCCAAACTGGAGGGTGACATTAAAGTTCCCAGGGTGGATTTGAAGGGCCCAGAAGTGGACATTTCTGCTCCCAAGGTCAATATTGATGGGAA ++ +CCCFFEFFGHHGHIHHIIJIIIJJIJIGIIJIHIGIJJJJIJJBFGGIJJIJJJJJIJIHFHHFFF@EEDEEFEEDDDDDDDDDBACDDF@CDEDEDDBDD +@SRR9130495.165 D00236:723:HG32CBCX2:1:1108:7791:2195/1 +GGAGAACAGCGTGTAGAGCACTCACAGTCTGCTGCCTTCAGGTGTGGGAGGCACTGCTCACACTGATCTTCTTCCCGGTGTGTGTGGTGTTTGCCTGGATG ++ +CCCFFDEFFGHHHJDIIJJIFJJJJJIJJJGIJJIIJIIIJIJIIGEGHHJJJJJIIFIJJJHHHHFHFFDDFFEDC>9;?BBDDD?CDDDDDDDCC?BDC +@SRR9130495.166 D00236:723:HG32CBCX2:1:1108:7767:2199/1 +GACTAGCCTGGCCAACATGGCAAAACCCAGTCTCTATTAAAAATACAAAAATTAGCTGGGCATGGTGGTGCACGCCTGTAGTCCCAGCTATTCAAGAGGCT ++ +@@@DDDFFFHHFBHBHBDEHHGGGHIIJIIHIHJIEEEIGHEIHIIGHIIHHGJIEHGI?G@CDHI=CA?BDFFACDCCDFCC32??A +@SRR9130495.167 D00236:723:HG32CBCX2:1:1108:7824:2210/1 +GCACCACCGTGCCTGGCTAATTTTTATATATTTAGTAGAGATTGGGTTTCACTGTGTTGGCCAGGCTGATCTTGAACTCTGGACCTCAGGTGATCCTCCCG ++ +@@@FFDDFDFAHHJJIJIIGHHHHHIIJIIDGG>GHHIGGCGHGIEHGGH>FFHJJJHDGBGHJCGGGHFEHHHHFFFFFECDECEDDDCDDDDCCDDCDD +@SRR9130495.168 D00236:723:HG32CBCX2:1:1108:8205:2084/1 +CTTAGCCGCTGGTGATGCTAAGGGCATGGTCAAAGTGTGGCAGCTGAGCACAGCCTTCACAGAACAAGGGCCCCGGGAGGTGGAGGACTTGGATCAGCTAG ++ +CCCFFDEDFFHHHJEGIDHHIIIIJJJIJGIJJJGHJIJIJJJIIIJIGGIIGIJJIGHIIJGEFHGBEFDDDBDDD;>B2<@BBDBBCCCCDDDDDDDDD +@SRR9130495.169 D00236:723:HG32CBCX2:1:1108:8202:2124/1 +GAGACTCTTGCACACATACCGGGGAGCTGGCTCACCCTGGCCCCTCCATCCTGTCAGACTGAAGAGAACAAGTGTCTTAATTTGGGTTTTTCTTATTATTA ++ +CCCFFEFDHFHGHGJIIIJJIJJJIIIGIJJJJFIJJHGIJGHIIJJEEEHFGFFEFECCEEEEDDDDCCAD>CCDDDDCCD?@@A=?8=?=BA93>CA??B@A????8CD(8&8?()(+224@?@>35 +@SRR9130495.179 D00236:723:HG32CBCX2:1:1108:8868:2131/1 +GTACATTGTATCTTTGTTCTCATTAGTTTCAGAGAAATTATTGATTTCTGCCTTTATTTCATTATTTACCCAAGAGTGATTTGGAAGCAGGTTGTTCAGTT ++ +<;;B?D>DFC:DBF@AEDHHAHHGH:A:AC4?BFFEDA?ABD@ACCD:> +@SRR9130495.183 D00236:723:HG32CBCX2:1:1108:9106:2031/1 +CTAGAAATCCTGGATTTTCAGCACAATAACTTAGCCAGGCTCTGGAAACGCGCAAACCCCGGTGGTCCCGTTAATTTCCTGAAGGGGCTGTCTCACCTCCA ++ +C@CFFDFFGGHHFJHIIJGIHCCEHHIGIFIIHIJJFIGJIGIJJIIJHIFGIJIJFFHHFDAD@BCCBDDDDBCC@CDDCCDDAEFC'8;&+)+((&28&&&+((&)&&++((++8((2(((25(&&&(++(0&&&(+((+4(+ +@SRR9130495.186 D00236:723:HG32CBCX2:1:1108:9230:2213/1 +ACTTAGTGCAGTACCCACTATTCCCGCTCAGGCTCCGAATAGTAGATAGAGGGTTCCGATATCTTTGTGATTGGTTGAGAATAATCAACGATTAATGAACA ++ +CCCFFFFEHGFFHFIICIIFIJHHGBHHGIGJJIJGGHIGFHIGIIJJJIIGJCFIJI@EFDFEDFFCCEEEEDDDBDDDDDDDECCDD@BDDDCDDDCDC +@SRR9130495.187 D00236:723:HG32CBCX2:1:1108:9264:2024/1 +AACATAAGGTTTCTCATAAAACAAAGAAAAATGTCAATTCAGTTGTGAATTCATATTGATACCTGGAACTCTCCTGCTAGACCACCTCTAAAGGCCCAGGG ++ +CCCFFFFFHHHGHIJJIDJIJJJDHIIJJJJIJJJJJJJIJJGCHIIJJJJJJJJJJIHJJJJJJGIJJIJIJIIIIJJHHHHGFFFFFECEEDDDDBBBB +@SRR9130495.188 D00236:723:HG32CBCX2:1:1108:9293:2034/1 +GTGGGGAGGTTTGGGAGTGAGCAGCACACCCCAGTTAGACTCCTGTTGGGTTTCATAGGAGCTGGCTGCTGAATGTAAGAGTGCAGGCTACCCCGGGACTT ++ +@@@FDA;1DAFHFIIFBGIGHGADHIGIIIIIIIIHBFEHIIIIIIIIHIACEEEHHBD@CDECECCBBCCACCCCEECCCCCCCCBBBCCCB?9>>>>BC +@SRR9130495.189 D00236:723:HG32CBCX2:1:1108:9484:2048/1 +ATGTAGAGAGAGGGAAAAAAGGAGAGAGAGAAGGATAAAGAGAAGGATGCACAAGAAGACCAAAATACCTGATCATGTAGGGGAGAGCCTCTGGGAGAAGG ++ +@@@DFDDDCDDFHICFHHDGIIHHCHCFFDGHHDCGIJIH@FFHFHGIIGIJIGIGF@CEBDFF@EECDCCCCCCDDEEEDDDDDDDDDDCDDCD<@BDCB +@SRR9130495.190 D00236:723:HG32CBCX2:1:1108:9388:2219/1 +AGCTGCTGCGAGATGGTGGCTTGCATCTCCTTGGACGGCCGCTTGTTCTCCTTGAAGATGGCAATCAGCGTGCGGCGCTGCAGGTCTGTGAACACGAGGCG ++ +B?>3=?>;@DF@>CACC>;>@A>',,88>>-09599(+8>C95>>>00 +@SRR9130495.191 D00236:723:HG32CBCX2:1:1108:9404:2245/1 +TCCGGCTGGTACCTTCATAACTACAGTAATAGAAGACATTGAGTGCCTCCACCGCAGCTGGCCCTCTCTGTTTGTAGCCAAAGATCAGATCTATCCATTCA ++ +CCCFFFFFHHHHHJJIJIIJEIIJJJJJIJJJIJJJIJIIIIIJJJIJJIIJJJJEIJJIHIGHHHFFFFFFDEEEEEDDDDDDDDDDDDDEDCDDDCDCC +@SRR9130495.192 D00236:723:HG32CBCX2:1:1108:9632:2134/1 +ATAGTGGCTGCTGATGGATGTGCTCTATGCAAGGGAGGTGCTCACTATTTCTGTTCGTCAATTTGTAACCCACGGGAGGAAAGGGAACAAAGAGTGAACAA ++ +CCCFFFFFHHHGAEFFHIICHGIJHGFIIIHIJDGIJJIIIEGIJJIIFHEGHGIICHIIFIJJJJIIJJHHHFFDBDD?BDDDDBDBDDBCDD:@CCCCD +@SRR9130495.193 D00236:723:HG32CBCX2:1:1108:9647:2175/1 +AATACCAGCCCAAGACTTTGGGAGAAGGGAAGAAAACAAAGTAAAATAACTTACCACTTTGGCCCAGTCCGAGAACAAGTGAAAATACCCAGGCTGCCCCA ++ +CCCFFFDFGHHFHIIJJGIIIJDIIJIJJJJIIHIIIIJJJHCFHHFHIJJJJJJGIHJJJIJJHGHHHFFFDDDDDCD>CCDDDDDDCDDDBDDDDDDDD +@SRR9130495.194 D00236:723:HG32CBCX2:1:1108:9552:2194/1 +CCATGCCGACACAGGTAGATGGTACGGGGCTGCACGTGGATGTTCATCAGGTAGTATACAATTCGGCTCTGGATGTGGTCCTGCACTCTGTTCACCAAGAA ++ +@@CFFFFFGHGHHJJJIJJJJIJJJIGHFEGGIFIJIJIIIIIJJIIJJIHHHHHHHFFFFFFFDCDDDC@@ACDDCDDDDDDDDDDDDCDDD@CCDDDDD +@SRR9130495.195 D00236:723:HG32CBCX2:1:1108:9620:2235/1 +CCAATGATGGCCAACTAGGCCATCTTCTACTATGTACGCAGCTAGAGGCACGAGCGCTGGGGGTACCGATTAGTTCATATTGGTGTTCCACCTATAGGGTT ++ +===BD?DBAABD8AC3?F?D9C6'5;:>7<<>8:(',&22>(((:>3>+:(+28(43>@B(>:>A((32 +@SRR9130495.196 D00236:723:HG32CBCX2:1:1108:9908:2124/1 +TCTTGTGAAGAAGATGCTGTTGGAAGCCTCTAAGAAGCCCGAACTGAATGCTCTTATAAACAATACCAGAGGAATTATTTTTTACAGTGTCCCTCACCATG ++ +CCCFFFFFHGDFGIIJJIJJIGGJJIIJJIIJHIIIIJJJJI>HHIFIJIJIJJIIHIHIJJJJIHIHHHGFDEFFEEEEEEDDDDDFDEDCCDCDDDDDD +@SRR9130495.197 D00236:723:HG32CBCX2:1:1108:9923:2206/1 +TGGGGCTGTGAACCGAAGTCTGCTCCTTTGCGTGAGCCACCCCTGCAGCCCCTCCCACAGTTCCTGAGGAGCCTTTAGTCCTCGTCCTTTCTCAGCTGTAT ++ +@BCFFDAFHHHHHIIIIHIIJIIJIIJJJIIIJJIGGIIIJJFGGGGGEIIIGFHHEFFFEECCCC@CB@BDDDCDDCCDCCDDABBBCDDCC@CCDCCCD +@SRR9130495.198 D00236:723:HG32CBCX2:1:1108:10131:2036/1 +ATGTGCTCAAAGGCTGGGTGGACCTTACCTCCAGTAAACCCCACGTTGTGAAGAAATCCATCAAGTACCTGGAACAAGGAACTCAAGACACCAAAGATGTG ++ +@CCFFFDDFFBHDHIIIBFEGFGHGHGDFHFGIJJIIHDGEGHIJHFHIIIIJJJJJIIIFHHHFHFFFFFFBAEAACBBCADDDDDDDDADBABCCC>AA +@SRR9130495.199 D00236:723:HG32CBCX2:1:1108:10246:2089/1 +GCCCTGGGATTGTCCCTCTGGGCACAGGGAGTCCTGGGGTTGTCCCTCTGAGTAGTTCTGTTGGGAGAGGAGGCCCTGGGATTGTCCCTCTGGGTACAGGG ++ +CCCFFBDDHHHFHJIIIJJJJIIIIIFIIEHGIGJIJDHJIJIIJJFJIJ@FFCHJJJBEGEHHHDFDCD@DBB;=?A?@BDDDCACDDDDD@?CCCCDCB +@SRR9130495.200 D00236:723:HG32CBCX2:1:1108:10051:2156/1 +ATGGAGGATGGCACCCTGCAGGCTGGCCCAGGAGGTGCCAGTGGGCCTCGTGCCCTGGAAATAAATAAAATGATTTCTTTTTGGAGGAATGCTCATAAACG ++ +@@CDFFDFGFHFFIJGGIICCDDADDB diff --git a/docs/notebooks/min_example.fastq b/docs/notebooks/min_example.fastq new file mode 100644 index 00000000..f4ef5f68 --- /dev/null +++ b/docs/notebooks/min_example.fastq @@ -0,0 +1,12 @@ +@SRR9130495.1 D00236:723:HG32CBCX2:1:1108:1330:1935/1 +NCAATA ++ +#4BDFD +@SRR9130495.2 D00236:723:HG32CBCX2:1:1108:1472:1938/1 +NGTCAA ++ +#1=DDD +@SRR9130495.3 D00236:723:HG32CBCX2:1:1108:1728:1948/1 +GTTTTC ++ +@@@DDD \ No newline at end of file diff --git a/docs/notebooks/tutorial.ipynb b/docs/notebooks/tutorial.ipynb index acd8b329..0aaf92e9 100644 --- a/docs/notebooks/tutorial.ipynb +++ b/docs/notebooks/tutorial.ipynb @@ -4,10 +4,13 @@ "cell_type": "markdown", "id": "947f441f13ced60a", "metadata": {}, - "source": "### Import dependencies" + "source": [ + "### Import dependencies" + ] }, { "cell_type": "code", + "execution_count": null, "id": "7b173024d3e8f76", "metadata": { "ExecuteTime": { @@ -15,30 +18,35 @@ "start_time": "2025-02-24T16:59:36.960817Z" } }, - "source": [ - "import polars_bio as pb\n", - "import pandas as pd\n", - "from polars_bio.range_viz import visualize_intervals" - ], "outputs": [ { - "name": "stderr", - "output_type": "stream", - "text": [ - "INFO:polars_bio:Creating BioSessionContext\n" + "ename": "", + "evalue": "", + "output_type": "error", + "traceback": [ + "\u001b[1;31mRunning cells with 'Python 3.12.10' requires the ipykernel package.\n", + "\u001b[1;31mRun the following command to install 'ipykernel' into the Python environment. \n", + "\u001b[1;31mCommand: '/opt/homebrew/bin/python3.12 -m pip install ipykernel -U --user --force-reinstall'" ] } ], - "execution_count": 1 + "source": [ + "import polars_bio as pb\n", + "import pandas as pd\n", + "from polars_bio.range_viz import visualize_intervals" + ] }, { "cell_type": "markdown", "id": "d2bb8c193890f27f", "metadata": {}, - "source": "### Sample data" + "source": [ + "### Sample data" + ] }, { "cell_type": "code", + "execution_count": 2, "id": "86fe039c3780140e", "metadata": { "ExecuteTime": { @@ -46,6 +54,7 @@ "start_time": "2025-02-24T16:59:37.452650Z" } }, + "outputs": [], "source": [ "df1 = pd.DataFrame(\n", " [[\"chr1\", 1, 5], [\"chr1\", 3, 8], [\"chr1\", 8, 10], [\"chr1\", 12, 14]],\n", @@ -55,18 +64,19 @@ "df2 = pd.DataFrame(\n", " [[\"chr1\", 4, 8], [\"chr1\", 10, 11]], columns=[\"chrom\", \"start\", \"end\"]\n", ")" - ], - "outputs": [], - "execution_count": 2 + ] }, { "cell_type": "markdown", "id": "a884cd2960796fdb", "metadata": {}, - "source": "### Overlap" + "source": [ + "### Overlap" + ] }, { "cell_type": "code", + "execution_count": 3, "id": "304f3aa6fcdc9650", "metadata": { "ExecuteTime": { @@ -74,9 +84,6 @@ "start_time": "2025-02-24T16:59:37.538707Z" } }, - "source": [ - "overlapping_intervals = pb.overlap(df1, df2, output_type=\"pandas.DataFrame\")" - ], "outputs": [ { "name": "stderr", @@ -86,10 +93,13 @@ ] } ], - "execution_count": 3 + "source": [ + "overlapping_intervals = pb.overlap(df1, df2, output_type=\"pandas.DataFrame\")" + ] }, { "cell_type": "code", + "execution_count": 4, "id": "61c9254622598622", "metadata": { "ExecuteTime": { @@ -97,17 +107,9 @@ "start_time": "2025-02-24T16:59:37.552440Z" } }, - "source": [ - "display(overlapping_intervals)" - ], "outputs": [ { "data": { - "text/plain": [ - " chrom_1 start_1 end_1 chrom_2 start_2 end_2\n", - "0 chr1 1 5 chr1 4 8\n", - "1 chr1 3 8 chr1 4 8" - ], "text/html": [ "
\n", "