{ "cells": [
 { "cell_type": "markdown", "metadata": {}, "source": [ "Count the number of lines in workshop1.bam after using head" ] },
 { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [
  "# head stops reading after 10 lines; without the trailing cat, samtools keeps\n",
  "# writing into a closed pipe and prints 'Broken pipe' errors into the cell output.\n",
  "# Draining the rest of the stream avoids that without hiding real errors on stderr.\n",
  "samtools view /data/bam/workshop1.bam | { head; cat > /dev/null; } | wc -l" ] },
 { "cell_type": "markdown", "metadata": {}, "source": [ "How many single reads aligned for workshop1.bam?" ] },
 { "cell_type": "code", "execution_count": 10, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "1241\n" ] } ], "source": [ "samtools view -F 1 /data/bam/workshop1.bam | wc -l" ] },
 { "cell_type": "markdown", "metadata": {}, "source": [ "What does column 3 mean? It's the chromosome (RNAME, the reference sequence name)!" ] },
 { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [
  "# Column 3 of each alignment record is RNAME, the reference sequence name.\n",
  "# Tally the distinct values instead of printing one line per read, which\n",
  "# would flood the notebook with hundreds of identical lines.\n",
  "samtools view /data/bam/workshop1.bam | cut -f 3 | sort | uniq -c" ] },
 { "cell_type": "markdown", "metadata": {}, "source": [ "Convert to lowercase and check for N" ] }, { "cell_type": "code", "execution_count": 13, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "caaagagaaatggattggctggacagtaacccttcttcatacccagggccttctgggatcctgttcctttgaaccagcctttctggctgtcttatgtagaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaacc\n", "cccagggccttctgggatcctgttcctttgaaccagcctttctggctgtcttatgtagaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaacccgat\n", "ccagggccttctgggatcctgttcctttgaaccagcctttctggctgtcttatgtagaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattggg\n", "cttctgggatcctgttcctttgaaccagcctttctggctgtcttatgtagaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaacccgataaaaattcttt\n", 
"ctgttcctttgaaccagcctttctggctgtcttatgtagaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaacccgataaaaattcgtt\n", "tttgaaccagcctttctggctgtcttatgtagaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaac\n", "tttgaaccagcctttctggctgtcttatgtagaatattttcagggtcatagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattgggggaggggc\n", "ttgaaccagcctttctggctgtcttatgtagaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattgggggaggggctcaaacaagaaaataatcaacaa\n", "gaaccagccttgctggctgtcttatgtagaatattttcagggtcctagattggtaaacagttggaggtttcagaaaaacccgataaaaattcttt\n", "ccagcctttctggctgtcttatgtagaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattgggg\n", "agcctttctggctgtcttatgtagaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattgggg\n", "tttctggctgtcttatgtagaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattgggggaggggctcaaac\n", "ttctggctgtcttatgtagaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaacc\n", "tctggctgtcttatgtagaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattg\n", "tctggctgtcttatgtagaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattgggggaggggct\n", "ttatgtagaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaa\n", "tatgtagaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattgggggaggggctca\n", "tgtagaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaac\n", "tagaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattggg\n", "agaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattgggggaggggctcaaacaagaaaataatcaacaagtg\n", "agaatattttcagggtcctagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattgggggaggggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccagggcctcctggggacagcaaga\n", "aatattttcagggtcctagattggtgaacagttggaggtttcaggaaaacccgataaaaattcttta\n", "attttcagggtcctagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattgggggaggggctcaaac\n", "gtcctagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattgggggaggggctcaaacaagaaaataatcaaca\n", 
"gtcctagattggtgaacagttggaggtttcaggaaaaccc\n", "tcctagattggtgaacagttggaggtttcaggaaaac\n", "cctagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattgggggagg\n", "ctagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattgggggaggggctc\n", "tagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattggggga\n", "tagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattgggggaggggctcaaaca\n", "tagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattgggggaggggctcaaacaagaa\n", "tagattggtgaacagttggaggtttcaggaaaacccgataaaaattctttattgg\n", "attggtgaacagttggaggtttcaggaaaacccgataaaaattctttattgg\n", "ggtgaacagttggaggtttcaggaaaacccgataaaaattctttatt\n", "gtgaacagttggaggtttcaggaaaacccgataaaaattctttattgggggaggggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccaggg\n", "tgaacagttggaggtttcaggaaaacccgataaaaattatttattgggggaggggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccaNggc\n", "gaacagttggaggtttcaggaaaacccgataaaaattctttattgggggaggggctcaaacaagaaaataatcaacaagtggtgtccagagtgga\n", "aacagttggaggtttcaggaaaacccgataaaaattctttatt\n", "aacagttggaggtttcaggaaaacccgataaaaattctttattgggggaggggctcaaacaagaaaataatcaacaagtggtgtc\n", "agttggaggtttcaggaaaacccgataaaaattctttattgggggaggggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccagggc\n", "agttggaggtttcaggaaaacccgataaaaattctttattgggggaggggctcaaacaagaaaataatcaacaagtggtg\n", "agttggaggtttcaggaaaacccgataaaaattctt\n", "ttggaggtttcaggaaaacccgataaaaattctttattgggggaggggctcaaaca\n", "aggtttcaggaaaacccgataaaaattctttattgggggaggggctcaaacaagaaaataatcaacaa\n", "gtttcaggaaaacccgataaaaattctttattgggggaggggctcaaacaagaaaataatcaaca\n", "tttcaggaaaacccgataaaaattctttattgggggaggggctcaaacaagaaaataatcaacaagt\n", "tttcaggaaaacccgataaaaattctttattgggggag\n", "tttcaggaaaacccgataaaaattctttattgggggag\n", "tttcaggaaaacccgataaaaattctttattgggggaggggctcaaacaagaaaat\n", "ttcgggaaaacccgataaaaattctttattgggggaggggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccagggcctcctggggacagcaagactgcctggggagcgggaa\n", "ttcaggaaaacccgataaaaattctttattgggggag\n", "aggaaaacccgataaaaattctttattgggggaggggctcaaacaagaaaataatcaat\n", 
"aaaacccgataaaaattctttattgggggaggggctcaaacaa\n", "aacccgataaaaattctttattgggggagcggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccagggcctcct\n", "aacccgataaaaattctttattgggggaggggctcaaacaagaaaataa\n", "ccgataaaaattctttattgggggaggggctcaaacaagaaaata\n", "cgataaaaattctttattgggggaggggctcaaacaagaaaataatcaacaagt\n", "aataaaaattctttattgggggaggggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccagggcctc\n", "ataaaaattctttattgggggaggggctcaaacaagaaaataatcaacaagtggt\n", "ataaaaattctttattgggggaggggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccaggg\n", "taaaaattctttattgggggaggggctcaaacaagaaaataatca\n", "taaaaattctttattgggggaggggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccagggcctcctggggacagcaagactgcctggggagcgg\n", "aaaaattctttattgggggaggggctcaaacaagaaaataatcaa\n", "aaaaattctttattgggggaggggctcaaacaagaaaataatcaacaagtggtgtccagagtggag\n", "aaaattctttattgggggaggggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccagggcct\n", "aaaattctttattgggggaggggctcaaacaagaaaataatcaacaagtg\n", "aattctttattgggggaggggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccagggcctcctggggacag\n", "ttctttattgggggaggggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccagggcctcctggggacagcaagactgcctggg\n", "tttattgggggaggggctcaaacaagaaaataatcaacaagtg\n", "tattgggggaggggctcaaacaagaaaataatcaacaagtggtgtc\n", "tattgggggaggggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccagggcctcctggggacagcaag\n", "aggggagggcctcaaacaagaaaataatcaacaagtggtgtccagagtggagccaggga\n", "gggaggggctcaaacaagaaaataatcaacaagtggtgtccag\n", "ggaggggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccagggcctcctggggacagcaagactgcctggggagcgggaagcagctcccccgtctctgg\n", "ggaggggctcaaacaagaaaataatcaacaagtggtgtcca\n", "ggaggggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccaggg\n", "aggggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccaggg\n", "aggggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccaggg\n", "aaggctcaaacaagaaaataatcaacaagtggtgtccagagtg\n", "ggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccagggcctcctggggacagcaagactg\n", "ggctcaaacaagaaaataatcaacaagtggtgtccagag\n", 
"ctcaaacaagaaaataatcaacaagtggtgtccagagtggagccagggcctcct\n", "ctcaaacaagaaaataatcaacaagtggtgtccagagtggagccagggcctcctggggacagcaagactgcctggggagcgggaagcagctcccccgtctctggggtaggcgtggctggaggggaggctggaccacaggagggcagcgccctggg\n", "tcaaacaagaaaataatcaacaagtggtgtccagagtgga\n", "tcaaacaagaaaataatcaacaagtggtgtccagagtggagccagggcctcctggggacagcaagactgcctggggagcgggaagcagctcccccgtctctggggtaggcgtggctggaggggaggctggaccacaggagggcagcgccctgggcaaccctatgtagatgaagctgcca\n", "caaacaagaaaataatcaacaagtggtgtccagagtgga\n", "aagaaaataatcaacaagtcgtgtccagagtggagccagggcctc\n", "aagaaaataatcaacaagtggtgtccagagtggagccagggcctcctggggacagcaagactgcctggggagcgggaagca\n", "aacaagtggtgtccagagtggagccagggcctcctggggacagcaagactgcctggggagcgggaagcagctcccccgtctctggggtaggcgtggctgg\n", "aacaagtggtgtccagagtggagccagggcctcctggggacagcaagactgcctggggagcgggaagca\n", "agtggtgtccagagtggagccagggcctcctggggacagcaa\n", "tggtgtccagagtggagccagggcctcctggggacagcaagactgc\n", "gtgtccagagtggagccagggcctcctggggacagcaagactgcctg\n", "tgtccagagtggagccagggcctcctggggacagcaagactgcctggggagcgggaagca\n", "tgtccagagtggagccagggcctcctggggacagcaagactgcctcgg\n", "tccagagtggagccagggcctcctggggacagcaaga\n", "cagagtggagccagggcctcctggggacagcaagact\n", "cagagtggagccagggcctcctggggacagcaagactgcctggggagc\n", "agagtggagccagggcctcctggggacagcaagactgcctggggagcgggaagcagctcccccgt\n", "agtggagccagggcctcctggggacagcaagactgcctggggagcgggaagcagctcccccgtctctggg\n", "ccagggcctcctggggacagcaagactgcctggggagcaggaagcagc\n", "ccagggcctcctggggacagcaagactgcctggggagcgggaagcag\n", "agggcctcctggggacagcaagactgcctggggagcgggaagcagctcccccgtctctggggtaggcgtggctggaggggaggctggaccacaggagggcagcgccctgggcaaccctatgta\n", "gggcctcctggggacagcaagactgcctggggagcgggaagcagctcccccgtctctggggtaggcgt\n", "ggcctcctggggacagcaagactgcctggggagcgggaagcagctc\n", "ctcctggggacagcaagactgcctggggagcgggaagcagctcccccgtctctggggtaggcgtg\n", "tcctggggacagcaagactgcctggggagcgggaagcagctcccccgtct\n", "gggacagcaagactgcctggggagcgggaagcagctcccccgtctctggggt\n", "acagcaagactgcctggggagcgggaagcagctcccccgtctctggggtaggcgtggctggagg\n", 
"agcaagactgcctggggagcgggaagcagctcccctgtctctggggtaggcgtggctgga\n", "gcaagactgcctggggagcgggaagcagctcccccgtctctggggtaggcgtggctggaggggaggctggaccacaggagggca\n", "caagactgcctggggagcgggaagcagctcccccgtctttggg\n", "aatactgcctggggagcgggaagcagctcccccgtctctgg\n", "cctggggagcgggaagcagctcccccgtctctggggtaggcgtggctggaggggaggc\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "cctggggagcgggaagcagctcccccgtctctggggtaggcgtggctgga\n", "agcgggaagcagctcccccgtctctggggtaggcgtggctggagggga\n", "aacgggaagcagctcccgcgtctctggggtaggcgtggctggaggggagg\n", "ggaagcagctcccccgtctctggggtaggcgtggctggaggggaggctggaccacaggagggcagcgccctgggca\n", "ggaagcagctcccccgtctctggggtaggcgtggctggaggggaggctggaccacaggagggcagcgccctgggcaaccct\n", "ggaagcagctcccccgtctctggggtaggcgtggctggaggggaggctggaccacaggagggcagcgccctgggcaaccctatgtagatgaagctgccggagaggatcaaagaa\n", "aagcagctcccccgtctctggggtaggcgtggctggaggggaggctggaccacaggagggcagcgccctgggcaaccctatgtagatgaagctgccggagaggatcaaagaaccagacaggaggaaagaggcggtgaagtctcctgtctcatcccttaggaagcctgaggagatgggtaaN\n", "agctcccccgtctctggggtaggcgtggctggaggggaggctgg\n", "gctcccccgtctctggggtaggcgtggctggaggggaggctggaccacaggagggcagcgccctgggcaaccctatgtagatgaagctgccggag\n", "gctcccccgtctctggggtaggcgtggctggaggggaggctggaccacaggagggcagcgccctgggcaaccctatgtagatgaagctgccggagaggatcaaa\n", "cccccgtctctggggtaggcgtggctggaggggaggctggaccacaggagggcagcgccctgggcaa\n", "cccccgtctctggggtaggcgtggctggaggggaggctggaccacaggagggcagc\n", "ccccgtctctggggtaggcgtggctggaggggaggctggaccacaggagggcagcgccctgggcaaccctatgtagatgaagctgccggagaggatcaaagaaccagacaggag\n", "tcccgtctctggggtaggcgtggctggaggggaggctggaccacaggagggcagcgccctgggcaaccctatgt\n", "tccgtctctggggtaggcgtggctggaggggaggctagaccacaggagggca\n", "ccgtctctggggtaggcgtggctggaggggaggctggaccacagga\n", "tctctggggtaggcgtggctggaggggaggctggaccacaggagggcagc\n", "tctggggtaggcatggNtggaggggaggctggaccacaggagggcagcgccctgggcaaacctatgtagatgaagctgccggagaggatcaaaga\n", "ctggggtaggcgtggctggaggggaggctggaccacaggagggcagcgccctgggcaa\n", 
"tggggtaggcgtggctggaggggaggctggaccacaggagggcagcgccctggg\n", "gggtaggcgtggctggaggggaggctggaccacaggagggcagcgccct\n", "taggcgtggctggaggggaggctggaccacaggagggcagcgccctgggcaaccctatgtagatgaa\n", "taggcgtggctggaggggaggctggaccacaggagggcagcgc\n", "cgtggctggaggggaggctggaccacaggagggcagcgccctgggcaaccctatgtg\n", "gctggaggggaggctggaccacaggagggcagcgccctgggcaaccctatgtagatgaagctgccgga\n", "ggggaggctggaccacaggagggcagcgccctgggcaac\n", "gggaggctggaccacaggagggcagtgccctgggcaaccctatgtagat\n", "ggctggaccacaggagggcagcgccctgggcaaccctatgtagatgaagctgccggagaggatcaaagaaccagacaggaggaaagaggcggtgaagtctcctgtctcatccctt\n", "ctggaccacaggagggcagcgccctgggcaaccctatgtagatgaagctgccggagaggatcaaagaaccagacaggaggaaagaggcggtgaagtctcct\n", "ctggaccacaggagggcagcgccctgggcaaccctatgtagatgaagctgccggagtggatcaaa\n", "ctggaccacaggagggcagcgccctgggcaaccctatgtagatgaagctgccggagaggatcaa\n", "tggaccacaggagggcagcgccctgggcaaccctatgtagatgaagctgccggagaggatcaaagaaccagacaggaggaaagaggcggtgaagtctcctgtctcat\n", "gaccacaggagggcagcgccctgggcaaccctatgtagatgaagctgccggagaggatcaaagaaccagacaggaggaaagaggcggtNaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccaggg\n", "acaggagggcagcgccctgggcaaccctatgtagatgaagctgccgg\n", "aggagggcagcgccctgggcaaccctatgtagatgaagctgccggagaggatcaaagaaccag\n", "agggcagcgccctgggcaaccctatgtagatgaagctgccggg\n", "gcagcgccctgggcaaccctatgtagatgaagctgccggagaggatcaaagaaccagacagga\n", "gcagcgccctgggcaaccctatgtagatgaagctgccggagaggatcaaagaaccagacagga\n", "cagcgccctgggcaaccctatgtagatgaagctgccggagaggatcaaagaaccagacaggaggaaaga\n", "cagcgccctgggcaaccctatgtagatgaagctgccggagaggatcaaagaaccagacagga\n", "cagcgccctgggcaaccctatgtagatgaagctgccggagaggatcaaagaaccagacaggaggaaagaggcggtgaagtctcctgtctcatccctta\n", "ctgggcaaccctatgtagatgaagctgccggagaggatcaaagaaccagacaggaggaaagaggcggtgaagtct\n", "ctgggcaaccctatgtagatgaagctgccggagaggatcaaagaaccagacaggaggaaaga\n", "tgggcaaccctatgtagatgaagctgccggagaggatcaaagaa\n", "gggcaaccctatgtagatgaagctgccggagaggatcaaagaaccagac\n", "ggcaaccctatgtagatgaagctgccggagaggatcaaa\n", 
"gcaaccctatgtagatgaagctgccggagaggatcaaagaaccagacaggaggaaagaggcggtgaagtctcctgtctcatccctt\n", "gcaaccctatgtagatgaagctgccggagaggatcaaagaaccagacaggaggaaagaggcggtgaagtctcccgtctcatcccttagg\n", "acaaccctatgtagatgaagctgccggagaggatcaaagaaccagacagga\n", "caaccctaagtagatgaagctgccggagaggatcaaagaaccagacaggaggaaa\n", "caaccctatgtagatgaagctgccggagaggatcaaagaaccagacaggaggaaagaggcggtgaagtctcctg\n", "aaccctatgtagatgaagctgccggagaggatcaaagaaccagacaggaggaaagaggcggtgaagtc\n", "cctatgtagatgaagctgccggagaggatcaaagaaccagacaggaggaaagag\n", "atgtagatgaagctgccggagaggatcaaagaaccagacagga\n", "tagatgaagctgccggagaggatcaaagaaccagacagga\n", "tagatgaagctgccggagaggatcaaagaaccagacaggaggaaaga\n", "gatgaagctgccggagaggatcaaagaaccagacaggaggaaagaggcggtgaagtctcctgtct\n", "atgaagctgccggagaggatcaaagaaccagacaggaggaaaga\n", "atgaagctgccggagaggatcaaagaaccagacaggaggaaagaggcggtgaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaac\n", "agctgccggagaggatcaaagaaccagacaggaggaaagaggcg\n", "ctgccggagaggatcaaagaaccagacaggaggaaagaggcggt\n", "ctgccggagaggatcaaagaaccagacaggaggaaagaggcg\n", "tgccggagaggatcaaagaaccagacaggaggaaagaggcggt\n", "ccggagaggatcaaagaaccagacaggaggaaagaggcggtgaa\n", "ggagaggatcaaagaaccagacaggaggaaagaggcggtgaagtctcctgtctcatcccttaggaagcctgagg\n", "agaggatcaaagaaccagacaggaggaaagaggcggtgaagt\n", "aggatcaaagaaccagacaggaggaaagaggcggtgaagtctcctgtctcatccct\n", "aggatcaaagaaccagacaggaggaaagaggcggtgaagtctcct\n", "aggatcaaagaaccagacaggaggaaagaggcggtgaagtctc\n", "ggatcaaagaaccagacaggaggaaagaggcggtgaagtctc\n", "tcaaagaaccagacaggaggaaagaggcggtgaagtctcctgt\n", "tcaaagaaccagacaggaggaaagaggcggtgaagtct\n", "aaagaaccagacaggaggaaagaggcggtgaagtctcctgtctcat\n", "aaagaaccagacaggaggaaagaggcggtgaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccaggggcagaggatagtt\n", "aaagaaccagacaggaggaaagaggcggtgaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccaggggcagaggatagttgtaggcagatctgtgagctcaggtccttacctgacagg\n", 
"agaaccagacaggaggaaagaggcggttaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcttttacaagcctcaaacNc\n", "aaccagacaggaggaaagaggcggtgaagtctcctgtctcatcccttaggaa\n", "aaccagacaggaggaaagaggcggtgaagtctcctgtctcatccct\n", "aaccagacaggaggaaagaggcggtgaagtctcctgtctca\n", "aaccagacaggaggaaagaggcggtgaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaac\n", "accagacaggaggaaagaggcggtgaagtctcctgtctcatcccttaggaagcctgaggagatgggta\n", "agacaggaggaaagaggcggtgaagtctcctgtctcatccctta\n", "agacaggaggaaagaggcggtgaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagg\n", "aggaggaaagaggtggtgaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttaga\n", "aggaggaaagaggcggtgaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaa\n", "aggaggaaagaggcggtgaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatt\n", "ggaggaaagaggcggtgaagtctcctgtctcatcccttaggaagcctgaggagatg\n", "gaggaaagaggcggtgaagtctcctgtctcatcccttagga\n", "gaggaaagaggcggtgaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcattta\n", "gaggaaagaggcggtgaagtctcctgtctcatcccttaggaagcctgaa\n", "aagaggcggtgaagtctcctgtctcatcccttaggaag\n", "agaggcggtgaagtctcctgtctcatcccttaggaagcctgagg\n", "aggcggtgaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcattta\n", "tNgtgaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccaggggcagaggatagttgtaggcagatct\n", "tgaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccaggggcagaggatagttgtaggcagatctgt\n", "gaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaacc\n", "gaagtctcctgtctcatcccttaggaagcctgaggagatgggtaag\n", "aagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaat\n", "aagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccaggggcaga\n", "agtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccaggggcagaggatagttgtaggcagatctgtga\n", "gtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccaggggcaga\n", "gtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctagaaccccaggggcagaggatagtt\n", 
"tctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaat\n", "cctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctt\n", "cctgtctcatcccttaggaagcctgaggagatgggtaagggcattt\n", "ctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccaggggcagaggatagttgtaggcagatctgtgagctt\n", "ctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaa\n", "tgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccaggggcagaggatagttgtaggcagatctgtgagctcaggtccttacctgacaggggagggcccagga\n", "tctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccaggggcagag\n", "tcatcccttaggaagcctgaggagatgggtaagggcatttagaa\n", "catcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccaggggcagaggatagttgtaggcagatctgtgagctcaggtcctta\n", "atcccttNggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccagg\n", "atcccttaggaagcctgaggagatgggtaagggcatttagaa\n", "atcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccaggggcagaggatagttgtaggcagatctgtgagctcag\n", "atcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccc\n", "cccttaggaagcctgaggagatgggtaagggcatttagaagcctc\n", "ccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccaggggcagaggata\n", "ttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccaggggcagaggata\n", "agcctgaggagatgggtaacggcatttagaagcctcgaaccccaggggcaga\n", "ctgaggagatgggtaagggcatttagaagcctcgaaccccaggggcagaggatagttgtaggc\n", "gaggagatgggtaagggcatttagaagcctcgaaccccaggggcagaggatagttgtaggcagatctgtga\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "aggagatgggtaagggcatttagaagcctcgaaccccaggggcagaggatagttgtaggcagatctgt\n", "ggagatgggtaagggcatttagaagcctcgaaccccaggggcagaggatagtt\n", "agatgggtaagggcatttagaagcctcgaaccccaggggcagaggatagttgtaggcagatctgtga\n", "agatgggtaagggcatttagaagcctcgaaccccaggggca\n", "gatgtgtaagggcatttagaagcctcgaaccccaggggcagaggatagttgta\n", "ggtaagggcatttagaagcctcgaaccccaggggcagaggatagttgtag\n", "gtaagggcatttagaagcctcgaaccccaggggcagaggatagttgtaggcagatctgtgagctca\n", "taagggcatttagaagcctcgaaccccaggggcagaggatagttgtaggca\n", "catttagaagcctcgaaccccaggggcagaggatagttgtaggcagatctgtgagctcaggtcctta\n", 
"atttagaagcctcgaaccccaggggcagaggatagttgtaggcagatctgtgagctcaggtccttacctgacaggggagggccca\n", "ttagaagcctcgaaccccaggggcagaggatagttgtaggcagatctgtgagctcaggtccttacctgacaggggagggcccaggagccccccgaggct\n", "gaagcctcgaaccccaggggcagaggatagttgtaggcagatctgtgagctcaggtcct\n", "aaagcctcgaaccccaggggcagaggatagttgtaggcagatctgt\n", "gaagcctcgaaccccaggggcagaggatagttgtaggcagatctgt\n", "aagcctcgaaccccaggggcagaggatagttgtaggcagatct\n", "cctcgaaccccaggggcagaggatagttgtaggcagatct\n", "ctcgaaccccaggggcagaggatagttgtaggcagatctgtgagctcaggtccttacctgacaggggagggcccagga\n", "tcgaaccccaggggcagaggatagttgtaggcagatctgtgagctcaggtccttacctga\n", "aaccccatgggcagaggatagttgtaggcagatctgtgagctcaggtccttacctgacaggggagggc\n", "cccaggggcagaggatagttgtaggcagatctgtgagctcaggtccttacctgacagggga\n", "ccaggggcagaggatagttgtaggcagatctgtgagctcaggtccttacctgacagggga\n", "ccaggggcagaggatagttgtaggcagatctgtgagctcaggtcctta\n", "ccaggggcagaggatagttgtaggcagatctgtgagctcaggtccttacctgacaggggagggccca\n", "gggcagaggatagttgtaggcagatctgtgagctcaggtcct\n", "gggcagaggatagttgtaggcagatctgtgagctcaggtcctt\n", "gggcagaggatagttgtaggcagatctgtgagctcag\n", "ggcagaggatagttgtaggcagatctgtgagctcaggtcctta\n", "cagaggatagttgtaggcagatctgtgagctcaggtccttacctgaca\n", "agaggatagttgtaggcagatctgtgagctcaggtccttacctgac\n", "aggatagttgtaggcagatctgtgagctcaggtccttacctgacagggga\n", "gatagttgtaggcagatctgtgagctcaggtccttacctgacagggga\n", "gatagttgtaggcagatctgtgagctcaggtccttacctgacaggggagggccaggagccccccgaggctcatcagcatcatcaccagccctgtggcctgcaccacacctccgacgcccaccagcccggggagtacaccgaaaaccagcggggcgtaactccccg\n", "agttgtaggcagatctgtgagctcaggtccttacctgacaggggaggg\n", "ttgtaggcagatctgtgagctcaggtccttacctgacaggggag\n", "taggcagatctgtgagctcaggtccttacctgacaggggagggcccaggagccccccgaggctcatcagcatcatcaccagccct\n", "ggcagatctgtgagctcaggtccttacctgacaggggagggcccaggagccccacgaggctcatcagcatcat\n", "gcagatctgtgagctcaggtccttacctgacaggggagggcccaggagccccccgaggctcatcagcatcatcaccagccctgtggcctgcaccacacctccgacgcccaccagcccggggagtacaccgaaaacca\n", "gcagatctgtgagctcaggtccttacctgacaggggaa\n", 
"atctgtgagctcaggtccttacctgacaggggagggccc\n", "atctgtgagctcaggtccttacctgacaggggagg\n", "tctgtgagctcaggtccttacctgacaggggagggcccaggagccccccgaggctcatcagcatcatcaccagccctgtggcctgcaccacacct\n", "tgagctcaggtccttacctgacaggggagggcccaggagccccccgaggctcatcagcatcatcaccagccctgtggcctgcaccacacctccgacgcccaccagcccggggagtacaccgaaaacca\n", "ctcaggtccttacctgacaggggagggcccaggagccccccgaggctcatcagcatcatcacta\n", "gtccttacctgacaggggagggcccaggagccccccgaggctcatcagcatcatcaccagccct\n", "tccttacctgacaggggagggcccaggagccccccgaggctcatcagcat\n", "tccttacctgacaggggagggcccaggagccccccgaggctcatcagcatcatcaccagccctgtggcctgcaccacacctccgacgcccaccagcccggg\n", "tccttacctgacaggggagggcccaggagccccccgaggctcatca\n", "tccttacctgacaggggagggcccaggagccccccga\n", "ttacctgacaggggagggcccaggagccccccgaggctcatcagcatcatcaccagccctgt\n", "gacaggggagggcccaggagccccccgaggctcatcagcatcatcaccagccctgtggcctgcaccacacctccgacgcccaccagcccggggagtacaccgaaaaccagcggggcgtaact\n", "aacaggggagggcccaggagccccccgaggctcatcagcat\n", "acaggggagggcccaggagccccccgaggctcatcagcatca\n", "agagggcccaggagccccccgaggctcatcagcatcatcaccagc\n", "agggcccaggagcccccNgaggctcatcagcatcatcaccagccctgtggcctgcacca\n", "ccaggagccccccgaggctcatcagcatcatcaccagccctgtggcctgcaccacacctccgacgcccaccagcccggggagtacaccgaaaaccagcggggcgtaact\n", "aggagccccccgaggctcatcagcatcatcaccagccctgtggcctgcaccacacctccgacgcccaccagcccggggagtacaccgaaaaccagcggggcgtaactccccgcgctcagcccataggccacagccgcggccagcaggggactcccccagctctcttcgccgcc\n", "agccccccgaggctcatcagcatcatcaccagccctgtggcctg\n", "gccccccgaggctcatcagcatcatcaccagccctgtggcctgcaccaca\n", "ccccgaggctcatcagcatcatcaccagccctgtggcctgcaccacacctccgacgcccaccagccc\n", "cccgaggctcatcagcatcatcaccagccctgtggcctgcacaacacctcc\n", "ccgaggctcatcagcatcatcaccagccctgtggcctgt\n", "cgaggctcatcagcatcatcaccagccctgtggcctgcat\n", "cgaggctcatcagcatcatcaccagccctgtggcctgcaccacacctccgacgccca\n", "cgaggctcatcagcatcatcaccagccctgtggcctgcaccacac\n", "aaggctcatcagcatcatcaccagccctgtggcctgcaccacac\n", "aggctcatcagcatcatcaccagccctgtggcctgcaccacacctccgacgcccacc\n", 
"tcatcagcatcatcaccagccctgtggcctgcaccacacct\n", "tcatcagcatcatcaccagccctgtggcctgcaccacacctccgacgcccacca\n", "tcatcagcatcatcaccagccctgtggcctgcaccacacctccgacgcccaccagccc\n", "tcatcagcatcatcaccagccctgtggcctgcaccacacctcc\n", "gcatcatcaccagccctgtggcctgcaccacacctccgacgcccaccagcccggggagtacaccgaaaacca\n", "catcatcaccagccctgtggcctgcaccacacctccgacgcccaccag\n", "atcatcaccagccctgtggcctgcaccacacctccgacgcccacc\n", "atcatcaccagccctgtggcctgcaccacacctccgacgcccaccagcccggggagtacacc\n", "tcaccagccctgtggcctgcaccacacctccgacgcccaccagcccgggga\n", "accagccctgtggcctgcaccacacctccgacgcccaccagcccggggagtacaccgaaaaccagcggggcgtaactccccgcgctcagcccataggccacagccgcggccagcagggga\n", "cagccctgtggcctgcaccacacctccgacgcccaccagcccggggagtacaccgaaaaccagcggggc\n", "agccctgtggcctgcaccacacctccgacgcccaccagcccggggagtacaccgaaaaccagcggggcgtaact\n", "agccctgtggcctgcaccacacctccgacgcccaccagcccggggagtacaccgaaaaccagcggggcgtaactccccgcgctcagccc\n", "ccctgtggcctgcaccacacctccgacgcccaccagcccggggagtacaccgaaaaccagcgtggcgtaactccccg\n", "gcctgcaccacacctccgacgcccaccagcccggggagtacaccgaaaaccagc\n", "gcctgcaccacacctccgacgcccaccagcccggggagtacaccgaaaaccagcggggcgtaactccccgcgctcagcccataggccacagccgcggccagcaggggactcccccagctctcttcgccgccca\n", "acctgcaccacacctccgacgcccaccagcccggggagtaca\n", "cctgcaccacacctccgactcccaccagcccggggagtacaccgaaaaccagcggggcgtaactccccgcgctcagcccataggccaca\n", "cctgcaccacacctccgacgcccaccagcccggggagtacaccgaaaat\n", "tgcaccacacctccgacgcccaccagcccggggagtaca\n", "tgcaccacacctccgacgcccaccagcccggggagtacaccgaaaaccagcggggcgt\n", "gcaccacacctccgacgcccaccagcccggggagtacaccgaaaaccagcggggcNtNac\n", "caccacacctccgacgcccaccagcccggggagtacaccgaaaaccagcggggcgtaactccccgcgctcagcccataggccacagccgcggccagcagg\n", "taccacacctccgacgcacaccagcccggggagtacaccgaaaaccagcg\n", "accacacctccgacgcccaccagcccggggagtacaccgaaaaccagcggggcgtaactccccgcgctcagcccataggccacagcc\n", "cacacctccgacgcccaccagcccggggagtacaccgaaaaccagcggggcgta\n", 
"acacctccgacgcccaccagcccggggagtacaccgaaaaccagcggggcgtaactccccgcgctcagcccataggccacagccgcggccagcaggggactcccccagctctcttcgccgcccaccacgggcaccagccccaccacccacagccccagcccagtcaga\n", "acctccgacgctcaccagcccggggagtacaccgaaaaccagcggggcgtaactccccgcgctca\n", "acctccgacgcccaccagcccggggagtacaccgaaaaccagcgg\n", "acctccgacgcccaccagcccggggagtacaccgaaaaccagcggggcgtaactccccgcgct\n", "acctccgacgcccaccagcccggggagtacaccgaaaaccagcggggcgtaactccccgcgctcagcccataggccacagccgcggccagcaggg\n", "tccgacgcccaccagcccggggagtacaccgaaaaccagcggggcgtaactccccgcgctcagcccataggccacagcc\n", "tccgacgcccaccagcccggggagtacaccgaaaaccagcggggcgtaact\n", "gcccaccagcccggggagtacaccgaaaaccagcggggcgtaactccc\n", "cccaccagcccggggagtacaccgaaaaccagcggggcgtaactccccgcgctcagcccataggccacagc\n", "ccaccagcccggggagtacaccgaaaaccagcggggcgtaactccccgcgctcagt\n", "caccagcccggggagtacaccgaaaaccagcggggcgta\n", "accagcccggggagtacaccgaaaaccagcggggcgtaat\n", "cagcccggggagtacaccgaaaaccNgcggggcgtaactccccgcgctcagcccatag\n", "agcccggggagtacaccgaaaaccagcggggcgtaactccccgcgctcagcccataggccaca\n", "cccggggagtacaccgaaaaccagcggggcgtaactccccgcgctca\n", "ccggggagtacaccgaaaaccagcggggcgtaactccccgcgctcagc\n", "ggagtacaccgaaaaccagcggggcgtaactccccgcgctcagcccataggccacagccgcggccagcaggggactcccccagctctcttcgccgcccaccacgggcacca\n", "gaagtacaccgaaaaccagcggggcgtaactccccgcgctcagcccataggccacagccgcggccag\n", "agtacaccgaaaaccagcggggcgtaactccccgcgctcagcccataggccacagccgcggcca\n", "agtacaccgaaaaccagcggggcgtaactccccgcgctcag\n", "agtacaccgaaaaccagcggggcgtaactccccgcgctcagcccataggccacagccgcggccagcaggggactcccccagctct\n", "ttacaccgaaaaccagcggggcgtaactccccgcgctcagcccataggccacag\n", "tacaccgaaaaccagcggggcgtaactccccgcactca\n", "tacaccgaaaaccagcggggcgtaactccccgcgctcagc\n", "accgaaaaccagcggggcgtaactccccgcgctcagcccataggccacagc\n", "accgaaaaccagcggggcgtaactccccgcgctcag\n", "cgaaaaccagcggggcgtaactccccgcgctcagcccat\n", "agcggggcgtaactccccgcgctcagctcataggccacagccgcggcca\n", "cgtaactccccgcgctcagcccataggccacagccgctgcca\n", "gtaactccccgcgctcagcccataggccacagccgcggccagcaggggactccccc\n", 
"taactccccgcgctcagcccataggccacagccgcggccagcaggggactcccccagctctcttcgccgcccaccacgggcaccagccccaccacccacagccccagcccagtca\n", "aactccccgcgctcagcccataggccacagccgcggccagcaggggactcccccagctctcttcgccgcc\n", "actccccgcgctcagcccataggccacagccgcggccagcagggga\n", "ataggccacagccgcggccagcaggggactcccccagctctcttcgccgcccaccacggg\n", "ataggccacagccgtggccagcaggggactcccccagctctcttcg\n", "ataggccacagccgcggccagcaggggactcccccagctctcttcgccgccca\n", "ccacagccgcggccagcaggggactcccccagctctcttcgccgcccaccacgggcaccagccccaccacccacagccccagcccagtcagagccccgaatacggccagcagccgcggg\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "ccgcggccagcaggggactcccccagctctcttcgccgccca\n", "ggccagcaggggactcccccagctctcttcgccgcccaccaccggcacca\n", "agccagcaggggactcccccagctctcttcgccgcccaccacgggcaccagccccaccacccacagccccagcccagtcagagccccgaata\n", "ccagcaggggactcccccagctctcttcgccgcccaccacgg\n", "aggggactcccccagctctcttcgccgcccaccacgggcaccagccccaccacccacagccccagcccagtcagagccccgaatacggccagcagccgcgggaggggcacccagccttggtctgccagccacccgcagaccagccgggcgcccgcatcccccatcgcagccacgg\n", "aactcccccagctctcttcgccgcccaccacgggcacc\n", "actcccccagctctcttcgccgcccaccacgggcaccagccccaccacccacagtt\n", "actcccccagctctcttcgccgcccaccacgggcaccagccccaccacccaca\n", "actcccccagctctcttcgccgcccaccacgggcaccagccccaccacccacag\n", "ccccagctctcttcgccgcccaccacgggcaccagccccaccacccacagccccagcccagtcagagccccgaatacggccagcagccgcgggaggggcacccagccttggtctgccagtcacccgcagac\n", "agctctcttcgccgcccaccacgggcaccagccccaccacccacagccccagcccagtcagagccccgaatacggccagcagccgcgggaggggcaccca\n", "agctctcttcgccgcccaccacgggcaccagccccaccacccacagcccca\n", "gctctcttcgccgcccaccacgggcaccagccccaccacccacagccccagcccagt\n", "ttctcttcgccgcccaccacgggcaccagccccaccaccca\n", "cttcgccgcccaccacgggcaccagccccaccacccacagccccagcccagt\n", "ttcgccgcccaccacgggcaccagccccaccacccacagccccagcccagtcagag\n", "gccgcccaccacgggcaccagccccaacacccacagcaccagc\n", "ccacgggcaccagccccaccacccacagccccagcccagtcagagccccgaatacggccagcagccgcgg\n", 
"cacgggcaccagccccaccacccacagccccagcccagtcagagccccgaatacggccagcagccgcgggaggggcacccag\n", "acgggcaccagccccaccacccacagccccagcccagtcagagccccgaata\n", "acgggcacccgccccaccacccacagccccagcccagtcagagccccgaatacggacagcagccgcgga\n", "cgggcaccagccccaccacccacagccccagcccagtcagagcctt\n", "caccagccccaccacccacagccccagcccagtcagagccccgaatacggccagcagccgcggg\n", "cagccccaccacccacagccccagcccagtcagagccccgaatacggccagcagccgcgggaggggcacccagccttggtctgccagccaaccgcagacca\n", "cccaccacccacagccccagcccagtcagagccccgaatacggccagcagccgcgggagg\n", "ccaccacccacagccccagcccagtcagagccccgaatacggccagcagccgcgggaggggcacc\n", "acccacagccccagcccagtcagagccccgaatacggccagca\n", "cccacagccccagcccagtcagagccccgaatacggccagcagccgcgggaggggcacccagccttggtctgccagccacccgcagaccagccgggcgcc\n", "ccacagccccagcccagtcagagccccgaatacggccagcagccgcgg\n", "acagccccagcccagtcagagccccgaatacggccagcagccgcgggaggggcacccagcct\n", "tagccccagcccagtcagagccccgaatacggccagcagccgcgggag\n", "agccccagcccagtcagagccccgaatacggccagcagccgcgg\n", "agccccagcccagtcagagccccgaatacggccagcagccgcgggaggggcacccagccttggtctgccagccacccgcagaccagccgggcgcccgcatc\n", "ccagcccagtcagagccccgaatacggccagcagccgcgggaggggcacccagcct\n", "agcccagtcagagccccgaatacggccagcagccgcgg\n", "ccagtcagagccccgaatacggccagcagccgcgggaggggcacccagccttggtctgccagccacccgcagaccagccg\n", "agagccccgaatacggccagcagccgcgggaggggcacccagcct\n", "gagccccgaatacggccagcagccgcgggaggggcacccagccttggtctgccagccac\n", "agcaccgaatacggccagcagccgcgggaggagcacccagacttggtctgccagccacccgcagaacagccgggcgaccgcatcccccatcgcagccacggccaccaccagctctgctccgtatccccccaggccccggtctaaagcgtggggagccaagtgcacgtaagga\n", "cccgaatacggccagcagccgcgggaggggcacccagccttggtctgccagccacc\n", "ccgaatacggccagcagccgcgggaggggcacccagccttggtctgccagccac\n", "cgaatacggccagcagccgcgggaggggcacccagcctta\n", "gaatacggccagcagccgcgggaggggcacccagccttggt\n", "gaatacggccagcagccgcgggaggggcacccagccttggtc\n", "tagcagccgcgggaggggcacccagccttggtctgccagccacccgcagaccagccgg\n", "cagcagccgcgggaggggcacccagccttggtctgccagccacccgcagaccagccgggcgcccgcatcccccatcgcagccacggccaccaccagcgctgctccg\n", 
"cagccgcgggaggggcacccagccttggtctgccagccacccgcagacc\n", "agccgcgggaggggcacccagccttggtctgccagccacccgcagaccagccgggcgcccgcatcccccatcgcagccacggccaccaccagcgctgc\n", "agccgcgggaggggcacccagccttggtctgccagccacccgcagaccagcc\n", "ccgcgggaggggcacccagccttggtctgccagccacg\n", "cgcgggaggggcacccagccttggtctgccagccacccgcagac\n", "aaggccacccagccttggtctgccagccacccgcagaccagccgggcgcccgcattccccatcgcagccacggccgccaccagcgctgctccgtt\n", "aggggcacccagccttggtctgccagccacccgcagaccagccgggcgcccgcatcccccatcgcagccacggccaccaccagcgctgct\n", "gggcacccagccttggtctgccagccacccgcagaccagccgg\n", "gcacccagccttggtctgccagccacccgcagaccagcca\n", "cacccagccttggtctgccagccacccgcagaccagccgggcgcctgcatcccccatcgcagccacggccaccaccagcgctgctccg\n", "acccagccttggtctgccagccacccgcagaccag\n", "cccagccttggtctgccagccacccgcagaccagccgggcgcccgcatcccccat\n", "ccagccttggtctgccagccacccgcagaccagccgggcgcccgcatcccccatc\n", "cagccttggtctgccagccacccgcagaccagccgggcgcccgcatcccccatcgcagccacggccaccaccagcgctgctccgtatccccccaggccccggtctaaagcgtggggagccaagtgcacgtaagg\n", "ccttggtctgccagccacccgcagaccagccgggcgcccgcatcccccatc\n", "tctgccagccacccgcagaccagccgggcgcccgcatcccccatc\n", "tctgccagccacccgcagaccagccgggcgcccgcatcccccatcgca\n", "tctgccagccacccgcagaccagccgggcgcccgcatcctccatcgcagccacggccaccaccagcgctgctccgtatccccccaggccccggtctaaagcatggggagccaagtgcagg\n", "ctgccagccacccgcagaccagccgggcgcccgcatc\n", "accagccacccgcagaccagccgggcgcccgcatcccccatcgcagccacggccaccaccagcgctgct\n", "caccctcagaccacccgggcgcccgcatcccccatcgcagccacggccat\n", "acccgcagaccagccgggcgcccgcatcccccatcgcagccacggccaccaccagcgct\n", "ccgcagaccagccgggcgcccgcatcccccatcgcagccacgg\n", "cgcagaccagccgggcgcccgcatcccccatcgcagccac\n", "agaccagccgggcacccgcatcccccatcgcagccacggcca\n", "gaccagccgggcgcccgcatcccccatcgcagccacggccaccaccagcgctgctccgtatccccccaggccccggtctaaagcgtggggagccaa\n", "accagccgggcgcccgcatcccccatcgcagccacggccaccaccag\n", "accagccgggcgcccgcatcccccatcgcagccacggccaccaccagcgctgctccgtatccccccaggccccggtctaaagcgtggggagccaa\n", "cagccgggcgcccgcatcccccatcgcagccacggccaccacca\n", 
"ccgggcgcccgcatcccccatcgcagccacggccaccaccagcgctgctccgtat\n", "ccgggcgcccgcatcccccatcgcagccacggccaccaccagcgct\n", "ccgggcgcccgcatcccccatcgcagccacggccaccaccagcgctgct\n", "gcgcccgcatcccccatcgcagccacggccaccaccagcgctgctccgtatccccccaggc\n", "gcggccgcctcccccatcacagcgacggccagcaccagcgctgctccgtatcaccccaggccccggtctaaagcgtggggagccaagtgcacgta\n", "tcgcatcccccatcgcagccacggccaccaccagcgctgctccgtatccccccaggccccggtctaaagcgtggggagccaagtgcacgtaaggaacgaagtacccgccccca\n", "cgcatcccccatcgcagccacggccaccaccagcgctgctccgtatccccccaggccccggtctaaagcgtggggagct\n", "tcccccatcgcagccacggccaccaccagcgctgctccgtat\n", "cccatcgcagccacggccaccaccagcgctgctccgtatccccccaggccccggtctaaagcgtggggagccaagtgcacgtaaggaacgaagtacccgcccccaaccagggctgtgc\n", "ccatcgcagccacggccaccaccagcgctgctacgtatccccccaggccccggtctaaagcgtgg\n", "ccatcgcagccaaggccaccaccagcgctgctccgtatccccccaggccccggtctaaagcgtggggagccaagtgcacgtaaggaacgaagtacccgcccccaaccagggctgtgcc\n", "atcgcagccacggccaccaccagcgctgctccgtatccccccaggc\n", "cagccacggccaccaccagcgctgctccgtatccccccaggccccgg\n", "acggccaccaccagcgctgctccgtatccccccaggccccggtctaaatcgtggggagccaagtgcacgtaaggaacgaagtacccgcccccaaccagggctgtgcctagagcaaagatt\n", "gccaccaccagcgctgctccgtatccccccaggccccggtctaaagcgtggggagcca\n", "gccaccaccagcgctgctccgtatccccccaggccccggtctaaagcgtgggga\n", "ctgctccgtatccccccaggccccggtctaaagcgtggggagccaagtgcacgtaaggaacgaagtacccgcccccaaccagggct\n", "gctccgtatccccccaggccccggtctaaagcgtggggagccaagtgc\n", "actccgtatccccccaggccccggtctaaagcgtggggagccaagtgcacgtaaggaacgaagtacccg\n", "ctccgtatccccccagaccccggtctaaagcgtggggagccaagtgcacgtaaggaacgaagtacccgc\n", "ctccgtatccccccaggccccggtctaaagcgtggggagccaagtgcacgtaaggaacgaagtacccgcccccaa\n", "ctccgtatccccccaggccccggtctaaagcgtggggagccaagtgcacgtaaggaacgaagtacccgcccccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccgagggcagctaggggacta\n", "tccgtatccccccaggccccggtctaaagcgtggggagcca\n", "ccgtatccccccaggccccggtctaaagcgtggggagccaagtgcacgtaaggaacgaagtacccgcccccaaccagggctgtgcctagagcaaa\n", "ccgtatccccccaggccccggtctaaagcgtgggga\n", 
"cgtatccccccaggccccggtctaaagcgtggggagccaagtgcacgtaaggaacgaagta\n", "tatccccccaggccccggtctaaagcgtggggagccaagtgcacgta\n", "cccccaggccccggtctaaagcgtggggagccaagtgcacgtaaggaacgaag\n", "ccccggtctaaagcgtggggagccaagtgcacgtaaggaacgaagtacccgcc\n", "cccggtctaaagcgtggggagccaagtgcacgtaaggaacgaagtacccgcc\n", "agtataaagcgtggggagccaagtgcacgtaaggaacgaagtacccgcccccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacaga\n", "gtctaaagcgtggggagccaagtgcacataaggaac\n", "ctaaagcgtggggagccaagtgcacgtaaggaacgaagtacccgcccccaaccagggctgtgcctag\n", "taaagcgtggggagccaagtgcacgtaaggaacgaagt\n", "aaagcgtggggagccaagtgcacgtaaggaacgaagtacccgcccccaaccaggg\n", "aagcgtggggagccaagtgcacgtaaggaacgaagtacccgcccccaa\n", "tggggagccaagtgcacgtaaggaacgaagtacccgcccccaaccagggctgtgccta\n", "tggggagccaagtgcacgtaaggaacgaagtacccgcccccaaccagggctgtg\n", "tggggagccaagtgcacgtaaggaacgaagtacccgcccccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagact\n", "gagccaagtgcacgtaaggaacgaagtacccgcccccaaccagggctgtgcctagagcaaagattgagaa\n", "caagtgcacgtaaggaacgaagtacccgcccccaaccagggctg\n", "aagtgcacgtaaggaacgaagtacccgcccccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccgagggaagctaggggactacg\n", "tgcacgtaaggaacgaagtacccgcccccaaccagggctgtgcctagagcaaa\n", "tgcacgtaaggaacgaagtacccgcccccaaccagggcta\n", "acgtaaggaacgaagtacccgcccccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggacgag\n", "cgtaaggaacgaagtacccgcccccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccgagggcagct\n", "cgtaaggaacgaagtacccgcccccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccgagggcagct\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "ataaggaacgaagtacccgcccccaaccagggctgtgccta\n", "ataaggaacgaagtacccgcccccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccgagggcagctagg\n", "gtaaggaacgaagtacccgcccccaaccagggctgtgcctagagcaaagatt\n", "taaggaacgaagtacccgcccccaaccagggctgtgccta\n", "aggaacgaagtatccgcccccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccgaggg\n", 
"ggaacgaagtacccgcccccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtga\n", "acgaagtacccgcccccaaccagggctgtgcctagagcaaagattgagaaggcccggcgt\n", "gtacccgcccccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaaca\n", "tacccgcccccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcag\n", "tacccgcccccaaccagggctgtgcctagagcaaagattg\n", "tccgcccccaaccagggctgtgtctagagcaaagattgaga\n", "cccgcccccaaccagggctgtgcctagagcaaagattgagaaggt\n", "ccgcccccaaccagggctgtgcctagagcaaagattg\n", "cgcccccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccgagggcagcta\n", "gcccccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccgagggcagctaggggactacgcggtggg\n", "acccccaaccagggctgtgcctagagcaaagattgagaaggc\n", "cccccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccga\n", "ccccaaccagggctgtgcctagagcaaagattgagaaggcccgg\n", "ccccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacaga\n", "cccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccgaggg\n", "ccaaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccgaggg\n", "caaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacag\n", "aaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcag\n", "aaccagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactc\n", "accagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcagg\n", "cagggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagact\n", "agggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccgagggcagctaggggactacgcggtggggctggggggtc\n", "agggctgtgcctagagcaaggattgagaaggcacggcgtgtgaacagactcgggccgagggcagctagggtactacgcggtggggctggggggtc\n", "agggctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccgagggcagctaggggactac\n", "ctgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccgagggcagctaggggactacgcggtggggctg\n", "tgtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccgagggcagctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtagcag\n", "gtgcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccga\n", "gcctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccgagggcagctaggggactacgcggtggggctgg\n", 
"ctagagcaaagattgagaaggcccggcgtgtgaacagactcaggccgaggg\n", "gcaaagattgggaaggcccggcgtgtgaacagactcaggccgagggcagctaggggactacgcggtgggg\n", "gcaaagattgagaaggcccggcgtgtgaacagactcaggccgagggcagctaggggactacgcggtggggct\n", "aaagattgagaaggcccggcgtgtgaacagactcaggccgagggcagctaggggactacgcggtggggctgg\n", "aagattgagaaggcccggcgtgtgaacagactcaggccgagggcagctagggg\n", "aagattgagaaggcccggcgtgtgaacagactcaggccgagggcagc\n", "agattgacaaggcccggcgtgtgaacagactcaggccgagggcagctaggggactacgcggtgg\n", "agaaggcccggcgtgtgaacagactcaggccgagggcagctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtagcagcag\n", "agaaggcccggcgtgtgaacagactcaggccgagggcagc\n", "agaaggcccggcgtgtgaacagactcaggccgagggcagctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtagcagcagggcgcca\n", "gcccggcgtgtgaacagactcaggccgagggcagctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtagcagcagggcgccaca\n", "cccggcgtgtgaacagactcaggccgagggcagctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtagcagcagggcgccacaggg\n", "agcgtgtgaacagactcaggccgagggcagctaggggactacgcggtggggctggggggtctccaggaagga\n", "gcgtgtgaacagactcaggccgagggcagctaggggactacgcggtgg\n", "gtgtgaacagactcaggccgagggcagctaggggactacgcggtggggctggggggtctccaggaa\n", "tgaacagactcaggccgagggcagctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtagca\n", "aacagactcaggccgagggcagctaggggactacgcggtggggctggggggtct\n", "aacagactcaggccgagggcagctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtagc\n", "acagactcaggccgagggcagctaggggactacgcggtggggctggggggtctcca\n", "cagactcaggccgagggcagctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtagcagcagggcgccacagggggtgaggtgga\n", "agactcaggccgagggcagctaggggactacgcggtggggctggggggtctccag\n", "gactcaggccgagggcagctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtagcagcagggcgccacagggggtgaggtggagg\n", "actcaggccgagggcagctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtagcagcagggcgccacagcgggtgaggt\n", "tcaggccgagggcagctaggggactacgcggtggggctggggggtctccaggaaggac\n", "ggccgagggcagctaggggactacgcggtggggctggggggtctccaggaaggac\n", 
"ccgagggcagctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtagcagcagggcgccacagggggtgaggtggagggtgatcgcgccgagga\n", "cgagggcagctaggggactacgcggtggggctggggggtctccaggaaggac\n", "cgagggcatctaggggactacgcggtggggctggggggtctc\n", "gagggcagctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtagt\n", "gagggcagctaggggactacgcggtggggctggcgggtctccaggaa\n", "gagggcagctaggggactacgcggtggggctggggggtctccaggaagga\n", "agggcagctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtagcagcagggcgccacagggggtgaggtggagggtgat\n", "gcagctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtagcagcag\n", "gcagctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtagcagca\n", "cagctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtaa\n", "agctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtagcagcagggcgccacagggggtgagg\n", "agctaggggactacgcggtggggctggggggtctccaggaaggaccaggggtag\n", "ctaggggactacgcggtggggctggggggtctccag\n", "taggggactacgcggtggggctggggggtctccaggaaggaccaggggta\n", "ggggactacgcggtggggctggggggtctccaggaaggaccag\n", "ggactacgcggtggggctggggggtctccaggaaggaccaggggtagcagcagggcgccacagggggtg\n", "gactacgcggtggggctggggggtctccaggaaggaccaggggtagcagcagggcgccacagggggtgaggtggagggtgatcgcgccgaggaggagcagagcgacccgccagccgaaag\n", "actacgcggaggggctggggggtctccaggaaggaccagg\n", "actacgcggtggggctggggggtctccaggaaggaccaggggt\n", "acgcggtggggctggggggtctccaggaaggaccaggggtagca\n", "gtggggctggggggtctccaggaaggaccaggggtagc\n", "ggctggggggtctccaggaaggaccaggggtagcagcagggcgccacagggggtgaggtggagggtgatcgcgccgaggaggagcagagcgccccgccagccgaaagtatcgaggagaagctgcaaggcgggcgccagga\n", "ggctggggggtctccaggaaggaccaggggtagcagcagggcgccacagggggtgaggtggagg\n", "actggggggtctccaggaaggaccaggggtagcagcagggcgccacagggggtgaggtggagggtgatcgcgccgaggaggagcagagcgccccgccagccgaaagtatcgagg\n", "gtctccaggaaggaccaggggtagcagcagggcgccacagggggtgag\n", "tctccaggaaggaccaggggtagcagcagggcgccacagggggtgag\n", "tctccaggaaggaccaggggtagcagcagggcgtcacagggggtgaggtggagggtgatcgcgccgaggagg\n", "tccaggaaggaccaggggtagcagcagggcgccacagggggtgaggtggagggtgatcgcgccgaggagga\n", 
"tcaggaaggaccaggggtagcagcagggcgccacagggggtgag\n", "aggaaggaccaggggtagcagcagggcgccacagggggtgaggtggagggtgatcgcgcc\n", "ggaaggaccagggatagcagcagggcgccacagggggtgaggtggagggtgatcgcgccgaggaggagcagagcgccccgc\n", "accaggggtagcagcagggcgccacagggggtgaggtggagggtgatcgcgccgaggaggagcagagcac\n", "ccaggggtagcagcagggcgccacagggggtgatgtggagggtgat\n", "tagcagcagggcgccacagggggtgaggtggagggtgatcgcgccgaggaggagcagagcg\n", "tagcagcagggcgccacagggggtgaggtggagggtgatcgcgccgagg\n", "agcagcagggcgccacagggggtgaggtggagggtgatcgcgccgaggaggag\n", "cagggcgccacagggggtgaggtggagggtgatcgcgccga\n", "gcgccacagggggtgaggtggagggtgatctcgccgaggaggagcagagcgccccgccagccgaaagtatcgaggagaagctgcaaggcgggcgccaggagcagcgaggaggccccgttgccggtgagcgccagccccaccgccaagactcgat\n", "acgccacagggggtgaggtggagggtgatcgcgccgaggaggagcagagcgccccgccagccgaaagt\n", "cagggggtgaggtggagggtgatcgcgccgaggaggagcagagcgccccgccagccgaaagtatcgaggagaagctgcaaggcgggcgccaggagcagcgaggaggccccgttgccggtgagcgccagccccN\n", "ggggtgaggtggagggtgatcgcgccgaggaggagcagagcgccccgccagccgaaagtatcgaggagaagctgcaag\n", "ggtgaggtggagggtgatcgcgccgaggaggagcagagcgccccgccagccgaaagtatcgaggagaag\n", "ggtgaggtggagggtgatcgcgccgaggaggagcagagcgccccgcca\n", "gtNaggtggagggtgatcgcgccgaggaggagcagagcgccccgccagccgaaagtatcgaggagaagctgcaaggcgggcgccaggagcagcgagga\n", "tgaggtggagggtgatcgcgccgaggaggagcagagcgccccgcca\n", "tggagggtgatcgcgccgaggaggagcagagcgccccgccagccgaaagtatcgaggagaagctgcaag\n", "aaagggtgatcgcgccgaggaggagcagagcgccccgccagccgaaagtatcgaggagaagctgcaaggcgggcgccaggagcagcgagga\n", "ggtgatcgcgccgaggaggagcagagcgccccgccagccgaaagtatcga\n", "atcgcgccgaggaggagcagagcgccccgccagccgaaagtatcgaggagaagctg\n", "tcgcgccgaggaggagcagagcgccccgccagccgaaagtatc\n", "cgccgaggaggagcagagcgccccgccagccgaaagtatcgaggagaagctgcaaggcgggcgcca\n", "aggaggagcagagcgccccgccagccgaaagtatcgaggagaagctgcaag\n", "aggaacagggcgccccgccagccgaaagtatcgaggagaagctgcaaggcgggcgccaggagcagcgaggaggccccgttgccggtgagcgccag\n", "agcagagcgccccgccagccgaaagtatcgaggagaagctgcaaggcggg\n", "agagcgccccgccagccgaaagtatcgaggagaagctgcaa\n", 
"agcgccccgccagccgaaagtatcgaggagaagctgcaaggcgggcgccaggagcagcgaggaggccccgttgccggt\n", "ccccgccagccgaaagtatcgaggagaagctgcaaggcgggcgccaggagcagt\n", "ccgaaagtatcgaggagaagctgcaaggcgggcgccaggagcagcgaggaggccccgttgcc\n", "cgaaagtatcgaggagaagctgcaaggcgggcgccaggagcagcgaggaggcccc\n", "aaagtatcgaggagaagctgcaaggcgggcgccaggagcagcga\n", "agtatcgaggagaagctgcaaggcgggcgccaggagcagcgaggagtccccgttgccggtg\n", "tatcgaggagaagctgcaaggcgggcgccaggagcagcgaggaggccccgt\n", "atcgaggagaagctgcaaggcgggcgccaggagcagcgaggaggccccg\n", "gaggagaagctgcaaggcgggcgccaggagcagcgaggaggccccgttgccggtgagcgccagccccac\n", "agaagctgcaaggcgggcgccaggagcagcgaggaggccccgtt\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "agaagctgcaaggcgggcgccaggagcagcgaggaggccccgttgccggtgagcgccagccccaccgccaagactcgacggcgggagaagtaacgcgagaggg\n", "gctgcaaggcgggcgccaggagcagcgaggaggccccgttgccggtgagcgcca\n", "tgcaaggcgggcgccaggagcagcgaggaggccccgttgccggtgagcgccagccccaccgccaagactcgacggcgggagaagtaacgcgagagggtgcctagggcgggggcgaacaccagg\n", "gcaaggcgggcgccaggagcagcgaggaggccccgttgccggtgagcgccagccccaccgcc\n", "aaggcgggcgccaggagcagcgaggaggccccgttgccggtgagcgcca\n", "gggcgccgggagcagNgaggaggcccNNttgccggtgagcgccagccccaccgccaagactcgacggcgggagaagtaacgcgagagggtgcctagggcgg\n", "gcgccaggagcagcgaggaggccccgttgccggtgagcgccagccccaccgccaagactcgacggcggg\n", "tcaggagcagcgaggaggccccgttgccggtgagcgccagccccaccgccaagactcgacggcgggagaagtaacgcgagagggtgccta\n", "aggagcagcgaggaggccccgttgccggtgagcgccagccccac\n", "aggagcagcgaggaggccccgttgccggtgagcgccagccccaccgccaagactcgacggcgggagaagtaacgcgaaagggtgcctagggcgggggcgaac\n", "gagcagcgaggaggccccgttgccggtgagcgccagccccaccgccaagactcgacggcgggagaag\n", "cagcgaggaggccccgttgccggtgagcgccagccccaccgccaagactcgac\n", "cgaggaggccccgttgccggtgagcgccagccccaccgccaagactcgacggcgggagaagtaacgcgagagggtgcctagggcgggggcgaacaccaggg\n", "gaggaggccccgttgccggtgagcgccagccccaccgccaagact\n", "aggaggccccgttgccggtgagcgccagccccaccgcca\n", "ggccccgttgccggtgagcgccagccccaccgccaagactcgacggcggga\n", 
"ggccccgttgccggtgagcgccagccccaccgccaagactcgacggcgggagaagtaacgcgagag\n", "ccgttgccggtgagcgccagccccaccgccaagactcgacggcggg\n", "ggtgagcgccagccccaccgccaagactcgacggcgggagaagtaacgcgagagggtgccta\n", "gtgagcgccagccccaccgccaagactcgacggcgggagaagtaacgcgagagggtgc\n", "tgagcgccagccccaccgccaagactcgacggcgggagaagtaacgcgaga\n", "gccagccccaccgccaagactcgacggcgggagaagtaacgcgagagggtgcctagggcgggggcgaat\n", "ccaccgccaagactcgacggcgggagaagtaacgcgagagggtgcctagggcgg\n", "ccaagactcgacggcgggagaagtaacgcgagagggtgcctagggc\n", "ccaagactcgacggcgggagaagtaacgcgagagggtgcctagggcgggggcga\n", "caagactcgacggcgggagaagtaacgcgagagggtgcctagggcgggg\n", "aagactcgacggcgggagaagtaacgcgagagggtgcctaggg\n", "agactcgacggcgggagaggtaacgcgagagggtgcctagggcgggggcgaacacca\n", "gacggcgggagaagtaacgcgagagggtgcctagggcgggggcgaacaccagggcccaaccaa\n", "aacggcgggagaagtaacgcgagagggtgcctagggcg\n", "ggcgggagaagtaacgcgagagggtgcctagggcgaggg\n", "gaagtaacgcgagagggtgcctagggcgggggcgaacaccagggcccaac\n", "aagtaacgcgagagggtgcctagggcgggggcgaacacc\n", "aacgcgagagggtgcctagggcgggggcgaacaccagggcccaaccaaagcctgcgaatgaataggaggggatgggggccggcactgg\n", "gcgagagggtgcctagggcgggggcgaacaccagggcccaaccaaagcctgcgaatgaataggaggggatggggg\n", "gagggtgcctagggcgggggcgaacaccagggcccaaccaaagcctgcgaatgaataggaggggatgggggccggcactggggacgccgccccagcattcc\n", "gagggtgcctagggcaggtgcgaacaccagggcccaaccaaagcctgcgaatgaataggaggggatgggggccggcaatgaggccgccgccccagcattcc\n", "gagggtgcctagggcgggggcgaacaccagggcccaaccaaagcctgcgaatgaataggaggggatgggggccggcactg\n", "gtgcctagggcgggggcgaacaccagggcccaaccaaagcctgcgtatgaataggaggggat\n", "tgcctagggcgggggcgaacaccagggcccaaccaaagcctgcgaatgaata\n", "tgcctagggcgggggcgaacaccagggcccaaccaaagcctgcgaatgaataggagg\n", "gcctagggcgggggcgaacaccagggcccaaccaaagcctgcgaatgaataggaggggatgggggccggcactggggacgcccgccccagcattccca\n", "cctagggcgggggcgaacaccagggcccaaccaaagcctgcgaatgaata\n", "ggggcgaacaccagggcccaaccaaagcctgcgaatgaataggaggggatgggg\n", "ggcgaacaccagggcccaaccaaagcctgcgaatgaataggagggg\n", "ggcgaacaccagggcccaaccaaagcctgcgaatgaatagga\n", 
"cgaacaccagggcccaaccaaagcctgcgaatgaataggaggg\n", "cgaacaccagggcccaaccaaagcctgcgaatgaataggagggga\n", "cgaacaccagggcccaaccaaagcctgcgaatgaat\n", "aacaccagggcccaaccaaagcctgcgaatgaataggaggggatgggggcc\n", "aacaccagcgcccaaccaaagcctgcaaatgaataggaggggatgg\n", "acaccagggcccaaccaaagcctgcgaatgaataggagg\n", "accagggcccaaccaaagcctgcgaatgaataggaggggatgggggccggcactggggacgcccgccccagcattcccagcccggctctccgcaccag\n", "ccaaccaaagcctgcgaatgaataggaggggatgggggccggcactggggacgcccgccccagcattcccagcccggctctccgcaccaggcccccg\n", "caaccaaagcctgcgaatgaataggaggggatgggggccggca\n", "aaccaaagcctgcgaatgaataggaggggatgggggccggcactggggacgcccgcccca\n", "aaccaaagcctgcgaatgaataggaggggatgggggccggcactggggacgcccgccccagcatt\n", "aaagcctgcgaatgaataggaggggatgggggccggcactggggacgcccgcc\n", "cctgcgaatgaataggaggggatgggggccggcactggggacgcccgccccagca\n", "ctgcgaatgaataggaggggatgggggccggcactggggacgcccgccccagcattcccagcccggctctccgcaccaggcccccgcctcgttcgctaccccagat\n", "gcgaatgaataggaggggatgggggccggcactggggacgcccgccccagcattcccagcccggctctccgcaccaggcccccgcctcgttcgct\n", "aataggaggggatgggggccggcactggggacgcccgccccagcattccc\n", "aggggatgggggccggcactggggacgcccgccccagcat\n", "gggatgggggccggcactgtggacgcccgccccagcattcccagcccggctctccgcaccaggcccccgcctc\n", "gggatgggggccggcactggggacgcccgccccagcatt\n", "ggatgggggccggcactggggacgcccgccccagcattcccagcccggctctccgca\n", "aatgggggccggcactggggacgcccgccccagcattcccagccc\n", "gccggcactggggacgcccgccccagcattcccagcccggctctccgt\n", "gccggcactggggacgcccgccccagcattcccagcccggct\n", "ccggcactggggacgcccgccccagcattcccagcccggctctccgt\n", "ccggcactggggacgcccgccccagcattcccagcccggctctccgcaccaggcccccgcctcgttcgctaccccagatcccaacaagctcctgtcacctc\n", "tggcactggggacgcccgccccagcattcccagcccggctctccgcaccaggcccccgcctcgttcgcta\n", "cggcactggggacgcccgccccagcattcccagcccggctctc\n", "actggggacgcccgccccagcattcccagcccggctctccgcaccaggcccccgcctcgttcgctaccccagatcccaacaagctcctgtcacctccttcaccctgaatgacccgggcatcccacttccctca\n", "actggggacgcccgccccagcattcccagcccggctctccgcaccaggcccccgcctcgttcgctaccccagatccaaacaag\n", 
"gggacgcccgccccagcattcccagcccggctctccgcaccag\n", "agacgcccgccccagcattcccagcccggctctccgcaccaggcccccgcctcgttcgctaccccagatcccaacaagctcct\n", "gacgcccgccccagcattcccagcccggctctccgcaccaggcccccgcctcgttcgctaccccagatcccaacaagctcc\n", "acgcccgccccagcattcccagcccggctctccgcaccaggcccccgcctcgttcgctaccccaga\n", "cccgccccagcattcccagcccggctctccgcactaggcccccgcctcgttcgcta\n", "ccgccccagcattcccagcccgcctctccgcaccaggcccccgcctcgttcgctac\n", "agcattcccagcccggctctccgcaccaggcccccgcctcgttcgctaccccagatcccaacaagctcctgta\n", "attcccagcccggctctccgcaccaggcccccgcctcgt\n", "attcccagcccggcNctccgcaccaggcccccgcctcgttcg\n", "attcccagcccggctctccgcaccaggcccccgcctcgttcgctaccccagatcccaacaagctcctgtcacctccttcaccctgaat\n", "ttcccagcccggctctccgcaccaggcccccgcctcgttcgct\n", "agcccggctctccgcaccaggcccccgcctcgttcgctaccccagatcccaacaagctcatgtcacc\n", "ctctccgcaccaggcccccgcctcgttcgctaccccagatcccaac\n", "ctctccgcaccaggcccccgcctcgttcgctaccccagatcccaacaagctcctgtcacctccttcaccct\n", "ctctccgcaccaggcccccgcctcgttcgctaccccagatcccaacaagctcctgtcac\n", "accaggcccccgcctcgttcgctaccccagatcccaacaagctcctgtcacctccttcacc\n", "accaggcccccgcctcgttcgctaccccagatcccaacaag\n", "caggcccccgcctcgttcgctaccccagatcccaacaagctcctgtca\n", "ggcccccgcctcgttcgctaccccagatcccaacaagctcct\n", "tcccgcctcgttcgctaccccagatcccaacaagctcctgtcacct\n", "cccgcctcgttcgctaccccagatcccaacaagctcctgtca\n", "ccgcctcgttcgctaccccagatcccaacaagctcctgtcacctccttcaccctgaatgacccgggcat\n", "cacctcgttcgctaccccagatcccaacaagctcctgtcacctccttcaccctgaatgacc\n", "gcctcgttcgctaccccagatcccaacaagctcctgtcacctccttca\n", "cctcgttcgctaccccagatcccaacaagctcctgtcacctccttcaccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccaggccga\n", "cctcgttcgctaccccagatcccaacaagctcctgtcacctcctt\n", "tcgttcgctaccccagatcccaacaagctcctgtcacctccttcaccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccaggccgaggtagagatgcagcNgaccgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgcc\n", "taccccagatcccaacaagctcctgtcacctccttcaccctgaat\n", "taccccagatcccaacaagctcctgtcacctccttcaccctg\n", "taccccagatcccaacaagctcctgtcacctccttcaccctga\n", 
"ccagatcccaacaagctcctgtcacctccttcaccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccaggccgaggta\n", "cagatcccaacaagctcctgtcacctccttcaccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccagg\n", "agatcccaacaagctcctgtcacctccttcaccctgaat\n", "ccaacaagctcctgtcacctccttcaccctgaatgacccgggcatcccacttccctcaccagcgagg\n", "aacaagctcctgtcacctccttcaccctgaatgacccgggcat\n", "acaagctcctgtcacctccttcaccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccaggccgaggtagagatgcagcagaccgctgg\n", "caagctcctgtcacctccttcaccctgaatgacccgggcatcccacttccct\n", "aagctgctgtcacctccttcacactgaatgacccgggcatcccacttccctca\n", "ctcctgtcacctccttcaccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccaggccgaggtagaga\n", "tcctgtcacctccttcaccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccaggcc\n", "ctgtcacctccttcaccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccaggccgag\n", "ctgtcacctccttcaccctgaatgacccgggcatcccacttccctcaccagcgaggagg\n", "tgtcacctccttcaccctgaatgacccgggcatcccacttccctcac\n", "tcacctccttcaccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccaggccgaggtagagatgcagcaga\n", "tcacctccttcaccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccaggccgaggtagagatgcagcagaccg\n", "acctccttcaccctgaatgacccgggcatcccacttcc\n", "ctccttcaccctgaatgacccgggcatcccacttccctcaccagcgag\n", "ctccttcaccctgaatgacccgggcatcccacttcc\n", "tccttcaccctgaatgacccgggcatcccacttccctcaccagcgag\n", "tccttcaccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccaggccgaggtagagatgcagcagaccgctggcgaaagccgagaagacgaag\n", "ccttcaccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccaggccgaggtagagatgcagcagacca\n", "cttcaccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccag\n", "ttcaccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccaggc\n", "tcaccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccaggccgag\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "ccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccaggccgaggtagagatgcagcagaccgtt\n", "ccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccaggccgaggtagaga\n", "ctgaatgacccgggcatcccacttccctcaccagcgaggagg\n", "cccgggcatcccacttccctcaccagcgaggaggcccaggccgaggtag\n", 
"cgggcatcccacttccctcaccagcgaggaggcccaggccgaggtagagatgcagcagaccgctggcgaaagccgagaagacgaa\n", "catcccacttccctcaccagcgaggaggcccaggccgaggtagagatgcagcagaccgctg\n", "atcccacttccctcaccagcgaggaggcccaggccgaggtagaga\n", "atcccacttccctcaccagcgaggaggcccaggccgaggtagagatg\n", "tcccacttccctcaccagcgaggaggcccaggccgaggtag\n", "ccacttccctcaccagcgaggaggcccaggccgaggtagagatgcagcagaccgctggcgaaagccgagaagacgaagcccagc\n", "tttccctcaccagcgaggaggcccaggccgaggtagagatgcagcagaccgctggcgaa\n", "tccctcaccagcgaggaggcccaggccgaggtagagatgcagcagaccgctggcgaaagccgagaagacgaagcccagcgaggcgaggatg\n", "tcaccagcgaggaggcccaggccgaggtagagatgcagcagaccgctagcgaaagc\n", "accagcgaggaggcccaggccgaggtagagatgcagcagaccgctggcgaaagccgagaagacgaagcccagcgaggcga\n", "accagcgaggaggcccaggccgaggtagagatgcagcagaccgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgcccccaaccatcacca\n", "cagcgaggaggcccaggccgaggtagagatgcagcagaccgctggc\n", "aggcccaggccgaggtagagatgcagcagaccgctggcgaaagccgagaagacgaagcc\n", "aggcccaggccgaggtagagatgcagcagaccgctggcgaaagccgagaagacgaagcccagcga\n", "aggcccaggccgaggtagagatgcagcagaccgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgcccccaaccatcaccacggggcgggccccccagcgcgtgctcagggcgctgcccacggggcctgaaagggg\n", "gcccaggccgaggtagagatgcagcagaccgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgcccccaacca\n", "aggccgaggtagagatgcagcagaccgctggcgaaagccgagaagac\n", "gaggtagagatgcagcagaccgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgcccccaaccatca\n", "gaggtagagatgcagcagaccgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgcccccaaccatcaccacggggcgggccccccagcgcgtgctcaggg\n", "aggtagagatgcagcagaccgctggcgaaagccgagaagacgaagcccagcgagg\n", "gtagagatgcagcagaccgctggcgaaagccgagaa\n", "tagagatgcagcagaccgctggcgaaagccagaagacgaagcccagcgaggcga\n", "tagagatgcagcagaccgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgcccccaaccatcacca\n", "Nagagatgcagcagaccgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgcccccaaccatcaccacggggcgggccccccagcgcgtgctcagggcgctgcccacggggcctgaaagggggcggagtcaacggaagaca\n", "agatgcagcagaccgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgccccc\n", 
"agatgcagcagacNgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgcccccaaccatcaccacggggcgggccccccagcgcgtgctcagggcgctgcccacggggcctgaaa\n", "agatgcagcagaccgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgcccccaa\n", "acagcagacagctggcgaaagccgagaagacgaagccaagcgaggcgag\n", "agcagacccctggcgaaagccgagaagacgaagcccagcgaggcgag\n", "aaaccgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgcccccaaccatcaccacggggcgggccccccagcgc\n", "gaccgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgcccccaaccatcaccacggggcgg\n", "cgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgccccca\n", "cgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgcccccaaccatcaccacggggc\n", "gctggcgaaagccgagaagacgaagcccagcgaggcgaggatg\n", "tggcgaaagccgagaagacgaagcccagcgaggcgaggatgcccccaaccatcaccacggggcgggccccccagcgcgtgct\n", "ggcgaaagccgagaagacgaagcccagcgaggcgaggatgcccccaaccat\n", "aaaagccaagaagacgaagcccagcgaggcgaggatgcccccaaccatcacca\n", "aaagccgagaagacgaagcccagcgaggcgaggatgcccccaact\n", "aaagccgagaagacgaagcccagcgaggcgaggatgcccccaaccatcacca\n", "aaagccgagaagacgaagcccagcgaggcgaggatgcccccaa\n", "agaagacgaagcccagcgaggcgaggatgcccccaaccatcaccacggggcgggccccccagcgcgtgctcagggcgc\n", "aaaagacgaagcccagcgaggcgaggatgcccccaaccatcaccacggggcgggccccccagcgcgtgctcagggc\n", "gaagacgaagcccagcgaggcgaggatgcccccaaccatcaccac\n", "Nagacgaagcccagcgaggcgaggatgcccccaaccatcaccacggggcgggccccccagcgcgtgctcagggcgctgcccacggggcctgaaagggggcggagtcaacggaaga\n", "agacgaagcccagcgaggcgaggatgcccccaaccatcaccacgg\n", "acgaagcccagcgaggcgaggatgcccccaaccatcaccacggggcgg\n", "acgaagcccagcgaggcgaggatgcccccaaccatcaccacggggcgggccccccagcgcgtgctcagggcgctgcccacgg\n", "ccagcgaggcgaggatgcccccaaccatcaccacggg\n", "gcgaggcgaggatgcccccaaccatcaccacggggcgggcccccca\n", "aggcgaggatgcccccaaccatcaccacggggcgggccccccatcgc\n", "aggcgaggatgcccccaaccatcaccacggggcggg\n", "aggcgaggatgcccccaaccatcaccacggggcgggccccccagcgcgtgctcagggc\n", "ggcgaggatgcccccaaccatcaccacggggcgggccccccagcgcgtgctcagggcgctgcccacggggcctgaaagggggcggagtcaacggaagacacgcccccgggcccccaaactctctccaaca\n", "gcgaggatgcccccaaccatcaccacggggcgggccccccagcgcgtgct\n", 
"gaggatgcccccaaccatcaccacggggcgggccccccagcgcgt\n", "aggatgcccccaaccatcaccacggggggggccccccagcgcgtgctcaggg\n", "aggatgcccccaaccatcaccacggggcgggccccccagcgcgtgctcagg\n", "ggatgcccccaaccatcaccacggggcgggccccccagcgcgtgctcagggcgctgcccacggggcctgaaagggggcggagtcaacggaagacacg\n", "ccccaaccatcaccacggggcgggccccacagcgcgtgctcag\n", "catcaccacggggcgggccccccagcgcgtgctcagggcgctgcccac\n", "atcaccacggggcgggccccccagcgcgtgctcagggcgctgcccacggggcctgaaagggggcggagtcaacggaagacacgc\n", "accacggggcgggccccccagcgcgtgctcagggcgctgcccacggggcctgaaagggggcggagtcaacggaagacacgcccccgggcccccaaactctctccaacacttctcattggctgtttgcctccc\n", "ccacggggcgggccccccagcgcgtgctcagggcgctgcccacggggcctga\n", "gggcgggccccccagcgcgtgctcagggcgctgcccacggggcctgaaa\n", "gcgggccccccagcgcgtgctcagggcgctgcccacggggcctgaaagggggcg\n", "cccccagcgcgtgctcagggcgctgcccacggggcctgaaagggggcggagtcaacggaagacacgcccccgggcccccaaactctctccaagac\n", "cccccagcgcgtgctcagggcgctgcccacggggcctgaaagggggcggagtcaacggaa\n", "cgcgtgctcagggcgctgcccacggggcctgaaagggggcggagtcaacggaagacacgcccccgggcccccaaactctctccaacacttctcattggctgtttgcctccctcgaactaatggttcttctccttgacc\n", "gcgtgctcagggtgctgcccacggggcctgaaagggggcggagtcaacggaagaca\n", "tgctcagggcgctgcccacggggcctgaaagggggcggagtcaacgg\n", "tcagggcgctgcccacggggcctgaaagggggcggagtcaacggaagacacgcccccgggcccccaaactctctcca\n", "gggcgctgcccacggggcctgaaagggggcggagtcaacggaaga\n", "gcgctgcccacggggcctgaaagggggcggagtcaacggaagacacgcccccgggcccccaaactctctccaacacttctcattggc\n", "ctgcccacggggcctgaaagggggcggagtcaacggaagacat\n", "ccatggggcctgaaagggggcggagtcaacggaagacacgcccccgggcccccaaactctctccaacacttctcattgg\n", "tggggcctgaaagggggcggagtcaacggaagacacgcccccgggcccccaaactctctccaacacttctcattggctgtttgcctccctcgaactaatggttcttctccttgacctcaagatgca\n", "ggcctgaaagggggcggagtcaacggaagacacgcccccgggcccccaaactctctc\n", "ctgaaagggggcggagtcaacggaaaatacgcccccgggcccccaaac\n", "tgaaagggggcggagtcaacggaagacacgcccccgggcccccaaactctctccaacacttctca\n", "gaaagggggcggagtcaacggaagacacgcccccgggcccccaaactctctccaacacttctcattggctgtt\n", 
"aaagggggcggagtcaacggaagacacgaccccgggcccccaaactctctccaac\n", "agggggcggagtcaacggaagacacgcccccgggcccccaaactctctccaacacttctcattggctgtttgcctc\n", "ggggcggagtcaacggaagacacgcccccgggcccccaaactctctccaacacttctcattggctgtttgcctccctcgaactaatggttcttctccttgacctcaa\n", "gcggagtcaacggaagacacgcccccgggcccccaaactctctccaacacttctcattggctgttt\n", "gagtcaacggaagacacgcccccgggcccccaaactctctt\n", "tcaacggaagacacgcccccgggcccccaaactctctccaacacttctcattggctgtttgctt\n", "tcaacggaagacacgcccccgggcccccaaactctctccaaca\n", "tcaacggaagacacgcccccgggcccccaaactctct\n", "aacggaagacacgcccccgggcccccaaactctctccaacacttctcattggctgtttgcctccctcgaactaatggttcttctc\n", "aaaagacacgcccccgggcccccaaactctctccaacacttctcattggctgtttgcctccctcgaactaatggtt\n", "aagacacgcccccgggcccccaaactctctccaacacttctcattggctgtttgcctccctcgaactaatggttcttctc\n", "aagacacgcccccgggcccccaaactctctccaacacttctcattggctgtttgcctccctcgaactaatggttcttctccttgacctcaagatgcactcttttctagagc\n", "agacacgcccccgggcccccaaactctctccaacacttctcatt\n", "agacacgcccccgggcccccaaactctctccaacacttctcattggctgtttgcctccctcgaactaatggt\n", "acgcccccgggcccccaaactctctccaacacttctcattggctgtttgcctccctcgaactaatggttcttc\n", "cgcccccgggcccccaaactctctccaacacttctcatt\n", "cccccgggcccccaaactctctccaacacttctcattggctgtttgcctc\n", "ccgggcccccaaactctctccaacacttctcattggctgtttgcctccctcgaactaatggttcttctccttgacct\n", "gcccccaaactctctccaacacttctcattggctgtttgcctccctcgaactaatggttcttct\n", "cccccaaactctctccaacacttctcattggctgtttgcctccctcgaact\n", "ccccaaactctctccaacacttctcattggctgtttgcctccctcgaactaatggttcttctccttgacctcaagatgcactcttttctaga\n", "cccaaactctctccaacacttctcattggctgtttgcctccctcaaactactggttcttctccttgacctcaagatgcactcttttctagagccggttgcc\n", "cccaaactctctccaacacttctcattggctgtttgcctccctcgcactaatggttcttctccttgacctcaagatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatcaggtgggtctcccatccctccactcacggctcctcct\n", "cccaaactctctccaacacttctcattggctgtttgcctccctcgaact\n", "cccaaactctctccaacacttctcattggctgtttgcctccctcgaact\n", "cccaaactctctccaacacttctcattggctgtttgcctccctcgaa\n", 
"aaactctctccaacacttctcattggctgtttgcctccctc\n", "tctctccaacacttctcattggctgtttgcctccctcgaactaatggttcttctccttgacctcaagatgcactcttttctagagccggttg\n", "caacacttctcattggctgtttgcctccctcgaactaatggttcttctc\n", "aacacttctcattggctgtttgcctccctcgaactaatggttcttctc\n", "acacttctcattggctgtttgcctccctcgaactaatggttcttctccttgacctcaagat\n", "acttctcattggctgtttgcctccctcgaactaatggttcttctccttgacctcaagatgcactcttt\n", "acttctcattggctgtttgcctccctcgaactaatggttcttctcctt\n", "acttctcattggctgtttgcctccctcgaactaatggttcttctccttgac\n", "cttctcattggctgtttgcctccctcgaactaatggttcttctccttgacctcaagatgcactcttttctaga\n", "ttctcattggctgtttgcctccctcgaactaatggttcttctccttgacct\n", "ttctcattggctgtttgcctccctcgaactaatggttcttctccttgacctcaagatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatcaggt\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "tctcattggctgtttgcctccctcgaactaatggttcttctcctt\n", "tcattggctgtttgcctccctcgaactaatggttcttctccttgac\n", "gctgtttgcctccctcgaactaatggttcttctcct\n", "ctgtttgcctccctcgaactaatggttcttctccttgacctcaaga\n", "cgtttgcctccctcgaactaatggttcttctccttgacctcaagatgcactcttttc\n", "ttgcctccctcgaactaatggttcttctccttgacctcaagatgcactctttt\n", "cctccctcgaactaatggttcttctccttaacctcaagatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatcaggtgggtct\n", "tccctcgaactaatggttcttctccttgacctcacgatgcactcttttctagagccagttgccctttctcaggttgtc\n", "tccctcgaactaatggttcttctccttgacctcaagatgcactcttatctagagccggttgccctttctc\n", "ctcgaactaatggttcttctccttgacctcaagatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatcaggtg\n", "tcgaactaatggttcttctccttgacctcaagatgcactcttttctagagccggttgccctttctcaggttgtcgggt\n", "gaactaatggttcttctccttgacctcaagatgcactcttttctagagccggttgc\n", "aactaatggttcttctccttgacctcaagatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatca\n", "actaatggttcttctccttgacctcaagatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatcaggtg\n", "aatggttcttctccttgacctcaagatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatcaggtgggtctcccatccctcca\n", "aatggttcttctccttgacctcaagatgcactcttttctagagccg\n", 
"aatggttcttctccttgacctcaagatgcactcttttctagagccggttgccct\n", "atggttcttctccttgacctcaagatgcactcttttctagagccggttgccctttctcag\n", "tggttcttctccttgacctcaagatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatcaggtgggtctcccat\n", "gttcttctccttgacctcaagatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatcaggtgggtctcccatccctccactcacggctcctcct\n", "gttcttctccttgacctcaagatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatcaa\n", "ttcttctccttgacctcaagatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatcaggtgggtctcccatccctcca\n", "ttcttctccttgacctcaagatgcactcttttctagagccggttg\n", "tcttctccttgacctcaagatgcactcttttctagagccggttggcctttct\n", "tcttctccttgacctcaagatgcactcttttctagagccggttgccctttctcag\n", "tcttctccttgacctcaagatgcactcttttctagagccggttgccc\n", "ttctccttgacctcaagatgcactcttttctagagccggttgccctttctcaggttgtcgg\n", "cttgacctcaagatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatc\n", "ttgacctcaagatgcactcttttctagagccggttgccctttctcaggttg\n", "ttgacctcaagatgcactcttttctagagccggttgc\n", "acctcaagatgcactcttttctagagccggttgccctttctcaggttgt\n", "cctcaagatgcactcttttctagagccggttgccctttctca\n", "cctcaagatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatcaggtgggtctcccat\n", "ctcaagatgcactcttttctagagccggttgccctttctca\n", "ctcaagatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatcaggtgg\n", "aagatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatcaggtgggtctcccatccctccactcacggctcct\n", "aagatgcactcttttctagagccggttgccctttctca\n", "aagatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatcaggtgggtctccc\n", "agatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatca\n", "aatgcactcttttctagagccggttgccctttctcaggttgtcgggtaatca\n", "actcttttctagagccggttgccctttctcaggttgtcggctaatcaggtgggtctcccatccctccactcacggctcctcctccccgttcctgtctcccg\n", "actcttttctagagccggttgccctttctcaggttgtcgggtaatcaggtgggtct\n", "actcttttctagagccggttgccctttctcaggttgtcgggtaatcaggtgggtctccca\n", "ctcttttctagagccggttgccctttctcaggttgtcgggtaatca\n", "ctcttttctagagccggttgccctttctcaggttgtcgggtaatcaggtgggtctcccatccctccact\n", 
"tcttttctagagccggttgccctttctcaggttgtcgggtaatcaggt\n", "tcttttctagagccggttgccctttctcaggttgtcggg\n", "tcttttctagagccggttgccctttctcaggttgtcgggtaatcag\n", "cttttctagagccggttgccctttctcaggttgtcgggtaatcaggtgggtctcccatcc\n", "aaccggttgccctttctcaggttgtcgggtaatcaggtgggtctcccatccctccactcacggctcctcctccccgttcctgtctcccgcct\n", "aaccggttgccctttctcaggttgtcgggtaatcaggtgggtctcc\n", "gccggttgccctttctcaggttgtcgggtaatcaggtgggtctcccatccctcca\n", "gcaggttgccctttctcaggttgtcgggtaatcaggtgggtctcccatccctccac\n", "tctttgccctttctcaggttgtcgggtaatcaggtgggtctcccatccatccactcacggctcctcctccccgttcc\n", "ggttgccctttctcaggttgtcgggtaatcaggtgggtctcccatccctccactcac\n", "ttgccctttctcaggttgtcgggtaatcaggtgggtctcccatccctccactcacggctcctcctccccgttcctgtctcccgcctcagggcccccctcactg\n", "ttgccctttctcaggttgtcgggtaatcaggtgggtctcccatccctccactcacggctcctcct\n", "ttgccctttctcaggttgtcgggtaatcaggtgggtctcccatccctccactcacggctcctcctccccgt\n", "ttgccctttctcaggttgtcgggtaatcaggtgggtctcccatc\n", "ccctttctcaggttgtcgggtaatcaggtgggtctcccatccctccactcacggctcct\n", "cctttctcaggttgtcgggtaatcaggtgggtctcccatccctccactcacggctcctcct\n", "cctttctcaggttgtcgggtaatcaggtgggtctcccatccctccactcacggctcctcctccccgttcctgtc\n", "tttctcaggttgtcgggtaatcaggtgggtctgccatccctccactca\n", "gtaatcaggtgggtctcccatccctccactcacggctcctcctccccgttcctgtctcccgcctcagggcc\n", "taatcaggtgggtctcccatccctccactcacggctcctcctccccgttcctgtctcccgcctcagg\n", "aggtgggtctcccatccctccactcacggctcctcctccccgttcctgtctcccgcctcagggcccccctcactggctgcctgctgcacggccagggccagggcgctgatccacgcagtgtcctgggcgcttcggtcaaagtgctcggcaaggtc\n", "aggtgggtctcccatccctccactcacggctcctcctccccgttcctgtctcc\n", "gtctcccatccctccactcacggctcctcctccccgttcctgtctcccgcctcagggcccccctcactggctgcctgctgcacggccagggccagggcgct\n", "cccatccctccactcacggctcctcctccccgttcctgtctcccgcctcagggccccccctcactggctgcctgctgcacggccagggccagggcgctgatccacgcagtgtcct\n", "tcacggctcctcctccccgttcctgtctcccgcctcagggcccccctcact\n", "acggctcctcctccccgttcctgtctcccgcctcagggcccccctcactga\n", "tcctcctccccgttcctgtctcccgcctcagggcccccctcactggctgc\n", 
"tcctcctccccgttcctgtctcccgcctcagggcccccctcactggctgcctgctgcacggccaggg\n", "ttcctgtctcccgcctcagggcccccctcactggctgcctgctgcacggccagggccagg\n", "tgtctcccgcctcagggcccccctcactggctgcctg\n", "tgtctcccgcctcagggcccccctcactggctgcctgctgcacggccagggccagggcgctgatcc\n", "ctcccgcctcagggcccccctcactggctgcctgctgcacggccag\n", "cccgtctcagggcccccctcactggctgcctgctgcacggccagggccagggcgctgatccac\n", "ccgcctcagggcccccctcactggctgcctgctgcacggccagggccagggcgctgatccacgcagtgtcctgggcgcttcggtcaaagtgctcggcaaggtcagggaaggcaa\n", "ccgcctcagggcccccctcactggctgcctgctgcacggccagggcca\n", "ctcagggcccccctcactggctgcctgctgcacggccagggccagggcgct\n", "tcagggcccccctcactggctgcctgctgcacggccagggccagggcgc\n", "gcccccctcactggctgcctgctgcacggccagggccagggcgctgatccacgcagtgtcctgggcgct\n", "gcccccctcactggctgcctgctgcacggccagggccagggcgctgatccacgcagt\n", "ccccctcactggctgcctgctgcacggccagggccagggcgctgatccacgcagtgtcctgggcg\n", "ctcactggctgcctgctgcacggccagggccagggcgctgatccacgcagtgtcctgggcgcttcggtcaaagtgctcggcaaggtcagggaaggcaaggcccagcgagcgcagcagcccgtaggacagcccgtttatcgcgaaN\n", "tcactggctgcctgctgcacggccagggccagggcgctgatccacgcagtgtcctgggcgcttcggtcaaagtgctcggcaaggtcagggaa\n", "actggctgcctgctgcacggccagggccagggcgctgatccacgcagtgtcctgggc\n", "tggctgcctgctgcacggccagggccagggcgctgatccacgcagtgtcct\n", "gctgcacggccagggccagggcgctgatccacgcagtgtcctgggcgcttcggtca\n", "tgcacggccagggccagggcgctgatccacgcagtgtcctgggc\n", "tgcacggccagggccagggcgctgatccacgcagtgtcctgggc\n", "gcacggccagggccagggcgctgatccacgcagtgtcctgggcgcttcggtc\n", "acggccagggccagggcgctgatccacgcagtgtcctgggcgcttcggtcaaagtgctcggcaaggtcaggga\n", "acggccagggccagggcgctgatccacgcagtgtcctgg\n", "acggccagggccagggcgctgatccacgcagtgtcctggg\n", "ccagggccagggcgctgatccacgcagtgtcctgggcgcttc\n", "ccagggccagggcgctgatccacgcagtgtcctgggcgcttcggtcaaag\n", "ccagggccagggcgctgatccacgcagtgtcctgggcgcttcggtcaaagtgctcggcaaggtcagggaaggcaaggcccagcgagcgcagcagcccgtaggacagcccgttta\n", "cagggcaagggcgctgatccacgcagtgtcctgggcgcttcg\n", "gccagggcgctgatccacgcagtgtcctgggcgcttcggtcaaagt\n", 
"ccagggcgctgatccacgcagtgtcctgggcgcttcggtcaaagtgctcggcaa\n", "cacgcagtgtcctgggcgcttcggtcaaagtgctcggcaaggtcagggaaggcaaggcccagcgagcgcagca\n", "tcctgggcgcttcggtcaaagtgctcggcaaggtcagggaaggcaaggcccagt\n", "ttcggtcaaagtgctcggcaaggtcagggaaggcaaggcccagcgagcgcagcagcccgtNggacagcccgtttatcgcgaaggctgc\n", "ttcggtcaaagtgctcggcaaggtcagggaaggcaaggcccag\n", "aagtgctcggcaaggtcagggaaggcaaggcccagcgagcgcagcagcccgtaggacagcccgtttatcgcgaagtctgcggccgccaccacccagccccagccccca\n", "tgctcggcaaggtcagggaaggcaaggcccagcgagcgca\n", "tcggcaaggtcagggaaggcaaggcccaccgagcgcagcagcccgtaggacagcccgtttatcgcgaaggctgcggccgccaccacccagccccagcccccatccgggggtccggcgggctN\n", "tcggcaaggtcagggaaggcaaggcccagcgagcgcagcagcccgtaggacagcccgtttatcgcgaaggctgcgg\n", "tcggcaaggtcagggaaggcaaggcccagcgagcgcagcagcccgtaggacagc\n", "cagcaaggtcagggaaggcaaggcccagcgagcgcagcagcccgtaggacagc\n", "gcaaggtcagggaaggcaaggcccagcgagcgcagcagcccgta\n", "caaggtcagggaaggcaaggcccagcgagcgcagcagcccgtaggacag\n", "caaggtcagggaaggcaaggcccagcgagcgcagcagccc\n", "caaggtcagggaaggcaaggcccagcgagcgcagcagcccgtaggacagcccgtttatcgcgaaggctgcggccgccacca\n", "aggtcagggaaggcaaggcccagcgagcgcagcagcccgtaggacagcccgtttatcgcgaaggctgcggccgccacca\n", "aggtcagggaaggcaaggcccagcgagcgcagcagcccgtaggacagcccgttt\n", "tcagggaaggcaaggcccagcgagcgcagcagcccgtaggacagcccgtttatcgcgaaggct\n", "tcagggaaggcaaggcccagcgagcgcagcagcccgtaggaca\n", "agggaaggcaaggcccagcgagcgcagcagcccgtaggacagcccgtttatcgcgaagg\n", "aggcaaggcccagcgagcgcagcagcccgtaggacagcccgtttatcgcgaaggctgcggccgccaccaccca\n", "caaggcccagcgagcgcagcagcccgtaggacagcccgttta\n", "aaggcccagcgagcgcagcagcccgtaggacagcccgtttatcgcgaaggctgcggccgccaccacccagccccagcccccatcc\n", "aggcccagcgagcgcagcagcccgtaggacagcccgtttatcgcgaaggctgcggccgccaccaccc\n", "agcgagcgcagcagcccgtaggacagcccgtttatcgcga\n", "agcgagcgcagaagcccgtaggacagcccgtttatcgcgaaggctgcggccgc\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "aagcgcagcagcccgtaggacagcccgtttatcgcgaaggctgc\n", "cgcagcagcccgtaggacagcccgtttatcgcgaaggctgcggccgccaccacccagccccagcc\n", 
"gcagcagcccgtaggacagcccgtttatcgcgaaggctgcggccgccaccacccagccccagcccccatccgg\n", "cagcagcccgtaggacagcccgtttatcgcgaaggctgcggccgccaccacccagccccagcccccatccgggggtccggcgggctggggggtcatcgccgtctgcggggtggggaaacatct\n", "agcagcccgtaggacagcccgtttatcgcgaaggctgcggccgcca\n", "cagcccgtaggacagcccgtttatcgcgaaggctgcggccgccaccacccagccccag\n", "cagcccgtaggacagcccgtttatcgcgaaggctgcggccgccaccacccagccccagcccccatccgggggtccggcgggctgggg\n", "cagcccgtaggacagcccgtttatcgcgaaggctgcggccgccaccacccagccccagcccccatccgggggtccggcgggctggggg\n", "agcccgtaggacagcccgtttatcgggaaggccgcggcc\n", "cccgtaggacagcccgtttatcgcgaaggctgcggccgccaccacccagccccagcccccatccgggggtccggcgggctggggggtcatcgccgtctgcggggtgggtaaacatct\n", "cccgtaggacagcccgtttatcgcgaaggctgcggccgccaccacacagcccc\n", "ccgtaggacagcccgtttatcgcgaaggctgcggccgccaccacccagccccagcccccatccgggggtccggcgggctggg\n", "gtaggacagcccgtttatcgcgaaggctgcggccaccaccacccagccccagcccccatccg\n", "taggacagcccgtttatcgcgaaggctgcggccgccaccacccagccccagcccccatccgggggtccggcggg\n", "taggacagcccgtttatcgcgaaggctgcggccgccaccacccagccccagcccccatccgggggt\n", "ggacagcccgtttatcgcgaaggctgcggccgccaccacccagccccagcccccat\n", "agcccgtttatcgcgaaggctgcggccgccaccacccag\n", "agcccgtttatcgcgaaggctgcggccgccaccacccagccccagccc\n", "cgtttatcgcgaaggctgcggccgccaccacccagccccagcccccatccgggggtccggcgggctggggggtcatcgccgtctgc\n", "cgtttatcgcgaaggctgcggccgccaccacccagccccagaccccat\n", "gtttatcgcgaaggctgcggccgccaccacccagccccagccc\n", "tttatcgcgaaggctgcggccgccaccacccagccccagcccccatccgggggtccggcgggctgggg\n", "atcgcgaaggctgcggccgccaccacccagccccagcccccatccgggggtccg\n", "atcgcgaaggctgcggccgccaccacccagccccagcccccatccgggggtccgg\n", "acgaaggctgcggccgccaccacccagccccagccccaatccgggggtccgg\n", "aaggctgcggccgccaccacccagccccagcccccatccgggggtccggcggg\n", "aaggctgcggccgccaccacccagccccagcccccatccgggggtccggcgggctggggggtcatcgccgtctgcggggtggggaaacatctgtgagagaaa\n", "ggctgcggccgccaccacccagccccagcccccatccgggggtccggcgggctggggggtcatcgccgtctgcg\n", "gctgcggccgccaccacccagccccagcccccatccgggggtccggcgggctg\n", 
"gctgcggccgccaccacccagccccagcccccatccgggggtccggcgg\n", "ctgcggccgccaccacccagccccagcccccatccgggggtccggcgggctggggggtca\n", "ctgcggccgccacaacccagccccagcccccatccgggggtccggcgggc\n", "cggccgccaccacccagccccagcccccatccgggggtccggcgggctggggggtcatc\n", "accacccagccccagcccccatccgggggtccggcgggctggggggtcatcgccgtctgcggggtggggaaacatctgtgagagaagcc\n", "acccagccccagcccccatccgggggtccggcgggctggggggtcatcgccgtctgcggggtggg\n", "cagccccagcccccatccgggggtccggcgggctggggggtcatcgccgtctgcggggtggggaaacatctgtgagagaagcctccacgcctgtgcttccgctggggagctggcatccctgagatccagcctgtgg\n", "ggtccggcgggctggggggtcatcgccgtctgcggggtggggaaacatctgtgagagaa\n", "gtccggcgggctggggggtcatcgccgtctgcggggtggggaaacatc\n", "tccggcgggctggggggtcatcgccgtctgcggggtggggaaacatctgt\n", "tccggcggtctggggggtcatcgccgtctgcggggtggggaaacatctgtgagagaagcctccacg\n", "tccggcgggctggggggtcatcgccgtctgcggggtggggaaacatctgtgaga\n", "gggggtcatcgccgtctgcggggtggggaaacatctgtgagagaagcctccacgcctgtgcttc\n", "gggggtcatcgccgtctgcggggtggggaaacatctgtgagagaagcct\n", "ggggtcatcgccgtctgcggggtggggaaacatctgtgagagaagcctccacgcctgtg\n", "gggtcatcgccgtctgcggggtggggaaacatctgtgagagaagcctccacgcctgtgcttccgctggggagctggcatccctgag\n", "ggtcatcgccgtctgcggggtggggaaacatctgtgagagaagcctcca\n", "ggtcatcgctgtctgcggggtggggaaacatctgtgagagaa\n", "gtcatcgccgtctgcggggtggggaaacatctgtgagagaagcctccacgcctgtgcttccgctggggagctggcatccctgagatccagcctgtggctg\n", "tcatcgccgtctgcggggtggggaaacatctgtgagagaagcctccacgcctgtgcttccgctggggagctggcat\n", "tcatcgccgtctgcggggtggggaaacatctgtgagagaagcctccacgcctgtgcttccgctgga\n", "gccgtctgcggggtggggaaacatctgtgagagaagcctccacgcctgtgcttccgctggggagctggcatccctgagatccag\n", "gccgtctgcggggtggggaaacatctgtgagagaagcctccacgcctgtgcttccgctggggagctggca\n", "atctgcggggtggggaaacatctgtgagagaagcctccacgcctgtgcttccgctgggg\n", "tctgcggggtggggaaacatctgtgagagaagcctccacgcctgtgcttccgctggggagctggcatccctgagat\n", "gcggtgtggggaaacatctgtgagagaagcctccacgcctgtgctt\n", "gtggggaaacatctgtgagagaagcctccacgcctgtgcttccgctggggag\n", 
"tggggaaacatctgtgagagaagcctccacgcctgtgcttccgctggggagctggcatccctgagatccagcctgtggctgctcgcccggggtgggc\n", "ggggaaacatctgtgagagaagcctccacgcctgtgcttccgctggggagctggcatcc\n", "gggaaacatctgtgagagaagcctccacgcctgtgcttccgct\n", "ggaaacatctgtgagagaagcctccacgcctgtgcttccgctggggagctggcatccctgagatccagcctgtggctgctcgcccggggtggggg\n", "ggaaacatctgtgagagaagcctccacgcctgtgcttccgctggggagctggcatccctgagatccagcctgtggctgctcgcccggggtggg\n", "aaaacatctgtgagagaagcctccacgcctgtgctt\n", "aacatctgtgagagaagcctccacgcctgtgcttccgctggggagatggcatccctgaga\n", "atctgtgagagaagcctccacgcctgtgcttccgctggggagctggcatccctgagatccagcctgtggctgctcg\n", "tctgtgagagaagcctccacgcctgtgcttccgctggggagctggcatccctgagatccagcctg\n", "ctgtgagagaagcctccacgcctgtgcttccgctggggagctggcatccctgagat\n", "agagaagcctccacgcctgtgcttccgctggggagctggcatccctga\n", "gagaagcctccacgcctgtgcttccgctggggagctggcatccctgagatccagcct\n", "agNagcctccacgcctgtgcttccgctggggagctggcatccctgagatccagcctgtggctgctcgcccggggtgggcccgtcactccgagcgcgatggcgcgg\n", "gacgcctccacgcctgtgcttccgctggggagctggcatccctgagatccagcctgtggctgctcgcccggggtgggcccgtcactccgagcgcgatggcgcggggcggagg\n", "aagcctccacgcctgtgcttccgctggggagctggcatccctgagatcca\n", "agcctccacgcctgtgcttccgctggggagctggcatccctga\n", "cctccacgcctgtgcttccgctggggagctggcatccctgag\n", "cacgcctgtgcttccgctggggagctggcatccctgagatccagcctgt\n", "cacgcctgtgcttccgctggggagctggcatccctgagatccagcctgtggctgctcgcccggggtgggcccgtcactccgagc\n", "acgcctgtgcttccgctggggagctggcatccctgagatccagcctgtggc\n", "gccctgtgctagcgctggggagctggcatccctgagatccagcctgtggctgctcgcccggggtgggcccgtcactccgagcgcgatggcgcggg\n", "gcctgtgcttccgctggggagctggcatccctgagatcca\n", "cctgtgcttccgctggggagctggcatccctgagatccagcctgtggctgctcgcccggggtgggcccgtcactccgagcgcgatggcgcggg\n", "cctgtgcttccgctggggagctggcatccctgagatccagcctgtggctgctcgcccggcgggggcccgtcactccgagcgcgatggcgcggggg\n", "tgtgcttccgctggggagctggcatccctgagatccagcctgtggctgNtcgcccggggtgggcccgtcactccgagcgcgatggcgcggggcggagggagccg\n", "tgtgcttcagctggggagctggcatccctgagatccagcctgtgg\n", 
"tgcttccgctggggagctggcatccctgagatccagcctgtggctg\n", "acttccgctggggagctggcatccctgagatccagcctgtggctgctcgcccggggtggg\n", "cttccgctggggagctggcatccctgagatccagcctgtggctgctcgcccggggtgggcccgtcactccgagc\n", "ttccgctggggagctggcatccctgagatccagcctgtggct\n", "gctggggagctggcatccctgagatccagcctgtggctg\n", "gctggggagctggcatccctgagatccagcctgtggctgctcgcccggggtgggcc\n", "gggagctggcatccctgagatccagcctgtggctgctcgcccggggt\n", "gggagctggcatccctgagatccagcctgtggctgctcgcccggggtggg\n", "agagctggcatccctgagatccagcctgtggctgctcgcccggggtgggc\n", "gagctggcatccctgagatccagcctgtggctgctcgcc\n", "gagctggcatccctgagatccagcctgtggctgctcgcccggggtgggcccgtcactccgagcgcgatgg\n", "gctggcatccctgagatccagcctgtggctgctcgcccggggtgggcccgtcactccgagcgcgatggcgc\n", "ggcatccctgagatccagcctgtggctgctcgcccggggtgggcccgtcactccgagcgcgatggcgcggggcggagggagccggagcctggcctagggctggaactcccgggtccgcgcgaggtacggggacggggacagccagatccccaggcccgag\n", "catccctgagatccagcctgtggctgctcgcccggggtgggcccgtcactccgagcgcgatggcgcggggc\n", "atccctgagatccagcctgtggctgctcgcccggggtgggcccgtcactccga\n", "ctgagatccagcctgtggctgctcgcccggggtgggcccgtcactccgagcgcgatggcgcggggcggagggagccggagcctggcctagggctggaactcccgggtccgcgcga\n", "ctgagatccagcctgtggctgctcgcccggggtgggcccgtcactccgagcgcgatggcgcggggcggagggagccggagcctggcctagggctggaactcccgggtccgcgcgaggtacggggacggggaca\n", "gagatccagcctgtggctgctcgcccggggtgggcccgtcactccgag\n", "agatccagcctgtggctgctcgcccggggtgggcccgtcact\n", "agcctgtggctgctcgcccggggtgggcccgtcactccg\n", "gcctgtggctgcccgcccggggtggggccgtcactccgagcgcgatggcgcggggcggagggagccggagcctggcctagggctggaactcccgggtccgc\n", "cctgtggctgctcgcccggggtgggaccgtcactccgagcgcgatggc\n", "ctgtggctgctcgcccggggtgggcccgtcactccgagcgcgatggcgc\n", "tgtggctgctcgcccggggtgggcccgtcactccgagcgcgatggcgcggggcggagggagccggagcctgg\n", "actgctcgcccggggtgggcccgtcactccgagcgcgatggcgcggggcggagggagccggagcctggcctagggctggaactcccgggtccgcgcgaggtacggggacggggacagccagatccccaggcccgagg\n", "ctgctcgcccggggtgggcccgtcactccgagcgcgatggcgcgggg\n", "tcgcccggggtgggcccgtcactccgagcgcgatggcgcggggcggagggagccgg\n", 
"cggggtgggcccgtcactccgagcgcgatggcgcggggcggag\n", "ggggtgggcccgtcactccgagcgcgatggcgcggggcggagggagccggagcctggcc\n", "ggggtgggcccgtcactccgagcgcggtggcgcggggcggagggagccggagcctggcctagggctggaactcccgggtcc\n", "gtgggcccgtcactccgagcgcgatggcgcggggcggagggagccggagcctggcctagggctggaactcccgggtccgcgcgaggta\n", "gggcccgtcactccgagcgcgatggcgcggggcggagggagccggagcctggcctagggctggaactcccgggtcc\n", "cccgtcactccgagcgcgatggcgcggggcggagggagccggagcctggcctagggctggaact\n", "tccgagcgcgatggcgcggggcggagggagccggggcctggcctaggg\n", "ccgagcgcgatggcgcggggcggagggagccggagcctggcctagggctggaactc\n", "cgagcgcgatggcgcggggcggagggagccggagcctggcctagggctggaactcccgggtccgcgcgaggtacggggacggggacagccagatcccca\n", "agcgcgatggcgcggggcggagggagccggagcctggcctagggctggaactcccgggtccgcgcgaggtacggggacgggg\n", "gatggcgcggggcggagggagccggagcctggcctagggctggaactct\n", "gatggcgcggggcggagggagccggagcctggcctagggctggaact\n", "atggcgcggggcggagggagccggagcctggcctagggctggaac\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "atggcgcggggcggagggacccggagcctggcctagggctggaactcccgggtccgcgcga\n", "atggcgcggggcggagggagccggagcctggcctagggctggaactcccgggtcc\n", "gcgcggggcggagggagccggagcctggcctagggctggaactcccgggtccgcgcgaggtacggggacggggacagccagatccccaggcccgaggttccccgtcc\n", "cgcggggcggagggagccggagcctggcctagggctggaac\n", "gcggggcggagggagccggagcctggcctagggctggaactcccgggtccgcgcgaggtacg\n", "cggggcggagggagccggagcctggcctagggctggaactcccgggt\n", "cggggcggagggagccggagcctggcctagggctggaact\n", "atctacggagggagccggagcctggcctagggctggaactcccgggtccgcgcgaggtacggggacggggacagccagatcccca\n", "cggagggagccggagcctggcctagggctggaactcccgg\n", "agggagccggagcctggcctagggctggaactcccgggtccgcgcgaggtacggggacggggacagccagatcccc\n", "gggagccggagcctggcctagggctggaactcccgggtccgc\n", "ggagccggagcctggcctagggctggaactcccgggtccgcgcgaggtacggggacggggacagccagatccccaggtccgaggttccccgtcccacgcacactccttcccccttacccgacctctccgggcggtgc\n", "ggagccggagcctggcctagggctggaactcccgggtccgcgcgaggtacggggacggggacagccagatccccaggcccgaggttccccgtcccacgcacactcct\n", "ccggagcctggcctagggctggaactcccgggtct\n", 
"cggagcctggcctagggctggaacgcccgggtccgcgcgaggtacggggacgggga\n", "cggcctggcctagggctggaactcccgggtccgcgcgaggtacggggacggggacagccagatccccag\n", "agcctggcctagggctggaactcccgggtccgcgcgaggtacggggacggggacagccagatccccag\n", "ctggcctagggctggaactcccgggtcagcgcgaggtacggggacggggacagccagatcc\n", "tggcctaggcctggaactcccgtgtccgcgcgagg\n", "ctagggctggaactcccgggtccgcgcgaggtacggggacggggacagccagatccccaggcccgaggttccccgtcccacgcacactcctt\n", "ctagggctggaactcccgggtccgcgcgaggtacggggacgggga\n", "tagggctggaactcccgggtccgcgcgaggtacggggacggggac\n", "ttggaactcccgggtccgcgcgaggtacggggacggggacagccagatccccaggcccgaggttccccgtcccacgcacact\n", "ctggaactcccgggtccgcgcgaggtacggggacggggacagcca\n", "tcccgggtccgcgcgaggtacggggacggggacagccagatccccaggcccgaggttccccgtccca\n", "gtccgcgcgaggtacggggacggggacagccagat\n", "gtccgcgcgaggtacggggacggggacagccagatccccaggcccgaggttccccgtccca\n", "gcgcgaggtacggggacggggacagccagatccccaggcccgaggttccccgtcc\n", "acgaggtacggggacggggacagccagatccccaggcccgaggttc\n", "gtacggggacggggacagccagatccccaggcccgaggttccccgtcccacgcacactccttcccccttacccga\n", "atacggggacggggacagccagatccccaggcccgaggttcc\n", "tacgggggcggggacagccagatccccaggcccgaggttccccgtcccacgcacactccttccccctta\n", "cggggacggggacagccagatccccaggcccgaggttccccgtcccacgc\n", "cggggacggggacagccagatccccaggcccgaggttccccgtcccacgcacactccttcccc\n", "ggggacggggacagccagatccccaggcccgaggttccccgtcccacgcacactccttcccccttacccgacctctccgggcggtgcggggaggg\n", "ggacagccagatccccaggcccgaggttccccgtcccacgcacact\n", "gacagccagatccccaggcccgaggttccccgtcccacgcacactccttccccct\n", "agccagatccccaggcccgaggttccccgtcccacgcacactccttcccccttacccgacctctcagga\n", "agccagatacccaggcccgaggttccccgtcccacgcacactccttcccccttacccgacctctccgggcggtg\n", "ccagatccccaggcccgaggttccccgtcccacgcacactccttcccccttatcc\n", "ccagatccccaggcccgaggttccccgtcccacgcacatt\n", "cagatccccaggcccgaggttccccgtcccacgcacactccttcccccttacccga\n", "cagatccccaggcccgaggttacccgtcccacgcacactccttccccctt\n", "gatccccaggcccgaggttccccgtcccacgcacactccttcccccttacccgacctctccgggcggtgcggggaggggaagggtgagga\n", 
"gcccgagtttccccgtcccacgcacactccttcccccttacccgacctctccgg\n", "tccgaggttccccgtcccacgcactctccttcccccttac\n", "ccgaggttccccgtcccacgcacactccttcccccttacccgacctctccgggcggtgcggggaggggaagggtgaggaagggctgggcccggctttctctctgcttcccaggcgggcgggg\n", "ccgaggttccccgtcccacgcacactccttcccccttacccgacctctccgggcgg\n", "gaggttccccgtcccacgcacactccttcccccttacccgacctctccgggcggtgcggggaggggaagggtgaggaagggctgggcccggcttt\n", "gaggttccccgtcccacgcacactccttcccccttacccgacctctccgggcggtgcg\n", "aggttccccgtcccacgcacactccttcccccttacccga\n", "aggttccccgtcccacgcacactccttcccccttacccgacctctccgggcggtgcggggaggggaagggtgag\n", "aggttccccgtcccacgcacactccttcccccttacccgac\n", "ttccccgtcccacgcacactccttcccccttacccgacctctt\n", "ttccccgtcccacgcacactccttcccccttacccgacctctccgggc\n", "ccgtcccacgcacactccttcccccttacccgacctctccgggcggtgcggggaggggaa\n", "acgcacactccttcccccttacccgacctctccgggcggtgcggggaggggaa\n", "actccttcccccttacccgacctctccgggcggtgcggggaggggaagggtgaggaaggcctgggcccggcttt\n", "actccttcccccttacccgacctctccgggcggtgcggggaggggaagggtgaggaagggctgggcccggctttctctct\n", "actccttcccccttacccgacctctccgggcggtgcggggaggggaagggtgaggaagggctgg\n", "tccttcccccttacccgacctctccgggcgttgcggggaggggaa\n", "cttcccccttacccgacctctccgggcggtgcggggaggggaagggtgag\n", "cttcccccttacccgacctctccgggcggtgcgggga\n", "cccttacccgacctctccgggcggtgcgggaggggaagggtgaggaagggctgggcccggctt\n", "ttacccgacctctccgggcggtgcggggaggggaagggtgaggaagggctgggcccggctttctctctgcttc\n", "ttacccgacctctccgggcggtgcggggaggggaagggtgaggaagggctggg\n", "tacccgacctctccgggcggtgcggggaggggaagggtgaggaagggctgggcccggctttctctctgcttcccaggcgggcgggggccccgaaggggagcga\n", "acccgacctctccgggcggtgcggggaggggaagggtgaggaagggctgggcccggctttctctctgcttcccaggcgggcgggggccccgaaggggagcgagggcagcgatgga\n", "ccgacctctccgggcggtgcggggaggggaagggtgaggaagggctgggcccggctttctctctgct\n", "cgacctctccgggcggtgcggggaggggaagggtgaggaagggctgggcccggctttctctctgcttcccaggcgg\n", "gacctctccgggcggtgcggggaggggaagggtgaggaagggctgggcccggctttctctctgcttcccgggcgggcgggggccccgaaggg\n", "acctctccgggcggtgcggggaggggaagggtgaggaagggt\n", 
"cctctccgggcggtgcggggaggggaagggtgaggaagggctgggcccggctttctctctgcttcccaggc\n", "tctccgggcggtgcggggaggggaagggtgaggaaggggtgggcccggctttctctctgcttcccagg\n", "tctccgggcggtgcggggaggggtagggtgaggaagggctgg\n", "gcggtgcggggaggggaagggtgaggaagggctgggcccggcttt\n", "acggtgcggggaggggaagggtgaggaagggctgggcccggctttctctctgcttcccaggcgggcgggggccccgaaggggagcgagggcagcgatggagcccaacttg\n", "cggtgcggggaggggaagggtgaggaagggctgggcccggctttctctctgcttcccaggcgggcgggggccccgaaggggagcgagggcagcgatggagcccaacttgga\n", "tgcggggaggggaagggtgaggaagggctgggcccggctttctc\n", "cggggaggggaagggtgaggaagggctgggcccggctttctctctgcttcccaggcgggcgggggccccgaaggggagcg\n", "ggggaggggaagggtgaggaagggctgggcccggctttctctctgcttcccaggcgggcggggg\n", "aggggaagggtgaggaagggctgggcccggctttctctctgcttcccaggcgggcgggggc\n", "aggggaagggtgaggaagggctgggcccggctttctctctgcttcccaggcgggcgggggccccgaaggggagcgagggcagcgatggagcccaact\n", "aagggtgaggaagggctgggcccggctttctctctgcttcccaggcgggcg\n", "aagggtgaggaagggctgggcccggctttctctctgcttcccaggcgggcgggggccccgaaggg\n", "agggtgaggaagggctgggcccggctttctctctgcttcccaggc\n", "ggtgaggaagggctgggcccggctttctctctgcttcccaggcg\n", "gaggaagggctgggcccggctttctctctgcttcccaggcggg\n", "gaggaagggctgggcccggctttctctctgcttcccaggcgggcgggggc\n", "aggaagggctgggcccggctttctctctgcttcccaggcgggcgggggccccgaa\n", "aggaagggctgggcccggctttctctctgcttcccaggcgggcgggggccccgaaggggagcga\n", "gaagggctgggcccggctttctctctgcttcccaggcgggcgg\n", "aagggctgggcccggctttctctctgcttcccaggcgggcggggg\n", "agggctgggcccggctttctctctgcttcccaggcgggcgggggccccgaaggggagcgagggcagcgatggag\n", "gctgggcccggctttctctctgcttcccaggcgggcgggggccccga\n", "gctgggcccggctttctctctgcttcccaggcgggcgggggccccgaa\n", "tgggcccggctttctctctgcttcccaggcgggcgggggccccgaa\n", "ggcccggctttctctctgcttcccaggcgggcgggggccccgaaggggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaa\n", "ccggctttctctctgcttcccaggcgggcgggggccccgaaggggagcgagggcagcgatggagcct\n", "ctttctctctgcttcccaggcgggcgggggccccgaaggggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaacagagatcaccacaggggcctgagcc\n", 
"ttttctctctgcttcccaggcgggcgggggccccgaaggggagcgagggcagcgatggag\n", "ctttctctctgcttcccaggcgggcgggggccccgaaggggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaacagagataa\n", "ttctctctgcttcccaggcgggcgggggccccgaaggggagcgagggcagc\n", "tctctctgcttcccaggcgggcgggggccccgaaggggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaaca\n", "ctctctgcttcccaggcgggcgggggccccgaaggggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaacagagatcaccacaggggcctgagccacc\n", "tctctgcttcccaggcgggcgggggccccgaaggggagcga\n", "tctctgcttcccaggcgggcgggggccccgaaggggag\n", "tctctgcttcccaggcgggcgggggccccgaaggggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaacagagatcaccacaggggcctgagccacctgggac\n", "tctgcttcccaggcgggcgggggccccgaaggggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaacagagatcaccaca\n", "tgcttcccaggcgggcgggggccccgaaggggagcgagggca\n", "tgcttcccaggcgggcgggggccccgaaggggagcgagggcagcgatggagcccaacttgga\n", "tgcttcccaggcgggcgggggccccgaaggggagcgagggcagcgatggag\n", "tgcttcccaggcgggcgggggccccgaaggggagcgagggcagcgatggagcccaacttggac\n", "gcttcccaggcgggcgggggccccgaaggggagcgagggca\n", "ttcccaggcgggcgggggccccgaaggggagcgagggcagcgatggagcccaactt\n", "caggcgggcgggggccccgaaggggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaatagagatcaccacaggggcctgagccacctgggacgcggggtgtacggagggcggga\n", "ggcgggcgggggccccgaaggggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaacagagatcaccacaggggcctgagccacctgggacgcggggtgtacggagggcgggg\n", "gggcgggggccccgaaggggagcgagggcagcgatggagcccaacttggacgggct\n", "gggcgggggccccgaaggggagcgagggcagcgatggagcccaacttggacgg\n", "acgggggccccgaaggggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaacagaga\n", "cgggggccccgaaggggagcgagggcagcgatggagcccaactt\n", "gggggccccgaaggggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaac\n", "ccccgaaggggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaacagagatcaccacaggggcctgagccacctgggacgcggggtgtacggagggcgggggcgagctgaaaca\n", "cgaaggggagcgaaggcagcgatggagcccaacttggacgggctctctcggtaaac\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ 
"cgaaggggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaacagagatcacc\n", "gaaggggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaacagagatcaccacaggggcctgagccacctgggacgcggggtgtacggagggcgggggcgagctgaaaca\n", "aaggggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaacaga\n", "aggggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaacagagatcaccacaggggc\n", "aggggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaaca\n", "ggagcgagggcagcgatggagcccaacttggacgggctctctcggtaaacagagatcaccacaggggcctga\n", "gagcgagggcagcgatggagcccaacttggacgggctctct\n", "gagcgagggcagcgatggagcccaacttggacgggctctctcggtaaaca\n", "gcgagggcagcgatggagcccaacttggacgggctctctcggtaaacagagatcaccacaggggcctga\n", "ggcagcgatggagcccaacttggacgggctctctcggtaaacag\n", "gcagcgatggagcccaacttggacgggctctctcggtaaacagagatcaccat\n", "tagcgatggagcccaacttggacgggctctctcggtaaacagagatcaccacaggg\n", "agcgatggagcccaacttggacgggctatctcggtaaacagagatcaccacaggggcctgagccacctgggacgcggggtgtacggagggcgggggcgagc\n", "tccaacttggacgggctctctcggtaaacagagatcaccacaggggcctgagccacct\n", "aacttggacgggctctctcggtaaacagagatcaccac\n", "aacttggacgggctctctcggtaaacagagatcaccacaggggcctgagccacct\n", "acttggacgggctctctcggtaaacagagatcaccacaggggcctgagccacctgggacgcggggtgtacggagg\n", "ggacgggctctctcggtaaacagagatcaccacaggggcctgagccacctgggacgcggggtgtacggagggcgggggcgagctgaaacagccaatccggcaagccgcgcgtgaggcta\n", "ctctctcggtaaacagagatcaccacaggggcctgagccacctgggacgcggg\n", "ctctctcggtaaacagagatcaccacaggggcctaagccacct\n", "ctctcggtaaacagagatcaccacaggggcctgagccacctgg\n", "ctcggtaaacagagatcaccacaggggcctgagccacctgggacgcggggtgtacggagggcgggggcgagctgaaacagt\n", "tcggtaaacagagatcaccacaggggccttagccac\n", "tcggtaaacagagatcaccacaggggcctgagccacctggga\n", "ggtgaacagagatcaccacaggggcctgagccacctgggacgcggg\n", "ggtaaacagagatcaccacaggggcctgagccacctgggacgcggggtgt\n", "aaacagagatcaccacaggggcctgagccacctgggacgcgg\n", "acagagatcaccacaggggcctgagccacctgggacgcgg\n", "agagatcaccacaggggcctgagccacctgggacgcggggtgtacggagggcgggggcgagctgaaacagccaatct\n", "agagatcaccacaggggcctgagccacctgggacgcggggtgtacgga\n", 
"agatcaccacaggggcctgagccacctgggacgcggg\n", "agatcaccacaggggcctgagccacctgggaggcggggt\n", "atcaccacaggggcctgagccacctgggacgcggggtgtacggagggcgggggcgagctgaaacagccaatccggcaacccgcgcgtg\n" ] } ], "source": [ "samtools view /data/bam/workshop1.bam | cut -f 10 | tr \"ACGT\" \"acgt\"" ] }, { "cell_type": "code", "execution_count": 14, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "tgaacagttggaggtttcaggaaaacccgataaaaattatttattgggggaggggctcaaacaagaaaataatcaacaagtggtgtccagagtggagccaNggc\n", "aagcagctcccccgtctctggggtaggcgtggctggaggggaggctggaccacaggagggcagcgccctgggcaaccctatgtagatgaagctgccggagaggatcaaagaaccagacaggaggaaagaggcggtgaagtctcctgtctcatcccttaggaagcctgaggagatgggtaaN\n", "tctggggtaggcatggNtggaggggaggctggaccacaggagggcagcgccctgggcaaacctatgtagatgaagctgccggagaggatcaaaga\n", "gaccacaggagggcagcgccctgggcaaccctatgtagatgaagctgccggagaggatcaaagaaccagacaggaggaaagaggcggtNaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccaggg\n", "agaaccagacaggaggaaagaggcggttaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcttttacaagcctcaaacNc\n", "tNgtgaagtctcctgtctcatcccttaggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccaggggcagaggatagttgtaggcagatct\n", "atcccttNggaagcctgaggagatgggtaagggcatttagaagcctcgaaccccagg\n", "agggcccaggagcccccNgaggctcatcagcatcatcaccagccctgtggcctgcacca\n", "gcaccacacctccgacgcccaccagcccggggagtacaccgaaaaccagcggggcNtNac\n", "cagcccggggagtacaccgaaaaccNgcggggcgtaactccccgcgctcagcccatag\n", "cagggggtgaggtggagggtgatcgcgccgaggaggagcagagcgccccgccagccgaaagtatcgaggagaagctgcaaggcgggcgccaggagcagcgaggaggccccgttgccggtgagcgccagccccN\n", "gtNaggtggagggtgatcgcgccgaggaggagcagagcgccccgccagccgaaagtatcgaggagaagctgcaaggcgggcgccaggagcagcgagga\n", "gggcgccgggagcagNgaggaggcccNNttgccggtgagcgccagccccaccgccaagactcgacggcgggagaagtaacgcgagagggtgcctagggcgg\n", "attcccagcccggcNctccgcaccaggcccccgcctcgttcg\n", 
"tcgttcgctaccccagatcccaacaagctcctgtcacctccttcaccctgaatgacccgggcatcccacttccctcaccagcgaggaggcccaggccgaggtagagatgcagcNgaccgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgcc\n", "Nagagatgcagcagaccgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgcccccaaccatcaccacggggcgggccccccagcgcgtgctcagggcgctgcccacggggcctgaaagggggcggagtcaacggaagaca\n", "agatgcagcagacNgctggcgaaagccgagaagacgaagcccagcgaggcgaggatgcccccaaccatcaccacggggcgggccccccagcgcgtgctcagggcgctgcccacggggcctgaaa\n", "Nagacgaagcccagcgaggcgaggatgcccccaaccatcaccacggggcgggccccccagcgcgtgctcagggcgctgcccacggggcctgaaagggggcggagtcaacggaaga\n", "ctcactggctgcctgctgcacggccagggccagggcgctgatccacgcagtgtcctgggcgcttcggtcaaagtgctcggcaaggtcagggaaggcaaggcccagcgagcgcagcagcccgtaggacagcccgtttatcgcgaaN\n", "ttcggtcaaagtgctcggcaaggtcagggaaggcaaggcccagcgagcgcagcagcccgtNggacagcccgtttatcgcgaaggctgc\n", "tcggcaaggtcagggaaggcaaggcccaccgagcgcagcagcccgtaggacagcccgtttatcgcgaaggctgcggccgccaccacccagccccagcccccatccgggggtccggcgggctN\n", "agNagcctccacgcctgtgcttccgctggggagctggcatccctgagatccagcctgtggctgctcgcccggggtgggcccgtcactccgagcgcgatggcgcgg\n", "tgtgcttccgctggggagctggcatccctgagatccagcctgtggctgNtcgcccggggtgggcccgtcactccgagcgcgatggcgcggggcggagggagccg\n" ] } ], "source": [ "samtools view /data/bam/workshop1.bam | cut -f 10 | tr \"ACGT\" \"acgt\"| grep \"N\"" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "Cool way of printing the lines containing N using awk:" ] }, { "cell_type": "code", "execution_count": 15, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "SN7001204_0131_BC0M3YACXX_PEdi_SS_L9302_L9303_2:8:2110:21334:24359\t16\t17\t6944926\t37\t104M\t*\t0\t0\tTGAACAGTTGGAGGTTTCAGGAAAACCCGATAAAAATTATTTATTGGGGGAGGGGCTCAAACAAGAAAATAATCAACAAGTGGTGTCCAGAGTGGAGCCANGGC\t=@=8<7>CA,YW[Y]]]\\YZ[\\[ZV[][Z]]][ZXY]]]]]]W]]]\\ZXRW[TTUX0Z\\WSW]X\\Z[\\Z]]Y[Z[Y]YVVWYV]XZX[XX[XVWVB8899!*88\tX0:i:1\tX1:i:0\tMD:Z:38C61G3\tXF:i:2\tRG:Z:L9303\tXG:i:0\tXI:Z:ACTAAGT\tYI:Z:;;987:9\tXJ:Z:AGAATTA\tYJ:Z:6=67CA8\tNM:i:2\tXM:i:2\tXO:i:0\tXT:A:U\n", 
"NIOBE_0139_A_D0B5GACXX:7:2303:4296:113381\t0\t17\t6945064\t37\t181M\t*\t0\t0\tAAGCAGCTCCCCCGTCTCTGGGGTAGGCGTGGCTGGAGGGGAGGCTGGACCACAGGAGGGCAGCGCCCTGGGCAACCCTATGTAGATGAAGCTGCCGGAGAGGATCAAAGAACCAGACAGGAGGAAAGAGGCGGTGAAGTCTCCTGTCTCATCCCTTAGGAAGCCTGAGGAGATGGGTAAN\tRQORPGOXUSYZZPZTW]]XPPSSSTM[URQVWVSWIOPHVUSPNSULQQUTRSRPNSTTOSSOROVWJMJSIJWJRTQT]]]][]]]]]]TN]]]]]]]]GHONBKPOLOKMNRMONSNO@SQPP=PTOKIFCTCRPLJHLJPRPLKQLOJNJNRNNIJXSOQNWMVLQSNX=AHJNOO!\tX0:i:1\tX1:i:0\tMD:Z:23G156G0\tXF:i:2\tRG:Z:L9105\tXG:i:0\tXI:Z:CCGGCGN\tYI:Z:56.,9/!\tNM:i:2\tXM:i:2\tXO:i:0\tXP:i:2\tXT:A:U\n", "SN7001204_0131_BC0M3YACXX_PEdi_SS_L9302_L9303_2:3:2211:6482:58783\t163\t17\t6945080\t60\t95M\t=\t6945172\t186\tTCTGGGGTAGGCATGGNTGGAGGGGAGGCTGGACCACAGGAGGGCAGCGCCCTGGGCAAACCTATGTAGATGAAGCTGCCGGAGAGGATCAAAGA\t9:><;>;::;:=4>=;!><<:;8<75;8;;89:<98<7:97:985:9;:8;>;8;;7997:8;8:<97;9;9:>;9887:;29765859\tX0:i:1\tX1:i:0\tMD:Z:7G4G3C42C35\tRG:Z:L9302\tXG:i:0\tXI:Z:TGCTTCC\tYI:Z:3704679\tXJ:Z:TAGGCCG\tYJ:Z:66::8;>\tAM:i:37\tNM:i:4\tSM:i:37\tXM:i:4\tXO:i:0\tMQ:i:60\tXT:A:U\n", "SN928_0068_BB022WACXX:2:2104:16028:159102\t16\t17\t6945111\t37\t161M\t*\t0\t0\tGACCACAGGAGGGCAGCGCCCTGGGCAACCCTATGTAGATGAAGCTGCCGGAGAGGATCAAAGAACCAGACAGGAGGAAAGAGGCGGTNAAGTCTCCTGTCTCATCCCTTAGGAAGCCTGAGGAGATGGGTAAGGGCATTTAGAAGCCTCGAACCCCAGGG\tYXTSV]]]]W]]]XS]Y]\\[\\\\]Y]X]]]\\]]]]]]]]\\]]]Y]]]]]]]]]]ZZ]]Y]U]]]]]]]]]]]]]]]]]]]]]]]]]]]]!]]]]]]]Y][]]Z]Z]]]]]]]]]]]W]]]]]]P]V]]Z]]]]]]]Y]]]]]]]]]]]]]]\\]]XYVU]XUQ\tX0:i:1\tX1:i:0\tMD:Z:88G72\tXF:i:2\tRG:Z:L9198\tXG:i:0\tXI:Z:AGATGGN\tYI:Z::G<>CC!\tXJ:Z:CNGGTNN\tYJ:Z:\tAM:i:37\tNM:i:5\tSM:i:37\tXM:i:5\tXO:i:0\tMQ:i:60\tXT:A:U\n", 
"SN7001204_0131_BC0M3YACXX_PEdi_SS_L9302_L9303_2:3:2316:7959:59899\t0\t17\t6945195\t37\t102M\t*\t0\t0\tTNGTGAAGTCTCCTGTCTCATCCCTTAGGAAGCCTGAGGAGATGGGTAAGGGCATTTAGAAGCCTCGAACCCCAGGGGCAGAGGATAGTTGTAGGCAGATCT\t8!;;<=@Y\\]]\\]]]\\]][][Z\\]]]]]]]]]]]]]]]]]]]\\]]]]]]]]]]]\\]]]]]]]]]]]]]]]]]]]]]]]\\]]]]]\\]]]]]]Z]]V>C?@=A=\tX0:i:1\tX1:i:0\tMD:Z:0C0G100\tXF:i:2\tRG:Z:L9302\tXG:i:0\tXI:Z:TGCTTCC\tYI:Z:>@6?B\tNM:i:2\tXM:i:2\tXO:i:0\tXT:A:U\n", "SN7001204_0130_AC0M6HACXX_PEdi_SS_L9302_L9303_1:5:1113:8739:48871\t0\t17\t6945214\t37\t57M\t*\t0\t0\tATCCCTTNGGAAGCCTGAGGAGATGGGTAAGGGCATTTAGAAGCCTCGAACCCCAGG\t]]]]]]]!]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]\tX0:i:1\tX1:i:0\tMD:Z:7A49\tXF:i:2\tRG:Z:L9303\tXG:i:0\tXI:Z:ACTAAGT\tYI:Z:>?B;=A?\tXJ:Z:AGAATTA\tYJ:Z:=?<B\tXJ:Z:TAGGCCG\tYJ:Z:;;==9>>\tNM:i:1\tXM:i:1\tXO:i:0\tXP:i:2\tXT:A:U\n", "SN7001204_0130_AC0M6HACXX_PEdi_SS_L9302_L9303_1:3:1106:18037:6562\t16\t17\t6945378\t37\t60M\t*\t0\t0\tGCACCACACCTCCGACGCCCACCAGCCCGGGGAGTACACCGAAAACCAGCGGGGCNTNAC\tDIELMEM>MMFMIMFMAKMGKMMJMLMMMMMKJMJMMFMLMMMKHL,%10-0,*+!K!FF\tX0:i:1\tX1:i:0\tMD:Z:55G1A2\tXF:i:2\tRG:Z:L9303\tXG:i:0\tXI:Z:ACTAAGT\tYI:Z:@AC?AA@\tXJ:Z:AGAATTA\tYJ:Z:>@<>@A>\tNM:i:2\tXM:i:2\tXO:i:0\tXP:i:5\tXT:A:U\n", "SN928_0068_BB022WACXX:1:1305:13679:29102\t0\t17\t6945400\t37\t58M\t*\t0\t0\tCAGCCCGGGGAGTACACCGAAAACCNGCGGGGCGTAACTCCCCGCGCTCAGCCCATAG\t]]]]]]]]]]]]]]]]]]]]]]]]]!]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]\tX0:i:1\tX1:i:0\tMD:Z:25A32\tXF:i:2\tRG:Z:L9198\tXG:i:0\tXI:Z:AGATGGN\tYI:Z::H;>FD!\tXJ:Z:CNGGNNC\tYJ:Z:0!BA!!@\tNM:i:1\tXM:i:1\tXO:i:0\tXP:i:2\tXT:A:U\n", 
"NIOBE_0139_A_D0B5GACXX:6:2102:11566:54336\t0\t17\t6945872\t37\t133M\t*\t0\t0\tCAGGGGGTGAGGTGGAGGGTGATCGCGCCGAGGAGGAGCAGAGCGCCCCGCCAGCCGAAAGTATCGAGGAGAAGCTGCAAGGCGGGCGCCAGGAGCAGCGAGGAGGCCCCGTTGCCGGTGAGCGCCAGCCCCN\t?8=>;=;9:@<<;<9=<<:<<>?>??=>=PQMXNOWQPXVUORT[UTS.RUYUVTV[WU[YYRTW[YXWZQUY\\ZUVXVVSVOQ-UXVZYVTT[WSRS:8;8649518965:897=;=;766./87876!\tX0:i:1\tX1:i:0\tMD:Z:68A63A0\tXF:i:2\tRG:Z:L9105\tXG:i:0\tXI:Z:CCGGCGN\tYI:Z:<>40>5!\tNM:i:2\tXM:i:2\tXO:i:0\tXT:A:U\n", "SN7001204_0131_BC0M3YACXX_PEdi_SS_L9302_L9303_2:6:2114:9910:48286\t0\t17\t6945878\t37\t98M\t*\t0\t0\tGTNAGGTGGAGGGTGATCGCGCCGAGGAGGAGCAGAGCGCCCCGCCAGCCGAAAGTATCGAGGAGAAGCTGCAAGGCGGGCGCCAGGAGCAGCGAGGA\t=8!W<97899<885]]U]][]Y]]\\]]]]]\\]]]\\][Q][]]]X\\X]]]]]]]]]X]Y]]]]]]]]]]]U]\\]]]]]]]]]]]]]]]]]]]X]\\]>@:\tX0:i:1\tX1:i:0\tMD:Z:2G59A35\tXF:i:2\tRG:Z:L9303\tXG:i:0\tXI:Z:ACTAAGT\tYI:Z:9;897>6\tXJ:Z:AGAATTA\tYJ:Z:9=98@A8\tNM:i:2\tXM:i:2\tXO:i:0\tXT:A:U\n", "NIOBE_0139_A_D0B5GACXX:8:1107:11181:120725\t659\t17\t6945955\t60\t101M\t=\t6945789\t-266\tGGGCGCCGGGAGCAGNGAGGAGGCCCNNTTGCCGGTGAGCGCCAGCCCCACCGCCAAGACTCGACGGCGGGAGAAGTAACGCGAGAGGGTGCCTAGGGCGG\t;EEA=EB0+=.+\tAM:i:37\tNM:i:4\tSM:i:37\tXM:i:4\tXO:i:0\tXP:i:2\tMQ:i:60\tZQ:A:Q\tXT:A:U\n", "SN928_0068_BB022WACXX:1:2304:5861:103162\t16\t17\t6946136\t37\t42M\t*\t0\t0\tATTCCCAGCCCGGCNCTCCGCACCAGGCCCCCGCCTCGTTCG\t]]]]]]]]]]]]]]!]]]]]]]]]]]]]]]]]]]]]]]]]]]\tX0:i:1\tX1:i:0\tMD:Z:14T27\tXF:i:2\tRG:Z:L9198\tXG:i:0\tXI:Z:AGATGGN\tYI:Z:3I7AHD!\tXJ:Z:NNGGTNN\tYJ:Z:!!?@-!!\tNM:i:1\tXM:i:1\tXO:i:0\tXP:i:2\tXT:A:U\n", 
"SN928_0068_BB022WACXX:2:1206:11210:198703\t16\t17\t6946171\t37\t163M\t*\t0\t0\tTCGTTCGCTACCCCAGATCCCAACAAGCTCCTGTCACCTCCTTCACCCTGAATGACCCGGGCATCCCACTTCCCTCACCAGCGAGGAGGCCCAGGCCGAGGTAGAGATGCAGCNGACCGCTGGCGAAAGCCGAGAAGACGAAGCCCAGCGAGGCGAGGATGCC\t]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]!]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]\tX0:i:1\tX1:i:0\tMD:Z:113A2T42C3\tXF:i:2\tRG:Z:L9198\tXG:i:0\tXI:Z:AGATGGN\tYI:Z:6>6>D@!\tXJ:Z:GNGGNNN\tYJ:Z:)!:>!!!\tNM:i:3\tXM:i:3\tXO:i:0\tXP:i:4\tXT:A:U\n", "NIOBE_0139_A_D0B5GACXX:6:2102:12288:96559\t16\t17\t6946272\t37\t150M\t*\t0\t0\tNAGAGATGCAGCAGACCGCTGGCGAAAGCCGAGAAGACGAAGCCCAGCGAGGCGAGGATGCCCCCAACCATCACCACGGGGCGGGCCCCCCAGCGCGTGCTCAGGGCGCTGCCCACGGGGCCTGAAAGGGGGCGGAGTCAACGGAAGACA\t!9;568-.99998::67=5:97766:58688777978774<43566635JRUPPHPQQMGPOSTR]UQPWJSQRSLSUTLNNROLLJSVNORRPNNIIHLF9<<8?:;?>=9=<;<@?:<>==>A?=>>9:67=?<><6?;9=<8;<86:\tX0:i:1\tX1:i:0\tMD:Z:0T14T42C91\tXF:i:2\tRG:Z:L9105\tXG:i:0\tXI:Z:CCGGCGN\tYI:Z:;>56=8!\tNM:i:3\tXM:i:3\tXO:i:0\tXT:A:U\n", "NIOBE_0139_A_D0B5GACXX:8:1302:2685:131287\t16\t17\t6946275\t37\t124M\t*\t0\t0\tAGATGCAGCAGACNGCTGGCGAAAGCCGAGAAGACGAAGCCCAGCGAGGCGAGGATGCCCCCAACCATCACCACGGGGCGGGCCCCCCAGCGCGTGCTCAGGGCGCTGCCCACGGGGCCTGAAA\tILKKII>6GTKQO!SMO(LEKLS]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]S]]]]]]]]]]]]]]]]]]]]ZUQ]\\VRQ]Z]][VWSW\\]ZZ\tX0:i:1\tX1:i:0\tMD:Z:12T0C41C68\tXF:i:2\tRG:Z:L9105\tXG:i:0\tXI:Z:CCGGCGT\tYI:Z:@@1.>5/\tNM:i:3\tXM:i:3\tXO:i:0\tXP:i:2\tXT:A:U\n", "NIOBE_0139_A_D0B5GACXX:7:2203:1652:15044\t16\t17\t6946305\t37\t115M\t*\t0\t0\tNAGACGAAGCCCAGCGAGGCGAGGATGCCCCCAACCATCACCACGGGGCGGGCCCCCCAGCGCGTGCTCAGGGCGCTGCCCACGGGGCCTGAAAGGGGGCGGAGTCAACGGAAGA\t!98886309:<99;PWZTRXWUVPZYTSTUVY]ZW][XXTV[]ZWYSRXR+UXVIYU[T2XQWQRRTTW1NSRRPQPUTXUUWRXQRTQUQYRWSRNRTK,9@;?8@=:;<>.<>\tX0:i:1\tX1:i:0\tMD:Z:0A24C89\tXF:i:2\tRG:Z:L9105\tXG:i:0\tXI:Z:CCGGCGN\tYI:Z:;>.+>/!\tNM:i:2\tXM:i:2\tXO:i:0\tXT:A:U\n", 
"NIOBE_0139_A_D0B5GACXX:6:2101:10929:12034\t0\t17\t6946626\t37\t145M\t*\t0\t0\tCTCACTGGCTGCCTGCTGCACGGCCAGGGCCAGGGCGCTGATCCACGCAGTGTCCTGGGCGCTTCGGTCAAAGTGCTCGGCAAGGTCAGGGAAGGCAAGGCCCAGCGAGCGCAGCAGCCCGTAGGACAGCCCGTTTATCGCGAAN\t@A==@A?:@CA?CC?BEA>D@?B?AB>?@?CD?@A>AB@>AA@APRWSXYWRZVYXXXVQZW]\\VXXZSY5]WXZX]YYX]]][\\R]]]XRZ]Z\\Z]]VSS:::285:9:89::9<89689<=96=9<8;88;;9<;22887:;!\tX0:i:1\tX1:i:0\tMD:Z:144G0\tXF:i:2\tRG:Z:L9105\tXG:i:0\tXI:Z:CCGGCGN\tYI:Z::?:9@=!\tNM:i:1\tXM:i:1\tXO:i:0\tXT:A:U\n", "SN928_0068_BB022WACXX:4:2307:16755:9768\t16\t17\t6946688\t37\t88M\t*\t0\t0\tTTCGGTCAAAGTGCTCGGCAAGGTCAGGGAAGGCAAGGCCCAGCGAGCGCAGCAGCCCGTNGGACAGCCCGTTTATCGCGAAGGCTGC\t]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]!]]]]]]]]]]]]]]]]]]]]]]]]]]]\tX0:i:1\tX1:i:0\tMD:Z:60A27\tXF:i:2\tRG:Z:L9198\tXG:i:0\tXI:Z:AGATGGG\tYI:Z::D:?AC3\tXJ:Z:CNGGTNN\tYJ:Z:;!@@1!!\tNM:i:1\tXM:i:1\tXO:i:0\tXP:i:2\tXT:A:U\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "NIOBE_0139_A_D0B5GACXX:7:2102:12032:9259\t0\t17\t6946702\t37\t122M\t*\t0\t0\tTCGGCAAGGTCAGGGAAGGCAAGGCCCACCGAGCGCAGCAGCCCGTAGGACAGCCCGTTTATCGCGAAGGCTGCGGCCGCCACCACCCAGCCCCAGCCCCCATCCGGGGGTCCGGCGGGCTN\t8@@:?;=<>=@A@9<@B?@?BSVQLVW3*TVZYSQXXTUWTSZXV]ZYTUTVYSZYX]]]]]WYWXYTSRZWXUVWUXY\\[UYTRRZZ[[XYYW]YVVQRN<4:788867:59<129738:!\tX0:i:1\tX1:i:0\tMD:Z:28G92G0\tXF:i:2\tRG:Z:L9105\tXG:i:0\tXI:Z:CCGGCGN\tYI:Z:?@2,?2!\tNM:i:2\tXM:i:2\tXO:i:0\tXT:A:U\n", "SN928_0068_BB022WACXX:8:2204:19030:66280\t0\t17\t6946865\t37\t105M\t*\t0\t0\tAGNAGCCTCCACGCCTGTGCTTCCGCTGGGGAGCTGGCATCCCTGAGATCCAGCCTGTGGCTGCTCGCCCGGGGTGGGCCCGTCACTCCGAGCGCGATGGCGCGG\t;:!=9:=A?>UY[]]]]]]]]]]]]]]]]Z]]]\\\\]\\]]]]]]]]Z][]]]]]]]]]]]]]]]]Y]]]]]]\\]]]]]]]]]]\\]\\]]]]]Y]]]]<>:?;>?>::\tX0:i:1\tX1:i:0\tMD:Z:2A53C48\tXF:i:2\tRG:Z:L9198\tXG:i:0\tXI:Z:AGATGGG\tYI:Z::G;@FD5\tXJ:Z:CNGGTNN\tYJ:Z:+!AC/!!\tNM:i:2\tXM:i:2\tXO:i:0\tXT:A:U\n", 
"SN928_0068_BB022WACXX:6:1105:17159:36735\t0\t17\t6946880\t37\t104M\t*\t0\t0\tTGTGCTTCCGCTGGGGAGCTGGCATCCCTGAGATCCAGCCTGTGGCTGNTCGCCCGGGGTGGGCCCGTCACTCCGAGCGCGATGGCGCGGGGCGGAGGGAGCCG\tUQVWTZ[Z\\]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]!]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]]\\NZY\\TTXT\tX0:i:1\tX1:i:0\tMD:Z:41C6C55\tXF:i:2\tRG:Z:L9198\tXG:i:0\tXI:Z:AGATGGC\tYI:Z:9B8=BC;\tXJ:Z:CNGNNNC\tYJ:Z:8!\tNM:i:2\tXM:i:2\tXO:i:0\tXP:i:2\tXT:A:U\n" ] } ], "source": [ "samtools view /data/bam/workshop1.bam | awk '$10~/N/{print}'" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "Sequences aligning to each chromosome" ] }, { "cell_type": "code", "execution_count": 17, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ " 1265 17\n" ] } ], "source": [ "samtools view /data/bam/workshop1.bam | cut -f 3 | sort | uniq -c" ] }, { "cell_type": "code", "execution_count": 18, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ " 63 *\n", " 18651 1\n", " 10619 10\n", " 10647 11\n", " 10317 12\n", " 6713 13\n", " 7117 14\n", " 6806 15\n", " 7372 16\n", " 7164 17\n", " 5586 18\n", " 5461 19\n", " 18268 2\n", " 5222 20\n", " 2808 21\n", " 3448 22\n", " 14650 3\n", " 13618 4\n", " 13289 5\n", " 12701 6\n", " 12189 7\n", " 11467 8\n", " 9508 9\n", " 7 GL000191.1\n", " 38 GL000192.1\n", " 47 GL000193.1\n", " 41 GL000194.1\n", " 33 GL000195.1\n", " 2 GL000196.1\n", " 4 GL000197.1\n", " 6 GL000198.1\n", " 280 GL000199.1\n", " 8 GL000200.1\n", " 3 GL000201.1\n", " 3 GL000202.1\n", " 1 GL000203.1\n", " 3 GL000204.1\n", " 56 GL000205.1\n", " 1 GL000206.1\n", " 32 GL000208.1\n", " 9 GL000209.1\n", " 2 GL000210.1\n", " 14 GL000211.1\n", " 26 GL000212.1\n", " 3 GL000213.1\n", " 144 GL000214.1\n", " 7 GL000215.1\n", " 26 GL000216.1\n", " 19 GL000217.1\n", " 14 GL000218.1\n", " 31 GL000219.1\n", " 1019 GL000220.1\n", " 24 GL000221.1\n", " 9 GL000222.1\n", " 8 GL000223.1\n", " 110 GL000224.1\n", " 44 GL000225.1\n", " 465 
GL000226.1\n", " 3 GL000227.1\n", " 16 GL000228.1\n", " 7 GL000229.1\n", " 3 GL000230.1\n", " 4 GL000231.1\n", " 2 GL000232.1\n", " 9 GL000233.1\n", " 6 GL000234.1\n", " 4 GL000235.1\n", " 3 GL000236.1\n", " 8 GL000237.1\n", " 3 GL000238.1\n", " 8 GL000239.1\n", " 5 GL000240.1\n", " 3 GL000241.1\n", " 3 GL000242.1\n", " 8 GL000243.1\n", " 3 GL000244.1\n", " 5 GL000245.1\n", " 2 GL000246.1\n", " 8 GL000247.1\n", " 3 GL000248.1\n", " 3 GL000249.1\n", " 10595 hs37d5\n", " 962 MT\n", " 11694 X\n", " 399 Y\n" ] } ], "source": [ "samtools view /data/bam/workshop2.bam | cut -f 3 | sort | uniq -c " ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "-> similar number of alignments on X and 7, probably female" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "Average size of seqs, not paired end" ] }, { "cell_type": "code", "execution_count": 20, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "65.021\n" ] } ], "source": [ "samtools view -F 1 /data/bam/workshop1.bam | awk '{x=x+length($10)}END{print x/NR}'" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "GC and AT bases" ] }, { "cell_type": "code", "execution_count": 23, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "53226\n" ] } ], "source": [ "# number of CG\n", "samtools view /data/bam/workshop1.bam | tr -d 'ATN' | awk '{x=x+length($10)}END{print x}'" ] }, { "cell_type": "code", "execution_count": 22, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "29755\n" ] } ], "source": [ "# number of AT\n", "samtools view /data/bam/workshop1.bam | tr -d 'CGN' | awk '{x=x+length($10)}END{print x}'" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "Average Coverage on X and 7" ] }, { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "0.00376993\n" ] } ], "source": [ "samtools depth /data/bam/workshop2.bam
-a -r 7 | awk '{x+=$3}END{print x/NR}'" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "0.00373218\n" ] } ], "source": [ "samtools depth /data/bam/workshop2.bam -a -r X | awk '{x+=$3}END{print x/NR}'" ] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "34.3182\n" ] } ], "source": [ "samtools depth -a -r 17:6944949-6947242 /data/bam/workshop1.bam | awk '{x+=$3}END{print x/NR}'" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [] } ], "metadata": { "kernelspec": { "display_name": "Bash", "language": "bash", "name": "bash" }, "language_info": { "codemirror_mode": "shell", "file_extension": ".sh", "mimetype": "text/x-sh", "name": "bash" } }, "nbformat": 4, "nbformat_minor": 2 }