{ "cells": [ { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [], "source": [ "import pandas as pd" ] }, { "cell_type": "code", "execution_count": 12, "metadata": {}, "outputs": [], "source": [ "# Load the tab-separated table, skipping the file's first line and\n", "# applying our own column labels instead of inferring them from the file.\n", "res = pd.read_csv(\n", "    \"species_cranky_wozniak\",\n", "    sep=\"\\t\",\n", "    skiprows=1,\n", "    header=None,\n", "    names=[\"taxid\", \"rank\", \"taxpath\", \"taxpathsn\", \"percentage\"],\n", ")" ] }, { "cell_type": "code", "execution_count": 13, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | taxid | \n", "rank | \n", "taxpath | \n", "taxpathsn | \n", "percentage | \n", "
---|---|---|---|---|---|
0 | \n", "56636 | \n", "species | \n", "2157|28889|183924|114380|2272|56635|56636 | \n", "Archaea|Crenarchaeota|Thermoprotei|Desulfuroco... | \n", "0.0 | \n", "
1 | \n", "477693 | \n", "species | \n", "2157|28889|183924|114380|2272|2273|477693 | \n", "Archaea|Crenarchaeota|Thermoprotei|Desulfuroco... | \n", "0.0 | \n", "
2 | \n", "160233 | \n", "species | \n", "2157|28889|183924|114380|2272|54258|160233 | \n", "Archaea|Crenarchaeota|Thermoprotei|Desulfuroco... | \n", "0.0 | \n", "
3 | \n", "54248 | \n", "species | \n", "2157|28889|183924|114380|2307|54247|54248 | \n", "Archaea|Crenarchaeota|Thermoprotei|Desulfuroco... | \n", "0.0 | \n", "
4 | \n", "2285 | \n", "species | \n", "2157|28889|183924|2281|118883|2284|2285 | \n", "Archaea|Crenarchaeota|Thermoprotei|Sulfolobale... | \n", "0.0 | \n", "
\n", " | taxid | \n", "rank | \n", "taxpath | \n", "taxpathsn | \n", "percentage | \n", "
---|---|---|---|---|---|
0 | \n", "10 | \n", "genus | \n", "2|1224|1236|72274|135621|10 | \n", "Bacteria|Proteobacteria|Gammaproteobacteria|Ps... | \n", "0.010060 | \n", "
1 | \n", "100715 | \n", "genus | \n", "2|1090|191410|191411|191412|100715 | \n", "Bacteria|Chlorobi|Chlorobia|Chlorobiales|Chlor... | \n", "0.000000 | \n", "
2 | \n", "100883 | \n", "genus | \n", "2|1239|526524|526525|128827|100883 | \n", "Bacteria|Firmicutes|Erysipelotrichia|Erysipelo... | \n", "0.000000 | \n", "
3 | \n", "1016 | \n", "genus | \n", "2|976|117743|200644|49546|1016 | \n", "Bacteria|Bacteroidetes|Flavobacteriia|Flavobac... | \n", "0.000000 | \n", "
4 | \n", "1021 | \n", "genus | \n", "2|1224|1236|72273|135617|1021 | \n", "Bacteria|Proteobacteria|Gammaproteobacteria|Th... | \n", "0.000000 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
1033 | \n", "97050 | \n", "genus | \n", "2|1224|28211|204455|31989|97050 | \n", "Bacteria|Proteobacteria|Alphaproteobacteria|Rh... | \n", "0.191146 | \n", "
1034 | \n", "972 | \n", "family | \n", "2|1239|186801|53433|972 | \n", "Bacteria|Firmicutes|Clostridia|Halanaerobiales... | \n", "0.010060 | \n", "
1035 | \n", "976 | \n", "phylum | \n", "2|976 | \n", "Bacteria|Bacteroidetes | \n", "2.263578 | \n", "
1036 | \n", "978 | \n", "genus | \n", "2|976|768503|768507|89373|978 | \n", "Bacteria|Bacteroidetes|Cytophagia|Cytophagales... | \n", "0.010060 | \n", "
1037 | \n", "995019 | \n", "family | \n", "2|1224|28216|80840|995019 | \n", "Bacteria|Proteobacteria|Betaproteobacteria|Bur... | \n", "0.010060 | \n", "
1038 rows × 5 columns
\n", "