{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "### Archiving of Ostrea lurida (Olympia oyster) genome data from BGI" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "##### Print system info" ] }, { "cell_type": "code", "execution_count": 1, "metadata": { "collapsed": false }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Software:\n", "\n", " System Software Overview:\n", "\n", " System Version: Mac OS X 10.7.5 (11G63)\n", " Kernel Version: Darwin 11.4.2\n", " Boot Volume: SSD2\n", " Boot Mode: Normal\n", " Computer Name: greenbird (2)\n", " User Name: Sam (Sam)\n", " Secure Virtual Memory: Enabled\n", " 64-bit Kernel and Extensions: No\n", " Time since boot: 6 days 22:35\n", "\n" ] } ], "source": [ "%%bash\n", "system_profiler SPSoftwareDataType" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "##### List of files from BGI" ] }, { "cell_type": "code", "execution_count": 2, "metadata": { "collapsed": false }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "151114_I191_FCH3Y35BCXX_L1_wHAIPI023992-37_1.fq.gz\n", "151114_I191_FCH3Y35BCXX_L1_wHAIPI023992-37_2.fq.gz\n", "151114_I191_FCH3Y35BCXX_L2_wHAMPI023991-66_1.fq.gz\n", "151114_I191_FCH3Y35BCXX_L2_wHAMPI023991-66_2.fq.gz\n", "151118_I137_FCH3KNJBBXX_L5_wHAXPI023905-96_1.fq.gz\n", "151118_I137_FCH3KNJBBXX_L5_wHAXPI023905-96_2.fq.gz\n", "160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCABDLAAPEI-62_1.fq.gz\n", "160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCABDLAAPEI-62_2.fq.gz\n", "160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCACDTAAPEI-75_1.fq.gz\n", "160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCACDTAAPEI-75_2.fq.gz\n", "160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCABDLAAPEI-62_1.fq.gz\n", "160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCABDLAAPEI-62_2.fq.gz\n", "160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCACDTAAPEI-75_1.fq.gz\n", "160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCACDTAAPEI-75_2.fq.gz\n", "160103_I137_FCH3V5YBBXX_L5_WHOSTibkDCAADWAAPEI-74_1.fq.gz\n", "160103_I137_FCH3V5YBBXX_L5_WHOSTibkDCAADWAAPEI-74_2.fq.gz\n", "160103_I137_FCH3V5YBBXX_L6_WHOSTibkDCAADWAAPEI-74_1.fq.gz\n", "160103_I137_FCH3V5YBBXX_L6_WHOSTibkDCAADWAAPEI-74_2.fq.gz\n", "md5.txt\n" ] } ], "source": [ "%%bash\n", "ls /Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "##### Generate checksums file to verify downloaded data remained intact." ] }, { "cell_type": "code", "execution_count": 3, "metadata": { "collapsed": false }, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "\n", "real\t54m34.245s\n", "user\t2m45.154s\n", "sys\t4m33.476s\n" ] } ], "source": [ "%%bash\n", "\n", "#For loop generates a md5 checksum has value for each file\n", "#and appends the output to the checksums.md5 file.\n", "time for file in /Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/*.gz\n", " do\n", " md5 \"$file\" >> /Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/checksums.md5\n", " done" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "##### View checksums.md5 file" ] }, { "cell_type": "code", "execution_count": 4, "metadata": { "collapsed": false }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/151114_I191_FCH3Y35BCXX_L1_wHAIPI023992-37_1.fq.gz) = 810d188468dbd8bb36b2af3bf3b9fee6\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/151114_I191_FCH3Y35BCXX_L1_wHAIPI023992-37_2.fq.gz) = cf92b18e0815dc0471d61f9107142257\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/151114_I191_FCH3Y35BCXX_L2_wHAMPI023991-66_1.fq.gz) = 3dc2137d7df0af8d6a007516908361a3\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/151114_I191_FCH3Y35BCXX_L2_wHAMPI023991-66_2.fq.gz) = 8bc0d7c7a7af3954baca31a4a7fe9f2b\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/151118_I137_FCH3KNJBBXX_L5_wHAXPI023905-96_1.fq.gz) = 08cfdc6fdc5a6190cb05cdcb81fa5b9c\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/151118_I137_FCH3KNJBBXX_L5_wHAXPI023905-96_2.fq.gz) = a503043167457337a65d51151ceb5dd0\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCABDLAAPEI-62_1.fq.gz) = a0c0177a7a4a4ca28c37bd3802361564\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCABDLAAPEI-62_2.fq.gz) = 74e51d608de7a409a29545a95ac3ec14\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCACDTAAPEI-75_1.fq.gz) = e829da6f7e7a047586802a05d3b96d18\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCACDTAAPEI-75_2.fq.gz) = 74953d0143c392f111eec178667d3fcd\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCABDLAAPEI-62_1.fq.gz) = 9b5f7c1593f216f710814c299738493f\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCABDLAAPEI-62_2.fq.gz) = 5a6392d9c23aa85d170d7f50de4f0b54\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCACDTAAPEI-75_1.fq.gz) = 2cf349b55558e7424fa0ed029ae0bfca\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCACDTAAPEI-75_2.fq.gz) = 5cb745671596d5d5d307986d35ea9792\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L5_WHOSTibkDCAADWAAPEI-74_1.fq.gz) = b371a3b3588060bb2200f5caaf9a9d5c\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L5_WHOSTibkDCAADWAAPEI-74_2.fq.gz) = dd8b0fef21fc5e330d08ae4a48c8d67b\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L6_WHOSTibkDCAADWAAPEI-74_1.fq.gz) = 50b5dbff9426738005b81efd49d66329\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L6_WHOSTibkDCAADWAAPEI-74_2.fq.gz) = 29be6e734ad65c180aee23d1514c5c35\r\n" ] } ], "source": [ "cat /Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/checksums.md5" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "##### View md5.txt file from BGI" ] }, { "cell_type": "code", "execution_count": 5, "metadata": { "collapsed": false }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "810d188468dbd8bb36b2af3bf3b9fee6 151114_I191_FCH3Y35BCXX_L1_wHAIPI023992-37_1.fq.gz\r\n", "cf92b18e0815dc0471d61f9107142257 151114_I191_FCH3Y35BCXX_L1_wHAIPI023992-37_2.fq.gz\r\n", "3dc2137d7df0af8d6a007516908361a3 151114_I191_FCH3Y35BCXX_L2_wHAMPI023991-66_1.fq.gz\r\n", "8bc0d7c7a7af3954baca31a4a7fe9f2b 151114_I191_FCH3Y35BCXX_L2_wHAMPI023991-66_2.fq.gz\r\n", "08cfdc6fdc5a6190cb05cdcb81fa5b9c 151118_I137_FCH3KNJBBXX_L5_wHAXPI023905-96_1.fq.gz\r\n", "a503043167457337a65d51151ceb5dd0 151118_I137_FCH3KNJBBXX_L5_wHAXPI023905-96_2.fq.gz\r\n", "a0c0177a7a4a4ca28c37bd3802361564 160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCABDLAAPEI-62_1.fq.gz\r\n", "74e51d608de7a409a29545a95ac3ec14 160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCABDLAAPEI-62_2.fq.gz\r\n", "e829da6f7e7a047586802a05d3b96d18 160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCACDTAAPEI-75_1.fq.gz\r\n", "74953d0143c392f111eec178667d3fcd 160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCACDTAAPEI-75_2.fq.gz\r\n", "9b5f7c1593f216f710814c299738493f 160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCABDLAAPEI-62_1.fq.gz\r\n", "5a6392d9c23aa85d170d7f50de4f0b54 160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCABDLAAPEI-62_2.fq.gz\r\n", "2cf349b55558e7424fa0ed029ae0bfca 160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCACDTAAPEI-75_1.fq.gz\r\n", "5cb745671596d5d5d307986d35ea9792 160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCACDTAAPEI-75_2.fq.gz\r\n", "b371a3b3588060bb2200f5caaf9a9d5c 160103_I137_FCH3V5YBBXX_L5_WHOSTibkDCAADWAAPEI-74_1.fq.gz\r\n", "dd8b0fef21fc5e330d08ae4a48c8d67b 160103_I137_FCH3V5YBBXX_L5_WHOSTibkDCAADWAAPEI-74_2.fq.gz\r\n", "50b5dbff9426738005b81efd49d66329 160103_I137_FCH3V5YBBXX_L6_WHOSTibkDCAADWAAPEI-74_1.fq.gz\r\n", "29be6e734ad65c180aee23d1514c5c35 160103_I137_FCH3V5YBBXX_L6_WHOSTibkDCAADWAAPEI-74_2.fq.gz\r\n" ] } ], "source": [ "cat /Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/md5.txt" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "##### Save hash values from checksums.md5 and md5.txt to variables. Compare hash values from each to ensure they match (i.e. downloaded data is intact)." ] }, { "cell_type": "code", "execution_count": 17, "metadata": { "collapsed": false }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "4e95a487fd10e60ea5af7b62287f88a0 ce78b1856aa612473de14a9599d0c4ff a21f45349c1ebae6f8723d07613189cb 23fcb4cda2aba74e97644a8cfac46a59 4b6225d3d0280fc9bf4161c6f86b5586 b9f80f96fda43362da9ee08aced56bef b0dfe5ea6ded0272024d97bdc387f0d0 4d6dcf410e7a110d94fca646dff07ea7 146fcf32aac04eecc41671389e37ae61 62017aeb0276b3da77a4b014255a1bf8 efcefa598dfc9230aa2f5b4d787388ee 0d3fabf04fc56e6249378fcddc286f06 c2f4fa5c539cc028e4afdfd7765416ca 4a8fa8aee94bccf81e6f600b63935242 666f18e9cf0ba248e41bc089736932bb e73619c9bff1dbc816b6b17ca16518b1 46f6762bafdeec810c12496c43f0c85c 1da60e5843632956234b0a4cf10427f5\n", "\n", "4e95a487fd10e60ea5af7b62287f88a0 ce78b1856aa612473de14a9599d0c4ff a21f45349c1ebae6f8723d07613189cb 23fcb4cda2aba74e97644a8cfac46a59 4b6225d3d0280fc9bf4161c6f86b5586 b9f80f96fda43362da9ee08aced56bef b0dfe5ea6ded0272024d97bdc387f0d0 4d6dcf410e7a110d94fca646dff07ea7 146fcf32aac04eecc41671389e37ae61 62017aeb0276b3da77a4b014255a1bf8 efcefa598dfc9230aa2f5b4d787388ee 0d3fabf04fc56e6249378fcddc286f06 c2f4fa5c539cc028e4afdfd7765416ca 4a8fa8aee94bccf81e6f600b63935242 666f18e9cf0ba248e41bc089736932bb e73619c9bff1dbc816b6b17ca16518b1 46f6762bafdeec810c12496c43f0c85c 1da60e5843632956234b0a4cf10427f5\n", "\n", "0\n" ] } ], "source": [ "%%bash\n", "\n", "#Use awk to print the 4th field (the checksum hash values) and saves the values to the new_checksums variable.\n", "new_checksums=$( awk '{print $4}' /Volumes/owl_home/F15FTSUSAT0328_PANwalD/checksums.md5 )\n", "\n", "#Use awk to print the 1st field (the checksum hash values) and saves the values to the original_checksums variable.\n", "original_checksums=$( awk '{print $1}' /Volumes/owl_home/F15FTSUSAT0328_PANwalD/md5.txt)\n", "\n", "#Print contents of new_checksums variable to verify the contents.\n", "echo $new_checksums\n", "\n", "#Print an empty line for improved readibility in the output.\n", "echo \"\"\n", "\n", "#Print contents of original_checksums variable to verify the contents.\n", "echo $original_checksums\n", "\n", "#Prints an empty line for improved readibility in the output.\n", "echo \"\"\n", "\n", "\n", "#Compare differences between the checksum hash values in each of the two variables.\n", "#Uses the bash concept of process substitution \"<(\" to accomplish task using variable contents instead of two files.\n", "diff <(echo \"$new_checksums\") <(echo \"$original_checksums\")\n", "\n", "#Check exit status of last command executed (i.e. if diff command found no differences, then the output should be 0)\n", "echo $?" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "##### Calculate total number of reads generated by this project" ] }, { "cell_type": "code", "execution_count": 14, "metadata": { "collapsed": false }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "1225964680\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "\n", "real\t79m17.932s\n", "user\t36m45.185s\n", "sys\t6m51.916s\n" ] } ], "source": [ "%%bash\n", "\n", "totalreads=0#Initializes variable.\n", "\n", "#For loop counts the lines in each file and divides them by four. This is performed because\n", "#Illumina sequencing files are composed of four lines per read.\n", "#A running total of the total number of reads is generated [totalreads=$((readcount+totalreads))]\n", "#and is printed after the for loop completes.\n", "time for file in /Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/*.gz\n", " do linecount=`gunzip -c \"$file\" | wc -l`\n", " readcount=$((linecount/4))\n", " totalreads=$((readcount+totalreads))\n", "done\n", "echo $totalreads" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "##### Calculate number of reads per file and append filename and corresponding number of reads to readme file" ] }, { "cell_type": "code", "execution_count": 1, "metadata": { "collapsed": false }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "151114_I191_FCH3Y35BCXX_L1_wHAIPI023992-37_1.fq.gz\t61253141\n", "\n", "151114_I191_FCH3Y35BCXX_L1_wHAIPI023992-37_2.fq.gz\t61253141\n", "\n", "151114_I191_FCH3Y35BCXX_L2_wHAMPI023991-66_1.fq.gz\t58755925\n", "\n", "151114_I191_FCH3Y35BCXX_L2_wHAMPI023991-66_2.fq.gz\t53307837\n", "\n", "151118_I137_FCH3KNJBBXX_L5_wHAXPI023905-96_1.fq.gz\t27731148\n", "\n", "151118_I137_FCH3KNJBBXX_L5_wHAXPI023905-96_2.fq.gz\t43938762\n", "\n", "160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCABDLAAPEI-62_1.fq.gz\t87198584\n", "\n", "160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCABDLAAPEI-62_2.fq.gz\t87198584\n", "\n", "160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCACDTAAPEI-75_1.fq.gz\t43766527\n", "\n", "160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCACDTAAPEI-75_2.fq.gz\t43766527\n", "\n", "160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCABDLAAPEI-62_1.fq.gz\t87135961\n", "\n", "160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCABDLAAPEI-62_2.fq.gz\t87135961\n", "\n", "160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCACDTAAPEI-75_1.fq.gz\t43138844\n", "\n", "160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCACDTAAPEI-75_2.fq.gz\t43138844\n", "\n", "160103_I137_FCH3V5YBBXX_L5_WHOSTibkDCAADWAAPEI-74_1.fq.gz\t95270180\n", "\n", "160103_I137_FCH3V5YBBXX_L5_WHOSTibkDCAADWAAPEI-74_2.fq.gz\t95270180\n", "\n", "160103_I137_FCH3V5YBBXX_L6_WHOSTibkDCAADWAAPEI-74_1.fq.gz\t92524416\n", "\n", "160103_I137_FCH3V5YBBXX_L6_WHOSTibkDCAADWAAPEI-74_2.fq.gz\t92524416\n", "\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "gunzip: /Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/151114_I191_FCH3Y35BCXX_L2_wHAMPI023991-66_2.fq.gz: unexpected end of file\n", "gunzip: /Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/151114_I191_FCH3Y35BCXX_L2_wHAMPI023991-66_2.fq.gz: uncompress failed\n", "gunzip: data stream error\n", "gunzip: /Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/151118_I137_FCH3KNJBBXX_L5_wHAXPI023905-96_1.fq.gz: uncompress failed\n", "\n", "real\t57m35.277s\n", "user\t31m3.366s\n", "sys\t4m2.700s\n" ] } ], "source": [ "%%bash\n", "\n", "#For loop counts the lines in each file and divides them by four. This is performed because\n", "#Illumina sequencing files are composed of four lines per read.\n", "#Format the output (printf) to print the filename, followed by a tab, followed by the readcount.\n", "#The command \"tee -a\" is used to both print the output to the screen and append the output to the readme.md file.\n", "time for file in /Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/*.gz\n", " do linecount=`gunzip -c \"$file\" | wc -l`\n", " readcount=$(($linecount/4))\n", " printf \"%s\\t%s\\n\\n\" \"${file##*/}\" \"$readcount\" | tee -a /Volumes/owl_web/nightingales/O_lurida/readme.md\n", "done" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "##### Move .gz files to web accessible location on Owl" ] }, { "cell_type": "code", "execution_count": 20, "metadata": { "collapsed": false }, "outputs": [], "source": [ "%%bash\n", "\n", "mv -n /Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/*.gz /Volumes/owl_web/nightingales/O_lurida/" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "##### List files in Owl/web/nightingales/O_lurida" ] }, { "cell_type": "code", "execution_count": 26, "metadata": { "collapsed": false }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ " 6.6G Jan 25 01:59 151114_I191_FCH3Y35BCXX_L1_wHAIPI023992-37_1.fq.gz\n", " 6.8G Jan 25 02:12 151114_I191_FCH3Y35BCXX_L1_wHAIPI023992-37_2.fq.gz\n", " 6.5G Jan 25 02:16 151114_I191_FCH3Y35BCXX_L2_wHAMPI023991-66_1.fq.gz\n", " 6.1G Jan 27 12:52 151114_I191_FCH3Y35BCXX_L2_wHAMPI023991-66_2.fq.gz\n", " 2.4G Jan 27 12:59 151118_I137_FCH3KNJBBXX_L5_wHAXPI023905-96_1.fq.gz\n", " 4.0G Jan 25 02:06 151118_I137_FCH3KNJBBXX_L5_wHAXPI023905-96_2.fq.gz\n", " 2.4G Jan 25 02:14 160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCABDLAAPEI-62_1.fq.gz\n", " 2.7G Jan 25 02:39 160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCABDLAAPEI-62_2.fq.gz\n", " 1.3G Jan 25 02:14 160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCACDTAAPEI-75_1.fq.gz\n", " 1.4G Jan 25 02:20 160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCACDTAAPEI-75_2.fq.gz\n", " 2.4G Jan 25 02:19 160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCABDLAAPEI-62_1.fq.gz\n", " 2.7G Jan 25 02:36 160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCABDLAAPEI-62_2.fq.gz\n", " 1.3G Jan 25 02:21 160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCACDTAAPEI-75_1.fq.gz\n", " 1.4G Jan 25 02:25 160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCACDTAAPEI-75_2.fq.gz\n", " 2.7G Jan 25 02:29 160103_I137_FCH3V5YBBXX_L5_WHOSTibkDCAADWAAPEI-74_1.fq.gz\n", " 3.0G Jan 25 02:30 160103_I137_FCH3V5YBBXX_L5_WHOSTibkDCAADWAAPEI-74_2.fq.gz\n", " 2.5G Jan 25 02:41 160103_I137_FCH3V5YBBXX_L6_WHOSTibkDCAADWAAPEI-74_1.fq.gz\n", " 2.9G Jan 25 02:35 160103_I137_FCH3V5YBBXX_L6_WHOSTibkDCAADWAAPEI-74_2.fq.gz\n" ] } ], "source": [ "%%bash\n", "\n", "#List the files from this project (grep FCH3*), showing human-readable file sizes,\n", "#and get rid of file permission info in output (cut -d ' ' -f7)\n", "ls -lh /Volumes/owl_web/nightingales/O_lurida/ | grep 'FCH3*' | cut -d ' ' -f7-" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "##### Append new checksums to existing checksums file in Owl/web/nightingales/O_lurida" ] }, { "cell_type": "code", "execution_count": 23, "metadata": { "collapsed": false }, "outputs": [], "source": [ "%%bash\n", "\n", "cat /Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/checksums.md5 >> /Volumes/owl_web/nightingales/O_lurida/checksums.md5" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "##### Verify checksums were added to Owl/web/nightingales/O_lurida/checksums.md5" ] }, { "cell_type": "code", "execution_count": 24, "metadata": { "collapsed": false }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/151114_I191_FCH3Y35BCXX_L1_wHAIPI023992-37_1.fq.gz) = 810d188468dbd8bb36b2af3bf3b9fee6\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/151114_I191_FCH3Y35BCXX_L1_wHAIPI023992-37_2.fq.gz) = cf92b18e0815dc0471d61f9107142257\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/151114_I191_FCH3Y35BCXX_L2_wHAMPI023991-66_1.fq.gz) = 3dc2137d7df0af8d6a007516908361a3\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/151114_I191_FCH3Y35BCXX_L2_wHAMPI023991-66_2.fq.gz) = 8bc0d7c7a7af3954baca31a4a7fe9f2b\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/151118_I137_FCH3KNJBBXX_L5_wHAXPI023905-96_1.fq.gz) = 08cfdc6fdc5a6190cb05cdcb81fa5b9c\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/151118_I137_FCH3KNJBBXX_L5_wHAXPI023905-96_2.fq.gz) = a503043167457337a65d51151ceb5dd0\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCABDLAAPEI-62_1.fq.gz) = a0c0177a7a4a4ca28c37bd3802361564\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCABDLAAPEI-62_2.fq.gz) = 74e51d608de7a409a29545a95ac3ec14\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCACDTAAPEI-75_1.fq.gz) = e829da6f7e7a047586802a05d3b96d18\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L3_WHOSTibkDCACDTAAPEI-75_2.fq.gz) = 74953d0143c392f111eec178667d3fcd\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCABDLAAPEI-62_1.fq.gz) = 9b5f7c1593f216f710814c299738493f\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCABDLAAPEI-62_2.fq.gz) = 5a6392d9c23aa85d170d7f50de4f0b54\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCACDTAAPEI-75_1.fq.gz) = 2cf349b55558e7424fa0ed029ae0bfca\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L4_WHOSTibkDCACDTAAPEI-75_2.fq.gz) = 5cb745671596d5d5d307986d35ea9792\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L5_WHOSTibkDCAADWAAPEI-74_1.fq.gz) = b371a3b3588060bb2200f5caaf9a9d5c\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L5_WHOSTibkDCAADWAAPEI-74_2.fq.gz) = dd8b0fef21fc5e330d08ae4a48c8d67b\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L6_WHOSTibkDCAADWAAPEI-74_1.fq.gz) = 50b5dbff9426738005b81efd49d66329\r\n", "MD5 (/Volumes/owl_home/O_lurida_BGI_F15FTSUSAT0327_OSTibkD/160103_I137_FCH3V5YBBXX_L6_WHOSTibkDCAADWAAPEI-74_2.fq.gz) = 29be6e734ad65c180aee23d1514c5c35\r\n" ] } ], "source": [ "%%bash\n", "\n", "cat /Volumes/owl_web/nightingales/O_lurida/checksums.md5 | grep 'FCH3*'" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "collapsed": true }, "outputs": [], "source": [] } ], "metadata": { "kernelspec": { "display_name": "Python 2", "language": "python", "name": "python2" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 2 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython2", "version": "2.7.9" } }, "nbformat": 4, "nbformat_minor": 0 }