From c33f2ad04667fd21fce6ec8eefa3694e2209a852 Mon Sep 17 00:00:00 2001 From: Niko <nikolaos.papadopoulos@univie.ac.at> Date: Wed, 27 Nov 2024 20:45:06 +0100 Subject: [PATCH] now running on cluster --- 08-submission/gff-02-functional_annot.ipynb | 29 ++++++++------------- 1 file changed, 11 insertions(+), 18 deletions(-) diff --git a/08-submission/gff-02-functional_annot.ipynb b/08-submission/gff-02-functional_annot.ipynb index 1ab90de..c26e7eb 100644 --- a/08-submission/gff-02-functional_annot.ipynb +++ b/08-submission/gff-02-functional_annot.ipynb @@ -14,7 +14,7 @@ "metadata": {}, "outputs": [], "source": [ - "from tqdm import tqdm\n", + "# from tqdm import tqdm # install it for nice progress bars\n", "\n", "import pandas as pd" ] @@ -118,11 +118,11 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 6, "metadata": {}, "outputs": [], "source": [ - "best_per_gene = '/Users/npapadop/Documents/data/pycnogonum/draft/out.emapper.best.annotations'\n", + "best_per_gene = '/lisc/scratch/zoology/pycnogonum/genome/draft/annot_merge/emapper/out.emapper.best.annotations'\n", "emapper = pd.read_csv(best_per_gene, sep='\\t', header=0)\n", "\n", "emapper['gene'] = emapper['#query'].apply(parse_gene_id)\n", @@ -148,26 +148,19 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 7, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "100%|██████████| 779251/779251 [00:04<00:00, 183551.40it/s]\n" - ] - } - ], + "outputs": [], "source": [ - "gff_loc = '/Volumes/scratch/pycnogonum/genome/submission/merged_sorted.gff3'\n", - "named_loc = '/Volumes/scratch/pycnogonum/genome/submission/merged_sorted_named.gff3'\n", + "gff_loc = '/lisc/scratch/zoology/pycnogonum/genome/submission/merged_sorted.gff3'\n", + "named_loc = '/lisc/scratch/zoology/pycnogonum/genome/submission/merged_sorted_named.gff3'\n", "\n", "with open(gff_loc, 'r') as gff:\n", " with open(named_loc, 'w') as named:\n", " gene = ''\n", " mRNA = ''\n", - " for line in tqdm(gff.readlines()):\n", + " # for line in tqdm(gff.readlines()):\n", + " for line in gff.readlines():\n", " line = line.strip()\n", " conditions_skip = line.startswith('#') or 'tRNA' in line or 'name=' in line\n", " if not conditions_skip:\n", @@ -190,7 +183,7 @@ ], "metadata": { "kernelspec": { - "display_name": "ascc24", + "display_name": "jupyterhub-5.1.0", "language": "python", "name": "python3" }, @@ -204,7 +197,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.9.19" + "version": "3.12.4" } }, "nbformat": 4, -- GitLab