From 807bf3f0dadafd35b05ac1429748d3a959ba9ca2 Mon Sep 17 00:00:00 2001
From: Swastik Mishra <swastik.mishra@hhu.de>
Date: Wed, 25 Dec 2024 00:09:32 +0000
Subject: [PATCH] Update readme

---
 README.md                           |  2 ++
 notebooks/01-01_download_data.ipynb | 14 +++++++-------
 2 files changed, 9 insertions(+), 7 deletions(-)

diff --git a/README.md b/README.md
index 114d5df..a8f6acd 100644
--- a/README.md
+++ b/README.md
@@ -20,3 +20,5 @@ The only other file you need to install is `xlsx2csv` using `pip`:
 ```
 pip install xlsx2csv
 ```
+
+Additionally, I used `ripgrep` (`rg`) instead of `grep` for faster extraction of subset data from EggNOG. If you rely on `grep` instead, edit the notebooks accordingly by replacing the `rg` commands with their `grep` equivalents.
diff --git a/notebooks/01-01_download_data.ipynb b/notebooks/01-01_download_data.ipynb
index 265a725..9e6f784 100644
--- a/notebooks/01-01_download_data.ipynb
+++ b/notebooks/01-01_download_data.ipynb
@@ -9,8 +9,10 @@
    ]
   },
   {
-   "cell_type": "raw",
+   "cell_type": "code",
+   "execution_count": null,
    "metadata": {},
+   "outputs": [],
    "source": [
     "e6_url = \"http://eggnog6.embl.de/download/eggnog_6.0/\"\n",
     "all_trees_path = e6_url + \"e6.all_raw_trees_and_algs.tsv\"\n",
@@ -38,12 +40,10 @@
    ]
   },
   {
-   "cell_type": "raw",
-   "metadata": {
-    "vscode": {
-     "languageId": "raw"
-    }
-   },
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
    "source": [
     "%%bash -s \"$data_dir\" \"$all_trees_path\" \"$og2seqs_species_path\" \"$seq2ogs_path\" \"$gold_url\"\n",
     "pip install xlsx2csv\n",
-- 
GitLab