From ec69c27f70444440fdcd38a854e7739c4012d1fa Mon Sep 17 00:00:00 2001 From: anakin87 Date: Thu, 21 May 2026 09:58:54 +0200 Subject: [PATCH] tut 46: fix images download --- tutorials/46_Multimodal_RAG.ipynb | 41 ++++++++++++++----------------- 1 file changed, 18 insertions(+), 23 deletions(-) diff --git a/tutorials/46_Multimodal_RAG.ipynb b/tutorials/46_Multimodal_RAG.ipynb index 70145547..657c203b 100644 --- a/tutorials/46_Multimodal_RAG.ipynb +++ b/tutorials/46_Multimodal_RAG.ipynb @@ -130,26 +130,26 @@ "outputId": "08febdb6-3e36-4330-bed8-385710eb3339", "scrolled": true }, - "outputs": [ - { - "data": { - "text/plain": [ - "('capybara.jpg', )" - ] - }, - "execution_count": 3, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ - "from urllib.request import URLopener\n", + "import shutil\n", + "from urllib.request import Request, urlopen\n", + "\n", + "HEADERS = {\"User-Agent\": \"haystack-tutorials\"}\n", "\n", - "url_opener = URLopener()\n", - "url_opener.addheader(\"User-Agent\", \"Mozilla/5.0\")\n", + "def download_image(url, filename):\n", + " req = Request(url, headers=HEADERS)\n", + " with urlopen(req) as r, open(filename, \"wb\") as f:\n", + " shutil.copyfileobj(r, f)\n", "\n", - "url_opener.retrieve(\"https://upload.wikimedia.org/wikipedia/commons/2/26/Pink_Lady_Apple_%284107712628%29.jpg?download\", \"apple.jpg\")\n", - "url_opener.retrieve(\"https://upload.wikimedia.org/wikipedia/commons/thumb/e/e1/Cattle_tyrant_%28Machetornis_rixosa%29_on_Capybara.jpg/960px-Cattle_tyrant_%28Machetornis_rixosa%29_on_Capybara.jpg?download\", \"capybara.jpg\")" + "download_image(\n", + " \"https://upload.wikimedia.org/wikipedia/commons/2/26/Pink_Lady_Apple_%284107712628%29.jpg\",\n", + " \"apple.jpg\",\n", + ")\n", + "download_image(\n", + " \"https://upload.wikimedia.org/wikipedia/commons/thumb/e/e1/Cattle_tyrant_%28Machetornis_rixosa%29_on_Capybara.jpg/960px-Cattle_tyrant_%28Machetornis_rixosa%29_on_Capybara.jpg\",\n", + " \"capybara.jpg\",\n", + ")" ] }, { @@ -350,12 +350,7 @@ } ], "source": [ - "from urllib.request import URLopener\n", - "\n", - "url_opener = URLopener()\n", - "url_opener.addheader(\"User-Agent\", \"Mozilla/5.0\")\n", - "\n", - "url_opener.retrieve(\"https://arxiv.org/pdf/1706.03762\", \"attention_is_all_you_need.pdf\")" + "download_image(\"https://arxiv.org/pdf/1706.03762\", \"attention_is_all_you_need.pdf\")" ] }, {