test all good

master
Frans Masereel Centrum 1 year ago
parent f908e60804
commit b9f740f3f4

@ -2,7 +2,7 @@
"cells": [
{
"cell_type": "code",
"execution_count": 7,
"execution_count": 1,
"id": "bbf97edb-4082-49fd-9946-56aa3f3d0eb4",
"metadata": {},
"outputs": [],
@ -26,7 +26,7 @@
},
{
"cell_type": "code",
"execution_count": 8,
"execution_count": 16,
"id": "d53ab4b1-da92-4ae2-ae11-02fa2d8ffe7c",
"metadata": {},
"outputs": [],
@ -35,7 +35,7 @@
" dictionary = open('axios-example/pics.json',)\n",
" l = json.load(dictionary)\n",
" \n",
" cycles = 3\n",
" cycles = 10\n",
"\n",
" def scroll_to_end(wd):\n",
" wd.execute_script(\"window.scrollTo(0, document.body.scrollHeight);\")\n",
@ -82,7 +82,10 @@
"\n",
" # extract image url\n",
" actual_images = wd.find_elements(By.CLASS_NAME,'n3VNCb')\n",
" actual_image = actual_images[-1]\n",
" try:\n",
" actual_image = actual_images[-1]\n",
" except Exception:\n",
" continue\n",
" if actual_image.get_attribute('src') and 'http' in actual_image.get_attribute('src'):\n",
" image_urls.add(actual_image.get_attribute('src'))\n",
" linkPic = actual_image.get_attribute('src')\n",
@ -124,7 +127,7 @@
},
{
"cell_type": "code",
"execution_count": 9,
"execution_count": 17,
"id": "6de53389-ded8-47e2-b0aa-c132405a308f",
"metadata": {},
"outputs": [
@ -132,8 +135,8 @@
"name": "stdout",
"output_type": "stream",
"text": [
"Found: 267 search results. Extracting links from 0:267\n",
"Found: 200 image links, done!\n"
"Found: 281 search results. Extracting links from 0:281\n",
"Found: 260 image links, looking for more ...\n"
]
}
],
@ -150,7 +153,7 @@
" search_box = wd.find_element(By.CLASS_NAME,'gLFyf')\n",
" search_box.send_keys(query)\n",
" \n",
" links = harvesting(query,1000,wd)\n",
" links = harvesting(query,300,wd)\n",
" \n",
" wd.quit()"
]

File diff suppressed because one or more lines are too long

@ -39,8 +39,13 @@
<script>
// TODO: check higher quality pics
// TODO: automation scripts in parallel
// TODO: check array of links
// TODO: delete the entire JSON when it is recompiled
// TODO: test viewport to delete pictures dynamically
// TODO: automation scripts in parallel?
// TODO: last sentence on google image before credits
// TODO: credits at the end
var fetchInterval = 3200
@ -129,7 +134,7 @@
// 3D stuff
var numberOfItems = 800;
var numberOfItems = 280;
document.addEventListener("DOMContentLoaded", function() {
window.addEventListener("scroll", moveCamera);

Loading…
Cancel
Save