mathieu revised this gist . Go to revision
1 file changed, 176 insertions, 36 deletions
crawler_output
@@ -1,4 +1,8 @@ | |||
1 | - | https://brasseriebernard.com (has a restrictive robot.txt) | |
1 | + | Visiting: https://brasseriebernard.com | |
2 | + | Error when requesting https://brasseriebernard.com: [Errno 104] Connection reset by peer | |
3 | + | Error when making HEAD request to https://brasseriebernard.com: [Errno 104] Connection reset by peer | |
4 | + | ################################################################ | |
5 | + | https://brasseriebernard.com : | |
2 | 6 | ||
3 | 7 | {'html_static': set(), | |
4 | 8 | 'html_dynamic': {'https://brasseriebernard.com'}, | |
@@ -6,8 +10,64 @@ https://brasseriebernard.com (has a restrictive robot.txt) | |||
6 | 10 | 'images': set(), | |
7 | 11 | 'others': set(), | |
8 | 12 | 'external': set()} | |
13 | + | ################################################################ | |
9 | 14 | ||
10 | - | https://www.gibbys.com | |
15 | + | Visiting: https://www.gibbys.com | |
16 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2024/03/GB-BTL-vin_1920x1080-1280x720.jpg | |
17 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2024/03/GB-BTL-vin_1920x1080-1280x720.jpg (Content-Type: image/jpeg) | |
18 | + | Visiting: https://www.gibbys.com/menus | |
19 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_QUEUES-DE-HOMARD-1080x720.jpg | |
20 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_QUEUES-DE-HOMARD-1080x720.jpg (Content-Type: image/jpeg) | |
21 | + | Visiting: https://www.gibbys.com/gift-certificates | |
22 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Soir_St-Sauveur_WEB_en.pdf | |
23 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Soir_St-Sauveur_WEB_en.pdf (Content-Type: application/pdf) | |
24 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_FILET-MIGNON-KEBAB-1080x720.jpg | |
25 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_FILET-MIGNON-KEBAB-1080x720.jpg (Content-Type: image/jpeg) | |
26 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2024/12/GB-CarteBoire.pdf | |
27 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2024/12/GB-CarteBoire.pdf (Content-Type: application/pdf) | |
28 | + | Visiting: https://www.gibbys.com/contact | |
29 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_STEAK-1080x720.jpg | |
30 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_STEAK-1080x720.jpg (Content-Type: image/jpeg) | |
31 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_CREVETTES-SAUTEES-A-LAIL-1080x720.jpg | |
32 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_CREVETTES-SAUTEES-A-LAIL-1080x720.jpg (Content-Type: image/jpeg) | |
33 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2024/07/GB-MAJ-Always-On-07-480x720.jpg | |
34 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2024/07/GB-MAJ-Always-On-07-480x720.jpg (Content-Type: image/jpeg) | |
35 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2024/10/GB-CarteBoire_Octobre_2024.pdf | |
36 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2024/10/GB-CarteBoire_Octobre_2024.pdf (Content-Type: application/pdf) | |
37 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_ESCARGOTS-A-LA-BOURGUIGNONNE-1080x720.jpg | |
38 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_ESCARGOTS-A-LA-BOURGUIGNONNE-1080x720.jpg (Content-Type: image/jpeg) | |
39 | + | Visiting: https://www.gibbys.com/fr | |
40 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2019/06/gal3-1152x720.jpg | |
41 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2019/06/gal3-1152x720.jpg (Content-Type: image/jpeg) | |
42 | + | Visiting: https://www.gibbys.com/fr/evenements | |
43 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Groupe_DUO_EN.pdf | |
44 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Groupe_DUO_EN.pdf (Content-Type: application/pdf) | |
45 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_HUITRES-FRAICHES-1-1080x720.jpg | |
46 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_HUITRES-FRAICHES-1-1080x720.jpg (Content-Type: image/jpeg) | |
47 | + | Visiting: https://www.gibbys.com/fr/menus | |
48 | + | Visiting: https://www.gibbys.com/contactez-nous | |
49 | + | Visiting: https://www.gibbys.com/about | |
50 | + | Visiting: https://www.gibbys.com/events | |
51 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Soir_Vieux-Montreal_WEB_fr.pdf | |
52 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Soir_Vieux-Montreal_WEB_fr.pdf (Content-Type: application/pdf) | |
53 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2024/07/GB-MAJ-Always-On-12-565x720.jpg | |
54 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2024/07/GB-MAJ-Always-On-12-565x720.jpg (Content-Type: image/jpeg) | |
55 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_BOEUF-WELLINGTON-1080x720.jpg | |
56 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_BOEUF-WELLINGTON-1080x720.jpg (Content-Type: image/jpeg) | |
57 | + | Visiting: https://www.gibbys.com/2019/06/20/the-historical-site-old-montreal | |
58 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Soir_Vieux-Montreal_WEB_en.pdf | |
59 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Soir_Vieux-Montreal_WEB_en.pdf (Content-Type: application/pdf) | |
60 | + | Visiting: https://www.gibbys.com/fr/certificats-cadeaux | |
61 | + | Visiting: https://www.gibbys.com/fr/a-propos | |
62 | + | Visiting: https://www.gibbys.com/evenements | |
63 | + | Visiting: https://www.gibbys.com/fr/contactez-nous | |
64 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Groupe_DUO_FR.pdf | |
65 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Groupe_DUO_FR.pdf (Content-Type: application/pdf) | |
66 | + | Visiting: https://www.gibbys.com/2019/06/20/vieux-montreal-site-historique | |
67 | + | Visiting: https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Soir_St-Sauveur_WEB_fr.pdf | |
68 | + | Non-text content detected at https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Soir_St-Sauveur_WEB_fr.pdf (Content-Type: application/pdf) | |
69 | + | ################################################################ | |
70 | + | https://www.gibbys.com : | |
11 | 71 | ||
12 | 72 | {'html_static': set(), | |
13 | 73 | 'html_dynamic': {'https://www.gibbys.com', | |
@@ -59,8 +119,64 @@ https://www.gibbys.com | |||
59 | 119 | 'https://www.opentable.ca/r/gibbys-restaurant-reservations-montreal', | |
60 | 120 | 'https://www.opentable.ca/restref/client', | |
61 | 121 | 'https://www.tripadvisor.ca/Restaurant_Review-g155032-d704521-Reviews-Gibbys-Montreal_Quebec.html'}} | |
122 | + | ################################################################ | |
62 | 123 | ||
63 | - | https://lov.com | |
124 | + | Visiting: https://lov.com | |
125 | + | Visiting: https://lov.com/fr/philosophie | |
126 | + | Visiting: https://lov.com/fr/opentable-widget | |
127 | + | Visiting: https://lov.com/fr/nous-joindre | |
128 | + | Visiting: https://lov.com/fr | |
129 | + | Visiting: https://lov.com/en | |
130 | + | Visiting: https://lov.com/en/delivery-ubereats | |
131 | + | Visiting: https://lov.com/workspace/uploads/files/comptoir_menu-4_2.pdf | |
132 | + | Non-text content detected at https://lov.com/workspace/uploads/files/comptoir_menu-4_2.pdf (Content-Type: application/pdf) | |
133 | + | Visiting: https://lov.com/workspace/uploads/files/comptoir_menu-4_1.pdf | |
134 | + | Non-text content detected at https://lov.com/workspace/uploads/files/comptoir_menu-4_1.pdf (Content-Type: application/pdf) | |
135 | + | Visiting: https://lov.com/workspace/uploads/files/lov_brunch_en-_1.pdf | |
136 | + | Non-text content detected at https://lov.com/workspace/uploads/files/lov_brunch_en-_1.pdf (Content-Type: application/pdf) | |
137 | + | Visiting: https://lov.com/en/philosophie | |
138 | + | Visiting: https://lov.com/en/restaurants | |
139 | + | Visiting: https://lov.com/fr/nos-horaires | |
140 | + | Visiting: https://lov.com/workspace/uploads/files/comptoir_menu-4.pdf | |
141 | + | Non-text content detected at https://lov.com/workspace/uploads/files/comptoir_menu-4.pdf (Content-Type: application/pdf) | |
142 | + | Visiting: https://lov.com/workspace/uploads/files/lov_brunch_fr-_1.pdf | |
143 | + | Non-text content detected at https://lov.com/workspace/uploads/files/lov_brunch_fr-_1.pdf (Content-Type: application/pdf) | |
144 | + | Visiting: https://lov.com/cdn-cgi/l/email-protection | |
145 | + | Visiting: https://lov.com/workspace/uploads/files/comptoir_menu-4_3.pdf | |
146 | + | Non-text content detected at https://lov.com/workspace/uploads/files/comptoir_menu-4_3.pdf (Content-Type: application/pdf) | |
147 | + | Visiting: https://lov.com/workspace/uploads/files/lov-regu-soir-ang.pdf | |
148 | + | Non-text content detected at https://lov.com/workspace/uploads/files/lov-regu-soir-ang.pdf (Content-Type: application/pdf) | |
149 | + | Visiting: https://lov.com/en/restaurants/lov-dix30 | |
150 | + | Visiting: https://lov.com/en/contact-us | |
151 | + | Visiting: https://lov.com/fr/livraison-ubereats | |
152 | + | Visiting: https://lov.com/fr/restaurants/lov-dix30 | |
153 | + | Visiting: https://lov.com/en/opentable-widget | |
154 | + | Visiting: https://lov.com/en/careers | |
155 | + | Visiting: https://lov.com/fr/carrieres | |
156 | + | Visiting: https://lov.com/fr/reservation-groupe | |
157 | + | Visiting: https://lov.com/workspace/uploads/files/lov-regu-soir-fr.pdf | |
158 | + | Non-text content detected at https://lov.com/workspace/uploads/files/lov-regu-soir-fr.pdf (Content-Type: application/pdf) | |
159 | + | Visiting: https://lov.com/fr/restaurants | |
160 | + | Visiting: https://lov.com/en/opening-hours | |
161 | + | Visiting: https://lov.com/en/group-reservation | |
162 | + | Visiting: https://lov.com/en/restaurants/lov-mcgill | |
163 | + | Visiting: https://lov.com/fr/restaurants/lov-dix30/Menuprincipal-2020 | |
164 | + | Visiting: https://lov.com/fr/restaurants/lov-dix30/menu-breuvages-Automn-2020 | |
165 | + | Visiting: https://lov.com/en/restaurants/lov-dix30/Principalmenu-2020 | |
166 | + | Visiting: https://lov.com/fr/restaurants/lov-dix30/cocktails-bieres | |
167 | + | Visiting: https://lov.com/fr/restaurants/lov-mcgill | |
168 | + | Visiting: https://lov.com/fr/restaurants/lov-mcgill/menu-breuvages-Automn-2020 | |
169 | + | Visiting: https://lov.com/en/careers/www-lov-comcarriereskitchenmanager | |
170 | + | Visiting: https://lov.com/en/restaurants/lov-dix30/Menu-Beverages-Fall-2020 | |
171 | + | Visiting: https://lov.com/fr/carrieres/www-lov-comcarriereschefdecuisine | |
172 | + | Visiting: https://lov.com/en/restaurants/lov-mcgill/cocktails-beers | |
173 | + | Visiting: https://lov.com/en/restaurants/lov-mcgill/Menu-Beverages-Fall-2020 | |
174 | + | Visiting: https://lov.com/en/restaurants/lov-dix30/cocktails-beers | |
175 | + | Visiting: https://lov.com/en/restaurants/lov-mcgill/Principalmenu-2020 | |
176 | + | Visiting: https://lov.com/fr/restaurants/lov-mcgill/cocktails-bieres | |
177 | + | Visiting: https://lov.com/fr/restaurants/lov-mcgill/Menuprincipal-2020 | |
178 | + | ################################################################ | |
179 | + | https://lov.com : | |
64 | 180 | ||
65 | 181 | {'html_static': {'https://lov.com/cdn-cgi/l/email-protection', | |
66 | 182 | 'https://lov.com/en/opentable-widget', | |
@@ -68,17 +184,12 @@ https://lov.com | |||
68 | 184 | 'html_dynamic': {'https://lov.com', | |
69 | 185 | 'https://lov.com/en', | |
70 | 186 | 'https://lov.com/en/careers', | |
71 | - | 'https://lov.com/en/careers/httpslov-comencook', | |
72 | 187 | 'https://lov.com/en/careers/www-lov-comcarriereskitchenmanager', | |
73 | 188 | 'https://lov.com/en/contact-us', | |
74 | 189 | 'https://lov.com/en/group-reservation', | |
75 | 190 | 'https://lov.com/en/opening-hours', | |
76 | 191 | 'https://lov.com/en/philosophie', | |
77 | 192 | 'https://lov.com/en/restaurants', | |
78 | - | 'https://lov.com/en/restaurants/lov-centropolis', | |
79 | - | 'https://lov.com/en/restaurants/lov-centropolis/Menu-Beverages-Fall-2020', | |
80 | - | 'https://lov.com/en/restaurants/lov-centropolis/Principalmenu-2020', | |
81 | - | 'https://lov.com/en/restaurants/lov-centropolis/cocktails-beers', | |
82 | 193 | 'https://lov.com/en/restaurants/lov-dix30', | |
83 | 194 | 'https://lov.com/en/restaurants/lov-dix30/Menu-Beverages-Fall-2020', | |
84 | 195 | 'https://lov.com/en/restaurants/lov-dix30/Principalmenu-2020', | |
@@ -90,16 +201,11 @@ https://lov.com | |||
90 | 201 | 'https://lov.com/fr', | |
91 | 202 | 'https://lov.com/fr/carrieres', | |
92 | 203 | 'https://lov.com/fr/carrieres/www-lov-comcarriereschefdecuisine', | |
93 | - | 'https://lov.com/fr/carrieres/www-lov-comcarrierescuisinier', | |
94 | 204 | 'https://lov.com/fr/nos-horaires', | |
95 | 205 | 'https://lov.com/fr/nous-joindre', | |
96 | 206 | 'https://lov.com/fr/philosophie', | |
97 | 207 | 'https://lov.com/fr/reservation-groupe', | |
98 | 208 | 'https://lov.com/fr/restaurants', | |
99 | - | 'https://lov.com/fr/restaurants/lov-centropolis', | |
100 | - | 'https://lov.com/fr/restaurants/lov-centropolis/Menuprincipal-2020', | |
101 | - | 'https://lov.com/fr/restaurants/lov-centropolis/cocktails-bieres', | |
102 | - | 'https://lov.com/fr/restaurants/lov-centropolis/menu-breuvages-Automn-2020', | |
103 | 209 | 'https://lov.com/fr/restaurants/lov-dix30', | |
104 | 210 | 'https://lov.com/fr/restaurants/lov-dix30/Menuprincipal-2020', | |
105 | 211 | 'https://lov.com/fr/restaurants/lov-dix30/cocktails-bieres', | |
@@ -124,7 +230,6 @@ https://lov.com | |||
124 | 230 | 'https://+15797218304', | |
125 | 231 | 'https://438-580-9409', | |
126 | 232 | 'https://bit.ly/2Oju9gR', | |
127 | - | 'https://bit.ly/3krKE59', | |
128 | 233 | 'https://bit.ly/3l2UKtl', | |
129 | 234 | 'https://bit.ly/3mnVFpX', | |
130 | 235 | 'https://boutique.lov.com', | |
@@ -150,8 +255,28 @@ https://lov.com | |||
150 | 255 | 'https://www.instagram.com/lovrestaurant', | |
151 | 256 | 'https://www.opentable.ca/restaurant/profile/1040107/reserve', | |
152 | 257 | 'https://www.opentable.ca/restaurant/profile/343654/reserve'}} | |
258 | + | ################################################################ | |
153 | 259 | ||
154 | - | https://www.mikadomontreal.com | |
260 | + | Visiting: https://www.mikadomontreal.com | |
261 | + | Visiting: https://www.mikadomontreal.com/contact | |
262 | + | Visiting: https://www.mikadomontreal.com/fr/contact | |
263 | + | Visiting: https://www.mikadomontreal.com/about | |
264 | + | Visiting: https://www.mikadomontreal.com/menu_group.pdf | |
265 | + | Non-text content detected at https://www.mikadomontreal.com/menu_group.pdf (Content-Type: application/pdf) | |
266 | + | Visiting: https://www.mikadomontreal.com/fr/menu_group.pdf | |
267 | + | Non-text content detected at https://www.mikadomontreal.com/fr/menu_group.pdf (Content-Type: application/pdf) | |
268 | + | Visiting: https://www.mikadomontreal.com/fr/about | |
269 | + | Visiting: https://www.mikadomontreal.com/catering | |
270 | + | Visiting: https://www.mikadomontreal.com/menu_alcohol.pdf | |
271 | + | Non-text content detected at https://www.mikadomontreal.com/menu_alcohol.pdf (Content-Type: application/pdf) | |
272 | + | Visiting: https://www.mikadomontreal.com/menu_main.pdf | |
273 | + | Non-text content detected at https://www.mikadomontreal.com/menu_main.pdf (Content-Type: application/pdf) | |
274 | + | Visiting: https://www.mikadomontreal.com/menu_lunch.pdf | |
275 | + | Non-text content detected at https://www.mikadomontreal.com/menu_lunch.pdf (Content-Type: application/pdf) | |
276 | + | Visiting: https://www.mikadomontreal.com/fr | |
277 | + | Visiting: https://www.mikadomontreal.com/fr/catering | |
278 | + | ################################################################ | |
279 | + | https://www.mikadomontreal.com : | |
155 | 280 | ||
156 | 281 | {'html_static': set(), | |
157 | 282 | 'html_dynamic': {'https://www.mikadomontreal.com', | |
@@ -179,30 +304,33 @@ https://www.mikadomontreal.com | |||
179 | 304 | 'https://www.grafikadesigns.com', | |
180 | 305 | 'https://www.grafikadesigns.com/fr', | |
181 | 306 | 'https://www.instagram.com/restaurant.mikado'}} | |
307 | + | ################################################################ | |
182 | 308 | ||
183 | - | https://montrealcrepes.com | |
309 | + | Visiting: https://montrealcrepes.com | |
310 | + | Error when requesting https://montrealcrepes.com: | |
311 | + | Error processing https://montrealcrepes.com: Page.goto: net::ERR_CONNECTION_CLOSED at https://montrealcrepes.com/ | |
312 | + | Call log: | |
313 | + | - navigating to "https://montrealcrepes.com/", waiting until "domcontentloaded" | |
314 | + | ||
315 | + | ################################################################ | |
316 | + | https://montrealcrepes.com : | |
184 | 317 | ||
185 | 318 | {'html_static': set(), | |
186 | - | 'html_dynamic': {'https://montrealcrepes.com', | |
187 | - | 'https://montrealcrepes.com/accueil', | |
188 | - | 'https://montrealcrepes.com/crêpes', | |
189 | - | 'https://montrealcrepes.com/english', | |
190 | - | 'https://montrealcrepes.com/raviolis', | |
191 | - | 'https://montrealcrepes.com/à-côtés'}, | |
319 | + | 'html_dynamic': set(), | |
192 | 320 | 'pdf': set(), | |
193 | 321 | 'images': set(), | |
194 | - | 'others': set(), | |
195 | - | 'external': {'https://5143127284', | |
196 | - | 'https://policies.google.com/privacy', | |
197 | - | 'https://policies.google.com/terms', | |
198 | - | 'https://www.facebook.com/200839793745148', | |
199 | - | 'https://www.foodbooking.com/widget', | |
200 | - | 'https://www.instagram.com/montrealcrepes', | |
201 | - | 'https://www.yelp.com/biz/0zabNTBrOgQLy0hYsi1Tpg', | |
202 | - | 'https://www.youtube.com/channel/UCztYxakyqq1LYkpoiL9iPWA'}} | |
203 | - | ||
322 | + | 'others': {'https://montrealcrepes.com'}, | |
323 | + | 'external': set()} | |
324 | + | ################################################################ | |
204 | 325 | ||
205 | - | https://seasaltmtl.com | |
326 | + | Visiting: https://seasaltmtl.com | |
327 | + | Visiting: https://seasaltmtl.com/contact-us | |
328 | + | Visiting: https://seasaltmtl.com/fr/contact-us | |
329 | + | Visiting: https://seasaltmtl.com/wp-content/uploads/2024/11/Menu-Seasalt-11-11-2024.pdf | |
330 | + | Non-text content detected at https://seasaltmtl.com/wp-content/uploads/2024/11/Menu-Seasalt-11-11-2024.pdf (Content-Type: application/pdf) | |
331 | + | Visiting: https://seasaltmtl.com/fr | |
332 | + | ################################################################ | |
333 | + | https://seasaltmtl.com : | |
206 | 334 | ||
207 | 335 | {'html_static': set(), | |
208 | 336 | 'html_dynamic': {'https://seasaltmtl.com', | |
@@ -222,8 +350,13 @@ https://seasaltmtl.com | |||
222 | 350 | 'https://www.doordash.com/store/seasalt-mtl-montréal-28475004', | |
223 | 351 | 'https://www.google.com/maps/dir//seasalt+montreal/data=!4m6!4m5!1m1!4e2!1m2!1m1!1s0x4cc91bdf26d2e5c1:0x6958914ec0545214', | |
224 | 352 | 'https://www.opentable.com/restref/client'}} | |
353 | + | ################################################################ | |
225 | 354 | ||
226 | - | https://www.venicemtl.com | |
355 | + | Visiting: https://www.venicemtl.com | |
356 | + | Visiting: https://www.venicemtl.com/english-1 | |
357 | + | Visiting: https://www.venicemtl.com/francais | |
358 | + | ################################################################ | |
359 | + | https://www.venicemtl.com : | |
227 | 360 | ||
228 | 361 | {'html_static': set(), | |
229 | 362 | 'html_dynamic': {'https://www.venicemtl.com', | |
@@ -236,8 +369,15 @@ https://www.venicemtl.com | |||
236 | 369 | 'https://www.facebook.com/venicemtl', | |
237 | 370 | 'https://www.instagram.com/venicemtl', | |
238 | 371 | 'https://www.linkedin.com/company/venice-mtl'}} | |
372 | + | ################################################################ | |
239 | 373 | ||
240 | - | https://leclubchasseetpeche.com | |
374 | + | Visiting: https://leclubchasseetpeche.com | |
375 | + | Visiting: https://leclubchasseetpeche.com/map | |
376 | + | Visiting: https://leclubchasseetpeche.com/wp-content/uploads/2024/08/CCeP_Vins_Juin_2024.pdf | |
377 | + | Non-text content detected at https://leclubchasseetpeche.com/wp-content/uploads/2024/08/CCeP_Vins_Juin_2024.pdf (Content-Type: application/pdf) | |
378 | + | Visiting: https://leclubchasseetpeche.com/index.php/home-en | |
379 | + | ################################################################ | |
380 | + | https://leclubchasseetpeche.com : | |
241 | 381 | ||
242 | 382 | {'html_static': set(), | |
243 | 383 | 'html_dynamic': {'https://leclubchasseetpeche.com', | |
@@ -259,4 +399,4 @@ https://leclubchasseetpeche.com | |||
259 | 399 | 'https://www.mapbox.com/about/maps', | |
260 | 400 | 'https://www.mapbox.com/contribute', | |
261 | 401 | 'https://www.openstreetmap.org/about'}} | |
262 | - | ||
402 | + | ################################################################ |
mathieu revised this gist . Go to revision
No changes
mathieu revised this gist . Go to revision
1 file changed, 0 insertions, 0 deletions
crawler_output.py renamed to crawler_output
File renamed without changes
mathieu revised this gist . Go to revision
1 file changed, 0 insertions, 0 deletions
crawler_output.json renamed to crawler_output.py
File renamed without changes
mathieu revised this gist . Go to revision
1 file changed, 0 insertions, 0 deletions
crawler_output.log renamed to crawler_output.json
File renamed without changes
mathieu revised this gist . Go to revision
1 file changed, 262 insertions
crawler_output.log(file created)
@@ -0,0 +1,262 @@ | |||
1 | + | https://brasseriebernard.com (has a restrictive robot.txt) | |
2 | + | ||
3 | + | {'html_static': set(), | |
4 | + | 'html_dynamic': {'https://brasseriebernard.com'}, | |
5 | + | 'pdf': set(), | |
6 | + | 'images': set(), | |
7 | + | 'others': set(), | |
8 | + | 'external': set()} | |
9 | + | ||
10 | + | https://www.gibbys.com | |
11 | + | ||
12 | + | {'html_static': set(), | |
13 | + | 'html_dynamic': {'https://www.gibbys.com', | |
14 | + | 'https://www.gibbys.com/about', | |
15 | + | 'https://www.gibbys.com/contact', | |
16 | + | 'https://www.gibbys.com/contactez-nous', | |
17 | + | 'https://www.gibbys.com/evenements', | |
18 | + | 'https://www.gibbys.com/events', | |
19 | + | 'https://www.gibbys.com/fr', | |
20 | + | 'https://www.gibbys.com/fr/a-propos', | |
21 | + | 'https://www.gibbys.com/fr/certificats-cadeaux', | |
22 | + | 'https://www.gibbys.com/fr/contactez-nous', | |
23 | + | 'https://www.gibbys.com/fr/evenements', | |
24 | + | 'https://www.gibbys.com/fr/menus', | |
25 | + | 'https://www.gibbys.com/gift-certificates', | |
26 | + | 'https://www.gibbys.com/menus'}, | |
27 | + | 'pdf': {'https://www.gibbys.com/wp-content/uploads/2024/10/GB-CarteBoire_Octobre_2024.pdf', | |
28 | + | 'https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Groupe_DUO_EN.pdf', | |
29 | + | 'https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Groupe_DUO_FR.pdf', | |
30 | + | 'https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Soir_St-Sauveur_WEB_en.pdf', | |
31 | + | 'https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Soir_St-Sauveur_WEB_fr.pdf', | |
32 | + | 'https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Soir_Vieux-Montreal_WEB_en.pdf', | |
33 | + | 'https://www.gibbys.com/wp-content/uploads/2024/10/GB-Menu_Soir_Vieux-Montreal_WEB_fr.pdf', | |
34 | + | 'https://www.gibbys.com/wp-content/uploads/2024/12/GB-CarteBoire.pdf'}, | |
35 | + | 'images': {'https://www.gibbys.com/wp-content/uploads/2019/06/gal3-1152x720.jpg', | |
36 | + | 'https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_BOEUF-WELLINGTON-1080x720.jpg', | |
37 | + | 'https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_CREVETTES-SAUTEES-A-LAIL-1080x720.jpg', | |
38 | + | 'https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_ESCARGOTS-A-LA-BOURGUIGNONNE-1080x720.jpg', | |
39 | + | 'https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_FILET-MIGNON-KEBAB-1080x720.jpg', | |
40 | + | 'https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_HUITRES-FRAICHES-1-1080x720.jpg', | |
41 | + | 'https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_QUEUES-DE-HOMARD-1080x720.jpg', | |
42 | + | 'https://www.gibbys.com/wp-content/uploads/2023/10/GIBBYS_STEAK-1080x720.jpg', | |
43 | + | 'https://www.gibbys.com/wp-content/uploads/2024/03/GB-BTL-vin_1920x1080-1280x720.jpg', | |
44 | + | 'https://www.gibbys.com/wp-content/uploads/2024/07/GB-MAJ-Always-On-07-480x720.jpg', | |
45 | + | 'https://www.gibbys.com/wp-content/uploads/2024/07/GB-MAJ-Always-On-12-565x720.jpg'}, | |
46 | + | 'others': {'https://www.gibbys.com/2019/06/20/the-historical-site-old-montreal', | |
47 | + | 'https://www.gibbys.com/2019/06/20/vieux-montreal-site-historique'}, | |
48 | + | 'external': {'https://4502272623', | |
49 | + | 'https://514-282-1837', | |
50 | + | 'https://5142821837', | |
51 | + | 'https://foursquare.com/v/gibbys/4ad4c06af964a520f6f820e3', | |
52 | + | 'https://gibbys.verifiervotresolde.com/en/login', | |
53 | + | 'https://gibbys.verifiervotresolde.com/fr/login', | |
54 | + | 'https://info@gibbys.com', | |
55 | + | 'https://mincmagic.com', | |
56 | + | 'https://twitter.com/GibbysMontreal', | |
57 | + | 'https://www.facebook.com/GibbysRestaurant', | |
58 | + | 'https://www.instagram.com/gibbysrestaurant', | |
59 | + | 'https://www.opentable.ca/r/gibbys-restaurant-reservations-montreal', | |
60 | + | 'https://www.opentable.ca/restref/client', | |
61 | + | 'https://www.tripadvisor.ca/Restaurant_Review-g155032-d704521-Reviews-Gibbys-Montreal_Quebec.html'}} | |
62 | + | ||
63 | + | https://lov.com | |
64 | + | ||
65 | + | {'html_static': {'https://lov.com/cdn-cgi/l/email-protection', | |
66 | + | 'https://lov.com/en/opentable-widget', | |
67 | + | 'https://lov.com/fr/opentable-widget'}, | |
68 | + | 'html_dynamic': {'https://lov.com', | |
69 | + | 'https://lov.com/en', | |
70 | + | 'https://lov.com/en/careers', | |
71 | + | 'https://lov.com/en/careers/httpslov-comencook', | |
72 | + | 'https://lov.com/en/careers/www-lov-comcarriereskitchenmanager', | |
73 | + | 'https://lov.com/en/contact-us', | |
74 | + | 'https://lov.com/en/group-reservation', | |
75 | + | 'https://lov.com/en/opening-hours', | |
76 | + | 'https://lov.com/en/philosophie', | |
77 | + | 'https://lov.com/en/restaurants', | |
78 | + | 'https://lov.com/en/restaurants/lov-centropolis', | |
79 | + | 'https://lov.com/en/restaurants/lov-centropolis/Menu-Beverages-Fall-2020', | |
80 | + | 'https://lov.com/en/restaurants/lov-centropolis/Principalmenu-2020', | |
81 | + | 'https://lov.com/en/restaurants/lov-centropolis/cocktails-beers', | |
82 | + | 'https://lov.com/en/restaurants/lov-dix30', | |
83 | + | 'https://lov.com/en/restaurants/lov-dix30/Menu-Beverages-Fall-2020', | |
84 | + | 'https://lov.com/en/restaurants/lov-dix30/Principalmenu-2020', | |
85 | + | 'https://lov.com/en/restaurants/lov-dix30/cocktails-beers', | |
86 | + | 'https://lov.com/en/restaurants/lov-mcgill', | |
87 | + | 'https://lov.com/en/restaurants/lov-mcgill/Menu-Beverages-Fall-2020', | |
88 | + | 'https://lov.com/en/restaurants/lov-mcgill/Principalmenu-2020', | |
89 | + | 'https://lov.com/en/restaurants/lov-mcgill/cocktails-beers', | |
90 | + | 'https://lov.com/fr', | |
91 | + | 'https://lov.com/fr/carrieres', | |
92 | + | 'https://lov.com/fr/carrieres/www-lov-comcarriereschefdecuisine', | |
93 | + | 'https://lov.com/fr/carrieres/www-lov-comcarrierescuisinier', | |
94 | + | 'https://lov.com/fr/nos-horaires', | |
95 | + | 'https://lov.com/fr/nous-joindre', | |
96 | + | 'https://lov.com/fr/philosophie', | |
97 | + | 'https://lov.com/fr/reservation-groupe', | |
98 | + | 'https://lov.com/fr/restaurants', | |
99 | + | 'https://lov.com/fr/restaurants/lov-centropolis', | |
100 | + | 'https://lov.com/fr/restaurants/lov-centropolis/Menuprincipal-2020', | |
101 | + | 'https://lov.com/fr/restaurants/lov-centropolis/cocktails-bieres', | |
102 | + | 'https://lov.com/fr/restaurants/lov-centropolis/menu-breuvages-Automn-2020', | |
103 | + | 'https://lov.com/fr/restaurants/lov-dix30', | |
104 | + | 'https://lov.com/fr/restaurants/lov-dix30/Menuprincipal-2020', | |
105 | + | 'https://lov.com/fr/restaurants/lov-dix30/cocktails-bieres', | |
106 | + | 'https://lov.com/fr/restaurants/lov-dix30/menu-breuvages-Automn-2020', | |
107 | + | 'https://lov.com/fr/restaurants/lov-mcgill', | |
108 | + | 'https://lov.com/fr/restaurants/lov-mcgill/Menuprincipal-2020', | |
109 | + | 'https://lov.com/fr/restaurants/lov-mcgill/cocktails-bieres', | |
110 | + | 'https://lov.com/fr/restaurants/lov-mcgill/menu-breuvages-Automn-2020'}, | |
111 | + | 'pdf': {'https://lov.com/workspace/uploads/files/comptoir_menu-4.pdf', | |
112 | + | 'https://lov.com/workspace/uploads/files/comptoir_menu-4_1.pdf', | |
113 | + | 'https://lov.com/workspace/uploads/files/comptoir_menu-4_2.pdf', | |
114 | + | 'https://lov.com/workspace/uploads/files/comptoir_menu-4_3.pdf', | |
115 | + | 'https://lov.com/workspace/uploads/files/lov-regu-soir-ang.pdf', | |
116 | + | 'https://lov.com/workspace/uploads/files/lov-regu-soir-fr.pdf', | |
117 | + | 'https://lov.com/workspace/uploads/files/lov_brunch_en-_1.pdf', | |
118 | + | 'https://lov.com/workspace/uploads/files/lov_brunch_fr-_1.pdf'}, | |
119 | + | 'images': set(), | |
120 | + | 'others': {'https://lov.com/en/delivery-ubereats', | |
121 | + | 'https://lov.com/fr/livraison-ubereats'}, | |
122 | + | 'external': {'https://+14507208338', | |
123 | + | 'https://+15142871155', | |
124 | + | 'https://+15797218304', | |
125 | + | 'https://438-580-9409', | |
126 | + | 'https://bit.ly/2Oju9gR', | |
127 | + | 'https://bit.ly/3krKE59', | |
128 | + | 'https://bit.ly/3l2UKtl', | |
129 | + | 'https://bit.ly/3mnVFpX', | |
130 | + | 'https://boutique.lov.com', | |
131 | + | 'https://boutique.lov.com/en', | |
132 | + | 'https://boutique.lov.com/en/home', | |
133 | + | 'https://google.com/maps', | |
134 | + | 'https://instagram.com/lovrestaurant', | |
135 | + | 'https://lesglaceurs.ca/collections/collection-gateaux-veganes', | |
136 | + | 'https://lesglaceurs.ca/collections/collection-vegane', | |
137 | + | 'https://lesglaceurs.ca/en/collections/collection-gateaux-veganes', | |
138 | + | 'https://party-expert.com', | |
139 | + | 'https://party-expert.com/fr', | |
140 | + | 'https://policies.google.com/privacy', | |
141 | + | 'https://policies.google.com/terms', | |
142 | + | 'https://restaurantguru.com', | |
143 | + | 'https://restaurantguru.com/Lov-Toronto', | |
144 | + | 'https://support.cloudflare.com/hc/en-us/articles/200170016-What-is-Email-Address-Obfuscation-', | |
145 | + | 'https://support.cloudflare.com/hc/en-us/categories/200275218-Getting-Started', | |
146 | + | 'https://web.ishopfood.com', | |
147 | + | 'https://www.cloudflare.com/5xx-error-landing', | |
148 | + | 'https://www.cloudflare.com/sign-up', | |
149 | + | 'https://www.facebook.com/LOVRestaurant', | |
150 | + | 'https://www.instagram.com/lovrestaurant', | |
151 | + | 'https://www.opentable.ca/restaurant/profile/1040107/reserve', | |
152 | + | 'https://www.opentable.ca/restaurant/profile/343654/reserve'}} | |
153 | + | ||
154 | + | https://www.mikadomontreal.com | |
155 | + | ||
156 | + | {'html_static': set(), | |
157 | + | 'html_dynamic': {'https://www.mikadomontreal.com', | |
158 | + | 'https://www.mikadomontreal.com/about', | |
159 | + | 'https://www.mikadomontreal.com/catering', | |
160 | + | 'https://www.mikadomontreal.com/contact', | |
161 | + | 'https://www.mikadomontreal.com/fr', | |
162 | + | 'https://www.mikadomontreal.com/fr/about', | |
163 | + | 'https://www.mikadomontreal.com/fr/catering', | |
164 | + | 'https://www.mikadomontreal.com/fr/contact'}, | |
165 | + | 'pdf': {'https://www.mikadomontreal.com/fr/menu_group.pdf', | |
166 | + | 'https://www.mikadomontreal.com/menu_alcohol.pdf', | |
167 | + | 'https://www.mikadomontreal.com/menu_group.pdf', | |
168 | + | 'https://www.mikadomontreal.com/menu_lunch.pdf', | |
169 | + | 'https://www.mikadomontreal.com/menu_main.pdf'}, | |
170 | + | 'images': set(), | |
171 | + | 'others': set(), | |
172 | + | 'external': {'https://514-279-4809', | |
173 | + | 'https://info@mikadomontreal.com', | |
174 | + | "https://jQuery('", | |
175 | + | 'https://mikado.order-online.ai/en', | |
176 | + | 'https://mikado.order-online.ai/fr', | |
177 | + | "https://showPopup('https://www.tbdine.com/book/restaurant/mikado-laurier", | |
178 | + | 'https://www.facebook.com/restaurantmikadolaurier', | |
179 | + | 'https://www.grafikadesigns.com', | |
180 | + | 'https://www.grafikadesigns.com/fr', | |
181 | + | 'https://www.instagram.com/restaurant.mikado'}} | |
182 | + | ||
183 | + | https://montrealcrepes.com | |
184 | + | ||
185 | + | {'html_static': set(), | |
186 | + | 'html_dynamic': {'https://montrealcrepes.com', | |
187 | + | 'https://montrealcrepes.com/accueil', | |
188 | + | 'https://montrealcrepes.com/crêpes', | |
189 | + | 'https://montrealcrepes.com/english', | |
190 | + | 'https://montrealcrepes.com/raviolis', | |
191 | + | 'https://montrealcrepes.com/à-côtés'}, | |
192 | + | 'pdf': set(), | |
193 | + | 'images': set(), | |
194 | + | 'others': set(), | |
195 | + | 'external': {'https://5143127284', | |
196 | + | 'https://policies.google.com/privacy', | |
197 | + | 'https://policies.google.com/terms', | |
198 | + | 'https://www.facebook.com/200839793745148', | |
199 | + | 'https://www.foodbooking.com/widget', | |
200 | + | 'https://www.instagram.com/montrealcrepes', | |
201 | + | 'https://www.yelp.com/biz/0zabNTBrOgQLy0hYsi1Tpg', | |
202 | + | 'https://www.youtube.com/channel/UCztYxakyqq1LYkpoiL9iPWA'}} | |
203 | + | ||
204 | + | ||
205 | + | https://seasaltmtl.com | |
206 | + | ||
207 | + | {'html_static': set(), | |
208 | + | 'html_dynamic': {'https://seasaltmtl.com', | |
209 | + | 'https://seasaltmtl.com/contact-us', | |
210 | + | 'https://seasaltmtl.com/fr', | |
211 | + | 'https://seasaltmtl.com/fr/contact-us'}, | |
212 | + | 'pdf': {'https://seasaltmtl.com/wp-content/uploads/2024/11/Menu-Seasalt-11-11-2024.pdf'}, | |
213 | + | 'images': set(), | |
214 | + | 'others': set(), | |
215 | + | 'external': {'https://5149376555', | |
216 | + | 'https://booking.libroreserve.com/25e5903ae79aa5a/QC015756480354', | |
217 | + | 'https://booking.libroreserve.com/25e5903ae79aa5a/QC015756480354/seat', | |
218 | + | 'https://carmahospitality.checkyourcardbalance.com/en/login', | |
219 | + | 'https://carmahospitality.checkyourcardbalance.com/fr/login', | |
220 | + | 'https://resy.com/cities/montreal-qc/venues/seasalt', | |
221 | + | 'https://void(0)', | |
222 | + | 'https://www.doordash.com/store/seasalt-mtl-montréal-28475004', | |
223 | + | 'https://www.google.com/maps/dir//seasalt+montreal/data=!4m6!4m5!1m1!4e2!1m2!1m1!1s0x4cc91bdf26d2e5c1:0x6958914ec0545214', | |
224 | + | 'https://www.opentable.com/restref/client'}} | |
225 | + | ||
226 | + | https://www.venicemtl.com | |
227 | + | ||
228 | + | {'html_static': set(), | |
229 | + | 'html_dynamic': {'https://www.venicemtl.com', | |
230 | + | 'https://www.venicemtl.com/english-1', | |
231 | + | 'https://www.venicemtl.com/francais'}, | |
232 | + | 'pdf': set(), | |
233 | + | 'images': set(), | |
234 | + | 'others': set(), | |
235 | + | 'external': {'https://resa.venicemtl@gmail.com', | |
236 | + | 'https://www.facebook.com/venicemtl', | |
237 | + | 'https://www.instagram.com/venicemtl', | |
238 | + | 'https://www.linkedin.com/company/venice-mtl'}} | |
239 | + | ||
240 | + | https://leclubchasseetpeche.com | |
241 | + | ||
242 | + | {'html_static': set(), | |
243 | + | 'html_dynamic': {'https://leclubchasseetpeche.com', | |
244 | + | 'https://leclubchasseetpeche.com/index.php/home-en', | |
245 | + | 'https://leclubchasseetpeche.com/map'}, | |
246 | + | 'pdf': {'https://leclubchasseetpeche.com/wp-content/uploads/2024/08/CCeP_Vins_Juin_2024.pdf'}, | |
247 | + | 'images': set(), | |
248 | + | 'others': set(), | |
249 | + | 'external': {'https://helen@leclubchasseetpeche.com', | |
250 | + | 'https://latableronde.ca', | |
251 | + | 'https://maps.google.com', | |
252 | + | 'https://tooly.ca', | |
253 | + | 'https://trifectamtl.com/products/certificat-cadeau-restaurant-le-club-chasse-et-peche', | |
254 | + | 'https://www.facebook.com/leclubchasseetpeche', | |
255 | + | 'https://www.instagram.com/leclubchasseetpeche', | |
256 | + | 'https://www.leclubchasseetpeche.com/carte', | |
257 | + | 'https://www.lefilet.ca', | |
258 | + | 'https://www.leserpent.ca', | |
259 | + | 'https://www.mapbox.com/about/maps', | |
260 | + | 'https://www.mapbox.com/contribute', | |
261 | + | 'https://www.openstreetmap.org/about'}} | |
262 | + |