From 098bc159cb2c268f9daec7f2fe6aa4ec95721c91 Mon Sep 17 00:00:00 2001 From: Yohann Dedy Date: Thu, 10 May 2018 19:31:59 +0200 Subject: [PATCH] Premier commit --- CinemScraper/__init__.py | 0 CinemScraper/__init__.pyc | Bin 0 -> 142 bytes CinemScraper/items.py | 14 ++++ CinemScraper/middlewares.py | 103 +++++++++++++++++++++++++ CinemScraper/pipelines.py | 11 +++ CinemScraper/settings.py | 90 +++++++++++++++++++++ CinemScraper/settings.pyc | Bin 0 -> 341 bytes CinemScraper/spiders/__init__.py | 4 + CinemScraper/spiders/__init__.pyc | Bin 0 -> 150 bytes CinemScraper/spiders/grabVideoData.py | 20 +++++ CinemScraper/spiders/grabVideoData.pyc | Bin 0 -> 1144 bytes CinemScraper/spiders/listeVideos.py | 18 +++++ CinemScraper/spiders/listeVideos.pyc | Bin 0 -> 929 bytes README.md | 0 scrapy.cfg | 11 +++ 15 files changed, 271 insertions(+) create mode 100644 CinemScraper/__init__.py create mode 100644 CinemScraper/__init__.pyc create mode 100644 CinemScraper/items.py create mode 100644 CinemScraper/middlewares.py create mode 100644 CinemScraper/pipelines.py create mode 100644 CinemScraper/settings.py create mode 100644 CinemScraper/settings.pyc create mode 100644 CinemScraper/spiders/__init__.py create mode 100644 CinemScraper/spiders/__init__.pyc create mode 100644 CinemScraper/spiders/grabVideoData.py create mode 100644 CinemScraper/spiders/grabVideoData.pyc create mode 100644 CinemScraper/spiders/listeVideos.py create mode 100644 CinemScraper/spiders/listeVideos.pyc create mode 100644 README.md create mode 100644 scrapy.cfg diff --git a/CinemScraper/__init__.py b/CinemScraper/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/CinemScraper/__init__.pyc b/CinemScraper/__init__.pyc new file mode 100644 index 0000000000000000000000000000000000000000..fc061b3de9f5571cf12cf4ab53054c514c76ef72 GIT binary patch literal 142 zcmZSn%*)l<^f@Y-0SXv_v;z8GsJK^gu^Yh9Hw3{&Xh@ z<7#VaxoTe<)7r~_!q7HViMoxj(Yd#)8=k~|vX3wls^Hm-xichkKBX)#W`aIFGU+Z* z;_UfAb>4l#7%kXxE^<{cJ{EM!ADmxCwVl~Jfgc5S_J?v`Je&gv5nQB`z)!vBIGe5keG#xb=`g5Rs6zwKvIDj_vMDnpP^O za^l8sg*(iwqtISBfs-B2ynQ=6^L8En*z2_OpOX~UPss0AJn(=`#(xDlz=WLu48W;^ zse&wouK?EopC*AYMp1*=_7^|L^nl%WPM@6H%#@iXJ*wDqn;jI-zvkh0;FJ^2$JQsB zDVT(^l{k&{K9eR4>m6v1*UdQhSaJ_IH$GxyPE_^dc(qz}Q(KsYrnxy=n(oxa_~h^N zzR0-utoOV-r$wFyOcx2HAE_9>v$^;NR|-zO7}p90pD*D{0JaHNfky*il$BvYSee5$ z+PHx>H)zYFyn?w~8+7{yx4l6-H@G`+I96x(;3I1_igvlGW87hz+4IL~S&%6Rw>h5o z`h7ANL`@FJk~1ix&3pS;>7t&)4kK7D@o7!C!(sQtmaJ?ww+8ns@~I7`&Q@g00`D`$ zPMuzueqR&02wi&MSzf`BOFy{W=k1c7txFIQIl@R3B{36DVGbx5?uGi#)# z%0e{xl%yl>pyCP)30moyiTDlP;DEh&T;|J#!FX`={wN;29mj9v5{y#r#<<%7`m2cX ztvl4MF1=cnc4)jbA_%C5D&$fBq81~*oFpk&g(M+iCds1Ambrvdoy^c(c66SXE0ZNz zxzM&i&qdOXk|oPDl;iu;#lLN3$hkod-(QE8YN@tr2eq!!1fQwqhQ+NvOuyiNRpTXl OQH%6aJ}wlq8~z3j<`7i? literal 0 HcmV?d00001 diff --git a/CinemScraper/spiders/listeVideos.py b/CinemScraper/spiders/listeVideos.py new file mode 100644 index 0000000..e25581b --- /dev/null +++ b/CinemScraper/spiders/listeVideos.py @@ -0,0 +1,18 @@ +# -*- coding: utf-8 -*- +import scrapy + + +class ListevideosSpider(scrapy.Spider): + name = 'listeVideos' + allowed_domains = ['http://www.cinematheque.fr/'] + start_urls = ['http://www.cinematheque.fr/decouvrir.html'] + + def parse(self, response): + for lien in response.xpath('//a/@href[contains(.,"video")]/../..'): + yield { + 'adresse' : lien.css('a::attr(href)').extract(), + 'dateUpload' : lien.css('::attr(data-sort)').extract(), + + } + + diff --git a/CinemScraper/spiders/listeVideos.pyc b/CinemScraper/spiders/listeVideos.pyc new file mode 100644 index 0000000000000000000000000000000000000000..ca00c6ae0b2e8cb194058c8b16ab2e82e23edeaa GIT binary patch literal 929 zcmcIi!EVz)5S_Kt0EJ3$=^0fV90|O)B1H(b5F`$$NHGLqR9P!~LmWA_yEASQshrAR z@mX+(nRNu^4y*Osnc4B%H?tdlKiL1a{gLLd8zHYJ{Nae9;HjVjNZAO$0xT8G6%-+S z1-J(Imerp(6ZX+A4RLpg}a z(*aDANYv0>hDr!$p3o~>5Vd2i*Xwnhm$h9PTG)%u#&f3&n>XF1D_y*xRh0+)x6p_} zQGst6Hm~7I!P1v^tzdHg6utyd25=Qfi7bJmOGeHJ;dmDv+=%YM@l0LZhYzeiiH6L1 zhL0GvHu_}Y?EF*S)MUyUqxkWWZ^hB*T*om_Jm5q#9vdPTN$!YlNu+QV(V{ePw^x9x3Z`wr|(YnI~p4%INY6ZCx( dAEoXsiP^tmpZ