From 5955efe77bc59bf1e2f7007d3e14e503a8454762 Mon Sep 17 00:00:00 2001 From: guange <8863824@gmail.com> Date: Fri, 25 Jan 2019 15:54:57 +0800 Subject: [PATCH] =?UTF-8?q?=E6=B7=BB=E5=8A=A0=E4=BA=A7=E5=93=81=E8=A7=84?= =?UTF-8?q?=E6=A0=BC?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .gitignore | 3 +- .../__pycache__/middlewares.cpython-37.pyc | Bin 4326 -> 5147 bytes chapter1/crawler/taobao/items.py | 9 ++++ chapter1/crawler/taobao/middlewares.py | 24 ++++++++- chapter1/crawler/taobao/pipelines.py | 14 ++++- chapter1/crawler/taobao/spiders/jd.py | 51 +++++++++++++++--- chapter4/check_proxy.py | 31 +++++++++++ 7 files changed, 121 insertions(+), 11 deletions(-) create mode 100644 chapter4/check_proxy.py diff --git a/.gitignore b/.gitignore index ebc0014..40dad18 100644 --- a/.gitignore +++ b/.gitignore @@ -7,4 +7,5 @@ chapter1/crawler/datas/comments1/ chapter1/crawler/datas/products/ chapter1/crawler/taobao/settings.py chapter2/mysite/mysite/settings.py -.env \ No newline at end of file +.env +chapter4/results.csv diff --git a/chapter1/crawler/taobao/__pycache__/middlewares.cpython-37.pyc b/chapter1/crawler/taobao/__pycache__/middlewares.cpython-37.pyc index a0323b1ab08474ed549198bc4f6f30ecfff7493e..f5c641910037b1c3ed7bca4b9049eeaf188bc9df 100644 GIT binary patch delta 2066 zcmZ`)&2QX96!-XJ?fvlXrp*TlAx)qO-L}foLRyptDiWeJDosNcm0*D^XUC)t-nE%= z)Ff<_NXe}Slv=1#dr8!5B@P@pAtCV>aKHz|2@VJei9Z0|n@zH-l-Qb|-^{%CX5R0; z8UH@?^g@2pG&2%BKcAodw5Mk;|I*fT=uwFhU$UBCViD1oEm?dOOM$QKt2NEi2M@#-Pj>s)2L;vrM~dRX2>hpe~HtE#tS}l1+T0hU?LvW zo(_n8q1H*2ER5ZXf6?fC2hL(Z4EM%fMnDG)Rocv2F&Hp`vGN>%q2+WVZDb6?$T6JR z`?ouOmU?_64RT3gI(!(`iSP#lXv9o}Jc4lB@{POsFkaOc#|1x%;3v_U$W4>g6DCO^ zWI@&C+&)xVjCJGV31NOn@9Ve_?)U{_VJs=O?0Fc}xl7|G#^O6KIOsdgLC2AU;{?{? za(cUb4h;qoh5$-(GuNkO<3apu`nvThs=tPC9$^?kWat7)C4`FzrzU3vW3T?kjJnf5j;y*)c!VK;CQ!P5*%EqBL0*(I3x3R;sLqRNJB zWDT8Nii1q=)*#Hd65d&syez?8MX0VPyP8`{B8vl6@5f+3m#>6e0q=Katw;G9Cn&CYmj)U;o7TECy5@Vtk&{f}k ZR|j2=*B^!lubd-?ubfkg*Nf$1|9^L$rH=pr delta 1317 zcmZ`&T~E_c818Ae_H=8zAs^u*0a3w?3yFjUgI_@$1Ta~`43Y-Yu$?AOJ33Fh1a5>x zZ@e&yCtmR<{P+b#jb3@H=@0PAAK;boyk}!06Snl}`+eT?yl)RPzecS)rkRlVuauwO z*y%a2`uFy^MkInf$!@%njkqp*a#gVv1UAKsRpWMC$T3f?YPKfixQDB{tqWQ864j)g zMAD)}G=iT?1iQvF#WuOFlLXfjLbte{BnH(9G9|j+6~qo4v|XTpzejV7Zg-!B(*d9xH-dqE1Sz; z%f?P*>h4b2t%VhTTO@a6M*TJFm)#(6f?9>R)M-UeF&2AsO*GOd7g<5LMMHU7N?7iBH zH1<_}cO7#*t56l+!l2mAK047W9I4mlf#fO0&t!~R&EUY zES~FZC^2J?Lih!MivX7Z1oxLg$^c{m&ZK>edzbkWKm?8(8aA+w6LgFf(gPpAB)-cz z7CRPG!3iI?hw}&HRjV?4@;kO00|E5bk1|)ZOMA z=@O^pliiLA6#9O_{#yIt;K`yW-H*UFD5SlzO=|}Zo5bzuh~&5 zx7R_@G>@~j`9fi3DPN?saERb)0i<@hR!us=9lQK#Foa?N{y809QQ}b zpiH-FyH_5DVU5b%Vh;wc$L@8nZm12H*yc#}OOM=gNMYkC@GnZ8c6NksRDDwS+*=SE S03#S-*+Am27)p93J^2r-!~4