From 828a4320c79ce96ea224825df3804f61f777d84f Mon Sep 17 00:00:00 2001 From: Fisher Date: Tue, 13 Jul 2021 10:01:31 +0800 Subject: [PATCH 1/2] =?UTF-8?q?=E5=A2=9E=E5=8A=A0=E7=BC=96=E8=AF=91?= =?UTF-8?q?=E8=AF=B4=E6=98=8E.docx?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- doc/编译说明.docx | Bin 0 -> 14506 bytes 1 file changed, 0 insertions(+), 0 deletions(-) create mode 100644 doc/编译说明.docx diff --git a/doc/编译说明.docx b/doc/编译说明.docx new file mode 100644 index 0000000000000000000000000000000000000000..27c7fab72c2f9ead41305d6885cf1075fc43d0db GIT binary patch literal 14506 zcma*O1yo(j(lv^+ahKrk?(XgyJh*FccbA~Soj`CWxH|+(Ah=ry?hbF0bI-|1zWd+t z))-sHS~a_?XRofVuC7*+1&4qIdAY(AHiTY&|Gr>=e@yI+l^pFIoEVjWV(7pdfS+QE zk&oGWpdcWQU?3pK{}wZJaA0t^waJR_w(DU+7CU}_hopQIkp&V!Vk{=gtxk`chZnz1 z*Jov<^GW#R+C>U-uc0wZ%j2P5bSI?$q|!+84)~A_q_;#`T8eK@kFNTcf$!Y zGCg!{fe5=7w-MzrUkoxqaBl#X=7!su*(4?&kO*}(`m&weR9~5P3%N;LxB!T<{fY=u zVJgwA5LnQ)!7N{{yQ*a~vzPruW&3pm?$vc0po>2EOU!--eYAM{qe-oj`1?@;J8xhi zjPSCM>qt_vQD95J76xlHuiwXS2h?W_AN=;l>`tUZ@e#hxj2%#`P!0YNVG~k)o)V2m zFlXP&P9e~=4ag0f8t_}JV3@8gd|rNL_j2G}FO4y4BlR@6@~)k1!OY~==UT4d?B1?OhrJ*Myt3-yAlcjEct z8j+r*YqSwPfE%#-X+Q)fce$gz-g-a5;{(4gz$HowU!XADS$L10%=D3jb;}o zXM5Whq6_2YWqXB?LyrTW4d=aT>lSy)$f$SV`hp;>kBR5&157v%>`KKSj_pd+`P`>A zPY@^gSkbEV2SM?hzqF&n6fqd|iIXnAIY4`8tH?wqwY8f17KF~%O<8%$)7~DzDWjm9 zmThf23Ny^VS0AX$DNlj#L5YRywLjJ?F}T5RyTV` zlRs>YhwP3nCJ^Cl1_FZgw}_LohmEPz3+oMfvW}ZA7+D`_ybRtZ!Q0$kZ_QS|?)-5@ zc@%lb6`#c!DmBz&onUZNbFd;3Ixp!Ow@h|F1S#~TUMxREb|t$>JYrXOWr7$4Y;92g z&Bl<|juwLn%Q@0Dl6Nd+0KE7a+c_a&<(2PMdz*pu5J}oe+VhChbBbc;^YY-O)|)m7 zzH1Po;fW1{ovKI@{tUS@gMQ=WOAxHe4K? z9hfd@vANGj>A1^?u8dGjSW-qsvK%Q=WKm9jDEdfzf~(>_7lAVUoG8Moz(Np!z%r~s zGG<+m9R-!rR4SZpi*<@8d3pS;HLk)GvnUPTJzG?6V+fm&HJ*(rj8aD^X7j51Et=CU z8YJXLLW1wl4F_C&)mpmEdRcm^J5!j(lJ)ZF_I)JAX)vs0LZe4)f{f=P16bt-2rHiL zEBYUAedE;38uMM<`2wm|6wcbYxbE+ghN9_7q{c7TBc5ScSd+RT^=nyZ950z$CrV>y zC?9uaD8!E{CNv2E%;$t+@WbANvn#76pSzm(>t=Szj-Nv7+HNx8s_*=spLYG8&lxZG ziB_S~yzjWC9xhjt@hy$t-_C?i#bw5oI;k4_GmL&ny_Hm@QfdNK||xT&J;fk~VV z3$DIXhw#L8WI=?mRKzeYe8kgphj64U3&G!_&liIcz`VLXI@WRrtbwknH3l-~BU;&dvlr7!x;SRAl<6`(9H z|A0@mb8-WNPq-AhOyX<4NZu&%5lOKr zo89dWAj~OH=MJWemugB$It?V5RlO2}9#2%-$INrGg2l14p^16lFLT)dDc;ZzFEKPQ zF)qR~L17exz9F#%(MS^V!-u*cTs2@7WhVYpX6|9>TNs=woNJSZ4_})g#x!EAS%UJT zCPP1-xtj97|4QplvzpOEeC`9OxP1?sJ#vlV-FVE26D2C4ODKkdQg1v?T0$TfT?OTI zn#5$W>arO9Hu}|MMd(_)S8~nA=t5dWei-c4Cq@?UO9ClRJp?wbMrG>-?i+D3Q#TN( zMvyj~Y&k3(Fd9<}KyiH@@%PtZ!puz}9cflw`q$Uh%;Mk9+sxlEz~X?W*A=sgB5%$z z@uiUsJvE-SqrPI(E*bD`@t_(xRES|J5hH0vYtw@kCcQ<-6e3^gl8>hL?(7$Si;u#G zOVN_1*IC3D^fuCdGv)YwG)ePLUY3#Eds>$Hub4RT+bjwibXd1Hh^@tDL+*`q_=JxF zf%Al7TF%YTs#D;9Xpo#jwJo=<4?AKrSe>IyEcxaSzsQF_FbOqL87HyrK;ZoIb4 zHI;I}`ZhWF3K<4|Ogd26ME=D5sU;5HOd&>KymI~6&|Pf;oQ4adKeL}&d{BAu8Dyg~ zv_?5{-BSLUw!W(DqvA?RH3v4 zlOePObHq|MEA0RaJbk4K>o+1Mg=H9{fcXaa(E)xmV-#@J17E3EWD=)p&WKQ^>YGkp zb~#-;9}2fOV)AHpST7Er=@leyw@Ofsy2U6YALC@vt+E3j5bC>oHwRw{toyX}3n$;x zBi6zyDT=yh_E_Z{xCr@GeuOha-(cBLjNW*g8_+qirBbn#AU&~>f+D8CZ$*5#{>r;n zEfAEW1v3_mvLTb`zLN=iAQV!Q4JlFHsPqa^U7o+oQ)vq%TI=YWY7OUxrMmn1jQ^m5 zYJ0+1WYq=XZrWbFww5{MV5^U(4QS_f9@XXo`YfH*S zA9qMoGl!%bpzZXH;uC)~HWe)^o zEo|ixdT=kU65+(?!T*;AAZ#+ta1U|7b++2)rL(2UG&s8tE;H6;0G=cjIQ8g-Hu5V7tUPJS@T&UKGc&->S!wJRPW= z1FHwtfvMws2W({s3a}afLCbFatH}vN@@+L_*g!Jo>+`0j|J}+hhLs_$kars~rZtcj zKe_vU5y6=ZN4lcP@F!s}>XF4~xEo6|0Tl=GUr=HTbR&qJ#nR4D7!R!I7~Ca5n;9#gX4X4(R~zP{@vHu3WcUa?v5 z_Ugop4&Za_4+f+l{{1pzzIm@q+T?}Ev}d0NH{Xwl^!`>mbvE`-%`H|w%?_75AdAFs zuaWD7Dn5nOd5O4|yFJ;5eg0(pWpSDrzaO7u!Co(K_S= zZlM0g3j?XKBSXHi?NR2c&O7AThX6Yp{~Cjn(C|*SX04cntGm+DJfRAU;IgkJo*>Va zmC^bmcex9I&vXq?iJU4m9pMjOpFw|j-o2#U@?fDrKyZL-)t5EWPcPHS)Y;k6&itnn zS%@|4xX5v_lJ*o7=BA@7r1C{<*r6h8E`qW)gH=of)e3bDBp2g$A2=csNT%q$?i`dvLVUlM2y_pdBCTSwOS&aev+=Ja%=G zP6A``03}JyobB&fpqcqhiKb;E9kY#L4*=gvkHVq7LC=tm=~rFU#cZ>y&ZpH@Zpdl+ zgs&Nd-BGRGy%Q8ZnvNML+wnTxbbQuYJ8pe-h}c)cej@EGzXC=zYaoIMW3DT0>5Ig> zFF*9(LowJ%5>ME3pXzFmE|1r&=Ho3bzf~sS@*UtCn*_W;rY074nQ7HA9zit1bEf!? z{DT&7`C*oSD&K#(ruFNTqgK`_Ztb%9X>uh5rcZhvh(fuA$rqXaeRNvyxW>i9O4pb+ znmL0$>2G-UV8x_~F3MQv83>zTRWwu+SwZF3N*RoqvskSjqGF(Xp*>eN*7+#p&!5$0 zOjXw(`B&mn8ln9!{59~CbsQWbl_vaCdMPxm0$6zPJ6Aqg~~bslx_w2 z?~s@}bPk|3*mQDTu-#?K71;=2GS_0`U9$)XS>iC2@tIMBivsjbJ>^8QO6u|MRZ=55 zRM0+m60!~aW>3j$=BS$+(yuk`Ncq3=nCS2Wov&J7US=+dG*)imf<_!$QSwEISos4$`2*8LtIRC| z+zN|7Q&u{o0}}rMZUP#-Rxs|t?6QxnmIkYbcm^+Qf$&Ady`E{}a+_jGrB_ptEH^<% z58tb=21tJG9_a`EZwsg{dh)LI4STwrlu~is&GzWv3#R=e+Ph?nDnS#W-o-jj_zx@n z7)%=u#Dk=AsdFNr1gv8r^&U=JnWxX?#fX3_zRM)aL4>@Gq*S!2?plkDnndrT3uZ>S7hm!#9OmT(ZC=4_-nSN%MKTvzWT&-!0&sk##Q-So|WvzHz*dk8ym5tIRAmz}C+mYFwCNtNd_vwtTzH6A7ueCW4%dAmuX=5`| zc5Zu9MgPcTt_Jhl=oQOtdGk6>MW2eG+%Udfx-YGsZDxr29{Ko`4Q$66^U1VNImeN| z6EB{(rS5eA+##J3614mzVSp7Ep5Y4M{2i0K@1^s1z`10qUoa#oJi$=wEoL&dvho!~ z#)A9w340Yy2kG`DKv&Z|R{*g5&apSLlpY2hz$dtcphM%Hy$>KHygYt}{C|fh;QpRC zoGnakP5%f|RQm^2-T?y`WUoL#Fn$;ODbD;7syNh=x5wo~ZpZrWr+Ls`W3u1NLIV9s zV1vUIRZJ!lkD9(=G`v+eE(w1*a!WH;XsUiF4>aFR#}nDBm)^%x&kl}x2LfOwmK8&`({2RC{Y zmbfTiyxA?>;%it0nCtZ5b>Xox8Cjdf9r@#g{$fX4=qE=~8jU#|*NWHXbu(j!jzI=( zmAhN(xvBLkC9kb`L;MhO9be6sxLIXsuPcI2IsjA3ek51{U5mEPH}vs0bxYxTIb(ue1V%;v)D>-A{RTwcEJ@3B@2t)gGwFU)c+v;#`z zlf7chlbuQ0F#$x0=0b{R5yL{() zb_bDs`F(FrZn_!MNJp)Z$nz{OcfuH-JTu2Q}=7Z1TCY zG*Dl z%ky#+V1C<(%;P+^EE4g4b({?Hl8hmx0-(cYuaYE%z5yYt*luhbjbGL(8;&sx&ax#} z9e;6zYLA6tE_G*Op#F8qBDOCsr6h`IYcX=H8{a-fdA4-%W>TW3QfOMZBen!%pv;0q z`M_~rl9?U6Bi3Y#WIp38FJd16lZMD_`i8Pgq{+t4L9;6U!kUQasGe}r(uTB|%s6Gj zr!O_artU4R$lD)1S5l~HbFux{GUy(hY0lk9sqLcEtXrVuv|oL~3}}}r%erkR6%xO+ z2~B6fxNV)$n7w|yDsm34PR5CIm8~&O$fR1Ghu@`KB6?rd;j^*kqfG7$U zy-D1|j+r1Xs%qSpP1??A4tbRRM>|(1mie zNz&C;(uPl7>?)Y2;$(=h=|{%wrlzPulm|85R}|F_#F7gGn{vJ~Ceu+$u#(rcRhhvg zZuqc_reKxPo^yLT>w9DZ2Ewk}bSX2JENDmpTi$JI^aJZHM6Avg0-X{VN9>DA`flbB zNr$a*OcZs}He6EE=0P-4ca8|cPH~g8yjYkB&{6W+zR9KJm_ijpuz2tIxK!95tsv#P z07r7+8$#REvX^wNJZZpnt$KGoO)dl>#~Ey@c}reXrEa#i-fOFmL-pc4RGb;X@1l1dJXntmX zUzhvHEIcT?NCIb%a4}B#E48u=Og+-g>e~Hmn-3)B;X7^S+NJp|MLPZEugq)>h?C8& z&!Eb*!t?af@dXl(#D{G^*W0aUDmlXd+))H2XZgiNnTp3K>x!udMp??)cnKT425kZ; zm3ZY7nbbNtoLZ3^^Ch`H26eN#_*UzbYh&Y#jlbvlauDbp`qi+Kbv! z{WZiU+152I*@oB0D45QMy!L|>ODNv~2&hpPhZ0dAL_(a9L3&?kHH0y4>YhePC0X_v z#+9z#eCQg4k-^*^O=5QfeU{hpZPxSk5@Y8NxN|i|TG~u1wpMSuswg8!33vyQ>iNsf z3VSOYy`=mvBK|w#0k*D}b&>mJ$*a#tqZX<{CM1Thm8gk`spOR-EL}s?)UD3k(JA^u zE&K6zu(j0s2xi8@4P)oN_A-}K(u{yAR?O};RFY|#Xo?4%YFp-|yw>GtK9RP{?}KG} z9ZMBvss1*~aT2X)n-`@7s#vyu#Knp4;}y8Ay=Z*&+(G1!NFsk;`j_AnT6q(ZE6G!Y z+ddkaXxSB;I&OoQ@9|m$J4CQD;fW)o#mP8y%xak`#~(4LaCf36#L07>``io3b0C8_ z(%ylgn+8%2sT)Z6x1sOA5HfX`stJB@#|#{#M&ApyRG^YCZwVnVd_QqdU9^x8K&e7d z`_#82IJ~GW+Yt*-9Uzk>DQq`nBt|1IxiKzTq1U9EAHsgmYPMs`Rl~Mj2gsa!97m?F zDcqBiu@+PAcfhUqLf$fEF^&Hoos)DfbSwPo_6OgI>Mc1IhFSVTP$1RUWxjIyALpvd z`urgneKTO6%5>l_HWi2Oz7lUD5u;LI;jNCUP8GdLw|Di>Be-w85<2B2d>VJ!f=p|p z^dp5W1yc;+61H`PoFm}rDPy<^EX25Egq2(cs{?$6abl|5zj8AH$;J#6zbjWdH{P9^ zP1m~?VXqLJ>(wskK1txG$=2U~g&tO67jBWbU_{3H{nqDvJGX;7IHg=04%&77lzv6a zPoP^UN(-|J_@mJEd3&C~0N0(!aULh%6q$A(=v-i2QiN?^-1zJf!xfF#-1vcr-2K+pq@Nxqlk(T>kLXJ)%~y zxL!PbtN*LkJlI7sJv;O)Hd9F>@BTQcCskLtIml^ zVbr~=`_5vQd#lH3LfnUiHyetGni>F1;Uf7Rq6tP^fgb>+H>)Ke;@ki(ZQ`!?{jl9{ zsX^$VJzj5lv&nRfp@T2kp*SvKC9f;FIkQ4txDlE^8<;0y|*d(e>P zsg4iPASMZ#UHdv`$R}&MB57G;NYr7#hJa6kv}{_DK-`RPnawE-11$S^frp#{#6<(? z))~1)1X>y%2jfWN=uAyMI6+*w(CWi=NK>;Q_*~xS;!~TrH7Qg+w)T(P8g#Up-UD}` zDt+OftIPJ5L91fr>3z)a1Q*B2gPHP~t2gD{wF=$SUH%=>p4*An`kA$~NBqB|9 z9_sM(=0Ecx*(t`#6ABQ_7^_l!$}@%je27oasohZERDJ*>IcwV=x?B-?dD~p5Y~yrU z;o{@2GAfV9a4Zt3k~K2J{dC-mytOp6w%kr3p8u+NONOPa+L3YJDld9oo<3#Tv8v&K z1d;T*2q~p8<{|pYM3a^d`&K$>EPq(i0uOb(Nq{4FTVw1q4HXpxr^VYWYzKGc9KSFq z6>Sbs&xkK@JCFS3MZn<${tjC=Zo8e0nF!O(5dhER4>(D~y`F-iVws!eO81N~qK<<; zzojLiu`rIaI(9I4Z0NPJZ1iBN_}C~cinQxTak9q7LRmuAQb&5GfI;rWguXZD4Tm~W;ly*YAuBm&PXHRwYssc;bYL?6^^6GK#$`H^Q2nN-Rr^W{q&n4W)eX%afyvl@2ps)T8d{k^ zGQojRCSJIXsUgN6i$McRfMUoSA=HXMrTmM^CkrUGAS%q@kDB&Ei3tYsIR!U>t2oB6 z=q>O#*<7d%cR5Ua=32Ke%%lQNZjZIPB+Nn(&b7F)0dJN`C&BytsUhTdet>dG_`E$h zdE$wTS%8rv4tvefV!G*E4k4}O^=@P*NF{z@n9T=;MRS<>#*mb5a-X`pnSoB_M6&y{*HBA zXF1Da#xR@e68hTW1tr&z7LmoZlLuR?Sb_K@@8V7JHgUPqn7o5_xRS{oi{GM|arf_y53Wg(h-hXF#d{ai z)V4CAO6MtNy3Jq#_`V*9lE&7NV@2p&;gDsY(-3Ks2fNJGZ)S|w;;x|Fif(O;vS`hg zHgz_sGl-<(^Iwa%p(iU#&nUvWu7JbggrLQDSl=)aXYK{;hYqwz z7%3L6T_+2}{Ae5Pw1}~&n@q@dO2R^EPw*0jKAI;a~cU?SsLQ1 z+EOyr*{FovpD~-}(VN&`aNM^Xv*f7~M@|ip{5DIkhoL(jHbwveE!wch#|^1CsPz3( z#?g)vv7<_k$w+|swF8{t5Q=fMG#*z?aEGP#K8^jy73D75^h1Zr5l&dRjAv=VE><1{LCc#*%Z@QW$Pd&^pI8PdnCtI zc8UFIBf5Hp@B4EGRm5)={iXZ*7MQPAu{g1veOfZTnpU|R7xZS3bscKISU|Bw5)0AG zQC>!LFIwYbB5Mx13_=&gcSCE>&BP+9n>XUSE%C6fPvyZrh}?PDV0#}~rtR9U1WRWg z_R8x{R)5$dmWwhI%{iyD9^HZi%clzwiY{)S&yaq*yX{O;bX?dq z5U!QyN*1w6Nn%D=wK4;8xv+bE2kGTSJ8N}L_N|AV(OdWx{5HDVTyN0aYA`|j5)^~ge zFs*?En?ctYD&aM@kf>a$g$oci@jd9Ry+efRB|ckP>+h^zm7~!- zoj*$2-b$4M6m}~!IdWoVEg6!WF+azRl7}1ZkJI(8P(qZs1)@y0pBEK3^&)RBV7w3c_LkRYO7B#Do%MxH`TIbF^O_zCFK}N-^{4* zH_}vh=5*mV;5Fz~6@)rA(G)j-7+0<<_#nI}51CRXfvfK%-TSGGZAtPA7J2njja0#> zC*T^8XPWF-RZ}xl)v~%v_8KHxN%-NIuUMoEPVJE!4 z{jk6V2LV|E237wV3}*Ir&T586Hb1i#+mn9|hR|zBPw0Squ_QX3S`FAd{2^LbayM;qNdZ3~imK6SfX_m+5ozh0r>-7v{V)#NFiG^$lt<6!ngpiWqa`{(B6<(VdO&B2@qoA%A0J3Ba>aW7VKu!4%0t%RuK+ZRs=C zRXEDr$FUO07q>y=vR*^n&dhQMex+ZB9Rp5F$s5rnyLTH?;m-a=?y_;(ZG z2dwZF27o99zAcGPP_-mP^|S=?&RS5A9&+QJtxcepr)DFP&+Y$kFo0X!Ao`A`Hh-pT zgOZRCJ_4Vu1LvQYZH&KU7+xeR5|(AanUO<|AyODBwv4d+ z5GU8*;}zuBR9)GA;>cn??(H<>>Es;bo|j~M0-LOk5ZHz|aHr6Heq{I-j)c`SNc7~x zn%FCjvF-l52&gTVBrn`LDh2`C?`fM^Nm|!iOd7-qj9DCHVY(yJ!{MH>_`~XYt3wxG z!PDbE&f!2>T2~4mDAd?IE%Me^%s3NXbjR;TU^tdjji>S$K~@pJvJ`+W3xsz}H**mf zJ5G_2jD~tuh!}y%{5}(PG2wty$DJ-QyWd^r)EjEb9CKN|uAx?R@@qn?kzNEwr+HF%G7P4_V(1DBzQ6 zWw1w0a`DQOSYmm!+!{!KxaiqCKiLXh83GAqO9abOgm`dVJU_`IO-U=Uv623t!888CiR>(UT7vGKSLDMofEv+NNDD-m5iaeVAb zIA^&bT4Q-nHP)cJ*=Z-PFDthuM^h#(XeHMx}uCz}@hW2XM}jLLuJ3 zGt0^%D_V=B5+^k3dv9|`kj2;0=!j&{Pw`bsi$1(zFk^Y|sEzfC!c2-r9AQ>et#+J>0KA41rKl7wVCaUvck# zZLX0_Y?vB`6;T`Cu}MYH1bf{gGA};9V$Qh7FG~We130AHvH_2mADGoBm>&?8ld?4) zPY!DbW)6mE)Ai*D{v!DUI~&+73D-7 zdtxcccEz-Tnt;e&w5Mz~$Op4E3Q1@*fVA|^28d~rH zjTz19F=_>ghYQTI!i(6(bO#ymydjJyT>q^d83h@J_=&%FrI`?v6Xyv$_w+DEvc)EV zb7J&3XTXebIAhf30cbuz!O%f|or?LhtAM=)0t!L|{7zv0uO0VS0sq|sz1Z@&Gyf{f zX6mo&Z)*N^g6elB{yanV0{e>zO5neLVE;K$^{4889{c%)t_2#4f6#v)0{RpF=W&)_ z@K-={{R{rj;gNv62}QQ_ZZ{He&F%a&hobDICae_O=-iT^VO@C&aE?DPK{ z5%?4TXCC7({5Qn^;QyV~_$U0&lQh5JiGTOmuX8njf&aU0`n~s%fC(=@b^kjt=J)sf i&(xS-wQ~Iq{FNx9Bn$b|{9%G%f@lHXE?(9b(EkS|MMSs& literal 0 HcmV?d00001 From df795b62d9b3cd4ffeb6a3761f8a7b69b76c7cb6 Mon Sep 17 00:00:00 2001 From: Fisher Date: Tue, 13 Jul 2021 10:05:23 +0800 Subject: [PATCH 2/2] Update spider --- src/backend/JDSpiders/Spider/JDSpider.py | 50 ++++++++++++------------ 1 file changed, 25 insertions(+), 25 deletions(-) diff --git a/src/backend/JDSpiders/Spider/JDSpider.py b/src/backend/JDSpiders/Spider/JDSpider.py index 0e71dc0..e7000a0 100644 --- a/src/backend/JDSpiders/Spider/JDSpider.py +++ b/src/backend/JDSpiders/Spider/JDSpider.py @@ -2,7 +2,7 @@ Description: Author: Fishermanykx LastEditors: Fishermanykx -LastEditTime: 2021-07-13 09:17:32 +LastEditTime: 2021-07-13 10:04:13 ''' import re @@ -851,10 +851,10 @@ class MotherboardSpider(JDSpider): def main(self): motherboard_link = "https://list.jd.com/list.html?cat=670%2C677%2C681&psort=3&psort=3&pvid=e726d0ee460448b6a16cf24950c1dabb&page=" # 爬取数据 - # page_num = 26 # 一共爬了26页 - page_num = 1 # for testing + page_num = 26 # 一共爬了26页 + # page_num = 1 # for testing start_page = 1 - # self.productSpider(motherboard_link, page_num, start_page) + self.productSpider(motherboard_link, page_num, start_page) # 清洗数据 self.cleanMotherboard() print("Successfully get Motherboard data!") @@ -1015,10 +1015,10 @@ class GraphicsCardSpider(JDSpider): def main(self): graphics_card_link = "https://list.jd.com/list.html?cat=670%2C677%2C679&psort=3&psort=3&pvid=e726d0ee460448b6a16cf24950c1dabb&page=" # 爬取数据 - # page_num = 30 - page_num = 1 + page_num = 30 + # page_num = 1 start_page = 1 - # self.productSpider(graphics_card_link, page_num, start_page) + self.productSpider(graphics_card_link, page_num, start_page) # 清洗数据 self.cleanGraphicsCard() print("Successfully get Graphics Card data!") @@ -1196,10 +1196,10 @@ class MemorySpider(JDSpider): def main(self): memory_link = "https://list.jd.com/list.html?cat=670%2C677%2C680&psort=3&ev=210_1558%5E&psort=3&page=" # 爬取数据 - # page_num = 40 - page_num = 1 + page_num = 40 + # page_num = 1 start_page = 1 - # self.productSpider(memory_link, page_num, start_page) + self.productSpider(memory_link, page_num, start_page) # 清洗数据 self.cleanMemory() print("Successfully get Memory data!") @@ -1384,8 +1384,8 @@ class CPURadiatorSpider(JDSpider): def main(self): radiator_link = "https://list.jd.com/list.html?cat=670%2C677%2C682&psort=3&ev=3680_97402%7C%7C97403%7C%7C106254%7C%7C106255%5E&psort=3&page=" # 爬取数据 - # page_num = 27 - page_num = 1 + page_num = 27 + # page_num = 1 start_page = 1 self.productSpider(radiator_link, page_num, start_page) # 清洗数据 @@ -1557,10 +1557,10 @@ class SSDSpider(JDSpider): def main(self): ssd_link = "https://list.jd.com/list.html?cat=670%2C677%2C11303&psort=3&psort=3&page=" - # page_num = 36 # 一共爬了36页 - page_num = 1 # 一共爬了36页 + page_num = 36 # 一共爬了36页 + # page_num = 1 # 一共爬了36页 start_page = 1 - # self.productSpider(ssd_link, page_num, start_page) + self.productSpider(ssd_link, page_num, start_page) self.cleanSSD() print("Successfully get SSD data!") @@ -1735,10 +1735,10 @@ class HDDSpider(JDSpider): def main(self): hdd_link = "https://list.jd.com/list.html?cat=670%2C677%2C683&psort=3&psort=3&page=" - # page_num = 11 - page_num = 1 + page_num = 11 + # page_num = 1 start_page = 1 - # self.productSpider(hdd_link, page_num, start_page) + self.productSpider(hdd_link, page_num, start_page) self.cleanHDD() print("Successfully get HDD data!") @@ -1892,10 +1892,10 @@ class PowerSupplySpider(JDSpider): def main(self): power_supply_link = "https://list.jd.com/list.html?cat=670%2C677%2C691&psort=3&psort=3&page=" - # page_num = 25 # 抓25页 - page_num = 1 + page_num = 25 # 抓25页 + # page_num = 1 start_page = 1 - # self.productSpider(power_supply_link, page_num, start_page) + self.productSpider(power_supply_link, page_num, start_page) self.cleanPowerSupply() print("Successfully get Power Supply data!") @@ -2078,10 +2078,10 @@ class CaseSpider(JDSpider): def main(self): case_link = "https://list.jd.com/list.html?cat=670%2C677%2C687&psort=3&psort=3&page=" - # page_num = 36 - page_num = 1 + page_num = 36 + # page_num = 1 start_page = 1 - # self.productSpider(case_link, page_num, start_page) + self.productSpider(case_link, page_num, start_page) self.cleanCase() print("Successfully get Computer Case data!") @@ -2089,7 +2089,7 @@ class CaseSpider(JDSpider): if __name__ == "__main__": accessory_type = 'all' - accessory_type = 'graphics_card' + # accessory_type = 'graphics_card' if accessory_type == 'cpu': cpu_spider = CPUSpider('cpu') cpu_spider.main()