From 846c92198346b9830779d46506b3cae33a137a5f Mon Sep 17 00:00:00 2001 From: YYL469 <2049360881@qq.com> Date: Wed, 3 Jul 2024 19:52:52 +0800 Subject: [PATCH] =?UTF-8?q?=E4=BF=AE=E5=A4=8D=E7=88=AC=E8=99=ABbug?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- spider/__pycache__/saveData.cpython-38.pyc | Bin 1214 -> 0 bytes spider/__pycache__/spiderComments.cpython-38.pyc | Bin 3109 -> 0 bytes spider/__pycache__/spiderContent.cpython-38.pyc | Bin 3612 -> 0 bytes spider/__pycache__/spiderData.cpython-38.pyc | Bin 510 -> 0 bytes spider/article.csv | 1 + spider/saveData.py | 4 ++-- 6 files changed, 3 insertions(+), 2 deletions(-) delete mode 100644 spider/__pycache__/saveData.cpython-38.pyc delete mode 100644 spider/__pycache__/spiderComments.cpython-38.pyc delete mode 100644 spider/__pycache__/spiderContent.cpython-38.pyc delete mode 100644 spider/__pycache__/spiderData.cpython-38.pyc create mode 100644 spider/article.csv diff --git a/spider/__pycache__/saveData.cpython-38.pyc b/spider/__pycache__/saveData.cpython-38.pyc deleted file mode 100644 index 97fee395ffa2d2c795ec85c1a14fea17cf1b9c19..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 1214 zcmZWp&u`R56rLG-ZD*6P`OzSbIdIul+CT#mjamvK>M;ZXBDGesX8k7MjXicfvnjjU zs0R>2LQyOAQgMigREhSooDhgZ{t)+Aw%z^#?U`q<6K&|M=FR)Qd4BKn%=6xzovjia z=l^)T{X>P2KXWiS7=mj!)m1b=fQH1)R~FKUxr~lE!!-p1;}LZ$U_#|FaV=qkwZqai zVLc)kMQ@Y3{SW3K8+Dq^`l;YrctYL}r0BJxuKF(gEa?{O+RDmSz~ilsxD~9Oc-Jmo zXngT`WA$?5;_Avh5wv1&v(pL#|7H@%AeP>B$-}M+)a|a)BKq2Yz*8mkR~@~5C2C#r z^U}w|LT3u+4V>yfG`(Lmc|n0{cF6V!`UbE=x_x zEEuEDPMAvHY*)Yr2d1F9Z&1>&AfBGUX4`@p&0rSJKyBYFA}pAjWbP5UPVw;QX+;JU zD*E()84P4jW%!mzwneo4!h!iiig|KxA@_jbg)DCLmXrvEua`ev-cI9anWsANL(!|1 z&N|n;;j7)=+0$`;97RHE)mtnBZJCI4peUaIIEH!4#>@s0yr=r;Urfy^g?z&UKwkIA2N~^p8h=-YTB4fU>^0DHj z6KYaheJW!KxDNIoc-VBAHSWQZ$<bP{YbY*yu3IxZezvC6DeMDebu zTkdpTI21QS*aUZ`RIwqx&rzwb+$+&|uQsl7eSF{;JU1qe#csmyBwfVb{FkGFwdP$V zQq^pCxLm!o+FTcEN5@I?{o9}4zkNP>b<`aG`f_;i?C;;64d4AZ8XS!Vhr_|a=*{cq z@MtjHe?EHpWHfj;eEQ_CgP)oz2|%Px#dk$v+1dX`$qRp|mf$Eq}4!nn-wyod+V^Xg7IkAz#r!{wp>Kt$a%{}XYogiGKmJ%b>v n<>vT7$s^%;#mi2ZPcS5NzKmk%gyJeiq-M}KD8^y(ekaT^=QV8BUP6)*X(TTPfN`M%}8r{m4F5jiM^g{Tt@BAt8T2wbedUJ$DS*Y<5O-?zwm7 zo;mk?{LU#34Fx#3-o5_oo&OGU+`rl6^-F-s&*7m45X2!~=PLb?ukh|%s0i*TRzw&D zU1~}diRX}rq`O?jgFMI!qZj#*45JVEQ2<664WL07{b&eXf-!&x(B)l$G;rXUgWY_A z3lG19e{#7n@5o58u%$I|jjdc1@hdNKDu$l zSyInqb0_=}Z}UAbay4SwFin^is{e%Nxe}M)*0?;k38w@dF6X|w6dkRZ%_cT18m-ZN zhwpslXM9cPdes1XdRqpD&#gSxhhX|-my zL6YMoSk+9!@zqSj0@+SLXe^X zLbn=i#TXkO+e%@&YniRBXODmT?D2!MFP?6le)^}=habN9?8DP1ADumVdiLn#^wGn! zfBb#x^y#D1`w!0Uy?^%T$?3iKpFjM~7Hw&u{`oL>VZzp-BWZ?a`QV52`#?B;kbjF0 z@DeY)d4EaXh4(d{eRY0`F#6$fojwkX1;O%~qu)8=EeHY|g5XH7g`UV<{w=q9bA$>M#{u-?x9E! zxEhPpi%SBA{nI_b6fk}DKM{@u7QZ%UgYrnaFCK}u*btBhvLa@SJ@JG?-VumN7ME^p z`f>^nk~a(abYy)cJD;0Atk2LDL(Li8eBmJ5Y|z6yYBpOa+zuAz($h1|Rw}t(+*{Z0 z>^8RBJ8d<4(A{tD83@7bnu0%}8Nv`7jmFEN*U? z)yUxrNo`E67IWK8Yi407zqGzvO6G9fsAm$DgPSYGlCGp$69=7mVy&6XZlvamc%BY}c~$^Yu(|XLf_m1EE8#MtNFE7TAM9)t$2EEGPQ_fYNTAMmW#6snOSQkxmvQyHMGlkQVrh3`A)?ZiZmh0W+S?nQRcho9sa43&&d#qcG}h;{U3Gf8Yc88zP1lvt zL^Kw>UeXL?c4#oS9=sWgGW|7U0#0@?F&+-iv|2hY;q9zujV8t>qhk}n>)FNi<)s@z z22a5ST-!Cn!MQpyn|SnQd?E@WKx#qRQHXZF1u(=rXPUbj?gkiOL}pY#ForC3tU$^G zy0sLdH0jHKL3}$Bptlm19GT#~Hf8`Ns@QS{sHIqK28akdQiGZXd?U7rPJRfx$Pd_7 z*g{*T0snX-;bf3dWpY{i(Mv!$0pR0*UTGMhWKbYCV5P>EFD{mMuYh9_CMpLt;T3q? z7okSH1|61Y^Tz-jwvgg}aS3vf>q)lApk(hSU)Knm)d)|nI}{x~2mOADATF$gc_PD) z!k(`&h2cIkks}%Sz;e7w3!oZ>rAmP9*YOenIElh0$KU^O4nSNql>Ijia0Lu7qw6#M zQp2|W7zA13Y=$z>xry(o(M;t5@!taP_3a}%SWCvX9$~MFXV@>y)Xtq&H(VfbAAwb z`J5jD-ha+t0zP0#HgAizWP5C{?XzXuZwFLA^T3{TUWo})y8CuW35K?VAruTP-U=<> z3KfE(ZZK5t%As;3)Qp5sWq^h9t3pf7HmTt@!{q0`|Kr&Qe|FKnEwcIVdX8*?BdSE{ zI8qzp48js>Ha4mT6yk~(0-JeD*3Ft?v3fnIxOKOxD@4WMSqANn3{GpY{>0^WT+T;u zOIK>xtpMQx@>BS*BKN%vodMK+x2JFqMOYg{h8SU?OfEAr%*Yi+-eTm91PDNeQCwwd z6NA^3#SG^`6#s31WF{@fb=N@<36OEH9Ka=@`Pr@_}>3V*y-x z)pe;i*NxOIt3_{(j&`uNZAQT;qe??L80}*NrlZ?!O-C2a17V#&I|StU-~Mp=$!9O_ z{q^*tk2Q4qtA9Rw{3JwQJh=P(;}2f^rFZtlUFbtzGUos+2^y*lYqU!1W~aK{)^+G5 zjj-%C7jAkuo)*!d2a{aSd8m$Y%MoG4g%Q_KVQ(dH?y@4$D+A~0&JwTUJD(8NOZU-> zdHYS5dEijQ%D@}SItvcc)C)ID(?LEUcwP7k@MIp|IdZkyR5YVn4G)r8SRg-Q#BEEy z!#H-d{sDrFV{qpl#Z~r|2o}WE>T8O)QRKEP^3R$kYU}ttW>Z%oriiPIAP>tPc|i8d JBk~oQ|33^vF9`qu diff --git a/spider/__pycache__/spiderContent.cpython-38.pyc b/spider/__pycache__/spiderContent.cpython-38.pyc deleted file mode 100644 index 53bfe037287419f04cd98e290cfab43746d6737a..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 3612 zcmaJ^-A^Oe6`vW8?ZFt9C1gL+FIS11^(qFh!LZ(hD1b4r2E$^&Fe0)B-|O*!Ju}=H z+h7fSAx$Gin@v?Ul~z#%YNRG=vTYxtuF@*c{Tt@B%YHmniqw}>s(Q|t-E1~$$C`7_ zy>sum=iYnH?;Nl8^n^HgE?oLW<>!4I_YZ75{rI5q2E3LDgm8qfadLb0}CSl-R;u&`2rW~e*~*?`55m?M6s!@)oB@f9zOyIXW^ZK*V+VPbKCrpK=@Scpyx+({C+NxdHoz_Fn+qp*EaQfybW_f6_{ z5o#-1ZI#vBu+p%r2AgOqw!+*{r7vc0dwi{ z+YjG)`{A80Pu_X^{zva`TBb%QJ7rUya~L%DT~X6DI|%DpKLf(?VZNUa@ggt$@88$# zr!cb2x)a$9dahFM?D?2Y>vC zAmEzb2Cjn8G5{TpmCV}0 zZfm4kOwF%v&yK|B20{Dkh{FU{PO(DPBERQNxeFklJ~AGt`=)b#vI*iB~v%*>D*dodUYf-$D|yR=tX7)z##R(g9^UC5?VsbqR7ok9B@?2{* zm7mR|Q#bNga&)X<3?^umnni0Qvs>P#ljZ&Sv|53_N%)o;c{MUIpB+ymOIOB{$y7Qy zmQK7HDNZgGrVE8}HdkoQrd2ve%q&f)@r`0>V|8+7Zqi;%FBR>Ljf$F_ z8eW(4@%?mrwYW1n6IZRpcA~1vjjgrTlBF;2TXtc2a&mfUW_x8i*H*{J+s1;?)@n6n zC^eXfTqkVv(sTGwO8cN^*1%RDjlkQc;+8IwdB^fhoh-(P%q_$Pu4V0qYQAs#Jm4 zx7>iKFr{ui`aAfyELpZN62t*_Ch>zN223HIN81YZBlVCsrd8luE8N)X?79{^I#>$ zGYJ-n`M<>!%n*1)uBg*J$QOzUm`(6tFd@tXj%Fk`iCS&t zbPi7G901@cZeD`lIi4k;|2yCVwE>5(2R{9Ps}7gp-sj&8AXXCoA_tokhyYv!?gQ=z zE&>m<2SD;);oKbu6ns-GHR?p=b`iOi+ zv2D$65PF*2<=)4Mzmx1)7)Nz?GJZ*iRNcTL?Bv$3PVOGw`|`brmsJ`*=)3>hBU!TH z!b?nP$sv@WAW-cp!^>!&k1CPqRwPOy(b;R!g=^75B-)NdH`-EkBOa~CqomzmwQbY7 zHZ;_t+Lkd0mJEHv56Qv$R?SeMIuRkhm>gET@}X2ym`WkIpx~goXIgvU`wALEa-dl< zYYi(FaD!0D)RZ!1n5$d}S!QCL=1CP#@J^| z9wZo->9yZt_fee0#n6Y*cu>Azw4nxWb5dV3uBAf$v2Yoo+k5~diEx;HIxTPzsMhi0)qS9JVXpe);>it86QKLlsKN zP}KlOu2ZaJ8E*LzUU36Y_5SC-JNfXF2k(4#a_fT!x8Hj3=f6Ug_s_rGj#`m>cR$CT z&pwMSZ~k=u<{gGb%Okw%_F1A?Wur-%1C??K7mN92No7XEENMiB zN?C{c7M6uZpswser|b7BWm$q4@RCGK@`^kUtDr1KpYvNaN=?_#6kUau$u!;ez}&mG zSeG0`u!LG%4w{PU38B+^9!hC81g6R1(;-t>mv>whs%3}@Oigvg>bUSTPUnYo#BBTr zVqF5l0h$KjCnBD5=xx3H1wJHTpXXoy4g^Dhx9klV>q@0k9X4Ak#RTt&JQ54D*We?2 z8Hra^o<|99ptJ24QM!yIfdu{Xi8{oTQt7G4@XU?C5LbGwZjeTezK$1aT>yeXfxoaI RJumsCZmCOpIdo3q{|kQ>rHTLm diff --git a/spider/__pycache__/spiderData.cpython-38.pyc b/spider/__pycache__/spiderData.cpython-38.pyc deleted file mode 100644 index 254127dd636a8a24acfd339b662edeeb75fefef1..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 510 zcmZ`#&r1S96rNdkbrZc*$2xWL;vqXlM4)F0#LKdk!8>{(OViTQlpQ6HEO7kUcwwI;Lza0Wul?brlkOs!TBx(0r~{@ zL0#Zj0fB;6UBbg4hugf{B$SmqzM#ISDZOxK#d#iZJSJZeOT$DQe$+;CY}Ywu+`jC& ze(9)WS150ZPS;*c9~RTGe4E?R({nT#eZP#N*_{mLGI)%FiTrrCqj?bBj^%J5gIP2j zd`<4{WaVF~xWX-VuflA?DyYLst^&eY%uL9k={TO-^c|;K$XI*p)^oSfDy~k5&tmGw tnVPot|LIFkWrk{8sr#-+9cO)aQf1=ZCtip2+VoU?BUb}CoYPF*#J>)jk&FNU diff --git a/spider/article.csv b/spider/article.csv new file mode 100644 index 0000000..a481b83 --- /dev/null +++ b/spider/article.csv @@ -0,0 +1 @@ +id,likeNum,commentsLen,reposts_count,region,content,contentLen,created_at,type,detailUrl,authorAvatar,authorName,authorDetail,isVip diff --git a/spider/saveData.py b/spider/saveData.py index e688541..523bc9c 100644 --- a/spider/saveData.py +++ b/spider/saveData.py @@ -7,9 +7,9 @@ engine = create_engine('mysql+pymysql://XiaoXueQi:XiaoXueQi@10.92.35.13/Weibo_Pu def save_to_sql(): try: artileOldPd = pd.read_sql('select * from article',engine) - articleNewPd = pd.read_csv('articleData.csv') + articleNewPd = pd.read_csv('article.csv') commentOldPd = pd.read_sql('select * from comments',engine) - commentNewPd = pd.read_csv('articleComments.csv') + commentNewPd = pd.read_csv('comments.csv') concatArticlePd = pd.concat([articleNewPd,artileOldPd],join='inner') concatCommentsPd = pd.concat([commentNewPd,commentOldPd],join='inner')