From a8d60689bcb02ee1bf320f6c42db086505787294 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E9=BB=84=E6=B5=B7?= <10402852@qq.com> Date: Fri, 8 Nov 2024 19:50:15 +0800 Subject: [PATCH] 'commit' --- BaiHu/Tools/DocxTuBiaoAdd.py | 43 +++++++++++++++++++++++++++++++ BaiHu/Tools/YunNan.py | 24 +++++++++++++++-- BaiHu/Tools/汇总的内容.xlsx | Bin 0 -> 5467 bytes 3 files changed, 65 insertions(+), 2 deletions(-) create mode 100644 BaiHu/Tools/DocxTuBiaoAdd.py create mode 100644 BaiHu/Tools/汇总的内容.xlsx diff --git a/BaiHu/Tools/DocxTuBiaoAdd.py b/BaiHu/Tools/DocxTuBiaoAdd.py new file mode 100644 index 00000000..b0c40367 --- /dev/null +++ b/BaiHu/Tools/DocxTuBiaoAdd.py @@ -0,0 +1,43 @@ +# pip install pywin32 +import win32com +from win32com.client import Dispatch + +docApp = win32com.client.Dispatch('Word.Application') +docApp.Visible = True +docApp.DisplayAlerts = 0 +doc = docApp.Documents.Open('c:/1.docx') + +# 创建图表,图表的插入位置为预先在word文档中插入的书签,书签名为“插入图表位置” +shape_chart = doc.Shapes.AddChart2(Style=201, Type=51, Top=doc.Bookmarks("插入图表位置").Select()) +shape_chart.WrapFormat.Type = 7 # 设置图表为嵌入型 + +# 设置Word中的图表 +chart = shape_chart.Chart +worksheet = chart.ChartData.Workbook.Worksheets(1) # 图表数据对应的工作表 +chart.SetSourceData("Sheet1!$A$1:$C$4") # 设置数据源范围 + +# 簇状柱形图测试数据 +chart_data = [["", "系列A", "系列B", "系列C", "系列D"], + [2020, 2, 4, 2, 3], + [2019, 4, 5, 3, 2]] + +# 清空工作表默认数据 +worksheet.Range("A1:D5").value = None + +# 填入测试数据 +for row_index, row in enumerate(chart_data): + for column_index, value in enumerate(row): + worksheet.Cells(row_index + 1, column_index + 1).Value = value + +chart.SetSourceData("Sheet1!$A$1:$E$3") # 设置数据源范围 + +# 设置图表样式示例 +chart.ChartTitle.Text = '测试标题' # 设置标题 +chart.FullSeriesCollection(2).Format.Fill.ForeColor.ObjectThemeColor = 10 # 设置系列2的填充颜色 + +chart.ChartData.Workbook.Close() # 关闭workbook窗口 + +doc.Save() +doc.Close() +docApp.Quit() + diff --git a/BaiHu/Tools/YunNan.py b/BaiHu/Tools/YunNan.py index de365397..96af6f67 100644 --- a/BaiHu/Tools/YunNan.py +++ b/BaiHu/Tools/YunNan.py @@ -1,9 +1,15 @@ # pip install pymysql # pip install requests beautifulsoup4 +# 查看结果 +# select * from t_dm_area where province_id='FD61813E-70A1-42AB-9A8E-141ED4D47B98' order by level_id; + +import time + import pymysql import requests from bs4 import BeautifulSoup +import re if __name__ == '__main__': # 遍历 mysql数据库,然后开启爬虫 @@ -28,9 +34,11 @@ if __name__ == '__main__': result: tuple = cursor.fetchall() for e in result: + id = e[0] area_name = e[1] url = "https://baike.baidu.com/item/" + area_name + "?fromModule=lemma_search-box" + print(url) # 发送HTTP GET请求 response = requests.get(url) # 检查请求是否成功 @@ -39,10 +47,22 @@ if __name__ == '__main__': soup = BeautifulSoup(response.text, 'html.parser') # 假设我们要抓取的是
fWzkl5mJEod1rd4R+9D6Jvczqm&OkY`g>CMUfFt6!R=er|Ih_s2}*xO^h zmi3J}N0FhSJduRtlEipLBkK3M%T0NL*}n_#o^o{gh|O6~t5ViValY9*2na+mt?ehD zkts*0fV-FKR_?tsjYP4BfIdtH(Vj6eLs&TOzZT<#uuaQ&0w(JbnCGw-ONqTXM=s@XX|B z%*sy@VSrr<8Xu6uHdho$9}$x#Bcch_nxAc`ss8$4;G}% Z!wc?=t9>clWbYqVmA84Qj_Q# *TaV3=rh|`;#w(vu-P* zAGv_tLsYA9CkYF)JZe(G=Xz(57HaWK_~PP7|8P7Jd0+OlJ2qAN;y6q0Y-e1!PoV%a zEASlkqVPpl;K50jysT(TJvQ^^E(SDGMY4-*YK?5dnp7ct(UCHQbeJ5Q7{d;5WMFb_ zF5{7P+Y|7luQ!%BfMR#^@V?r3h>ix81fV=Z7r&uLYRmPJ_}WuGh@=fYuJyv>lBFY{ zoOsu_H+W7i=?dKX6g|#hb^C9?$eYAq4N7(79zGjR)rX{%AMYXltz0bpo~gOSFi yuhnS5)Tt1CTUnCG1oyiMu 0MjVWJDMBy|6Qun{!OE&||#i(=+%P90`x{uP;d%->K`taoF;3>kuwsOz2Fi z#FVgD4)48Nja6{Rf1;O~Zs;+$wo-!tBH1;lWm1Ctp1+cz59uNn;#OLy0`)u0C~~0% z&WDEk{c(wuu>(g EPCOiAO@Y%tEaKf9DeDUwILER6{A3-55+`U~v4(cAV)#6A4 zySi1)BAn3S#E--8)^gb_L^$$BkWwMOCjGZnL=hZ%h|fU!Me#9Dv#rtl!}(6)a~f09 zieEl8QY|)lMCv(lsUO)(RW&pz-N{ZiJ{DMB%6Ec3N(k=Z!3Yp_Qh0^!Hob57sGC3L zB)@gF#?w9-Csl=0sf0 s&YKYjz?MPi*l_NU`-QULc47|K5^&G( zQ@^|E%#yw;Lh+WglJZTeGulJ1gKc_U{DIihXKdL@v+R4_$qx)#yNtzEpFB(nZCF 3Sa3kQoNrlN;Lq_hQ6Q*{kGY!O09p(98_ zT1HXRY?|OIu%VKG|3b#5I&rE$|JqB*MplC}afM)|Lj4?8OKmDIcyOBjcviUwNHxo} zh(Ga%H<%coA%ApQW2au{7Lq%RLv*GqdlI%uk8@t{v+u^woi*GUQowpFP#yVJ!hc7% zV$Yf{V^7yi((K;xSilIkD@tL5M% 2ADl z1HEJKhG!d+ArBbkBy1%4GW_2+jC 8$q zWIF%Mb!5B$QWPL}l;F8_#W6J!x1DpNTLE2k14@Q&1uR`GblhEBJ%lY>+^v3gL754C zKaEl-G7KIvG@D|TN*cPOVCHV0J(!d-7h0pHQp& FX#Rp%8dijnhuM zv2;iX3j#cPh8uk%Ani#h*}+Twc%yDY^rElsd5mn gpqduEDgukDR6Y}x|_`)ub0EIHj Q#;|wdNU3gq4eF0 zCr?;CkYKCnwF90>$2M)sV~*Zho<~r8eRXz9As+bmy?NtS48jjBDj6mKK>EK$edOx; zTT?}cB@xmvWY{?g=vc+eB!%2EIbr)tdkRiMosA)LXKodzxPIc{xUpB{R*m1?thrv< zH*zmHorz2Pq$6#c_)UQWrZ`$>-3|U-%-(_4;{wWhWqM;WJd 5FCD#Cy(AB^`V)#XHw(WVLiv%stWbi zDkEye-GT51%u!*dJPj3I>APOpU7bXIes`yXt%M13I(bbCb9Lh;y1e*soG|s02ISz6 zF%@`F6O79vGNY@70yxU#sUW#vPXDL|F-r`VO=$EX$>L*mS&<6-rMfkK_+F;=X+rb9 zla7#J{EN+Uw{jG%S3oIV|5lS@v{N3t!3IvplNZ ZyVSQ94iK%Xcy85 z#e9<0o_Aead-FBR#WVoj2xDBM{MGXR`xpxytzVzIpr6aX47IKjT%E%Fh64a~LBZ$@ z_+K-btH7(Xia)?)bS?h>lZ&f7R~`Kyo_cipp?Ut*-(O|9YDE9AfY1%#KP>;TrB}gM z-P9j29OvJ?)m4V8j^qzR6Yg(@|N4`w(5p@AALugvFX+{l^(w*DBk&JFC)$$#p9AqK k{A#iPfit2H)c?Z&DSaIXHd+z@fB^k{j*jyu@}Ix{2a*U>ApigX literal 0 HcmV?d00001