From 7ae67ba965ea680407ae21fedbd035d43ce8c313 Mon Sep 17 00:00:00 2001 From: liusheng <337615773@qq.com> Date: 星期二, 30 一月 2024 14:45:07 +0800 Subject: [PATCH] 代码提交 --- ruoyi-admin/src/main/java/com/ruoyi/web/test/pctest.java | 138 +++++++++++++++++++++++++++------------------- 1 files changed, 81 insertions(+), 57 deletions(-) diff --git a/ruoyi-admin/src/main/java/com/ruoyi/web/test/pctest.java b/ruoyi-admin/src/main/java/com/ruoyi/web/test/pctest.java index e176112..b28ead7 100644 --- a/ruoyi-admin/src/main/java/com/ruoyi/web/test/pctest.java +++ b/ruoyi-admin/src/main/java/com/ruoyi/web/test/pctest.java @@ -15,72 +15,96 @@ import java.nio.file.Paths; import java.util.ArrayList; import java.util.List; +import java.util.regex.Matcher; +import java.util.regex.Pattern; public class pctest { public static void main(String[] args) { - String str = null; -// for (int i = 51; i <= 189; i++) { -// System.out.print(i + " "); - try { + // 寰呭尮閰嶇殑瀛楃涓� + String sentence = "135465465濂�46546"; -// long l = System.currentTimeMillis(); -//// str = "2263艙189艙艙232105105搂鑳搁儴鑲跨槫绉戞棩闂寸梾鎴挎偅鑰�<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>搂11陇232334680搂鑳搁儴鑲跨槫绉戞偅鑰呭嚭闄�<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>搂19陇232313714搂鑳搁儴鑲跨槫绉戦绠$檶鎮h�呭嚭闄�<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>搂20陇232294126搂鑳搁儴鑲跨槫绉戣偤鐧屾偅鑰呭嚭闄�<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>搂22陇232231895搂TKA鏈悗<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>搂16陇232349695搂<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>1鏈埪�29陇232303115搂楂樼硸<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>宸ヤ綔鍩硅璇曢搂16陇232295017搂鑲跨槫<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>鐧昏鍩硅娴嬭瘯棰樎�15陇232233427搂鑰佸勾鍋ュ悍鐩戞祴闃熷垪<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>鍩硅娴嬭瘯搂10陇232215217搂24鐥呭尯IBD鎮h��<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>闂嵎锛�8.22-8.28锛壜�20陇232169849搂2023.8.25灏忛噾浜轰勘涔愰儴MDT闂ㄨ瘖<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>搂9陇232173705搂<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>淇℃伅鍙嶉琛�6陇"; -//// str = HttpUtils.sendGet("https://www.wjx.cn/handler/Search.ashx?input=%E9%9A%8F%E8%AE%BF&qc=&cp=" + i + "&nw=1&qt=1&accurate=0&t=" + l); -// while (true) { -// if (str.contains("<font")) { -// str = str.substring(0, str.indexOf("<font")) + str.substring(str.indexOf("</font>") + 7); -// } else { -//// System.out.println(str); + // 瀹氫箟姝e垯琛ㄨ揪寮� +// String regex = ".*鍚冧簡.*鏃╀笂濂�.*"; +// String regex = ".*鍚冧簡.*|.*鏃╀笂濂�.*"; +// String regex = "^(?!.*寰堝ソ锛屽悆浜嗗悧).*|.*娌″悆.*鏃╀笂濂�.*鍖婚櫌.*"; + String regex = "^(?!.鍒珅涓嶅彲|涓嶅彲闈�)(.(濂絴骞哥)+.*)$"; - List<String> list = new ArrayList<>(); - String folderPath = "E:/pc"; - try { - Files.walk(Paths.get(folderPath)).filter(Files::isRegularFile).forEach(path -> list.add(path.getFileName().toString())); - } catch (IOException e) { - System.out.println("An error occurred while traversing the folder."); - e.printStackTrace(); - } + // 缂栬瘧姝e垯琛ㄨ揪寮� + Pattern pattern = Pattern.compile(regex); - for (String name : list) { - name = name.substring(0, name.indexOf(".html")); -// String sd = "https://www.wjx.cn/xz/" + name + ".aspx"; -// String content = HttpUtils.sendGet(sd, "review=1&u_atoken=31d3a0e6-e00e-483c-b956-b6177972e734&u_asession=01691hXKO9p1D59fHgd0NAIGdr-8HrPakCUS6X_v_Z43ohuMPPQJnwrrPl3mly-UFXYrO71Pz35K7wOrV6v8t3g9sq8AL43dpOnCClYrgFm6o&u_asig=052KZ_HPijdQddSitCTcvhNlwy7cGO2t46JgQGTyclFPT7xwZjoK0YBNED-DbuN5gugFYO36lFqDfxMpnRFufeLFk7BSuILL02zWW0QNCM-NWgLElQ9wTw7yMg4BFlXpIhOVzkXl1W45ZWoBPny57uZ3WVmTrcdvNBGM1L1rWev0UwpA9oQuqX4mfRyWspmK8gksmHjM0JOodanL5-M1Qs1Srh04GpT7zItRH0TxDThMR15LDAE7pTBPfvFUyoAgUl5gGKGQH-vEmN2Ae1t4GLLQkS6fjps_twKYxR-u2135jY94r_LXIIil3Y3aVPRGAe&u_aref=gk2k7DQa4vfdgaFwA4iVd7KUI4Q%3D", Constants.UTF8); -// String sd = "https://www.wjx.cn/xz/214877887.aspx?review=1&u_atoken=7ea94b7e-ff2c-4f9f-a16a-2377e7b932f7&u_asession=01mUmaPv86XmI35R93EFzW4vAn-_bjd_hg8O3aV3Qj_hY4LTkzoq3vcQyaBAt_bXG0L3UvT1OC8yhlQ_Vrlj1nD9sq8AL43dpOnCClYrgFm6o&u_asig=05qqfmDpV5jnzQ3zaOR-kKvhCvox19kVoC-lC8wI68PnJ7lkckawOfhM2Sz6TSlLyxhPCLiM-UkS5JtWfnNrZeTMme2Xl4_nh34yljc8iiZeJybY6mcSFGRriqnFvQfUeuCvV5odDJuWRnGyKMRbx_RypafWqYj328He90miD2j6an7QQBtuwLgtjfNI6ktmk7ksmHjM0JOodanL5-M1Qs1cOGKb4pT6nOz7TsF50O_Y5mwcLzFTlOSTrqpuPzNwho1AC5ZokKrUg3JS1GlbH-sRHfAvD91UjmwUK--AQbESDY94r_LXIIil3Y3aVPRGAe&u_aref=muWANYNZeB7WW%2B%2F7kLKv3uRT8ws%3D"; -// String content = HttpUtils.sendGet(sd); - HttpRequest get = HttpUtil.createGet("https://www.wjx.cn/xz/215122141.aspx?review=1&u_atoken=ae7fe80c-bf23-4e45-bcda-e1a79738fa28&u_asession=014vQCkRvW7c3i2ofZKQ4cwL_Kbllht28bP58Yv5WaOmib7bTm0yOu3E9ghHeDwRromXsXiqHPUHP-r4N4zkLsNdsq8AL43dpOnCClYrgFm6o&u_asig=05cv8a98zgMB5Y5sCj2tshR0ymwhcsf5o0ZnRdzw_MWEqjWv9qUXA2y-W56hqxwwu62XCEZ1EDfpROWbv7u5K0esMlHJrRxH3x6MobynAbRVK73TZbz-pPzJrSvkDKmiOfptL_k4wm25Oa44SC2LnI-f_gUMOBxNBqpVgCnR54boOBWxWY3t65iSXiQbR5_szmksmHjM0JOodanL5-M1Qs1XAPImYHnI2tMZUJbFSrHeeZf56fnMo9lJFDBHsYIUFUSQYCfCQCLXjf34sWIadxtsAb6Kn2CIzT3kClvRmyaM_Y94r_LXIIil3Y3aVPRGAe&u_aref=OUtfes0VUTyTV7SKqEByRa9VGaU%3D"); - String content = get.execute().body(); - //鍒涘缓鏂囦欢澶� - Path folder = Paths.get("E:/pc2/" + name + ".html"); - Files.createFile(folder); - Files.write(Paths.get("E:/pc2/" + name + ".html"), content.getBytes()); - } + // 鍒涘缓 Matcher 瀵硅薄 + Matcher matcher = pattern.matcher(sentence); - -// int index = 0; -// while (true) { -// int dd = str.indexOf("陇", index) + 1; -// String newStr = str.substring(dd, str.indexOf("搂", dd)); -// index = dd; -// String sd = "https://www.wjx.cn/xz/" + newStr + ".aspx"; -// String content = HttpUtils.sendGet(sd, "review=1"); -// -// //鍒涘缓鏂囦欢澶� -// Path folder = Paths.get("E:/pc/" + newStr + ".html"); -// Files.createFile(folder); -// Files.write(Paths.get("E:/pc/" + newStr + ".html"), content.getBytes()); -// -// if (index == -1) { -// break; -// } -// } -// break; -// } - -// } - - } catch (Exception e) { + // 杩涜鍖归厤 + if (matcher.matches()) { + System.out.println("鍙ュ瓙涓寘鍚玕"鍚冧簡锛屾棭涓婂ソ\"銆�"); + } else { + System.out.println("鍙ュ瓙涓笉鍖呭惈\"鍚冧簡锛屾棭涓婂ソ\"銆�"); } +// String str = null; +//// for (int i = 51; i <= 189; i++) { +//// System.out.print(i + " "); +// try { +// +//// long l = System.currentTimeMillis(); +////// str = "2263艙189艙艙232105105搂鑳搁儴鑲跨槫绉戞棩闂寸梾鎴挎偅鑰�<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>搂11陇232334680搂鑳搁儴鑲跨槫绉戞偅鑰呭嚭闄�<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>搂19陇232313714搂鑳搁儴鑲跨槫绉戦绠$檶鎮h�呭嚭闄�<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>搂20陇232294126搂鑳搁儴鑲跨槫绉戣偤鐧屾偅鑰呭嚭闄�<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>搂22陇232231895搂TKA鏈悗<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>搂16陇232349695搂<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>1鏈埪�29陇232303115搂楂樼硸<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>宸ヤ綔鍩硅璇曢搂16陇232295017搂鑲跨槫<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>鐧昏鍩硅娴嬭瘯棰樎�15陇232233427搂鑰佸勾鍋ュ悍鐩戞祴闃熷垪<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>鍩硅娴嬭瘯搂10陇232215217搂24鐥呭尯IBD鎮h��<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>闂嵎锛�8.22-8.28锛壜�20陇232169849搂2023.8.25灏忛噾浜轰勘涔愰儴MDT闂ㄨ瘖<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>搂9陇232173705搂<font color='#30a6f5'>闅�</font><font color='#30a6f5'>璁�</font>淇℃伅鍙嶉琛�6陇"; +////// str = HttpUtils.sendGet("https://www.wjx.cn/handler/Search.ashx?input=%E9%9A%8F%E8%AE%BF&qc=&cp=" + i + "&nw=1&qt=1&accurate=0&t=" + l); +//// while (true) { +//// if (str.contains("<font")) { +//// str = str.substring(0, str.indexOf("<font")) + str.substring(str.indexOf("</font>") + 7); +//// } else { +////// System.out.println(str); +// +// List<String> list = new ArrayList<>(); +// String folderPath = "E:/pc"; +// try { +// Files.walk(Paths.get(folderPath)).filter(Files::isRegularFile).forEach(path -> list.add(path.getFileName().toString())); +// } catch (IOException e) { +// System.out.println("An error occurred while traversing the folder."); +// e.printStackTrace(); +// } +// +// for (String name : list) { +// name = name.substring(0, name.indexOf(".html")); +//// String sd = "https://www.wjx.cn/xz/" + name + ".aspx"; +//// String content = HttpUtils.sendGet(sd, "review=1&u_atoken=31d3a0e6-e00e-483c-b956-b6177972e734&u_asession=01691hXKO9p1D59fHgd0NAIGdr-8HrPakCUS6X_v_Z43ohuMPPQJnwrrPl3mly-UFXYrO71Pz35K7wOrV6v8t3g9sq8AL43dpOnCClYrgFm6o&u_asig=052KZ_HPijdQddSitCTcvhNlwy7cGO2t46JgQGTyclFPT7xwZjoK0YBNED-DbuN5gugFYO36lFqDfxMpnRFufeLFk7BSuILL02zWW0QNCM-NWgLElQ9wTw7yMg4BFlXpIhOVzkXl1W45ZWoBPny57uZ3WVmTrcdvNBGM1L1rWev0UwpA9oQuqX4mfRyWspmK8gksmHjM0JOodanL5-M1Qs1Srh04GpT7zItRH0TxDThMR15LDAE7pTBPfvFUyoAgUl5gGKGQH-vEmN2Ae1t4GLLQkS6fjps_twKYxR-u2135jY94r_LXIIil3Y3aVPRGAe&u_aref=gk2k7DQa4vfdgaFwA4iVd7KUI4Q%3D", Constants.UTF8); +//// String sd = "https://www.wjx.cn/xz/214877887.aspx?review=1&u_atoken=7ea94b7e-ff2c-4f9f-a16a-2377e7b932f7&u_asession=01mUmaPv86XmI35R93EFzW4vAn-_bjd_hg8O3aV3Qj_hY4LTkzoq3vcQyaBAt_bXG0L3UvT1OC8yhlQ_Vrlj1nD9sq8AL43dpOnCClYrgFm6o&u_asig=05qqfmDpV5jnzQ3zaOR-kKvhCvox19kVoC-lC8wI68PnJ7lkckawOfhM2Sz6TSlLyxhPCLiM-UkS5JtWfnNrZeTMme2Xl4_nh34yljc8iiZeJybY6mcSFGRriqnFvQfUeuCvV5odDJuWRnGyKMRbx_RypafWqYj328He90miD2j6an7QQBtuwLgtjfNI6ktmk7ksmHjM0JOodanL5-M1Qs1cOGKb4pT6nOz7TsF50O_Y5mwcLzFTlOSTrqpuPzNwho1AC5ZokKrUg3JS1GlbH-sRHfAvD91UjmwUK--AQbESDY94r_LXIIil3Y3aVPRGAe&u_aref=muWANYNZeB7WW%2B%2F7kLKv3uRT8ws%3D"; +//// String content = HttpUtils.sendGet(sd); +// HttpRequest get = HttpUtil.createGet("https://www.wjx.cn/xz/215122141.aspx?review=1&u_atoken=ae7fe80c-bf23-4e45-bcda-e1a79738fa28&u_asession=014vQCkRvW7c3i2ofZKQ4cwL_Kbllht28bP58Yv5WaOmib7bTm0yOu3E9ghHeDwRromXsXiqHPUHP-r4N4zkLsNdsq8AL43dpOnCClYrgFm6o&u_asig=05cv8a98zgMB5Y5sCj2tshR0ymwhcsf5o0ZnRdzw_MWEqjWv9qUXA2y-W56hqxwwu62XCEZ1EDfpROWbv7u5K0esMlHJrRxH3x6MobynAbRVK73TZbz-pPzJrSvkDKmiOfptL_k4wm25Oa44SC2LnI-f_gUMOBxNBqpVgCnR54boOBWxWY3t65iSXiQbR5_szmksmHjM0JOodanL5-M1Qs1XAPImYHnI2tMZUJbFSrHeeZf56fnMo9lJFDBHsYIUFUSQYCfCQCLXjf34sWIadxtsAb6Kn2CIzT3kClvRmyaM_Y94r_LXIIil3Y3aVPRGAe&u_aref=OUtfes0VUTyTV7SKqEByRa9VGaU%3D"); +// String content = get.execute().body(); +// //鍒涘缓鏂囦欢澶� +// Path folder = Paths.get("E:/pc2/" + name + ".html"); +// Files.createFile(folder); +// Files.write(Paths.get("E:/pc2/" + name + ".html"), content.getBytes()); +// } +// +// +//// int index = 0; +//// while (true) { +//// int dd = str.indexOf("陇", index) + 1; +//// String newStr = str.substring(dd, str.indexOf("搂", dd)); +//// index = dd; +//// String sd = "https://www.wjx.cn/xz/" + newStr + ".aspx"; +//// String content = HttpUtils.sendGet(sd, "review=1"); +//// +//// //鍒涘缓鏂囦欢澶� +//// Path folder = Paths.get("E:/pc/" + newStr + ".html"); +//// Files.createFile(folder); +//// Files.write(Paths.get("E:/pc/" + newStr + ".html"), content.getBytes()); +//// +//// if (index == -1) { +//// break; +//// } +//// } +//// break; +//// } +// +//// } +// +// } catch (Exception e) { +// } } } //} + -- Gitblit v1.9.3