当前位置:   article > 正文

猿人学第四题-雪碧图、样式干扰(第一届)__b,xtydv-),: (%) x,c(-x,,,a~,x#zc_)~:()'(cx:-56,3t

_b,xtydv-),: (%) x,c(-x,,,a~,x#zc_)~:()'(cx:-56,3tc2 ,

 这里只放代码了,解析在下面代码的注释里,其他解析可参考我参考的文章。

参考文章:

 【猿人学WEB题目专解】猿人学第4题_user_from_future的博客-CSDN博客

猿人学web端爬虫攻防大赛赛题解析_第四题:雪碧图、样式干扰_itwxvq-CSDN博客 

  1. var hexcase = 0;
  2. var b64pad = "";
  3. var chrsz = 8;
  4. const jsdom = require("jsdom");
  5. const { JSDOM } = jsdom;
  6. const { window } = new JSDOM(`<!DOCTYPE html>`);
  7. const $ = require('jQuery')(window);
  8. function hex_md5(s) {
  9. return binl2hex(core_md5(str2binl(s), s.length * chrsz))
  10. }
  11. function b64_md5(s) {
  12. return binl2b64(core_md5(str2binl(s), s.length * chrsz))
  13. }
  14. function str_md5(s) {
  15. return binl2str(core_md5(str2binl(s), s.length * chrsz))
  16. }
  17. function hex_hmac_md5(key, data) {
  18. return binl2hex(core_hmac_md5(key, data))
  19. }
  20. function b64_hmac_md5(key, data) {
  21. return binl2b64(core_hmac_md5(key, data))
  22. }
  23. function str_hmac_md5(key, data) {
  24. return binl2str(core_hmac_md5(key, data))
  25. }
  26. function md5_vm_test() {
  27. return hex_md5("abc") == "900150983cd24fb0d6963f7d28e17f72"
  28. }
  29. function core_md5(x, len) {
  30. x[len >> 5] |= 0x80 << ((len) % 32);
  31. x[(((len + 64) >>> 9) << 4) + 14] = len;
  32. var a = 1732584193;
  33. var b = -271733879;
  34. var c = -1732584194;
  35. var d = 271733878;
  36. for (var i = 0; i < x.length; i += 16) {
  37. var olda = a;
  38. var oldb = b;
  39. var oldc = c;
  40. var oldd = d;
  41. a = md5_ff(a, b, c, d, x[i + 0], 7, -680876936);
  42. d = md5_ff(d, a, b, c, x[i + 1], 12, -389564586);
  43. c = md5_ff(c, d, a, b, x[i + 2], 17, 606105819);
  44. b = md5_ff(b, c, d, a, x[i + 3], 22, -1044525330);
  45. a = md5_ff(a, b, c, d, x[i + 4], 7, -176418897);
  46. d = md5_ff(d, a, b, c, x[i + 5], 12, 1200080426);
  47. c = md5_ff(c, d, a, b, x[i + 6], 17, -1473231341);
  48. b = md5_ff(b, c, d, a, x[i + 7], 22, -45705983);
  49. a = md5_ff(a, b, c, d, x[i + 8], 7, 1770035416);
  50. d = md5_ff(d, a, b, c, x[i + 9], 12, -1958414417);
  51. c = md5_ff(c, d, a, b, x[i + 10], 17, -42063);
  52. b = md5_ff(b, c, d, a, x[i + 11], 22, -1990404162);
  53. a = md5_ff(a, b, c, d, x[i + 12], 7, 1804603682);
  54. d = md5_ff(d, a, b, c, x[i + 13], 12, -40341101);
  55. c = md5_ff(c, d, a, b, x[i + 14], 17, -1502002290);
  56. b = md5_ff(b, c, d, a, x[i + 15], 22, 1236535329);
  57. a = md5_gg(a, b, c, d, x[i + 1], 5, -165796510);
  58. d = md5_gg(d, a, b, c, x[i + 6], 9, -1069501632);
  59. c = md5_gg(c, d, a, b, x[i + 11], 14, 643717713);
  60. b = md5_gg(b, c, d, a, x[i + 0], 20, -373897302);
  61. a = md5_gg(a, b, c, d, x[i + 5], 5, -701558691);
  62. d = md5_gg(d, a, b, c, x[i + 10], 9, 38016083);
  63. c = md5_gg(c, d, a, b, x[i + 15], 14, -660478335);
  64. b = md5_gg(b, c, d, a, x[i + 4], 20, -405537848);
  65. a = md5_gg(a, b, c, d, x[i + 9], 5, 568446438);
  66. d = md5_gg(d, a, b, c, x[i + 14], 9, -1019803690);
  67. c = md5_gg(c, d, a, b, x[i + 3], 14, -187363961);
  68. b = md5_gg(b, c, d, a, x[i + 8], 20, 1163531501);
  69. a = md5_gg(a, b, c, d, x[i + 13], 5, -1444681467);
  70. d = md5_gg(d, a, b, c, x[i + 2], 9, -51403784);
  71. c = md5_gg(c, d, a, b, x[i + 7], 14, 1735328473);
  72. b = md5_gg(b, c, d, a, x[i + 12], 20, -1926607734);
  73. a = md5_hh(a, b, c, d, x[i + 5], 4, -378558);
  74. d = md5_hh(d, a, b, c, x[i + 8], 11, -2022574463);
  75. c = md5_hh(c, d, a, b, x[i + 11], 16, 1839030562);
  76. b = md5_hh(b, c, d, a, x[i + 14], 23, -35309556);
  77. a = md5_hh(a, b, c, d, x[i + 1], 4, -1530992060);
  78. d = md5_hh(d, a, b, c, x[i + 4], 11, 1272893353);
  79. c = md5_hh(c, d, a, b, x[i + 7], 16, -155497632);
  80. b = md5_hh(b, c, d, a, x[i + 10], 23, -1094730640);
  81. a = md5_hh(a, b, c, d, x[i + 13], 4, 681279174);
  82. d = md5_hh(d, a, b, c, x[i + 0], 11, -358537222);
  83. c = md5_hh(c, d, a, b, x[i + 3], 16, -722521979);
  84. b = md5_hh(b, c, d, a, x[i + 6], 23, 76029189);
  85. a = md5_hh(a, b, c, d, x[i + 9], 4, -640364487);
  86. d = md5_hh(d, a, b, c, x[i + 12], 11, -421815835);
  87. c = md5_hh(c, d, a, b, x[i + 15], 16, 530742520);
  88. b = md5_hh(b, c, d, a, x[i + 2], 23, -995338651);
  89. a = md5_ii(a, b, c, d, x[i + 0], 6, -198630844);
  90. d = md5_ii(d, a, b, c, x[i + 7], 10, 1126891415);
  91. c = md5_ii(c, d, a, b, x[i + 14], 15, -1416354905);
  92. b = md5_ii(b, c, d, a, x[i + 5], 21, -57434055);
  93. a = md5_ii(a, b, c, d, x[i + 12], 6, 1700485571);
  94. d = md5_ii(d, a, b, c, x[i + 3], 10, -1894986606);
  95. c = md5_ii(c, d, a, b, x[i + 10], 15, -1051523);
  96. b = md5_ii(b, c, d, a, x[i + 1], 21, -2054922799);
  97. a = md5_ii(a, b, c, d, x[i + 8], 6, 1873313359);
  98. d = md5_ii(d, a, b, c, x[i + 15], 10, -30611744);
  99. c = md5_ii(c, d, a, b, x[i + 6], 15, -1560198380);
  100. b = md5_ii(b, c, d, a, x[i + 13], 21, 1309151649);
  101. a = md5_ii(a, b, c, d, x[i + 4], 6, -145523070);
  102. d = md5_ii(d, a, b, c, x[i + 11], 10, -1120210379);
  103. c = md5_ii(c, d, a, b, x[i + 2], 15, 718787259);
  104. b = md5_ii(b, c, d, a, x[i + 9], 21, -343485551);
  105. a = safe_add(a, olda);
  106. b = safe_add(b, oldb);
  107. c = safe_add(c, oldc);
  108. d = safe_add(d, oldd)
  109. }
  110. return Array(a, b, c, d)
  111. }
  112. function md5_cmn(q, a, b, x, s, t) {
  113. return safe_add(bit_rol(safe_add(safe_add(a, q), safe_add(x, t)), s), b)
  114. }
  115. function md5_ff(a, b, c, d, x, s, t) {
  116. return md5_cmn((b & c) | ((~b) & d), a, b, x, s, t)
  117. }
  118. function md5_gg(a, b, c, d, x, s, t) {
  119. return md5_cmn((b & d) | (c & (~d)), a, b, x, s, t)
  120. }
  121. function md5_hh(a, b, c, d, x, s, t) {
  122. return md5_cmn(b ^ c ^ d, a, b, x, s, t)
  123. }
  124. function md5_ii(a, b, c, d, x, s, t) {
  125. return md5_cmn(c ^ (b | (~d)), a, b, x, s, t)
  126. }
  127. function core_hmac_md5(key, data) {
  128. var bkey = str2binl(key);
  129. if (bkey.length > 16) bkey = core_md5(bkey, key.length * chrsz);
  130. var ipad = Array(16),
  131. opad = Array(16);
  132. for (var i = 0; i < 16; i++) {
  133. ipad[i] = bkey[i] ^ 0x36363636;
  134. opad[i] = bkey[i] ^ 0x5C5C5C5C
  135. }
  136. var hash = core_md5(ipad.concat(str2binl(data)), 512 + data.length * chrsz);
  137. return core_md5(opad.concat(hash), 512 + 128)
  138. }
  139. function safe_add(x, y) {
  140. var lsw = (x & 0xFFFF) + (y & 0xFFFF);
  141. var msw = (x >> 16) + (y >> 16) + (lsw >> 16);
  142. return (msw << 16) | (lsw & 0xFFFF)
  143. }
  144. function bit_rol(num, cnt) {
  145. return (num << cnt) | (num >>> (32 - cnt))
  146. }
  147. function str2binl(str) {
  148. var bin = Array();
  149. var mask = (1 << chrsz) - 1;
  150. for (var i = 0; i < str.length * chrsz; i += chrsz) bin[i >> 5] |= (str.charCodeAt(i / chrsz) & mask) << (i % 32);
  151. return bin
  152. }
  153. function binl2str(bin) {
  154. var str = "";
  155. var mask = (1 << chrsz) - 1;
  156. for (var i = 0; i < bin.length * 32; i += chrsz) str += String.fromCharCode((bin[i >> 5] >>> (i % 32)) & mask);
  157. return str
  158. }
  159. function binl2hex(binarray) {
  160. var hex_tab = hexcase ? "0123456789ABCDEF": "0123456789abcdef";
  161. var str = "";
  162. for (var i = 0; i < binarray.length * 4; i++) {
  163. str += hex_tab.charAt((binarray[i >> 2] >> ((i % 4) * 8 + 4)) & 0xF) + hex_tab.charAt((binarray[i >> 2] >> ((i % 4) * 8)) & 0xF)
  164. }
  165. return str
  166. }
  167. function binl2b64(binarray) {
  168. var tab = "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/";
  169. var str = "";
  170. for (var i = 0; i < binarray.length * 4; i += 3) {
  171. var triplet = (((binarray[i >> 2] >> 8 * (i % 4)) & 0xFF) << 16) | (((binarray[i + 1 >> 2] >> 8 * ((i + 1) % 4)) & 0xFF) << 8) | ((binarray[i + 2 >> 2] >> 8 * ((i + 2) % 4)) & 0xFF);
  172. for (var j = 0; j < 4; j++) {
  173. if (i * 8 + j * 6 > binarray.length * 32) str += b64pad;
  174. else str += tab.charAt((triplet >> 6 * (3 - j)) & 0x3F)
  175. }
  176. }
  177. return str
  178. }
  179. n = function(a, b) {
  180. return new n.fn.init(a,b)
  181. }
  182. function run(key,value){ /*这个函数自己写的,用于获取j_key*/
  183. var j_key = hex_md5(btoa(key + value).replace(/=/g, ''));
  184. /*datas = info;
  185. $('.number').text('').append(datas);
  186. $(j_key).css('display', 'none');
  187. $('.img_number').removeClass().addClass('img_number')*/
  188. return j_key
  189. }

 

  1. '''
  2. 题目设计思路:首先,客户端向服务器发送请求,返回一个数据包(info是包含数字图片的HTML标签,key和value用于js隐藏图片的操作);
  3. 然后,用js将数据包中的图片进行隐藏、偏移操作,最终加载到元素界面.
  4. 难点:1.如何将数字图片转换为数字(比赛规定不能用图片识别)?
  5. 2.如何找到偏移规律,将数字图片复位?
  6. '''
  7. import requests
  8. import execjs
  9. import json
  10. from lxml import etree
  11. import numpy as np
  12. headers = {
  13. 'authority': 'match.yuanrenxue.cn',
  14. 'accept': 'application/json, text/javascript, */*; q=0.01',
  15. 'accept-language': 'zh-CN,zh;q=0.9,en;q=0.8,en-GB;q=0.7,en-US;q=0.6',
  16. 'cookie': 'sessionid=s6txbalcpqflb5rrikn4ezm002oj1oi3',
  17. 'referer': 'https://match.yuanrenxue.cn/match/4',
  18. 'user-agent': 'yuanrenxue.project',
  19. }
  20. response = requests.get('https://match.yuanrenxue.cn/api/match/4',headers=headers)
  21. data = json.loads(response.text) # data是一个字典结构的数据包
  22. info = data['info']
  23. obj = execjs.compile(open('vs_project1\猿人学第四题\hex_md5.js').read()) #利用扣下来的加密代码获取关键参数j_key,图片中class属性值中含有这个参数的将不展示。
  24. #params = [data['key'], data['value']]
  25. j_key = obj.call("run", data['key'], data['value']) # 计算j_key值,传参方式可以替换成obj.call("run", *params)
  26. #发现相同数字图片的base64编码是一样的,所以这里选择用字典中一一对应的关系,将图片转化为数字,手动完成。
  27. css_dict = {
  28. 'data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAABQAAAAdCAYAAACqhkzFAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAMTSURBVEhLrZY/TBNRHMe/bY82LeGA0Dp4NTGYqO1gdKEMwmQcGh38M5CQlGDSwWiMAwwYg2iCJsZJQ9CJ0ETsQMJgwuagLIUFXIAFXNoYcqDloLRXrq3v7v3aXktbSPCTXO77fZRvf/feu9+r5dz5iwX8R+oESigMPka6/wb2vSJUBx+1QoVD3kTz7DScb+f4YBVHA6U+ZKLPsON1IE9DtbDLP9AxEIawRgOEle4cKYSD+ZeQq8IcKquMXTbyOllPL7aiEWgSDRCmQAnahyHsiGQZruUvkIKXcObyFeM62zcOd1ylvwJ5MYDkuxA5Tjlw8A2S12iyGM7YODrujsFqfqTFCJw9L+CWyTPS3QPIBMgwKFBC9n4AaW4AdQVtQxEy1czBObkIJznAi9TDO6SLgVIYqt9QBq5YFEKCTC2momg2VXngD5bmnAc+uIqUIXQUOL/X3hJl5mHfUEgzPJ04pMUxAnN+CYeG1UlAmCLZANtqAk2kARG5m1zxQI9paWUZAsmGsArLnxOh0ZSxwCBypjwo2zQPxzCTgJ2kTtbbZ9zZ/7pRKO8WOOWqrX9iePyJiqnNGgTTuhRhgT5o5kc+JaeosDYssHbpx+OtXEziSIWqx0fqOFpg7ns2Zd24s8B1WE0V5h2mJW/ELTc0kjo2Zcm4s8ClikCIlR+si59tZpL66yosc2U8clM8bhgDkfVFUzuqR569rqXOqG7CPsOlEWiJJSraUaa/i3Q9upC94CHNCtr4WXoN+aJMzcFlakd73eGG5wnuhZHykmZ1tnx9TboYqDfNWLxoWDvqhfK+h0w1Pcg87cUBOavMmu1HMoxShuXJNNpNi7N3ewLJTyEUzIdQIIT0wgQ7EcmzxWifZMcEOZ3KY3Qwgp3RQOnbOfqJx5XGtlSOS4aK1tlHEIcXyHNsrW0dY6SBFX0ufShc70S21OwE5AR+lb+ZVfb5OVpGviGTTkHeSmBfScJqtdX55SAFoY0OsMXxISM6SvvNrshwrS7A9WoENupyv+O/oGm831sslno/RU6OsvsHu3+3yQH/AOyW6SvqnweCAAAAAElFTkSuQmCC':'0',
  29. 'data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAABUAAAAcCAYAAACOGPReAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAD0SURBVEhLY5RVUPvPQGXABKUJAA2GvzP3Mry6f5PhzfI4qBhuQNjQqD6Gzxc3Mjxzk2H4CRUiBHAYKs3wP7Gd4evhSwzPWr0ZPvBBhYkEqIaaBzL8nrmS4f3FfQzP6oIY3smwM/yFSpECkAyNY/g2q4PhhZsBwxegy/5BRZlfP2HgIdbfUIAnTD8xCGyuZ5AyW8jATqmhzD9fMwjumsUgbWPKwJu3AipKGkAydC8DZ24sg5SGDQNPei8D01OoMBkAydCnDIyHTkHZlAE8YUo+GDWU+mAEGfq46RCUhQAUGypbZwdlIcBoRFEfjBpKfUADQxkYAKYHOb9g+7HMAAAAAElFTkSuQmCC':'1',
  30. 'data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAABQAAAAdCAYAAACqhkzFAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAKCSURBVEhLrZZLaBNRFIb/PDp5SFMxjqVOAjYLNUGUbhI3cdEGwaAgbmopWFIQBEUwFhQVldIqCuqilLoymEVVlCqWuNdVXRk31Y1uTKAQMRI0ycQk453JaWaSJjYPPxjmnJPwcefOuSfROXftlvAfaSAUIIXOITfuR9bBQzQBZfqEEzPgVuPY8uIeuMXPVK2lVnjoCrKzJ5F2mKqSZpi/xGCfCEOfpAKhCkPz+HEpgN9sRVpMoqjcJZMJBSVS0Wfeoz94CkaNVE93wOOqygyZr9i+cBnOwT3YsXe/cvUPDsMxHcPWTOU7MmWbD+m5i5RVUIUKGfQt38DOA0dgufuSauskoYuE0RuchV0jzQ8FIAqUMFShmIB9+jhs559SoQnJKKwLcZgpBVwoTFLIUIXXTsMaqdvhZjz8qBECRYeXog2P3CoJts8UMko2F0UdC90o2ihkcAl1mzoTnnGh0kwyGRhXKWR0IBRQOOZGnjL57RsjFDLaF87MI+1Ru9+ysgSOYpn2hKEovo+71RMjfoJtKkpJhRaFAsozr5C67kOOKvLe2e+cBVfXaZsLhSD+LD3DGluZum8p5RA06tt/C4/exK83D7A2xKNEJT07UfzV0aaHoImQHnFuDGlNv8kja2BkBObF5ieqgdDf8BG3PboAPrBx/tVTN7H9KMTuI+WxVQesIRUHPzWKnndU2ATNCgUUn9TKrB8eY8DbukxGFYZu4+dBVWZZYXPvxC3oKG8VEnqRn1R7rCfBfi/Gahu2VSpC3wRyDiViiOhdDre9snUqwsOCZnqkYHhLYSfIb9n5+psESerq6nvOPMylrLDEa7q3C7L7hrVt0z1Fu9Dor0g3AH8BJlTqZkAngxQAAAAASUVORK5CYII=':'2',
  31. 'data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAABQAAAAdCAYAAACqhkzFAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAALaSURBVEhLrZVPSBRRHMe/O+rOuuaUyRoyBlGQfw5lh9xTekg8qIdMKSsQFKRAD0WUROhBCIlSBD1YQsJKQSB1iRa8VRf1Up4UQiNcRVw1nXVdx3V3euP+ZnZmR9EVP/CY3/vx5sPMe+/3nu3suYsKjhGrUCxB5GErNssKERIEyDzlIYOX/MgY+4r0zm5w85ROwCRU2j1Yu+fGhi7ZG072Iau3Bc6BacrE4ejJ6EKgySyzy+yrdptpIKJ8HlbahrHZKFImjnEcIeHU6FuIlfk4U3AJObstH2L9C7hmJKTQKEBg0h7sUE/DJLT5x5FbeRWZ99kcTVFSY9wDR/kN5Pxkn6vBFyPUTjFhEPYjs6YBqYkiE/NIfTeODOqpyEUNFMUwCNmy7bNyJr5M787pfuwxhwfhh+1YhWIxtgWKGXafh6IYSQuVjssIUgxMwdFLIZGc8IEHKxV5iFL3xGg37AnzfnAtu68jUlYFueIa1i4IiFDaOfYa2XcGqRfHKnzlxVzdeepYSZVmkfXyERwfrGWnktQvc7If6T62yrxhVRKwCvX6jTet3KK8C4EiN5Y6hrEw6YV811rLhzwPRSi19dhqqmFCFzvINPzI7rwN51B8ZQ4pNNA4iNW2UgTpVOL835Fb0qz/atL7EEPNyPrm01+MutwIPaUOI3khw9Y5aTggeISu1FN8RCHm5YQX7fQ8qlDk9WpR4eRlinQhW37rDtgXpc1Yz2xrsYtLg4StCHz+iHD1IazVPQgY6hnSLzgGKGbov6y4irHY58W/T13YKS2grIHCGoTfeLHcV4V1w9V6+v0zwz2j78MuSH9uYp2SKhwbnKbvYB5hJjHOmyo7OdIC4ckP6segL5wAb7rR1Jd5dslrzSxLYQeE6/ktXbYVCmJp0YfghpRQKbWPsVVXjs0iEWGBxzalVXhZQtrMFJwj/eCHJigbY2FuFpFI7EJNvvT2wPf3NxRF1QD/AbAv8WdRHzjKAAAAAElFTkSuQmCC':'3',
  32. 'data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAABUAAAAbCAYAAACTHcTmAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAHHSURBVEhLrZW9LwNhHMe/WrT10mrKVE2EROIfUAuTTQxMLISBQSxeIjQSTZRIsYgYhYVRIrWzaCxiMjFVoqjWaatPaR9Pe09bbfT6XHKf5Mn9vne9T+55fs/1qhxtnRRqWD1DcLILSR5Nfg+aR495ktHxoyBDiA8WhOVQJaXeKUgtPCggLrXPs6dsxzePSghLU9sjiBh4qICYtG8fUo8Z6UxNXlEvZc+WRUDaC+LpR5SnhssLGHldjopS6l1BpFWuda9XsEwH5KCAstS5iU/WHHkLSbAerAmtl8JvupH0DOCDN8d4e4q6wyc5VKCslHrdCHdwI7mHZXZHrgX4X9r3d9oElvMN1Io9ZJZ/pL1IeIbz06598KFx8UYOgpRI7fg52UWIdzszbev4Mqp4FKVYOrGJSG6Ts27btmZUTTtHQcrWUVpy4otHk39PuNulyFL7GOJ7hXWsCfhgK/mPVAOTstfwaAEhMz9DHmF1zalexyIcbj81UUqh0TBdr9OS7muDDoRAz4ZBxajmN2dggqJrepKE+g8fWFPvXPkeaPDhE0MzaeIrhpfnAGJRSTvp+1sQJBFHOBTUTppOp7LHzM7STGpusvEK+AUL4d3X/AgqvQAAAABJRU5ErkJggg==':'4',
  33. 'data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAABUAAAAcCAYAAACOGPReAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAIxSURBVEhLrZU/aBNRHMe/bWKexnoiaSg0FSSCaAfFwT+L7dKloUs7OqRVcHBwcZOCiCAOhk4dxAwdHFRwEEoRSjvoZNqhdDE4tC7aIYmWvOiV1941vnf51dy7S0ou6Qfu+P5+B9/7/e7e+72us+cuVHHE+EzF0jcUzlPQCjyH/itphChUdKub+bcCXv4tVQr7hsp0hmNqWXsob5ek6kWVqUxneNpPw1yfxi+nWo7Y02uIzjkPAuFUWucSrKNqvzEcoUWSAdFNbyewSxJK/SQZEN1U+0kCXaSCopvGGfZJgsv2SQbFY2rI+jqn+Y/ipbYr1dap/WYVWzfra0q98f/nkDDBcWwjj+j7WbC5Fcr6aV6pxG2oEMzAn8EbKDx+ja31jxBytTRCM7WNepVhIWRl6qKEB9tIovDsA8w7fuPWR9/QPezenQAfTmKHUg5iE32To4jkKJYc2r7G5ywiU6PoTWUQK7rKZ0lU7o9TUKN10wPyWUQfLOA0hQrz6jhs0orgporcI0TXXNUacVgkFe2ZSsI/iqT8tG162DBv23RvYICURG4K3xkVmKEZmIOkJWqXhUkrgpsm0tjJjKBCoRqRp+afkK7hMr2I6tgt0g1IXIf94h22l6dRkiPygMjXtzj5kgLCtaOeg3+fQNnR/u1pMaatRUVkYwHxyYfo9pwQTdpncnjol24o0PMpg74Rv6HCZbqC41/y6OG1QeKdpSGZO1HcRGz+FRKpyzgzlaUnXoB/3J2gmVZucHAAAAAASUVORK5CYII=':'5',
  34. 'data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAABUAAAAdCAYAAABFRCf7AAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAANLSURBVEhLrZZNSFRRFMf/48e8UZtRktFkRsiEdCIKVwaikrlJbZG0MEGDwEWUIPaBQoiIZIJGG4mikoyyIBJKW4gbs4W66WOhtlAXzixq/HzGjG/8eN0378yb+5w3qdAPLnPOmXf/nHfvOfc+U+bR4zL+M/sTrW6F71Ih/CfskAQB2xQ2SyLMU5OwPr+HuEEPRfcSddXB96QeK04BOxQyZg7pWedhJi+GfiOp7sHqwC0s7RKMkyQIwaGfzGdmLFrUAbGlFOsC+ZBwaLwfjqoSZOSeQlpw5MBR1oQjw3NIoKdCGLz+Rfgn72PRTq7khr2tFpbX4TWLwJULTM+QY5Cp/PgGlkOCEJHauYegAieosEuUbUyxU1tDy9c3SOzdQ9AAvWh7ObeOblg7u8k+GJyoA4E8FzbJi5mdhGWCnAPCiVZhM5tMRuLsAFkHJyxakcu6hWy2QcL4pGpW3IR/6AsWZ35iYV4dnvkfWBp7C/+dMvWZ3SglFRzPpuR4WZYRHAtyWsFZ2fFhVha0mPEQFkbljALSoBHO1G7V1hMIQG54Cu+FY6zsVcyhTiI/hOQswq9PfdhyUIChiW7bbWQpOLDOBANMMknppLIcpIc6KasEzrYhJIv0KGPHlo/VrlrydBvFI2CDNXfyu+s4fLkVMdMUDuKBqbcRtvr3SA69BsN/phIByjaKKPvDPQLr7THyDPjcDOuwmxNwYaNBtaKKWse7YSI7GqbO70giWyHgVJdAE431covESipuah/t6fkGMzdNsruCv+FMveuIJzMavpMlEItryIskdGaERYc9XLnYsO0kk2Mr1YG1c3XkRZLgVXc0LDoxAYF7lY28yMm20ZfIbCkij5GfD4mrxFhRPQK5jepjR52XbEW0XCuRaOxcO40/ZLP1g+Wj2tqcKHMesZuRbKVEVl506O4eHRU9WCvWTnPEz47BMqjaOlFMNLJSErVgILsSiyMPsJ3Pp5yLnfY+LHeVclm6kdLWrJWgwR1VCGmkB7+z9V2u9H5wErv3uUZiiEh5xZK5G24UfaZBxiBcaUL6lIhYiigEFLFdgjHsUkztrNEJKvz7Y6K6A76rhfA5lS+TUB1KrHQ8SBztR8LDPpgMemR/nz0HAvgL80YzEyuMQpQAAAAASUVORK5CYII=':'6',
  35. 'data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAABQAAAAeCAYAAAAsEj5rAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAHhSURBVEhLrZY9LANhGMf/PprDVQkxyFXSVCKIwYStiZoqhoqEhTCQWCwiBBEDiUTMBpOJhKQDkw1L1YDFxoSlBi2tlurrrn2uH9xX2/sll/6f4X557n3e903LWhxtDCZSTr/mIXXY4thgjSHGwEp76o7amOkdmih8BHcMlDAULz4DW3htSlf8+RIaJn3Fd8i2ZxAiGeK3sK34UrE4oTCP6JAT31TWneyg8jmdixKyNQ/eOCqCF7AuBKgoRigs48NlR5LK+rP1PEnBwuRmfnf8Kn0rUZhQWEfEJU/if3cSBQmTmwN4o6zUnYRxobh2kb5sd7X+PcWXDQvZohthee3EfWedy042F4PCCXzmTLbGf4hKyn8xJtwYRthGGU/gd9OnQgkDwh7EXB2ZU2G5v0TVFRUK6At7xxCzUxbhb/YoKaMrTM724J2yNIxqha2Si47Qi1hndqtw9wHFYUS7+hF2jaeytnDKi2jGFwfv36GcT6JRQMg9ncqaF+zPwTVe+mi84uc2t4+qbhcZjQ49+GrN7BVYHu50ZRLqwt5BxLLLh6qHfUraqAtHnIhSFG8CcGfa05VRFSZahcxRQ/wZllPKOqgIPfi2yzeBSPAVFRT1UBF2I5GzflzwEWWU9TD5zxLwC1sVsHrJiVs0AAAAAElFTkSuQmCC':'7',
  36. 'data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAABQAAAAdCAYAAACqhkzFAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAANtSURBVEhLrZXfS1NhGMe/rumZbR4nOcO2IA1CvQi8UW8y8EJqZCR1IQiKwvRCuiqTfomtkkrqIpN+EFSGNaFECL0IbzQvnH/A6EavNiinJVubO/5a73nPs51zNqf04wPjfJ8X9uV5n/d93ifr8JFjcfxHMhueuYS1dieiFTZIgoAtvihBCAVhnptErvshDAG+qGMHwzJsvh7Cj5MO9vfMGCQ/Ckb6sP/2F1pRMNCXsGPz/Vt8TzEzSiwz/qMFxrbgwEr7I0Tb7LSioDe8OYSVGhHbFOYEZ1DcVIfisuMo4r86ONxTyEsai1jpGcK6xlNj6MRaQznWKTL4p1BU5YLRqy1UAFmvumDtGEN+wlQoR7SnigKd4Qls2EiyDVs/dSGLojRmrsIyF6QAiFQ0ktIaslokspMzMT4gmQFDMEyK1ZO+MqqhL4x9JFn1EK8m+Yeohl4vu2Ok4UCsWa1LOmw3FaWkAbNfvTqaGg4jd86fXAjX34JUS0EK8YGX+FlBARZhfjpJWmfIbnlnHwoX6PiEUiy9mEVkwIV4ubKEWheksVksXSilekvI/9APwcsDTnqn2JsQ81zDikPQFTsdCXmf+2Ht9FCsoMuQE/DAdHkQBeqt2BHz9CDy3XozmZQM7dh+Pozlen3rGViUzRa22COxSWsycj8fcLfA9E69/JoM5T4exTeNWe7CBA6x1rOXKK1XXCK33gSsdBvkfg7eHdX1s5phG8ustxprPJCL3QWxW/+SJLE7Ib25h6WjghKHvCh2tsDIEqUMqxBrT5ixa+3zZDaTCUxCaPXAmtiKWI1f1M+KYXUr1hxcMSRYpvtJ70KgH7k+tdLhGhe/FYphvV1zCHv3cQLjguYlsjn4gSmGooANLv4N+TAUw2AIVF5GIbbaSO7BlqOQFEMK8cdFMRxZhIkLGRGRBhfp3XAhVimSZkbBgMYw8AQmH1ecWGVH2qzQEo3kYfVUGKvqtpA35+EPsmLIDiLn/hQsSsBgs6J3HKHHLYin+p5n47XtLMLP3MleN7DZY+me51rXevE741huLkeM4gQ5bOIp40BgM5qLJAZpEYUdpyHMUKx8FLJunIPtutpaCdZZD8vDPtXM5J/BwUbVTGaHQS9Thu0rF9kUrELEJmKDGSW2J7DTzPbNwzIyiOyPX2lVJYPh3wL8BvLZG6cpuRANAAAAAElFTkSuQmCC':'8',
  37. 'data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAABQAAAAcCAYAAABh2p9gAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAMzSURBVEhLpZZPSBRhGMYfV9dpdV3UHDVXIw1KDUwJVy/VLTAVWugQRJqUpxAkFyuMIBMPWRGYiCGGC7J0KCRKL13Si9pBvKiH9NIYoavgqKvjujt9M/OuM+uustUPvpn3edl9eL/3+7Mbl3fqjIxoFDnhb76Bzcoi7No47FI6QRJxbHYKKQOdSPi8RFmdKIZ2BDt6sHazCNuUiY4E67cXSLvtJq1hojdhx57nPX4fMDOxL3OSMiihwmHzchu8njrSGmGGclc/Vit5BEibxEXw7bdgzy9BZqEyziLP5UH6Cn2AsV3ZBF+DnVTYlBuxNe/CGqcpSHPIdl6DeY60EXsdfCNtWLVp0rQyhhOORrU6vcKOamyEzNgUU4fuRTdTWHIj6fUkLCSDfCl2GrR433CvuAB+ipXqLM8iVzCMd29gFSiGDb4rWi/J0IE9fr88QFhEAoWHMwWzIFLMeplbAaV3ZFiIIPXjb4gXvBQx+Ax1MfUeGuEM1cYKZzMauhFv2Arg2X6k8CgCuRkUKaQgWGOo0CwYHLlS+LocJA7B3oKdMmOfOMi8wdDUy84nxQrrtU8h1egbNpyLkAbr9T1rQO/h5EtYJ0Q9wRVguXsYG30tCFwq1HJ2B4KtPdiY6cfyac3NrD4VJMQpk1ROij7uyJk/dmTIcgxjXT7+aUK27OsFOZN56BWqjIOrf4isWRHxlImOiLSh+0iaJqnCKmTPA4aMpREkVpcjx/UWGdOLSBZDNw0booC0iY/IuVoO6+NxoJjXbyVRK+LwCzYGAp7v+FWprbR5dhDZ1Z1RKowZB/y5+rbhhK/qO2bD/FMncb7kHClGRT07vxRDgGVgSo1iNrTZUnChrIQUm26zA5sUm4QZcJNa/G89bHDD+6SCFkRCem8Vkp9r1114hfbDToaBmlcQH4TMgMSFL0giM4Vww2Z2AqaGsd3qpIQB5We1bxTe7mqsh46ctIjU9kfq/gsRPuWuUfy8XkCCrRzbexTBz0yCpBRMzCzDdRfcgd/mIxdFYveiNsLNOGEMWc6qCDOFA4vCbu7WJmzXOrDF21SjEBz7x2Bm/xisQ90wf5inbCT/dVIiAf4ApbEnkB6qHqsAAAAASUVORK5CYII=':'9'
  38. }
  39. html_tree = etree.HTML(info) # 利用etree库解析数据包中的td标签
  40. td_list = html_tree.xpath('//td') # 选择所有的td标签
  41. def PX(A, num): # A为正确索引值列表,num为数值列表,该函数输出正确排序的数值
  42. dict={}
  43. for i in range(len(A)):
  44. dict[str(A[i])]=num[i]
  45. s=''
  46. for j in range(len(dict)):
  47. s+=dict[str(j)]
  48. return s
  49. for td in td_list: # 每一个td标签下有很多img,js正是对每个td标签下的img进行了隐藏,偏移操作,所以这个for循环下有很多相应的操作。
  50. td_idv = etree.tostring(td).decode('utf-8') # 用tostring()获得每个模块的td标签,命名为td_idv。
  51. td_idv_list = td.xpath('./img') #用xpath选择td下的所有img, td_idv_list是一个列表类型。
  52. num = [] # 用于存放所显示的数字
  53. num_pos = [] # 用于存放num中数字的索引值
  54. num_iv = [] # 用于存放num中数字的偏移值
  55. for img in td_idv_list: # 每个td_idv下的img标签
  56. cla = img.xpath('./@class')[0] #cla为img的class属性值
  57. src = img.xpath('./@src')[0] #src为img的src属性值
  58. style = img.xpath('./@style')[0] #style为img的style属性值
  59. if j_key in cla: # 如果j_key值存在于img的class属性值,则把这个img移除。
  60. td.remove(img)
  61. else: # 如果j_key不在img的class属性值里:
  62. img.attrib.pop('class') # 将img的class属性及属性值删除
  63. img.set('style',style.replace('left:', '').replace('px', '')) # 将img的style属性值中'left:'和'px'换为空值,因为这样方便获取其偏移值。
  64. img.set('src',css_dict[src]) # 将src的属性值设定为css_dict[src],其实就是把src中图片base64编码内容换为数值。
  65. a = str(img.xpath('./@src')[0]) # 用a代表数值,并转换为str类型
  66. b = int(float(img.xpath('./@style')[0])/11.5) # 用b代表 偏移值/11.5 的值,我们发现其偏移值总是11.5的倍数,为了方便操作,都将其除以11.5
  67. num.append(a) # 将a存放在列表num中
  68. num_iv.append(b) # 将b存放在列表num_iv中
  69. for i in range(len(num)): #这个for循环将num中的初始索引值单独存放在列表num_pos中
  70. num_pos.append(i)
  71. A = list(np.array(num_pos) + np.array(num_iv)) # 利用矩阵的加法,将初始索引值和偏移值相加,得到正确的索引值,到这里就解决了偏移问题。
  72. print(PX(A, num))
  73. #print(etree.tostring(td, pretty_print=True).decode('utf-8')) # 输出显示数字的HTML+
  74. #print('&*%^'*50)

声明:本文内容由网友自发贡献,不代表【wpsshop博客】立场,版权归原作者所有,本站不承担相应法律责任。如您发现有侵权的内容,请联系我们。转载请注明出处:https://www.wpsshop.cn/article/detail/59775
推荐阅读
相关标签
  

闽ICP备14008679号