文章目录
1. 网址
https://g.hongshu.com/content/96680/14747430.html
2. 抓包分析
得出结论:
(1)部分数据通过伪元素加载
(2)伪元素加载的数据都包裹在span标签内
(3)每个span标签的class属性值都不就一样
(4)class 属性值都是context_kw + 数字
形式表示
3. 科普
伪元素:整个css就两个伪元素;::before
和 ::after
4. 解决问题第一步
首先查看网页源代码;发现一堆js文件,暂时不清楚是啥玩意儿
5. 解决问题第二步
全局搜索.context_kw
; 只有一个显示,正是网页源代码显示的内容
6. 点击进入
继续搜索 .context_kw
; 显示在script标签里,既然是在script标签里,那大概率是能在控制台输出结果的
控制台输出结果正是伪元素的显示形式,说明这段js文件大概率是有用的
7. 分析js文件
先将整段js代码抠出来,便于分析; 数据量过大,不方便显示;从494行一直到1355行
8. 解读js文件(1)
前面这一部分都是和CryptoJS相关的内容,先折叠起来不管
9. 解读js文件(2)
后面这一部分也并非什么正常人可读的数据,都是通过混淆过后的数据,看的一脸懵逼;虽然正常人是不可读,但是浏览器是可读的;可通过浏览器控制台查看变量内容。
js文件:
浏览器显示:
显示内容千差万别;
这里就没什么好的办法了,只有一个一个看(一般情况查看等号左侧的变量名就好了,赋值才是有意义的变量)
10. 解读js文件(3)
我这里是在791~792行,在控制台查看这两个变量名;words就是我们需要的数据
11. 解读js文件(4)
var secWords = decrypted[_0xfbb0('0x13')](CryptoJS[_0xfbb0('0xb')][_0xfbb0('0x14')])['split'](',');
var words = new Array(secWords['length']);
浏览器查看相关数据
12. 解读js文件(5)
注意看words的索引号;回过头再来看伪元素的类名
也:12
个:5
正好和words的索引号是吻合的
13. 以上就是全部分析
14. 代码实现
15. 先将所有js代码封装在一个function里面通过node执行
16. bug解决(1)
报错:ReferenceError: document is not defined
原因:document 是客户端才有的东西,服务端没有
解决:将所有document相关的代码都删除
17. bug解决(2)
window也是客户端的东西,删除所有与window相关的代码
18. 源码参考
function spider() {
var CryptoJS = CryptoJS || function (u, p) {
var d = {}
, l = d.lib = {}
, s = function () {
}
, t = l.Base = {
extend: function (a) {
s.prototype = this;
var c = new s;
a && c.mixIn(a);
c.hasOwnProperty("init") || (c.init = function () {
c.$super.init.apply(this, arguments)
}
);
c.init.prototype = c;
c.$super = this;
return c
},
create: function () {
var a = this.extend();
a.init.apply(a, arguments);
return a
},
init: function () {
},
mixIn: function (a) {
for (var c in a)
a.hasOwnProperty(c) && (this[c] = a[c]);
a.hasOwnProperty("toString") && (this.toString = a.toString)
},
clone: function () {
return this.init.prototype.extend(this)
}
}
, r = l.WordArray = t.extend({
init: function (a, c) {
a = this.words = a || [];
this.sigBytes = c != p ? c : 4 * a.length
},
toString: function (a) {
return (a || v).stringify(this)
},
concat: function (a) {
var c = this.words
, e = a.words
, j = this.sigBytes;
a = a.sigBytes;
this.clamp();
if (j % 4)
for (var k = 0; k < a; k++)
c[j + k >>> 2] |= (e[k >>> 2] >>> 24 - 8 * (k % 4) & 255) << 24 - 8 * ((j + k) % 4);
else if (65535 < e.length)
for (k = 0; k < a; k += 4)
c[j + k >>> 2] = e[k >>> 2];
else
c.push.apply(c, e);
this.sigBytes += a;
return this
},
clamp: function () {
var a = this.words
, c = this.sigBytes;
a[c >>> 2] &= 4294967295 << 32 - 8 * (c % 4);
a.length = u.ceil(c / 4)
},
clone: function () {
var a = t.clone.call(this);
a.words = this.words.slice(0);
return a
},
random: function (a) {
for (var c = [], e = 0; e < a; e += 4)
c.push(4294967296 * u.random() | 0);
return new r.init(c, a)
}
})
, w = d.enc = {}
, v = w.Hex = {
stringify: function (a) {
var c = a.words;
a = a.sigBytes;
for (var e = [], j = 0; j < a; j++) {
var k = c[j >>> 2] >>> 24 - 8 * (j % 4) & 255;
e.push((k >>> 4).toString(16));
e.push((k & 15).toString(16))
}
return e.join("")
},
parse: function (a) {
for (var c = a.length, e = [], j = 0; j < c; j += 2)
e[j >>> 3] |= parseInt(a.substr(j, 2), 16) << 24 - 4 * (j % 8);
return new r.init(e, c / 2)
}
}
, b = w.Latin1 = {
stringify: function (a) {
var c = a.words;
a = a.sigBytes;
for (var e = [], j = 0; j < a; j++)
e.push(String.fromCharCode(c[j >>> 2] >>> 24 - 8 * (j % 4) & 255));
return e.join("")
},
parse: function (a) {
for (var c = a.length, e = [], j = 0; j < c; j++)
e[j >>> 2] |= (a.charCodeAt(j) & 255) << 24 - 8 * (j % 4);
return new r.init(e, c)
}
}
, x = w.Utf8 = {
stringify: function (a) {
try {
return decodeURIComponent(escape(b.stringify(a)))
} catch (c) {
throw Error("Malformed UTF-8 data");
}
},
parse: function (a) {
return b.parse(unescape(encodeURIComponent(a)))
}
}
, q = l.BufferedBlockAlgorithm = t.extend({
reset: function () {
this._data = new r.init;
this._nDataBytes = 0
},
_append: function (a) {
"string" == typeof a && (a = x.parse(a));
this._data.concat(a);
this._nDataBytes += a.sigBytes
},
_process: function (a) {
var c = this._data
, e = c.words
, j = c.sigBytes
, k = this.blockSize
, b = j / (4 * k)
, b = a ? u.ceil(b) : u.max((b | 0) - this._minBufferSize, 0);
a = b * k;
j = u.min(4 * a, j);
if (a) {
for (var q = 0; q < a; q += k)
this._doProcessBlock(e, q);
q = e.splice(0, a);
c.sigBytes -= j
}
return new r.init(q, j)
},
clone: function () {
var a = t.clone.call(this);
a._data = this._data.clone();
return a
},
_minBufferSize: 0
});
l.Hasher = q.extend({
cfg: t.extend(),
init: function (a) {
this.cfg = this.cfg.extend(a);
this.reset()
},
reset: function () {
q.reset.call(this);
this._doReset()
},
update: function (a) {
this._append(a);
this._process();
return this
},
finalize: function (a) {
a && this._append(a);
return this._doFinalize()
},
blockSize: 16,
_createHelper: function (a) {
return function (b, e) {
return (new a.init(e)).finalize(b)
}
},
_createHmacHelper: function (a) {
return function (b, e) {
return (new n.HMAC.init(a, e)).finalize(b)
}
}
});
var n = d.algo = {};
return d
}(Math);
(function () {
var u = CryptoJS
, p = u.lib.WordArray;
u.enc.Base64 = {
stringify: function (d) {
var l = d.words
, p = d.sigBytes
, t = this._map;
d.clamp();
d = [];
for (var r = 0; r < p; r += 3)
for (var w = (l[r >>> 2] >>> 24 - 8 * (r % 4) & 255) << 16 | (l[r + 1 >>> 2] >>> 24 - 8 * ((r + 1) % 4) & 255) << 8 | l[r + 2 >>> 2] >>> 24 - 8 * ((r + 2) % 4) & 255, v = 0; 4 > v && r + 0.75 * v < p; v++)
d.push(t.charAt(w >>> 6 * (3 - v) & 63));
if (l = t.charAt(64))
for (; d.length % 4;)
d.push(l);
return d.join("")
},
parse: function (d) {
var l = d.length
, s = this._map
, t = s.charAt(64);
t && (t = d.indexOf(t),
-1 != t && (l = t));
for (var t = [], r = 0, w = 0; w < l; w++)
if (w % 4) {
var v = s.indexOf(d.charAt(w - 1)) << 2 * (w % 4)
, b = s.indexOf(d.charAt(w)) >>> 6 - 2 * (w % 4);
t[r >>> 2] |= (v | b) << 24 - 8 * (r % 4);
r++
}
return p.create(t, r)
},
_map: "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/="
}
}
)();
(function (u) {
function p(b, n, a, c, e, j, k) {
b = b + (n & a | ~n & c) + e + k;
return (b << j | b >>> 32 - j) + n
}
function d(b, n, a, c, e, j, k) {
b = b + (n & c | a & ~c) + e + k;
return (b << j | b >>> 32 - j) + n
}
function l(b, n, a, c, e, j, k) {
b = b + (n ^ a ^ c) + e + k;
return (b << j | b >>> 32 - j) + n
}
function s(b, n, a, c, e, j, k) {
b = b + (a ^ (n | ~c)) + e + k;
return (b << j | b >>> 32 - j) + n
}
for (var t = CryptoJS, r = t.lib, w = r.WordArray, v = r.Hasher, r = t.algo, b = [], x = 0; 64 > x; x++)
b[x] = 4294967296 * u.abs(u.sin(x + 1)) | 0;
r = r.MD5 = v.extend({
_doReset: function () {
this._hash = new w.init([1732584193, 4023233417, 2562383102, 271733878])
},
_doProcessBlock: function (q, n) {
for (var a = 0; 16 > a; a++) {
var c = n + a
, e = q[c];
q[c] = (e << 8 | e >>> 24) & 16711935 | (e << 24 | e >>> 8) & 4278255360
}
var a = this._hash.words
, c = q[n + 0]
, e = q[n + 1]
, j = q[n + 2]
, k = q[n + 3]
, z = q[n + 4]
, r = q[n + 5]
, t = q[n + 6]
, w = q[n + 7]
, v = q[n + 8]
, A = q[n + 9]
, B = q[n + 10]
, C = q[n + 11]
, u = q[n + 12]
, D = q[n + 13]
, E = q[n + 14]
, x = q[n + 15]
, f = a[0]
, m = a[1]
, g = a[2]
, h = a[3]
, f = p(f, m, g, h, c, 7, b[0])
, h = p(h, f, m, g, e, 12, b[1])
, g = p(g, h, f, m, j, 17, b[2])
, m = p(m, g, h, f, k, 22, b[3])
, f = p(f, m, g, h, z, 7, b[4])
, h = p(h, f, m, g, r, 12, b[5])
, g = p(g, h, f, m, t, 17, b[6])
, m = p(m, g, h, f, w, 22, b[7])
, f = p(f, m, g, h, v, 7, b[8])
, h = p(h, f, m, g, A, 12, b[9])
, g = p(g, h, f, m, B, 17, b[10])
, m = p(m, g, h, f, C, 22, b[11])
, f = p(f, m, g, h, u, 7, b[12])
, h = p(h, f, m, g, D, 12, b[13])
, g = p(g, h, f, m, E, 17, b[14])
, m = p(m, g, h, f, x, 22, b[15])
, f = d(f, m, g, h, e, 5, b[16])
, h = d(h, f, m, g, t, 9, b[17])
, g = d(g, h, f, m, C, 14, b[18])
, m = d(m, g, h, f, c, 20, b[19])
, f = d(f, m, g, h, r, 5, b[20])
, h = d(h, f, m, g, B, 9, b[21])
, g = d(g, h, f, m, x, 14, b[22])
, m = d(m, g, h, f, z, 20, b[23])
, f = d(f, m, g, h, A, 5, b[24])
, h = d(h, f, m, g, E, 9, b[25])
, g = d(g, h, f, m, k, 14, b[26])
, m = d(m, g, h, f, v, 20, b[27])
, f = d(f, m, g, h, D, 5, b[28])
, h = d(h, f, m, g, j, 9, b[29])
, g = d(g, h, f, m, w, 14, b[30])
, m = d(m, g, h, f, u, 20, b[31])
, f = l(f, m, g, h, r, 4, b[32])
, h = l(h, f, m, g, v, 11, b[33])
, g = l(g, h, f, m, C, 16, b[34])
, m = l(m, g, h, f, E, 23, b[35])
, f = l(f, m, g, h, e, 4, b[36])
, h = l(h, f, m, g, z, 11, b[37])
, g = l(g, h, f, m, w, 16, b[38])
, m = l(m, g, h, f, B, 23, b[39])
, f = l(f, m, g, h, D, 4, b[40])
, h = l(h, f, m, g, c, 11, b[41])
, g = l(g, h, f, m, k, 16, b[42])
, m = l(m, g, h, f, t, 23, b[43])
, f = l(f, m, g, h, A, 4, b[44])
, h = l(h, f, m, g, u, 11, b[45])
, g = l(g, h, f, m, x, 16, b[46])
, m = l(m, g, h, f, j, 23, b[47])
, f = s(f, m, g, h, c, 6, b[48])
, h = s(h, f, m, g, w, 10, b[49])
, g = s(g, h, f, m, E, 15, b[50])
, m = s(m, g, h, f, r, 21, b[51])
, f = s(f, m, g, h, u, 6, b[52])
, h = s(h, f, m, g, k, 10, b[53])
, g = s(g, h, f, m, B, 15, b[54])
, m = s(m, g, h, f, e, 21, b[55])
, f = s(f, m, g, h, v, 6, b[56])
, h = s(h, f, m, g, x, 10, b[57])
, g = s(g, h, f, m, t, 15, b[58])
, m = s(m, g, h, f, D, 21, b[59])
, f = s(f, m, g, h, z, 6, b[60])
, h = s(h, f, m, g, C, 10, b[61])
, g = s(g, h, f, m, j, 15, b[62])
, m = s(m, g, h, f, A, 21, b[63]);
a[0] = a[0] + f | 0;
a[1] = a[1] + m | 0;
a[2] = a[2] + g | 0;
a[3] = a[3] + h | 0
},
_doFinalize: function () {
var b = this._data
, n = b.words
, a = 8 * this._nDataBytes
, c = 8 * b.sigBytes;
n[c >>> 5] |= 128 << 24 - c % 32;
var e = u.floor(a / 4294967296);
n[(c + 64 >>> 9 << 4) + 15] = (e << 8 | e >>> 24) & 16711935 | (e << 24 | e >>> 8) & 4278255360;
n[(c + 64 >>> 9 << 4) + 14] = (a << 8 | a >>> 24) & 16711935 | (a << 24 | a >>> 8) & 4278255360;
b.sigBytes = 4 * (n.length + 1);
this._process();
b = this._hash;
n = b.words;
for (a = 0; 4 > a; a++)
c = n[a],
n[a] = (c << 8 | c >>> 24) & 16711935 | (c << 24 | c >>> 8) & 4278255360;
return b
},
clone: function () {
var b = v.clone.call(this);
b._hash = this._hash.clone();
return b
}
});
t.MD5 = v._createHelper(r);
t.HmacMD5 = v._createHmacHelper(r)
}
)(Math);
(function () {
var u = CryptoJS
, p = u.lib
, d = p.Base
, l = p.WordArray
, p = u.algo
, s = p.EvpKDF = d.extend({
cfg: d.extend({
keySize: 4,
hasher: p.MD5,
iterations: 1
}),
init: function (d) {
this.cfg = this.cfg.extend(d)
},
compute: function (d, r) {
for (var p = this.cfg, s = p.hasher.create(), b = l.create(), u = b.words, q = p.keySize, p = p.iterations; u.length < q;) {
n && s.update(n);
var n = s.update(d).finalize(r);
s.reset();
for (var a = 1; a < p; a++)
n = s.finalize(n),
s.reset();
b.concat(n)
}
b.sigBytes = 4 * q;
return b
}
});
u.EvpKDF = function (d, l, p) {
return s.create(p).compute(d, l)
}
}
)();
CryptoJS.lib.Cipher || function (u) {
var p = CryptoJS
, d = p.lib
, l = d.Base
, s = d.WordArray
, t = d.BufferedBlockAlgorithm
, r = p.enc.Base64
, w = p.algo.EvpKDF
, v = d.Cipher = t.extend({
cfg: l.extend(),
createEncryptor: function (e, a) {
return this.create(this._ENC_XFORM_MODE, e, a)
},
createDecryptor: function (e, a) {
return this.create(this._DEC_XFORM_MODE, e, a)
},
init: function (e, a, b) {
this.cfg = this.cfg.extend(b);
this._xformMode = e;
this._key = a;
this.reset()
},
reset: function () {
t.reset.call(this);
this._doReset()
},
process: function (e) {
this._append(e);
return this._process()
},
finalize: function (e) {
e && this._append(e);
return this._doFinalize()
},
keySize: 4,
ivSize: 4,
_ENC_XFORM_MODE: 1,
_DEC_XFORM_MODE: 2,
_createHelper: function (e) {
return {
encrypt: function (b, k, d) {
return ("string" == typeof k ? c : a).encrypt(e, b, k, d)
},
decrypt: function (b, k, d) {
return ("string" == typeof k ? c : a).decrypt(e, b, k, d)
}
}
}
});
d.StreamCipher = v.extend({
_doFinalize: function () {
return this._process(!0)
},
blockSize: 1
});
var b = p.mode = {}
, x = function (e, a, b) {
var c = this._iv;
c ? this._iv = u : c = this._prevBlock;
for (var d = 0; d < b; d++)
e[a + d] ^= c[d]
}
, q = (d.BlockCipherMode = l.extend({
createEncryptor: function (e, a) {
return this.Encryptor.create(e, a)
},
createDecryptor: function (e, a) {
return this.Decryptor.create(e, a)
},
init: function (e, a) {
this._cipher = e;
this._iv = a
}
})).extend();
q.Encryptor = q.extend({
processBlock: function (e, a) {
var b = this._cipher
, c = b.blockSize;
x.call(this, e, a, c);
b.encryptBlock(e, a);
this._prevBlock = e.slice(a, a + c)
}
});
q.Decryptor = q.extend({
processBlock: function (e, a) {
var b = this._cipher
, c = b.blockSize
, d = e.slice(a, a + c);
b.decryptBlock(e, a);
x.call(this, e, a, c);
this._prevBlock = d
}
});
b = b.CBC = q;
q = (p.pad = {}).Pkcs7 = {
pad: function (a, b) {
for (var c = 4 * b, c = c - a.sigBytes % c, d = c << 24 | c << 16 | c << 8 | c, l = [], n = 0; n < c; n += 4)
l.push(d);
c = s.create(l, c);
a.concat(c)
},
unpad: function (a) {
a.sigBytes -= a.words[a.sigBytes - 1 >>> 2] & 255
}
};
d.BlockCipher = v.extend({
cfg: v.cfg.extend({
mode: b,
padding: q
}),
reset: function () {
v.reset.call(this);
var a = this.cfg
, b = a.iv
, a = a.mode;
if (this._xformMode == this._ENC_XFORM_MODE)
var c = a.createEncryptor;
else
c = a.createDecryptor,
this._minBufferSize = 1;
this._mode = c.call(a, this, b && b.words)
},
_doProcessBlock: function (a, b) {
this._mode.processBlock(a, b)
},
_doFinalize: function () {
var a = this.cfg.padding;
if (this._xformMode == this._ENC_XFORM_MODE) {
a.pad(this._data, this.blockSize);
var b = this._process(!0)
} else
b = this._process(!0),
a.unpad(b);
return b
},
blockSize: 4
});
var n = d.CipherParams = l.extend({
init: function (a) {
this.mixIn(a)
},
toString: function (a) {
return (a || this.formatter).stringify(this)
}
})
, b = (p.format = {}).OpenSSL = {
stringify: function (a) {
var b = a.ciphertext;
a = a.salt;
return (a ? s.create([1398893684, 1701076831]).concat(a).concat(b) : b).toString(r)
},
parse: function (a) {
a = r.parse(a);
var b = a.words;
if (1398893684 == b[0] && 1701076831 == b[1]) {
var c = s.create(b.slice(2, 4));
b.splice(0, 4);
a.sigBytes -= 16
}
return n.create({
ciphertext: a,
salt: c
})
}
}
, a = d.SerializableCipher = l.extend({
cfg: l.extend({
format: b
}),
encrypt: function (a, b, c, d) {
d = this.cfg.extend(d);
var l = a.createEncryptor(c, d);
b = l.finalize(b);
l = l.cfg;
return n.create({
ciphertext: b,
key: c,
iv: l.iv,
algorithm: a,
mode: l.mode,
padding: l.padding,
blockSize: a.blockSize,
formatter: d.format
})
},
decrypt: function (a, b, c, d) {
d = this.cfg.extend(d);
b = this._parse(b, d.format);
return a.createDecryptor(c, d).finalize(b.ciphertext)
},
_parse: function (a, b) {
return "string" == typeof a ? b.parse(a, this) : a
}
})
, p = (p.kdf = {}).OpenSSL = {
execute: function (a, b, c, d) {
d || (d = s.random(8));
a = w.create({
keySize: b + c
}).compute(a, d);
c = s.create(a.words.slice(b), 4 * c);
a.sigBytes = 4 * b;
return n.create({
key: a,
iv: c,
salt: d
})
}
}
, c = d.PasswordBasedCipher = a.extend({
cfg: a.cfg.extend({
kdf: p
}),
encrypt: function (b, c, d, l) {
l = this.cfg.extend(l);
d = l.kdf.execute(d, b.keySize, b.ivSize);
l.iv = d.iv;
b = a.encrypt.call(this, b, c, d.key, l);
b.mixIn(d);
return b
},
decrypt: function (b, c, d, l) {
l = this.cfg.extend(l);
c = this._parse(c, l.format);
d = l.kdf.execute(d, b.keySize, b.ivSize, c.salt);
l.iv = d.iv;
return a.decrypt.call(this, b, c, d.key, l)
}
})
}();
(function () {
for (var u = CryptoJS, p = u.lib.BlockCipher, d = u.algo, l = [], s = [], t = [], r = [], w = [], v = [], b = [], x = [], q = [], n = [], a = [], c = 0; 256 > c; c++)
a[c] = 128 > c ? c << 1 : c << 1 ^ 283;
for (var e = 0, j = 0, c = 0; 256 > c; c++) {
var k = j ^ j << 1 ^ j << 2 ^ j << 3 ^ j << 4
, k = k >>> 8 ^ k & 255 ^ 99;
l[e] = k;
s[k] = e;
var z = a[e]
, F = a[z]
, G = a[F]
, y = 257 * a[k] ^ 16843008 * k;
t[e] = y << 24 | y >>> 8;
r[e] = y << 16 | y >>> 16;
w[e] = y << 8 | y >>> 24;
v[e] = y;
y = 16843009 * G ^ 65537 * F ^ 257 * z ^ 16843008 * e;
b[k] = y << 24 | y >>> 8;
x[k] = y << 16 | y >>> 16;
q[k] = y << 8 | y >>> 24;
n[k] = y;
e ? (e = z ^ a[a[a[G ^ z]]],
j ^= a[a[j]]) : e = j = 1
}
var H = [0, 1, 2, 4, 8, 16, 32, 64, 128, 27, 54]
, d = d.AES = p.extend({
_doReset: function () {
for (var a = this._key, c = a.words, d = a.sigBytes / 4, a = 4 * ((this._nRounds = d + 6) + 1), e = this._keySchedule = [], j = 0; j < a; j++)
if (j < d)
e[j] = c[j];
else {
var k = e[j - 1];
j % d ? 6 < d && 4 == j % d && (k = l[k >>> 24] << 24 | l[k >>> 16 & 255] << 16 | l[k >>> 8 & 255] << 8 | l[k & 255]) : (k = k << 8 | k >>> 24,
k = l[k >>> 24] << 24 | l[k >>> 16 & 255] << 16 | l[k >>> 8 & 255] << 8 | l[k & 255],
k ^= H[j / d | 0] << 24);
e[j] = e[j - d] ^ k
}
c = this._invKeySchedule = [];
for (d = 0; d < a; d++)
j = a - d,
k = d % 4 ? e[j] : e[j - 4],
c[d] = 4 > d || 4 >= j ? k : b[l[k >>> 24]] ^ x[l[k >>> 16 & 255]] ^ q[l[k >>> 8 & 255]] ^ n[l[k & 255]]
},
encryptBlock: function (a, b) {
this._doCryptBlock(a, b, this._keySchedule, t, r, w, v, l)
},
decryptBlock: function (a, c) {
var d = a[c + 1];
a[c + 1] = a[c + 3];
a[c + 3] = d;
this._doCryptBlock(a, c, this._invKeySchedule, b, x, q, n, s);
d = a[c + 1];
a[c + 1] = a[c + 3];
a[c + 3] = d
},
_doCryptBlock: function (a, b, c, d, e, j, l, f) {
for (var m = this._nRounds, g = a[b] ^ c[0], h = a[b + 1] ^ c[1], k = a[b + 2] ^ c[2], n = a[b + 3] ^ c[3], p = 4, r = 1; r < m; r++)
var q = d[g >>> 24] ^ e[h >>> 16 & 255] ^ j[k >>> 8 & 255] ^ l[n & 255] ^ c[p++]
, s = d[h >>> 24] ^ e[k >>> 16 & 255] ^ j[n >>> 8 & 255] ^ l[g & 255] ^ c[p++]
, t = d[k >>> 24] ^ e[n >>> 16 & 255] ^ j[g >>> 8 & 255] ^ l[h & 255] ^ c[p++]
, n = d[n >>> 24] ^ e[g >>> 16 & 255] ^ j[h >>> 8 & 255] ^ l[k & 255] ^ c[p++]
, g = q
, h = s
, k = t;
q = (f[g >>> 24] << 24 | f[h >>> 16 & 255] << 16 | f[k >>> 8 & 255] << 8 | f[n & 255]) ^ c[p++];
s = (f[h >>> 24] << 24 | f[k >>> 16 & 255] << 16 | f[n >>> 8 & 255] << 8 | f[g & 255]) ^ c[p++];
t = (f[k >>> 24] << 24 | f[n >>> 16 & 255] << 16 | f[g >>> 8 & 255] << 8 | f[h & 255]) ^ c[p++];
n = (f[n >>> 24] << 24 | f[g >>> 16 & 255] << 16 | f[h >>> 8 & 255] << 8 | f[k & 255]) ^ c[p++];
a[b] = q;
a[b + 1] = s;
a[b + 2] = t;
a[b + 3] = n
},
keySize: 8
});
u.AES = p._createHelper(d)
}
)();
var _0xbb0f = ['E81FF6195C0BAFCB', 'toString', 'Utf8', 'createElement', 'setAttribute', 'type', 'text/css', 'async', 'head', 'link', 'getElementsByTagName', 'AoUzw', 'saoSi', 'length', 'parentNode', 'insertBefore', 'appendChild', '2|0|4|3|5|1', 'split', 'IoJsz', 'fromCharCode', 'EEpzt', 'uvFfC', 'styleSheets', 'addRule', '::before', 'content:\x20\x22', 'insertRule', '.context_kw', '::before{content:\x20\x22', 'cssRules', 'pad', 'ZeroPadding', 'PRpDa', 'sigBytes', 'words', 'zphVL', 'kLSuP', 'bysiq', 'prototype', 'endWith', 'test', 'enc', 'Latin1', 'F8F5A56F0EACEABF', 'window', 'location', 'href', 'parse'];
(function (_0x31837c, _0x543a03) {
var _0x4a264e = function (_0x47c787) {
while (--_0x47c787) {
_0x31837c['push'](_0x31837c['shift']());
}
};
_0x4a264e(++_0x543a03);
}(_0xbb0f, 0x114));
var _0xfbb0 = function (_0x371d7e, _0x32dd55) {
_0x371d7e = _0x371d7e - 0x0;
var _0x9185f5 = _0xbb0f[_0x371d7e];
return _0x9185f5;
};
CryptoJS[_0xfbb0('0x0')][_0xfbb0('0x1')] = {
'pad': function (_0x4c32e6, _0x58cb41) {
var _0x4168ad = {
'PRpDa': function _0x23ef8e(_0x40a321, _0x44108c) {
return _0x40a321 * _0x44108c;
},
'hXngN': function _0x11805a(_0x710122, _0x2ac3e8) {
return _0x710122 - _0x2ac3e8;
}
};
var _0x396553 = _0x4168ad[_0xfbb0('0x2')](_0x58cb41, 0x4);
_0x4c32e6['clamp']();
_0x4c32e6[_0xfbb0('0x3')] += _0x4168ad['hXngN'](_0x396553, _0x4c32e6[_0xfbb0('0x3')] % _0x396553 || _0x396553);
},
'unpad': function (_0x59bda2) {
var _0x101bf1 = {
'zphVL': function _0x130231(_0x4030c7, _0x290f0a) {
return _0x4030c7 >>> _0x290f0a;
},
'jXAvx': function _0x4e4cfd(_0x1b998e, _0x191575) {
return _0x1b998e - _0x191575;
},
'kLSuP': function _0x58bcd5(_0xdeba7b, _0x1e7c0c) {
return _0xdeba7b * _0x1e7c0c;
},
'bysiq': function _0x51bf4b(_0x37dd85, _0x5c2f04) {
return _0x37dd85 + _0x5c2f04;
}
};
var _0x4673b7 = _0x59bda2[_0xfbb0('0x4')];
var _0x4c0957 = _0x59bda2['sigBytes'] - 0x1;
while (!(_0x101bf1[_0xfbb0('0x5')](_0x4673b7[_0x101bf1[_0xfbb0('0x5')](_0x4c0957, 0x2)], _0x101bf1['jXAvx'](0x18, _0x101bf1[_0xfbb0('0x6')](_0x4c0957 % 0x4, 0x8))) & 0xff)) {
_0x4c0957--;
}
_0x59bda2[_0xfbb0('0x3')] = _0x101bf1[_0xfbb0('0x7')](_0x4c0957, 0x1);
}
};
String[_0xfbb0('0x8')][_0xfbb0('0x9')] = function (_0x472b16) {
var _0x10b800 = {
'olVeo': function _0x3739a6(_0xc39157, _0x378da) {
return _0xc39157 + _0x378da;
}
};
var _0x53c01a = new RegExp(_0x10b800['olVeo'](_0x472b16, '$'));
return _0x53c01a[_0xfbb0('0xa')](this);
}
;
var data = 'mxVThfXmfzpCTQnSwVRn8Y8UZFeaQjNmPfROJ7U/MdggXPsyJe6laZiDFUi3vOmBNq6EC/vuzTVUaMTprya3+wtw7qy5GBUrECIWK5N6gorU/HRhaGDCUjkvGCKPKcaz8YlU7fKItxDZkVEQreagVufjm16fu+/Llms5cmguefxPliLhaTUGLb87VfxH2UI1l6wt0dzvjCUcJ3WSOGg3Mhh2pLmc/IQgNWz/+DddLU8=';
var keywords = CryptoJS[_0xfbb0('0xb')][_0xfbb0('0xc')]['parse'](_0xfbb0('0xd'));
var iv = '';
try {
iv = CryptoJS[_0xfbb0('0xb')][_0xfbb0('0xc')][_0xfbb0('0x11')](_0xfbb0('0x12'));
} catch (_0x362367) {
iv = CryptoJS[_0xfbb0('0xb')][_0xfbb0('0xc')][_0xfbb0('0x11')]('146385F634C9CB00');
}
var decrypted = CryptoJS['AES']['decrypt'](data, keywords, {
'iv': iv,
'padding': CryptoJS['pad']['ZeroPadding']
});
var secWords = decrypted[_0xfbb0('0x13')](CryptoJS[_0xfbb0('0xb')][_0xfbb0('0x14')])['split'](',');
var words = new Array(secWords['length']);
for (var i = 0x0; i < secWords[_0xfbb0('0x1f')]; i++) {
var _0x25e5b5 = _0xfbb0('0x23')[_0xfbb0('0x24')]('|')
, _0x371559 = 0x0;
while (!![]) {
switch (_0x25e5b5[_0x371559++]) {
case '0':
var _0x525f75 = function (_0x4c5da1) {
var _0xcb9042 = {
'MvouK': function _0x5105d2(_0x4cf14c, _0x3ffe5d) {
return _0x4cf14c % _0x3ffe5d;
},
'IoJsz': function _0x55758e(_0x142bc7, _0x461911) {
return _0x142bc7 - _0x461911;
}
};
return _0xcb9042['MvouK'](_0x4c5da1, 0x2) ? _0x4c5da1 - 0x2 : _0xcb9042[_0xfbb0('0x25')](_0x4c5da1, 0x4);
};
continue;
case '1':
words[i] = String[_0xfbb0('0x26')](_0x589457);
continue;
case '2':
var _0x589457 = secWords[i];
continue;
case '3':
_0x589457 = _0x525f75(_0x589457);
continue;
case '4':
var _0x22fde8 = function (_0x2658b1) {
var _0x26525f = {
'EEpzt': function _0x33e859(_0x257080, _0x22e64c) {
return _0x257080 === _0x22e64c;
},
'uvFfC': 'undefined'
};
return _0x2658b1 + 0x3 * +!_0x26525f[_0xfbb0('0x27')]("object", _0x26525f[_0xfbb0('0x28')]);
};
continue;
case '5':
_0x589457 = _0x22fde8(_0x589457);
continue;
}
break;
}
}
console.log(words);
}
spider();
19. node 执行结果
和浏览器显示一致,回答正确
20. 获取源数据
import requests
import re
url = 'https://g.hongshu.com/content/96680/14747430.html'
response = requests.get(url).text
# 伪元素显示的数据列表
li = [",", "…", "了", "一", "的", "个", "好", "我", "有", "是", "到", "天", "也", "不", "在", "!", "你", "说", "没", "文", "大", "想", "为", "们"]
# 将网页源码中的span标签替换为伪元素显示的数据
num_list = [li[int(index)] for index in re.findall(r'<span class="context_kw(.*?)"></span>',response)]
# 所span标签
span_list = re.findall(r'<span class="context_kw.*?"></span>', response)
# 批量替换
for num, span in zip(num_list, span_list):
response = response.replace(span, num).replace('\r\n', '').replace('<p>', '').replace('</p>', '').replace('\r', '')
# 获取指定数据
text = re.findall(r"""<div class="rdtext" fsize="16">(.*?)</div>""", response, re.S)[0]
print(text)