Grab vBulletin pages in logged-in mode
This task use javascript sandbox with jsoup support to grab vBulletin pages in logged-in mode.
Grab vBulletin pages in logged-in mode
- Create javascript sandbox with jsoup support
- Create javascript as following
javascript
function main(env, args) {
var links = args.get('links');
var username = '';
var password = '';
var conn;
try {
conn = env.newJsoup().connect('http://www.sitepoint.com/forums/login.php?do=login');
conn.userAgent('Mozilla/5.0 (Windows NT x.y; rv:10.0.1) Gecko/20100101 Firefox/10.0.1');
conn.data('do', 'login');
conn.data('vb_login_username', username);
conn.data('vb_login_password', password);
conn.data('vb_login_md5password', hex_md5(str_to_ent(trim(password))));
conn.data('securitytoken', 'guest');
conn.data('cookieuser', '1');
var doc = conn.post();
var ele = doc.select('.standard_error .restore').first();
if (ele == null) {
env.error('Cannot login!');
return;
}
if (!ele.text().startsWith('Thank you for logging in')) {
env.error('Cannot login!');
return;
}
var cookies = conn.getCookies();
var url = env.newURL('http://www.sitepoint.com/forums/subscription.php');
conn = env.newJsoup().connect(url);
conn.userAgent('Mozilla/5.0 (Windows NT x.y; rv:10.0.1) Gecko/20100101 Firefox/10.0.1');
conn.cookies(cookies);
doc = conn.get();
var elements = doc.select('#threads .threadbit');
for (var i = 0; i < elements.size(); i++) {
var element = elements.get(i);
var item = env.newHashMap();
var child = element.select('.threadtitle .title').first();
item.put('title', child.text());
var href = env.newURL(url, child.attr('href'));
item.put('link', href + '');
links.add(item);
}
} catch (e) {
env.error(e);
}
}
var hexcase=0;
var b64pad="";
var chrsz=8;
function hex_md5(A){
return binl2hex(core_md5(str2binl(A),A.length*chrsz))
}
function b64_md5(A){
return binl2b64(core_md5(str2binl(A),A.length*chrsz))
}
function str_md5(A){
return binl2str(core_md5(str2binl(A),A.length*chrsz))
}
function hex_hmac_md5(A,B){
return binl2hex(core_hmac_md5(A,B))
}
function b64_hmac_md5(A,B){
return binl2b64(core_hmac_md5(A,B))
}
function str_hmac_md5(A,B){
return binl2str(core_hmac_md5(A,B))
}
function core_md5(K,F){
K[F>>5]|=128<<((F)%32);
K[(((F+64)>>>9)<<4)+14]=F;
var J=1732584193;
var I=-271733879;
var H=-1732584194;
var G=271733878;
for(var C=0;C<K.length;C+=16){
var E=J;
var D=I;
var B=H;
var A=G;
J=md5_ff(J,I,H,G,K[C+0],7,-680876936);
G=md5_ff(G,J,I,H,K[C+1],12,-389564586);
H=md5_ff(H,G,J,I,K[C+2],17,606105819);
I=md5_ff(I,H,G,J,K[C+3],22,-1044525330);
J=md5_ff(J,I,H,G,K[C+4],7,-176418897);
G=md5_ff(G,J,I,H,K[C+5],12,1200080426);
H=md5_ff(H,G,J,I,K[C+6],17,-1473231341);
I=md5_ff(I,H,G,J,K[C+7],22,-45705983);
J=md5_ff(J,I,H,G,K[C+8],7,1770035416);
G=md5_ff(G,J,I,H,K[C+9],12,-1958414417);
H=md5_ff(H,G,J,I,K[C+10],17,-42063);
I=md5_ff(I,H,G,J,K[C+11],22,-1990404162);
J=md5_ff(J,I,H,G,K[C+12],7,1804603682);
G=md5_ff(G,J,I,H,K[C+13],12,-40341101);
H=md5_ff(H,G,J,I,K[C+14],17,-1502002290);
I=md5_ff(I,H,G,J,K[C+15],22,1236535329);
J=md5_gg(J,I,H,G,K[C+1],5,-165796510);
G=md5_gg(G,J,I,H,K[C+6],9,-1069501632);
H=md5_gg(H,G,J,I,K[C+11],14,643717713);
I=md5_gg(I,H,G,J,K[C+0],20,-373897302);
J=md5_gg(J,I,H,G,K[C+5],5,-701558691);
G=md5_gg(G,J,I,H,K[C+10],9,38016083);
H=md5_gg(H,G,J,I,K[C+15],14,-660478335);
I=md5_gg(I,H,G,J,K[C+4],20,-405537848);
J=md5_gg(J,I,H,G,K[C+9],5,568446438);
G=md5_gg(G,J,I,H,K[C+14],9,-1019803690);
H=md5_gg(H,G,J,I,K[C+3],14,-187363961);
I=md5_gg(I,H,G,J,K[C+8],20,1163531501);
J=md5_gg(J,I,H,G,K[C+13],5,-1444681467);
G=md5_gg(G,J,I,H,K[C+2],9,-51403784);
H=md5_gg(H,G,J,I,K[C+7],14,1735328473);
I=md5_gg(I,H,G,J,K[C+12],20,-1926607734);
J=md5_hh(J,I,H,G,K[C+5],4,-378558);
G=md5_hh(G,J,I,H,K[C+8],11,-2022574463);
H=md5_hh(H,G,J,I,K[C+11],16,1839030562);
I=md5_hh(I,H,G,J,K[C+14],23,-35309556);
J=md5_hh(J,I,H,G,K[C+1],4,-1530992060);
G=md5_hh(G,J,I,H,K[C+4],11,1272893353);
H=md5_hh(H,G,J,I,K[C+7],16,-155497632);
I=md5_hh(I,H,G,J,K[C+10],23,-1094730640);
J=md5_hh(J,I,H,G,K[C+13],4,681279174);
G=md5_hh(G,J,I,H,K[C+0],11,-358537222);
H=md5_hh(H,G,J,I,K[C+3],16,-722521979);
I=md5_hh(I,H,G,J,K[C+6],23,76029189);
J=md5_hh(J,I,H,G,K[C+9],4,-640364487);
G=md5_hh(G,J,I,H,K[C+12],11,-421815835);
H=md5_hh(H,G,J,I,K[C+15],16,530742520);
I=md5_hh(I,H,G,J,K[C+2],23,-995338651);
J=md5_ii(J,I,H,G,K[C+0],6,-198630844);
G=md5_ii(G,J,I,H,K[C+7],10,1126891415);
H=md5_ii(H,G,J,I,K[C+14],15,-1416354905);
I=md5_ii(I,H,G,J,K[C+5],21,-57434055);
J=md5_ii(J,I,H,G,K[C+12],6,1700485571);
G=md5_ii(G,J,I,H,K[C+3],10,-1894986606);
H=md5_ii(H,G,J,I,K[C+10],15,-1051523);
I=md5_ii(I,H,G,J,K[C+1],21,-2054922799);
J=md5_ii(J,I,H,G,K[C+8],6,1873313359);
G=md5_ii(G,J,I,H,K[C+15],10,-30611744);
H=md5_ii(H,G,J,I,K[C+6],15,-1560198380);
I=md5_ii(I,H,G,J,K[C+13],21,1309151649);
J=md5_ii(J,I,H,G,K[C+4],6,-145523070);
G=md5_ii(G,J,I,H,K[C+11],10,-1120210379);
H=md5_ii(H,G,J,I,K[C+2],15,718787259);
I=md5_ii(I,H,G,J,K[C+9],21,-343485551);
J=safe_add(J,E);
I=safe_add(I,D);
H=safe_add(H,B);
G=safe_add(G,A)
}
return Array(J,I,H,G)
}
function md5_cmn(F,C,B,A,E,D){
return safe_add(bit_rol(safe_add(safe_add(C,F),safe_add(A,D)),E),B)
}
function md5_ff(C,B,G,F,A,E,D){
return md5_cmn((B&G)|((~B)&F),C,B,A,E,D)
}
function md5_gg(C,B,G,F,A,E,D){
return md5_cmn((B&F)|(G&(~F)),C,B,A,E,D)
}
function md5_hh(C,B,G,F,A,E,D){
return md5_cmn(B^G^F,C,B,A,E,D)
}
function md5_ii(C,B,G,F,A,E,D){
return md5_cmn(G^(B|(~F)),C,B,A,E,D)
}
function core_hmac_md5(C,F){
var E=str2binl(C);
if(E.length>16){
E=core_md5(E,C.length*chrsz)
}
var A=Array(16),D=Array(16);
for(var B=0;B<16;B++){
A[B]=E[B]^909522486;D[B]=E[B]^1549556828
}
var G=core_md5(A.concat(str2binl(F)),512+F.length*chrsz);
return core_md5(D.concat(G),512+128)
}
function safe_add(A,D){
var C=(A&65535)+(D&65535);
var B=(A>>16)+(D>>16)+(C>>16);
return(B<<16)|(C&65535)
}
function bit_rol(A,B){
return(A<<B)|(A>>>(32-B))
}
function str2binl(D){
var C=new Array();
var A=(1<<chrsz)-1;
for(var B=0;B<D.length*chrsz;B+=chrsz){
C[B>>5]|=(D.charCodeAt(B/chrsz)&A)<<(B%32)
}
return C
}
function binl2str(C){
var D="";
var A=(1<<chrsz)-1;
for(var B=0;B<C.length*32;B+=chrsz){
D+=String.fromCharCode((C[B>>5]>>>(B%32))&A)
}
return D
}
function binl2hex(C){
var B=hexcase?"0123456789ABCDEF":"0123456789abcdef";
var D="";
for(var A=0;A<C.length*4;A++){
D+=B.charAt((C[A>>2]>>((A%4)*8+4))&15)+B.charAt((C[A>>2]>>((A%4)*8))&15)
}
return D
}
function binl2b64(D){
var C="ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/";
var F="";
for(var B=0;B<D.length*4;B+=3){
var E=(((D[B>>2]>>8*(B%4))&255)<<16)|(((D[B+1>>2]>>8*((B+1)%4))&255)<<8)|((D[B+2>>2]>>8*((B+2)%4))&255);
for(var A=0;A<4;A++){
if(B*8+A*6>D.length*32){
F+=b64pad
}else{
F+=C.charAt((E>>6*(3-A))&63)
}
}
}
return F
}
function str_to_ent(D){
var A="";
var C;
for(C=0;C<D.length;C++){
var E=D.charCodeAt(C);
var B="";
if(E>255){
while(E>=1){
B="0123456789".charAt(E%10)+B;E=E/10
}
if(B==""){B="0"}
B="#"+B;
B="&"+B;B=B+";";
A+=B
}else{
A+=D.charAt(C)
}
}
return A
}
function trim(A){
while(A.substring(0,1)==" "){
A=A.substring(1,A.length)
}
while(A.substring(A.length-1,A.length)==" "){
A=A.substring(0,A.length-1)
}
return A
}
No comments:
Post a Comment