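// JS scraping: collecting Sina Weibo's suggested tags from the browser console.
// Step 1: load jQuery into the page (paste the following snippet into the console).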
/*
 * Load jQuery into the current page by appending a <script> element.
 *
 * The work is wrapped in an IIFE so that no helper variables leak into the
 * page's global scope. The console reports when loading has finished (or
 * failed), so the next snippet is not run before `$` is available.
 */
(function () {
  // NOTE(review): plain-http URL; on an https page the browser may block it as
  // mixed content. The error handler below reports that case.
  var JQUERY_SRC = 'http://lib.sinaapp.com/js/jquery/1.7.2/jquery.min.js';

  // Do not inject a second copy when `$` is already jQuery.
  if (window.jQuery && window.$ === window.jQuery) {
    console.log('jQuery ' + window.jQuery.fn.jquery + ' is already loaded');
    return;
  }

  var parent =
    document.head ||
    document.getElementsByTagName('head')[0] ||
    document.documentElement;

  var script = document.createElement('script');
  script.setAttribute('type', 'text/javascript');
  script.onload = function () {
    console.log('jQuery loaded');
  };
  script.onerror = function () {
    console.error('failed to load jQuery from ' + JQUERY_SRC);
  };
  // Handlers are attached before `src` is set so no event can be missed.
  script.setAttribute('src', JQUERY_SRC);
  parent.appendChild(script);
})();
/* Step 2 */
/*
 * Collect suggested tags by polling the tag-suggestion endpoint.
 *
 * `tags` and `run` are declared with `var` on purpose: the snippet is meant to
 * be pasted into a browser console, where `var` allows it to be pasted again
 * without a redeclaration error.
 */
var tags = []; // unique tag values collected so far, in first-seen order
var run = 1; // 1-based counter of the request about to be issued

/**
 * Issue one request to the tag-suggestion endpoint, merge the returned tags
 * into the global `tags` array (skipping values already present), and schedule
 * the next request until the run counter reaches the limit.
 *
 * Expects `$` to be jQuery. The response is expected to carry a `data`
 * collection whose entries each have a `tag` property; anything else is
 * ignored instead of aborting the loop.
 *
 * @returns {void}
 */
function get_tags() {
  var RUN_LIMIT = 500; // polling stops once `run` reaches this value
  var DELAY_MS = 300; // pause between two consecutive requests

  console.log("start:" + run);
  console.log("tag num:" + tags.length);

  // Advance the counter and queue the next request while under the limit.
  function schedule_next() {
    run++;
    if (run < RUN_LIMIT) {
      setTimeout(get_tags, DELAY_MS);
    }
  }

  var request = $.get(
    "http://account.weibo.com/set/aj/tagsuggest",
    // A fresh timestamp per request, so a cached response is never reused.
    { __rnd: new Date().getTime() },
    function (data) {
      var list = data && data["data"];
      if (list && typeof list === "object") {
        // Object.keys visits own entries only (arrays and plain objects
        // alike), so properties a page script added to Array.prototype are
        // not mistaken for tags.
        Object.keys(list).forEach(function (key) {
          var entry = list[key];
          var tag = entry && entry["tag"];
          if (tag !== undefined && tag !== null && tags.indexOf(tag) === -1) {
            tags.push(tag);
          }
        });
      }
      schedule_next();
    },
    "json"
  );

  // A failed request counts as a run and polling continues, so one network or
  // parse error does not silently end the collection.
  if (request && typeof request.fail === "function") {
    request.fail(function () {
      console.error("request failed on run " + run);
      schedule_next();
    });
  }
}
/* Step 3: print the collected tags. */
/*
 * Print the collected tags as one comma-separated line.
 *
 * Sina has roughly 700+ tags in total, and the collected list contains
 * repeats, so it is de-duplicated (keeping the first occurrence of each tag)
 * before printing.
 */
console.log(
  tags
    .filter(function (tag, index) {
      return tags.indexOf(tag) === index;
    })
    .join(",")
);