清华大佬耗费三个月吐血整理的几百G的资源,免费分享!....>>>
PHP采集腾讯微博只留文字部分
<?php
/**
 * Downloads the Tencent Weibo page at http://t.qq.com/starank and prints the
 * text of every post found on it, with HTML markup removed.
 */

/**
 * Reduces an HTML fragment to its text content.
 *
 * Tags are removed first and whitespace second. Doing it the other way round
 * (as a single str_replace() whose first search term is a space) alters the
 * subject before the tags are looked up, so tags that carry attributes, such
 * as <a href="..." target="...">, would no longer match and would be left in
 * the result.
 *
 * @param string $str HTML fragment.
 * @return string The fragment without tags, ordinary spaces, no-break spaces
 *                (U+00A0) or "&nbsp;" entities.
 */
function delhtml($str) // strip HTML tags
{
    $text = strip_tags((string) $str);

    // NOTE(review): the space literal in the original was most likely
    // "&nbsp;" before the page was extracted; all three spellings are removed
    // so either reading of the original keeps working.
    return str_replace(array('&nbsp;', "\xC2\xA0", ' '), '', $text);
}

// Headers can only be sent before any output is produced.
header("Content-type:text/html;charset=utf-8");

// Bound the request so an unresponsive server cannot stall the script.
// NOTE(review): confirm this endpoint is still being served.
$context = stream_context_create(array('http' => array('timeout' => 10)));
$weibo = file_get_contents('http://t.qq.com/starank', false, $context);

// Each post body sits between the "msgCnt" div and the following "mediaWrap"
// div. U = ungreedy, i = case-insensitive, s = dot also matches newlines.
$preg = '/<div class="msgCnt">(.*)<\/div><div class="mediaWrap">/Uis';

$posts = array();
if ($weibo === false) {
    echo "Failed to download http://t.qq.com/starank";
} elseif (preg_match_all($preg, $weibo, $matches) === false) {
    echo "Failed to parse the downloaded page";
} else {
    $posts = $matches[1];
}

foreach ($posts as $value) {
    echo delhtml($value) . "<br/><br/><br/>";
}