提取网页内容,去掉标签,去掉无用链接,主要服务于自然语言处理中对网页内容要求的应用。
- Extracts the content of web pages, removing HTML tags and useless links; intended mainly for natural language processing applications that require web page content.
SHOW FULL COLUMNS FROM `jrk_downrecords` [ RunTime:0.001281s ]
SELECT `a`.`aid`,`a`.`title`,`a`.`create_time`,`m`.`username` FROM `jrk_downrecords` `a` INNER JOIN `jrk_member` `m` ON `a`.`uid`=`m`.`id` WHERE `a`.`status` = 1 GROUP BY `a`.`aid` ORDER BY `a`.`create_time` DESC LIMIT 10 [ RunTime:0.089393s ]
SHOW FULL COLUMNS FROM `jrk_tagrecords` [ RunTime:0.001245s ]
SELECT * FROM `jrk_tagrecords` WHERE `status` = 1 ORDER BY `num` DESC LIMIT 20 [ RunTime:0.001905s ]
SHOW FULL COLUMNS FROM `jrk_member` [ RunTime:0.001297s ]
SELECT `id`,`username`,`userhead`,`usertime` FROM `jrk_member` WHERE `status` = 1 ORDER BY `usertime` DESC LIMIT 10 [ RunTime:0.003587s ]
SHOW FULL COLUMNS FROM `jrk_searchrecords` [ RunTime:0.001057s ]
SELECT * FROM `jrk_searchrecords` WHERE `status` = 1 ORDER BY `num` DESC LIMIT 5 [ RunTime:0.003167s ]
SELECT aid,title,count(aid) as c FROM `jrk_downrecords` GROUP BY `aid` ORDER BY `c` DESC LIMIT 10 [ RunTime:0.014740s ]
SHOW FULL COLUMNS FROM `jrk_articles` [ RunTime:0.001386s ]
UPDATE `jrk_articles` SET `hits` = 1 WHERE `id` = 143182 [ RunTime:0.001269s ]