应用背景:WebCollector is an open source web crawler framework based on Java. It provides some simple interfaces for crawling the Web; you can set up a multi-threaded web crawler in less than 5 minutes. 关键技术:WebCollector致力于维护一个稳定、可扩展的爬虫内核,源码中集成了Jsoup,可进行精准的网页解析,便于开发者学习并进行开发。内核具有健壮的扩展性,用户可以在此基础上开发自己想要的爬虫。
SHOW FULL COLUMNS FROM `jrk_downrecords` [ RunTime:0.001847s ]
SELECT `a`.`aid`,`a`.`title`,`a`.`create_time`,`m`.`username` FROM `jrk_downrecords` `a` INNER JOIN `jrk_member` `m` ON `a`.`uid`=`m`.`id` WHERE `a`.`status` = 1 GROUP BY `a`.`aid` ORDER BY `a`.`create_time` DESC LIMIT 10 [ RunTime:0.084123s ]
SHOW FULL COLUMNS FROM `jrk_tagrecords` [ RunTime:0.002421s ]
SELECT * FROM `jrk_tagrecords` WHERE `status` = 1 ORDER BY `num` DESC LIMIT 20 [ RunTime:0.002354s ]
SHOW FULL COLUMNS FROM `jrk_member` [ RunTime:0.002135s ]
SELECT `id`,`username`,`userhead`,`usertime` FROM `jrk_member` WHERE `status` = 1 ORDER BY `usertime` DESC LIMIT 10 [ RunTime:0.004389s ]
SHOW FULL COLUMNS FROM `jrk_searchrecords` [ RunTime:0.002091s ]
SELECT * FROM `jrk_searchrecords` WHERE `status` = 1 ORDER BY `num` DESC LIMIT 5 [ RunTime:0.004017s ]
SELECT aid,title,count(aid) as c FROM `jrk_downrecords` GROUP BY `aid` ORDER BY `c` DESC LIMIT 10 [ RunTime:0.014688s ]
SHOW FULL COLUMNS FROM `jrk_articles` [ RunTime:0.002325s ]
UPDATE `jrk_articles` SET `hits` = 1 WHERE `id` = 78067 [ RunTime:0.001161s ]