README.md
hexo-selenium-site-parser
First, install the module:
npm install hexo-selenium-site-parser
Second:
Create a template file called 'teamplate_record.md' (you can copy it from the module directory):
---
title: [[title]]
---
[[img]]
[[desc]]
[[imgs]]
[link:]([[link]] "[[title]]")
Usage example:
- Create a file named test.js in your Hexo blog folder (the parser creates posts in source/_post and stores images in source/images), then put the following code in it to see the result.
- Make sure everyone has write permission to the '/source' folder.
- You can copy test.js from the module directory.
```js
// NOTE(review): this snippet was garbled (line breaks, brackets and some
// right-hand sides were lost). Lines marked "reconstructed" are assumptions;
// confirm them against test.js in the module directory.
var Parser = require('hexo-selenium-site-parser'); // reconstructed
var parser = new Parser(); // reconstructed
var sites_config = []; // reconstructed
sites_config[1] = {}; // reconstructed
sites_config[1]['site_url'] = 'http://seasonvar.ru/';
sites_config[1]['records_links_xpath'] = "//div[@class='news']//a";
sites_config[1]['records_title_xpath'] = "//h1[@class='pgs-sinfo-title']";
sites_config[1]['records_content_xpath'] = "//div[@class='pgs-sinfo-info']//p";
sites_config[1]['records_img_xpath'] = "//div[@class='pgs-sinfo-imgwrap']//span//img"; // leave it empty if using many images on the same page, e.g. "//div[@class='full-str']//img"
sites_config[1]['categories_xpath'] = '';
sites_config[1]['tags_xpath'] = '';
sites_config[1]['records_imgs_xpath'] = ''; // e.g. '//div[@class="entry-content"]//p//img'; leave it empty if using only one image
sites_config[1]['records_imgs_to_parse'] = 0; // number of images to parse per parsed post
sites_config[1]['records_meta1_xpath'] = ''; // e.g. "//div[@class='tile-primary']//textarea"
sites_config[1]['click'] = "//div[@class='player-extBtn-getcode']"; // e.g. "//div[@class='tile-primary']//textarea"
sites_config[1]['click_and_get'] = "//div[@id='svmodal-in']"; // e.g. "//div[@class='tile-primary']//textarea"
sites_config[1]['offset_of_pages_to_parse'] = 0;
sites_config[1]['num_of_pages_to_parse'] = 100;
sites_config[1]['records_translit_title_letters_to_english'] = 0;
sites_config[1]['allow_owerite'] = 1; // 0 = do not overwrite existing posts (important: do not remove)
// NOTE(review): the original ended with a call on `parser` whose method name and
// arguments were lost; copy the final line from test.js in the module directory.
```