Nitrogen Pumpkin Mulch

    hexo-selenium-site-parser

    1.0.12 • Public • Published

    README.md

    hexo-selenium-site-parser

    first:

    npm install hexo-selenium-site-parser

    second:

    create teampleate file called: 'teamplate_record.md' you can copy in from module directory

    ---
    title: [[title]]
    ---
    
    [[img]]
    
    [[desc]]
    
    [[imgs]]
    
    [link:]([[link]] "[[title]]")
    
    

    use example:

    • create file test.js in hexo blog folder because it create posts in source/_post and store images in source/images folders put next code to see the result
    • check everyone can write permision to '/source' folder
    • you can copy test.js from module directory
    var Parser = require('hexo-selenium-site-parser');
    var parser = new Parser();
     
    var sites_config = [];
     
     
    sites_config[1] = [];
    sites_config[1]['site_url'] = 'http://seasonvar.ru/'; 
    sites_config[1]['records_links_xpath'] = "//div[@class='news']//a";
    sites_config[1]['records_title_xpath'] = "//h1[@class='pgs-sinfo-title']";
    sites_config[1]['records_content_xpath'] = "//div[@class='pgs-sinfo-info']//p";
    sites_config[1]['records_img_xpath'] = "//div[@class='pgs-sinfo-imgwrap']//span//img"; //leave it empty if use many images at the same page  "//div[@class='full-str']//img"; 
    sites_config[1]['categories_xpath'] = '';
    sites_config[1]['tags_xpath'] = '';
    sites_config[1]['records_imgs_xpath'] = '';////div[@class="entry-content"]//p//img'; //leave it empty if use only one image
    sites_config[1]['records_imgs_to_parse'] = 0; // num on images to parse per parsed post
    sites_config[1]['records_meta1_xpath'] = '';//"//div[@class='tile-primary']//textarea";
     
    sites_config[1]['click'] = "//div[@class='player-extBtn-getcode']";//"//div[@class='tile-primary']//textarea";
    sites_config[1]['click_and_get'] = "//div[@id='svmodal-in']";//"//div[@class='tile-primary']//textarea";
     
    sites_config[1]['offset_of_pages_to_parse'] = 0;
    sites_config[1]['num_of_pages_to_parse'] = 100;
    sites_config[1]['records_translit_title_letters_to_english'] = 0; 
    sites_config[1]['allow_owerite'] = 1; //  0 = not rewrite /important not remove
     
    parser.parse(sites_config);

    Keywords

    Install

    npm i hexo-selenium-site-parser

    DownloadsWeekly Downloads

    1

    Version

    1.0.12

    License

    ISC

    Last publish

    Collaborators

    • allimist