Created
January 9, 2019 23:47
-
-
Save Ranner198/7da8aa8644fb544cd4e05cf2e93226c7 to your computer and use it in GitHub Desktop.
Webscrape Tutorial Source Code
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
// Load the npm packages: request fetches the page, cheerio parses its HTML.
const cheerio = require('cheerio');
const request = require('request');

// The URL that will be scraped.
const URL = 'http://rancrump.com/aboutme/';

// The selector to search for; follows the HTML class and ID syntax, i.e. '.' and '#'.
// An element type can be prefixed at the beginning, e.g. 'span.someClassName'.
const selector = '.myTopBorder';

// Run the request for the URL; the callback receives (error, response, body).
request(URL, function (error, resp, html) {
  // If the request failed, log the error and stop. The original tested an
  // undeclared `err` variable, which threw a ReferenceError on every call.
  if (error) {
    Print(error);
    return;
  }

  // Parse the downloaded HTML with cheerio.
  const $ = cheerio.load(html);

  // Iterate over every element matching the selector and print its text content.
  $(selector).each(function (i, element) {
    Print($(element).text());
  });
});
// I don't like typing out console.log, so this is just a print function.
// "I put the fun in function (:" - ran 2018
/**
 * Writes a single value to standard output via console.log.
 *
 * @param {*} val - The value to print.
 */
function Print(val) {
  console.log(val);
}
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment