Created
November 3, 2016 23:36
-
-
Save onlurking/40aac52a64ee41a080a5830d438b3335 to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#! /usr/bin/env hy | |
(import requests | |
string | |
[bs4 [BeautifulSoup]] | |
[sys [argv]]) | |
(defn get_page [link]
  "Download `link` with requests and return its body parsed by
  BeautifulSoup using the built-in \"html.parser\" backend."
  ;; Fetch first, then hand the response text to the parser.
  (setv markup (. (requests.get link) text))
  (BeautifulSoup markup "html.parser"))
(defn get_title [source]
  "Return the presentation title taken from a parsed page.

  Reads `source.title.text`, lowercases it, drops a trailing
  'speaker deck' site suffix and every '/' separator, and then
  capitalises each word with `string.capwords` (which also collapses
  and trims surrounding whitespace).

  source -- object exposing `.title.text` (a parsed page).
  Returns the cleaned title as a string."
  (setv suffix "speaker deck")
  (setv title (-> (. source title)
                  (. text)
                  (.lower)
                  (.strip)))
  ;; str.strip with an argument removes any of those *characters* from
  ;; both ends, so it also ate leading/trailing letters of the real
  ;; title (e.g. "deep learning" lost "deep "). Remove the literal
  ;; suffix instead, and only when the title actually ends with it.
  (when (.endswith title suffix)
    (setv title (get (.rsplit title suffix 1) 0)))
  (string.capwords (.replace title "/" "")))
(defn get_author [source]
  "Return the text of the <h2> found inside the first <div> whose
  class is \"presenter\" in the parsed page `source`."
  (-> source
      (.find "div" :class "presenter")
      (. h2)
      (. text)))
(defn crawl [link]
  "Fetch the page at `link` and print, in order, its author, its
  title and the result of `speaker_deck` for it."
  (setv page (get_page link))
  ;; Each extractor receives the same parsed page; output order is
  ;; author, title, embed element.
  (for [extract [get_author get_title speaker_deck]]
    (print (extract page))))
(defn speaker_deck [source]
  "Return the first <div> with class \"speakerdeck-embed\" found in
  the parsed page `source` (whatever `source.find` returns)."
  (source.find "div" :class "speakerdeck-embed"))
;; Script entry point: crawl the URL given as the first command-line
;; argument, or print a usage hint when none was supplied.
(when (= __name__ "__main__")
  (if (>= (len argv) 2)
    (crawl (get argv 1))
    (print "Please, provide an URL.")))
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment