abearxiong/important.markdown

## important.markdown

      
    Raw
  

              important.markdown
            
          
github [52.74.223.119]
csdn.net [47.95.47.253]
jianshu.com [106.75.17.181]


## know.py
# -*- coding: utf-8 -*-
"""
Created on Mon Apr 29 20:39:22 2019

@author: xiong
"""
import requests
import lxml
from bs4 import BeautifulSoup
#import hashlib
def getContent(url, timeout=10):
    """Fetch *url* and print its <body> attributes and every link on the page.

    The page is downloaded with ``requests`` and parsed with BeautifulSoup
    using the ``lxml`` parser. For each ``<body>`` tag its attribute dict is
    printed; for each ``<a>`` tag the ``href`` value is printed, or the whole
    tag when it has no (or an empty) ``href``. Finally the total number of
    ``<a>`` tags is printed.

    Args:
        url: Address of the page to download.
        timeout: Seconds passed to ``requests.get`` as its ``timeout``
            argument, so a stalled server cannot block the script forever.

    Returns:
        None. All results are written to standard output.
    """
    html = requests.get(url, timeout=timeout)
    soup = BeautifulSoup(html.text, 'lxml')

    for body in soup.find_all(name='body'):
        print(body.attrs, '\n')

    links = soup.find_all('a')
    for link in links:
        href = link.get('href')
        # Anchors without a usable href are printed in full so they can
        # still be inspected.
        print(href if href else link)
    print(len(links))
if __name__ == '__main__':
    # Script entry point: run the crawler against one sample blog article.
    # Alternative target kept for reference: "https://csdn.net"
    url = 'https://blog.csdn.net/csdn15698845876/article/details/78305467'
    getContent(url)

## table-of-content.markdown

      
    Raw
  

              table-of-content.markdown
            
          
    使用技巧


import
爬爬
	# -*- coding: utf-8 -*-
	"""
	Created on Mon Apr 29 20:39:22 2019

	@author: xiong
	"""
	import requests
	import lxml
	from bs4 import BeautifulSoup
	#import hashlib
	def getContent(url):
	    html = requests.get(url)
	    soup = BeautifulSoup(html.text, 'lxml')
	    #print(soup.prettify())
	    bodys = soup.find_all(name = 'body')
	    links = soup.find_all('a')
	    for body in bodys:
	        print(body.attrs, '\n')
	    for link in links:
	        if link.get('href'):
	            print(link.get('href'))
	        else:
	            print(link)
	    print(len(links))
	if __name__ == '__main__':
	    #url = "https://csdn.net"
	    url = "https://blog.csdn.net/csdn15698845876/article/details/78305467"
	    getContent(url)