Synchronize your medium blog with python

Screenshot from my homepage.
from bs4 import BeautifulSoup ## for web scraping
import urllib.request
import re ## regex
from linkpreview import link_preview
import pandas as pd
# Fetch the blog page and start scanning its <a> tags for article links.
url = "<your medium blog>"  # placeholder: replace with the URL of your Medium blog
req = urllib.request.Request(url, headers={'User-agent': 'your bot 0.1'})
# Read the body inside a context manager so the HTTP response is closed afterwards.
with urllib.request.urlopen(req) as response:
    html = response.read()
# Parsing response
soup = BeautifulSoup(html, 'html.parser')
# Find all <a> tags
text = soup.find_all("a")
list_urls = []
for item in text:
    ## convert it to strings
    item = str(item)
    pos = item.find('href="/')
    # str.find returns -1 (never None) on a miss, so `pos > 0` is the
    # only check needed: the tag has a site-relative href and it
    # mentions "user_profile".
    if pos > 0 and item.find("user_profile") > 0:
        # Raw string so the regex escapes are not treated as string escapes.
        result = re.search(r'href="\/+([a-z])\w+', item)
        if result:
            pass  # the body of this branch is shown after the regex excursus

Excursus: regex (regular expressions)

Let's continue

# Continuation of the loop body: `item` is the current <a> tag as a string
# and `list_urls` collects the distinct links found so far.
result = re.search(r'href="\/+([a-z])\w+', item)
if result:
    start = result.start()  ## Start pattern
    end_item = item[start:]
    end_match = re.search('-"', end_item)  ## End of pattern
    # Skip tags whose href does not end in -" instead of failing on None.
    if end_match:
        end = end_match.end()

        url_extract_pos = item[start:start + end]  ## cut out url
        # [6:-1] drops the leading 'href="' (6 characters) and the closing quote.
        # NOTE(review): the "" prefix looks like a base URL that was lost from
        # this listing (presumably the Medium domain) - TODO confirm.
        url = "" + url_extract_pos[6:-1]

        if url not in list_urls:
            list_urls.append(url)
# Build one preview record per collected article URL.
list_of_links = []
for article_url in list_urls:
    preview = link_preview(article_url)

    dic_preview = {
        "title": preview.title,
        "description": preview.description,
        "image": preview.image,
        "force_title": preview.force_title,
        "absolute_image": preview.absolute_image,
        "url": article_url,
    }
    # Store the record; without this the list stays empty after the loop.
    list_of_links.append(dic_preview)




I am a data analyst discovering the unlimited world of coding and data.

