Alin Preda aleenprd

## timing_function.py
from time import time

def timing(f: Callable) -> None:
    """Times a function runtime in minutes.

    Args:
        f (callable): a function/method.
    """
    def wrap(*args, **kw):
        ts = time()

## make_soup_with_selenium.py
import requests
from bs4 import BeautifulSoup
from selenium import webdriver
from selenium.webdriver.common.by import By
from selenium.webdriver.chrome.service import Service
from webdriver_manager.chrome import ChromeDriverManager

def make_soup_with_selenium(url: str, driver_service: Service) -> BeautifulSoup:
    """Return an HTML body from an URL.

## imports_imdb_scraping.py
# Data manipulation
import pandas as pd
import re as regex

# Scraping
import requests
from bs4 import BeautifulSoup
from selenium import webdriver
from selenium.webdriver.common.by import By
from selenium.webdriver.chrome.service import Service

## get_episodes_links.py
import re as regex

def get_episodes_links(link: str, driver_service) -> List[str]:
    """Retrieve links to episodes, from series' season main page.

    Args:
        link (str): link to season main page.
        driver_service (Service): a Chrome web driver.

    Returns:

## get_ratings_and_reviews_page.py
def get_ratings_page(episode_page: str, suffix: str="/ratings/?ref_=tt_ov_rt"):
    """Build a ratings-page URL from an episode-page URL.

    Everything from the last "/" of ``episode_page`` onward is discarded and
    ``suffix`` is appended to what remains.

    Args:
        episode_page (str): URL of the episode page.
        suffix (str): text appended to the trimmed URL.

    Returns:
        str: the trimmed URL followed by ``suffix``.
    """
    # rpartition gives an empty head when the input contains no "/" at all.
    base_url, _, _ = episode_page.rpartition("/")
    return base_url + suffix

def get_reviews_page(episode_page: str, suffix: str="/reviews?ref_=tt_urv"):
    """Build a reviews-page URL from an episode-page URL.

    Everything from the last "/" of ``episode_page`` onward is discarded and
    ``suffix`` is appended to what remains.

    Args:
        episode_page (str): URL of the episode page.
        suffix (str): text appended to the trimmed URL.

    Returns:
        str: the trimmed URL followed by ``suffix``.
    """
    # rpartition gives an empty head when the input contains no "/" at all.
    base_url, _, _ = episode_page.rpartition("/")
    return base_url + suffix

## fetch_el_if_available.py
from typing import Union

def fetch_el_if_available(soup: BeautifulSoup, element_type: str, class_type: str) -> Union[str, None]:
    """Returns element text if found, otherwise returns None.

    Args:
        soup (BeautifulSoup): a bs4 soup.
        element_type (str): HTML type e.g. 'div'.
        class_type (str): the class of the desired element.


## scrape_reviews_page.py
def scrape_reviews_page(reviews_soup: BeautifulSoup) -> pd.DataFrame:
    """Scrape IMDB reviews page.

    Note: Extracts ratings, usernames, review date, titles, review body text,
    number of reactions, total reactions to review.

    Args:
        reviews_soup (BeautifulSoup): soup of the entirely loaded reviews page.

    Returns:

## scrape_imdb_reviews_pages_main.py
@timing
def main(season_link: str, show_link: str, driver_service: Service, output_path: str) -> None:
    """Main function to scrape an IMDB season's reviews for each episode and also the general reviews.

    Args:
        season_link (str): URL pointing to season page.
        show_link (str): URL pointing to show general reviews.
        driver_service (Service): a Chrome web driver.
        output_path (str): path including filename where we want to save the CSV.
    """

## imports_scraper_classes.py
# Data manipulation
import pandas as pd
import re as regex

# Scraping
from bs4 import BeautifulSoup
from selenium import webdriver
from selenium.webdriver.common.by import By
from selenium.webdriver.chrome.service import Service
from webdriver_manager.chrome import ChromeDriverManager

## scraper_base_class.py
class ScraperException(Exception):
    """Base class from which all scraper exceptions derive."""


class ImdbScraperException(ScraperException):
    """Base class for IMDB scraper exceptions; a ScraperException subtype."""
	from time import time

	def timing(f: Callable) -> None:
	"""Times a function runtime in minutes.

	Args:
	f (callable): a function/method.
	"""
	def wrap(args, *kw):
	ts = time()
	import requests
	from bs4 import BeautifulSoup
	from selenium import webdriver
	from selenium.webdriver.common.by import By
	from selenium.webdriver.chrome.service import Service
	from webdriver_manager.chrome import ChromeDriverManager

	def make_soup_with_selenium(url: str, driver_service: Service) -> BeautifulSoup:
	"""Return an HTML body from an URL.
	# Data manipulation
	import pandas as pd
	import re as regex

	# Scraping
	import requests
	from bs4 import BeautifulSoup
	from selenium import webdriver
	from selenium.webdriver.common.by import By
	from selenium.webdriver.chrome.service import Service
	import re as regex

	def get_episodes_links(link: str, driver_service) -> List[str]:
	"""Retrieve links to episodes, from series' season main page.

	Args:
	link (str): link to season main page.
	driver_service (Service): a Chrome web driver.

	Returns:
	def get_ratings_page(episode_page: str, suffix: str="/ratings/?ref_=tt_ov_rt"):
		"""Build a ratings-page URL from an episode-page URL.

		Everything from the last "/" of ``episode_page`` onward is discarded
		and ``suffix`` is appended to what remains.

		Args:
			episode_page (str): URL of the episode page.
			suffix (str): text appended to the trimmed URL.

		Returns:
			str: the trimmed URL followed by ``suffix``.
		"""
		# The body must be nested under the def; a flat layout does not parse.
		return "/".join(episode_page.split("/")[:-1]) + suffix

	def get_reviews_page(episode_page: str, suffix: str="/reviews?ref_=tt_urv"):
		"""Build a reviews-page URL from an episode-page URL.

		Everything from the last "/" of ``episode_page`` onward is discarded
		and ``suffix`` is appended to what remains.

		Args:
			episode_page (str): URL of the episode page.
			suffix (str): text appended to the trimmed URL.

		Returns:
			str: the trimmed URL followed by ``suffix``.
		"""
		# The body must be nested under the def; a flat layout does not parse.
		return "/".join(episode_page.split("/")[:-1]) + suffix
	from typing import Union

	def fetch_el_if_available(soup: BeautifulSoup, element_type: str, class_type: str) -> Union[str, None]:
	"""Returns element text if found, otherwise returns None.

	Args:
	soup (BeautifulSoup): a bs4 soup.
	element_type (str): HTML type e.g. 'div'.
	class_type (str): the class of the desired element.
	def scrape_reviews_page(reviews_soup: BeautifulSoup) -> pd.DataFrame:
	"""Scrape IMDB reviews page.

	Note: Extracts ratings, usernames, review date, titles, review body text,
	number of reactions, total reactions to review.

	Args:
	reviews_soup (BeautifulSoup): soup of the entirely loaded reviews page.

	Returns:
	@timing
	def main(season_link: str, show_link: str, driver_service: Service, output_path: str) -> None:
	"""Main function to scrape an IMDB season's reviews for each episode and also the general reviews.

	Args:
	season_link (str): URL pointing to season page.
	show_link (str): URL pointing to show general reviews.
	driver_service (Service): a Chrome web driver.
	output_path (str): path including filename where we want to save the CSV.
	"""
	class ScraperException(Exception):
		"""Base class from which all scraper exceptions derive."""


	class ImdbScraperException(ScraperException):
		"""Base class for IMDB scraper exceptions; a ScraperException subtype."""