Scrape mynixos.com

This commit is contained in:
Peter Vacho 2024-11-25 11:50:39 +01:00
parent ac0c2a8c21
commit 71b33db9d9
Signed by: school
GPG key ID: 8CFC3837052871B4

View file

@@ -12,8 +12,8 @@ from src.pagerank import pagerank, test_pagerank
from src.util import add_ratings_to_dataframe, dataframe_to_urlmap, extract_ratings_from_dataframe, urlmap_to_dataframe from src.util import add_ratings_to_dataframe, dataframe_to_urlmap, extract_ratings_from_dataframe, urlmap_to_dataframe
from src.visualization import display_top_urls from src.visualization import display_top_urls
URL = httpx.URL("https://ailab.fai.utb.cz") URL = httpx.URL("https://mynixos.com/")
ALLOWED_HOSTS_RE = re.compile(r"(?:.*\.)?utb\.cz") ALLOWED_HOSTS_RE = re.compile(r".*")
CACHE_RESULTS_DIR = Path.cwd() / "cache" CACHE_RESULTS_DIR = Path.cwd() / "cache"