Skip to content
Open
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
21 changes: 10 additions & 11 deletions main.py
Original file line number Diff line number Diff line change
@@ -1,16 +1,9 @@
"""FreeWork Data Scraper — CLI entry point.

Usage:
    python main.py                      # Interactive mode
    python main.py --url "https://..."  # Direct URL mode
    streamlit run app.py                # Streamlit UI mode
"""

from __future__ import annotations

import argparse
import logging
import sys
import re

from freework_scraper import __version__
from freework_scraper.scraper.browser import BrowserManager
Expand All @@ -28,6 +21,8 @@
)
logger = logging.getLogger("freework")

TRUSTED_DOMAIN = r"^https://www\.free-work\.com/"


def parse_args() -> argparse.Namespace:
parser = argparse.ArgumentParser(
Expand Down Expand Up @@ -78,6 +73,10 @@ def parse_args() -> argparse.Namespace:
return parser.parse_args()


def validate_url(url: str) -> bool:
    """Tell whether *url* matches the module-level ``TRUSTED_DOMAIN`` pattern.

    The pattern is applied with ``re.match``, which only matches at the
    beginning of the string, so the trusted prefix must open the URL.

    Args:
        url: The candidate search URL.

    Returns:
        ``True`` if the pattern matches, ``False`` otherwise.
    """
    found = re.match(TRUSTED_DOMAIN, url)
    if found is None:
        return False
    return True


def main() -> None:
args = parse_args()

Expand All @@ -86,8 +85,8 @@ def main() -> None:
if not search_url:
search_url = input("Entrez l'URL de recherche FreeWork : ").strip()

if not search_url:
logger.error("Aucune URL fournie. Abandon.")
if not search_url or not validate_url(search_url):
logger.error("URL invalide ou non fournie. Abandon.")
sys.exit(1)

headless = args.headless and not args.no_headless
Expand Down Expand Up @@ -178,4 +177,4 @@ def on_job(idx, total, job):


if __name__ == "__main__":
main()
main()