mirror of
https://github.com/Crocmagnon/charasheet.git
synced 2025-01-03 19:51:49 +01:00
Complete path import
This commit is contained in:
parent
f601b71928
commit
bc0c6108e4
1 changed files with 45 additions and 17 deletions
|
@ -1,5 +1,6 @@
|
|||
from django.core.management import BaseCommand
|
||||
from selenium import webdriver
|
||||
from selenium.webdriver import Keys
|
||||
from selenium.webdriver.common.by import By
|
||||
|
||||
from character.models import Path, Profile, Race
|
||||
|
@ -10,9 +11,13 @@ class Command(BaseCommand):
|
|||
url = "https://www.co-drs.org/fr/jeu/voies"
|
||||
self.setup_selenium()
|
||||
self.selenium.get(url)
|
||||
anchors = self.selenium.find_elements(
|
||||
By.CSS_SELECTOR, ".card-body .card-title a"
|
||||
)
|
||||
anchors = []
|
||||
expected_path_count = 95
|
||||
while len(anchors) < expected_path_count:
|
||||
self.selenium.find_element(By.TAG_NAME, "body").send_keys(Keys.END)
|
||||
anchors = self.selenium.find_elements(
|
||||
By.CSS_SELECTOR, ".card-body .card-title a"
|
||||
)
|
||||
urls = [anchor.get_attribute("href") for anchor in anchors]
|
||||
for url in urls:
|
||||
try:
|
||||
|
@ -23,18 +28,27 @@ class Command(BaseCommand):
|
|||
|
||||
def import_path(self, url: str):
|
||||
self.selenium.get(url)
|
||||
name = self.selenium.find_element(By.TAG_NAME, "h1").text
|
||||
category = self.get_category(name)
|
||||
name = self.selenium.find_element(By.TAG_NAME, "h1").text.replace("’", "'")
|
||||
if name == "Voie du haut-elfe": # Fix for incorrect data
|
||||
category = Path.Category.RACE
|
||||
else:
|
||||
category = self.get_category(name)
|
||||
profile = None
|
||||
if category == Path.Category.PROFILE:
|
||||
profile = self.get_profile()
|
||||
profile = self.get_profile(name)
|
||||
race = None
|
||||
if category == Path.Category.RACE:
|
||||
profile = self.get_race(name)
|
||||
race = self.get_race(name)
|
||||
notes = self.get_notes(name)
|
||||
|
||||
path, _ = Path.objects.update_or_create(
|
||||
name=name,
|
||||
defaults={"category": category, "profile": profile, "race": race},
|
||||
defaults={
|
||||
"category": category,
|
||||
"profile": profile,
|
||||
"race": race,
|
||||
"notes": notes,
|
||||
},
|
||||
)
|
||||
self.stdout.write(self.style.SUCCESS(f"Created/updated path {path}"))
|
||||
|
||||
|
@ -61,18 +75,32 @@ class Command(BaseCommand):
|
|||
return Path.Category.CREATURE
|
||||
return Path.Category(category)
|
||||
|
||||
def get_profile(self) -> Profile:
|
||||
profile_name = self.selenium.find_element(
|
||||
By.CSS_SELECTOR, ".field--name-type + strong + a"
|
||||
).text
|
||||
return Profile.objects.get_by_natural_key(profile_name)
|
||||
def get_profile(self, name: str) -> Profile | None:
|
||||
try:
|
||||
profile_name = self.selenium.find_element(
|
||||
By.CSS_SELECTOR, ".field--name-type + strong + a"
|
||||
).text
|
||||
return Profile.objects.get_by_natural_key(profile_name)
|
||||
except Exception:
|
||||
self.stdout.write(self.style.WARNING(f"Couldn't find profile for {name}"))
|
||||
|
||||
def get_race(self, path_name: str) -> Race:
|
||||
return None
|
||||
to_remove = [""]
|
||||
def get_race(self, path_name: str) -> Race | None:
|
||||
to_remove = ["voie de la", "voie de l'", "voie du"]
|
||||
path_name = path_name.lower()
|
||||
for text in to_remove:
|
||||
path_name = path_name.replace(text, "")
|
||||
return Race.objects.get(name__iexact=path_name)
|
||||
try:
|
||||
return Race.objects.get(name__iexact=path_name.strip())
|
||||
except Exception:
|
||||
self.stdout.write(self.style.WARNING(f"Couldn't find race for {path_name}"))
|
||||
|
||||
def get_notes(self, path_name: str) -> str:
|
||||
try:
|
||||
return self.selenium.find_element(
|
||||
By.CLASS_NAME, "field--name-description"
|
||||
).text.strip()
|
||||
except Exception:
|
||||
return ""
|
||||
|
||||
def setup_selenium(self):
|
||||
options = webdriver.FirefoxOptions()
|
||||
|
|
Loading…
Reference in a new issue