From 4f1a7073abead3e2d5c614557853094ccf0dabb8 Mon Sep 17 00:00:00 2001 From: Alban Gruin Date: Thu, 6 Sep 2018 18:17:35 +0200 Subject: management: nouveau script pour scrapper les salles Signed-off-by: Alban Gruin --- management/commands/scraprooms.py | 36 ++++++++++++++++++++++++++++++++++++ 1 file changed, 36 insertions(+) create mode 100644 management/commands/scraprooms.py (limited to 'management/commands') diff --git a/management/commands/scraprooms.py b/management/commands/scraprooms.py new file mode 100644 index 0000000..c448d61 --- /dev/null +++ b/management/commands/scraprooms.py @@ -0,0 +1,36 @@ +# Copyright (C) 2018 Alban Gruin +# +# celcatsanitizer is free software: you can redistribute it and/or modify +# it under the terms of the GNU Affero General Public License as published +# by the Free Software Foundation, either version 3 of the License, or +# (at your option) any later version. +# +# celcatsanitizer is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU Affero General Public License for more details. +# +# You should have received a copy of the GNU Affero General Public License +# along with celcatsanitizer. If not, see . + +from bs4 import BeautifulSoup +from django.core.management.base import BaseCommand +from django.db import transaction + +from edt.models import Room + + +class Command(BaseCommand): + help = "Scraps rooms from file" + + def add_arguments(self, parser): + parser.add_argument("--file", type=str, required=True) + + @transaction.atomic + def handle(self, *args, **options): + with open(options["file"], "r") as rooms: + soup = BeautifulSoup(rooms.read(), "html.parser") + + rooms = [option.text for option in soup.find_all("option")[1:]] + for room in set(rooms): + Room(name=room).save() -- cgit v1.2.1