From 9bbf769b40b1da6d92fbaa15572e8589f3676b5a Mon Sep 17 00:00:00 2001 From: Valentin CZERYBA Date: Sat, 1 Jul 2023 22:16:35 +0200 Subject: [PATCH] test WIP --- import_export_canalblog.py | 2 +- lib/WPMenu.py | 23 ++++++++++++++--------- 2 files changed, 15 insertions(+), 10 deletions(-) diff --git a/import_export_canalblog.py b/import_export_canalblog.py index de1c15e..70cccdd 100644 --- a/import_export_canalblog.py +++ b/import_export_canalblog.py @@ -247,7 +247,7 @@ if __name__ == '__main__': os.makedirs(args.tmp, exist_ok=True) - if args.command == "import" or args.command == "remove" or args.command = "menu": + if args.command == "import" or args.command == "remove" or args.command == "menu": password = args.password if len(args.password) == 0: password = getpass() diff --git a/lib/WPMenu.py b/lib/WPMenu.py index 90d9dfc..b118276 100644 --- a/lib/WPMenu.py +++ b/lib/WPMenu.py @@ -16,19 +16,23 @@ class WPMenu: self._logger = logger self._parser = parser self._headers_json = {'Content-Type': 'application/json; charset=utf-8', 'Accept':'application/json'} - self._protocol_wordpress, self._protocol_canalblog = "https" + self._protocol_wordpress = "https" + self._protocol_canalblog = "https" self._directory = "backup" if ssl_wordpress is False: self._protocol_wordpress = "http" if ssl_canalblog is False: self._protocol_canalblog = "http" - self._request = requests.Session() + self._request_canalblog = requests.Session() + self._request_wordpress = requests.Session() retries = Retry(connect=10, read=10, redirect=5, status_forcelist=[429, 500, 502, 503, 504], backoff_factor=2) - self._request.mount('{0}://'.format(self._protocol), HTTPAdapter(max_retries=retries)) + self._request_canalblog.mount('{0}://'.format(self._protocol_canalblog), HTTPAdapter(max_retries=retries)) + self._request_wordpress.mount('{0}://'.format(self._protocol_wordpress), HTTPAdapter(max_retries=retries)) + # Destructor def __del__(self): @@ -56,7 +60,7 @@ class WPMenu: o = urlparse(canalblog) o = o._replace(scheme=self._protocol_canalblog) i = o.geturl().replace(":///", "://") - page = self._request.get(i) + page = self._request_canalblog.get(i) if page.status_code == 200: self._logger.info("{0} : Page web is being processed : {1}".format(self._name, i)) self._menu(page.content) @@ -64,17 +68,18 @@ class WPMenu: self._logger.error("{0} : index didn't get due status code : {1}".format(self._name, page.status_code)) self._logger.debug("{0} : {1}".format(self._name, page.content)) except ConnectionError as err: - self._logger.error("{0} : Connection error for get url {1} : {2}".format(self._name, webpage[i], err)) + self._logger.error("{0} : Connection error for get url {1} : {2}".format(self._name, canalblog, err)) exit(1) except Exception as err: - self._logger.error("{0} : Exception error for get url {1} : {2}".format(self._name, webpage[i], err)) + self._logger.error("{0} : Exception error for get url {1} : {2}".format(self._name, canalblog, err)) def _menu(self, content): - soup = BeautifulSoup(page.text, self._parser) + soup = BeautifulSoup(content, self._parser) ul = soup.find_all("ul", id="listsmooth") for anchor in ul[0].find_all("li"): li = anchor.find_all("li") - for content in li: - a = content.find("a") + for child in li: + a = child.find("a") + self._logger.info("{0} {1} : {2}".format(self._name, child, a))