add open file tmp

This commit is contained in:
Valentin CZERYBA 2023-06-20 21:38:39 +02:00
parent 35ff22d463
commit 0eab1d885b
2 changed files with 39 additions and 19 deletions

View File

@ -161,7 +161,14 @@ class WPExport:
except Exception as err: except Exception as err:
self._logger.error("{0} : Exception error : {1}".format(self._name, err)) self._logger.error("{0} : Exception error : {1}".format(self._name, err))
exit(1) exit(1)
return webpage try:
string_webpage = json.dumps(webpage)
open("{0}/{1}.json".format(self._tmp, self._name), "wt").write(string_webpage)
except Exception as ex:
self._logger.error("{0} : Error for writing webpage : {1}".format(self._name, ex))

View File

@ -40,25 +40,38 @@ class WPimport:
self._wordpress = wordpress self._wordpress = wordpress
def fromUrl(self, first, second):
    """Import every URL still pending in the temporary JSON file.

    The list of URLs is read from ``<self._tmp>/<self._name>.json`` at
    ``webpage_content[first][second]``. Each URL is fetched with
    ``self._request``; a page containing a ``div.articlebody`` is handed to
    ``_addOrUpdatePost``, any other page to ``_addOrUpdateFeaturedMedia``.
    After a page has been handled, its URL is removed from the pending list
    and the JSON file is rewritten.

    :param first: first-level key into the JSON document.
    :param second: second-level key; the value under it is the URL list.
    :return: None. Failures are logged; connection and I/O errors raised
        while processing a URL terminate the process with ``exit(1)``.
    """
    # Same path layout as the writer side: "<tmp>/<name>.json".
    path = "{0}/{1}.json".format(self._tmp, self._name)
    try:
        with open(path) as content_file:
            webpage_content = json.load(content_file)
        webpage = webpage_content[first][second]
        # Iterate over a snapshot: the live list shrinks as URLs succeed,
        # and deleting by index while looping would skip entries.
        pending = list(webpage)
    except Exception as ex:
        self._logger.error("{0} : Read file json from tmp : {1}".format(self._name, ex))
        return

    total = len(pending)
    for i, url in enumerate(pending):
        try:
            r = self._request.get(url)
            if r.status_code == 200:
                self._logger.info("{0} : ({1}/{2}) : Page is importing : {3}".format(self._name, i+1, total, url))
                soup = BeautifulSoup(r.content, self._parser)
                articlebody = soup.find_all("div", class_="articlebody")
                if len(articlebody) > 0:
                    self._addOrUpdatePost(soup)
                else:
                    self._addOrUpdateFeaturedMedia(soup)
                # Persist progress after each handled page.
                webpage.remove(url)
                with open(path, "wt") as content_file:
                    content_file.write(json.dumps(webpage_content))
            else:
                self._logger.error("{0} : Connection error for get url {1} with status code : {2}".format(self._name, url, r.status_code))
                self._logger.debug("{0} : {1}".format(self._name, r.content))
        except ConnectionError as err:
            self._logger.error("{0} : Connection error for get url {1} : {2}".format(self._name, url, err))
            exit(1)
        except IOError as err:
            self._logger.error("{0} : Connection error for IO url {1} : {2}".format(self._name, url, err))
            exit(1)
        except Exception as err:
            self._logger.error("{0} : Exception error for get url {1} : {2}".format(self._name, url, err))
def fromDirectory(self, directory="", number_thread=1, max_thread=1): def fromDirectory(self, directory="", number_thread=1, max_thread=1):