insert #6

Merged
v4l3n71n merged 60 commits from insert into master 2023-04-11 21:29:54 +00:00
2 changed files with 27 additions and 2 deletions
Showing only changes of commit e74dfc2b73 - Show all commits

View File

@@ -14,6 +14,18 @@ class WPimport:
# Public method
def fromUrl(self, webpage):
    """Fetch each URL in ``webpage`` and dispatch the parsed page.

    Every URL is requested with ``requests.get``. A response whose status
    code is 200 is parsed with ``BeautifulSoup`` using ``self._parser``.
    The parsed document is passed to ``self._addOrUpdatePost`` when it
    contains at least one ``<div class="articlebody">``, and to
    ``self._addOrUpdateFeaturedMedia`` otherwise.

    Args:
        webpage: iterable of URLs to fetch.
    """
    for url in webpage:
        response = requests.get(url)
        # Any status other than 200 is skipped without being reported.
        if response.status_code != 200:
            continue
        document = BeautifulSoup(response.content, self._parser)
        # find_all returns an empty result when no matching div exists,
        # so its truthiness selects between the two handlers.
        if document.find_all("div", class_="articlebody"):
            self._addOrUpdatePost(document)
        else:
            self._addOrUpdateFeaturedMedia(document)
def fromDirectory(self, directory):
directory = "{0}/archives".format(directory)
directories = self._getDirectories([], "{0}".format(directory))

View File

@@ -37,7 +37,7 @@ if __name__ == '__main__':
args = parser.parse_args()
logger = logging.getLogger('insert wordpress')
logger = logging.getLogger('import export canalblog')
formatter = logging.Formatter('%(asctime)s - %(name)s - %(levelname)s - %(message)s')
if args.quiet is False:
@@ -74,7 +74,20 @@ if __name__ == '__main__':
exit(0)
if len(args.directory) > 0:
importWp.fromDirectory(args.directory)
exit(0)
exit(0)
if len(args.canalblog) > 0:
try:
o = urlparse(args.canalblog)
o = o._replace(scheme="https")
url = o.geturl().replace(":///", "://")
except Exception as err:
logger.error("parsing error : {0}".format(err))
exit(1)
exportWp = WPExport.WPExport(url, logger, args.parser, args.directory)
webpage = exportWp.getUrlPage()
importWp.fromUrl(webpage)
if args.command == "export":
try:
o = urlparse(args.url)