Compare commits

..

No commits in common. "d8a0e46c81a5b5ef1810c0e766cbad6b8a8a1725" and "257d61aefc391124bad8e41fef34b4fc2f211473" have entirely different histories.

2 changed files with 8 additions and 31 deletions

View file

@ -7,4 +7,3 @@ languages:
- en - en
- es - es
default_language: en default_language: en
exclude_tags: []

View file

@ -43,7 +43,6 @@ def detect_article_language(article_description: str) -> str:
except AttributeError: except AttributeError:
return default_language.iso_code_639_1.name return default_language.iso_code_639_1.name
engine = create_engine("sqlite:///kuow.db") engine = create_engine("sqlite:///kuow.db")
Base.metadata.create_all(engine) Base.metadata.create_all(engine)
@ -131,39 +130,18 @@ with Session(engine) as session:
except (NameError, TypeError): except (NameError, TypeError):
print("Could not find or load IDs for this post") print("Could not find or load IDs for this post")
tags: list[str] = []
try: try:
tags.extend( tags = article_soup.find(
article_soup.find( "script", {"class": "dfp_targeting", "data-key": "tags"}
"script", {"class": "dfp_targeting", "data-key": "tags"} )["data-value"].split("|")
)["data-value"].split("|")
)
except (NameError, TypeError): except (NameError, TypeError):
print("Could not find or load any tags from the 'tags' property") print("Could not find or load any tags for this article")
tags = []
try:
tags.extend(
article_soup.find(
"script", {"class": "dfp_targeting", "data-key": "topics"}
)["data-value"].split("|")
)
except (NameError, TypeError):
print("Could not find or load any tags from the 'tags' property")
# Remove duplicates
tags = list(set(tags))
additional_tag_string = "" additional_tag_string = ""
for tag in tags: for tag in tags:
tag = tag.title().replace(" ", "").replace("&", "And") # TODO: Do a check for tags in the config file that we don't want to tag posts with
if tag.casefold() in config["exclude_tags"]: additional_tag_string += " #{}".format(tag.title().replace(" ", ""))
print(
"Tag {} was found in the article, but won't be included in the post".format(
tag
)
)
else:
additional_tag_string += " #{}".format(tag)
try: try:
article_description = ( article_description = (