1
0
mirror of https://github.com/instaloader/instaloader.git synced 2024-09-12 00:32:24 +02:00

Add unicode normalization of captions (#1453)

This commit is contained in:
MiguelX413 2022-03-17 15:06:26 +00:00 committed by GitHub
parent fdcf2e1367
commit 463ada519e
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@@ -6,6 +6,7 @@ from collections import namedtuple
from datetime import datetime from datetime import datetime
from pathlib import Path from pathlib import Path
from typing import Any, Dict, Iterable, Iterator, List, Optional, Tuple, Union from typing import Any, Dict, Iterable, Iterator, List, Optional, Tuple, Union
from unicodedata import normalize
from . import __version__ from . import __version__
from .exceptions import * from .exceptions import *
@@ -322,9 +323,9 @@ class Post:
def caption(self) -> Optional[str]: def caption(self) -> Optional[str]:
"""Caption.""" """Caption."""
if "edge_media_to_caption" in self._node and self._node["edge_media_to_caption"]["edges"]: if "edge_media_to_caption" in self._node and self._node["edge_media_to_caption"]["edges"]:
return self._node["edge_media_to_caption"]["edges"][0]["node"]["text"] return normalize("NFC", self._node["edge_media_to_caption"]["edges"][0]["node"]["text"])
elif "caption" in self._node: elif "caption" in self._node:
return self._node["caption"] return normalize("NFC", self._node["caption"])
return None return None
@property @property