_tag_interface.py 8.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269
import abc
import re
import typing

import mutagen.id3
import mutagen.mp4
import mutagen.oggopus
import mutagen.oggvorbis

from symuid._uuid import uuid_bytes_to_str, uuid_str_to_bytes
  7. class TagInterface(abc.ABC):
  8. @abc.abstractproperty
  9. def track_path(self):
  10. pass
  11. @abc.abstractmethod
  12. def get_comment(self):
  13. pass
  14. @abc.abstractmethod
  15. def set_comment(self, comment):
  16. pass
  17. @abc.abstractmethod
  18. def get_track_uuid(self):
  19. pass
  20. @abc.abstractmethod
  21. def set_track_uuid(self, uuid):
  22. pass
  23. @abc.abstractmethod
  24. def save(self):
  25. pass
  26. @abc.abstractmethod
  27. def get_free_int(self, tag_label):
  28. pass
  29. @abc.abstractmethod
  30. def set_free_int(self, tag_label, data):
  31. pass
  32. @abc.abstractmethod
  33. def get_free_ints(self, tag_label_prefix):
  34. pass
  35. class _MutagenTagInterface(TagInterface):
  36. # pylint: disable=abstract-method
  37. def __init__(self, mutagen_file):
  38. self._mutagen_file = mutagen_file
  39. @property
  40. def track_path(self):
  41. return self._mutagen_file.filename
  42. def save(self):
  43. self._mutagen_file.save()
  44. class ID3(_MutagenTagInterface):
  45. # http://id3.org/id3v2.4.0-frames#4.1.
  46. _UFID_OWNER_ID = 'symuid'
  47. def __init__(self, mutagen_file):
  48. assert isinstance(mutagen_file.tags, mutagen.id3.ID3), \
  49. mutagen_file.tags
  50. super().__init__(mutagen_file)
  51. def _get_single_text(self, tag_label):
  52. tag = self._mutagen_file.tags.get(tag_label, None)
  53. if tag is None:
  54. # {}.get('a') == None
  55. return None
  56. if len(tag.text) == 1:
  57. return tag.text[0]
  58. raise ValueError(tag)
  59. def get_free_ints(self, tag_label_prefix):
  60. for tag in self._mutagen_file.tags.getall('TXXX:' + tag_label_prefix):
  61. assert len(tag.text) == 1, tag
  62. yield (tag.desc, int(tag.text[0]))
  63. def get_free_int(self, tag_label):
  64. text = self._get_single_text('TXXX:' + tag_label)
  65. return int(text) if text else None
  66. def set_free_int(self, tag_label, data):
  67. # mutagen.id3._specs.EncodedTextSpec.write encodes 'desc' and 'text'
  68. tag = mutagen.id3.TXXX(
  69. encoding=mutagen.id3.Encoding.LATIN1,
  70. desc=tag_label,
  71. text=[str(data)],
  72. )
  73. # TODO overwrite instead of add() ?
  74. self._mutagen_file.tags.add(tag)
  75. return tag
  76. def get_comment(self):
  77. return self._get_single_text('COMM::eng')
  78. def set_comment(self, comment):
  79. tag = mutagen.id3.COMM(
  80. encoding=mutagen.id3.Encoding.UTF8,
  81. lang='eng',
  82. text=[comment],
  83. )
  84. self._mutagen_file.tags.add(tag)
  85. return tag
  86. def get_track_uuid(self):
  87. for ufid in self._mutagen_file.tags.getall('UFID'):
  88. if ufid.owner == self._UFID_OWNER_ID:
  89. return ufid.data
  90. return None
  91. def set_track_uuid(self, uuid):
  92. # mutagen.id3._specs.EncodedTextSpec.write encodes 'owner'
  93. tag = mutagen.id3.UFID(owner=self._UFID_OWNER_ID, data=uuid)
  94. self._mutagen_file.tags.add(tag)
  95. return tag
  96. class MP4(_MutagenTagInterface):
  97. _UUID_TAG_KEY = 'symuid:uuid'
  98. _COMMENT_TAG_KEY = '\xa9cmt'
  99. def __init__(self, mutagen_file):
  100. assert mutagen_file.tags is not None, mutagen_file
  101. assert isinstance(mutagen_file.tags, mutagen.mp4.MP4Tags), \
  102. mutagen_file.tags
  103. super().__init__(mutagen_file)
  104. def _get_single(self, tag_label):
  105. tag = self._mutagen_file.tags.get(tag_label, None)
  106. if tag is None:
  107. # {}.get('a') == None
  108. return None
  109. if len(tag) == 1:
  110. return tag[0]
  111. raise ValueError(tag)
  112. @staticmethod
  113. def _freeform_to_int(freeform):
  114. # "a signed big-endian integer with length one of { 1,2,3,4,8 } bytes"
  115. assert freeform.dataformat == mutagen.mp4.AtomDataType.INTEGER, freeform
  116. return int.from_bytes(freeform, byteorder='big', signed=True)
  117. def get_free_ints(self, tag_label_prefix):
  118. label_pattern = re.compile(r'^----:{}(:|$)'.format(
  119. re.escape(tag_label_prefix),
  120. ))
  121. for label, values in self._mutagen_file.tags.items():
  122. # TODO overwrite instead of add() ?
  123. if label_pattern.match(label):
  124. assert len(values) == 1, (label, values)
  125. value = MP4._freeform_to_int(values[0])
  126. yield (re.sub(r'^----:', '', label), value)
  127. def _get_free(self, tag_label):
  128. # freeform keys start with '----'
  129. # http://mutagen.readthedocs.io/en/latest/api/mp4.html
  130. return self._get_single('----:' + tag_label)
  131. def get_free_int(self, tag_label):
  132. tag = self._get_free(tag_label)
  133. return None if tag is None else MP4._freeform_to_int(tag)
  134. def _get_free_uuid(self, tag_label):
  135. tag = self._get_free(tag_label)
  136. assert tag is None or tag.dataformat == mutagen.mp4.AtomDataType.UUID, tag.dataformat
  137. return tag
  138. def _set_free(self, tag_label, dataformat, data):
  139. assert isinstance(data, bytes)
  140. tag = mutagen.mp4.MP4FreeForm(dataformat=dataformat, data=data)
  141. self._mutagen_file.tags['----:' + tag_label] = [tag]
  142. return tag
  143. def set_free_int(self, tag_label, data):
  144. assert isinstance(data, int)
  145. return self._set_free(
  146. tag_label=tag_label,
  147. # "a signed big-endian integer with length one of { 1,2,3,4,8 } bytes"
  148. dataformat=mutagen.mp4.AtomDataType.INTEGER,
  149. # TODO set byte length properly
  150. data=data.to_bytes(1, byteorder='big', signed=True),
  151. )
  152. def _set_free_uuid(self, tag_label, data):
  153. return self._set_free(
  154. tag_label=tag_label,
  155. # https://mutagen.readthedocs.io/en/latest/api/mp4.html#mutagen.mp4.AtomDataType.UUID
  156. dataformat=mutagen.mp4.AtomDataType.UUID,
  157. data=data,
  158. )
  159. def get_comment(self):
  160. return self._get_single(self._COMMENT_TAG_KEY)
  161. def set_comment(self, comment: str) -> None:
  162. self._mutagen_file[self._COMMENT_TAG_KEY] = [comment]
  163. def get_track_uuid(self):
  164. return self._get_free_uuid(self._UUID_TAG_KEY)
  165. def set_track_uuid(self, uuid):
  166. return self._set_free_uuid(self._UUID_TAG_KEY, uuid)
  167. class Ogg(_MutagenTagInterface):
  168. # https://github.com/cmus/cmus/blob/9a0723f7a90dc7de0898be87963d5105a999aa6c/ip/opus.c#L229
  169. # https://github.com/cmus/cmus/blob/9a0723f7a90dc7de0898be87963d5105a999aa6c/ip/vorbis.c#L319
  170. # https://github.com/cmus/cmus/blob/17bf542c6b120d9dcf6642b259d78badfc1143eb/comment.c#L224
  171. _COMMENT_TAG_KEY = 'comment'
  172. _UUID_TAG_KEY = 'symuid:uuid'
  173. def __init__(self, mutagen_file):
  174. assert isinstance(mutagen_file.tags, (mutagen.oggopus.OggOpusVComment,
  175. mutagen.oggvorbis.OggVCommentDict)), \
  176. (type(mutagen_file), type(mutagen_file.tags))
  177. super().__init__(mutagen_file)
  178. def _get_single_text(self, tag_label) -> typing.Optional[str]:
  179. tag = self._mutagen_file.get(tag_label, None) # type: list
  180. if tag is None:
  181. return None
  182. if len(tag) > 1:
  183. raise ValueError((self.track_path, tag))
  184. if not isinstance(tag[0], str):
  185. raise ValueError((self.track_path, tag))
  186. return tag[0]
  187. def get_comment(self) -> typing.Optional[str]:
  188. return self._get_single_text(self._COMMENT_TAG_KEY)
  189. def set_comment(self, comment: str) -> None:
  190. self._mutagen_file[self._COMMENT_TAG_KEY] = comment
  191. def get_track_uuid(self) -> typing.Optional[bytes]:
  192. uuid_str = self._get_single_text(self._UUID_TAG_KEY)
  193. return uuid_str_to_bytes(uuid_str) if uuid_str else None
  194. def set_track_uuid(self, uuid: bytes) -> None:
  195. self._mutagen_file[self._UUID_TAG_KEY] = uuid_bytes_to_str(uuid)
  196. def get_free_int(self, tag_label: str) -> typing.Optional[int]:
  197. dec = self._get_single_text(tag_label)
  198. return int(dec) if dec else None
  199. def get_free_ints(self, tag_label_prefix: str) \
  200. -> typing.Iterator[typing.Tuple[str, int]]:
  201. for tag_key, tag_value in self._mutagen_file.items():
  202. if tag_key == tag_label_prefix \
  203. or tag_key.startswith(tag_label_prefix + ':'):
  204. if len(tag_value) > 1:
  205. raise ValueError((self.track_path, tag_key, tag_value))
  206. yield (tag_key, int(tag_value[0]))
  207. def set_free_int(self, tag_label: str, data: int) -> typing.Tuple:
  208. self._mutagen_file[tag_label] = str(data)
  209. return (tag_label, self._mutagen_file[tag_label])