// AudioFileProber.cs (23 KB)
  1. using System;
  2. using System.Collections.Generic;
  3. using System.Globalization;
  4. using System.Linq;
  5. using System.Threading;
  6. using System.Threading.Tasks;
  7. using ATL;
  8. using Jellyfin.Data.Enums;
  9. using Jellyfin.Extensions;
  10. using MediaBrowser.Controller.Entities;
  11. using MediaBrowser.Controller.Entities.Audio;
  12. using MediaBrowser.Controller.Library;
  13. using MediaBrowser.Controller.Lyrics;
  14. using MediaBrowser.Controller.MediaEncoding;
  15. using MediaBrowser.Controller.Persistence;
  16. using MediaBrowser.Controller.Providers;
  17. using MediaBrowser.Model.Dlna;
  18. using MediaBrowser.Model.Dto;
  19. using MediaBrowser.Model.Entities;
  20. using MediaBrowser.Model.Extensions;
  21. using MediaBrowser.Model.MediaInfo;
  22. using Microsoft.Extensions.Logging;
  23. using static Jellyfin.Extensions.StringExtensions;
  24. namespace MediaBrowser.Providers.MediaInfo
  25. {
  26. /// <summary>
  27. /// Probes audio files for metadata.
  28. /// </summary>
  29. public class AudioFileProber
  30. {
  31. private const char InternalValueSeparator = '\u001F';
  32. private readonly IMediaEncoder _mediaEncoder;
  33. private readonly IItemRepository _itemRepo;
  34. private readonly ILibraryManager _libraryManager;
  35. private readonly ILogger<AudioFileProber> _logger;
  36. private readonly IMediaSourceManager _mediaSourceManager;
  37. private readonly LyricResolver _lyricResolver;
  38. private readonly ILyricManager _lyricManager;
  39. private readonly IMediaStreamRepository _mediaStreamRepository;
  /// <summary>
  /// Initializes a new instance of the <see cref="AudioFileProber"/> class and applies the
  /// ATL tag reader settings this prober relies on.
  /// </summary>
  /// <param name="logger">Instance of the <see cref="ILogger"/> interface.</param>
  /// <param name="mediaSourceManager">Instance of the <see cref="IMediaSourceManager"/> interface.</param>
  /// <param name="mediaEncoder">Instance of the <see cref="IMediaEncoder"/> interface.</param>
  /// <param name="itemRepo">Instance of the <see cref="IItemRepository"/> interface.</param>
  /// <param name="libraryManager">Instance of the <see cref="ILibraryManager"/> interface.</param>
  /// <param name="lyricResolver">Instance of the <see cref="LyricResolver"/> class.</param>
  /// <param name="lyricManager">Instance of the <see cref="ILyricManager"/> interface.</param>
  /// <param name="mediaStreamRepository">Instance of the <see cref="IMediaStreamRepository"/> interface.</param>
  public AudioFileProber(
      ILogger<AudioFileProber> logger,
      IMediaSourceManager mediaSourceManager,
      IMediaEncoder mediaEncoder,
      IItemRepository itemRepo,
      ILibraryManager libraryManager,
      LyricResolver lyricResolver,
      ILyricManager lyricManager,
      IMediaStreamRepository mediaStreamRepository)
  {
      // Dependencies, stored in the order they are declared on the constructor.
      _logger = logger;
      _mediaSourceManager = mediaSourceManager;
      _mediaEncoder = mediaEncoder;
      _itemRepo = itemRepo;
      _libraryManager = libraryManager;
      _lyricResolver = lyricResolver;
      _lyricManager = lyricManager;
      _mediaStreamRepository = mediaStreamRepository;

      // ATL settings are static. The rest of this class splits tag values on
      // InternalValueSeparator, so ATL is configured to use that same separator.
      ATL.Settings.UseFileNameWhenNoTitle = false;
      ATL.Settings.ID3v2_separatev2v3Values = false;
      ATL.Settings.DisplayValueSeparator = InternalValueSeparator;
  }
  /// <summary>
  /// Probes an audio item with the media encoder and imports the resulting metadata.
  /// </summary>
  /// <remarks>
  /// Shortcut items are only probed when
  /// <see cref="MetadataRefreshOptions.EnableRemoteContentProbe"/> is enabled; in that case the
  /// shortcut target path is probed instead of the item path.
  /// </remarks>
  /// <param name="item">The item to probe.</param>
  /// <param name="options">The <see cref="MetadataRefreshOptions"/>.</param>
  /// <param name="cancellationToken">The <see cref="CancellationToken"/>.</param>
  /// <typeparam name="T">The concrete <see cref="Audio"/> type being probed.</typeparam>
  /// <returns>A <see cref="Task"/> whose result is <see cref="ItemUpdateType.MetadataImport"/>.</returns>
  public async Task<ItemUpdateType> Probe<T>(
      T item,
      MetadataRefreshOptions options,
      CancellationToken cancellationToken)
      where T : Audio
  {
      var path = item.Path;
      var protocol = item.PathProtocol ?? MediaProtocol.File;

      // Shortcuts are skipped entirely unless remote content probing is enabled.
      if (item.IsShortcut && !options.EnableRemoteContentProbe)
      {
          return ItemUpdateType.MetadataImport;
      }

      if (item.IsShortcut)
      {
          // Probe what the shortcut points to rather than the shortcut file itself.
          path = item.ShortcutPath;
          protocol = _mediaSourceManager.GetPathProtocol(path);
      }

      var request = new MediaInfoRequest
      {
          MediaType = DlnaProfileType.Audio,
          MediaSource = new MediaSourceInfo
          {
              Path = path,
              Protocol = protocol
          }
      };

      var probeResult = await _mediaEncoder.GetMediaInfo(request, cancellationToken).ConfigureAwait(false);

      cancellationToken.ThrowIfCancellationRequested();

      await FetchAsync(item, probeResult, options, cancellationToken).ConfigureAwait(false);

      return ItemUpdateType.MetadataImport;
  }
  /// <summary>
  /// Copies the probe result onto the audio item, resolves its lyric streams and saves the
  /// resulting media streams.
  /// </summary>
  /// <param name="audio">The <see cref="Audio"/> to update.</param>
  /// <param name="mediaInfo">The probed <see cref="Model.MediaInfo.MediaInfo"/>.</param>
  /// <param name="options">The <see cref="MetadataRefreshOptions"/>.</param>
  /// <param name="cancellationToken">The <see cref="CancellationToken"/>.</param>
  /// <returns>A <see cref="Task"/> representing the asynchronous operation.</returns>
  private async Task FetchAsync(
      Audio audio,
      Model.MediaInfo.MediaInfo mediaInfo,
      MetadataRefreshOptions options,
      CancellationToken cancellationToken)
  {
      audio.Container = mediaInfo.Container;
      audio.TotalBitrate = mediaInfo.Bitrate;
      audio.RunTimeTicks = mediaInfo.RunTimeTicks;
      audio.Size = mediaInfo.Size;

      // External lyrics are resolved first so that an existing lrc file is not
      // overwritten by embedded lyrics on the first scan.
      var streams = new List<MediaStream>(mediaInfo.MediaStreams);
      AddExternalLyrics(audio, streams, options);

      // Embedded lyrics are only extracted when no lyric stream was found so far.
      var tryExtractEmbeddedLyrics = !streams.Any(stream => stream.Type == MediaStreamType.Lyric);

      if (!audio.IsLocked)
      {
          await FetchDataFromTags(audio, mediaInfo, options, tryExtractEmbeddedLyrics).ConfigureAwait(false);

          if (tryExtractEmbeddedLyrics)
          {
              // Resolve again so lyrics saved from the tags are picked up.
              AddExternalLyrics(audio, streams, options);
          }
      }

      audio.HasLyrics = streams.Any(stream => stream.Type == MediaStreamType.Lyric);

      _mediaStreamRepository.SaveMediaStreams(audio.Id, streams, cancellationToken);
  }
  /// <summary>
  /// Reads the tags of the audio file with ATL and applies them to the item, falling back to the
  /// values in <paramref name="mediaInfo"/> for title, album, year, track number and disc number
  /// when the tag is missing.
  /// </summary>
  /// <param name="audio">The <see cref="Audio"/> to update.</param>
  /// <param name="mediaInfo">The <see cref="Model.MediaInfo.MediaInfo"/> providing fallback values.</param>
  /// <param name="options">The <see cref="MetadataRefreshOptions"/>.</param>
  /// <param name="tryExtractEmbeddedLyrics">Whether to extract embedded lyrics to lrc file.</param>
  /// <returns>A <see cref="Task"/> representing the asynchronous operation.</returns>
  private async Task FetchDataFromTags(Audio audio, Model.MediaInfo.MediaInfo mediaInfo, MetadataRefreshOptions options, bool tryExtractEmbeddedLyrics)
  {
      var libraryOptions = _libraryManager.GetLibraryOptions(audio);
      Track track = new Track(audio.Path);

      if (track.MetadataFormats
          .All(mf => string.Equals(mf.ShortName, "ID3v1", StringComparison.OrdinalIgnoreCase)))
      {
          _logger.LogWarning("File {File} only has ID3v1 tags, some fields may be truncated", audio.Path);
      }

      // We should never use the property setter of the ATL.Track class.
      // That setter is meant for its own tag parser and external editor usage and will have unwanted side effects.
      // For example, setting the Year property will also set the Date property, which is not what we want here.
      // To properly handle fallback values, we make a clone of those fields when valid.
      //
      // The fallback values can be null (for example a file without an album tag), so the trim must be
      // null-safe; the code below already copes with a null title or album.
      var trackTitle = (string.IsNullOrEmpty(track.Title) ? mediaInfo.Name : track.Title)?.Trim();
      var trackAlbum = (string.IsNullOrEmpty(track.Album) ? mediaInfo.Album : track.Album)?.Trim();
      var trackYear = track.Year is null or 0 ? mediaInfo.ProductionYear : track.Year;
      var trackTrackNumber = track.TrackNumber is null or 0 ? mediaInfo.IndexNumber : track.TrackNumber;
      var trackDiscNumber = track.DiscNumber is null or 0 ? mediaInfo.ParentIndexNumber : track.DiscNumber;

      if (audio.SupportsPeople && !audio.LockedFields.Contains(MetadataField.Cast))
      {
          var people = new List<PersonInfo>();

          var albumArtists = string.IsNullOrEmpty(track.AlbumArtist) ? [] : track.AlbumArtist.Split(InternalValueSeparator);
          if (libraryOptions.UseCustomTagDelimiters)
          {
              albumArtists = albumArtists.SelectMany(a => SplitWithCustomDelimiter(a, libraryOptions.GetCustomTagDelimiters(), libraryOptions.DelimiterWhitelist)).ToArray();
          }

          AddPeople(people, albumArtists, PersonKind.AlbumArtist);

          // Optionally prefer the non-standard multi-value ARTISTS tag over the ARTIST tag.
          string[]? performers = null;
          if (libraryOptions.PreferNonstandardArtistsTag)
          {
              track.AdditionalFields.TryGetValue("ARTISTS", out var artistsTagString);
              if (artistsTagString is not null)
              {
                  performers = artistsTagString.Split(InternalValueSeparator);
              }
          }

          if (performers is null || performers.Length == 0)
          {
              performers = string.IsNullOrEmpty(track.Artist) ? [] : track.Artist.Split(InternalValueSeparator);
          }

          if (libraryOptions.UseCustomTagDelimiters)
          {
              performers = performers.SelectMany(p => SplitWithCustomDelimiter(p, libraryOptions.GetCustomTagDelimiters(), libraryOptions.DelimiterWhitelist)).ToArray();
          }

          AddPeople(people, performers, PersonKind.Artist);
          AddPeople(people, track.Composer.Split(InternalValueSeparator), PersonKind.Composer);

          _libraryManager.UpdatePeople(audio, people);

          // When replacing all metadata, only overwrite with a non-empty list;
          // otherwise only fill in artists that are currently missing.
          if (options.ReplaceAllMetadata && performers.Length != 0)
          {
              audio.Artists = performers;
          }
          else if (!options.ReplaceAllMetadata
              && (audio.Artists is null || audio.Artists.Count == 0))
          {
              audio.Artists = performers;
          }

          if (albumArtists.Length == 0)
          {
              // Album artists not provided, fall back to performers (artists).
              albumArtists = performers;
          }

          if (options.ReplaceAllMetadata && albumArtists.Length != 0)
          {
              audio.AlbumArtists = albumArtists;
          }
          else if (!options.ReplaceAllMetadata
              && (audio.AlbumArtists is null || audio.AlbumArtists.Count == 0))
          {
              audio.AlbumArtists = albumArtists;
          }
      }

      if (!audio.LockedFields.Contains(MetadataField.Name) && !string.IsNullOrEmpty(trackTitle))
      {
          audio.Name = trackTitle;
      }

      if (options.ReplaceAllMetadata)
      {
          audio.Album = trackAlbum;
          audio.IndexNumber = trackTrackNumber;
          audio.ParentIndexNumber = trackDiscNumber;
      }
      else
      {
          audio.Album ??= trackAlbum;
          audio.IndexNumber ??= trackTrackNumber;
          audio.ParentIndexNumber ??= trackDiscNumber;
      }

      if (track.Date.HasValue)
      {
          audio.PremiereDate = track.Date;
      }

      if (trackYear.HasValue)
      {
          var year = trackYear.Value;
          audio.ProductionYear = year;

          // The ATL library handles this fallback with its own internal logic, but we also need to handle it here for the ffprobe fallbacks.
          if (!audio.PremiereDate.HasValue)
          {
              try
              {
                  audio.PremiereDate = new DateTime(year, 01, 01);
              }
              catch (ArgumentOutOfRangeException ex)
              {
                  _logger.LogError(ex, "Error parsing YEAR tag in {File}. '{TagValue}' is an invalid year", audio.Path, trackYear);
              }
          }
      }

      if (!audio.LockedFields.Contains(MetadataField.Genres))
      {
          var genres = string.IsNullOrEmpty(track.Genre) ? [] : track.Genre.Split(InternalValueSeparator).Distinct(StringComparer.OrdinalIgnoreCase).ToArray();

          if (libraryOptions.UseCustomTagDelimiters)
          {
              genres = genres.SelectMany(g => SplitWithCustomDelimiter(g, libraryOptions.GetCustomTagDelimiters(), libraryOptions.DelimiterWhitelist)).ToArray();
          }

          genres = genres.Trimmed().Distinct(StringComparer.OrdinalIgnoreCase).ToArray();

          audio.Genres = options.ReplaceAllMetadata || audio.Genres is null || audio.Genres.Length == 0
              ? genres
              : audio.Genres;
      }

      track.AdditionalFields.TryGetValue("REPLAYGAIN_TRACK_GAIN", out var trackGainTag);

      if (trackGainTag is not null)
      {
          // Strip a trailing "dB" unit before parsing the number.
          if (trackGainTag.EndsWith("db", StringComparison.OrdinalIgnoreCase))
          {
              trackGainTag = trackGainTag[..^2].Trim();
          }

          if (float.TryParse(trackGainTag, NumberStyles.Float, CultureInfo.InvariantCulture, out var value))
          {
              audio.NormalizationGain = value;
          }
      }

      SetFirstMusicBrainzId(MetadataProvider.MusicBrainzArtist, "MUSICBRAINZ_ARTISTID", "MusicBrainz Artist Id");
      SetFirstMusicBrainzId(MetadataProvider.MusicBrainzAlbumArtist, "MUSICBRAINZ_ALBUMARTISTID", "MusicBrainz Album Artist Id");
      SetFirstMusicBrainzId(MetadataProvider.MusicBrainzAlbum, "MUSICBRAINZ_ALBUMID", "MusicBrainz Album Id");
      SetFirstMusicBrainzId(MetadataProvider.MusicBrainzReleaseGroup, "MUSICBRAINZ_RELEASEGROUPID", "MusicBrainz Release Group Id");
      SetFirstMusicBrainzId(MetadataProvider.MusicBrainzTrack, "MUSICBRAINZ_RELEASETRACKID", "MusicBrainz Release Track Id");

      // The recording id is stored as-is (not split), with a UFID fallback.
      if (options.ReplaceAllMetadata || !audio.TryGetProviderId(MetadataProvider.MusicBrainzRecording, out _))
      {
          if ((track.AdditionalFields.TryGetValue("MUSICBRAINZ_TRACKID", out var recordingMbId)
              || track.AdditionalFields.TryGetValue("MusicBrainz Track Id", out recordingMbId))
              && !string.IsNullOrEmpty(recordingMbId))
          {
              audio.TrySetProviderId(MetadataProvider.MusicBrainzRecording, recordingMbId);
          }
          else if (track.AdditionalFields.TryGetValue("UFID", out var ufIdValue) && !string.IsNullOrEmpty(ufIdValue))
          {
              // If tagged with MB Picard, the format is 'http://musicbrainz.org\0<recording MBID>'
              if (ufIdValue.Contains("musicbrainz.org", StringComparison.OrdinalIgnoreCase))
              {
                  audio.TrySetProviderId(MetadataProvider.MusicBrainzRecording, ufIdValue.AsSpan().RightPart('\0').ToString());
              }
          }
      }

      // Save extracted lyrics if they exist,
      // and if the audio doesn't yet have lyrics.
      var lyrics = track.Lyrics.SynchronizedLyrics.Count > 0 ? track.Lyrics.FormatSynchToLRC() : track.Lyrics.UnsynchronizedLyrics;
      if (!string.IsNullOrWhiteSpace(lyrics)
          && tryExtractEmbeddedLyrics)
      {
          await _lyricManager.SaveLyricAsync(audio, "lrc", lyrics).ConfigureAwait(false);
      }

      // Adds every non-blank name to the people list, trimmed, with the given kind.
      static void AddPeople(List<PersonInfo> target, IEnumerable<string> names, PersonKind kind)
      {
          foreach (var name in names)
          {
              if (!string.IsNullOrWhiteSpace(name))
              {
                  PeopleHelper.AddPerson(target, new PersonInfo
                  {
                      Name = name.Trim(),
                      Type = kind
                  });
              }
          }
      }

      // Sets the provider id from the first value of the tag (looked up under either key),
      // unless the item already has that id and metadata is not being replaced.
      void SetFirstMusicBrainzId(MetadataProvider provider, string tagKey, string alternateTagKey)
      {
          if (!options.ReplaceAllMetadata && audio.TryGetProviderId(provider, out _))
          {
              return;
          }

          if ((track.AdditionalFields.TryGetValue(tagKey, out var tagValue)
              || track.AdditionalFields.TryGetValue(alternateTagKey, out tagValue))
              && !string.IsNullOrEmpty(tagValue))
          {
              var id = GetFirstMusicBrainzId(tagValue, libraryOptions.UseCustomTagDelimiters, libraryOptions.GetCustomTagDelimiters(), libraryOptions.DelimiterWhitelist);
              audio.TrySetProviderId(provider, id);
          }
      }
  }
  /// <summary>
  /// Resolves the external lyric streams of an audio item, stores their distinct paths on the item
  /// and appends the first resolved stream to <paramref name="currentStreams"/>.
  /// </summary>
  /// <param name="audio">The <see cref="Audio"/> whose lyric files are resolved.</param>
  /// <param name="currentStreams">The stream list to append the lyric stream to.</param>
  /// <param name="options">The <see cref="MetadataRefreshOptions"/> supplying the directory service.</param>
  private void AddExternalLyrics(
      Audio audio,
      List<MediaStream> currentStreams,
      MetadataRefreshOptions options)
  {
      // New streams are numbered after the highest index already in the list.
      var nextIndex = 0;
      if (currentStreams.Count != 0)
      {
          nextIndex = currentStreams.Max(stream => stream.Index) + 1;
      }

      var lyricStreams = _lyricResolver.GetExternalStreams(audio, nextIndex, options.DirectoryService, false);

      audio.LyricFiles = lyricStreams
          .Select(stream => stream.Path)
          .Distinct()
          .ToArray();

      // Only the first resolved lyric stream is added to the stream list.
      if (lyricStreams.Count > 0)
      {
          currentStreams.Add(lyricStreams[0]);
      }
  }
  /// <summary>
  /// Splits a tag value on the given delimiters while keeping whitelisted entries intact.
  /// </summary>
  /// <param name="val">The tag value to split.</param>
  /// <param name="tagDelimiters">The delimiter characters to split on.</param>
  /// <param name="whitelist">Entries that are taken out of the value before it is split.</param>
  /// <returns>The whitelisted entries found in the value, followed by the split remainder.</returns>
  private List<string> SplitWithCustomDelimiter(string val, char[] tagDelimiters, string[] whitelist)
  {
      var result = new List<string>();
      var remaining = val;

      foreach (var entry in whitelist)
      {
          if (string.IsNullOrWhiteSpace(entry))
          {
              continue;
          }

          // Remove the whitelisted entry (case-insensitively); if that changed the text,
          // the entry was present and is emitted as its own item.
          var stripped = remaining.Replace(entry, string.Empty, StringComparison.OrdinalIgnoreCase);
          if (!string.Equals(stripped, remaining, StringComparison.OrdinalIgnoreCase))
          {
              result.Add(entry);
          }

          remaining = stripped;
      }

      var splitOptions = StringSplitOptions.RemoveEmptyEntries | StringSplitOptions.TrimEntries;
      result.AddRange(remaining.Split(tagDelimiters, splitOptions).DistinctNames());

      return result;
  }
  // MusicBrainz ID tags can hold several values, so they have to be split.
  // The provider id can only hold a single ID, which is why only the first value is returned.
  private string? GetFirstMusicBrainzId(string tag, bool useCustomTagDelimiters, char[] tagDelimiters, string[] whitelist)
  {
      var firstValue = tag.Split(InternalValueSeparator).FirstOrDefault();

      if (firstValue is null || !useCustomTagDelimiters)
      {
          return firstValue;
      }

      // With custom delimiters enabled the first value may itself contain several IDs.
      return SplitWithCustomDelimiter(firstValue, tagDelimiters, whitelist).FirstOrDefault();
  }
  435. }
  436. }