12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901 |
- using MediaBrowser.Controller.Entities;
- using MediaBrowser.Controller.Entities.Audio;
- using MediaBrowser.Model.Entities;
- using MediaBrowser.Model.Logging;
- using System;
- using System.Collections.Generic;
- using System.Globalization;
- using System.IO;
- using System.Linq;
- using System.Text;
- using System.Threading;
- using System.Xml;
- namespace MediaBrowser.Controller.Providers
- {
- /// <summary>
- /// Provides a base class for parsing metadata xml
- /// </summary>
- /// <typeparam name="T"></typeparam>
- public class BaseItemXmlParser<T>
- where T : BaseItem, new()
- {
- /// <summary>
- /// Gets the logger that was handed to the constructor.
- /// </summary>
- protected ILogger Logger { get; private set; }
- /// <summary>
- /// Creates a new <see cref="BaseItemXmlParser{T}" /> and stores the supplied logger in <see cref="Logger" />.
- /// </summary>
- /// <param name="logger">The logger. It is stored as-is; no null check is performed.</param>
- public BaseItemXmlParser(ILogger logger)
- {
-     this.Logger = logger;
- }
- /// <summary>
- /// Fetches metadata for an item from one xml file
- /// </summary>
- /// <remarks>
- /// The item's taglines, studios, genres, people and tags are cleared before the file is read.
- /// The file is decoded as UTF-8.
- /// </remarks>
- /// <param name="item">The item to populate.</param>
- /// <param name="metadataFile">The path of the metadata file.</param>
- /// <param name="cancellationToken">The cancellation token; it is checked while the file is being read.</param>
- /// <exception cref="System.ArgumentNullException">
- /// <paramref name="item" /> is null, or <paramref name="metadataFile" /> is null or empty.
- /// </exception>
- public void Fetch(T item, string metadataFile, CancellationToken cancellationToken)
- {
-     if (item == null)
-     {
-         throw new ArgumentNullException("item");
-     }
-     // An empty path still raises ArgumentNullException, exactly as before, so existing catch blocks keep working
-     if (string.IsNullOrEmpty(metadataFile))
-     {
-         throw new ArgumentNullException("metadataFile");
-     }
-     var settings = new XmlReaderSettings
-     {
-         CheckCharacters = false,
-         IgnoreProcessingInstructions = true,
-         IgnoreComments = true,
-         ValidationType = ValidationType.None
-     };
-     // Start from empty collections; their values are added again while the xml is parsed
-     item.Taglines.Clear();
-     item.Studios.Clear();
-     item.Genres.Clear();
-     item.People.Clear();
-     item.Tags.Clear();
-     Fetch(item, metadataFile, settings, Encoding.UTF8, cancellationToken);
- }
- /// <summary>
- /// Opens the metadata file and passes every element below the root to <see cref="FetchDataFromXmlNode" />.
- /// </summary>
- /// <remarks>
- /// Most handlers leave the reader on the node that follows the element they consumed. When that node is
- /// itself an element (xml written without whitespace between siblings) it is processed directly instead of
- /// being stepped over by another <c>Read()</c>. A handler that does not move the reader is followed by a
- /// normal <c>Read()</c>, so overrides that leave an element untouched behave as they did before.
- /// </remarks>
- /// <param name="item">The item.</param>
- /// <param name="metadataFile">The metadata file.</param>
- /// <param name="settings">The settings.</param>
- /// <param name="encoding">The encoding.</param>
- /// <param name="cancellationToken">The cancellation token.</param>
- private void Fetch(T item, string metadataFile, XmlReaderSettings settings, Encoding encoding, CancellationToken cancellationToken)
- {
-     using (var streamReader = new StreamReader(metadataFile, encoding))
-     // Use XmlReader for best performance
-     using (var reader = XmlReader.Create(streamReader, settings))
-     {
-         // Line/column information is used to detect whether a handler moved the reader.
-         // Without it we fall back to always calling Read() after a handler.
-         var lineInfo = reader as IXmlLineInfo;
-         var canTrackPosition = lineInfo != null && lineInfo.HasLineInfo();
-         reader.MoveToContent();
-         var hasNode = reader.Read();
-         // Loop through each element
-         while (hasNode)
-         {
-             cancellationToken.ThrowIfCancellationRequested();
-             if (reader.NodeType != XmlNodeType.Element)
-             {
-                 hasNode = reader.Read();
-                 continue;
-             }
-             var line = canTrackPosition ? lineInfo.LineNumber : 0;
-             var column = canTrackPosition ? lineInfo.LinePosition : 0;
-             FetchDataFromXmlNode(reader, item);
-             // True when the handler advanced and the reader now sits on an element that has not been handled yet
-             var onUnvisitedElement = canTrackPosition
-                 && reader.NodeType == XmlNodeType.Element
-                 && (lineInfo.LineNumber != line || lineInfo.LinePosition != column);
-             if (!onUnvisitedElement)
-             {
-                 hasNode = reader.Read();
-             }
-         }
-     }
- }
- // Culture used when parsing numbers out of the xml
- private readonly CultureInfo _usCulture = new CultureInfo("en-US");
- /// <summary>
- /// Fetches metadata from one Xml Element
- /// </summary>
- /// <remarks>
- /// Dispatches on the element name. A recognised element is read into <paramref name="item" />;
- /// an unrecognised one is skipped together with its children.
- /// </remarks>
- /// <param name="reader">The reader, positioned on the element to process.</param>
- /// <param name="item">The item.</param>
- protected virtual void FetchDataFromXmlNode(XmlReader reader, T item)
- {
-     switch (reader.Name)
-     {
-         // DateCreated
-         case "Added":
-             {
-                 DateTime added;
-                 if (DateTime.TryParse(reader.ReadElementContentAsString() ?? string.Empty, out added))
-                 {
-                     item.DateCreated = added.ToUniversalTime();
-                 }
-                 break;
-             }
-         case "LocalTitle":
-             item.Name = reader.ReadElementContentAsString();
-             break;
-         case "Type":
-             {
-                 var type = ReadNonBlankContent(reader);
-                 if (type != null && !type.Equals("none", StringComparison.OrdinalIgnoreCase))
-                 {
-                     item.DisplayMediaType = type;
-                 }
-                 break;
-             }
-         case "CriticRating":
-             {
-                 float value;
-                 if (float.TryParse(reader.ReadElementContentAsString(), NumberStyles.Any, _usCulture, out value))
-                 {
-                     item.CriticRating = value;
-                 }
-                 break;
-             }
-         case "Budget":
-             {
-                 double value;
-                 if (double.TryParse(reader.ReadElementContentAsString(), NumberStyles.Any, _usCulture, out value))
-                 {
-                     item.Budget = value;
-                 }
-                 break;
-             }
-         case "Revenue":
-             {
-                 double value;
-                 if (double.TryParse(reader.ReadElementContentAsString(), NumberStyles.Any, _usCulture, out value))
-                 {
-                     item.Revenue = value;
-                 }
-                 break;
-             }
-         case "SortTitle":
-             item.ForcedSortName = reader.ReadElementContentAsString();
-             break;
-         case "Overview":
-         case "Description":
-             {
-                 var val = ReadNonBlankContent(reader);
-                 if (val != null)
-                 {
-                     item.Overview = val;
-                 }
-                 break;
-             }
-         case "CriticRatingSummary":
-             {
-                 var val = ReadNonBlankContent(reader);
-                 if (val != null)
-                 {
-                     item.CriticRatingSummary = val;
-                 }
-                 break;
-             }
-         case "TagLine":
-             {
-                 var tagline = ReadNonBlankContent(reader);
-                 if (tagline != null)
-                 {
-                     item.AddTagline(tagline);
-                 }
-                 break;
-             }
-         case "Website":
-             {
-                 var val = ReadNonBlankContent(reader);
-                 if (val != null)
-                 {
-                     item.HomePageUrl = val;
-                 }
-                 break;
-             }
-         case "TagLines":
-             ProcessSubtree(reader, item, FetchFromTaglinesNode);
-             break;
-         case "ContentRating":
-         case "certification":
-         case "MPAARating":
-             {
-                 var rating = ReadNonBlankContent(reader);
-                 if (rating != null)
-                 {
-                     item.OfficialRating = rating;
-                 }
-                 break;
-             }
-         case "MPAADescription":
-             {
-                 var rating = ReadNonBlankContent(reader);
-                 if (rating != null)
-                 {
-                     item.OfficialRatingDescription = rating;
-                 }
-                 break;
-             }
-         case "CustomRating":
-             {
-                 var val = ReadNonBlankContent(reader);
-                 if (val != null)
-                 {
-                     item.CustomRating = val;
-                 }
-                 break;
-             }
-         case "Runtime":
-         case "RunningTime":
-             {
-                 var text = ReadNonBlankContent(reader);
-                 int runtime;
-                 // Only the part before the first space is parsed; the value is treated as minutes
-                 if (text != null && int.TryParse(text.Split(' ')[0], NumberStyles.Integer, _usCulture, out runtime))
-                 {
-                     var ticks = TimeSpan.FromMinutes(runtime).Ticks;
-                     // For audio and video don't replace ffmpeg data
-                     if (item is Video || item is Audio)
-                     {
-                         item.OriginalRunTimeTicks = ticks;
-                     }
-                     else
-                     {
-                         item.RunTimeTicks = ticks;
-                     }
-                 }
-                 break;
-             }
-         case "Genre":
-             {
-                 foreach (var name in SplitNames(reader.ReadElementContentAsString()))
-                 {
-                     if (!string.IsNullOrWhiteSpace(name))
-                     {
-                         item.AddGenre(name);
-                     }
-                 }
-                 break;
-             }
-         case "AspectRatio":
-             {
-                 var val = ReadNonBlankContent(reader);
-                 if (val != null)
-                 {
-                     item.AspectRatio = val;
-                 }
-                 break;
-             }
-         case "LockData":
-             {
-                 var val = ReadNonBlankContent(reader);
-                 if (val != null)
-                 {
-                     item.DontFetchMeta = string.Equals("true", val, StringComparison.OrdinalIgnoreCase);
-                 }
-                 break;
-             }
-         case "Network":
-             {
-                 foreach (var name in SplitNames(reader.ReadElementContentAsString()))
-                 {
-                     if (!string.IsNullOrWhiteSpace(name))
-                     {
-                         item.AddStudio(name);
-                     }
-                 }
-                 break;
-             }
-         case "Director":
-             AddPeople(item, SplitNames(reader.ReadElementContentAsString()), PersonType.Director);
-             break;
-         case "Writer":
-             AddPeople(item, SplitNames(reader.ReadElementContentAsString()), PersonType.Writer);
-             break;
-         case "Actors":
-             {
-                 var actors = reader.ReadInnerXml();
-                 if (actors.Contains("<"))
-                 {
-                     // This is one of the mis-named "Actors" full nodes created by MB2
-                     // Wrap it in a Persons element and pass it to the persons node processor
-                     using (var personsReader = new XmlTextReader(new StringReader("<Persons>" + actors + "</Persons>")))
-                     {
-                         FetchDataFromPersonsNode(personsReader, item);
-                     }
-                 }
-                 else
-                 {
-                     // Old-style piped string
-                     AddPeople(item, SplitNames(actors), PersonType.Actor);
-                 }
-                 break;
-             }
-         case "GuestStars":
-             AddPeople(item, SplitNames(reader.ReadElementContentAsString()), PersonType.GuestStar);
-             break;
-         case "Trailer":
-             {
-                 var val = ReadNonBlankContent(reader);
-                 if (val != null)
-                 {
-                     item.AddTrailerUrl(val, false);
-                 }
-                 break;
-             }
-         case "ProductionYear":
-             {
-                 var val = ReadNonBlankContent(reader);
-                 int productionYear;
-                 // Parsed with the same fixed culture as the other numeric fields; years up to 1850 are ignored
-                 if (val != null && int.TryParse(val, NumberStyles.Integer, _usCulture, out productionYear) && productionYear > 1850)
-                 {
-                     item.ProductionYear = productionYear;
-                 }
-                 break;
-             }
-         case "Rating":
-         case "IMDBrating":
-             {
-                 var rating = ReadNonBlankContent(reader);
-                 float val;
-                 // All external meta is saving this as '.' for decimal I believe...but just to be sure
-                 if (rating != null && float.TryParse(rating.Replace(',', '.'), NumberStyles.AllowDecimalPoint, CultureInfo.InvariantCulture, out val))
-                 {
-                     item.CommunityRating = val;
-                 }
-                 break;
-             }
-         case "PremiereDate":
-         case "FirstAired":
-             {
-                 var firstAired = ReadNonBlankContent(reader);
-                 DateTime airDate;
-                 if (firstAired != null && DateTime.TryParse(firstAired, out airDate) && airDate.Year > 1850)
-                 {
-                     item.PremiereDate = airDate.ToUniversalTime();
-                     // The year is taken from the parsed value before the conversion to universal time
-                     item.ProductionYear = airDate.Year;
-                 }
-                 break;
-             }
-         case "MusicbrainzId":
-             {
-                 var mbz = ReadNonBlankContent(reader);
-                 if (mbz != null)
-                 {
-                     item.SetProviderId(MetadataProviders.Musicbrainz, mbz);
-                 }
-                 break;
-             }
-         case "RottenTomatoesId":
-             {
-                 var rtId = ReadNonBlankContent(reader);
-                 if (rtId != null)
-                 {
-                     item.SetProviderId(MetadataProviders.RottenTomatoes, rtId);
-                 }
-                 break;
-             }
-         case "TMDbId":
-             {
-                 var tmdb = ReadNonBlankContent(reader);
-                 if (tmdb != null)
-                 {
-                     item.SetProviderId(MetadataProviders.Tmdb, tmdb);
-                 }
-                 break;
-             }
-         case "CollectionNumber":
-             {
-                 var tmdbCollection = ReadNonBlankContent(reader);
-                 if (tmdbCollection != null)
-                 {
-                     item.SetProviderId(MetadataProviders.TmdbCollection, tmdbCollection);
-                 }
-                 break;
-             }
-         case "TVcomId":
-             {
-                 var tvcomId = ReadNonBlankContent(reader);
-                 if (tvcomId != null)
-                 {
-                     item.SetProviderId(MetadataProviders.Tvcom, tvcomId);
-                 }
-                 break;
-             }
-         case "IMDB_ID":
-         case "IMDB":
-         case "IMDbId":
-             {
-                 var imDbId = ReadNonBlankContent(reader);
-                 if (imDbId != null)
-                 {
-                     item.SetProviderId(MetadataProviders.Imdb, imDbId);
-                 }
-                 break;
-             }
-         case "Genres":
-             ProcessSubtree(reader, item, FetchFromGenresNode);
-             break;
-         case "Tags":
-             ProcessSubtree(reader, item, FetchFromTagsNode);
-             break;
-         case "Persons":
-             ProcessSubtree(reader, item, FetchDataFromPersonsNode);
-             break;
-         case "ParentalRating":
-             ProcessSubtree(reader, item, FetchFromParentalRatingNode);
-             break;
-         case "Studios":
-             ProcessSubtree(reader, item, FetchFromStudiosNode);
-             break;
-         case "MediaInfo":
-             ProcessSubtree(reader, item, FetchFromMediaInfoNode);
-             break;
-         default:
-             reader.Skip();
-             break;
-     }
- }
- /// <summary>
- /// Reads the current element's content as a string and returns null when it is empty or whitespace only.
- /// </summary>
- /// <param name="reader">The reader, positioned on the element to read.</param>
- /// <returns>The element content, or null if it is blank.</returns>
- private static string ReadNonBlankContent(XmlReader reader)
- {
-     var content = reader.ReadElementContentAsString();
-     return string.IsNullOrWhiteSpace(content) ? null : content;
- }
- /// <summary>
- /// Adds one person of the given type to the item for every non-blank name; names are trimmed first.
- /// </summary>
- /// <param name="item">The item.</param>
- /// <param name="names">The candidate names.</param>
- /// <param name="type">The person type assigned to every added person.</param>
- private static void AddPeople(T item, IEnumerable<string> names, string type)
- {
-     foreach (var name in names)
-     {
-         if (string.IsNullOrWhiteSpace(name))
-         {
-             continue;
-         }
-         item.AddPerson(new PersonInfo { Name = name.Trim(), Type = type });
-     }
- }
- /// <summary>
- /// Runs a node handler on a subtree reader for the current element and closes that reader afterwards.
- /// </summary>
- /// <remarks>
- /// The XmlReader.ReadSubtree documentation states that the original reader must not be used until the
- /// subtree reader has been closed, so the subtree reader is disposed before this method returns.
- /// </remarks>
- /// <param name="reader">The reader, positioned on the element whose subtree is processed.</param>
- /// <param name="item">The item.</param>
- /// <param name="handler">The handler that consumes the subtree.</param>
- private static void ProcessSubtree(XmlReader reader, T item, Action<XmlReader, T> handler)
- {
-     using (var subtree = reader.ReadSubtree())
-     {
-         handler(subtree, item);
-     }
- }
- /// <summary>
- /// Fetches from media info node.
- /// </summary>
- /// <remarks>
- /// Only <c>Video</c> children are processed; every other child element is skipped.
- /// </remarks>
- /// <param name="reader">The reader for the media info node.</param>
- /// <param name="item">The item.</param>
- private void FetchFromMediaInfoNode(XmlReader reader, T item)
- {
-     reader.MoveToContent();
-     reader.Read();
-     // Skip() leaves the reader on the node after the skipped element, so Read() is only called
-     // for non-element nodes. Calling it unconditionally would step over an adjacent sibling element.
-     while (!reader.EOF && reader.ReadState == ReadState.Interactive)
-     {
-         if (reader.NodeType != XmlNodeType.Element)
-         {
-             reader.Read();
-             continue;
-         }
-         switch (reader.Name)
-         {
-             case "Video":
-                 if (reader.IsEmptyElement)
-                 {
-                     // Nothing to parse; step past the empty element so the loop makes progress
-                     reader.Read();
-                 }
-                 else
-                 {
-                     // Closing the subtree reader leaves this reader on the Video end tag,
-                     // which the loop then steps past as a non-element node
-                     using (var subtree = reader.ReadSubtree())
-                     {
-                         FetchFromMediaInfoVideoNode(subtree, item);
-                     }
-                 }
-                 break;
-             default:
-                 reader.Skip();
-                 break;
-         }
-     }
- }
- /// <summary>
- /// Fetches from media info video node.
- /// </summary>
- /// <remarks>
- /// Reads <c>Video3DFormat</c> and, when the item is a <see cref="Video" />, maps the codes
- /// HSBS, HTAB, FTAB and FSBS to the matching 3D format. Other values leave the item unchanged.
- /// </remarks>
- /// <param name="reader">The reader for the video node.</param>
- /// <param name="item">The item.</param>
- private void FetchFromMediaInfoVideoNode(XmlReader reader, T item)
- {
-     reader.MoveToContent();
-     reader.Read();
-     // Every case below consumes its element, so Read() is only called for non-element nodes.
-     // Calling it unconditionally would step over an adjacent sibling element.
-     while (!reader.EOF && reader.ReadState == ReadState.Interactive)
-     {
-         if (reader.NodeType != XmlNodeType.Element)
-         {
-             reader.Read();
-             continue;
-         }
-         switch (reader.Name)
-         {
-             case "Video3DFormat":
-                 {
-                     // Always read the value, even for non-video items, so the reader moves on
-                     var val = reader.ReadElementContentAsString();
-                     var video = item as Video;
-                     if (video != null)
-                     {
-                         switch (val)
-                         {
-                             case "HSBS":
-                                 video.Video3DFormat = Video3DFormat.HalfSideBySide;
-                                 break;
-                             case "HTAB":
-                                 video.Video3DFormat = Video3DFormat.HalfTopAndBottom;
-                                 break;
-                             case "FTAB":
-                                 video.Video3DFormat = Video3DFormat.FullTopAndBottom;
-                                 break;
-                             case "FSBS":
-                                 video.Video3DFormat = Video3DFormat.FullSideBySide;
-                                 break;
-                         }
-                     }
-                     break;
-                 }
-             default:
-                 reader.Skip();
-                 break;
-         }
-     }
- }
- /// <summary>
- /// Fetches from taglines node.
- /// </summary>
- /// <remarks>
- /// Adds every non-blank <c>Tagline</c> child to the item; other child elements are skipped.
- /// </remarks>
- /// <param name="reader">The reader for the taglines node.</param>
- /// <param name="item">The item.</param>
- private void FetchFromTaglinesNode(XmlReader reader, T item)
- {
-     reader.MoveToContent();
-     reader.Read();
-     // Both cases below leave the reader on the node after the element they consumed, so Read() is
-     // only called for non-element nodes. Otherwise an adjacent sibling element would be stepped over.
-     while (!reader.EOF && reader.ReadState == ReadState.Interactive)
-     {
-         if (reader.NodeType != XmlNodeType.Element)
-         {
-             reader.Read();
-             continue;
-         }
-         switch (reader.Name)
-         {
-             case "Tagline":
-                 {
-                     var val = reader.ReadElementContentAsString();
-                     if (!string.IsNullOrWhiteSpace(val))
-                     {
-                         item.AddTagline(val);
-                     }
-                     break;
-                 }
-             default:
-                 reader.Skip();
-                 break;
-         }
-     }
- }
- /// <summary>
- /// Fetches from genres node.
- /// </summary>
- /// <remarks>
- /// Adds every non-blank <c>Genre</c> child to the item; other child elements are skipped.
- /// </remarks>
- /// <param name="reader">The reader for the genres node.</param>
- /// <param name="item">The item.</param>
- private void FetchFromGenresNode(XmlReader reader, T item)
- {
-     reader.MoveToContent();
-     reader.Read();
-     // Both cases below leave the reader on the node after the element they consumed, so Read() is
-     // only called for non-element nodes. Otherwise an adjacent sibling element would be stepped over.
-     while (!reader.EOF && reader.ReadState == ReadState.Interactive)
-     {
-         if (reader.NodeType != XmlNodeType.Element)
-         {
-             reader.Read();
-             continue;
-         }
-         switch (reader.Name)
-         {
-             case "Genre":
-                 {
-                     var genre = reader.ReadElementContentAsString();
-                     if (!string.IsNullOrWhiteSpace(genre))
-                     {
-                         item.AddGenre(genre);
-                     }
-                     break;
-                 }
-             default:
-                 reader.Skip();
-                 break;
-         }
-     }
- }
- /// <summary>
- /// Fetches from tags node.
- /// </summary>
- /// <remarks>
- /// Adds every non-blank <c>Tag</c> child to the item; other child elements are skipped.
- /// </remarks>
- /// <param name="reader">The reader for the tags node.</param>
- /// <param name="item">The item.</param>
- private void FetchFromTagsNode(XmlReader reader, T item)
- {
-     reader.MoveToContent();
-     reader.Read();
-     // Both cases below leave the reader on the node after the element they consumed, so Read() is
-     // only called for non-element nodes. Otherwise an adjacent sibling element would be stepped over.
-     while (!reader.EOF && reader.ReadState == ReadState.Interactive)
-     {
-         if (reader.NodeType != XmlNodeType.Element)
-         {
-             reader.Read();
-             continue;
-         }
-         switch (reader.Name)
-         {
-             case "Tag":
-                 {
-                     var tag = reader.ReadElementContentAsString();
-                     if (!string.IsNullOrWhiteSpace(tag))
-                     {
-                         item.AddTag(tag);
-                     }
-                     break;
-                 }
-             default:
-                 reader.Skip();
-                 break;
-         }
-     }
- }
- /// <summary>
- /// Fetches the data from persons node.
- /// </summary>
- /// <remarks>
- /// Every <c>Person</c> or <c>Actor</c> child is parsed and the resulting people are added to the item;
- /// other child elements are skipped.
- /// </remarks>
- /// <param name="reader">The reader for the persons node.</param>
- /// <param name="item">The item.</param>
- private void FetchDataFromPersonsNode(XmlReader reader, T item)
- {
-     reader.MoveToContent();
-     reader.Read();
-     // Skip() leaves the reader on the node after the skipped element, so Read() is only called
-     // for non-element nodes. Calling it unconditionally would step over an adjacent sibling element.
-     while (!reader.EOF && reader.ReadState == ReadState.Interactive)
-     {
-         if (reader.NodeType != XmlNodeType.Element)
-         {
-             reader.Read();
-             continue;
-         }
-         switch (reader.Name)
-         {
-             case "Person":
-             case "Actor":
-                 if (reader.IsEmptyElement)
-                 {
-                     // No child data to read; step past the empty element so the loop makes progress
-                     reader.Read();
-                 }
-                 else
-                 {
-                     // Closing the subtree reader leaves this reader on the element's end tag,
-                     // which the loop then steps past as a non-element node
-                     using (var subtree = reader.ReadSubtree())
-                     {
-                         foreach (var person in GetPersonsFromXmlNode(subtree))
-                         {
-                             item.AddPerson(person);
-                         }
-                     }
-                 }
-                 break;
-             default:
-                 reader.Skip();
-                 break;
-         }
-     }
- }
- /// <summary>
- /// Fetches from studios node.
- /// </summary>
- /// <remarks>
- /// Adds every non-blank <c>Studio</c> child to the item; other child elements are skipped.
- /// </remarks>
- /// <param name="reader">The reader for the studios node.</param>
- /// <param name="item">The item.</param>
- private void FetchFromStudiosNode(XmlReader reader, T item)
- {
-     reader.MoveToContent();
-     reader.Read();
-     // Both cases below leave the reader on the node after the element they consumed, so Read() is
-     // only called for non-element nodes. Otherwise an adjacent sibling element would be stepped over.
-     while (!reader.EOF && reader.ReadState == ReadState.Interactive)
-     {
-         if (reader.NodeType != XmlNodeType.Element)
-         {
-             reader.Read();
-             continue;
-         }
-         switch (reader.Name)
-         {
-             case "Studio":
-                 {
-                     var studio = reader.ReadElementContentAsString();
-                     if (!string.IsNullOrWhiteSpace(studio))
-                     {
-                         item.AddStudio(studio);
-                     }
-                     break;
-                 }
-             default:
-                 reader.Skip();
-                 break;
-         }
-     }
- }
- /// <summary>
- /// Walks the parental rating node without storing anything on the item.
- /// </summary>
- /// <remarks>
- /// Every child element is currently skipped, so <paramref name="item" /> is not modified.
- /// </remarks>
- /// <param name="reader">The reader for the parental rating node.</param>
- /// <param name="item">The item (unused at present).</param>
- private void FetchFromParentalRatingNode(XmlReader reader, T item)
- {
-     reader.MoveToContent();
-     while (reader.Read())
-     {
-         if (reader.NodeType != XmlNodeType.Element)
-         {
-             continue;
-         }
-         // Removed support for "Value" tag as it conflicted with MPAA rating but leaving this function for possible
-         // future support of "Description" -ebr
-         reader.Skip();
-     }
- }
- /// <summary>
- /// Gets the persons from XML node.
- /// </summary>
- /// <remarks>
- /// Collects the names from every <c>Name</c> child (split with <see cref="SplitNames" />) together with the
- /// last non-blank <c>Type</c> and <c>Role</c> values. The type defaults to "Actor" and the role to an empty string.
- /// </remarks>
- /// <param name="reader">The reader for a single person node.</param>
- /// <returns>One <see cref="PersonInfo" /> per collected name, all sharing the same role and type.</returns>
- private IEnumerable<PersonInfo> GetPersonsFromXmlNode(XmlReader reader)
- {
-     var names = new List<string>();
-     var type = "Actor"; // If type is not specified assume actor
-     var role = string.Empty;
-     reader.MoveToContent();
-     reader.Read();
-     // Every case below leaves the reader on the node after the element it consumed, so Read() is
-     // only called for non-element nodes. Otherwise an adjacent sibling element would be stepped over.
-     while (!reader.EOF && reader.ReadState == ReadState.Interactive)
-     {
-         if (reader.NodeType != XmlNodeType.Element)
-         {
-             reader.Read();
-             continue;
-         }
-         switch (reader.Name)
-         {
-             case "Name":
-                 names.AddRange(SplitNames(reader.ReadElementContentAsString()));
-                 break;
-             case "Type":
-                 {
-                     var val = reader.ReadElementContentAsString();
-                     if (!string.IsNullOrWhiteSpace(val))
-                     {
-                         type = val;
-                     }
-                     break;
-                 }
-             case "Role":
-                 {
-                     var val = reader.ReadElementContentAsString();
-                     if (!string.IsNullOrWhiteSpace(val))
-                     {
-                         role = val;
-                     }
-                     break;
-                 }
-             default:
-                 reader.Skip();
-                 break;
-         }
-     }
-     return names.Select(n => new PersonInfo { Name = n, Role = role, Type = type });
- }
- /// <summary>
- /// Used to split names of comma or pipe delimited genres and people
- /// </summary>
- /// <remarks>
- /// When the value contains a pipe or a semicolon, only those two characters act as separators.
- /// Otherwise the value is split on commas. Each entry is trimmed and blank entries are dropped.
- /// </remarks>
- /// <param name="value">The value; null is treated as empty.</param>
- /// <returns>The trimmed, non-empty names in their original order.</returns>
- private IEnumerable<string> SplitNames(string value)
- {
-     if (string.IsNullOrWhiteSpace(value))
-     {
-         return new string[] { };
-     }
-     // Only split by comma if there is no pipe or semicolon in the string
-     // We have to be careful to not split names like Matthew, Jr.
-     var hasPipeOrSemicolon = value.IndexOf('|') != -1 || value.IndexOf(';') != -1;
-     var separators = hasPipeOrSemicolon ? new[] { '|', ';' } : new[] { ',' };
-     // Trim each entry so that "A, B" yields "B" rather than " B"
-     return Split(value, separators, StringSplitOptions.RemoveEmptyEntries)
-         .Select(name => name.Trim())
-         .Where(name => name.Length > 0)
-         .ToArray();
- }
- /// <summary>
- /// Provides an additional overload for string.split
- /// </summary>
- /// <param name="val">The val.</param>
- /// <param name="separators">The separators.</param>
- /// <param name="options">The options.</param>
- /// <returns>The substrings of <paramref name="val" /> delimited by the separators.</returns>
- private static string[] Split(string val, char[] separators, StringSplitOptions options)
- {
-     return val.Split(separators, options);
- }
- }
- }
|