BaseItemXmlParser.cs 24 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715
  1. using System.Globalization;
  2. using System.IO;
  3. using MediaBrowser.Controller.Entities;
  4. using MediaBrowser.Model.Entities;
  5. using MediaBrowser.Model.Logging;
  6. using System;
  7. using System.Collections.Generic;
  8. using System.Linq;
  9. using System.Threading;
  10. using System.Xml;
  11. namespace MediaBrowser.Controller.Providers
  12. {
  13. /// <summary>
  14. /// Provides a base class for parsing metadata xml
  15. /// </summary>
  16. /// <typeparam name="T"></typeparam>
  17. public class BaseItemXmlParser<T>
  18. where T : BaseItem, new()
  19. {
  /// <summary>
  /// Gets the logger that was supplied to the constructor. Readable by derived parsers,
  /// assignable only from within this class.
  /// </summary>
  /// <value>The logger.</value>
  protected ILogger Logger { get; private set; }

  /// <summary>
  /// Creates a parser that keeps the given logger in <see cref="Logger" />.
  /// </summary>
  /// <param name="logger">The logger to store; it is not validated here.</param>
  public BaseItemXmlParser(ILogger logger)
  {
      this.Logger = logger;
  }
  /// <summary>
  /// Populates an item with the metadata stored in a single xml file.
  /// </summary>
  /// <remarks>
  /// The item's taglines, studios, genres and people are cleared before the file is opened,
  /// then every element below the root is handed to <see cref="FetchDataFromXmlNode" />.
  /// </remarks>
  /// <param name="item">The item to populate.</param>
  /// <param name="metadataFile">The metadata file, passed as-is to <c>XmlReader.Create</c>.</param>
  /// <param name="cancellationToken">Checked once per node while the file is being read.</param>
  /// <exception cref="System.ArgumentNullException">
  /// <paramref name="item" /> is null, or <paramref name="metadataFile" /> is null or empty.
  /// </exception>
  public void Fetch(T item, string metadataFile, CancellationToken cancellationToken)
  {
      if (item == null)
      {
          throw new ArgumentNullException("item");
      }

      if (string.IsNullOrEmpty(metadataFile))
      {
          // Kept as ArgumentNullException (also for the empty string) so existing catch blocks still match.
          throw new ArgumentNullException("metadataFile");
      }

      var settings = new XmlReaderSettings
      {
          CheckCharacters = false,
          IgnoreProcessingInstructions = true,
          IgnoreComments = true,
          ValidationType = ValidationType.None
      };

      // Start from a clean slate so values from a previous fetch are not duplicated.
      item.Taglines.Clear();
      item.Studios.Clear();
      item.Genres.Clear();
      item.People.Clear();

      // Use XmlReader for best performance
      using (var reader = XmlReader.Create(metadataFile, settings))
      {
          // Line information lets us tell whether a handler consumed the element it was given.
          var lineInfo = reader as IXmlLineInfo;
          var canTrackPosition = lineInfo != null && lineInfo.HasLineInfo();

          // Position on the root element, then step onto its first child node.
          reader.MoveToContent();
          reader.Read();

          while (reader.ReadState == ReadState.Interactive)
          {
              cancellationToken.ThrowIfCancellationRequested();

              if (reader.NodeType != XmlNodeType.Element)
              {
                  reader.Read();
                  continue;
              }

              var line = canTrackPosition ? lineInfo.LineNumber : 0;
              var column = canTrackPosition ? lineInfo.LinePosition : 0;

              FetchDataFromXmlNode(reader, item);

              if (!canTrackPosition)
              {
                  // Without position info we cannot tell whether the handler advanced,
                  // so keep the historical "always read one more node" behaviour.
                  reader.Read();
              }
              else if (reader.NodeType == XmlNodeType.Element
                  && lineInfo.LineNumber == line
                  && lineInfo.LinePosition == column)
              {
                  // The handler left the reader on the element it was given (for example an
                  // empty element read through ReadSubtree); step off it to guarantee progress.
                  reader.Read();
              }

              // Otherwise the handler already moved the reader (ReadElementContentAsString,
              // ReadInnerXml and Skip all land on the node after the end tag). Reading again here
              // would silently drop the next element when no whitespace separates the siblings.
          }
      }
  }
  /// <summary>
  /// Culture used when parsing numeric values from the xml. User overrides are disabled so
  /// that customised regional settings on the host cannot change the expected number format.
  /// </summary>
  private readonly CultureInfo _usCulture = new CultureInfo("en-US", false);
  /// <summary>
  /// Applies the xml element the reader is currently positioned on to the item.
  /// </summary>
  /// <remarks>
  /// The element name selects the property to fill. Every branch reads or skips the content of
  /// the current element; element names that are not recognised are skipped entirely.
  /// Numeric values are parsed with a fixed culture so the result does not depend on the
  /// regional settings of the machine.
  /// </remarks>
  /// <param name="reader">The reader, positioned on an element node.</param>
  /// <param name="item">The item to update.</param>
  protected virtual void FetchDataFromXmlNode(XmlReader reader, T item)
  {
      switch (reader.Name)
      {
          // DateCreated
          case "Added":
          {
              DateTime added;

              // NOTE(review): dates are parsed with the current culture - confirm that matches how the files are written.
              if (DateTime.TryParse(reader.ReadElementContentAsString() ?? string.Empty, out added))
              {
                  item.DateCreated = added.ToUniversalTime();
              }
              break;
          }

          case "LocalTitle":
          {
              item.Name = reader.ReadElementContentAsString();
              break;
          }

          case "Type":
          {
              var type = reader.ReadElementContentAsString();

              // The literal "none" (any casing) means no display media type.
              if (!string.IsNullOrWhiteSpace(type) && !type.Equals("none", StringComparison.OrdinalIgnoreCase))
              {
                  item.DisplayMediaType = type;
              }
              break;
          }

          case "Budget":
          {
              var text = reader.ReadElementContentAsString();
              double value;

              if (double.TryParse(text, NumberStyles.Any, _usCulture, out value))
              {
                  item.Budget = value;
              }
              break;
          }

          case "Revenue":
          {
              var text = reader.ReadElementContentAsString();
              double value;

              if (double.TryParse(text, NumberStyles.Any, _usCulture, out value))
              {
                  item.Revenue = value;
              }
              break;
          }

          case "SortTitle":
          {
              item.ForcedSortName = reader.ReadElementContentAsString();
              break;
          }

          case "Overview":
          case "Description":
          {
              // ReadInnerXml keeps any markup inside the element as raw text.
              item.Overview = reader.ReadInnerXml();
              break;
          }

          case "TagLine":
          {
              var tagline = reader.ReadElementContentAsString();

              if (!string.IsNullOrWhiteSpace(tagline))
              {
                  item.AddTagline(tagline);
              }
              break;
          }

          case "Website":
          {
              var val = reader.ReadElementContentAsString();

              if (!string.IsNullOrWhiteSpace(val))
              {
                  item.HomePageUrl = val;
              }
              break;
          }

          case "TagLines":
          {
              using (var subtree = reader.ReadSubtree())
              {
                  FetchFromTaglinesNode(subtree, item);
              }
              break;
          }

          case "ContentRating":
          case "certification":
          case "MPAARating":
          {
              var rating = reader.ReadElementContentAsString();

              if (!string.IsNullOrWhiteSpace(rating))
              {
                  item.OfficialRating = rating;
              }
              break;
          }

          case "CustomRating":
          {
              var val = reader.ReadElementContentAsString();

              if (!string.IsNullOrWhiteSpace(val))
              {
                  item.CustomRating = val;
              }
              break;
          }

          case "Runtime":
          case "RunningTime":
          {
              var text = reader.ReadElementContentAsString();

              if (!string.IsNullOrWhiteSpace(text))
              {
                  int runtime;

                  // Only the first space-delimited token is parsed, so any text after a space is ignored.
                  // Trim first so leading whitespace does not produce an empty first token.
                  if (int.TryParse(text.Trim().Split(' ')[0], NumberStyles.Integer, _usCulture, out runtime))
                  {
                      // The value is interpreted as minutes.
                      item.RunTimeTicks = TimeSpan.FromMinutes(runtime).Ticks;
                  }
              }
              break;
          }

          case "Genre":
          {
              foreach (var name in SplitNames(reader.ReadElementContentAsString()))
              {
                  if (!string.IsNullOrWhiteSpace(name))
                  {
                      item.AddGenre(name);
                  }
              }
              break;
          }

          case "AspectRatio":
          {
              var val = reader.ReadElementContentAsString();

              if (!string.IsNullOrWhiteSpace(val))
              {
                  item.AspectRatio = val;
              }
              break;
          }

          case "Network":
          {
              foreach (var name in SplitNames(reader.ReadElementContentAsString()))
              {
                  if (!string.IsNullOrWhiteSpace(name))
                  {
                      item.AddStudio(name);
                  }
              }
              break;
          }

          case "Director":
          {
              foreach (var p in SplitNames(reader.ReadElementContentAsString()).Select(v => new PersonInfo { Name = v, Type = PersonType.Director }))
              {
                  if (!string.IsNullOrWhiteSpace(p.Name))
                  {
                      item.AddPerson(p);
                  }
              }
              break;
          }

          case "Writer":
          {
              foreach (var p in SplitNames(reader.ReadElementContentAsString()).Select(v => new PersonInfo { Name = v, Type = PersonType.Writer }))
              {
                  if (!string.IsNullOrWhiteSpace(p.Name))
                  {
                      item.AddPerson(p);
                  }
              }
              break;
          }

          case "Actors":
          {
              var actors = reader.ReadInnerXml();

              if (actors.Contains("<"))
              {
                  // This is one of the mis-named "Actors" full nodes created by MB2.
                  // Wrap the markup in a Persons element and hand it to the persons node processor.
                  using (var personsReader = new XmlTextReader(new StringReader("<Persons>" + actors + "</Persons>")))
                  {
                      FetchDataFromPersonsNode(personsReader, item);
                  }
              }
              else
              {
                  // Old-style piped string
                  foreach (var p in SplitNames(actors).Select(v => new PersonInfo { Name = v.Trim(), Type = PersonType.Actor }))
                  {
                      if (!string.IsNullOrWhiteSpace(p.Name))
                      {
                          item.AddPerson(p);
                      }
                  }
              }
              break;
          }

          case "GuestStars":
          {
              foreach (var p in SplitNames(reader.ReadElementContentAsString()).Select(v => new PersonInfo { Name = v.Trim(), Type = PersonType.GuestStar }))
              {
                  if (!string.IsNullOrWhiteSpace(p.Name))
                  {
                      item.AddPerson(p);
                  }
              }
              break;
          }

          case "Trailer":
          {
              // The value is currently not stored anywhere; the element is still read so the
              // reader moves past it exactly as it does for every other known element.
              reader.ReadElementContentAsString();
              break;
          }

          case "ProductionYear":
          {
              var val = reader.ReadElementContentAsString();

              if (!string.IsNullOrWhiteSpace(val))
              {
                  int productionYear;

                  // Years of 1850 or earlier are treated as invalid and ignored.
                  if (int.TryParse(val, NumberStyles.Integer, _usCulture, out productionYear) && productionYear > 1850)
                  {
                      item.ProductionYear = productionYear;
                  }
              }
              break;
          }

          case "Rating":
          case "IMDBrating":
          {
              var rating = reader.ReadElementContentAsString();

              if (!string.IsNullOrWhiteSpace(rating))
              {
                  float communityRating;

                  // Parse with the fixed culture (as Budget/Revenue do): with the current culture
                  // a value such as "7.5" is misread on machines that use ',' as decimal separator.
                  if (float.TryParse(rating, NumberStyles.Float, _usCulture, out communityRating))
                  {
                      item.CommunityRating = communityRating;
                  }
              }
              break;
          }

          case "FirstAired":
          {
              var firstAired = reader.ReadElementContentAsString();

              if (!string.IsNullOrWhiteSpace(firstAired))
              {
                  DateTime airDate;

                  // NOTE(review): parsed with the current culture - confirm that matches how the files are written.
                  if (DateTime.TryParse(firstAired, out airDate) && airDate.Year > 1850)
                  {
                      item.PremiereDate = airDate.ToUniversalTime();
                      item.ProductionYear = airDate.Year;
                  }
              }
              break;
          }

          case "TMDbId":
          {
              var tmdbId = reader.ReadElementContentAsString();

              if (!string.IsNullOrWhiteSpace(tmdbId))
              {
                  item.SetProviderId(MetadataProviders.Tmdb, tmdbId);
              }
              break;
          }

          case "TVcomId":
          {
              var tvcomId = reader.ReadElementContentAsString();

              if (!string.IsNullOrWhiteSpace(tvcomId))
              {
                  item.SetProviderId(MetadataProviders.Tvcom, tvcomId);
              }
              break;
          }

          case "IMDB_ID":
          case "IMDB":
          case "IMDbId":
          {
              var imdbId = reader.ReadElementContentAsString();

              if (!string.IsNullOrWhiteSpace(imdbId))
              {
                  item.SetProviderId(MetadataProviders.Imdb, imdbId);
              }
              break;
          }

          case "Genres":
          {
              using (var subtree = reader.ReadSubtree())
              {
                  FetchFromGenresNode(subtree, item);
              }
              break;
          }

          case "Persons":
          {
              using (var subtree = reader.ReadSubtree())
              {
                  FetchDataFromPersonsNode(subtree, item);
              }
              break;
          }

          case "ParentalRating":
          {
              using (var subtree = reader.ReadSubtree())
              {
                  FetchFromParentalRatingNode(subtree, item);
              }
              break;
          }

          case "Studios":
          {
              using (var subtree = reader.ReadSubtree())
              {
                  FetchFromStudiosNode(subtree, item);
              }
              break;
          }

          default:
          {
              reader.Skip();
              break;
          }
      }
  }
  /// <summary>
  /// Adds every non-blank <c>Tagline</c> child of a taglines node to the item.
  /// </summary>
  /// <param name="reader">A reader whose first content node is the taglines element.</param>
  /// <param name="item">The item that receives the taglines.</param>
  private void FetchFromTaglinesNode(XmlReader reader, T item)
  {
      // Position on the container element, then step onto its first child node.
      reader.MoveToContent();
      reader.Read();

      // Both branches of the switch leave the reader on the node that follows the element they
      // handled, so the loop only advances explicitly for non-element nodes. Calling Read()
      // unconditionally would skip a sibling that directly follows an end tag.
      while (reader.ReadState == ReadState.Interactive)
      {
          if (reader.NodeType != XmlNodeType.Element)
          {
              reader.Read();
              continue;
          }

          switch (reader.Name)
          {
              case "Tagline":
              {
                  var val = reader.ReadElementContentAsString();

                  if (!string.IsNullOrWhiteSpace(val))
                  {
                      item.AddTagline(val);
                  }
                  break;
              }

              default:
                  reader.Skip();
                  break;
          }
      }
  }
  /// <summary>
  /// Adds every non-blank <c>Genre</c> child of a genres node to the item.
  /// </summary>
  /// <param name="reader">A reader whose first content node is the genres element.</param>
  /// <param name="item">The item that receives the genres.</param>
  private void FetchFromGenresNode(XmlReader reader, T item)
  {
      // Position on the container element, then step onto its first child node.
      reader.MoveToContent();
      reader.Read();

      // Both branches of the switch leave the reader on the node that follows the element they
      // handled, so the loop only advances explicitly for non-element nodes. Calling Read()
      // unconditionally would skip a sibling that directly follows an end tag.
      while (reader.ReadState == ReadState.Interactive)
      {
          if (reader.NodeType != XmlNodeType.Element)
          {
              reader.Read();
              continue;
          }

          switch (reader.Name)
          {
              case "Genre":
              {
                  var genre = reader.ReadElementContentAsString();

                  if (!string.IsNullOrWhiteSpace(genre))
                  {
                      item.AddGenre(genre);
                  }
                  break;
              }

              default:
                  reader.Skip();
                  break;
          }
      }
  }
  /// <summary>
  /// Adds the people described by the <c>Person</c> and <c>Actor</c> children of a persons node to the item.
  /// </summary>
  /// <param name="reader">A reader whose first content node is the persons element.</param>
  /// <param name="item">The item that receives the people.</param>
  private void FetchDataFromPersonsNode(XmlReader reader, T item)
  {
      // Position on the container element, then step onto its first child node.
      reader.MoveToContent();
      reader.Read();

      // Each branch below leaves the reader on the node that follows the element it handled,
      // so the loop only advances explicitly for non-element nodes. Calling Read()
      // unconditionally would skip a sibling that directly follows an end tag.
      while (reader.ReadState == ReadState.Interactive)
      {
          if (reader.NodeType != XmlNodeType.Element)
          {
              reader.Read();
              continue;
          }

          switch (reader.Name)
          {
              case "Person":
              case "Actor":
              {
                  using (var personReader = reader.ReadSubtree())
                  {
                      foreach (var person in GetPersonsFromXmlNode(personReader))
                      {
                          item.AddPerson(person);
                      }
                  }

                  // Once the subtree reader is closed, this reader sits on the end tag of the
                  // person element (or on the element itself when it is empty); step past it.
                  reader.Read();
                  break;
              }

              default:
                  reader.Skip();
                  break;
          }
      }
  }
  /// <summary>
  /// Adds every non-blank <c>Studio</c> child of a studios node to the item.
  /// </summary>
  /// <param name="reader">A reader whose first content node is the studios element.</param>
  /// <param name="item">The item that receives the studios.</param>
  private void FetchFromStudiosNode(XmlReader reader, T item)
  {
      // Position on the container element, then step onto its first child node.
      reader.MoveToContent();
      reader.Read();

      // Both branches of the switch leave the reader on the node that follows the element they
      // handled, so the loop only advances explicitly for non-element nodes. Calling Read()
      // unconditionally would skip a sibling that directly follows an end tag.
      while (reader.ReadState == ReadState.Interactive)
      {
          if (reader.NodeType != XmlNodeType.Element)
          {
              reader.Read();
              continue;
          }

          switch (reader.Name)
          {
              case "Studio":
              {
                  var studio = reader.ReadElementContentAsString();

                  if (!string.IsNullOrWhiteSpace(studio))
                  {
                      item.AddStudio(studio);
                  }
                  break;
              }

              default:
                  reader.Skip();
                  break;
          }
      }
  }
  /// <summary>
  /// Translates the numeric <c>Value</c> child of a parental rating node into an official rating string.
  /// </summary>
  /// <remarks>
  /// Known codes: -1 = NR, 0 = UR, 1 = G, 3 = PG, 4 = PG-13, 5 = NC-17, 6 = R. A blank value,
  /// a value that is not an integer, or any other number leaves the item's rating untouched.
  /// </remarks>
  /// <param name="reader">A reader whose first content node is the parental rating element.</param>
  /// <param name="item">The item whose official rating is set.</param>
  private void FetchFromParentalRatingNode(XmlReader reader, T item)
  {
      // Position on the container element, then step onto its first child node.
      reader.MoveToContent();
      reader.Read();

      // Both branches of the outer switch leave the reader on the node that follows the
      // element they handled, so the loop only advances explicitly for non-element nodes.
      while (reader.ReadState == ReadState.Interactive)
      {
          if (reader.NodeType != XmlNodeType.Element)
          {
              reader.Read();
              continue;
          }

          switch (reader.Name)
          {
              case "Value":
              {
                  var ratingString = reader.ReadElementContentAsString();
                  int rating;

                  // Only map the code when it really is a number: a failed TryParse sets the
                  // out value to 0, which would otherwise be stored as "UR".
                  if (string.IsNullOrWhiteSpace(ratingString)
                      || !int.TryParse(ratingString, NumberStyles.Integer, _usCulture, out rating))
                  {
                      break;
                  }

                  switch (rating)
                  {
                      case -1:
                          item.OfficialRating = "NR";
                          break;
                      case 0:
                          item.OfficialRating = "UR";
                          break;
                      case 1:
                          item.OfficialRating = "G";
                          break;
                      case 3:
                          item.OfficialRating = "PG";
                          break;
                      case 4:
                          item.OfficialRating = "PG-13";
                          break;
                      case 5:
                          item.OfficialRating = "NC-17";
                          break;
                      case 6:
                          item.OfficialRating = "R";
                          break;
                  }
                  break;
              }

              default:
                  reader.Skip();
                  break;
          }
      }
  }
  /// <summary>
  /// Builds the people described by a single person node.
  /// </summary>
  /// <remarks>
  /// The <c>Name</c> element may hold several names (see <see cref="SplitNames" />); each one
  /// becomes a person sharing the node's <c>Type</c> and <c>Role</c>. When no type is given the
  /// person is assumed to be an actor; when no role is given the role is an empty string.
  /// </remarks>
  /// <param name="reader">A reader whose first content node is the person element.</param>
  /// <returns>One <see cref="PersonInfo" /> per non-blank name found in the node.</returns>
  private IEnumerable<PersonInfo> GetPersonsFromXmlNode(XmlReader reader)
  {
      var names = new List<string>();
      var type = "Actor"; // If type is not specified assume actor
      var role = string.Empty;

      // Position on the person element, then step onto its first child node.
      reader.MoveToContent();
      reader.Read();

      // Every branch of the switch leaves the reader on the node that follows the element it
      // handled, so the loop only advances explicitly for non-element nodes. Calling Read()
      // unconditionally would skip a Type or Role element that directly follows an end tag.
      while (reader.ReadState == ReadState.Interactive)
      {
          if (reader.NodeType != XmlNodeType.Element)
          {
              reader.Read();
              continue;
          }

          switch (reader.Name)
          {
              case "Name":
                  names.AddRange(SplitNames(reader.ReadElementContentAsString()));
                  break;

              case "Type":
              {
                  var val = reader.ReadElementContentAsString();

                  if (!string.IsNullOrWhiteSpace(val))
                  {
                      type = val;
                  }
                  break;
              }

              case "Role":
              {
                  var val = reader.ReadElementContentAsString();

                  if (!string.IsNullOrWhiteSpace(val))
                  {
                      role = val;
                  }
                  break;
              }

              default:
                  reader.Skip();
                  break;
          }
      }

      // Blank names are dropped, matching how the other callers of SplitNames treat them.
      return names
          .Where(n => !string.IsNullOrWhiteSpace(n))
          .Select(n => new PersonInfo { Name = n, Role = role, Type = type });
  }
  /// <summary>
  /// Splits a comma or pipe delimited list of names (genres, studios, people) into its entries.
  /// </summary>
  /// <remarks>
  /// If the value contains a pipe, the pipe is the only separator; the comma is used only when
  /// no pipe is present, so a piped list can contain names such as "Matthew, Jr.".
  /// Entries are trimmed and entries that are empty or whitespace-only are dropped.
  /// </remarks>
  /// <param name="value">The delimited value; null is treated as an empty string.</param>
  /// <returns>The individual names, or an empty sequence when there are none.</returns>
  private IEnumerable<string> SplitNames(string value)
  {
      value = value ?? string.Empty;

      // Only split by comma if there is no pipe in the string
      // We have to be careful to not split names like Matthew, Jr.
      var separator = value.IndexOf('|') == -1 ? ',' : '|';

      // Remove surrounding whitespace and any leading/trailing separators before splitting.
      value = value.Trim().Trim(separator);

      if (string.IsNullOrWhiteSpace(value))
      {
          return new string[] { };
      }

      // Trim every entry so "A, B" yields "B" rather than " B", and drop blank entries
      // that RemoveEmptyEntries keeps (for example the " " in "A, ,B").
      return Split(value, separator, StringSplitOptions.RemoveEmptyEntries)
          .Select(name => name.Trim())
          .Where(name => name.Length > 0)
          .ToArray();
  }
  /// <summary>
  /// Convenience wrapper around <c>string.Split</c> that accepts a single separator character
  /// together with split options.
  /// </summary>
  /// <param name="val">The string to split.</param>
  /// <param name="separator">The character that delimits the entries.</param>
  /// <param name="options">Whether empty entries are kept or removed.</param>
  /// <returns>The entries of <paramref name="val" /> as a string array.</returns>
  private static string[] Split(string val, char separator, StringSplitOptions options)
  {
      char[] delimiters = { separator };
      return val.Split(delimiters, options);
  }
  617. }
  618. }