// BaseItemXmlParser.cs
using MediaBrowser.Controller.Entities;
using MediaBrowser.Model.Entities;
using MediaBrowser.Model.Logging;
using System;
using System.Collections.Generic;
using System.Globalization;
using System.Linq;
using System.Threading;
using System.Xml;

  9. namespace MediaBrowser.Controller.Providers
  10. {
  11. /// <summary>
  12. /// Provides a base class for parsing metadata xml
  13. /// </summary>
    /// <typeparam name="T">The type of item to populate; must derive from BaseItem and have a public parameterless constructor.</typeparam>
  15. public class BaseItemXmlParser<T>
  16. where T : BaseItem, new()
  17. {
  18. /// <summary>
  19. /// The logger
  20. /// </summary>
  21. protected ILogger Logger { get; private set; }
  22. /// <summary>
  23. /// Initializes a new instance of the <see cref="BaseItemXmlParser{T}" /> class.
  24. /// </summary>
  25. /// <param name="logger">The logger.</param>
  26. public BaseItemXmlParser(ILogger logger)
  27. {
  28. Logger = logger;
  29. }
  30. /// <summary>
  31. /// Fetches metadata for an item from one xml file
  32. /// </summary>
  33. /// <param name="item">The item.</param>
  34. /// <param name="metadataFile">The metadata file.</param>
  35. /// <param name="cancellationToken">The cancellation token.</param>
  36. /// <exception cref="System.ArgumentNullException"></exception>
  37. public void Fetch(T item, string metadataFile, CancellationToken cancellationToken)
  38. {
  39. if (item == null)
  40. {
  41. throw new ArgumentNullException();
  42. }
  43. if (string.IsNullOrEmpty(metadataFile))
  44. {
  45. throw new ArgumentNullException();
  46. }
  47. var settings = new XmlReaderSettings
  48. {
  49. CheckCharacters = false,
  50. IgnoreProcessingInstructions = true,
  51. IgnoreComments = true,
  52. ValidationType = ValidationType.None
  53. };
  54. // Use XmlReader for best performance
  55. using (var reader = XmlReader.Create(metadataFile, settings))
  56. {
  57. reader.MoveToContent();
  58. // Loop through each element
  59. while (reader.Read())
  60. {
  61. cancellationToken.ThrowIfCancellationRequested();
  62. if (reader.NodeType == XmlNodeType.Element)
  63. {
  64. FetchDataFromXmlNode(reader, item);
  65. }
  66. }
  67. }
  68. }
  69. /// <summary>
  70. /// Fetches metadata from one Xml Element
  71. /// </summary>
  72. /// <param name="reader">The reader.</param>
  73. /// <param name="item">The item.</param>
  74. protected virtual void FetchDataFromXmlNode(XmlReader reader, T item)
  75. {
  76. switch (reader.Name)
  77. {
  78. // DateCreated
  79. case "Added":
  80. DateTime added;
  81. if (DateTime.TryParse(reader.ReadElementContentAsString() ?? string.Empty, out added))
  82. {
  83. item.DateCreated = added.ToUniversalTime();
  84. }
  85. break;
  86. case "LocalTitle":
  87. item.Name = reader.ReadElementContentAsString();
  88. break;
  89. case "Type":
  90. {
  91. var type = reader.ReadElementContentAsString();
  92. if (!string.IsNullOrWhiteSpace(type) && !type.Equals("none", StringComparison.OrdinalIgnoreCase))
  93. {
  94. item.DisplayMediaType = type;
  95. }
  96. break;
  97. }
  98. case "SortTitle":
  99. item.ForcedSortName = reader.ReadElementContentAsString();
  100. break;
  101. case "Overview":
  102. case "Description":
  103. item.Overview = reader.ReadElementContentAsString();
  104. break;
  105. case "TagLine":
  106. {
  107. var tagline = reader.ReadElementContentAsString();
  108. if (!string.IsNullOrWhiteSpace(tagline))
  109. {
  110. item.AddTagline(tagline);
  111. }
  112. break;
  113. }
  114. case "Website":
  115. {
  116. var val = reader.ReadElementContentAsString();
  117. if (!string.IsNullOrWhiteSpace(val))
  118. {
  119. item.HomePageUrl = val;
  120. }
  121. break;
  122. }
  123. case "TagLines":
  124. {
  125. FetchFromTaglinesNode(reader.ReadSubtree(), item);
  126. break;
  127. }
  128. case "ContentRating":
  129. case "certification":
  130. case "MPAARating":
  131. {
  132. var rating = reader.ReadElementContentAsString();
  133. if (!string.IsNullOrWhiteSpace(rating))
  134. {
  135. item.OfficialRating = rating;
  136. }
  137. break;
  138. }
  139. case "CustomRating":
  140. {
  141. var val = reader.ReadElementContentAsString();
  142. if (!string.IsNullOrWhiteSpace(val))
  143. {
  144. item.CustomRating = val;
  145. }
  146. break;
  147. }
  148. case "Runtime":
  149. case "RunningTime":
  150. {
  151. var text = reader.ReadElementContentAsString();
  152. if (!string.IsNullOrWhiteSpace(text))
  153. {
  154. int runtime;
  155. if (int.TryParse(text.Split(' ')[0], out runtime))
  156. {
  157. item.RunTimeTicks = TimeSpan.FromMinutes(runtime).Ticks;
  158. }
  159. }
  160. break;
  161. }
  162. case "Genre":
  163. {
  164. foreach (var name in SplitNames(reader.ReadElementContentAsString()))
  165. {
  166. if (string.IsNullOrWhiteSpace(name))
  167. {
  168. continue;
  169. }
  170. item.AddGenre(name);
  171. }
  172. break;
  173. }
  174. case "AspectRatio":
  175. {
  176. var val = reader.ReadElementContentAsString();
  177. if (!string.IsNullOrWhiteSpace(val))
  178. {
  179. item.AspectRatio = val;
  180. }
  181. break;
  182. }
  183. case "Network":
  184. {
  185. foreach (var name in SplitNames(reader.ReadElementContentAsString()))
  186. {
  187. if (string.IsNullOrWhiteSpace(name))
  188. {
  189. continue;
  190. }
  191. item.AddStudio(name);
  192. }
  193. break;
  194. }
  195. case "Director":
  196. {
  197. foreach (var p in SplitNames(reader.ReadElementContentAsString()).Select(v => new PersonInfo { Name = v, Type = PersonType.Director }))
  198. {
  199. if (string.IsNullOrWhiteSpace(p.Name))
  200. {
  201. continue;
  202. }
  203. item.AddPerson(p);
  204. }
  205. break;
  206. }
  207. case "Writer":
  208. {
  209. foreach (var p in SplitNames(reader.ReadElementContentAsString()).Select(v => new PersonInfo { Name = v, Type = PersonType.Writer }))
  210. {
  211. if (string.IsNullOrWhiteSpace(p.Name))
  212. {
  213. continue;
  214. }
  215. item.AddPerson(p);
  216. }
  217. break;
  218. }
  219. case "Actors":
  220. {
  221. foreach (var p in SplitNames(reader.ReadElementContentAsString()).Select(v => new PersonInfo { Name = v.Trim(), Type = PersonType.Actor }))
  222. {
  223. if (string.IsNullOrWhiteSpace(p.Name))
  224. {
  225. continue;
  226. }
  227. item.AddPerson(p);
  228. }
  229. break;
  230. }
  231. case "GuestStars":
  232. {
  233. foreach (var p in SplitNames(reader.ReadElementContentAsString()).Select(v => new PersonInfo { Name = v.Trim(), Type = PersonType.GuestStar }))
  234. {
  235. if (string.IsNullOrWhiteSpace(p.Name))
  236. {
  237. continue;
  238. }
  239. item.AddPerson(p);
  240. }
  241. break;
  242. }
  243. case "Trailer":
  244. {
  245. var val = reader.ReadElementContentAsString();
  246. if (!string.IsNullOrWhiteSpace(val))
  247. {
  248. item.AddTrailerUrl(val);
  249. }
  250. break;
  251. }
  252. case "ProductionYear":
  253. {
  254. var val = reader.ReadElementContentAsString();
  255. if (!string.IsNullOrWhiteSpace(val))
  256. {
  257. int ProductionYear;
  258. if (int.TryParse(val, out ProductionYear) && ProductionYear > 1850)
  259. {
  260. item.ProductionYear = ProductionYear;
  261. }
  262. }
  263. break;
  264. }
  265. case "Rating":
  266. case "IMDBrating":
  267. {
  268. var rating = reader.ReadElementContentAsString();
  269. if (!string.IsNullOrWhiteSpace(rating))
  270. {
  271. float val;
  272. if (float.TryParse(rating, out val))
  273. {
  274. item.CommunityRating = val;
  275. }
  276. }
  277. break;
  278. }
  279. case "FirstAired":
  280. {
  281. var firstAired = reader.ReadElementContentAsString();
  282. if (!string.IsNullOrWhiteSpace(firstAired))
  283. {
  284. DateTime airDate;
  285. if (DateTime.TryParse(firstAired, out airDate) && airDate.Year > 1850)
  286. {
  287. item.PremiereDate = airDate.ToUniversalTime();
  288. item.ProductionYear = airDate.Year;
  289. }
  290. }
  291. break;
  292. }
  293. case "TMDbId":
  294. var tmdb = reader.ReadElementContentAsString();
  295. if (!string.IsNullOrWhiteSpace(tmdb))
  296. {
  297. item.SetProviderId(MetadataProviders.Tmdb, tmdb);
  298. }
  299. break;
  300. case "TVcomId":
  301. var TVcomId = reader.ReadElementContentAsString();
  302. if (!string.IsNullOrWhiteSpace(TVcomId))
  303. {
  304. item.SetProviderId(MetadataProviders.Tvcom, TVcomId);
  305. }
  306. break;
  307. case "IMDB_ID":
  308. case "IMDB":
  309. case "IMDbId":
  310. var IMDbId = reader.ReadElementContentAsString();
  311. if (!string.IsNullOrWhiteSpace(IMDbId))
  312. {
  313. item.SetProviderId(MetadataProviders.Imdb, IMDbId);
  314. }
  315. break;
  316. case "Genres":
  317. FetchFromGenresNode(reader.ReadSubtree(), item);
  318. break;
  319. case "Persons":
  320. FetchDataFromPersonsNode(reader.ReadSubtree(), item);
  321. break;
  322. case "ParentalRating":
  323. FetchFromParentalRatingNode(reader.ReadSubtree(), item);
  324. break;
  325. case "Studios":
  326. FetchFromStudiosNode(reader.ReadSubtree(), item);
  327. break;
  328. default:
  329. reader.Skip();
  330. break;
  331. }
  332. }
  333. /// <summary>
  334. /// Fetches from taglines node.
  335. /// </summary>
  336. /// <param name="reader">The reader.</param>
  337. /// <param name="item">The item.</param>
  338. private void FetchFromTaglinesNode(XmlReader reader, T item)
  339. {
  340. reader.MoveToContent();
  341. while (reader.Read())
  342. {
  343. if (reader.NodeType == XmlNodeType.Element)
  344. {
  345. switch (reader.Name)
  346. {
  347. case "Tagline":
  348. {
  349. var val = reader.ReadElementContentAsString();
  350. if (!string.IsNullOrWhiteSpace(val))
  351. {
  352. item.AddTagline(val);
  353. }
  354. break;
  355. }
  356. default:
  357. reader.Skip();
  358. break;
  359. }
  360. }
  361. }
  362. }
  363. /// <summary>
  364. /// Fetches from genres node.
  365. /// </summary>
  366. /// <param name="reader">The reader.</param>
  367. /// <param name="item">The item.</param>
  368. private void FetchFromGenresNode(XmlReader reader, T item)
  369. {
  370. reader.MoveToContent();
  371. while (reader.Read())
  372. {
  373. if (reader.NodeType == XmlNodeType.Element)
  374. {
  375. switch (reader.Name)
  376. {
  377. case "Genre":
  378. {
  379. var genre = reader.ReadElementContentAsString();
  380. if (!string.IsNullOrWhiteSpace(genre))
  381. {
  382. item.AddGenre(genre);
  383. }
  384. break;
  385. }
  386. default:
  387. reader.Skip();
  388. break;
  389. }
  390. }
  391. }
  392. }
  393. /// <summary>
  394. /// Fetches the data from persons node.
  395. /// </summary>
  396. /// <param name="reader">The reader.</param>
  397. /// <param name="item">The item.</param>
  398. private void FetchDataFromPersonsNode(XmlReader reader, T item)
  399. {
  400. reader.MoveToContent();
  401. while (reader.Read())
  402. {
  403. if (reader.NodeType == XmlNodeType.Element)
  404. {
  405. switch (reader.Name)
  406. {
  407. case "Person":
  408. {
  409. item.AddPeople(GetPersonsFromXmlNode(reader.ReadSubtree()));
  410. break;
  411. }
  412. default:
  413. reader.Skip();
  414. break;
  415. }
  416. }
  417. }
  418. }
  419. /// <summary>
  420. /// Fetches from studios node.
  421. /// </summary>
  422. /// <param name="reader">The reader.</param>
  423. /// <param name="item">The item.</param>
  424. private void FetchFromStudiosNode(XmlReader reader, T item)
  425. {
  426. reader.MoveToContent();
  427. while (reader.Read())
  428. {
  429. if (reader.NodeType == XmlNodeType.Element)
  430. {
  431. switch (reader.Name)
  432. {
  433. case "Studio":
  434. {
  435. var studio = reader.ReadElementContentAsString();
  436. if (!string.IsNullOrWhiteSpace(studio))
  437. {
  438. item.AddStudio(studio);
  439. }
  440. break;
  441. }
  442. default:
  443. reader.Skip();
  444. break;
  445. }
  446. }
  447. }
  448. }
  449. /// <summary>
  450. /// Fetches from parental rating node.
  451. /// </summary>
  452. /// <param name="reader">The reader.</param>
  453. /// <param name="item">The item.</param>
  454. private void FetchFromParentalRatingNode(XmlReader reader, T item)
  455. {
  456. reader.MoveToContent();
  457. while (reader.Read())
  458. {
  459. if (reader.NodeType == XmlNodeType.Element)
  460. {
  461. switch (reader.Name)
  462. {
  463. case "Value":
  464. {
  465. var ratingString = reader.ReadElementContentAsString();
  466. int rating = 7;
  467. if (!string.IsNullOrWhiteSpace(ratingString))
  468. {
  469. int.TryParse(ratingString, out rating);
  470. }
  471. switch (rating)
  472. {
  473. case -1:
  474. item.OfficialRating = "NR";
  475. break;
  476. case 0:
  477. item.OfficialRating = "UR";
  478. break;
  479. case 1:
  480. item.OfficialRating = "G";
  481. break;
  482. case 3:
  483. item.OfficialRating = "PG";
  484. break;
  485. case 4:
  486. item.OfficialRating = "PG-13";
  487. break;
  488. case 5:
  489. item.OfficialRating = "NC-17";
  490. break;
  491. case 6:
  492. item.OfficialRating = "R";
  493. break;
  494. }
  495. break;
  496. }
  497. default:
  498. reader.Skip();
  499. break;
  500. }
  501. }
  502. }
  503. }
  504. /// <summary>
  505. /// Gets the persons from XML node.
  506. /// </summary>
  507. /// <param name="reader">The reader.</param>
  508. /// <returns>IEnumerable{PersonInfo}.</returns>
  509. private IEnumerable<PersonInfo> GetPersonsFromXmlNode(XmlReader reader)
  510. {
  511. var names = new List<string>();
  512. var type = string.Empty;
  513. var role = string.Empty;
  514. reader.MoveToContent();
  515. while (reader.Read())
  516. {
  517. if (reader.NodeType == XmlNodeType.Element)
  518. {
  519. switch (reader.Name)
  520. {
  521. case "Name":
  522. names.AddRange(SplitNames(reader.ReadElementContentAsString()));
  523. break;
  524. case "Type":
  525. {
  526. var val = reader.ReadElementContentAsString();
  527. if (!string.IsNullOrWhiteSpace(val))
  528. {
  529. type = val;
  530. }
  531. break;
  532. }
  533. case "Role":
  534. {
  535. var val = reader.ReadElementContentAsString();
  536. if (!string.IsNullOrWhiteSpace(val))
  537. {
  538. role = val;
  539. }
  540. break;
  541. }
  542. default:
  543. reader.Skip();
  544. break;
  545. }
  546. }
  547. }
  548. return names.Select(n => new PersonInfo { Name = n, Role = role, Type = type });
  549. }
  550. /// <summary>
  551. /// Used to split names of comma or pipe delimeted genres and people
  552. /// </summary>
  553. /// <param name="value">The value.</param>
  554. /// <returns>IEnumerable{System.String}.</returns>
  555. private IEnumerable<string> SplitNames(string value)
  556. {
  557. value = value ?? string.Empty;
  558. // Only split by comma if there is no pipe in the string
  559. // We have to be careful to not split names like Matthew, Jr.
  560. var separator = value.IndexOf('|') == -1 ? ',' : '|';
  561. value = value.Trim().Trim(separator);
  562. return string.IsNullOrWhiteSpace(value) ? new string[] { } : Split(value, separator, StringSplitOptions.RemoveEmptyEntries);
  563. }
  564. /// <summary>
  565. /// Provides an additional overload for string.split
  566. /// </summary>
  567. /// <param name="val">The val.</param>
  568. /// <param name="separator">The separator.</param>
  569. /// <param name="options">The options.</param>
  570. /// <returns>System.String[][].</returns>
  571. private static string[] Split(string val, char separator, StringSplitOptions options)
  572. {
  573. return val.Split(new[] { separator }, options);
  574. }
  575. }
  576. }