RemoteSeriesProvider.cs 23 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620
  1. using System.Xml.Linq;
  2. using MediaBrowser.Common.Configuration;
  3. using MediaBrowser.Common.Extensions;
  4. using MediaBrowser.Common.Net;
  5. using MediaBrowser.Controller.Configuration;
  6. using MediaBrowser.Controller.Entities;
  7. using MediaBrowser.Controller.Entities.TV;
  8. using MediaBrowser.Controller.Library;
  9. using MediaBrowser.Controller.Providers;
  10. using MediaBrowser.Model.Entities;
  11. using MediaBrowser.Model.IO;
  12. using MediaBrowser.Model.Logging;
  13. using System;
  14. using System.Globalization;
  15. using System.IO;
  16. using System.Linq;
  17. using System.Net;
  18. using System.Text;
  19. using System.Threading;
  20. using System.Threading.Tasks;
  21. using System.Xml;
  22. using MediaBrowser.Providers.Extensions;
  23. namespace MediaBrowser.Providers.TV
  24. {
  25. /// <summary>
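  26. /// Metadata provider that looks a series up on TheTVDB, downloads its data archive and fills in the <see cref="Series" /> item from it.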
  27. /// </summary>
  28. class RemoteSeriesProvider : BaseMetadataProvider, IDisposable
  29. {
  /// <summary>
  /// Provider manager supplied to the constructor.
  /// </summary>
  private readonly IProviderManager _providerManager;

  /// <summary>
  /// Semaphore handed to the HTTP client as the resource pool for the TheTVDB
  /// requests issued by this provider; it admits two holders at a time.
  /// </summary>
  internal readonly SemaphoreSlim TvDbResourcePool = new SemaphoreSlim(2, 2);

  /// <summary>
  /// Gets the instance assigned by the most recent constructor call.
  /// </summary>
  /// <value>The last constructed provider.</value>
  internal static RemoteSeriesProvider Current { get; private set; }

  /// <summary>
  /// Zip client used to unpack the downloaded series archive.
  /// </summary>
  private readonly IZipClient _zipClient;

  /// <summary>
  /// Gets the HTTP client used for the remote requests.
  /// </summary>
  /// <value>The HTTP client passed to the constructor.</value>
  protected IHttpClient HttpClient { get; private set; }

  /// <summary>
  /// Creates the provider, stores its collaborators and publishes the new
  /// instance through <see cref="Current" />.
  /// </summary>
  /// <param name="httpClient">The HTTP client; must not be null.</param>
  /// <param name="logManager">The log manager, forwarded to the base class.</param>
  /// <param name="configurationManager">The configuration manager, forwarded to the base class.</param>
  /// <param name="providerManager">The provider manager.</param>
  /// <param name="zipClient">The zip client.</param>
  /// <exception cref="System.ArgumentNullException">Thrown when <paramref name="httpClient" /> is null.</exception>
  public RemoteSeriesProvider(IHttpClient httpClient, ILogManager logManager, IServerConfigurationManager configurationManager, IProviderManager providerManager, IZipClient zipClient)
      : base(logManager, configurationManager)
  {
      if (httpClient == null)
      {
          throw new ArgumentNullException("httpClient");
      }

      _zipClient = zipClient;
      _providerManager = providerManager;
      HttpClient = httpClient;

      // Published last so that a failed construction never becomes Current.
      Current = this;
  }
  /// <summary>
  /// Releases the resources held by this provider.
  /// </summary>
  /// <param name="dispose"><c>true</c> to dispose the managed resources (the TheTVDB semaphore); <c>false</c> to do nothing.</param>
  protected virtual void Dispose(bool dispose)
  {
      if (!dispose)
      {
          return;
      }

      TvDbResourcePool.Dispose();
  }
  /// <summary>
  /// Base address of the TheTVDB API.
  /// </summary>
  private const string RootUrl = "http://www.thetvdb.com/api/";

  /// <summary>
  /// Series search query, appended to <see cref="RootUrl" />; {0} is the URL-encoded series name.
  /// </summary>
  private const string SeriesQuery = "GetSeries.php?seriesname={0}";

  /// <summary>
  /// Address of the series archive; {0} is the API key, {1} the series id and {2} the language.
  /// </summary>
  private const string SeriesGetZip = RootUrl + "{0}/series/{1}/all/{2}.zip";

  /// <summary>
  /// Name of the local series metadata file.
  /// </summary>
  protected const string LocalMetaFileName = "Series.xml";
  /// <summary>
  /// Tells whether this provider handles the given item.
  /// </summary>
  /// <param name="item">The item to test.</param>
  /// <returns><c>true</c> if the item is a <see cref="Series" />, <c>false</c> otherwise.</returns>
  public override bool Supports(BaseItem item)
  {
      var series = item as Series;
      return series != null;
  }
  /// <summary>
  /// Gets the priority of this provider.
  /// </summary>
  /// <value>Always <see cref="MetadataProviderPriority.Second" />.</value>
  public override MetadataProviderPriority Priority
  {
      get
      {
          return MetadataProviderPriority.Second;
      }
  }
  /// <summary>
  /// Gets a value indicating whether this provider needs internet access.
  /// </summary>
  /// <value>Always <c>true</c>.</value>
  public override bool RequiresInternet
  {
      get { return true; }
  }
  /// <summary>
  /// Gets a value indicating whether items are refreshed when the provider version changes.
  /// </summary>
  /// <value>Always <c>true</c>.</value>
  protected override bool RefreshOnVersionChange
  {
      get { return true; }
  }
  /// <summary>
  /// Gets the version string of this provider.
  /// </summary>
  /// <value>Always "1".</value>
  protected override string ProviderVersion
  {
      get { return "1"; }
  }
  /// <summary>
  /// Gets the date used to decide whether the item is out of date.
  /// </summary>
  /// <param name="item">The item.</param>
  /// <returns>
  /// The newest UTC write time among the *.xml files in the series data folder when the item
  /// has a TVDB id and the folder holds at least one such file; the base value otherwise.
  /// </returns>
  protected override DateTime CompareDate(BaseItem item)
  {
      var tvdbId = item.GetProviderId(MetadataProviders.Tvdb);
      if (string.IsNullOrEmpty(tvdbId))
      {
          return base.CompareDate(item);
      }

      // Note: resolving the data path also creates the folder when it is missing.
      var dataFolder = new DirectoryInfo(GetSeriesDataPath(ConfigurationManager.ApplicationPaths, tvdbId));

      var foundAny = false;
      var newest = DateTime.MinValue;
      foreach (var xmlFile in dataFolder.EnumerateFiles("*.xml", SearchOption.TopDirectoryOnly))
      {
          var written = xmlFile.LastWriteTimeUtc;
          if (!foundAny || written > newest)
          {
              newest = written;
              foundAny = true;
          }
      }

      if (foundAny)
      {
          return newest;
      }

      return base.CompareDate(item);
  }
  /// <summary>
  /// Resolves the TVDB id of the series (searching by name when the item has none), loads the
  /// series data for it and stamps the item as refreshed.
  /// </summary>
  /// <param name="item">The item; must be a <see cref="Series" />.</param>
  /// <param name="force">if set to <c>true</c> the metadata is re-read even when local metadata exists.</param>
  /// <param name="cancellationToken">The cancellation token.</param>
  /// <returns>Task{System.Boolean}; the result is always <c>true</c>.</returns>
  public override async Task<bool> FetchAsync(BaseItem item, bool force, CancellationToken cancellationToken)
  {
      cancellationToken.ThrowIfCancellationRequested();

      var series = (Series)item;
      var seriesId = series.GetProviderId(MetadataProviders.Tvdb);

      if (string.IsNullOrEmpty(seriesId))
      {
          // Do not capture the context, like every other await in this class.
          seriesId = await GetSeriesId(series, cancellationToken).ConfigureAwait(false);
      }

      cancellationToken.ThrowIfCancellationRequested();

      if (!string.IsNullOrEmpty(seriesId))
      {
          series.SetProviderId(MetadataProviders.Tvdb, seriesId);

          var seriesDataPath = GetSeriesDataPath(ConfigurationManager.ApplicationPaths, seriesId);
          await FetchSeriesData(series, seriesId, seriesDataPath, force, cancellationToken).ConfigureAwait(false);
      }

      // Make sure the item carries a provider-info entry for this provider.
      BaseProviderInfo data;
      if (!item.ProviderData.TryGetValue(Id, out data))
      {
          data = new BaseProviderInfo();
          item.ProviderData[Id] = data;
      }

      // The refresh is recorded even when no series id could be resolved.
      SetLastRefreshed(item, DateTime.UtcNow);
      return true;
  }
  /// <summary>
  /// Makes sure the series data files are present in <paramref name="seriesDataPath" /> and,
  /// when the series has no local metadata or a refresh is forced, applies them to the series.
  /// </summary>
  /// <param name="series">The series.</param>
  /// <param name="seriesId">The series id.</param>
  /// <param name="seriesDataPath">The series data path.</param>
  /// <param name="isForcedRefresh">if set to <c>true</c> the data is applied even when local metadata exists.</param>
  /// <param name="cancellationToken">The cancellation token.</param>
  /// <returns>Task.</returns>
  private async Task FetchSeriesData(Series series, string seriesId, string seriesDataPath, bool isForcedRefresh, CancellationToken cancellationToken)
  {
      var files = Directory.EnumerateFiles(seriesDataPath, "*.xml", SearchOption.TopDirectoryOnly).Select(Path.GetFileName).ToArray();

      // Invariant lower-casing: the language code becomes a file name and must not
      // depend on the current culture (e.g. the Turkish dotless i).
      var seriesXmlFilename = ConfigurationManager.Configuration.PreferredMetadataLanguage.ToLowerInvariant() + ".xml";

      // Only download when one of the three expected files is missing.
      // Per the original note, the prescan task takes care of updates, so nothing is re-downloaded here.
      var hasAllFiles = files.Contains("banners.xml", StringComparer.OrdinalIgnoreCase)
          && files.Contains("actors.xml", StringComparer.OrdinalIgnoreCase)
          && files.Contains(seriesXmlFilename, StringComparer.OrdinalIgnoreCase);

      if (!hasAllFiles)
      {
          await DownloadSeriesZip(seriesId, seriesDataPath, cancellationToken).ConfigureAwait(false);
      }

      // Local metadata wins unless the caller forces a refresh.
      if (HasLocalMeta(series) && !isForcedRefresh)
      {
          return;
      }

      var seriesXmlPath = Path.Combine(seriesDataPath, seriesXmlFilename);
      var actorsXmlPath = Path.Combine(seriesDataPath, "actors.xml");

      var seriesDoc = new XmlDocument();
      seriesDoc.Load(seriesXmlPath);

      FetchMainInfo(series, seriesDoc);

      if (!series.LockedFields.Contains(MetadataFields.Cast))
      {
          var actorsDoc = new XmlDocument();
          actorsDoc.Load(actorsXmlPath);

          FetchActors(series, actorsDoc, seriesDoc);
      }
  }
  /// <summary>
  /// Downloads the series archive for the preferred metadata language and extracts it
  /// into <paramref name="seriesDataPath" />.
  /// </summary>
  /// <param name="seriesId">The series id.</param>
  /// <param name="seriesDataPath">The series data path.</param>
  /// <param name="cancellationToken">The cancellation token; observed by the request and by the buffering copy.</param>
  /// <returns>Task.</returns>
  internal async Task DownloadSeriesZip(string seriesId, string seriesDataPath, CancellationToken cancellationToken)
  {
      // Default buffer size of Stream.CopyToAsync; spelled out only because the
      // overload that accepts a cancellation token requires it.
      const int copyBufferSize = 81920;

      var url = string.Format(SeriesGetZip, TVUtils.TvdbApiKey, seriesId, ConfigurationManager.Configuration.PreferredMetadataLanguage);

      using (var zipStream = await HttpClient.Get(new HttpRequestOptions
      {
          Url = url,
          ResourcePool = TvDbResourcePool,
          CancellationToken = cancellationToken

      }).ConfigureAwait(false))
      {
          // Copy to memory stream because we need a seekable stream
          using (var ms = new MemoryStream())
          {
              await zipStream.CopyToAsync(ms, copyBufferSize, cancellationToken).ConfigureAwait(false);

              ms.Position = 0;

              // NOTE(review): the last argument presumably enables overwriting existing files - confirm against IZipClient.
              _zipClient.ExtractAll(ms, seriesDataPath, true);
          }
      }
  }
  /// <summary>
  /// Gets the data folder of one series, creating it when it does not exist yet.
  /// </summary>
  /// <param name="appPaths">The app paths.</param>
  /// <param name="seriesId">The series id, used as the folder name.</param>
  /// <returns>The path of the series folder below the TVDB data folder.</returns>
  internal static string GetSeriesDataPath(IApplicationPaths appPaths, string seriesId)
  {
      var tvdbRoot = GetSeriesDataPath(appPaths);
      var seriesFolder = Path.Combine(tvdbRoot, seriesId);

      if (Directory.Exists(seriesFolder))
      {
          return seriesFolder;
      }

      Directory.CreateDirectory(seriesFolder);
      return seriesFolder;
  }
  /// <summary>
  /// Gets the "tvdb" folder below the application data path, creating it when it does not exist yet.
  /// </summary>
  /// <param name="appPaths">The app paths.</param>
  /// <returns>The path of the TVDB data folder.</returns>
  internal static string GetSeriesDataPath(IApplicationPaths appPaths)
  {
      var tvdbRoot = Path.Combine(appPaths.DataPath, "tvdb");

      if (Directory.Exists(tvdbRoot))
      {
          return tvdbRoot;
      }

      Directory.CreateDirectory(tvdbRoot);
      return tvdbRoot;
  }
  /// <summary>
  /// Copies the main series fields from the series document onto the series.
  /// Name, overview, studios and genres are skipped when the matching field is locked.
  /// For an ended series the end date is set to the latest episode air date found in the document.
  /// </summary>
  /// <param name="series">The series to update.</param>
  /// <param name="doc">The series document.</param>
  private void FetchMainInfo(Series series, XmlDocument doc)
  {
      if (!series.LockedFields.Contains(MetadataFields.Name))
      {
          series.Name = doc.SafeGetString("//SeriesName");
      }

      if (!series.LockedFields.Contains(MetadataFields.Overview))
      {
          series.Overview = doc.SafeGetString("//Overview");
      }

      series.CommunityRating = doc.SafeGetSingle("//Rating", 0, 10);
      series.AirDays = TVUtils.GetAirDays(doc.SafeGetString("//Airs_DayOfWeek"));
      series.AirTime = doc.SafeGetString("//Airs_Time");

      SeriesStatus seriesStatus;
      if (Enum.TryParse(doc.SafeGetString("//Status"), true, out seriesStatus))
      {
          series.Status = seriesStatus;
      }

      series.PremiereDate = doc.SafeGetDateTime("//FirstAired");
      if (series.PremiereDate.HasValue)
      {
          series.ProductionYear = series.PremiereDate.Value.Year;
      }

      series.RunTimeTicks = TimeSpan.FromMinutes(doc.SafeGetInt32("//Runtime")).Ticks;

      if (!series.LockedFields.Contains(MetadataFields.Studios))
      {
          var studios = SplitPipeDelimited(doc.SafeGetString("//Network"));

          // Existing studios are only replaced when the document actually names one.
          if (studios.Length > 0)
          {
              series.Studios.Clear();

              foreach (var studio in studios)
              {
                  series.AddStudio(studio);
              }
          }
      }

      series.OfficialRating = doc.SafeGetString("//ContentRating");

      if (!series.LockedFields.Contains(MetadataFields.Genres))
      {
          var genres = SplitPipeDelimited(doc.SafeGetString("//Genre"));

          // Guard on the parsed entries, not on the raw string: a value such as "|"
          // must neither wipe the existing genres nor add an empty one.
          if (genres.Length > 0)
          {
              series.Genres.Clear();

              foreach (var genre in genres)
              {
                  series.AddGenre(genre);
              }
          }
      }

      if (series.Status == SeriesStatus.Ended)
      {
          var lastAired = GetLastEpisodeAirDate(doc);
          if (lastAired.HasValue)
          {
              series.EndDate = lastAired;
          }
      }
  }

  /// <summary>
  /// Splits a pipe-delimited value into its trimmed, non-blank entries.
  /// </summary>
  /// <param name="value">The raw value; may be null.</param>
  /// <returns>The entries in their original order; an empty array when there are none.</returns>
  private static string[] SplitPipeDelimited(string value)
  {
      if (string.IsNullOrWhiteSpace(value))
      {
          return new string[0];
      }

      return value.Split(new[] { '|' }, StringSplitOptions.RemoveEmptyEntries)
          .Select(entry => entry.Trim())
          .Where(entry => entry.Length > 0)
          .ToArray();
  }

  /// <summary>
  /// Finds the latest FirstAired date among the Episode elements of the document.
  /// Episodes without a season number, or with season number "0", are ignored.
  /// </summary>
  /// <param name="doc">The series document.</param>
  /// <returns>The latest parsable air date, or null when there is none.</returns>
  private static DateTime? GetLastEpisodeAirDate(XmlDocument doc)
  {
      DateTime? latest = null;

      var episodes = doc.SelectNodes("//Episode");
      if (episodes == null)
      {
          return latest;
      }

      foreach (XmlNode episode in episodes)
      {
          var seasonNumber = episode["SeasonNumber"];
          var firstAired = episode["FirstAired"];
          if (seasonNumber == null || firstAired == null)
          {
              continue;
          }

          // NOTE(review): season 0 presumably holds specials - confirm.
          var season = seasonNumber.InnerText;
          if (string.IsNullOrEmpty(season) || season == "0")
          {
              continue;
          }

          // Machine-readable data: parse with the invariant culture, not the server's locale.
          DateTime aired;
          if (!DateTime.TryParse(firstAired.InnerText, CultureInfo.InvariantCulture, DateTimeStyles.None, out aired))
          {
              continue;
          }

          if (!latest.HasValue || aired > latest.Value)
          {
              latest = aired;
          }
      }

      return latest;
  }
  /// <summary>
  /// Replaces the people of the series with the actors listed in the actors document.
  /// When saving local metadata is enabled and the series document has a Series node,
  /// each actor is also copied into a new Persons node below it.
  /// </summary>
  /// <param name="series">The series.</param>
  /// <param name="actorsDoc">The actors doc.</param>
  /// <param name="seriesDoc">The series doc that receives the Persons node.</param>
  private void FetchActors(Series series, XmlDocument actorsDoc, XmlDocument seriesDoc)
  {
      XmlNode personsNode = null;

      if (ConfigurationManager.Configuration.SaveLocalMeta)
      {
          // Attach a container to the main series document so the actors get saved with it.
          var seriesElement = seriesDoc.SelectSingleNode("//Series");
          if (seriesElement != null)
          {
              personsNode = seriesDoc.CreateNode(XmlNodeType.Element, "Persons", null);
              seriesElement.AppendChild(personsNode);
          }
      }

      var actorNodes = actorsDoc.SelectNodes("Actors/Actor");
      if (actorNodes == null)
      {
          return;
      }

      series.People.Clear();

      foreach (XmlNode actorNode in actorNodes)
      {
          var name = actorNode.SafeGetString("Name");
          var role = actorNode.SafeGetString("Role");

          if (string.IsNullOrWhiteSpace(name))
          {
              continue;
          }

          // TVDB actor names sometimes carry leading spaces, hence the trim.
          var person = new PersonInfo();
          person.Type = PersonType.Actor;
          person.Name = name.Trim();
          person.Role = role;
          series.AddPerson(person);

          if (!ConfigurationManager.Configuration.SaveLocalMeta || personsNode == null)
          {
              continue;
          }

          // Mirror the actor into the main series document.
          var personNode = seriesDoc.CreateNode(XmlNodeType.Element, "Person", null);
          foreach (XmlNode child in actorNode.ChildNodes)
          {
              personNode.AppendChild(seriesDoc.ImportNode(child, true));
          }

          // The source document has no type element, so add one.
          var typeNode = seriesDoc.CreateNode(XmlNodeType.Element, "Type", null);
          typeNode.InnerText = PersonType.Actor;
          personNode.AppendChild(typeNode);

          personsNode.AppendChild(personNode);
      }
  }
  /// <summary>
  /// The en-US culture.
  /// </summary>
  protected readonly CultureInfo UsCulture = new CultureInfo("en-US");

  /// <summary>
  /// Checks whether the item's resolve args contain the local series metadata file.
  /// </summary>
  /// <param name="item">The item.</param>
  /// <returns><c>true</c> if a metadata file named <see cref="LocalMetaFileName" /> is present; otherwise, <c>false</c>.</returns>
  private bool HasLocalMeta(BaseItem item)
  {
      var resolveArgs = item.ResolveArgs;
      return resolveArgs.ContainsMetaFileByName(LocalMetaFileName);
  }
  /// <summary>
  /// Gets the TVDB id of the item, searching TheTVDB by the item's name when the item has none.
  /// </summary>
  /// <param name="item">The item.</param>
  /// <param name="cancellationToken">The cancellation token.</param>
  /// <returns>Task{System.String}; the id, or whatever the search returned when the item had no id.</returns>
  private async Task<string> GetSeriesId(BaseItem item, CancellationToken cancellationToken)
  {
      var knownId = item.GetProviderId(MetadataProviders.Tvdb);
      if (!string.IsNullOrEmpty(knownId))
      {
          return knownId;
      }

      return await FindSeries(item.Name, cancellationToken).ConfigureAwait(false);
  }
  /// <summary>
  /// Searches TheTVDB for a series by name and returns the id of the first result
  /// whose comparable name equals the comparable form of <paramref name="name" />.
  /// </summary>
  /// <param name="name">The series name to look for.</param>
  /// <param name="cancellationToken">The cancellation token.</param>
  /// <returns>Task{System.String}; the series id, or null when no result matched.</returns>
  public async Task<string> FindSeries(string name, CancellationToken cancellationToken)
  {
      var searchUrl = string.Format(RootUrl + SeriesQuery, WebUtility.UrlEncode(name));

      var requestOptions = new HttpRequestOptions
      {
          Url = searchUrl,
          ResourcePool = TvDbResourcePool,
          CancellationToken = cancellationToken
      };

      var searchResults = new XmlDocument();
      using (var responseStream = await HttpClient.Get(requestOptions).ConfigureAwait(false))
      {
          searchResults.Load(responseStream);
      }

      if (searchResults.HasChildNodes)
      {
          var candidates = searchResults.SelectNodes("//Series");
          var wantedName = GetComparableName(name);

          if (candidates != null)
          {
              foreach (XmlNode candidate in candidates)
              {
                  var nameNode = candidate.SelectSingleNode("./SeriesName");
                  if (nameNode == null)
                  {
                      continue;
                  }

                  if (GetComparableName(nameNode.InnerText) != wantedName)
                  {
                      Logger.Info("TVDb Provider - " + nameNode.InnerText + " did not match " + wantedName);
                      continue;
                  }

                  // A name match without an id is skipped; later results may still match.
                  var idNode = candidate.SelectSingleNode("./seriesid");
                  if (idNode != null)
                  {
                      return idNode.InnerText;
                  }
              }
          }
      }

      Logger.Info("TVDb Provider - Could not find " + name + ". Check name on Thetvdb.org.");
      return null;
  }
  /// <summary>
  /// Characters that are dropped from a name before comparison.
  /// </summary>
  const string remove = "\"'!`?";

  /// <summary>
  /// Characters that are replaced by a space before comparison.
  /// The two dashes are different characters: the ASCII hyphen-minus and the en dash.
  /// </summary>
  const string spacers = "/,.:;\\(){}[]+-_=–*";

  /// <summary>
  /// Reduces a series name to a form suitable for equality comparison: lower-cased,
  /// stripped of diacritics and of the characters in <c>remove</c>, with the characters in
  /// <c>spacers</c> turned into spaces, "&amp;" spelled out as "and", the word "the" removed,
  /// runs of spaces collapsed to one and the ends trimmed.
  /// </summary>
  /// <param name="name">The name; must not be null.</param>
  /// <returns>The comparable form of the name.</returns>
  internal static string GetComparableName(string name)
  {
      // Invariant casing so the result does not depend on the server's culture.
      name = name.ToLowerInvariant();

      // Compatibility decomposition splits accented letters into base letter + combining mark.
      name = name.Normalize(NormalizationForm.FormKD);

      var sb = new StringBuilder();
      foreach (var c in name)
      {
          if ((int)c >= 0x2B0 && (int)c <= 0x0333)
          {
              // skip char modifier and diacritics
          }
          else if (remove.IndexOf(c) > -1)
          {
              // skip chars we are removing
          }
          else if (spacers.IndexOf(c) > -1)
          {
              sb.Append(" ");
          }
          else if (c == '&')
          {
              sb.Append(" and ");
          }
          else
          {
              sb.Append(c);
          }
      }

      name = sb.ToString();

      // Kept as in the original. Commas were already turned into spaces above,
      // so the first replacement cannot match any more.
      name = name.Replace(", the", "");
      name = name.Replace("the ", " ");
      name = name.Replace(" the ", " ");

      // Collapse every run of spaces into a single space.
      while (name.Contains("  "))
      {
          name = name.Replace("  ", " ");
      }

      return name.Trim();
  }
  /// <summary>
  /// Releases the resources held by this provider.
  /// </summary>
  public void Dispose()
  {
      Dispose(true);

      // The class is not sealed: a derived type may add a finalizer, which must
      // not run again once the instance has been disposed explicitly.
      GC.SuppressFinalize(this);
  }
  544. }
  545. }