RemoteSeriesProvider.cs 24 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640
  1. using System.Xml.Linq;
  2. using MediaBrowser.Common.Configuration;
  3. using MediaBrowser.Common.Extensions;
  4. using MediaBrowser.Common.Net;
  5. using MediaBrowser.Controller.Configuration;
  6. using MediaBrowser.Controller.Entities;
  7. using MediaBrowser.Controller.Entities.TV;
  8. using MediaBrowser.Controller.Library;
  9. using MediaBrowser.Controller.Providers;
  10. using MediaBrowser.Model.Entities;
  11. using MediaBrowser.Model.IO;
  12. using MediaBrowser.Model.Logging;
  13. using System;
  14. using System.Globalization;
  15. using System.IO;
  16. using System.Linq;
  17. using System.Net;
  18. using System.Text;
  19. using System.Threading;
  20. using System.Threading.Tasks;
  21. using System.Xml;
  22. using MediaBrowser.Providers.Extensions;
  23. namespace MediaBrowser.Providers.TV
  24. {
  25. /// <summary>
  26. /// Class RemoteSeriesProvider
  27. /// </summary>
  28. class RemoteSeriesProvider : BaseMetadataProvider, IDisposable
  29. {
  /// <summary>
  /// Provider manager; this class uses it to save the series metadata file into the library.
  /// </summary>
  private readonly IProviderManager _providerManager;
  /// <summary>
  /// Zip client used to extract the downloaded series archive.
  /// </summary>
  private readonly IZipClient _zipClient;
  /// <summary>
  /// Semaphore (initial and maximum count of 2) handed to every TheTVDB request as its resource pool.
  /// </summary>
  internal readonly SemaphoreSlim TvDbResourcePool = new SemaphoreSlim(2, 2);
  /// <summary>
  /// Gets the most recently constructed instance; the constructor assigns it.
  /// </summary>
  /// <value>The most recently constructed provider.</value>
  internal static RemoteSeriesProvider Current { get; private set; }
  /// <summary>
  /// Gets the HTTP client used for all TheTVDB requests made by this provider.
  /// </summary>
  /// <value>The HTTP client.</value>
  protected IHttpClient HttpClient { get; private set; }
  /// <summary>
  /// Creates the provider, stores its collaborators and publishes the new instance through <see cref="Current" />.
  /// </summary>
  /// <param name="httpClient">The HTTP client; must not be null.</param>
  /// <param name="logManager">The log manager, forwarded to the base class.</param>
  /// <param name="configurationManager">The configuration manager, forwarded to the base class.</param>
  /// <param name="providerManager">The provider manager.</param>
  /// <param name="zipClient">The zip client.</param>
  /// <exception cref="System.ArgumentNullException">Thrown when <paramref name="httpClient" /> is null.</exception>
  public RemoteSeriesProvider(IHttpClient httpClient, ILogManager logManager, IServerConfigurationManager configurationManager, IProviderManager providerManager, IZipClient zipClient)
      : base(logManager, configurationManager)
  {
      // Only the HTTP client is validated; the other collaborators are stored as given.
      if (null == httpClient)
      {
          throw new ArgumentNullException("httpClient");
      }

      _zipClient = zipClient;
      _providerManager = providerManager;
      HttpClient = httpClient;

      // Expose this instance through the static accessor.
      Current = this;
  }
  /// <summary>
  /// Releases the resources held by this provider.
  /// </summary>
  /// <param name="dispose"><c>true</c> to dispose the managed request semaphore; <c>false</c> to do nothing.</param>
  protected virtual void Dispose(bool dispose)
  {
      if (!dispose)
      {
          // Nothing unmanaged is held directly by this class.
          return;
      }

      TvDbResourcePool.Dispose();
  }
  /// <summary>
  /// Base address of the TheTVDB API.
  /// </summary>
  private const string RootUrl = "http://www.thetvdb.com/api/";
  /// <summary>
  /// Relative search query; {0} is the URL-encoded series name.
  /// </summary>
  private const string SeriesQuery = "GetSeries.php?seriesname={0}";
  /// <summary>
  /// Absolute URL template of the series archive; {0} is the API key, {1} the series id and {2} the language.
  /// </summary>
  private const string SeriesGetZip = RootUrl + "{0}/series/{1}/all/{2}.zip";
  /// <summary>
  /// File name of the series metadata file stored next to the series in the library.
  /// </summary>
  protected const string LocalMetaFileName = "Series.xml";
  /// <summary>
  /// Indicates whether this provider handles the given item.
  /// </summary>
  /// <param name="item">The item.</param>
  /// <returns><c>true</c> if the item is a <see cref="Series" />, <c>false</c> otherwise</returns>
  public override bool Supports(BaseItem item)
  {
      var asSeries = item as Series;
      return asSeries != null;
  }
  /// <summary>
  /// Gets the priority of this provider.
  /// </summary>
  /// <value>Always <see cref="MetadataProviderPriority.Second" />.</value>
  public override MetadataProviderPriority Priority
  {
      get
      {
          return MetadataProviderPriority.Second;
      }
  }
  /// <summary>
  /// Gets a value indicating whether this provider needs internet access.
  /// </summary>
  /// <value>Always <c>true</c>.</value>
  public override bool RequiresInternet
  {
      get { return true; }
  }
  /// <summary>
  /// Gets a value indicating whether items should be refreshed when the provider version changes.
  /// </summary>
  /// <value>Always <c>true</c>.</value>
  protected override bool RefreshOnVersionChange
  {
      get { return true; }
  }
  /// <summary>
  /// Gets the version string of this provider.
  /// </summary>
  /// <value>Currently "1".</value>
  protected override string ProviderVersion
  {
      get { return "1"; }
  }
  /// <summary>
  /// Decides whether the item has to be refreshed by this provider.
  /// </summary>
  /// <param name="item">The item.</param>
  /// <param name="providerInfo">The provider info stored for the item.</param>
  /// <returns><c>true</c> if the cached series data differs from what was recorded, or if the base class asks for a refresh; <c>false</c> otherwise</returns>
  protected override bool NeedsRefreshInternal(BaseItem item, BaseProviderInfo providerInfo)
  {
      // Refresh even if local metadata exists because we need episode infos
      var cachedDataChanged = GetComparisonData(item) != providerInfo.Data;

      // The base check is only consulted when the cached data is unchanged.
      return cachedDataChanged || base.NeedsRefreshInternal(item, providerInfo);
  }
  /// <summary>
  /// Builds a fingerprint of the cached TheTVDB xml files of the item's series.
  /// </summary>
  /// <param name="item">The item; its Tvdb provider id selects the cache directory.</param>
  /// <returns>
  /// An MD5-based Guid over the full name and last-write ticks of every top-level xml file in the
  /// series cache directory, or <see cref="Guid.Empty" /> when the item has no Tvdb id or the
  /// directory contains no xml files.
  /// </returns>
  private Guid GetComparisonData(BaseItem item)
  {
      var seriesId = item.GetProviderId(MetadataProviders.Tvdb);
      if (string.IsNullOrEmpty(seriesId))
      {
          return Guid.Empty;
      }

      // Note: resolving the path also creates the directory when it does not exist yet.
      var path = GetSeriesDataPath(ConfigurationManager.ApplicationPaths, seriesId);

      // The file system does not guarantee an enumeration order, so sort the entries to keep
      // the fingerprint stable when nothing on disk has changed.
      var files = new DirectoryInfo(path)
          .EnumerateFiles("*.xml", SearchOption.TopDirectoryOnly)
          .Select(i => i.FullName + i.LastWriteTimeUtc.Ticks)
          .OrderBy(i => i, StringComparer.Ordinal)
          .ToArray();

      return files.Length > 0
          ? string.Join(string.Empty, files).GetMD5()
          : Guid.Empty;
  }
  /// <summary>
  /// Fetches TheTVDB metadata for a series and records the comparison data and refresh time.
  /// </summary>
  /// <param name="item">The item; it is cast to <see cref="Series" />.</param>
  /// <param name="force">if set to <c>true</c> [force]. Not read by this implementation.</param>
  /// <param name="cancellationToken">The cancellation token.</param>
  /// <returns>Always <c>true</c>, indicating that work requiring persistence was done.</returns>
  public override async Task<bool> FetchAsync(BaseItem item, bool force, CancellationToken cancellationToken)
  {
      cancellationToken.ThrowIfCancellationRequested();

      var series = (Series)item;
      var seriesId = series.GetProviderId(MetadataProviders.Tvdb);

      if (string.IsNullOrEmpty(seriesId))
      {
          // No id stored yet: look the series up by name.
          // ConfigureAwait(false) matches every other await in this class.
          seriesId = await GetSeriesId(series, cancellationToken).ConfigureAwait(false);
      }

      cancellationToken.ThrowIfCancellationRequested();

      if (!string.IsNullOrEmpty(seriesId))
      {
          series.SetProviderId(MetadataProviders.Tvdb, seriesId);

          var seriesDataPath = GetSeriesDataPath(ConfigurationManager.ApplicationPaths, seriesId);
          await FetchSeriesData(series, seriesId, seriesDataPath, cancellationToken).ConfigureAwait(false);
      }

      // Record the fingerprint of the cached files so NeedsRefreshInternal can detect changes.
      BaseProviderInfo data;
      if (!item.ProviderData.TryGetValue(Id, out data))
      {
          data = new BaseProviderInfo();
          item.ProviderData[Id] = data;
      }

      data.Data = GetComparisonData(item);
      SetLastRefreshed(item, DateTime.UtcNow);
      return true;
  }
  /// <summary>
  /// Makes sure the series xml files are cached locally, then applies them to the series
  /// and optionally saves the merged document into the library.
  /// </summary>
  /// <param name="series">The series to populate.</param>
  /// <param name="seriesId">The TheTVDB series id.</param>
  /// <param name="seriesDataPath">The directory holding the cached xml files of the series.</param>
  /// <param name="cancellationToken">The cancellation token.</param>
  /// <returns>Task.</returns>
  private async Task FetchSeriesData(Series series, string seriesId, string seriesDataPath, CancellationToken cancellationToken)
  {
      var files = Directory.EnumerateFiles(seriesDataPath, "*.xml", SearchOption.TopDirectoryOnly).Select(Path.GetFileName).ToArray();

      // File names must not depend on the current culture (e.g. Turkish 'I' casing), so lower-case invariantly.
      var seriesXmlFilename = ConfigurationManager.Configuration.PreferredMetadataLanguage.ToLowerInvariant() + ".xml";

      // Only download if not already there
      // The prescan task will take care of updates so we don't need to re-download here
      var hasAllFiles = files.Contains("banners.xml", StringComparer.OrdinalIgnoreCase)
          && files.Contains("actors.xml", StringComparer.OrdinalIgnoreCase)
          && files.Contains(seriesXmlFilename, StringComparer.OrdinalIgnoreCase);

      if (!hasAllFiles)
      {
          await DownloadSeriesZip(seriesId, seriesDataPath, cancellationToken).ConfigureAwait(false);
      }

      // Examine if there's no local metadata, or save local is on (to get updates)
      if (!HasLocalMeta(series) || ConfigurationManager.Configuration.SaveLocalMeta)
      {
          var seriesXmlPath = Path.Combine(seriesDataPath, seriesXmlFilename);
          var actorsXmlPath = Path.Combine(seriesDataPath, "actors.xml");

          var seriesDoc = new XmlDocument();
          seriesDoc.Load(seriesXmlPath);
          FetchMainInfo(series, seriesDoc);

          var actorsDoc = new XmlDocument();
          actorsDoc.Load(actorsXmlPath);

          // When saving locally, FetchActors also appends the actors to seriesDoc.
          FetchActors(series, actorsDoc, seriesDoc);

          if (ConfigurationManager.Configuration.SaveLocalMeta)
          {
              using (var ms = new MemoryStream())
              {
                  seriesDoc.Save(ms);

                  // Save leaves the stream positioned at its end; rewind so the consumer reads the
                  // document from the start. Harmless if SaveToLibraryFilesystem rewinds on its own.
                  ms.Position = 0;

                  await _providerManager.SaveToLibraryFilesystem(series, Path.Combine(series.MetaLocation, LocalMetaFileName), ms, cancellationToken).ConfigureAwait(false);
              }
          }
      }
  }
  /// <summary>
  /// Downloads the series archive from TheTVDB and extracts it into the series data directory.
  /// </summary>
  /// <param name="seriesId">The TheTVDB series id.</param>
  /// <param name="seriesDataPath">The directory the archive is extracted into.</param>
  /// <param name="cancellationToken">The cancellation token; honored by both the request and the buffering copy.</param>
  /// <returns>Task.</returns>
  internal async Task DownloadSeriesZip(string seriesId, string seriesDataPath, CancellationToken cancellationToken)
  {
      var url = string.Format(SeriesGetZip, TVUtils.TvdbApiKey, seriesId, ConfigurationManager.Configuration.PreferredMetadataLanguage);

      using (var zipStream = await HttpClient.Get(new HttpRequestOptions
      {
          Url = url,
          ResourcePool = TvDbResourcePool,
          CancellationToken = cancellationToken
      }).ConfigureAwait(false))
      {
          // Copy to memory stream because we need a seekable stream
          using (var ms = new MemoryStream())
          {
              // 81920 is the framework's default copy buffer size; this overload is used only
              // so that the copy can be cancelled as well.
              await zipStream.CopyToAsync(ms, 81920, cancellationToken).ConfigureAwait(false);

              ms.Position = 0;
              _zipClient.ExtractAll(ms, seriesDataPath, true);
          }
      }
  }
  /// <summary>
  /// Resolves the cache directory of a single series, creating it when it does not exist.
  /// </summary>
  /// <param name="appPaths">The app paths.</param>
  /// <param name="seriesId">The series id; used as the directory name.</param>
  /// <returns>The full path of the series cache directory.</returns>
  internal static string GetSeriesDataPath(IApplicationPaths appPaths, string seriesId)
  {
      var tvdbRoot = GetSeriesDataPath(appPaths);
      var seriesDataPath = Path.Combine(tvdbRoot, seriesId);

      if (Directory.Exists(seriesDataPath))
      {
          return seriesDataPath;
      }

      Directory.CreateDirectory(seriesDataPath);
      return seriesDataPath;
  }
  /// <summary>
  /// Resolves the root "tvdb" cache directory below the application data path, creating it when it does not exist.
  /// </summary>
  /// <param name="appPaths">The app paths.</param>
  /// <returns>The full path of the tvdb cache directory.</returns>
  internal static string GetSeriesDataPath(IApplicationPaths appPaths)
  {
      var dataPath = Path.Combine(appPaths.DataPath, "tvdb");

      if (Directory.Exists(dataPath))
      {
          return dataPath;
      }

      Directory.CreateDirectory(dataPath);
      return dataPath;
  }
  /// <summary>
  /// Copies the main series fields from the TheTVDB series document onto the series.
  /// </summary>
  /// <remarks>
  /// Sets name, overview, rating, air days/time, status, premiere date, production year, runtime,
  /// studios, official rating and genres. For ended series the end date is set to the latest
  /// air date of any episode outside season 0.
  /// </remarks>
  /// <param name="series">The series to populate.</param>
  /// <param name="doc">The series document.</param>
  private void FetchMainInfo(Series series, XmlDocument doc)
  {
      series.Name = doc.SafeGetString("//SeriesName");
      series.Overview = doc.SafeGetString("//Overview");
      series.CommunityRating = doc.SafeGetSingle("//Rating", 0, 10);
      series.AirDays = TVUtils.GetAirDays(doc.SafeGetString("//Airs_DayOfWeek"));
      series.AirTime = doc.SafeGetString("//Airs_Time");

      SeriesStatus seriesStatus;
      if (Enum.TryParse(doc.SafeGetString("//Status"), true, out seriesStatus))
      {
          series.Status = seriesStatus;
      }

      series.PremiereDate = doc.SafeGetDateTime("//FirstAired");
      if (series.PremiereDate.HasValue)
      {
          series.ProductionYear = series.PremiereDate.Value.Year;
      }

      // Runtime is in minutes; a tick is 100 ns, so convert with TimeSpan.TicksPerMinute.
      series.RunTimeTicks = doc.SafeGetInt32("//Runtime") * TimeSpan.TicksPerMinute;

      var separators = new[] { '|' };

      var network = doc.SafeGetString("//Network");
      if (!string.IsNullOrWhiteSpace(network))
      {
          series.Studios.Clear();

          // Skip blank entries produced by leading, trailing or doubled separators.
          foreach (var studio in network.Trim().Split(separators, StringSplitOptions.RemoveEmptyEntries))
          {
              if (!string.IsNullOrWhiteSpace(studio))
              {
                  series.AddStudio(studio);
              }
          }
      }

      series.OfficialRating = doc.SafeGetString("//ContentRating");

      var genreList = doc.SafeGetString("//Genre");
      if (genreList != null)
      {
          var genres = genreList
              .Split(separators, StringSplitOptions.RemoveEmptyEntries)
              .Where(genre => !string.IsNullOrWhiteSpace(genre))
              .ToArray();

          // Only replace the existing genres when the document actually supplies some.
          if (genres.Length > 0)
          {
              series.Genres.Clear();
              foreach (var genre in genres)
              {
                  series.AddGenre(genre);
              }
          }
      }

      if (series.Status == SeriesStatus.Ended)
      {
          XDocument document;
          using (var reader = new XmlNodeReader(doc))
          {
              document = XDocument.Load(reader);
          }

          var airDates = document.Descendants("Episode")
              .Where(episode =>
              {
                  // Season 0 is excluded from the end-date calculation.
                  var seasonNumber = episode.Element("SeasonNumber");
                  return seasonNumber != null
                      && !string.IsNullOrEmpty(seasonNumber.Value)
                      && seasonNumber.Value != "0";
              })
              .Select(episode =>
              {
                  DateTime parsed;
                  var firstAired = episode.Element("FirstAired");

                  // Parse with the invariant culture so the result does not depend on the server locale.
                  return firstAired != null
                      && !string.IsNullOrEmpty(firstAired.Value)
                      && DateTime.TryParse(firstAired.Value, CultureInfo.InvariantCulture, DateTimeStyles.None, out parsed)
                      ? (DateTime?)parsed
                      : null;
              })
              .Where(date => date.HasValue)
              .ToList();

          if (airDates.Count > 0)
          {
              series.EndDate = airDates.Max();
          }
      }
  }
  /// <summary>
  /// Replaces the people of the series with the actors listed in the actors document and,
  /// when local metadata saving is enabled, mirrors them into the series document.
  /// </summary>
  /// <param name="series">The series whose people are replaced.</param>
  /// <param name="actorsDoc">The actors document.</param>
  /// <param name="seriesDoc">The series document; receives a "Persons" element when saving locally.</param>
  private void FetchActors(Series series, XmlDocument actorsDoc, XmlDocument seriesDoc)
  {
      XmlNode personsContainer = null;

      if (ConfigurationManager.Configuration.SaveLocalMeta)
      {
          //add to the main seriesDoc for saving
          var seriesElement = seriesDoc.SelectSingleNode("//Series");
          if (seriesElement != null)
          {
              personsContainer = seriesDoc.CreateNode(XmlNodeType.Element, "Persons", null);
              seriesElement.AppendChild(personsContainer);
          }
      }

      var actorNodes = actorsDoc.SelectNodes("Actors/Actor");
      if (actorNodes == null)
      {
          return;
      }

      series.People.Clear();

      foreach (XmlNode actorNode in actorNodes)
      {
          var actorName = actorNode.SafeGetString("Name");
          var actorRole = actorNode.SafeGetString("Role");

          if (string.IsNullOrWhiteSpace(actorName))
          {
              continue;
          }

          // Sometimes tvdb actors have leading spaces
          var person = new PersonInfo { Type = PersonType.Actor, Name = actorName.Trim(), Role = actorRole };
          series.AddPerson(person);

          if (!ConfigurationManager.Configuration.SaveLocalMeta || personsContainer == null)
          {
              continue;
          }

          //create in main seriesDoc
          var personElement = seriesDoc.CreateNode(XmlNodeType.Element, "Person", null);
          foreach (XmlNode child in actorNode.ChildNodes)
          {
              personElement.AppendChild(seriesDoc.ImportNode(child, true));
          }

          //need to add the type
          var typeElement = seriesDoc.CreateNode(XmlNodeType.Element, "Type", null);
          typeElement.InnerText = PersonType.Actor;
          personElement.AppendChild(typeElement);

          personsContainer.AppendChild(personElement);
      }
  }
  /// <summary>
  /// The en-US culture, created once per provider instance.
  /// NOTE(review): not referenced anywhere in the visible part of this class; presumably used by derived providers - confirm before removing.
  /// </summary>
  protected readonly CultureInfo UsCulture = new CultureInfo("en-US");
  /// <summary>
  /// Checks whether the item already has a local series metadata file.
  /// </summary>
  /// <param name="item">The item.</param>
  /// <returns><c>true</c> if the item's resolve args contain a meta file named <see cref="LocalMetaFileName" />; otherwise, <c>false</c>.</returns>
  private bool HasLocalMeta(BaseItem item)
  {
      var resolveArgs = item.ResolveArgs;
      return resolveArgs.ContainsMetaFileByName(LocalMetaFileName);
  }
  /// <summary>
  /// Returns the TheTVDB id of the item, searching by name when the item has none stored.
  /// </summary>
  /// <param name="item">The item.</param>
  /// <param name="cancellationToken">The cancellation token.</param>
  /// <returns>The stored or discovered series id; the search result may be <c>null</c>.</returns>
  private async Task<string> GetSeriesId(BaseItem item, CancellationToken cancellationToken)
  {
      var knownId = item.GetProviderId(MetadataProviders.Tvdb);
      if (!string.IsNullOrEmpty(knownId))
      {
          return knownId;
      }

      // Nothing stored on the item: fall back to a name search.
      return await FindSeries(item.Name, cancellationToken).ConfigureAwait(false);
  }
  /// <summary>
  /// Searches TheTVDB for a series by name and returns the id of the first result whose
  /// comparable name equals the comparable form of the requested name.
  /// </summary>
  /// <param name="name">The series name to search for.</param>
  /// <param name="cancellationToken">The cancellation token.</param>
  /// <returns>The matching series id, or <c>null</c> when no result matches.</returns>
  public async Task<string> FindSeries(string name, CancellationToken cancellationToken)
  {
      //nope - search for it
      var searchUrl = string.Format(RootUrl + SeriesQuery, WebUtility.UrlEncode(name));
      var requestOptions = new HttpRequestOptions
      {
          Url = searchUrl,
          ResourcePool = TvDbResourcePool,
          CancellationToken = cancellationToken
      };

      var searchResult = new XmlDocument();
      using (var responseStream = await HttpClient.Get(requestOptions).ConfigureAwait(false))
      {
          searchResult.Load(responseStream);
      }

      if (searchResult.HasChildNodes)
      {
          var candidates = searchResult.SelectNodes("//Series");
          var comparableName = GetComparableName(name);

          if (candidates != null)
          {
              foreach (XmlNode candidate in candidates)
              {
                  var titleNode = candidate.SelectSingleNode("./SeriesName");
                  if (titleNode == null)
                  {
                      continue;
                  }

                  if (GetComparableName(titleNode.InnerText) != comparableName)
                  {
                      Logger.Info("TVDb Provider - " + titleNode.InnerText + " did not match " + comparableName);
                      continue;
                  }

                  // A name match without an id is skipped; later results are still examined.
                  var idNode = candidate.SelectSingleNode("./seriesid");
                  if (idNode != null)
                  {
                      return idNode.InnerText;
                  }
              }
          }
      }

      Logger.Info("TVDb Provider - Could not find " + name + ". Check name on Thetvdb.org.");
      return null;
  }
  /// <summary>
  /// Characters that are dropped entirely when building a comparable name.
  /// </summary>
  const string remove = "\"'!`?";
  /// <summary>
  /// Characters that are replaced by a space when building a comparable name.
  /// The list contains both the ASCII hyphen-minus and the en dash; they look alike but are different characters.
  /// </summary>
  const string spacers = "/,.:;\\(){}[]+-_=–*";
  /// <summary>
  /// Reduces a series name to a normalized form so that names differing only in case,
  /// accents, punctuation, "the" or spacing compare equal.
  /// </summary>
  /// <param name="name">The name; must not be null.</param>
  /// <returns>The lower-cased, accent- and punctuation-stripped name with single spaces and no surrounding whitespace.</returns>
  internal static string GetComparableName(string name)
  {
      // Invariant casing keeps the result independent of the server culture (e.g. Turkish 'I').
      name = name.ToLowerInvariant();

      // Compatibility decomposition splits accented letters into base letter + combining mark.
      name = name.Normalize(NormalizationForm.FormKD);

      var sb = new StringBuilder(name.Length);
      foreach (var c in name)
      {
          if ((int)c >= 0x2B0 && (int)c <= 0x0333)
          {
              // skip char modifier and diacritics (U+02B0 through U+0333)
          }
          else if (remove.IndexOf(c) > -1)
          {
              // skip chars we are removing
          }
          else if (spacers.IndexOf(c) > -1)
          {
              sb.Append(" ");
          }
          else if (c == '&')
          {
              sb.Append(" and ");
          }
          else
          {
              sb.Append(c);
          }
      }

      name = sb.ToString();

      // ',' is one of the spacers and has already become a space, so this pattern cannot match
      // here; the call is kept unchanged for parity with the original behavior.
      name = name.Replace(", the", "");
      name = name.Replace("the ", " ");
      name = name.Replace(" the ", " ");

      // Collapse every run of spaces into a single space.
      while (name.Contains("  "))
      {
          name = name.Replace("  ", " ");
      }

      return name.Trim();
  }
  /// <summary>
  /// Releases the resources held by this provider.
  /// </summary>
  public void Dispose()
  {
      Dispose(true);

      // The class is not sealed and exposes a virtual Dispose(bool); suppress finalization so a
      // derived type that adds a finalizer is not finalized again after an explicit dispose.
      GC.SuppressFinalize(this);
  }
  556. }
  557. }