mirror of
https://github.com/ytdl-org/youtube-dl.git
synced 2025-07-05 09:56:20 +00:00
[iqm2] Merge with jwplatform changes
This commit is contained in:
commit
9f11769f17
8
.github/ISSUE_TEMPLATE.md
vendored
8
.github/ISSUE_TEMPLATE.md
vendored
@ -6,8 +6,8 @@
|
|||||||
|
|
||||||
---
|
---
|
||||||
|
|
||||||
### Make sure you are using the *latest* version: run `youtube-dl --version` and ensure your version is *2016.10.02*. If it's not read [this FAQ entry](https://github.com/rg3/youtube-dl/blob/master/README.md#how-do-i-update-youtube-dl) and update. Issues with outdated version will be rejected.
|
### Make sure you are using the *latest* version: run `youtube-dl --version` and ensure your version is *2017.03.05*. If it's not read [this FAQ entry](https://github.com/rg3/youtube-dl/blob/master/README.md#how-do-i-update-youtube-dl) and update. Issues with outdated version will be rejected.
|
||||||
- [ ] I've **verified** and **I assure** that I'm running youtube-dl **2016.10.02**
|
- [ ] I've **verified** and **I assure** that I'm running youtube-dl **2017.03.05**
|
||||||
|
|
||||||
### Before submitting an *issue* make sure you have:
|
### Before submitting an *issue* make sure you have:
|
||||||
- [ ] At least skimmed through [README](https://github.com/rg3/youtube-dl/blob/master/README.md) and **most notably** [FAQ](https://github.com/rg3/youtube-dl#faq) and [BUGS](https://github.com/rg3/youtube-dl#bugs) sections
|
- [ ] At least skimmed through [README](https://github.com/rg3/youtube-dl/blob/master/README.md) and **most notably** [FAQ](https://github.com/rg3/youtube-dl#faq) and [BUGS](https://github.com/rg3/youtube-dl#bugs) sections
|
||||||
@ -35,7 +35,7 @@ $ youtube-dl -v <your command line>
|
|||||||
[debug] User config: []
|
[debug] User config: []
|
||||||
[debug] Command-line args: [u'-v', u'http://www.youtube.com/watch?v=BaW_jenozKcj']
|
[debug] Command-line args: [u'-v', u'http://www.youtube.com/watch?v=BaW_jenozKcj']
|
||||||
[debug] Encodings: locale cp1251, fs mbcs, out cp866, pref cp1251
|
[debug] Encodings: locale cp1251, fs mbcs, out cp866, pref cp1251
|
||||||
[debug] youtube-dl version 2016.10.02
|
[debug] youtube-dl version 2017.03.05
|
||||||
[debug] Python version 2.7.11 - Windows-2003Server-5.2.3790-SP2
|
[debug] Python version 2.7.11 - Windows-2003Server-5.2.3790-SP2
|
||||||
[debug] exe versions: ffmpeg N-75573-g1d0487f, ffprobe N-75573-g1d0487f, rtmpdump 2.4
|
[debug] exe versions: ffmpeg N-75573-g1d0487f, ffprobe N-75573-g1d0487f, rtmpdump 2.4
|
||||||
[debug] Proxy map: {}
|
[debug] Proxy map: {}
|
||||||
@ -50,6 +50,8 @@ $ youtube-dl -v <your command line>
|
|||||||
- Single video: https://youtu.be/BaW_jenozKc
|
- Single video: https://youtu.be/BaW_jenozKc
|
||||||
- Playlist: https://www.youtube.com/playlist?list=PL4lCao7KL_QFVb7Iudeipvc2BCavECqzc
|
- Playlist: https://www.youtube.com/playlist?list=PL4lCao7KL_QFVb7Iudeipvc2BCavECqzc
|
||||||
|
|
||||||
|
Note that **youtube-dl does not support sites dedicated to [copyright infringement](https://github.com/rg3/youtube-dl#can-you-add-support-for-this-anime-video-site-or-site-which-shows-current-movies-for-free)**. In order for site support request to be accepted all provided example URLs should not violate any copyrights.
|
||||||
|
|
||||||
---
|
---
|
||||||
|
|
||||||
### Description of your *issue*, suggested solution and other information
|
### Description of your *issue*, suggested solution and other information
|
||||||
|
2
.github/ISSUE_TEMPLATE_tmpl.md
vendored
2
.github/ISSUE_TEMPLATE_tmpl.md
vendored
@ -50,6 +50,8 @@ $ youtube-dl -v <your command line>
|
|||||||
- Single video: https://youtu.be/BaW_jenozKc
|
- Single video: https://youtu.be/BaW_jenozKc
|
||||||
- Playlist: https://www.youtube.com/playlist?list=PL4lCao7KL_QFVb7Iudeipvc2BCavECqzc
|
- Playlist: https://www.youtube.com/playlist?list=PL4lCao7KL_QFVb7Iudeipvc2BCavECqzc
|
||||||
|
|
||||||
|
Note that **youtube-dl does not support sites dedicated to [copyright infringement](https://github.com/rg3/youtube-dl#can-you-add-support-for-this-anime-video-site-or-site-which-shows-current-movies-for-free)**. In order for site support request to be accepted all provided example URLs should not violate any copyrights.
|
||||||
|
|
||||||
---
|
---
|
||||||
|
|
||||||
### Description of your *issue*, suggested solution and other information
|
### Description of your *issue*, suggested solution and other information
|
||||||
|
4
.gitignore
vendored
4
.gitignore
vendored
@ -30,6 +30,10 @@ updates_key.pem
|
|||||||
*.m4v
|
*.m4v
|
||||||
*.mp3
|
*.mp3
|
||||||
*.3gp
|
*.3gp
|
||||||
|
*.wav
|
||||||
|
*.ape
|
||||||
|
*.mkv
|
||||||
|
*.swf
|
||||||
*.part
|
*.part
|
||||||
*.swp
|
*.swp
|
||||||
test/testdata
|
test/testdata
|
||||||
|
@ -6,8 +6,12 @@ python:
|
|||||||
- "3.3"
|
- "3.3"
|
||||||
- "3.4"
|
- "3.4"
|
||||||
- "3.5"
|
- "3.5"
|
||||||
|
- "3.6"
|
||||||
sudo: false
|
sudo: false
|
||||||
script: nosetests test --verbose
|
env:
|
||||||
|
- YTDL_TEST_SET=core
|
||||||
|
- YTDL_TEST_SET=download
|
||||||
|
script: ./devscripts/run_tests.sh
|
||||||
notifications:
|
notifications:
|
||||||
email:
|
email:
|
||||||
- filippo.valsorda@gmail.com
|
- filippo.valsorda@gmail.com
|
||||||
|
22
AUTHORS
22
AUTHORS
@ -185,3 +185,25 @@ Aleksander Nitecki
|
|||||||
Sebastian Blunt
|
Sebastian Blunt
|
||||||
Matěj Cepl
|
Matěj Cepl
|
||||||
Xie Yanbo
|
Xie Yanbo
|
||||||
|
Philip Xu
|
||||||
|
John Hawkinson
|
||||||
|
Rich Leeper
|
||||||
|
Zhong Jianxin
|
||||||
|
Thor77
|
||||||
|
Mattias Wadman
|
||||||
|
Arjan Verwer
|
||||||
|
Costy Petrisor
|
||||||
|
Logan B
|
||||||
|
Alex Seiler
|
||||||
|
Vijay Singh
|
||||||
|
Paul Hartmann
|
||||||
|
Stephen Chen
|
||||||
|
Fabian Stahl
|
||||||
|
Bagira
|
||||||
|
Odd Stråbø
|
||||||
|
Philip Herzog
|
||||||
|
Thomas Christlieb
|
||||||
|
Marek Rusinowski
|
||||||
|
Tobias Gruetzmacher
|
||||||
|
Olivier Bilodeau
|
||||||
|
Lars Vierbergen
|
||||||
|
@ -12,7 +12,7 @@ $ youtube-dl -v <your command line>
|
|||||||
[debug] Proxy map: {}
|
[debug] Proxy map: {}
|
||||||
...
|
...
|
||||||
```
|
```
|
||||||
**Do not post screenshots of verbose log only plain text is acceptable.**
|
**Do not post screenshots of verbose logs; only plain text is acceptable.**
|
||||||
|
|
||||||
The output (including the first lines) contains important debugging information. Issues without the full output are often not reproducible and therefore do not get solved in short order, if ever.
|
The output (including the first lines) contains important debugging information. Issues without the full output are often not reproducible and therefore do not get solved in short order, if ever.
|
||||||
|
|
||||||
@ -66,7 +66,7 @@ Only post features that you (or an incapacitated friend you can personally talk
|
|||||||
|
|
||||||
### Is your question about youtube-dl?
|
### Is your question about youtube-dl?
|
||||||
|
|
||||||
It may sound strange, but some bug reports we receive are completely unrelated to youtube-dl and relate to a different or even the reporter's own application. Please make sure that you are actually using youtube-dl. If you are using a UI for youtube-dl, report the bug to the maintainer of the actual application providing the UI. On the other hand, if your UI for youtube-dl fails in some way you believe is related to youtube-dl, by all means, go ahead and report the bug.
|
It may sound strange, but some bug reports we receive are completely unrelated to youtube-dl and relate to a different, or even the reporter's own, application. Please make sure that you are actually using youtube-dl. If you are using a UI for youtube-dl, report the bug to the maintainer of the actual application providing the UI. On the other hand, if your UI for youtube-dl fails in some way you believe is related to youtube-dl, by all means, go ahead and report the bug.
|
||||||
|
|
||||||
# DEVELOPER INSTRUCTIONS
|
# DEVELOPER INSTRUCTIONS
|
||||||
|
|
||||||
@ -85,16 +85,16 @@ To run the test, simply invoke your favorite test runner, or execute a test file
|
|||||||
If you want to create a build of youtube-dl yourself, you'll need
|
If you want to create a build of youtube-dl yourself, you'll need
|
||||||
|
|
||||||
* python
|
* python
|
||||||
* make (both GNU make and BSD make are supported)
|
* make (only GNU make is supported)
|
||||||
* pandoc
|
* pandoc
|
||||||
* zip
|
* zip
|
||||||
* nosetests
|
* nosetests
|
||||||
|
|
||||||
### Adding support for a new site
|
### Adding support for a new site
|
||||||
|
|
||||||
If you want to add support for a new site, first of all **make sure** this site is **not dedicated to [copyright infringement](#can-you-add-support-for-this-anime-video-site-or-site-which-shows-current-movies-for-free)**. youtube-dl does **not support** such sites thus pull requests adding support for them **will be rejected**.
|
If you want to add support for a new site, first of all **make sure** this site is **not dedicated to [copyright infringement](README.md#can-you-add-support-for-this-anime-video-site-or-site-which-shows-current-movies-for-free)**. youtube-dl does **not support** such sites thus pull requests adding support for them **will be rejected**.
|
||||||
|
|
||||||
After you have ensured this site is distributing it's content legally, you can follow this quick list (assuming your service is called `yourextractor`):
|
After you have ensured this site is distributing its content legally, you can follow this quick list (assuming your service is called `yourextractor`):
|
||||||
|
|
||||||
1. [Fork this repository](https://github.com/rg3/youtube-dl/fork)
|
1. [Fork this repository](https://github.com/rg3/youtube-dl/fork)
|
||||||
2. Check out the source code with:
|
2. Check out the source code with:
|
||||||
@ -124,7 +124,7 @@ After you have ensured this site is distributing it's content legally, you can f
|
|||||||
'id': '42',
|
'id': '42',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Video title goes here',
|
'title': 'Video title goes here',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
# TODO more properties, either as:
|
# TODO more properties, either as:
|
||||||
# * A value
|
# * A value
|
||||||
# * MD5 checksum; start the string with md5:
|
# * MD5 checksum; start the string with md5:
|
||||||
@ -167,19 +167,19 @@ In any case, thank you very much for your contributions!
|
|||||||
|
|
||||||
This section introduces a guide lines for writing idiomatic, robust and future-proof extractor code.
|
This section introduces a guide lines for writing idiomatic, robust and future-proof extractor code.
|
||||||
|
|
||||||
Extractors are very fragile by nature since they depend on the layout of the source data provided by 3rd party media hoster out of your control and this layout tend to change. As an extractor implementer your task is not only to write code that will extract media links and metadata correctly but also to minimize code dependency on source's layout changes and even to make the code foresee potential future changes and be ready for that. This is important because it will allow extractor not to break on minor layout changes thus keeping old youtube-dl versions working. Even though this breakage issue is easily fixed by emitting a new version of youtube-dl with fix incorporated all the previous version become broken in all repositories and distros' packages that may not be so prompt in fetching the update from us. Needless to say some may never receive an update at all that is possible for non rolling release distros.
|
Extractors are very fragile by nature since they depend on the layout of the source data provided by 3rd party media hosters out of your control and this layout tends to change. As an extractor implementer your task is not only to write code that will extract media links and metadata correctly but also to minimize dependency on the source's layout and even to make the code foresee potential future changes and be ready for that. This is important because it will allow the extractor not to break on minor layout changes thus keeping old youtube-dl versions working. Even though this breakage issue is easily fixed by emitting a new version of youtube-dl with a fix incorporated, all the previous versions become broken in all repositories and distros' packages that may not be so prompt in fetching the update from us. Needless to say, some non rolling release distros may never receive an update at all.
|
||||||
|
|
||||||
### Mandatory and optional metafields
|
### Mandatory and optional metafields
|
||||||
|
|
||||||
For extraction to work youtube-dl relies on metadata your extractor extracts and provides to youtube-dl expressed by [information dictionary](https://github.com/rg3/youtube-dl/blob/master/youtube_dl/extractor/common.py#L75-L257) or simply *info dict*. Only the following meta fields in *info dict* are considered mandatory for successful extraction process by youtube-dl:
|
For extraction to work youtube-dl relies on metadata your extractor extracts and provides to youtube-dl expressed by an [information dictionary](https://github.com/rg3/youtube-dl/blob/master/youtube_dl/extractor/common.py#L75-L257) or simply *info dict*. Only the following meta fields in the *info dict* are considered mandatory for a successful extraction process by youtube-dl:
|
||||||
|
|
||||||
- `id` (media identifier)
|
- `id` (media identifier)
|
||||||
- `title` (media title)
|
- `title` (media title)
|
||||||
- `url` (media download URL) or `formats`
|
- `url` (media download URL) or `formats`
|
||||||
|
|
||||||
In fact only the last option is technically mandatory (i.e. if you can't figure out the download location of the media the extraction does not make any sense). But by convention youtube-dl also treats `id` and `title` to be mandatory. Thus aforementioned metafields are the critical data the extraction does not make any sense without and if any of them fail to be extracted then extractor is considered completely broken.
|
In fact only the last option is technically mandatory (i.e. if you can't figure out the download location of the media the extraction does not make any sense). But by convention youtube-dl also treats `id` and `title` as mandatory. Thus the aforementioned metafields are the critical data that the extraction does not make any sense without and if any of them fail to be extracted then the extractor is considered completely broken.
|
||||||
|
|
||||||
[Any field](https://github.com/rg3/youtube-dl/blob/master/youtube_dl/extractor/common.py#L149-L257) apart from the aforementioned ones are considered **optional**. That means that extraction should be **tolerate** to situations when sources for these fields can potentially be unavailable (even if they are always available at the moment) and **future-proof** in order not to break the extraction of general purpose mandatory fields.
|
[Any field](https://github.com/rg3/youtube-dl/blob/master/youtube_dl/extractor/common.py#L149-L257) apart from the aforementioned ones are considered **optional**. That means that extraction should be **tolerant** to situations when sources for these fields can potentially be unavailable (even if they are always available at the moment) and **future-proof** in order not to break the extraction of general purpose mandatory fields.
|
||||||
|
|
||||||
#### Example
|
#### Example
|
||||||
|
|
||||||
@ -199,7 +199,7 @@ Assume at this point `meta`'s layout is:
|
|||||||
}
|
}
|
||||||
```
|
```
|
||||||
|
|
||||||
Assume you want to extract `summary` and put into resulting info dict as `description`. Since `description` is optional metafield you should be ready that this key may be missing from the `meta` dict, so that you should extract it like:
|
Assume you want to extract `summary` and put it into the resulting info dict as `description`. Since `description` is an optional meta field you should be ready that this key may be missing from the `meta` dict, so that you should extract it like:
|
||||||
|
|
||||||
```python
|
```python
|
||||||
description = meta.get('summary') # correct
|
description = meta.get('summary') # correct
|
||||||
@ -211,7 +211,7 @@ and not like:
|
|||||||
description = meta['summary'] # incorrect
|
description = meta['summary'] # incorrect
|
||||||
```
|
```
|
||||||
|
|
||||||
The latter will break extraction process with `KeyError` if `summary` disappears from `meta` at some time later but with former approach extraction will just go ahead with `description` set to `None` that is perfectly fine (remember `None` is equivalent for absence of data).
|
The latter will break extraction process with `KeyError` if `summary` disappears from `meta` at some later time but with the former approach extraction will just go ahead with `description` set to `None` which is perfectly fine (remember `None` is equivalent to the absence of data).
|
||||||
|
|
||||||
Similarly, you should pass `fatal=False` when extracting optional data from a webpage with `_search_regex`, `_html_search_regex` or similar methods, for instance:
|
Similarly, you should pass `fatal=False` when extracting optional data from a webpage with `_search_regex`, `_html_search_regex` or similar methods, for instance:
|
||||||
|
|
||||||
@ -231,21 +231,21 @@ description = self._search_regex(
|
|||||||
webpage, 'description', default=None)
|
webpage, 'description', default=None)
|
||||||
```
|
```
|
||||||
|
|
||||||
On failure this code will silently continue the extraction with `description` set to `None`. That is useful for metafields that are known to may or may not be present.
|
On failure this code will silently continue the extraction with `description` set to `None`. That is useful for metafields that may or may not be present.
|
||||||
|
|
||||||
### Provide fallbacks
|
### Provide fallbacks
|
||||||
|
|
||||||
When extracting metadata try to provide several scenarios for that. For example if `title` is present in several places/sources try extracting from at least some of them. This would make it more future-proof in case some of the sources became unavailable.
|
When extracting metadata try to do so from multiple sources. For example if `title` is present in several places, try extracting from at least some of them. This makes it more future-proof in case some of the sources become unavailable.
|
||||||
|
|
||||||
#### Example
|
#### Example
|
||||||
|
|
||||||
Say `meta` from previous example has a `title` and you are about to extract it. Since `title` is mandatory meta field you should end up with something like:
|
Say `meta` from the previous example has a `title` and you are about to extract it. Since `title` is a mandatory meta field you should end up with something like:
|
||||||
|
|
||||||
```python
|
```python
|
||||||
title = meta['title']
|
title = meta['title']
|
||||||
```
|
```
|
||||||
|
|
||||||
If `title` disappeares from `meta` in future due to some changes on hoster's side the extraction would fail since `title` is mandatory. That's expected.
|
If `title` disappears from `meta` in future due to some changes on the hoster's side the extraction would fail since `title` is mandatory. That's expected.
|
||||||
|
|
||||||
Assume that you have some another source you can extract `title` from, for example `og:title` HTML meta of a `webpage`. In this case you can provide a fallback scenario:
|
Assume that you have some another source you can extract `title` from, for example `og:title` HTML meta of a `webpage`. In this case you can provide a fallback scenario:
|
||||||
|
|
||||||
@ -282,7 +282,7 @@ title = self._search_regex(
|
|||||||
webpage, 'title', group='title')
|
webpage, 'title', group='title')
|
||||||
```
|
```
|
||||||
|
|
||||||
Note how you tolerate potential changes in `style` attribute's value or switch from using double quotes to single for `class` attribute:
|
Note how you tolerate potential changes in the `style` attribute's value or switch from using double quotes to single for `class` attribute:
|
||||||
|
|
||||||
The code definitely should not look like:
|
The code definitely should not look like:
|
||||||
|
|
||||||
|
884
ChangeLog
884
ChangeLog
@ -1,3 +1,887 @@
|
|||||||
|
version 2017.03.05
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [twitch] Add basic support for two-factor authentication (#11974)
|
||||||
|
+ [vier] Add support for vijf.be (#12304)
|
||||||
|
+ [redbulltv] Add support for redbull.tv (#3919, #11948)
|
||||||
|
* [douyutv] Switch to the PC API to escape the 5-min limitation (#12316)
|
||||||
|
+ [generic] Add support for rutube embeds
|
||||||
|
+ [rutube] Relax URL regular expression
|
||||||
|
+ [vrak] Add support for vrak.tv (#11452)
|
||||||
|
+ [brightcove:new] Add ability to smuggle geo_countries into URL
|
||||||
|
+ [brightcove:new] Raise GeoRestrictedError
|
||||||
|
* [go] Relax URL regular expression (#12341)
|
||||||
|
* [24video] Use original host for requests (#12339)
|
||||||
|
* [ruutu] Disable DASH formats (#12322)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.03.02
|
||||||
|
|
||||||
|
Core
|
||||||
|
+ [adobepass] Add support for Charter Spectrum (#11465)
|
||||||
|
* [YoutubeDL] Don't sanitize identifiers in output template (#12317)
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [facebook] Fix extraction (#12323, #12330)
|
||||||
|
* [youtube] Mark errors about rental videos as expected (#12324)
|
||||||
|
+ [npo] Add support for audio
|
||||||
|
* [npo] Adapt to app.php API (#12311, #12320)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.02.28
|
||||||
|
|
||||||
|
Core
|
||||||
|
+ [utils] Add bytes_to_long and long_to_bytes
|
||||||
|
+ [utils] Add pkcs1pad
|
||||||
|
+ [aes] Add aes_cbc_encrypt
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [azmedien:showplaylist] Add support for show playlists (#12160)
|
||||||
|
+ [youtube:playlist] Recognize another playlist pattern (#11928, #12286)
|
||||||
|
+ [daisuki] Add support for daisuki.net (#2486, #3186, #4738, #6175, #7776,
|
||||||
|
#10060)
|
||||||
|
* [douyu] Fix extraction (#12301)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.02.27
|
||||||
|
|
||||||
|
Core
|
||||||
|
* [downloader/common] Limit displaying 2 digits after decimal point in sleep
|
||||||
|
interval message (#12183)
|
||||||
|
+ [extractor/common] Add preference to _parse_html5_media_entries
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [npo] Add support for zapp.nl
|
||||||
|
+ [npo] Add support for hetklokhuis.nl (#12293)
|
||||||
|
- [scivee] Remove extractor (#9315)
|
||||||
|
+ [cda] Decode download URL (#12255)
|
||||||
|
+ [crunchyroll] Improve uploader extraction (#12267)
|
||||||
|
+ [youtube] Raise GeoRestrictedError
|
||||||
|
+ [dailymotion] Raise GeoRestrictedError
|
||||||
|
+ [mdr] Recognize more URL patterns (#12169)
|
||||||
|
+ [tvigle] Raise GeoRestrictedError
|
||||||
|
* [vevo] Fix extraction for videos with the new streams/streamsV3 format
|
||||||
|
(#11719)
|
||||||
|
+ [freshlive] Add support for freshlive.tv (#12175)
|
||||||
|
+ [xhamster] Capture and output videoClosed error (#12263)
|
||||||
|
+ [etonline] Add support for etonline.com (#12236)
|
||||||
|
+ [njpwworld] Add support for njpwworld.com (#11561)
|
||||||
|
* [amcnetworks] Relax URL regular expression (#12127)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.02.24.1
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [noco] Modernize
|
||||||
|
* [noco] Switch login URL to https (#12246)
|
||||||
|
+ [thescene] Extract more metadata
|
||||||
|
* [thescene] Fix extraction (#12235)
|
||||||
|
+ [tubitv] Use geo bypass mechanism
|
||||||
|
* [openload] Fix extraction (#10408)
|
||||||
|
+ [ivi] Raise GeoRestrictedError
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.02.24
|
||||||
|
|
||||||
|
Core
|
||||||
|
* [options] Hide deprecated options from --help
|
||||||
|
* [options] Deprecate --autonumber-size
|
||||||
|
+ [YoutubeDL] Add support for string formatting operations in output template
|
||||||
|
(#5185, #5748, #6841, #9929, #9966 #9978, #12189)
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [lynda:course] Add webpage extraction fallback (#12238)
|
||||||
|
* [go] Sign all uplynk URLs and use geo bypass only for free videos
|
||||||
|
(#12087, #12210)
|
||||||
|
+ [skylinewebcams] Add support for skylinewebcams.com (#12221)
|
||||||
|
+ [instagram] Add support for multi video posts (#12226)
|
||||||
|
+ [crunchyroll] Extract playlist entries ids
|
||||||
|
* [mgtv] Fix extraction
|
||||||
|
+ [sohu] Raise GeoRestrictedError
|
||||||
|
+ [leeco] Raise GeoRestrictedError and use geo bypass mechanism
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.02.22
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [crunchyroll] Fix descriptions with double quotes (#12124)
|
||||||
|
* [dailymotion] Make comment count optional (#12209)
|
||||||
|
+ [vidzi] Add support for vidzi.cc (#12213)
|
||||||
|
+ [24video] Add support for 24video.tube (#12217)
|
||||||
|
+ [crackle] Use geo bypass mechanism
|
||||||
|
+ [viewster] Use geo verification headers
|
||||||
|
+ [tfo] Improve geo restriction detection and use geo bypass mechanism
|
||||||
|
+ [telequebec] Use geo bypass mechanism
|
||||||
|
+ [limelight] Extract PlaylistService errors and improve geo restriction
|
||||||
|
detection
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.02.21
|
||||||
|
|
||||||
|
Core
|
||||||
|
* [extractor/common] Allow calling _initialize_geo_bypass from extractors
|
||||||
|
(#11970)
|
||||||
|
+ [adobepass] Add support for Time Warner Cable (#12191)
|
||||||
|
+ [travis] Run tests in parallel
|
||||||
|
+ [downloader/ism] Honor HTTP headers when downloading fragments
|
||||||
|
+ [downloader/dash] Honor HTTP headers when downloading fragments
|
||||||
|
+ [utils] Add GeoUtils class for working with geo tools and GeoUtils.random_ipv4
|
||||||
|
+ Add option --geo-bypass-country for explicit geo bypass on behalf of
|
||||||
|
specified country
|
||||||
|
+ Add options to control geo bypass mechanism --geo-bypass and --no-geo-bypass
|
||||||
|
+ Add experimental geo restriction bypass mechanism based on faking
|
||||||
|
X-Forwarded-For HTTP header
|
||||||
|
+ [utils] Introduce GeoRestrictedError for geo restricted videos
|
||||||
|
+ [utils] Introduce YoutubeDLError base class for all youtube-dl exceptions
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [ninecninemedia] Use geo bypass mechanism
|
||||||
|
* [spankbang] Make uploader optional (#12193)
|
||||||
|
+ [iprima] Improve geo restriction detection and disable geo bypass
|
||||||
|
* [iprima] Modernize
|
||||||
|
* [commonmistakes] Disable UnicodeBOM extractor test for python 3.2
|
||||||
|
+ [prosiebensat1] Throw ExtractionError on unsupported page type (#12180)
|
||||||
|
* [nrk] Update _API_HOST and relax _VALID_URL
|
||||||
|
+ [tv4] Bypass geo restriction and improve detection
|
||||||
|
* [tv4] Switch to hls3 protocol (#12177)
|
||||||
|
+ [viki] Improve geo restriction detection
|
||||||
|
+ [vgtv] Improve geo restriction detection
|
||||||
|
+ [srgssr] Improve geo restriction detection
|
||||||
|
+ [vbox7] Improve geo restriction detection and use geo bypass mechanism
|
||||||
|
+ [svt] Improve geo restriction detection and use geo bypass mechanism
|
||||||
|
+ [pbs] Improve geo restriction detection and use geo bypass mechanism
|
||||||
|
+ [ondemandkorea] Improve geo restriction detection and use geo bypass mechanism
|
||||||
|
+ [nrk] Improve geo restriction detection and use geo bypass mechanism
|
||||||
|
+ [itv] Improve geo restriction detection and use geo bypass mechanism
|
||||||
|
+ [go] Improve geo restriction detection and use geo bypass mechanism
|
||||||
|
+ [dramafever] Improve geo restriction detection and use geo bypass mechanism
|
||||||
|
* [brightcove:legacy] Restrict videoPlayer value (#12040)
|
||||||
|
+ [tvn24] Add support for tvn24.pl and tvn24bis.pl (#11679)
|
||||||
|
+ [thisav] Add support for HTML5 media (#11771)
|
||||||
|
* [metacafe] Bypass family filter (#10371)
|
||||||
|
* [viceland] Improve info extraction
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.02.17
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [heise] Improve extraction (#9725)
|
||||||
|
* [ellentv] Improve (#11653)
|
||||||
|
* [openload] Fix extraction (#10408, #12002)
|
||||||
|
+ [theplatform] Recognize URLs with whitespaces (#12044)
|
||||||
|
* [einthusan] Relax URL regular expression (#12141, #12159)
|
||||||
|
+ [generic] Support complex JWPlayer embedded videos (#12030)
|
||||||
|
* [elpais] Improve extraction (#12139)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.02.16
|
||||||
|
|
||||||
|
Core
|
||||||
|
+ [utils] Add support for quoted string literals in --match-filter (#8050,
|
||||||
|
#12142, #12144)
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [ceskatelevize] Lower priority for audio description sources (#12119)
|
||||||
|
* [amcnetworks] Fix extraction (#12127)
|
||||||
|
* [pinkbike] Fix uploader extraction (#12054)
|
||||||
|
+ [onetpl] Add support for businessinsider.com.pl and plejada.pl
|
||||||
|
+ [onetpl] Add support for onet.pl (#10507)
|
||||||
|
+ [onetmvp] Add shortcut extractor
|
||||||
|
+ [vodpl] Add support for vod.pl (#12122)
|
||||||
|
+ [pornhub] Extract video URL from tv platform site (#12007, #12129)
|
||||||
|
+ [ceskatelevize] Extract DASH formats (#12119, #12133)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.02.14
|
||||||
|
|
||||||
|
Core
|
||||||
|
* TypeError is fixed with Python 2.7.13 on Windows (#11540, #12085)
|
||||||
|
|
||||||
|
Extractor
|
||||||
|
* [zdf] Fix extraction (#12117)
|
||||||
|
* [xtube] Fix extraction for both kinds of video id (#12088)
|
||||||
|
* [xtube] Improve title extraction (#12088)
|
||||||
|
+ [lemonde] Fallback delegate extraction to generic extractor (#12115, #12116)
|
||||||
|
* [bellmedia] Allow video id longer than 6 characters (#12114)
|
||||||
|
+ [limelight] Add support for referer protected videos
|
||||||
|
* [disney] Improve extraction (#4975, #11000, #11882, #11936)
|
||||||
|
* [hotstar] Improve extraction (#12096)
|
||||||
|
* [einthusan] Fix extraction (#11416)
|
||||||
|
+ [aenetworks] Add support for lifetimemovieclub.com (#12097)
|
||||||
|
* [youtube] Fix parsing codecs (#12091)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.02.11
|
||||||
|
|
||||||
|
Core
|
||||||
|
+ [utils] Introduce get_elements_by_class and get_elements_by_attribute
|
||||||
|
utility functions
|
||||||
|
+ [extractor/common] Skip m3u8 manifests protected with Adobe Flash Access
|
||||||
|
|
||||||
|
Extractor
|
||||||
|
* [pluralsight:course] Fix extraction (#12075)
|
||||||
|
+ [bbc] Extract m3u8 formats with 320k audio
|
||||||
|
* [facebook] Relax video id matching (#11017, #12055, #12056)
|
||||||
|
+ [corus] Add support for Corus Entertainment sites (#12060, #9164)
|
||||||
|
+ [pluralsight] Detect blocked account error message (#12070)
|
||||||
|
+ [bloomberg] Add another video id pattern (#12062)
|
||||||
|
* [extractor/commonmistakes] Restrict URL regular expression (#12050)
|
||||||
|
+ [tvplayer] Add support for tvplayer.com
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.02.10
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [xtube] Fix extraction (#12023)
|
||||||
|
* [pornhub] Fix extraction (#12007, #12018)
|
||||||
|
* [facebook] Improve JS data regular expression (#12042)
|
||||||
|
* [kaltura] Improve embed partner id extraction (#12041)
|
||||||
|
+ [sprout] Add support for sproutonline.com
|
||||||
|
* [6play] Improve extraction
|
||||||
|
+ [scrippsnetworks:watch] Add support for Scripps Networks sites (#10765)
|
||||||
|
+ [go] Add support for Adobe Pass authentication (#11468, #10831)
|
||||||
|
* [6play] Fix extraction (#12011)
|
||||||
|
+ [nbc] Add support for Adobe Pass authentication (#12006)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.02.07
|
||||||
|
|
||||||
|
Core
|
||||||
|
* [extractor/common] Fix audio only with audio group in m3u8 (#11995)
|
||||||
|
+ [downloader/fragment] Respect --no-part
|
||||||
|
* [extractor/common] Speed-up HTML5 media entries extraction (#11979)
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [pornhub] Fix extraction (#11997)
|
||||||
|
+ [canalplus] Add support for cstar.fr (#11990)
|
||||||
|
+ [extractor/generic] Improve RTMP support (#11993)
|
||||||
|
+ [gaskrank] Add support for gaskrank.tv (#11685)
|
||||||
|
* [bandcamp] Fix extraction for incomplete albums (#11727)
|
||||||
|
* [iwara] Fix extraction (#11781)
|
||||||
|
* [googledrive] Fix extraction on Python 3.6
|
||||||
|
+ [videopress] Add support for videopress.com
|
||||||
|
+ [afreecatv] Extract RTMP formats
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.02.04.1
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [twitch:stream] Add support for player.twitch.tv (#11971)
|
||||||
|
* [radiocanada] Fix extraction for toutv rtmp formats
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.02.04
|
||||||
|
|
||||||
|
Core
|
||||||
|
+ Add --playlist-random to shuffle playlists (#11889, #11901)
|
||||||
|
* [utils] Improve comments processing in js_to_json (#11947)
|
||||||
|
* [utils] Handle single-line comments in js_to_json
|
||||||
|
* [downloader/external:ffmpeg] Minimize the use of aac_adtstoasc filter
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [piksel] Add another app token pattern (#11969)
|
||||||
|
+ [vk] Capture and output author blocked error message (#11965)
|
||||||
|
+ [turner] Fix secure HLS formats downloading with ffmpeg (#11358, #11373,
|
||||||
|
#11800)
|
||||||
|
+ [drtv] Add support for live and radio sections (#1827, #3427)
|
||||||
|
* [myspace] Fix extraction and extract HLS and HTTP formats
|
||||||
|
+ [youtube] Add format info for itag 325 and 328
|
||||||
|
* [vine] Fix extraction (#11955)
|
||||||
|
- [sportbox] Remove extractor (#11954)
|
||||||
|
+ [filmon] Add support for filmon.com (#11187)
|
||||||
|
+ [infoq] Add audio only formats (#11565)
|
||||||
|
* [douyutv] Improve room id regular expression (#11931)
|
||||||
|
* [iprima] Fix extraction (#11920, #11896)
|
||||||
|
* [youtube] Fix ytsearch when cookies are provided (#11924)
|
||||||
|
* [go] Relax video id regular expression (#11937)
|
||||||
|
* [facebook] Fix title extraction (#11941)
|
||||||
|
+ [youtube:playlist] Recognize TL playlists (#11945)
|
||||||
|
+ [bilibili] Support new Bangumi URLs (#11845)
|
||||||
|
+ [cbc:watch] Extract audio codec for audio only formats (#11893)
|
||||||
|
+ [elpais] Fix extraction for some URLs (#11765)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.02.01
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [facebook] Add another fallback extraction scenario (#11926)
|
||||||
|
* [prosiebensat1] Fix extraction of descriptions (#11810, #11929)
|
||||||
|
- [crunchyroll] Remove ScaledBorderAndShadow settings (#9028)
|
||||||
|
+ [vimeo] Extract upload timestamp
|
||||||
|
+ [vimeo] Extract license (#8726, #11880)
|
||||||
|
+ [nrk:series] Add support for series (#11571, #11711)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.01.31
|
||||||
|
|
||||||
|
Core
|
||||||
|
+ [compat] Add compat_etree_register_namespace
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [youtube] Fix extraction for domainless player URLs (#11890, #11891, #11892,
|
||||||
|
#11894, #11895, #11897, #11900, #11903, #11904, #11906, #11907, #11909,
|
||||||
|
#11913, #11914, #11915, #11916, #11917, #11918, #11919)
|
||||||
|
+ [vimeo] Extract both mixed and separated DASH formats
|
||||||
|
+ [ruutu] Extract DASH formats
|
||||||
|
* [itv] Fix extraction for python 2.6
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.01.29
|
||||||
|
|
||||||
|
Core
|
||||||
|
* [extractor/common] Fix initialization template (#11605, #11825)
|
||||||
|
+ [extractor/common] Document fragment_base_url and fragment's path fields
|
||||||
|
* [extractor/common] Fix duration per DASH segment (#11868)
|
||||||
|
+ Introduce --autonumber-start option for initial value of %(autonumber)s
|
||||||
|
template (#727, #2702, #9362, #10457, #10529, #11862)
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [azmedien:playlist] Add support for topic and themen playlists (#11817)
|
||||||
|
* [npo] Fix subtitles extraction
|
||||||
|
+ [itv] Extract subtitles
|
||||||
|
+ [itv] Add support for itv.com (#9240)
|
||||||
|
+ [mtv81] Add support for mtv81.com (#7619)
|
||||||
|
+ [vlive] Add support for channels (#11826)
|
||||||
|
+ [kaltura] Add fallback for fileExt
|
||||||
|
+ [kaltura] Improve uploader_id extraction
|
||||||
|
+ [konserthusetplay] Add support for rspoplay.se (#11828)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.01.28
|
||||||
|
|
||||||
|
Core
|
||||||
|
* [utils] Improve parse_duration
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [crunchyroll] Improve series and season metadata extraction (#11832)
|
||||||
|
* [soundcloud] Improve formats extraction and extract audio bitrate
|
||||||
|
+ [soundcloud] Extract HLS formats
|
||||||
|
* [soundcloud] Fix track URL extraction (#11852)
|
||||||
|
+ [twitch:vod] Expand URL regular expressions (#11846)
|
||||||
|
* [aenetworks] Fix season episodes extraction (#11669)
|
||||||
|
+ [tva] Add support for videos.tva.ca (#11842)
|
||||||
|
* [jamendo] Improve and extract more metadata (#11836)
|
||||||
|
+ [disney] Add support for Disney sites (#7409, #11801, #4975, #11000)
|
||||||
|
* [vevo] Remove request to old API and catch API v2 errors
|
||||||
|
+ [cmt,mtv,southpark] Add support for episode URLs (#11837)
|
||||||
|
+ [youtube] Add fallback for duration extraction (#11841)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.01.25
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [openload] Fallback video extension to mp4
|
||||||
|
+ [extractor/generic] Add support for Openload embeds (#11536, #11812)
|
||||||
|
* [srgssr] Fix rts video extraction (#11831)
|
||||||
|
+ [afreecatv:global] Add support for afreeca.tv (#11807)
|
||||||
|
+ [crackle] Extract vtt subtitles
|
||||||
|
+ [crackle] Extract multiple resolutions for thumbnails
|
||||||
|
+ [crackle] Add support for mobile URLs
|
||||||
|
+ [konserthusetplay] Extract subtitles (#11823)
|
||||||
|
+ [konserthusetplay] Add support for HLS videos (#11823)
|
||||||
|
* [vimeo:review] Fix config URL extraction (#11821)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.01.24
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [pluralsight] Fix extraction (#11820)
|
||||||
|
+ [nextmedia] Add support for NextTV (壹電視)
|
||||||
|
* [24video] Fix extraction (#11811)
|
||||||
|
* [youtube:playlist] Fix nonexistent and private playlist detection (#11604)
|
||||||
|
+ [chirbit] Extract uploader (#11809)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.01.22
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [pornflip] Add support for pornflip.com (#11556, #11795)
|
||||||
|
* [chaturbate] Fix extraction (#11797, #11802)
|
||||||
|
+ [azmedien] Add support for AZ Medien sites (#11784, #11785)
|
||||||
|
+ [nextmedia] Support redirected URLs
|
||||||
|
+ [vimeo:channel] Extract videos' titles for playlist entries (#11796)
|
||||||
|
+ [youtube] Extract episode metadata (#9695, #11774)
|
||||||
|
+ [cspan] Support Ustream embedded videos (#11547)
|
||||||
|
+ [1tv] Add support for HLS videos (#11786)
|
||||||
|
* [uol] Fix extraction (#11770)
|
||||||
|
* [mtv] Relax triforce feed regular expression (#11766)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.01.18
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [bilibili] Fix extraction (#11077)
|
||||||
|
+ [canalplus] Add fallback for video id (#11764)
|
||||||
|
* [20min] Fix extraction (#11683, #11751)
|
||||||
|
* [imdb] Extend URL regular expression (#11744)
|
||||||
|
+ [naver] Add support for tv.naver.com links (#11743)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.01.16
|
||||||
|
|
||||||
|
Core
|
||||||
|
* [options] Apply custom config to final composite configuration (#11741)
|
||||||
|
* [YoutubeDL] Improve protocol auto determining (#11720)
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [xiami] Relax URL regular expressions
|
||||||
|
* [xiami] Improve track metadata extraction (#11699)
|
||||||
|
+ [limelight] Check hand-make direct HTTP links
|
||||||
|
+ [limelight] Add support for direct HTTP links at video.llnw.net (#11737)
|
||||||
|
+ [brightcove] Recognize another player ID pattern (#11688)
|
||||||
|
+ [niconico] Support login via cookies (#7968)
|
||||||
|
* [yourupload] Fix extraction (#11601)
|
||||||
|
+ [beam:live] Add support for beam.pro live streams (#10702, #11596)
|
||||||
|
* [vevo] Improve geo restriction detection
|
||||||
|
+ [dramafever] Add support for URLs with language code (#11714)
|
||||||
|
* [cbc] Improve playlist support (#11704)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.01.14
|
||||||
|
|
||||||
|
Core
|
||||||
|
+ [common] Add ability to customize akamai manifest host
|
||||||
|
+ [utils] Add more date formats
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
- [mtv] Eliminate _transform_rtmp_url
|
||||||
|
* [mtv] Generalize triforce mgid extraction
|
||||||
|
+ [cmt] Add support for full episodes and video clips (#11623)
|
||||||
|
+ [mitele] Extract DASH formats
|
||||||
|
+ [ooyala] Add support for videos with embedToken (#11684)
|
||||||
|
* [mixcloud] Fix extraction (#11674)
|
||||||
|
* [openload] Fix extraction (#10408)
|
||||||
|
* [tv4] Improve extraction (#11698)
|
||||||
|
* [freesound] Fix and improve extraction (#11602)
|
||||||
|
+ [nick] Add support for beta.nick.com (#11655)
|
||||||
|
* [mtv,cc] Use HLS by default with native HLS downloader (#11641)
|
||||||
|
* [mtv] Fix non-HLS extraction
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.01.10
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [youtube] Fix extraction (#11663, #11664)
|
||||||
|
+ [inc] Add support for inc.com (#11277, #11647)
|
||||||
|
+ [youtube] Add itag 212 (#11575)
|
||||||
|
+ [egghead:course] Add support for egghead.io courses
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.01.08
|
||||||
|
|
||||||
|
Core
|
||||||
|
* Fix "invalid escape sequence" errors under Python 3.6 (#11581)
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [hitrecord] Add support for hitrecord.org (#10867, #11626)
|
||||||
|
- [videott] Remove extractor
|
||||||
|
* [swrmediathek] Improve extraction
|
||||||
|
- [sharesix] Remove extractor
|
||||||
|
- [aol:features] Remove extractor
|
||||||
|
* [sendtonews] Improve info extraction
|
||||||
|
* [3sat,phoenix] Fix extraction (#11619)
|
||||||
|
* [comedycentral/mtv] Add support for HLS videos (#11600)
|
||||||
|
* [discoverygo] Fix JSON data parsing (#11219, #11522)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.01.05
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [zdf] Fix extraction (#11055, #11063)
|
||||||
|
* [pornhub:playlist] Improve extraction (#11594)
|
||||||
|
+ [cctv] Add support for ncpa-classic.com (#11591)
|
||||||
|
+ [tunein] Add support for embeds (#11579)
|
||||||
|
|
||||||
|
|
||||||
|
version 2017.01.02
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [cctv] Improve extraction (#879, #6753, #8541)
|
||||||
|
+ [nrktv:episodes] Add support for episodes (#11571)
|
||||||
|
+ [arkena] Add support for video.arkena.com (#11568)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.12.31
|
||||||
|
|
||||||
|
Core
|
||||||
|
+ Introduce --config-location option for custom configuration files (#6745,
|
||||||
|
#10648)
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [twitch] Add support for player.twitch.tv (#11535, #11537)
|
||||||
|
+ [videa] Add support for videa.hu (#8181, #11133)
|
||||||
|
* [vk] Fix postlive videos extraction
|
||||||
|
* [vk] Extract from playerParams (#11555)
|
||||||
|
- [freevideo] Remove extractor (#11515)
|
||||||
|
+ [showroomlive] Add support for showroom-live.com (#11458)
|
||||||
|
* [xhamster] Fix duration extraction (#11549)
|
||||||
|
* [rtve:live] Fix extraction (#11529)
|
||||||
|
* [brightcove:legacy] Improve embeds detection (#11523)
|
||||||
|
+ [twitch] Add support for rechat messages (#11524)
|
||||||
|
* [acast] Fix audio and timestamp extraction (#11521)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.12.22
|
||||||
|
|
||||||
|
Core
|
||||||
|
* [extractor/common] Improve detection of video-only formats in m3u8
|
||||||
|
manifests (#11507)
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [theplatform] Pass geo verification headers to SMIL request (#10146)
|
||||||
|
+ [viu] Pass geo verification headers to auth request
|
||||||
|
* [rtl2] Extract more formats and metadata
|
||||||
|
* [vbox7] Skip malformed JSON-LD (#11501)
|
||||||
|
* [uplynk] Force downloading using native HLS downloader (#11496)
|
||||||
|
+ [laola1] Add support for another extraction scenario (#11460)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.12.20
|
||||||
|
|
||||||
|
Core
|
||||||
|
* [extractor/common] Improve fragment URL construction for DASH media
|
||||||
|
* [extractor/common] Fix codec information extraction for mixed audio/video
|
||||||
|
DASH media (#11490)
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [vbox7] Fix extraction (#11494)
|
||||||
|
+ [uktvplay] Add support for uktvplay.uktv.co.uk (#11027)
|
||||||
|
+ [piksel] Add support for player.piksel.com (#11246)
|
||||||
|
+ [vimeo] Add support for DASH formats
|
||||||
|
* [vimeo] Fix extraction for HLS formats (#11490)
|
||||||
|
* [kaltura] Fix wrong widget ID in some cases (#11480)
|
||||||
|
+ [nrktv:direkte] Add support for live streams (#11488)
|
||||||
|
* [pbs] Fix extraction for geo restricted videos (#7095)
|
||||||
|
* [brightcove:new] Skip widevine classic videos
|
||||||
|
+ [viu] Add support for viu.com (#10607, #11329)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.12.18
|
||||||
|
|
||||||
|
Core
|
||||||
|
+ [extractor/common] Recognize DASH formats in html5 media entries
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [ccma] Add support for ccma.cat (#11359)
|
||||||
|
* [laola1tv] Improve extraction
|
||||||
|
+ [laola1tv] Add support embed URLs (#11460)
|
||||||
|
* [nbc] Fix extraction for MSNBC videos (#11466)
|
||||||
|
* [twitch] Adapt to new videos pages URL schema (#11469)
|
||||||
|
+ [meipai] Add support for meipai.com (#10718)
|
||||||
|
* [jwplatform] Improve subtitles and duration extraction
|
||||||
|
+ [ondemandkorea] Add support for ondemandkorea.com (#10772)
|
||||||
|
+ [vvvvid] Add support for vvvvid.it (#5915)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.12.15
|
||||||
|
|
||||||
|
Core
|
||||||
|
+ [utils] Add convenience urljoin
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [openload] Recognize oload.tv URLs (#10408)
|
||||||
|
+ [facebook] Recognize .onion URLs (#11443)
|
||||||
|
* [vlive] Fix extraction (#11375, #11383)
|
||||||
|
+ [canvas] Extract DASH formats
|
||||||
|
+ [melonvod] Add support for vod.melon.com (#11419)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.12.12
|
||||||
|
|
||||||
|
Core
|
||||||
|
+ [utils] Add common user agents map
|
||||||
|
+ [common] Recognize HLS manifests that contain video only formats (#11394)
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [dplay] Use Safari user agent for HLS (#11418)
|
||||||
|
+ [facebook] Detect login required error message
|
||||||
|
* [facebook] Improve video selection (#11390)
|
||||||
|
+ [canalplus] Add another video id pattern (#11399)
|
||||||
|
* [mixcloud] Relax URL regular expression (#11406)
|
||||||
|
* [ctvnews] Relax URL regular expression (#11394)
|
||||||
|
+ [rte] Capture and output error message (#7746, #10498)
|
||||||
|
+ [prosiebensat1] Add support for DASH formats
|
||||||
|
* [srgssr] Improve extraction for geo restricted videos (#11089)
|
||||||
|
* [rts] Improve extraction for geo restricted videos (#4989)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.12.09
|
||||||
|
|
||||||
|
Core
|
||||||
|
* [socks] Fix error reporting (#11355)
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [openload] Fix extraction (#10408)
|
||||||
|
* [pandoratv] Fix extraction (#11023)
|
||||||
|
+ [telebruxelles] Add support for emission URLs
|
||||||
|
* [telebruxelles] Extract all formats
|
||||||
|
+ [bloomberg] Add another video id regular expression (#11371)
|
||||||
|
* [fusion] Update ooyala id regular expression (#11364)
|
||||||
|
+ [1tv] Add support for playlists (#11335)
|
||||||
|
* [1tv] Improve extraction (#11335)
|
||||||
|
+ [aenetworks] Extract more formats (#11321)
|
||||||
|
+ [thisoldhouse] Recognize /tv-episode/ URLs (#11271)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.12.01
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [soundcloud] Update client id (#11327)
|
||||||
|
* [ruutu] Detect DRM protected videos
|
||||||
|
+ [liveleak] Add support for youtube embeds (#10688)
|
||||||
|
* [spike] Fix full episodes support (#11312)
|
||||||
|
* [comedycentral] Fix full episodes support
|
||||||
|
* [normalboots] Rewrite in terms of JWPlatform (#11184)
|
||||||
|
* [teamfourstar] Rewrite in terms of JWPlatform (#11184)
|
||||||
|
- [screenwavemedia] Remove extractor (#11184)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.11.27
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [webcaster] Add support for webcaster.pro
|
||||||
|
+ [azubu] Add support for azubu.uol.com.br (#11305)
|
||||||
|
* [viki] Prefer hls formats
|
||||||
|
* [viki] Fix rtmp formats extraction (#11255)
|
||||||
|
* [puls4] Relax URL regular expression (#11267)
|
||||||
|
* [vevo] Improve artist extraction (#10911)
|
||||||
|
* [mitele] Relax URL regular expression and extract more metadata (#11244)
|
||||||
|
+ [cbslocal] Recognize New York site (#11285)
|
||||||
|
+ [youtube:playlist] Pass disable_polymer in URL query (#11193)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.11.22
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [hellporno] Fix video extension extraction (#11247)
|
||||||
|
+ [hellporno] Add support for hellporno.net (#11247)
|
||||||
|
+ [amcnetworks] Recognize more BBC America URLs (#11263)
|
||||||
|
* [funnyordie] Improve extraction (#11208)
|
||||||
|
* [extractor/generic] Improve limelight embeds support
|
||||||
|
- [crunchyroll] Remove ScaledBorderAndShadow from ASS subtitles (#8207, #9028)
|
||||||
|
* [bandcamp] Fix free downloads extraction and extract all formats (#11067)
|
||||||
|
* [twitter:card] Relax URL regular expression (#11225)
|
||||||
|
+ [tvanouvelles] Add support for tvanouvelles.ca (#10616)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.11.18
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [youtube:live] Relax URL regular expression (#11164)
|
||||||
|
* [openload] Fix extraction (#10408, #11122)
|
||||||
|
* [vlive] Prefer locale over language for subtitles id (#11203)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.11.14.1
|
||||||
|
|
||||||
|
Core
|
||||||
|
+ [downoader/fragment,f4m,hls] Respect HTTP headers from info dict
|
||||||
|
* [extractor/common] Fix media templates with Bandwidth substitution pattern in
|
||||||
|
MPD manifests (#11175)
|
||||||
|
* [extractor/common] Improve thumbnail extraction from JSON-LD
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [nrk] Workaround geo restriction
|
||||||
|
+ [nrk] Improve error detection and messages
|
||||||
|
+ [afreecatv] Add support for vod.afreecatv.com (#11174)
|
||||||
|
* [cda] Fix and improve extraction (#10929, #10936)
|
||||||
|
* [plays] Fix extraction (#11165)
|
||||||
|
* [eagleplatform] Fix extraction (#11160)
|
||||||
|
+ [audioboom] Recognize /posts/ URLs (#11149)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.11.08.1
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [espn:article] Fix support for espn.com articles
|
||||||
|
* [franceculture] Fix extraction (#11140)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.11.08
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [tmz:article] Fix extraction (#11052)
|
||||||
|
* [espn] Fix extraction (#11041)
|
||||||
|
* [mitele] Fix extraction after website redesign (#10824)
|
||||||
|
- [ard] Remove age restriction check (#11129)
|
||||||
|
* [generic] Improve support for pornhub.com embeds (#11100)
|
||||||
|
+ [generic] Add support for redtube.com embeds (#11099)
|
||||||
|
+ [generic] Add support for drtuber.com embeds (#11098)
|
||||||
|
+ [redtube] Add support for embed URLs
|
||||||
|
+ [drtuber] Add support for embed URLs
|
||||||
|
+ [yahoo] Improve content id extraction (#11088)
|
||||||
|
* [toutv] Relax URL regular expression (#11121)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.11.04
|
||||||
|
|
||||||
|
Core
|
||||||
|
* [extractor/common] Tolerate malformed RESOLUTION attribute in m3u8
|
||||||
|
manifests (#11113)
|
||||||
|
* [downloader/ism] Fix AVC Decoder Configuration Record
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [fox9] Add support for fox9.com (#11110)
|
||||||
|
+ [anvato] Extract more metadata and improve formats extraction
|
||||||
|
* [vodlocker] Improve removed videos detection (#11106)
|
||||||
|
+ [vzaar] Add support for vzaar.com (#11093)
|
||||||
|
+ [vice] Add support for uplynk preplay videos (#11101)
|
||||||
|
* [tubitv] Fix extraction (#11061)
|
||||||
|
+ [shahid] Add support for authentication (#11091)
|
||||||
|
+ [radiocanada] Add subtitles support (#11096)
|
||||||
|
+ [generic] Add support for ISM manifests
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.11.02
|
||||||
|
|
||||||
|
Core
|
||||||
|
+ Add basic support for Smooth Streaming protocol (#8118, #10969)
|
||||||
|
* Improve MPD manifest base URL extraction (#10909, #11079)
|
||||||
|
* Fix --match-filter for int-like strings (#11082)
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [mva] Add support for ISM formats
|
||||||
|
+ [msn] Add support for ISM formats
|
||||||
|
+ [onet] Add support for ISM formats
|
||||||
|
+ [tvp] Add support for ISM formats
|
||||||
|
+ [nicknight] Add support for nicknight sites (#10769)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.10.30
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [facebook] Improve 1080P video detection (#11073)
|
||||||
|
* [imgur] Recognize /r/ URLs (#11071)
|
||||||
|
* [beeg] Fix extraction (#11069)
|
||||||
|
* [openload] Fix extraction (#10408)
|
||||||
|
* [gvsearch] Modernize and fix search request (#11051)
|
||||||
|
* [adultswim] Fix extraction (#10979)
|
||||||
|
+ [nobelprize] Add support for nobelprize.org (#9999)
|
||||||
|
* [hornbunny] Fix extraction (#10981)
|
||||||
|
* [tvp] Improve video id extraction (#10585)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.10.26
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [rentv] Add support for ren.tv (#10620)
|
||||||
|
+ [ard] Detect unavailable videos (#11018)
|
||||||
|
* [vk] Fix extraction (#11022)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.10.25
|
||||||
|
|
||||||
|
Core
|
||||||
|
* Running youtube-dl in the background is fixed (#10996, #10706, #955)
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [jamendo] Add support for jamendo.com (#10132, #10736)
|
||||||
|
+ [pandatv] Add support for panda.tv (#10736)
|
||||||
|
+ [dotsub] Support Vimeo embed (#10964)
|
||||||
|
* [litv] Fix extraction
|
||||||
|
+ [vimeo] Delegate ondemand redirects to ondemand extractor (#10994)
|
||||||
|
* [vivo] Fix extraction (#11003)
|
||||||
|
+ [twitch:stream] Add support for rebroadcasts (#10995)
|
||||||
|
* [pluralsight] Fix subtitles conversion (#10990)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.10.21.1
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [pluralsight] Process all clip URLs (#10984)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.10.21
|
||||||
|
|
||||||
|
Core
|
||||||
|
- Disable thumbnails embedding in mkv
|
||||||
|
+ Add support for Comcast multiple-system operator (#10819)
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [pluralsight] Adapt to new API (#10972)
|
||||||
|
* [openload] Fix extraction (#10408, #10971)
|
||||||
|
+ [natgeo] Extract m3u8 formats (#10959)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.10.19
|
||||||
|
|
||||||
|
Core
|
||||||
|
+ [utils] Expose PACKED_CODES_RE
|
||||||
|
+ [extractor/common] Extract non smil wowza mpd manifests
|
||||||
|
+ [extractor/common] Detect f4m audio-only formats
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [vidzi] Fix extraction (#10908, #10952)
|
||||||
|
* [urplay] Fix subtitles extraction
|
||||||
|
+ [urplay] Add support for urskola.se (#10915)
|
||||||
|
+ [orf] Add subtitles support (#10939)
|
||||||
|
* [youtube] Fix --no-playlist behavior for youtu.be/id URLs (#10896)
|
||||||
|
* [nrk] Relax URL regular expression (#10928)
|
||||||
|
+ [nytimes] Add support for podcasts (#10926)
|
||||||
|
* [pluralsight] Relax URL regular expression (#10941)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.10.16
|
||||||
|
|
||||||
|
Core
|
||||||
|
* [postprocessor/ffmpeg] Return correct filepath and ext in updated information
|
||||||
|
in FFmpegExtractAudioPP (#10879)
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [ruutu] Add support for supla.fi (#10849)
|
||||||
|
+ [theoperaplatform] Add support for theoperaplatform.eu (#10914)
|
||||||
|
* [lynda] Fix height for prioritized streams
|
||||||
|
+ [lynda] Add fallback extraction scenario
|
||||||
|
* [lynda] Switch to https (#10916)
|
||||||
|
+ [huajiao] New extractor (#10917)
|
||||||
|
* [cmt] Fix mgid extraction (#10813)
|
||||||
|
+ [safari:course] Add support for techbus.safaribooksonline.com
|
||||||
|
* [orf:tvthek] Fix extraction and modernize (#10898)
|
||||||
|
* [chirbit] Fix extraction of user profile pages
|
||||||
|
* [carambatv] Fix extraction
|
||||||
|
* [canalplus] Fix extraction for some videos
|
||||||
|
* [cbsinteractive] Fix extraction for cnet.com
|
||||||
|
* [parliamentliveuk] Lower case URLs are now recognized (#10912)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.10.12
|
||||||
|
|
||||||
|
Core
|
||||||
|
+ Support HTML media elements without child nodes
|
||||||
|
* [Makefile] Support for GNU make < 4 is fixed; BSD make dropped (#9387)
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
* [dailymotion] Fix extraction (#10901)
|
||||||
|
* [vimeo:review] Fix extraction (#10900)
|
||||||
|
* [nhl] Correctly handle invalid formats (#10713)
|
||||||
|
* [footyroom] Fix extraction (#10810)
|
||||||
|
* [abc.net.au:iview] Fix for standalone (non series) videos (#10895)
|
||||||
|
+ [hbo] Add support for episode pages (#10892)
|
||||||
|
* [allocine] Fix extraction (#10860)
|
||||||
|
+ [nextmedia] Recognize action news on AppleDaily
|
||||||
|
* [lego] Improve info extraction and bypass geo restriction (#10872)
|
||||||
|
|
||||||
|
|
||||||
|
version 2016.10.07
|
||||||
|
|
||||||
|
Extractors
|
||||||
|
+ [iprima] Detect geo restriction
|
||||||
|
* [facebook] Fix video extraction (#10846)
|
||||||
|
+ [commonprotocols] Support direct MMS links (#10838)
|
||||||
|
+ [generic] Add support for multiple vimeo embeds (#10862)
|
||||||
|
+ [nzz] Add support for nzz.ch (#4407)
|
||||||
|
+ [npo] Detect geo restriction
|
||||||
|
+ [npo] Add support for 2doc.nl (#10842)
|
||||||
|
+ [lego] Add support for lego.com (#10369)
|
||||||
|
+ [tonline] Add support for t-online.de (#10376)
|
||||||
|
* [techtalks] Relax URL regular expression (#10840)
|
||||||
|
* [youtube:live] Extend URL regular expression (#10839)
|
||||||
|
+ [theweatherchannel] Add support for weather.com (#7188)
|
||||||
|
+ [thisoldhouse] Add support for thisoldhouse.com (#10837)
|
||||||
|
+ [nhl] Add support for wch2016.com (#10833)
|
||||||
|
* [pornoxo] Use JWPlatform to improve metadata extraction
|
||||||
|
|
||||||
|
|
||||||
version 2016.10.02
|
version 2016.10.02
|
||||||
|
|
||||||
Core
|
Core
|
||||||
|
6
Makefile
6
Makefile
@ -1,7 +1,7 @@
|
|||||||
all: youtube-dl README.md CONTRIBUTING.md README.txt youtube-dl.1 youtube-dl.bash-completion youtube-dl.zsh youtube-dl.fish supportedsites
|
all: youtube-dl README.md CONTRIBUTING.md README.txt youtube-dl.1 youtube-dl.bash-completion youtube-dl.zsh youtube-dl.fish supportedsites
|
||||||
|
|
||||||
clean:
|
clean:
|
||||||
rm -rf youtube-dl.1.temp.md youtube-dl.1 youtube-dl.bash-completion README.txt MANIFEST build/ dist/ .coverage cover/ youtube-dl.tar.gz youtube-dl.zsh youtube-dl.fish youtube_dl/extractor/lazy_extractors.py *.dump *.part* *.info.json *.mp4 *.m4a *.flv *.mp3 *.avi *.mkv *.webm *.3gp *.jpg *.png CONTRIBUTING.md.tmp ISSUE_TEMPLATE.md.tmp youtube-dl youtube-dl.exe
|
rm -rf youtube-dl.1.temp.md youtube-dl.1 youtube-dl.bash-completion README.txt MANIFEST build/ dist/ .coverage cover/ youtube-dl.tar.gz youtube-dl.zsh youtube-dl.fish youtube_dl/extractor/lazy_extractors.py *.dump *.part* *.info.json *.mp4 *.m4a *.flv *.mp3 *.avi *.mkv *.webm *.3gp *.wav *.ape *.swf *.jpg *.png CONTRIBUTING.md.tmp ISSUE_TEMPLATE.md.tmp youtube-dl youtube-dl.exe
|
||||||
find . -name "*.pyc" -delete
|
find . -name "*.pyc" -delete
|
||||||
find . -name "*.class" -delete
|
find . -name "*.class" -delete
|
||||||
|
|
||||||
@ -12,7 +12,7 @@ SHAREDIR ?= $(PREFIX)/share
|
|||||||
PYTHON ?= /usr/bin/env python
|
PYTHON ?= /usr/bin/env python
|
||||||
|
|
||||||
# set SYSCONFDIR to /etc if PREFIX=/usr or PREFIX=/usr/local
|
# set SYSCONFDIR to /etc if PREFIX=/usr or PREFIX=/usr/local
|
||||||
SYSCONFDIR != if [ $(PREFIX) = /usr -o $(PREFIX) = /usr/local ]; then echo /etc; else echo $(PREFIX)/etc; fi
|
SYSCONFDIR = $(shell if [ $(PREFIX) = /usr -o $(PREFIX) = /usr/local ]; then echo /etc; else echo $(PREFIX)/etc; fi)
|
||||||
|
|
||||||
install: youtube-dl youtube-dl.1 youtube-dl.bash-completion youtube-dl.zsh youtube-dl.fish
|
install: youtube-dl youtube-dl.1 youtube-dl.bash-completion youtube-dl.zsh youtube-dl.fish
|
||||||
install -d $(DESTDIR)$(BINDIR)
|
install -d $(DESTDIR)$(BINDIR)
|
||||||
@ -90,7 +90,7 @@ fish-completion: youtube-dl.fish
|
|||||||
|
|
||||||
lazy-extractors: youtube_dl/extractor/lazy_extractors.py
|
lazy-extractors: youtube_dl/extractor/lazy_extractors.py
|
||||||
|
|
||||||
_EXTRACTOR_FILES != find youtube_dl/extractor -iname '*.py' -and -not -iname 'lazy_extractors.py'
|
_EXTRACTOR_FILES = $(shell find youtube_dl/extractor -iname '*.py' -and -not -iname 'lazy_extractors.py')
|
||||||
youtube_dl/extractor/lazy_extractors.py: devscripts/make_lazy_extractors.py devscripts/lazy_load_template.py $(_EXTRACTOR_FILES)
|
youtube_dl/extractor/lazy_extractors.py: devscripts/make_lazy_extractors.py devscripts/lazy_load_template.py $(_EXTRACTOR_FILES)
|
||||||
$(PYTHON) devscripts/make_lazy_extractors.py $@
|
$(PYTHON) devscripts/make_lazy_extractors.py $@
|
||||||
|
|
||||||
|
299
README.md
299
README.md
@ -29,7 +29,7 @@ Windows users can [download an .exe file](https://yt-dl.org/latest/youtube-dl.ex
|
|||||||
|
|
||||||
You can also use pip:
|
You can also use pip:
|
||||||
|
|
||||||
sudo pip install --upgrade youtube-dl
|
sudo -H pip install --upgrade youtube-dl
|
||||||
|
|
||||||
This command will update youtube-dl if you have already installed it. See the [pypi page](https://pypi.python.org/pypi/youtube_dl) for more information.
|
This command will update youtube-dl if you have already installed it. See the [pypi page](https://pypi.python.org/pypi/youtube_dl) for more information.
|
||||||
|
|
||||||
@ -44,11 +44,7 @@ Or with [MacPorts](https://www.macports.org/):
|
|||||||
Alternatively, refer to the [developer instructions](#developer-instructions) for how to check out and work with the git repository. For further options, including PGP signatures, see the [youtube-dl Download Page](https://rg3.github.io/youtube-dl/download.html).
|
Alternatively, refer to the [developer instructions](#developer-instructions) for how to check out and work with the git repository. For further options, including PGP signatures, see the [youtube-dl Download Page](https://rg3.github.io/youtube-dl/download.html).
|
||||||
|
|
||||||
# DESCRIPTION
|
# DESCRIPTION
|
||||||
**youtube-dl** is a command-line program to download videos from
|
**youtube-dl** is a command-line program to download videos from YouTube.com and a few more sites. It requires the Python interpreter, version 2.6, 2.7, or 3.2+, and it is not platform specific. It should work on your Unix box, on Windows or on Mac OS X. It is released to the public domain, which means you can modify it, redistribute it or use it however you like.
|
||||||
YouTube.com and a few more sites. It requires the Python interpreter, version
|
|
||||||
2.6, 2.7, or 3.2+, and it is not platform specific. It should work on
|
|
||||||
your Unix box, on Windows or on Mac OS X. It is released to the public domain,
|
|
||||||
which means you can modify it, redistribute it or use it however you like.
|
|
||||||
|
|
||||||
youtube-dl [OPTIONS] URL [URL...]
|
youtube-dl [OPTIONS] URL [URL...]
|
||||||
|
|
||||||
@ -84,13 +80,14 @@ which means you can modify it, redistribute it or use it however you like.
|
|||||||
configuration in ~/.config/youtube-
|
configuration in ~/.config/youtube-
|
||||||
dl/config (%APPDATA%/youtube-dl/config.txt
|
dl/config (%APPDATA%/youtube-dl/config.txt
|
||||||
on Windows)
|
on Windows)
|
||||||
|
--config-location PATH Location of the configuration file; either
|
||||||
|
the path to the config or its containing
|
||||||
|
directory.
|
||||||
--flat-playlist Do not extract the videos of a playlist,
|
--flat-playlist Do not extract the videos of a playlist,
|
||||||
only list them.
|
only list them.
|
||||||
--mark-watched Mark videos watched (YouTube only)
|
--mark-watched Mark videos watched (YouTube only)
|
||||||
--no-mark-watched Do not mark videos watched (YouTube only)
|
--no-mark-watched Do not mark videos watched (YouTube only)
|
||||||
--no-color Do not emit color codes in output
|
--no-color Do not emit color codes in output
|
||||||
--abort-on-unavailable-fragment Abort downloading when some fragment is not
|
|
||||||
available
|
|
||||||
|
|
||||||
## Network Options:
|
## Network Options:
|
||||||
--proxy URL Use the specified HTTP/HTTPS/SOCKS proxy.
|
--proxy URL Use the specified HTTP/HTTPS/SOCKS proxy.
|
||||||
@ -100,16 +97,23 @@ which means you can modify it, redistribute it or use it however you like.
|
|||||||
string (--proxy "") for direct connection
|
string (--proxy "") for direct connection
|
||||||
--socket-timeout SECONDS Time to wait before giving up, in seconds
|
--socket-timeout SECONDS Time to wait before giving up, in seconds
|
||||||
--source-address IP Client-side IP address to bind to
|
--source-address IP Client-side IP address to bind to
|
||||||
(experimental)
|
|
||||||
-4, --force-ipv4 Make all connections via IPv4
|
-4, --force-ipv4 Make all connections via IPv4
|
||||||
(experimental)
|
|
||||||
-6, --force-ipv6 Make all connections via IPv6
|
-6, --force-ipv6 Make all connections via IPv6
|
||||||
(experimental)
|
|
||||||
|
## Geo Restriction:
|
||||||
--geo-verification-proxy URL Use this proxy to verify the IP address for
|
--geo-verification-proxy URL Use this proxy to verify the IP address for
|
||||||
some geo-restricted sites. The default
|
some geo-restricted sites. The default
|
||||||
proxy specified by --proxy (or none, if the
|
proxy specified by --proxy (or none, if the
|
||||||
options is not present) is used for the
|
options is not present) is used for the
|
||||||
actual downloading. (experimental)
|
actual downloading.
|
||||||
|
--geo-bypass Bypass geographic restriction via faking
|
||||||
|
X-Forwarded-For HTTP header (experimental)
|
||||||
|
--no-geo-bypass Do not bypass geographic restriction via
|
||||||
|
faking X-Forwarded-For HTTP header
|
||||||
|
(experimental)
|
||||||
|
--geo-bypass-country CODE Force bypass geographic restriction with
|
||||||
|
explicitly provided two-letter ISO 3166-2
|
||||||
|
country code (experimental)
|
||||||
|
|
||||||
## Video Selection:
|
## Video Selection:
|
||||||
--playlist-start NUMBER Playlist video to start at (default is 1)
|
--playlist-start NUMBER Playlist video to start at (default is 1)
|
||||||
@ -140,15 +144,17 @@ which means you can modify it, redistribute it or use it however you like.
|
|||||||
COUNT views
|
COUNT views
|
||||||
--max-views COUNT Do not download any videos with more than
|
--max-views COUNT Do not download any videos with more than
|
||||||
COUNT views
|
COUNT views
|
||||||
--match-filter FILTER Generic video filter (experimental).
|
--match-filter FILTER Generic video filter. Specify any key (see
|
||||||
Specify any key (see help for -o for a list
|
help for -o for a list of available keys)
|
||||||
of available keys) to match if the key is
|
to match if the key is present, !key to
|
||||||
present, !key to check if the key is not
|
check if the key is not present, key >
|
||||||
present,key > NUMBER (like "comment_count >
|
NUMBER (like "comment_count > 12", also
|
||||||
12", also works with >=, <, <=, !=, =) to
|
works with >=, <, <=, !=, =) to compare
|
||||||
compare against a number, and & to require
|
against a number, key = 'LITERAL' (like
|
||||||
multiple matches. Values which are not
|
"uploader = 'Mike Smith'", also works with
|
||||||
known are excluded unless you put a
|
!=) to match against a string literal and &
|
||||||
|
to require multiple matches. Values which
|
||||||
|
are not known are excluded unless you put a
|
||||||
question mark (?) after the operator. For
|
question mark (?) after the operator. For
|
||||||
example, to only match videos that have
|
example, to only match videos that have
|
||||||
been liked more than 100 times and disliked
|
been liked more than 100 times and disliked
|
||||||
@ -179,6 +185,8 @@ which means you can modify it, redistribute it or use it however you like.
|
|||||||
only)
|
only)
|
||||||
--skip-unavailable-fragments Skip unavailable fragments (DASH and
|
--skip-unavailable-fragments Skip unavailable fragments (DASH and
|
||||||
hlsnative only)
|
hlsnative only)
|
||||||
|
--abort-on-unavailable-fragment Abort downloading when some fragment is not
|
||||||
|
available
|
||||||
--buffer-size SIZE Size of download buffer (e.g. 1024 or 16K)
|
--buffer-size SIZE Size of download buffer (e.g. 1024 or 16K)
|
||||||
(default is 1024)
|
(default is 1024)
|
||||||
--no-resize-buffer Do not automatically adjust the buffer
|
--no-resize-buffer Do not automatically adjust the buffer
|
||||||
@ -186,6 +194,7 @@ which means you can modify it, redistribute it or use it however you like.
|
|||||||
automatically resized from an initial value
|
automatically resized from an initial value
|
||||||
of SIZE.
|
of SIZE.
|
||||||
--playlist-reverse Download playlist videos in reverse order
|
--playlist-reverse Download playlist videos in reverse order
|
||||||
|
--playlist-random Download playlist videos in random order
|
||||||
--xattr-set-filesize Set file xattribute ytdl.filesize with
|
--xattr-set-filesize Set file xattribute ytdl.filesize with
|
||||||
expected file size (experimental)
|
expected file size (experimental)
|
||||||
--hls-prefer-native Use the native HLS downloader instead of
|
--hls-prefer-native Use the native HLS downloader instead of
|
||||||
@ -208,19 +217,11 @@ which means you can modify it, redistribute it or use it however you like.
|
|||||||
--id Use only video ID in file name
|
--id Use only video ID in file name
|
||||||
-o, --output TEMPLATE Output filename template, see the "OUTPUT
|
-o, --output TEMPLATE Output filename template, see the "OUTPUT
|
||||||
TEMPLATE" for all the info
|
TEMPLATE" for all the info
|
||||||
--autonumber-size NUMBER Specify the number of digits in
|
--autonumber-start NUMBER Specify the start value for %(autonumber)s
|
||||||
%(autonumber)s when it is present in output
|
(default is 1)
|
||||||
filename template or --auto-number option
|
|
||||||
is given
|
|
||||||
--restrict-filenames Restrict filenames to only ASCII
|
--restrict-filenames Restrict filenames to only ASCII
|
||||||
characters, and avoid "&" and spaces in
|
characters, and avoid "&" and spaces in
|
||||||
filenames
|
filenames
|
||||||
-A, --auto-number [deprecated; use -o
|
|
||||||
"%(autonumber)s-%(title)s.%(ext)s" ] Number
|
|
||||||
downloaded files starting from 00000
|
|
||||||
-t, --title [deprecated] Use title in file name
|
|
||||||
(default)
|
|
||||||
-l, --literal [deprecated] Alias of --title
|
|
||||||
-w, --no-overwrites Do not overwrite files
|
-w, --no-overwrites Do not overwrite files
|
||||||
-c, --continue Force resume of partially downloaded files.
|
-c, --continue Force resume of partially downloaded files.
|
||||||
By default, youtube-dl will resume
|
By default, youtube-dl will resume
|
||||||
@ -354,7 +355,7 @@ which means you can modify it, redistribute it or use it however you like.
|
|||||||
-u, --username USERNAME Login with this account ID
|
-u, --username USERNAME Login with this account ID
|
||||||
-p, --password PASSWORD Account password. If this option is left
|
-p, --password PASSWORD Account password. If this option is left
|
||||||
out, youtube-dl will ask interactively.
|
out, youtube-dl will ask interactively.
|
||||||
-2, --twofactor TWOFACTOR Two-factor auth code
|
-2, --twofactor TWOFACTOR Two-factor authentication code
|
||||||
-n, --netrc Use .netrc authentication data
|
-n, --netrc Use .netrc authentication data
|
||||||
--video-password PASSWORD Video password (vimeo, smotri, youku)
|
--video-password PASSWORD Video password (vimeo, smotri, youku)
|
||||||
|
|
||||||
@ -375,7 +376,7 @@ which means you can modify it, redistribute it or use it however you like.
|
|||||||
avprobe)
|
avprobe)
|
||||||
--audio-format FORMAT Specify audio format: "best", "aac",
|
--audio-format FORMAT Specify audio format: "best", "aac",
|
||||||
"vorbis", "mp3", "m4a", "opus", or "wav";
|
"vorbis", "mp3", "m4a", "opus", or "wav";
|
||||||
"best" by default
|
"best" by default; No effect without -x
|
||||||
--audio-quality QUALITY Specify ffmpeg/avconv audio quality, insert
|
--audio-quality QUALITY Specify ffmpeg/avconv audio quality, insert
|
||||||
a value between 0 (better) and 9 (worse)
|
a value between 0 (better) and 9 (worse)
|
||||||
for VBR or a specific bitrate like 128K
|
for VBR or a specific bitrate like 128K
|
||||||
@ -447,14 +448,16 @@ Note that options in configuration file are just the same options aka switches u
|
|||||||
|
|
||||||
You can use `--ignore-config` if you want to disable the configuration file for a particular youtube-dl run.
|
You can use `--ignore-config` if you want to disable the configuration file for a particular youtube-dl run.
|
||||||
|
|
||||||
|
You can also use `--config-location` if you want to use custom configuration file for a particular youtube-dl run.
|
||||||
|
|
||||||
### Authentication with `.netrc` file
|
### Authentication with `.netrc` file
|
||||||
|
|
||||||
You may also want to configure automatic credentials storage for extractors that support authentication (by providing login and password with `--username` and `--password`) in order not to pass credentials as command line arguments on every youtube-dl execution and prevent tracking plain text passwords in the shell command history. You can achieve this using a [`.netrc` file](http://stackoverflow.com/tags/.netrc/info) on per extractor basis. For that you will need to create a `.netrc` file in your `$HOME` and restrict permissions to read/write by you only:
|
You may also want to configure automatic credentials storage for extractors that support authentication (by providing login and password with `--username` and `--password`) in order not to pass credentials as command line arguments on every youtube-dl execution and prevent tracking plain text passwords in the shell command history. You can achieve this using a [`.netrc` file](http://stackoverflow.com/tags/.netrc/info) on a per extractor basis. For that you will need to create a `.netrc` file in your `$HOME` and restrict permissions to read/write by only you:
|
||||||
```
|
```
|
||||||
touch $HOME/.netrc
|
touch $HOME/.netrc
|
||||||
chmod a-rwx,u+rw $HOME/.netrc
|
chmod a-rwx,u+rw $HOME/.netrc
|
||||||
```
|
```
|
||||||
After that you can add credentials for extractor in the following format, where *extractor* is the name of extractor in lowercase:
|
After that you can add credentials for an extractor in the following format, where *extractor* is the name of the extractor in lowercase:
|
||||||
```
|
```
|
||||||
machine <extractor> login <login> password <password>
|
machine <extractor> login <login> password <password>
|
||||||
```
|
```
|
||||||
@ -473,90 +476,92 @@ The `-o` option allows users to indicate a template for the output file names.
|
|||||||
|
|
||||||
**tl;dr:** [navigate me to examples](#output-template-examples).
|
**tl;dr:** [navigate me to examples](#output-template-examples).
|
||||||
|
|
||||||
The basic usage is not to set any template arguments when downloading a single file, like in `youtube-dl -o funny_video.flv "http://some/video"`. However, it may contain special sequences that will be replaced when downloading each video. The special sequences have the format `%(NAME)s`. To clarify, that is a percent symbol followed by a name in parentheses, followed by a lowercase S. Allowed names are:
|
The basic usage is not to set any template arguments when downloading a single file, like in `youtube-dl -o funny_video.flv "http://some/video"`. However, it may contain special sequences that will be replaced when downloading each video. The special sequences may be formatted according to [python string formatting operations](https://docs.python.org/2/library/stdtypes.html#string-formatting). For example, `%(NAME)s` or `%(NAME)05d`. To clarify, that is a percent symbol followed by a name in parentheses, followed by a formatting operations. Allowed names along with sequence type are:
|
||||||
|
|
||||||
- `id`: Video identifier
|
- `id` (string): Video identifier
|
||||||
- `title`: Video title
|
- `title` (string): Video title
|
||||||
- `url`: Video URL
|
- `url` (string): Video URL
|
||||||
- `ext`: Video filename extension
|
- `ext` (string): Video filename extension
|
||||||
- `alt_title`: A secondary title of the video
|
- `alt_title` (string): A secondary title of the video
|
||||||
- `display_id`: An alternative identifier for the video
|
- `display_id` (string): An alternative identifier for the video
|
||||||
- `uploader`: Full name of the video uploader
|
- `uploader` (string): Full name of the video uploader
|
||||||
- `license`: License name the video is licensed under
|
- `license` (string): License name the video is licensed under
|
||||||
- `creator`: The creator of the video
|
- `creator` (string): The creator of the video
|
||||||
- `release_date`: The date (YYYYMMDD) when the video was released
|
- `release_date` (string): The date (YYYYMMDD) when the video was released
|
||||||
- `timestamp`: UNIX timestamp of the moment the video became available
|
- `timestamp` (numeric): UNIX timestamp of the moment the video became available
|
||||||
- `upload_date`: Video upload date (YYYYMMDD)
|
- `upload_date` (string): Video upload date (YYYYMMDD)
|
||||||
- `uploader_id`: Nickname or id of the video uploader
|
- `uploader_id` (string): Nickname or id of the video uploader
|
||||||
- `location`: Physical location where the video was filmed
|
- `location` (string): Physical location where the video was filmed
|
||||||
- `duration`: Length of the video in seconds
|
- `duration` (numeric): Length of the video in seconds
|
||||||
- `view_count`: How many users have watched the video on the platform
|
- `view_count` (numeric): How many users have watched the video on the platform
|
||||||
- `like_count`: Number of positive ratings of the video
|
- `like_count` (numeric): Number of positive ratings of the video
|
||||||
- `dislike_count`: Number of negative ratings of the video
|
- `dislike_count` (numeric): Number of negative ratings of the video
|
||||||
- `repost_count`: Number of reposts of the video
|
- `repost_count` (numeric): Number of reposts of the video
|
||||||
- `average_rating`: Average rating give by users, the scale used depends on the webpage
|
- `average_rating` (numeric): Average rating give by users, the scale used depends on the webpage
|
||||||
- `comment_count`: Number of comments on the video
|
- `comment_count` (numeric): Number of comments on the video
|
||||||
- `age_limit`: Age restriction for the video (years)
|
- `age_limit` (numeric): Age restriction for the video (years)
|
||||||
- `format`: A human-readable description of the format
|
- `format` (string): A human-readable description of the format
|
||||||
- `format_id`: Format code specified by `--format`
|
- `format_id` (string): Format code specified by `--format`
|
||||||
- `format_note`: Additional info about the format
|
- `format_note` (string): Additional info about the format
|
||||||
- `width`: Width of the video
|
- `width` (numeric): Width of the video
|
||||||
- `height`: Height of the video
|
- `height` (numeric): Height of the video
|
||||||
- `resolution`: Textual description of width and height
|
- `resolution` (string): Textual description of width and height
|
||||||
- `tbr`: Average bitrate of audio and video in KBit/s
|
- `tbr` (numeric): Average bitrate of audio and video in KBit/s
|
||||||
- `abr`: Average audio bitrate in KBit/s
|
- `abr` (numeric): Average audio bitrate in KBit/s
|
||||||
- `acodec`: Name of the audio codec in use
|
- `acodec` (string): Name of the audio codec in use
|
||||||
- `asr`: Audio sampling rate in Hertz
|
- `asr` (numeric): Audio sampling rate in Hertz
|
||||||
- `vbr`: Average video bitrate in KBit/s
|
- `vbr` (numeric): Average video bitrate in KBit/s
|
||||||
- `fps`: Frame rate
|
- `fps` (numeric): Frame rate
|
||||||
- `vcodec`: Name of the video codec in use
|
- `vcodec` (string): Name of the video codec in use
|
||||||
- `container`: Name of the container format
|
- `container` (string): Name of the container format
|
||||||
- `filesize`: The number of bytes, if known in advance
|
- `filesize` (numeric): The number of bytes, if known in advance
|
||||||
- `filesize_approx`: An estimate for the number of bytes
|
- `filesize_approx` (numeric): An estimate for the number of bytes
|
||||||
- `protocol`: The protocol that will be used for the actual download
|
- `protocol` (string): The protocol that will be used for the actual download
|
||||||
- `extractor`: Name of the extractor
|
- `extractor` (string): Name of the extractor
|
||||||
- `extractor_key`: Key name of the extractor
|
- `extractor_key` (string): Key name of the extractor
|
||||||
- `epoch`: Unix epoch when creating the file
|
- `epoch` (numeric): Unix epoch when creating the file
|
||||||
- `autonumber`: Five-digit number that will be increased with each download, starting at zero
|
- `autonumber` (numeric): Five-digit number that will be increased with each download, starting at zero
|
||||||
- `playlist`: Name or id of the playlist that contains the video
|
- `playlist` (string): Name or id of the playlist that contains the video
|
||||||
- `playlist_index`: Index of the video in the playlist padded with leading zeros according to the total length of the playlist
|
- `playlist_index` (numeric): Index of the video in the playlist padded with leading zeros according to the total length of the playlist
|
||||||
- `playlist_id`: Playlist identifier
|
- `playlist_id` (string): Playlist identifier
|
||||||
- `playlist_title`: Playlist title
|
- `playlist_title` (string): Playlist title
|
||||||
|
|
||||||
|
|
||||||
Available for the video that belongs to some logical chapter or section:
|
Available for the video that belongs to some logical chapter or section:
|
||||||
- `chapter`: Name or title of the chapter the video belongs to
|
- `chapter` (string): Name or title of the chapter the video belongs to
|
||||||
- `chapter_number`: Number of the chapter the video belongs to
|
- `chapter_number` (numeric): Number of the chapter the video belongs to
|
||||||
- `chapter_id`: Id of the chapter the video belongs to
|
- `chapter_id` (string): Id of the chapter the video belongs to
|
||||||
|
|
||||||
Available for the video that is an episode of some series or programme:
|
Available for the video that is an episode of some series or programme:
|
||||||
- `series`: Title of the series or programme the video episode belongs to
|
- `series` (string): Title of the series or programme the video episode belongs to
|
||||||
- `season`: Title of the season the video episode belongs to
|
- `season` (string): Title of the season the video episode belongs to
|
||||||
- `season_number`: Number of the season the video episode belongs to
|
- `season_number` (numeric): Number of the season the video episode belongs to
|
||||||
- `season_id`: Id of the season the video episode belongs to
|
- `season_id` (string): Id of the season the video episode belongs to
|
||||||
- `episode`: Title of the video episode
|
- `episode` (string): Title of the video episode
|
||||||
- `episode_number`: Number of the video episode within a season
|
- `episode_number` (numeric): Number of the video episode within a season
|
||||||
- `episode_id`: Id of the video episode
|
- `episode_id` (string): Id of the video episode
|
||||||
|
|
||||||
Available for the media that is a track or a part of a music album:
|
Available for the media that is a track or a part of a music album:
|
||||||
- `track`: Title of the track
|
- `track` (string): Title of the track
|
||||||
- `track_number`: Number of the track within an album or a disc
|
- `track_number` (numeric): Number of the track within an album or a disc
|
||||||
- `track_id`: Id of the track
|
- `track_id` (string): Id of the track
|
||||||
- `artist`: Artist(s) of the track
|
- `artist` (string): Artist(s) of the track
|
||||||
- `genre`: Genre(s) of the track
|
- `genre` (string): Genre(s) of the track
|
||||||
- `album`: Title of the album the track belongs to
|
- `album` (string): Title of the album the track belongs to
|
||||||
- `album_type`: Type of the album
|
- `album_type` (string): Type of the album
|
||||||
- `album_artist`: List of all artists appeared on the album
|
- `album_artist` (string): List of all artists appeared on the album
|
||||||
- `disc_number`: Number of the disc or other physical medium the track belongs to
|
- `disc_number` (numeric): Number of the disc or other physical medium the track belongs to
|
||||||
- `release_year`: Year (YYYY) when the album was released
|
- `release_year` (numeric): Year (YYYY) when the album was released
|
||||||
|
|
||||||
Each aforementioned sequence when referenced in output template will be replaced by the actual value corresponding to the sequence name. Note that some of the sequences are not guaranteed to be present since they depend on the metadata obtained by particular extractor, such sequences will be replaced with `NA`.
|
Each aforementioned sequence when referenced in an output template will be replaced by the actual value corresponding to the sequence name. Note that some of the sequences are not guaranteed to be present since they depend on the metadata obtained by a particular extractor. Such sequences will be replaced with `NA`.
|
||||||
|
|
||||||
For example for `-o %(title)s-%(id)s.%(ext)s` and mp4 video with title `youtube-dl test video` and id `BaW_jenozKcj` this will result in a `youtube-dl test video-BaW_jenozKcj.mp4` file created in the current directory.
|
For example for `-o %(title)s-%(id)s.%(ext)s` and an mp4 video with title `youtube-dl test video` and id `BaW_jenozKcj`, this will result in a `youtube-dl test video-BaW_jenozKcj.mp4` file created in the current directory.
|
||||||
|
|
||||||
Output template can also contain arbitrary hierarchical path, e.g. `-o '%(playlist)s/%(playlist_index)s - %(title)s.%(ext)s'` that will result in downloading each video in a directory corresponding to this path template. Any missing directory will be automatically created for you.
|
For numeric sequences you can use numeric related formatting, for example, `%(view_count)05d` will result in a string with view count padded with zeros up to 5 characters, like in `00042`.
|
||||||
|
|
||||||
To specify percent literal in output template use `%%`. To output to stdout use `-o -`.
|
Output templates can also contain arbitrary hierarchical path, e.g. `-o '%(playlist)s/%(playlist_index)s - %(title)s.%(ext)s'` which will result in downloading each video in a directory corresponding to this path template. Any missing directory will be automatically created for you.
|
||||||
|
|
||||||
|
To use percent literals in an output template use `%%`. To output to stdout use `-o -`.
|
||||||
|
|
||||||
The current default template is `%(title)s-%(id)s.%(ext)s`.
|
The current default template is `%(title)s-%(id)s.%(ext)s`.
|
||||||
|
|
||||||
@ -564,7 +569,7 @@ In some cases, you don't want special characters such as 中, spaces, or &, such
|
|||||||
|
|
||||||
#### Output template and Windows batch files
|
#### Output template and Windows batch files
|
||||||
|
|
||||||
If you are using output template inside a Windows batch file then you must escape plain percent characters (`%`) by doubling, so that `-o "%(title)s-%(id)s.%(ext)s"` should become `-o "%%(title)s-%%(id)s.%%(ext)s"`. However you should not touch `%`'s that are not plain characters, e.g. environment variables for expansion should stay intact: `-o "C:\%HOMEPATH%\Desktop\%%(title)s.%%(ext)s"`.
|
If you are using an output template inside a Windows batch file then you must escape plain percent characters (`%`) by doubling, so that `-o "%(title)s-%(id)s.%(ext)s"` should become `-o "%%(title)s-%%(id)s.%%(ext)s"`. However you should not touch `%`'s that are not plain characters, e.g. environment variables for expansion should stay intact: `-o "C:\%HOMEPATH%\Desktop\%%(title)s.%%(ext)s"`.
|
||||||
|
|
||||||
#### Output template examples
|
#### Output template examples
|
||||||
|
|
||||||
@ -597,7 +602,7 @@ $ youtube-dl -o - BaW_jenozKc
|
|||||||
|
|
||||||
By default youtube-dl tries to download the best available quality, i.e. if you want the best quality you **don't need** to pass any special options, youtube-dl will guess it for you by **default**.
|
By default youtube-dl tries to download the best available quality, i.e. if you want the best quality you **don't need** to pass any special options, youtube-dl will guess it for you by **default**.
|
||||||
|
|
||||||
But sometimes you may want to download in a different format, for example when you are on a slow or intermittent connection. The key mechanism for achieving this is so called *format selection* based on which you can explicitly specify desired format, select formats based on some criterion or criteria, setup precedence and much more.
|
But sometimes you may want to download in a different format, for example when you are on a slow or intermittent connection. The key mechanism for achieving this is so-called *format selection* based on which you can explicitly specify desired format, select formats based on some criterion or criteria, setup precedence and much more.
|
||||||
|
|
||||||
The general syntax for format selection is `--format FORMAT` or shorter `-f FORMAT` where `FORMAT` is a *selector expression*, i.e. an expression that describes format or formats you would like to download.
|
The general syntax for format selection is `--format FORMAT` or shorter `-f FORMAT` where `FORMAT` is a *selector expression*, i.e. an expression that describes format or formats you would like to download.
|
||||||
|
|
||||||
@ -605,21 +610,21 @@ The general syntax for format selection is `--format FORMAT` or shorter `-f FORM
|
|||||||
|
|
||||||
The simplest case is requesting a specific format, for example with `-f 22` you can download the format with format code equal to 22. You can get the list of available format codes for particular video using `--list-formats` or `-F`. Note that these format codes are extractor specific.
|
The simplest case is requesting a specific format, for example with `-f 22` you can download the format with format code equal to 22. You can get the list of available format codes for particular video using `--list-formats` or `-F`. Note that these format codes are extractor specific.
|
||||||
|
|
||||||
You can also use a file extension (currently `3gp`, `aac`, `flv`, `m4a`, `mp3`, `mp4`, `ogg`, `wav`, `webm` are supported) to download best quality format of particular file extension served as a single file, e.g. `-f webm` will download best quality format with `webm` extension served as a single file.
|
You can also use a file extension (currently `3gp`, `aac`, `flv`, `m4a`, `mp3`, `mp4`, `ogg`, `wav`, `webm` are supported) to download the best quality format of a particular file extension served as a single file, e.g. `-f webm` will download the best quality format with the `webm` extension served as a single file.
|
||||||
|
|
||||||
You can also use special names to select particular edge case format:
|
You can also use special names to select particular edge case formats:
|
||||||
- `best`: Select best quality format represented by single file with video and audio
|
- `best`: Select the best quality format represented by a single file with video and audio.
|
||||||
- `worst`: Select worst quality format represented by single file with video and audio
|
- `worst`: Select the worst quality format represented by a single file with video and audio.
|
||||||
- `bestvideo`: Select best quality video only format (e.g. DASH video), may not be available
|
- `bestvideo`: Select the best quality video-only format (e.g. DASH video). May not be available.
|
||||||
- `worstvideo`: Select worst quality video only format, may not be available
|
- `worstvideo`: Select the worst quality video-only format. May not be available.
|
||||||
- `bestaudio`: Select best quality audio only format, may not be available
|
- `bestaudio`: Select the best quality audio only-format. May not be available.
|
||||||
- `worstaudio`: Select worst quality audio only format, may not be available
|
- `worstaudio`: Select the worst quality audio only-format. May not be available.
|
||||||
|
|
||||||
For example, to download worst quality video only format you can use `-f worstvideo`.
|
For example, to download the worst quality video-only format you can use `-f worstvideo`.
|
||||||
|
|
||||||
If you want to download multiple videos and they don't have the same formats available, you can specify the order of preference using slashes. Note that slash is left-associative, i.e. formats on the left hand side are preferred, for example `-f 22/17/18` will download format 22 if it's available, otherwise it will download format 17 if it's available, otherwise it will download format 18 if it's available, otherwise it will complain that no suitable formats are available for download.
|
If you want to download multiple videos and they don't have the same formats available, you can specify the order of preference using slashes. Note that slash is left-associative, i.e. formats on the left hand side are preferred, for example `-f 22/17/18` will download format 22 if it's available, otherwise it will download format 17 if it's available, otherwise it will download format 18 if it's available, otherwise it will complain that no suitable formats are available for download.
|
||||||
|
|
||||||
If you want to download several formats of the same video use comma as a separator, e.g. `-f 22,17,18` will download all these three formats, of course if they are available. Or more sophisticated example combined with precedence feature `-f 136/137/mp4/bestvideo,140/m4a/bestaudio`.
|
If you want to download several formats of the same video use a comma as a separator, e.g. `-f 22,17,18` will download all these three formats, of course if they are available. Or a more sophisticated example combined with the precedence feature: `-f 136/137/mp4/bestvideo,140/m4a/bestaudio`.
|
||||||
|
|
||||||
You can also filter the video formats by putting a condition in brackets, as in `-f "best[height=720]"` (or `-f "[filesize>10M]"`).
|
You can also filter the video formats by putting a condition in brackets, as in `-f "best[height=720]"` (or `-f "[filesize>10M]"`).
|
||||||
|
|
||||||
@ -638,18 +643,18 @@ Also filtering work for comparisons `=` (equals), `!=` (not equals), `^=` (begin
|
|||||||
- `acodec`: Name of the audio codec in use
|
- `acodec`: Name of the audio codec in use
|
||||||
- `vcodec`: Name of the video codec in use
|
- `vcodec`: Name of the video codec in use
|
||||||
- `container`: Name of the container format
|
- `container`: Name of the container format
|
||||||
- `protocol`: The protocol that will be used for the actual download, lower-case. `http`, `https`, `rtsp`, `rtmp`, `rtmpe`, `m3u8`, or `m3u8_native`
|
- `protocol`: The protocol that will be used for the actual download, lower-case (`http`, `https`, `rtsp`, `rtmp`, `rtmpe`, `mms`, `f4m`, `ism`, `m3u8`, or `m3u8_native`)
|
||||||
- `format_id`: A short description of the format
|
- `format_id`: A short description of the format
|
||||||
|
|
||||||
Note that none of the aforementioned meta fields are guaranteed to be present since this solely depends on the metadata obtained by particular extractor, i.e. the metadata offered by video hoster.
|
Note that none of the aforementioned meta fields are guaranteed to be present since this solely depends on the metadata obtained by particular extractor, i.e. the metadata offered by the video hoster.
|
||||||
|
|
||||||
Formats for which the value is not known are excluded unless you put a question mark (`?`) after the operator. You can combine format filters, so `-f "[height <=? 720][tbr>500]"` selects up to 720p videos (or videos where the height is not known) with a bitrate of at least 500 KBit/s.
|
Formats for which the value is not known are excluded unless you put a question mark (`?`) after the operator. You can combine format filters, so `-f "[height <=? 720][tbr>500]"` selects up to 720p videos (or videos where the height is not known) with a bitrate of at least 500 KBit/s.
|
||||||
|
|
||||||
You can merge the video and audio of two formats into a single file using `-f <video-format>+<audio-format>` (requires ffmpeg or avconv installed), for example `-f bestvideo+bestaudio` will download best video only format, best audio only format and mux them together with ffmpeg/avconv.
|
You can merge the video and audio of two formats into a single file using `-f <video-format>+<audio-format>` (requires ffmpeg or avconv installed), for example `-f bestvideo+bestaudio` will download the best video-only format, the best audio-only format and mux them together with ffmpeg/avconv.
|
||||||
|
|
||||||
Format selectors can also be grouped using parentheses, for example if you want to download the best mp4 and webm formats with a height lower than 480 you can use `-f '(mp4,webm)[height<480]'`.
|
Format selectors can also be grouped using parentheses, for example if you want to download the best mp4 and webm formats with a height lower than 480 you can use `-f '(mp4,webm)[height<480]'`.
|
||||||
|
|
||||||
Since the end of April 2015 and version 2015.04.26 youtube-dl uses `-f bestvideo+bestaudio/best` as default format selection (see [#5447](https://github.com/rg3/youtube-dl/issues/5447), [#5456](https://github.com/rg3/youtube-dl/issues/5456)). If ffmpeg or avconv are installed this results in downloading `bestvideo` and `bestaudio` separately and muxing them together into a single file giving the best overall quality available. Otherwise it falls back to `best` and results in downloading the best available quality served as a single file. `best` is also needed for videos that don't come from YouTube because they don't provide the audio and video in two different files. If you want to only download some DASH formats (for example if you are not interested in getting videos with a resolution higher than 1080p), you can add `-f bestvideo[height<=?1080]+bestaudio/best` to your configuration file. Note that if you use youtube-dl to stream to `stdout` (and most likely to pipe it to your media player then), i.e. you explicitly specify output template as `-o -`, youtube-dl still uses `-f best` format selection in order to start content delivery immediately to your player and not to wait until `bestvideo` and `bestaudio` are downloaded and muxed.
|
Since the end of April 2015 and version 2015.04.26, youtube-dl uses `-f bestvideo+bestaudio/best` as the default format selection (see [#5447](https://github.com/rg3/youtube-dl/issues/5447), [#5456](https://github.com/rg3/youtube-dl/issues/5456)). If ffmpeg or avconv are installed this results in downloading `bestvideo` and `bestaudio` separately and muxing them together into a single file giving the best overall quality available. Otherwise it falls back to `best` and results in downloading the best available quality served as a single file. `best` is also needed for videos that don't come from YouTube because they don't provide the audio and video in two different files. If you want to only download some DASH formats (for example if you are not interested in getting videos with a resolution higher than 1080p), you can add `-f bestvideo[height<=?1080]+bestaudio/best` to your configuration file. Note that if you use youtube-dl to stream to `stdout` (and most likely to pipe it to your media player then), i.e. you explicitly specify output template as `-o -`, youtube-dl still uses `-f best` format selection in order to start content delivery immediately to your player and not to wait until `bestvideo` and `bestaudio` are downloaded and muxed.
|
||||||
|
|
||||||
If you want to preserve the old format selection behavior (prior to youtube-dl 2015.04.26), i.e. you want to download the best available quality media served as a single file, you should explicitly specify your choice with `-f best`. You may want to add it to the [configuration file](#configuration) in order not to type it every time you run youtube-dl.
|
If you want to preserve the old format selection behavior (prior to youtube-dl 2015.04.26), i.e. you want to download the best available quality media served as a single file, you should explicitly specify your choice with `-f best`. You may want to add it to the [configuration file](#configuration) in order not to type it every time you run youtube-dl.
|
||||||
|
|
||||||
@ -664,7 +669,7 @@ $ youtube-dl -f 'bestvideo[ext=mp4]+bestaudio[ext=m4a]/best[ext=mp4]/best'
|
|||||||
# Download best format available but not better that 480p
|
# Download best format available but not better that 480p
|
||||||
$ youtube-dl -f 'bestvideo[height<=480]+bestaudio/best[height<=480]'
|
$ youtube-dl -f 'bestvideo[height<=480]+bestaudio/best[height<=480]'
|
||||||
|
|
||||||
# Download best video only format but no bigger that 50 MB
|
# Download best video only format but no bigger than 50 MB
|
||||||
$ youtube-dl -f 'best[filesize<50M]'
|
$ youtube-dl -f 'best[filesize<50M]'
|
||||||
|
|
||||||
# Download best format available via direct link over HTTP/HTTPS protocol
|
# Download best format available via direct link over HTTP/HTTPS protocol
|
||||||
@ -728,7 +733,7 @@ Add a file exclusion for `youtube-dl.exe` in Windows Defender settings.
|
|||||||
|
|
||||||
YouTube changed their playlist format in March 2014 and later on, so you'll need at least youtube-dl 2014.07.25 to download all YouTube videos.
|
YouTube changed their playlist format in March 2014 and later on, so you'll need at least youtube-dl 2014.07.25 to download all YouTube videos.
|
||||||
|
|
||||||
If you have installed youtube-dl with a package manager, pip, setup.py or a tarball, please use that to update. Note that Ubuntu packages do not seem to get updated anymore. Since we are not affiliated with Ubuntu, there is little we can do. Feel free to [report bugs](https://bugs.launchpad.net/ubuntu/+source/youtube-dl/+filebug) to the [Ubuntu packaging guys](mailto:ubuntu-motu@lists.ubuntu.com?subject=outdated%20version%20of%20youtube-dl) - all they have to do is update the package to a somewhat recent version. See above for a way to update.
|
If you have installed youtube-dl with a package manager, pip, setup.py or a tarball, please use that to update. Note that Ubuntu packages do not seem to get updated anymore. Since we are not affiliated with Ubuntu, there is little we can do. Feel free to [report bugs](https://bugs.launchpad.net/ubuntu/+source/youtube-dl/+filebug) to the [Ubuntu packaging people](mailto:ubuntu-motu@lists.ubuntu.com?subject=outdated%20version%20of%20youtube-dl) - all they have to do is update the package to a somewhat recent version. See above for a way to update.
|
||||||
|
|
||||||
### I'm getting an error when trying to use output template: `error: using output template conflicts with using title, video ID or auto number`
|
### I'm getting an error when trying to use output template: `error: using output template conflicts with using title, video ID or auto number`
|
||||||
|
|
||||||
@ -758,7 +763,7 @@ Once the video is fully downloaded, use any video player, such as [mpv](https://
|
|||||||
|
|
||||||
### I extracted a video URL with `-g`, but it does not play on another machine / in my web browser.
|
### I extracted a video URL with `-g`, but it does not play on another machine / in my web browser.
|
||||||
|
|
||||||
It depends a lot on the service. In many cases, requests for the video (to download/play it) must come from the same IP address and with the same cookies. Use the `--cookies` option to write the required cookies into a file, and advise your downloader to read cookies from that file. Some sites also require a common user agent to be used, use `--dump-user-agent` to see the one in use by youtube-dl.
|
It depends a lot on the service. In many cases, requests for the video (to download/play it) must come from the same IP address and with the same cookies and/or HTTP headers. Use the `--cookies` option to write the required cookies into a file, and advise your downloader to read cookies from that file. Some sites also require a common user agent to be used, use `--dump-user-agent` to see the one in use by youtube-dl. You can also get necessary cookies and HTTP headers from JSON output obtained with `--dump-json`.
|
||||||
|
|
||||||
It may be beneficial to use IPv6; in some cases, the restrictions are only applied to IPv4. Some services (sometimes only for a subset of videos) do not restrict the video URL by IP address, cookie, or user-agent, but these are the exception rather than the rule.
|
It may be beneficial to use IPv6; in some cases, the restrictions are only applied to IPv4. Some services (sometimes only for a subset of videos) do not restrict the video URL by IP address, cookie, or user-agent, but these are the exception rather than the rule.
|
||||||
|
|
||||||
@ -840,7 +845,7 @@ Use the `--cookies` option, for example `--cookies /path/to/cookies/file.txt`.
|
|||||||
|
|
||||||
In order to extract cookies from browser use any conforming browser extension for exporting cookies. For example, [cookies.txt](https://chrome.google.com/webstore/detail/cookiestxt/njabckikapfpffapmjgojcnbfjonfjfg) (for Chrome) or [Export Cookies](https://addons.mozilla.org/en-US/firefox/addon/export-cookies/) (for Firefox).
|
In order to extract cookies from browser use any conforming browser extension for exporting cookies. For example, [cookies.txt](https://chrome.google.com/webstore/detail/cookiestxt/njabckikapfpffapmjgojcnbfjonfjfg) (for Chrome) or [Export Cookies](https://addons.mozilla.org/en-US/firefox/addon/export-cookies/) (for Firefox).
|
||||||
|
|
||||||
Note that the cookies file must be in Mozilla/Netscape format and the first line of the cookies file must be either `# HTTP Cookie File` or `# Netscape HTTP Cookie File`. Make sure you have correct [newline format](https://en.wikipedia.org/wiki/Newline) in the cookies file and convert newlines if necessary to correspond with your OS, namely `CRLF` (`\r\n`) for Windows, `LF` (`\n`) for Linux and `CR` (`\r`) for Mac OS. `HTTP Error 400: Bad Request` when using `--cookies` is a good sign of invalid newline format.
|
Note that the cookies file must be in Mozilla/Netscape format and the first line of the cookies file must be either `# HTTP Cookie File` or `# Netscape HTTP Cookie File`. Make sure you have correct [newline format](https://en.wikipedia.org/wiki/Newline) in the cookies file and convert newlines if necessary to correspond with your OS, namely `CRLF` (`\r\n`) for Windows and `LF` (`\n`) for Unix and Unix-like systems (Linux, Mac OS, etc.). `HTTP Error 400: Bad Request` when using `--cookies` is a good sign of invalid newline format.
|
||||||
|
|
||||||
Passing cookies to youtube-dl is a good way to workaround login when a particular extractor does not implement it explicitly. Another use case is working around [CAPTCHA](https://en.wikipedia.org/wiki/CAPTCHA) some websites require you to solve in particular cases in order to get access (e.g. YouTube, CloudFlare).
|
Passing cookies to youtube-dl is a good way to workaround login when a particular extractor does not implement it explicitly. Another use case is working around [CAPTCHA](https://en.wikipedia.org/wiki/CAPTCHA) some websites require you to solve in particular cases in order to get access (e.g. YouTube, CloudFlare).
|
||||||
|
|
||||||
@ -902,7 +907,7 @@ If you want to find out whether a given URL is supported, simply call youtube-dl
|
|||||||
|
|
||||||
# Why do I need to go through that much red tape when filing bugs?
|
# Why do I need to go through that much red tape when filing bugs?
|
||||||
|
|
||||||
Before we had the issue template, despite our extensive [bug reporting instructions](#bugs), about 80% of the issue reports we got were useless, for instance because people used ancient versions hundreds of releases old, because of simple syntactic errors (not in youtube-dl but in general shell usage), because the problem was alrady reported multiple times before, because people did not actually read an error message, even if it said "please install ffmpeg", because people did not mention the URL they were trying to download and many more simple, easy-to-avoid problems, many of whom were totally unrelated to youtube-dl.
|
Before we had the issue template, despite our extensive [bug reporting instructions](#bugs), about 80% of the issue reports we got were useless, for instance because people used ancient versions hundreds of releases old, because of simple syntactic errors (not in youtube-dl but in general shell usage), because the problem was already reported multiple times before, because people did not actually read an error message, even if it said "please install ffmpeg", because people did not mention the URL they were trying to download and many more simple, easy-to-avoid problems, many of whom were totally unrelated to youtube-dl.
|
||||||
|
|
||||||
youtube-dl is an open-source project manned by too few volunteers, so we'd rather spend time fixing bugs where we are certain none of those simple problems apply, and where we can be reasonably confident to be able to reproduce the issue without asking the reporter repeatedly. As such, the output of `youtube-dl -v YOUR_URL_HERE` is really all that's required to file an issue. The issue template also guides you through some basic steps you can do, such as checking that your version of youtube-dl is current.
|
youtube-dl is an open-source project manned by too few volunteers, so we'd rather spend time fixing bugs where we are certain none of those simple problems apply, and where we can be reasonably confident to be able to reproduce the issue without asking the reporter repeatedly. As such, the output of `youtube-dl -v YOUR_URL_HERE` is really all that's required to file an issue. The issue template also guides you through some basic steps you can do, such as checking that your version of youtube-dl is current.
|
||||||
|
|
||||||
@ -923,16 +928,16 @@ To run the test, simply invoke your favorite test runner, or execute a test file
|
|||||||
If you want to create a build of youtube-dl yourself, you'll need
|
If you want to create a build of youtube-dl yourself, you'll need
|
||||||
|
|
||||||
* python
|
* python
|
||||||
* make (both GNU make and BSD make are supported)
|
* make (only GNU make is supported)
|
||||||
* pandoc
|
* pandoc
|
||||||
* zip
|
* zip
|
||||||
* nosetests
|
* nosetests
|
||||||
|
|
||||||
### Adding support for a new site
|
### Adding support for a new site
|
||||||
|
|
||||||
If you want to add support for a new site, first of all **make sure** this site is **not dedicated to [copyright infringement](#can-you-add-support-for-this-anime-video-site-or-site-which-shows-current-movies-for-free)**. youtube-dl does **not support** such sites thus pull requests adding support for them **will be rejected**.
|
If you want to add support for a new site, first of all **make sure** this site is **not dedicated to [copyright infringement](README.md#can-you-add-support-for-this-anime-video-site-or-site-which-shows-current-movies-for-free)**. youtube-dl does **not support** such sites thus pull requests adding support for them **will be rejected**.
|
||||||
|
|
||||||
After you have ensured this site is distributing it's content legally, you can follow this quick list (assuming your service is called `yourextractor`):
|
After you have ensured this site is distributing its content legally, you can follow this quick list (assuming your service is called `yourextractor`):
|
||||||
|
|
||||||
1. [Fork this repository](https://github.com/rg3/youtube-dl/fork)
|
1. [Fork this repository](https://github.com/rg3/youtube-dl/fork)
|
||||||
2. Check out the source code with:
|
2. Check out the source code with:
|
||||||
@ -962,7 +967,7 @@ After you have ensured this site is distributing it's content legally, you can f
|
|||||||
'id': '42',
|
'id': '42',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Video title goes here',
|
'title': 'Video title goes here',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
# TODO more properties, either as:
|
# TODO more properties, either as:
|
||||||
# * A value
|
# * A value
|
||||||
# * MD5 checksum; start the string with md5:
|
# * MD5 checksum; start the string with md5:
|
||||||
@ -1005,19 +1010,19 @@ In any case, thank you very much for your contributions!
|
|||||||
|
|
||||||
This section introduces a guide lines for writing idiomatic, robust and future-proof extractor code.
|
This section introduces a guide lines for writing idiomatic, robust and future-proof extractor code.
|
||||||
|
|
||||||
Extractors are very fragile by nature since they depend on the layout of the source data provided by 3rd party media hoster out of your control and this layout tend to change. As an extractor implementer your task is not only to write code that will extract media links and metadata correctly but also to minimize code dependency on source's layout changes and even to make the code foresee potential future changes and be ready for that. This is important because it will allow extractor not to break on minor layout changes thus keeping old youtube-dl versions working. Even though this breakage issue is easily fixed by emitting a new version of youtube-dl with fix incorporated all the previous version become broken in all repositories and distros' packages that may not be so prompt in fetching the update from us. Needless to say some may never receive an update at all that is possible for non rolling release distros.
|
Extractors are very fragile by nature since they depend on the layout of the source data provided by 3rd party media hosters out of your control and this layout tends to change. As an extractor implementer your task is not only to write code that will extract media links and metadata correctly but also to minimize dependency on the source's layout and even to make the code foresee potential future changes and be ready for that. This is important because it will allow the extractor not to break on minor layout changes thus keeping old youtube-dl versions working. Even though this breakage issue is easily fixed by emitting a new version of youtube-dl with a fix incorporated, all the previous versions become broken in all repositories and distros' packages that may not be so prompt in fetching the update from us. Needless to say, some non rolling release distros may never receive an update at all.
|
||||||
|
|
||||||
### Mandatory and optional metafields
|
### Mandatory and optional metafields
|
||||||
|
|
||||||
For extraction to work youtube-dl relies on metadata your extractor extracts and provides to youtube-dl expressed by [information dictionary](https://github.com/rg3/youtube-dl/blob/master/youtube_dl/extractor/common.py#L75-L257) or simply *info dict*. Only the following meta fields in *info dict* are considered mandatory for successful extraction process by youtube-dl:
|
For extraction to work youtube-dl relies on metadata your extractor extracts and provides to youtube-dl expressed by an [information dictionary](https://github.com/rg3/youtube-dl/blob/master/youtube_dl/extractor/common.py#L75-L257) or simply *info dict*. Only the following meta fields in the *info dict* are considered mandatory for a successful extraction process by youtube-dl:
|
||||||
|
|
||||||
- `id` (media identifier)
|
- `id` (media identifier)
|
||||||
- `title` (media title)
|
- `title` (media title)
|
||||||
- `url` (media download URL) or `formats`
|
- `url` (media download URL) or `formats`
|
||||||
|
|
||||||
In fact only the last option is technically mandatory (i.e. if you can't figure out the download location of the media the extraction does not make any sense). But by convention youtube-dl also treats `id` and `title` to be mandatory. Thus aforementioned metafields are the critical data the extraction does not make any sense without and if any of them fail to be extracted then extractor is considered completely broken.
|
In fact only the last option is technically mandatory (i.e. if you can't figure out the download location of the media the extraction does not make any sense). But by convention youtube-dl also treats `id` and `title` as mandatory. Thus the aforementioned metafields are the critical data that the extraction does not make any sense without and if any of them fail to be extracted then the extractor is considered completely broken.
|
||||||
|
|
||||||
[Any field](https://github.com/rg3/youtube-dl/blob/master/youtube_dl/extractor/common.py#L149-L257) apart from the aforementioned ones are considered **optional**. That means that extraction should be **tolerate** to situations when sources for these fields can potentially be unavailable (even if they are always available at the moment) and **future-proof** in order not to break the extraction of general purpose mandatory fields.
|
[Any field](https://github.com/rg3/youtube-dl/blob/master/youtube_dl/extractor/common.py#L149-L257) apart from the aforementioned ones are considered **optional**. That means that extraction should be **tolerant** to situations when sources for these fields can potentially be unavailable (even if they are always available at the moment) and **future-proof** in order not to break the extraction of general purpose mandatory fields.
|
||||||
|
|
||||||
#### Example
|
#### Example
|
||||||
|
|
||||||
@ -1037,7 +1042,7 @@ Assume at this point `meta`'s layout is:
|
|||||||
}
|
}
|
||||||
```
|
```
|
||||||
|
|
||||||
Assume you want to extract `summary` and put into resulting info dict as `description`. Since `description` is optional metafield you should be ready that this key may be missing from the `meta` dict, so that you should extract it like:
|
Assume you want to extract `summary` and put it into the resulting info dict as `description`. Since `description` is an optional meta field you should be ready that this key may be missing from the `meta` dict, so that you should extract it like:
|
||||||
|
|
||||||
```python
|
```python
|
||||||
description = meta.get('summary') # correct
|
description = meta.get('summary') # correct
|
||||||
@ -1049,7 +1054,7 @@ and not like:
|
|||||||
description = meta['summary'] # incorrect
|
description = meta['summary'] # incorrect
|
||||||
```
|
```
|
||||||
|
|
||||||
The latter will break extraction process with `KeyError` if `summary` disappears from `meta` at some time later but with former approach extraction will just go ahead with `description` set to `None` that is perfectly fine (remember `None` is equivalent for absence of data).
|
The latter will break extraction process with `KeyError` if `summary` disappears from `meta` at some later time but with the former approach extraction will just go ahead with `description` set to `None` which is perfectly fine (remember `None` is equivalent to the absence of data).
|
||||||
|
|
||||||
Similarly, you should pass `fatal=False` when extracting optional data from a webpage with `_search_regex`, `_html_search_regex` or similar methods, for instance:
|
Similarly, you should pass `fatal=False` when extracting optional data from a webpage with `_search_regex`, `_html_search_regex` or similar methods, for instance:
|
||||||
|
|
||||||
@ -1069,21 +1074,21 @@ description = self._search_regex(
|
|||||||
webpage, 'description', default=None)
|
webpage, 'description', default=None)
|
||||||
```
|
```
|
||||||
|
|
||||||
On failure this code will silently continue the extraction with `description` set to `None`. That is useful for metafields that are known to may or may not be present.
|
On failure this code will silently continue the extraction with `description` set to `None`. That is useful for metafields that may or may not be present.
|
||||||
|
|
||||||
### Provide fallbacks
|
### Provide fallbacks
|
||||||
|
|
||||||
When extracting metadata try to provide several scenarios for that. For example if `title` is present in several places/sources try extracting from at least some of them. This would make it more future-proof in case some of the sources became unavailable.
|
When extracting metadata try to do so from multiple sources. For example if `title` is present in several places, try extracting from at least some of them. This makes it more future-proof in case some of the sources become unavailable.
|
||||||
|
|
||||||
#### Example
|
#### Example
|
||||||
|
|
||||||
Say `meta` from previous example has a `title` and you are about to extract it. Since `title` is mandatory meta field you should end up with something like:
|
Say `meta` from the previous example has a `title` and you are about to extract it. Since `title` is a mandatory meta field you should end up with something like:
|
||||||
|
|
||||||
```python
|
```python
|
||||||
title = meta['title']
|
title = meta['title']
|
||||||
```
|
```
|
||||||
|
|
||||||
If `title` disappeares from `meta` in future due to some changes on hoster's side the extraction would fail since `title` is mandatory. That's expected.
|
If `title` disappears from `meta` in future due to some changes on the hoster's side the extraction would fail since `title` is mandatory. That's expected.
|
||||||
|
|
||||||
Assume that you have some another source you can extract `title` from, for example `og:title` HTML meta of a `webpage`. In this case you can provide a fallback scenario:
|
Assume that you have some another source you can extract `title` from, for example `og:title` HTML meta of a `webpage`. In this case you can provide a fallback scenario:
|
||||||
|
|
||||||
@ -1120,7 +1125,7 @@ title = self._search_regex(
|
|||||||
webpage, 'title', group='title')
|
webpage, 'title', group='title')
|
||||||
```
|
```
|
||||||
|
|
||||||
Note how you tolerate potential changes in `style` attribute's value or switch from using double quotes to single for `class` attribute:
|
Note how you tolerate potential changes in the `style` attribute's value or switch from using double quotes to single for `class` attribute:
|
||||||
|
|
||||||
The code definitely should not look like:
|
The code definitely should not look like:
|
||||||
|
|
||||||
@ -1149,7 +1154,7 @@ with youtube_dl.YoutubeDL(ydl_opts) as ydl:
|
|||||||
ydl.download(['http://www.youtube.com/watch?v=BaW_jenozKc'])
|
ydl.download(['http://www.youtube.com/watch?v=BaW_jenozKc'])
|
||||||
```
|
```
|
||||||
|
|
||||||
Most likely, you'll want to use various options. For a list of options available, have a look at [`youtube_dl/YoutubeDL.py`](https://github.com/rg3/youtube-dl/blob/master/youtube_dl/YoutubeDL.py#L128-L278). For a start, if you want to intercept youtube-dl's output, set a `logger` object.
|
Most likely, you'll want to use various options. For a list of options available, have a look at [`youtube_dl/YoutubeDL.py`](https://github.com/rg3/youtube-dl/blob/master/youtube_dl/YoutubeDL.py#L129-L279). For a start, if you want to intercept youtube-dl's output, set a `logger` object.
|
||||||
|
|
||||||
Here's a more complete example of a program that outputs only errors (and a short message after the download is finished), and downloads/converts the video to an mp3 file:
|
Here's a more complete example of a program that outputs only errors (and a short message after the download is finished), and downloads/converts the video to an mp3 file:
|
||||||
|
|
||||||
@ -1190,7 +1195,7 @@ with youtube_dl.YoutubeDL(ydl_opts) as ydl:
|
|||||||
|
|
||||||
# BUGS
|
# BUGS
|
||||||
|
|
||||||
Bugs and suggestions should be reported at: <https://github.com/rg3/youtube-dl/issues>. Unless you were prompted so or there is another pertinent reason (e.g. GitHub fails to accept the bug report), please do not send bug reports via personal email. For discussions, join us in the IRC channel [#youtube-dl](irc://chat.freenode.net/#youtube-dl) on freenode ([webchat](http://webchat.freenode.net/?randomnick=1&channels=youtube-dl)).
|
Bugs and suggestions should be reported at: <https://github.com/rg3/youtube-dl/issues>. Unless you were prompted to or there is another pertinent reason (e.g. GitHub fails to accept the bug report), please do not send bug reports via personal email. For discussions, join us in the IRC channel [#youtube-dl](irc://chat.freenode.net/#youtube-dl) on freenode ([webchat](http://webchat.freenode.net/?randomnick=1&channels=youtube-dl)).
|
||||||
|
|
||||||
**Please include the full output of youtube-dl when run with `-v`**, i.e. **add** `-v` flag to **your command line**, copy the **whole** output and post it in the issue body wrapped in \`\`\` for better formatting. It should look similar to this:
|
**Please include the full output of youtube-dl when run with `-v`**, i.e. **add** `-v` flag to **your command line**, copy the **whole** output and post it in the issue body wrapped in \`\`\` for better formatting. It should look similar to this:
|
||||||
```
|
```
|
||||||
@ -1206,7 +1211,7 @@ $ youtube-dl -v <your command line>
|
|||||||
[debug] Proxy map: {}
|
[debug] Proxy map: {}
|
||||||
...
|
...
|
||||||
```
|
```
|
||||||
**Do not post screenshots of verbose log only plain text is acceptable.**
|
**Do not post screenshots of verbose logs; only plain text is acceptable.**
|
||||||
|
|
||||||
The output (including the first lines) contains important debugging information. Issues without the full output are often not reproducible and therefore do not get solved in short order, if ever.
|
The output (including the first lines) contains important debugging information. Issues without the full output are often not reproducible and therefore do not get solved in short order, if ever.
|
||||||
|
|
||||||
@ -1260,7 +1265,7 @@ Only post features that you (or an incapacitated friend you can personally talk
|
|||||||
|
|
||||||
### Is your question about youtube-dl?
|
### Is your question about youtube-dl?
|
||||||
|
|
||||||
It may sound strange, but some bug reports we receive are completely unrelated to youtube-dl and relate to a different or even the reporter's own application. Please make sure that you are actually using youtube-dl. If you are using a UI for youtube-dl, report the bug to the maintainer of the actual application providing the UI. On the other hand, if your UI for youtube-dl fails in some way you believe is related to youtube-dl, by all means, go ahead and report the bug.
|
It may sound strange, but some bug reports we receive are completely unrelated to youtube-dl and relate to a different, or even the reporter's own, application. Please make sure that you are actually using youtube-dl. If you are using a UI for youtube-dl, report the bug to the maintainer of the actual application providing the UI. On the other hand, if your UI for youtube-dl fails in some way you believe is related to youtube-dl, by all means, go ahead and report the bug.
|
||||||
|
|
||||||
# COPYRIGHT
|
# COPYRIGHT
|
||||||
|
|
||||||
|
@ -25,5 +25,6 @@ def build_completion(opt_parser):
|
|||||||
filled_template = template.replace("{{flags}}", " ".join(opts_flag))
|
filled_template = template.replace("{{flags}}", " ".join(opts_flag))
|
||||||
f.write(filled_template)
|
f.write(filled_template)
|
||||||
|
|
||||||
|
|
||||||
parser = youtube_dl.parseOpts()[0]
|
parser = youtube_dl.parseOpts()[0]
|
||||||
build_completion(parser)
|
build_completion(parser)
|
||||||
|
@ -424,8 +424,6 @@ class BuildHTTPRequestHandler(compat_http_server.BaseHTTPRequestHandler):
|
|||||||
self.send_header('Content-Length', len(msg))
|
self.send_header('Content-Length', len(msg))
|
||||||
self.end_headers()
|
self.end_headers()
|
||||||
self.wfile.write(msg)
|
self.wfile.write(msg)
|
||||||
except HTTPError as e:
|
|
||||||
self.send_response(e.code, str(e))
|
|
||||||
else:
|
else:
|
||||||
self.send_response(500, 'Unknown build method "%s"' % action)
|
self.send_response(500, 'Unknown build method "%s"' % action)
|
||||||
else:
|
else:
|
||||||
|
@ -2,11 +2,13 @@
|
|||||||
from __future__ import unicode_literals
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
import base64
|
import base64
|
||||||
|
import io
|
||||||
import json
|
import json
|
||||||
import mimetypes
|
import mimetypes
|
||||||
import netrc
|
import netrc
|
||||||
import optparse
|
import optparse
|
||||||
import os
|
import os
|
||||||
|
import re
|
||||||
import sys
|
import sys
|
||||||
|
|
||||||
sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
|
sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
|
||||||
@ -90,16 +92,23 @@ class GitHubReleaser(object):
|
|||||||
|
|
||||||
|
|
||||||
def main():
|
def main():
|
||||||
parser = optparse.OptionParser(usage='%prog VERSION BUILDPATH')
|
parser = optparse.OptionParser(usage='%prog CHANGELOG VERSION BUILDPATH')
|
||||||
options, args = parser.parse_args()
|
options, args = parser.parse_args()
|
||||||
if len(args) != 2:
|
if len(args) != 3:
|
||||||
parser.error('Expected a version and a build directory')
|
parser.error('Expected a version and a build directory')
|
||||||
|
|
||||||
version, build_path = args
|
changelog_file, version, build_path = args
|
||||||
|
|
||||||
|
with io.open(changelog_file, encoding='utf-8') as inf:
|
||||||
|
changelog = inf.read()
|
||||||
|
|
||||||
|
mobj = re.search(r'(?s)version %s\n{2}(.+?)\n{3}' % version, changelog)
|
||||||
|
body = mobj.group(1) if mobj else ''
|
||||||
|
|
||||||
releaser = GitHubReleaser()
|
releaser = GitHubReleaser()
|
||||||
|
|
||||||
new_release = releaser.create_release(version, name='youtube-dl %s' % version)
|
new_release = releaser.create_release(
|
||||||
|
version, name='youtube-dl %s' % version, body=body)
|
||||||
release_id = new_release['id']
|
release_id = new_release['id']
|
||||||
|
|
||||||
for asset in os.listdir(build_path):
|
for asset in os.listdir(build_path):
|
||||||
|
@ -44,5 +44,6 @@ def build_completion(opt_parser):
|
|||||||
with open(FISH_COMPLETION_FILE, 'w') as f:
|
with open(FISH_COMPLETION_FILE, 'w') as f:
|
||||||
f.write(filled_template)
|
f.write(filled_template)
|
||||||
|
|
||||||
|
|
||||||
parser = youtube_dl.parseOpts()[0]
|
parser = youtube_dl.parseOpts()[0]
|
||||||
build_completion(parser)
|
build_completion(parser)
|
||||||
|
@ -23,6 +23,7 @@ def openssl_encode(algo, key, iv):
|
|||||||
out, _ = prog.communicate(secret_msg)
|
out, _ = prog.communicate(secret_msg)
|
||||||
return out
|
return out
|
||||||
|
|
||||||
|
|
||||||
iv = key = [0x20, 0x15] + 14 * [0]
|
iv = key = [0x20, 0x15] + 14 * [0]
|
||||||
|
|
||||||
r = openssl_encode('aes-128-cbc', key, iv)
|
r = openssl_encode('aes-128-cbc', key, iv)
|
||||||
|
@ -32,5 +32,6 @@ def main():
|
|||||||
with open('supportedsites.html', 'w', encoding='utf-8') as sitesf:
|
with open('supportedsites.html', 'w', encoding='utf-8') as sitesf:
|
||||||
sitesf.write(template)
|
sitesf.write(template)
|
||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
main()
|
main()
|
||||||
|
@ -28,5 +28,6 @@ def main():
|
|||||||
with io.open(outfile, 'w', encoding='utf-8') as outf:
|
with io.open(outfile, 'w', encoding='utf-8') as outf:
|
||||||
outf.write(out)
|
outf.write(out)
|
||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
main()
|
main()
|
||||||
|
@ -1,6 +1,7 @@
|
|||||||
from __future__ import unicode_literals, print_function
|
from __future__ import unicode_literals, print_function
|
||||||
|
|
||||||
from inspect import getsource
|
from inspect import getsource
|
||||||
|
import io
|
||||||
import os
|
import os
|
||||||
from os.path import dirname as dirn
|
from os.path import dirname as dirn
|
||||||
import sys
|
import sys
|
||||||
@ -59,6 +60,7 @@ def build_lazy_ie(ie, name):
|
|||||||
s += make_valid_template.format(valid_url=ie._make_valid_url())
|
s += make_valid_template.format(valid_url=ie._make_valid_url())
|
||||||
return s
|
return s
|
||||||
|
|
||||||
|
|
||||||
# find the correct sorting and add the required base classes so that sublcasses
|
# find the correct sorting and add the required base classes so that sublcasses
|
||||||
# can be correctly created
|
# can be correctly created
|
||||||
classes = _ALL_CLASSES[:-1]
|
classes = _ALL_CLASSES[:-1]
|
||||||
@ -94,5 +96,5 @@ module_contents.append(
|
|||||||
|
|
||||||
module_src = '\n'.join(module_contents) + '\n'
|
module_src = '\n'.join(module_contents) + '\n'
|
||||||
|
|
||||||
with open(lazy_extractors_filename, 'wt') as f:
|
with io.open(lazy_extractors_filename, 'wt', encoding='utf-8') as f:
|
||||||
f.write(module_src)
|
f.write(module_src)
|
||||||
|
@ -41,5 +41,6 @@ def main():
|
|||||||
with io.open(outfile, 'w', encoding='utf-8') as outf:
|
with io.open(outfile, 'w', encoding='utf-8') as outf:
|
||||||
outf.write(out)
|
outf.write(out)
|
||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
main()
|
main()
|
||||||
|
@ -74,5 +74,6 @@ def filter_options(readme):
|
|||||||
|
|
||||||
return ret
|
return ret
|
||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
main()
|
main()
|
||||||
|
@ -110,7 +110,7 @@ RELEASE_FILES="youtube-dl youtube-dl.exe youtube-dl-$version.tar.gz"
|
|||||||
for f in $RELEASE_FILES; do gpg --passphrase-repeat 5 --detach-sig "build/$version/$f"; done
|
for f in $RELEASE_FILES; do gpg --passphrase-repeat 5 --detach-sig "build/$version/$f"; done
|
||||||
|
|
||||||
ROOT=$(pwd)
|
ROOT=$(pwd)
|
||||||
python devscripts/create-github-release.py $version "$ROOT/build/$version"
|
python devscripts/create-github-release.py ChangeLog $version "$ROOT/build/$version"
|
||||||
|
|
||||||
ssh ytdl@yt-dl.org "sh html/update_latest.sh $version"
|
ssh ytdl@yt-dl.org "sh html/update_latest.sh $version"
|
||||||
|
|
||||||
|
21
devscripts/run_tests.sh
Executable file
21
devscripts/run_tests.sh
Executable file
@ -0,0 +1,21 @@
|
|||||||
|
#!/bin/bash
|
||||||
|
|
||||||
|
DOWNLOAD_TESTS="age_restriction|download|subtitles|write_annotations|iqiyi_sdk_interpreter|youtube_lists"
|
||||||
|
|
||||||
|
test_set=""
|
||||||
|
multiprocess_args=""
|
||||||
|
|
||||||
|
case "$YTDL_TEST_SET" in
|
||||||
|
core)
|
||||||
|
test_set="-I test_($DOWNLOAD_TESTS)\.py"
|
||||||
|
;;
|
||||||
|
download)
|
||||||
|
test_set="-I test_(?!$DOWNLOAD_TESTS).+\.py"
|
||||||
|
multiprocess_args="--processes=4 --process-timeout=540"
|
||||||
|
;;
|
||||||
|
*)
|
||||||
|
break
|
||||||
|
;;
|
||||||
|
esac
|
||||||
|
|
||||||
|
nosetests test --verbose $test_set $multiprocess_args
|
@ -44,5 +44,6 @@ def build_completion(opt_parser):
|
|||||||
with open(ZSH_COMPLETION_FILE, "w") as f:
|
with open(ZSH_COMPLETION_FILE, "w") as f:
|
||||||
f.write(template)
|
f.write(template)
|
||||||
|
|
||||||
|
|
||||||
parser = youtube_dl.parseOpts()[0]
|
parser = youtube_dl.parseOpts()[0]
|
||||||
build_completion(parser)
|
build_completion(parser)
|
||||||
|
@ -11,6 +11,7 @@
|
|||||||
- **4tube**
|
- **4tube**
|
||||||
- **56.com**
|
- **56.com**
|
||||||
- **5min**
|
- **5min**
|
||||||
|
- **6play**
|
||||||
- **8tracks**
|
- **8tracks**
|
||||||
- **91porn**
|
- **91porn**
|
||||||
- **9c9media**
|
- **9c9media**
|
||||||
@ -33,7 +34,8 @@
|
|||||||
- **AdobeTVVideo**
|
- **AdobeTVVideo**
|
||||||
- **AdultSwim**
|
- **AdultSwim**
|
||||||
- **aenetworks**: A+E Networks: A&E, Lifetime, History.com, FYI Network
|
- **aenetworks**: A+E Networks: A&E, Lifetime, History.com, FYI Network
|
||||||
- **AfreecaTV**: afreecatv.com
|
- **afreecatv**: afreecatv.com
|
||||||
|
- **afreecatv:global**: afreecatv.com
|
||||||
- **AirMozilla**
|
- **AirMozilla**
|
||||||
- **AlJazeera**
|
- **AlJazeera**
|
||||||
- **Allocine**
|
- **Allocine**
|
||||||
@ -74,6 +76,9 @@
|
|||||||
- **awaan:live**
|
- **awaan:live**
|
||||||
- **awaan:season**
|
- **awaan:season**
|
||||||
- **awaan:video**
|
- **awaan:video**
|
||||||
|
- **AZMedien**: AZ Medien videos
|
||||||
|
- **AZMedienPlaylist**: AZ Medien playlists
|
||||||
|
- **AZMedienShowPlaylist**: AZ Medien show playlists
|
||||||
- **Azubu**
|
- **Azubu**
|
||||||
- **AzubuLive**
|
- **AzubuLive**
|
||||||
- **BaiduVideo**: 百度视频
|
- **BaiduVideo**: 百度视频
|
||||||
@ -81,12 +86,14 @@
|
|||||||
- **bambuser:channel**
|
- **bambuser:channel**
|
||||||
- **Bandcamp**
|
- **Bandcamp**
|
||||||
- **Bandcamp:album**
|
- **Bandcamp:album**
|
||||||
|
- **bangumi.bilibili.com**: BiliBili番剧
|
||||||
- **bbc**: BBC
|
- **bbc**: BBC
|
||||||
- **bbc.co.uk**: BBC iPlayer
|
- **bbc.co.uk**: BBC iPlayer
|
||||||
- **bbc.co.uk:article**: BBC articles
|
- **bbc.co.uk:article**: BBC articles
|
||||||
- **bbc.co.uk:iplayer:playlist**
|
- **bbc.co.uk:iplayer:playlist**
|
||||||
- **bbc.co.uk:playlist**
|
- **bbc.co.uk:playlist**
|
||||||
- **BeatportPro**
|
- **Beam:live**
|
||||||
|
- **Beatport**
|
||||||
- **Beeg**
|
- **Beeg**
|
||||||
- **BehindKink**
|
- **BehindKink**
|
||||||
- **BellMedia**
|
- **BellMedia**
|
||||||
@ -131,7 +138,8 @@
|
|||||||
- **cbsnews**: CBS News
|
- **cbsnews**: CBS News
|
||||||
- **cbsnews:livevideo**: CBS News Live Videos
|
- **cbsnews:livevideo**: CBS News Live Videos
|
||||||
- **CBSSports**
|
- **CBSSports**
|
||||||
- **CCTV**
|
- **CCMA**
|
||||||
|
- **CCTV**: 央视网
|
||||||
- **CDA**
|
- **CDA**
|
||||||
- **CeskaTelevize**
|
- **CeskaTelevize**
|
||||||
- **channel9**: Channel 9
|
- **channel9**: Channel 9
|
||||||
@ -158,9 +166,11 @@
|
|||||||
- **CollegeRama**
|
- **CollegeRama**
|
||||||
- **ComCarCoff**
|
- **ComCarCoff**
|
||||||
- **ComedyCentral**
|
- **ComedyCentral**
|
||||||
|
- **ComedyCentralFullEpisodes**
|
||||||
- **ComedyCentralShortname**
|
- **ComedyCentralShortname**
|
||||||
- **ComedyCentralTV**
|
- **ComedyCentralTV**
|
||||||
- **CondeNast**: Condé Nast media group: Allure, Architectural Digest, Ars Technica, Bon Appétit, Brides, Condé Nast, Condé Nast Traveler, Details, Epicurious, GQ, Glamour, Golf Digest, SELF, Teen Vogue, The New Yorker, Vanity Fair, Vogue, W Magazine, WIRED
|
- **CondeNast**: Condé Nast media group: Allure, Architectural Digest, Ars Technica, Bon Appétit, Brides, Condé Nast, Condé Nast Traveler, Details, Epicurious, GQ, Glamour, Golf Digest, SELF, Teen Vogue, The New Yorker, Vanity Fair, Vogue, W Magazine, WIRED
|
||||||
|
- **Corus**
|
||||||
- **Coub**
|
- **Coub**
|
||||||
- **Cracked**
|
- **Cracked**
|
||||||
- **Crackle**
|
- **Crackle**
|
||||||
@ -182,6 +192,8 @@
|
|||||||
- **dailymotion:playlist**
|
- **dailymotion:playlist**
|
||||||
- **dailymotion:user**
|
- **dailymotion:user**
|
||||||
- **DailymotionCloud**
|
- **DailymotionCloud**
|
||||||
|
- **Daisuki**
|
||||||
|
- **DaisukiPlaylist**
|
||||||
- **daum.net**
|
- **daum.net**
|
||||||
- **daum.net:clip**
|
- **daum.net:clip**
|
||||||
- **daum.net:playlist**
|
- **daum.net:playlist**
|
||||||
@ -196,6 +208,7 @@
|
|||||||
- **Digiteka**
|
- **Digiteka**
|
||||||
- **Discovery**
|
- **Discovery**
|
||||||
- **DiscoveryGo**
|
- **DiscoveryGo**
|
||||||
|
- **Disney**
|
||||||
- **Dotsub**
|
- **Dotsub**
|
||||||
- **DouyuTV**: 斗鱼
|
- **DouyuTV**: 斗鱼
|
||||||
- **DPlay**
|
- **DPlay**
|
||||||
@ -204,7 +217,8 @@
|
|||||||
- **DRBonanza**
|
- **DRBonanza**
|
||||||
- **Dropbox**
|
- **Dropbox**
|
||||||
- **DrTuber**
|
- **DrTuber**
|
||||||
- **DRTV**
|
- **drtv**
|
||||||
|
- **drtv:live**
|
||||||
- **Dumpert**
|
- **Dumpert**
|
||||||
- **dvtv**: http://video.aktualne.cz/
|
- **dvtv**: http://video.aktualne.cz/
|
||||||
- **dw**
|
- **dw**
|
||||||
@ -212,6 +226,7 @@
|
|||||||
- **EaglePlatform**
|
- **EaglePlatform**
|
||||||
- **EbaumsWorld**
|
- **EbaumsWorld**
|
||||||
- **EchoMsk**
|
- **EchoMsk**
|
||||||
|
- **egghead:course**: egghead.io course
|
||||||
- **eHow**
|
- **eHow**
|
||||||
- **Einthusan**
|
- **Einthusan**
|
||||||
- **eitb.tv**
|
- **eitb.tv**
|
||||||
@ -225,7 +240,9 @@
|
|||||||
- **EroProfile**
|
- **EroProfile**
|
||||||
- **Escapist**
|
- **Escapist**
|
||||||
- **ESPN**
|
- **ESPN**
|
||||||
|
- **ESPNArticle**
|
||||||
- **EsriVideo**
|
- **EsriVideo**
|
||||||
|
- **ETOnline**
|
||||||
- **Europa**
|
- **Europa**
|
||||||
- **EveryonesMixtape**
|
- **EveryonesMixtape**
|
||||||
- **ExpoTV**
|
- **ExpoTV**
|
||||||
@ -237,8 +254,9 @@
|
|||||||
- **fc2**
|
- **fc2**
|
||||||
- **fc2:embed**
|
- **fc2:embed**
|
||||||
- **Fczenit**
|
- **Fczenit**
|
||||||
- **features.aol.com**
|
|
||||||
- **fernsehkritik.tv**
|
- **fernsehkritik.tv**
|
||||||
|
- **filmon**
|
||||||
|
- **filmon:channel**
|
||||||
- **Firstpost**
|
- **Firstpost**
|
||||||
- **FiveTV**
|
- **FiveTV**
|
||||||
- **Flickr**
|
- **Flickr**
|
||||||
@ -247,6 +265,7 @@
|
|||||||
- **FootyRoom**
|
- **FootyRoom**
|
||||||
- **Formula1**
|
- **Formula1**
|
||||||
- **FOX**
|
- **FOX**
|
||||||
|
- **FOX9**
|
||||||
- **Foxgay**
|
- **Foxgay**
|
||||||
- **foxnews**: Fox News and Fox Business Video
|
- **foxnews**: Fox News and Fox Business Video
|
||||||
- **foxnews:article**
|
- **foxnews:article**
|
||||||
@ -259,7 +278,7 @@
|
|||||||
- **francetvinfo.fr**
|
- **francetvinfo.fr**
|
||||||
- **Freesound**
|
- **Freesound**
|
||||||
- **freespeech.org**
|
- **freespeech.org**
|
||||||
- **FreeVideo**
|
- **FreshLive**
|
||||||
- **Funimation**
|
- **Funimation**
|
||||||
- **FunnyOrDie**
|
- **FunnyOrDie**
|
||||||
- **Fusion**
|
- **Fusion**
|
||||||
@ -270,6 +289,7 @@
|
|||||||
- **Gamersyde**
|
- **Gamersyde**
|
||||||
- **GameSpot**
|
- **GameSpot**
|
||||||
- **GameStar**
|
- **GameStar**
|
||||||
|
- **Gaskrank**
|
||||||
- **Gazeta**
|
- **Gazeta**
|
||||||
- **GDCVault**
|
- **GDCVault**
|
||||||
- **generic**: Generic downloader that works on some sites
|
- **generic**: Generic downloader that works on some sites
|
||||||
@ -289,17 +309,19 @@
|
|||||||
- **Groupon**
|
- **Groupon**
|
||||||
- **Hark**
|
- **Hark**
|
||||||
- **HBO**
|
- **HBO**
|
||||||
|
- **HBOEpisode**
|
||||||
- **HearThisAt**
|
- **HearThisAt**
|
||||||
- **Heise**
|
- **Heise**
|
||||||
- **HellPorno**
|
- **HellPorno**
|
||||||
- **Helsinki**: helsinki.fi
|
- **Helsinki**: helsinki.fi
|
||||||
- **HentaiStigma**
|
- **HentaiStigma**
|
||||||
- **HGTV**
|
- **hetklokhuis**
|
||||||
- **hgtv.com:show**
|
- **hgtv.com:show**
|
||||||
- **HistoricFilms**
|
- **HistoricFilms**
|
||||||
- **history:topic**: History.com Topic
|
- **history:topic**: History.com Topic
|
||||||
- **hitbox**
|
- **hitbox**
|
||||||
- **hitbox:live**
|
- **hitbox:live**
|
||||||
|
- **HitRecord**
|
||||||
- **HornBunny**
|
- **HornBunny**
|
||||||
- **HotNewHipHop**
|
- **HotNewHipHop**
|
||||||
- **HotStar**
|
- **HotStar**
|
||||||
@ -307,6 +329,7 @@
|
|||||||
- **HowStuffWorks**
|
- **HowStuffWorks**
|
||||||
- **HRTi**
|
- **HRTi**
|
||||||
- **HRTiPlaylist**
|
- **HRTiPlaylist**
|
||||||
|
- **Huajiao**: 花椒直播
|
||||||
- **HuffPost**: Huffington Post
|
- **HuffPost**: Huffington Post
|
||||||
- **Hypem**
|
- **Hypem**
|
||||||
- **Iconosquare**
|
- **Iconosquare**
|
||||||
@ -316,6 +339,7 @@
|
|||||||
- **Imgur**
|
- **Imgur**
|
||||||
- **ImgurAlbum**
|
- **ImgurAlbum**
|
||||||
- **Ina**
|
- **Ina**
|
||||||
|
- **Inc**
|
||||||
- **Indavideo**
|
- **Indavideo**
|
||||||
- **IndavideoEmbed**
|
- **IndavideoEmbed**
|
||||||
- **InfoQ**
|
- **InfoQ**
|
||||||
@ -325,11 +349,14 @@
|
|||||||
- **IPrima**
|
- **IPrima**
|
||||||
- **iqiyi**: 爱奇艺
|
- **iqiyi**: 爱奇艺
|
||||||
- **Ir90Tv**
|
- **Ir90Tv**
|
||||||
|
- **ITV**
|
||||||
- **ivi**: ivi.ru
|
- **ivi**: ivi.ru
|
||||||
- **ivi:compilation**: ivi.ru compilations
|
- **ivi:compilation**: ivi.ru compilations
|
||||||
- **ivideon**: Ivideon TV
|
- **ivideon**: Ivideon TV
|
||||||
- **Iwara**
|
- **Iwara**
|
||||||
- **Izlesene**
|
- **Izlesene**
|
||||||
|
- **Jamendo**
|
||||||
|
- **JamendoAlbum**
|
||||||
- **JeuxVideo**
|
- **JeuxVideo**
|
||||||
- **Jove**
|
- **Jove**
|
||||||
- **jpopsuki.tv**
|
- **jpopsuki.tv**
|
||||||
@ -357,13 +384,15 @@
|
|||||||
- **kuwo:singer**: 酷我音乐 - 歌手
|
- **kuwo:singer**: 酷我音乐 - 歌手
|
||||||
- **kuwo:song**: 酷我音乐
|
- **kuwo:song**: 酷我音乐
|
||||||
- **la7.it**
|
- **la7.it**
|
||||||
- **Laola1Tv**
|
- **laola1tv**
|
||||||
|
- **laola1tv:embed**
|
||||||
- **LCI**
|
- **LCI**
|
||||||
- **Lcp**
|
- **Lcp**
|
||||||
- **LcpPlay**
|
- **LcpPlay**
|
||||||
- **Le**: 乐视网
|
- **Le**: 乐视网
|
||||||
- **Learnr**
|
- **Learnr**
|
||||||
- **Lecture2Go**
|
- **Lecture2Go**
|
||||||
|
- **LEGO**
|
||||||
- **Lemonde**
|
- **Lemonde**
|
||||||
- **LePlaylist**
|
- **LePlaylist**
|
||||||
- **LetvCloud**: 乐视云
|
- **LetvCloud**: 乐视云
|
||||||
@ -394,6 +423,8 @@
|
|||||||
- **MatchTV**
|
- **MatchTV**
|
||||||
- **MDR**: MDR.DE and KiKA
|
- **MDR**: MDR.DE and KiKA
|
||||||
- **media.ccc.de**
|
- **media.ccc.de**
|
||||||
|
- **Meipai**: 美拍
|
||||||
|
- **MelonVOD**
|
||||||
- **META**
|
- **META**
|
||||||
- **metacafe**
|
- **metacafe**
|
||||||
- **Metacritic**
|
- **Metacritic**
|
||||||
@ -427,6 +458,7 @@
|
|||||||
- **mtg**: MTG services
|
- **mtg**: MTG services
|
||||||
- **mtv**
|
- **mtv**
|
||||||
- **mtv.de**
|
- **mtv.de**
|
||||||
|
- **mtv81**
|
||||||
- **mtv:video**
|
- **mtv:video**
|
||||||
- **mtvservices:embedded**
|
- **mtvservices:embedded**
|
||||||
- **MuenchenTV**: münchen.tv
|
- **MuenchenTV**: münchen.tv
|
||||||
@ -469,6 +501,7 @@
|
|||||||
- **Newstube**
|
- **Newstube**
|
||||||
- **NextMedia**: 蘋果日報
|
- **NextMedia**: 蘋果日報
|
||||||
- **NextMediaActionNews**: 蘋果日報 - 動新聞
|
- **NextMediaActionNews**: 蘋果日報 - 動新聞
|
||||||
|
- **NextTV**: 壹電視
|
||||||
- **nfb**: National Film Board of Canada
|
- **nfb**: National Film Board of Canada
|
||||||
- **nfl.com**
|
- **nfl.com**
|
||||||
- **NhkVod**
|
- **NhkVod**
|
||||||
@ -478,11 +511,14 @@
|
|||||||
- **nhl.com:videocenter:category**: NHL videocenter category
|
- **nhl.com:videocenter:category**: NHL videocenter category
|
||||||
- **nick.com**
|
- **nick.com**
|
||||||
- **nick.de**
|
- **nick.de**
|
||||||
|
- **nicknight**
|
||||||
- **niconico**: ニコニコ動画
|
- **niconico**: ニコニコ動画
|
||||||
- **NiconicoPlaylist**
|
- **NiconicoPlaylist**
|
||||||
- **Nintendo**
|
- **Nintendo**
|
||||||
- **njoy**: N-JOY
|
- **njoy**: N-JOY
|
||||||
- **njoy:embed**
|
- **njoy:embed**
|
||||||
|
- **NJPWWorld**: 新日本プロレスワールド
|
||||||
|
- **NobelPrize**
|
||||||
- **Noco**
|
- **Noco**
|
||||||
- **Normalboots**
|
- **Normalboots**
|
||||||
- **NosVideo**
|
- **NosVideo**
|
||||||
@ -503,17 +539,24 @@
|
|||||||
- **NRKPlaylist**
|
- **NRKPlaylist**
|
||||||
- **NRKSkole**: NRK Skole
|
- **NRKSkole**: NRK Skole
|
||||||
- **NRKTV**: NRK TV and NRK Radio
|
- **NRKTV**: NRK TV and NRK Radio
|
||||||
|
- **NRKTVDirekte**: NRK TV Direkte and NRK Radio Direkte
|
||||||
|
- **NRKTVEpisodes**
|
||||||
|
- **NRKTVSeries**
|
||||||
- **ntv.ru**
|
- **ntv.ru**
|
||||||
- **Nuvid**
|
- **Nuvid**
|
||||||
- **NYTimes**
|
- **NYTimes**
|
||||||
- **NYTimesArticle**
|
- **NYTimesArticle**
|
||||||
|
- **NZZ**
|
||||||
- **ocw.mit.edu**
|
- **ocw.mit.edu**
|
||||||
- **OdaTV**
|
- **OdaTV**
|
||||||
- **Odnoklassniki**
|
- **Odnoklassniki**
|
||||||
- **OktoberfestTV**
|
- **OktoberfestTV**
|
||||||
- **on.aol.com**
|
- **on.aol.com**
|
||||||
|
- **OnDemandKorea**
|
||||||
|
- **onet.pl**
|
||||||
- **onet.tv**
|
- **onet.tv**
|
||||||
- **onet.tv:channel**
|
- **onet.tv:channel**
|
||||||
|
- **OnetMVP**
|
||||||
- **OnionStudios**
|
- **OnionStudios**
|
||||||
- **Ooyala**
|
- **Ooyala**
|
||||||
- **OoyalaExternal**
|
- **OoyalaExternal**
|
||||||
@ -523,6 +566,7 @@
|
|||||||
- **orf:iptv**: iptv.ORF.at
|
- **orf:iptv**: iptv.ORF.at
|
||||||
- **orf:oe1**: Radio Österreich 1
|
- **orf:oe1**: Radio Österreich 1
|
||||||
- **orf:tvthek**: ORF TVthek
|
- **orf:tvthek**: ORF TVthek
|
||||||
|
- **PandaTV**: 熊猫TV
|
||||||
- **pandora.tv**: 판도라TV
|
- **pandora.tv**: 판도라TV
|
||||||
- **parliamentlive.tv**: UK parliament videos
|
- **parliamentlive.tv**: UK parliament videos
|
||||||
- **Patreon**
|
- **Patreon**
|
||||||
@ -534,6 +578,7 @@
|
|||||||
- **PhilharmonieDeParis**: Philharmonie de Paris
|
- **PhilharmonieDeParis**: Philharmonie de Paris
|
||||||
- **phoenix.de**
|
- **phoenix.de**
|
||||||
- **Photobucket**
|
- **Photobucket**
|
||||||
|
- **Piksel**
|
||||||
- **Pinkbike**
|
- **Pinkbike**
|
||||||
- **Pladform**
|
- **Pladform**
|
||||||
- **play.fm**
|
- **play.fm**
|
||||||
@ -550,6 +595,7 @@
|
|||||||
- **PolskieRadio**
|
- **PolskieRadio**
|
||||||
- **PolskieRadioCategory**
|
- **PolskieRadioCategory**
|
||||||
- **PornCom**
|
- **PornCom**
|
||||||
|
- **PornFlip**
|
||||||
- **PornHd**
|
- **PornHd**
|
||||||
- **PornHub**: PornHub and Thumbzilla
|
- **PornHub**: PornHub and Thumbzilla
|
||||||
- **PornHubPlaylist**
|
- **PornHubPlaylist**
|
||||||
@ -580,8 +626,11 @@
|
|||||||
- **RaiTV**
|
- **RaiTV**
|
||||||
- **RBMARadio**
|
- **RBMARadio**
|
||||||
- **RDS**: RDS.ca
|
- **RDS**: RDS.ca
|
||||||
|
- **RedBullTV**
|
||||||
- **RedTube**
|
- **RedTube**
|
||||||
- **RegioTV**
|
- **RegioTV**
|
||||||
|
- **RENTV**
|
||||||
|
- **RENTVArticle**
|
||||||
- **Restudy**
|
- **Restudy**
|
||||||
- **Reuters**
|
- **Reuters**
|
||||||
- **ReverbNation**
|
- **ReverbNation**
|
||||||
@ -625,22 +674,20 @@
|
|||||||
- **savefrom.net**
|
- **savefrom.net**
|
||||||
- **SBS**: sbs.com.au
|
- **SBS**: sbs.com.au
|
||||||
- **schooltv**
|
- **schooltv**
|
||||||
- **SciVee**
|
|
||||||
- **screen.yahoo:search**: Yahoo screen search
|
- **screen.yahoo:search**: Yahoo screen search
|
||||||
- **Screencast**
|
- **Screencast**
|
||||||
- **ScreencastOMatic**
|
- **ScreencastOMatic**
|
||||||
- **ScreenJunkies**
|
- **scrippsnetworks:watch**
|
||||||
- **ScreenwaveMedia**
|
|
||||||
- **Seeker**
|
- **Seeker**
|
||||||
- **SenateISVP**
|
- **SenateISVP**
|
||||||
- **SendtoNews**
|
- **SendtoNews**
|
||||||
- **ServingSys**
|
- **ServingSys**
|
||||||
- **Sexu**
|
- **Sexu**
|
||||||
- **Shahid**
|
- **Shahid**
|
||||||
- **Shared**: shared.sx and vivo.sx
|
- **Shared**: shared.sx
|
||||||
- **ShareSix**
|
- **ShowRoomLive**
|
||||||
- **Sina**
|
- **Sina**
|
||||||
- **SixPlay**
|
- **SkylineWebcams**
|
||||||
- **skynewsarabia:article**
|
- **skynewsarabia:article**
|
||||||
- **skynewsarabia:video**
|
- **skynewsarabia:video**
|
||||||
- **SkySports**
|
- **SkySports**
|
||||||
@ -672,10 +719,10 @@
|
|||||||
- **Spiegeltv**
|
- **Spiegeltv**
|
||||||
- **Spike**
|
- **Spike**
|
||||||
- **Sport5**
|
- **Sport5**
|
||||||
- **SportBox**
|
|
||||||
- **SportBoxEmbed**
|
- **SportBoxEmbed**
|
||||||
- **SportDeutschland**
|
- **SportDeutschland**
|
||||||
- **Sportschau**
|
- **Sportschau**
|
||||||
|
- **Sprout**
|
||||||
- **sr:mediathek**: Saarländischer Rundfunk
|
- **sr:mediathek**: Saarländischer Rundfunk
|
||||||
- **SRGSSR**
|
- **SRGSSR**
|
||||||
- **SRGSSRPlay**: srf.ch, rts.ch, rsi.ch, rtr.ch and swissinfo.ch play sites
|
- **SRGSSRPlay**: srf.ch, rts.ch, rsi.ch, rtr.ch and swissinfo.ch play sites
|
||||||
@ -692,6 +739,7 @@
|
|||||||
- **SWRMediathek**
|
- **SWRMediathek**
|
||||||
- **Syfy**
|
- **Syfy**
|
||||||
- **SztvHu**
|
- **SztvHu**
|
||||||
|
- **t-online.de**
|
||||||
- **Tagesschau**
|
- **Tagesschau**
|
||||||
- **tagesschau:player**
|
- **tagesschau:player**
|
||||||
- **Tass**
|
- **Tass**
|
||||||
@ -701,7 +749,7 @@
|
|||||||
- **teachertube:user:collection**: teachertube.com user and collection videos
|
- **teachertube:user:collection**: teachertube.com user and collection videos
|
||||||
- **TeachingChannel**
|
- **TeachingChannel**
|
||||||
- **Teamcoco**
|
- **Teamcoco**
|
||||||
- **TeamFour**
|
- **TeamFourStar**
|
||||||
- **TechTalks**
|
- **TechTalks**
|
||||||
- **techtv.mit.edu**
|
- **techtv.mit.edu**
|
||||||
- **ted**
|
- **ted**
|
||||||
@ -716,13 +764,16 @@
|
|||||||
- **TF1**
|
- **TF1**
|
||||||
- **TFO**
|
- **TFO**
|
||||||
- **TheIntercept**
|
- **TheIntercept**
|
||||||
|
- **theoperaplatform**
|
||||||
- **ThePlatform**
|
- **ThePlatform**
|
||||||
- **ThePlatformFeed**
|
- **ThePlatformFeed**
|
||||||
- **TheScene**
|
- **TheScene**
|
||||||
- **TheSixtyOne**
|
- **TheSixtyOne**
|
||||||
- **TheStar**
|
- **TheStar**
|
||||||
|
- **TheWeatherChannel**
|
||||||
- **ThisAmericanLife**
|
- **ThisAmericanLife**
|
||||||
- **ThisAV**
|
- **ThisAV**
|
||||||
|
- **ThisOldHouse**
|
||||||
- **tinypic**: tinypic.com videos
|
- **tinypic**: tinypic.com videos
|
||||||
- **tlc.de**
|
- **tlc.de**
|
||||||
- **TMZ**
|
- **TMZ**
|
||||||
@ -754,21 +805,29 @@
|
|||||||
- **TV2Article**
|
- **TV2Article**
|
||||||
- **TV3**
|
- **TV3**
|
||||||
- **TV4**: tv4.se and tv4play.se
|
- **TV4**: tv4.se and tv4play.se
|
||||||
|
- **TVA**
|
||||||
|
- **TVANouvelles**
|
||||||
|
- **TVANouvellesArticle**
|
||||||
- **TVC**
|
- **TVC**
|
||||||
- **TVCArticle**
|
- **TVCArticle**
|
||||||
- **tvigle**: Интернет-телевидение Tvigle.ru
|
- **tvigle**: Интернет-телевидение Tvigle.ru
|
||||||
- **tvland.com**
|
- **tvland.com**
|
||||||
|
- **TVN24**
|
||||||
- **TVNoe**
|
- **TVNoe**
|
||||||
- **tvp**: Telewizja Polska
|
- **tvp**: Telewizja Polska
|
||||||
- **tvp:embed**: Telewizja Polska
|
- **tvp:embed**: Telewizja Polska
|
||||||
- **tvp:series**
|
- **tvp:series**
|
||||||
|
- **TVPlayer**
|
||||||
- **Tweakers**
|
- **Tweakers**
|
||||||
- **twitch:chapter**
|
- **twitch:chapter**
|
||||||
- **twitch:clips**
|
- **twitch:clips**
|
||||||
- **twitch:past_broadcasts**
|
|
||||||
- **twitch:profile**
|
- **twitch:profile**
|
||||||
- **twitch:stream**
|
- **twitch:stream**
|
||||||
- **twitch:video**
|
- **twitch:video**
|
||||||
|
- **twitch:videos:all**
|
||||||
|
- **twitch:videos:highlights**
|
||||||
|
- **twitch:videos:past-broadcasts**
|
||||||
|
- **twitch:videos:uploads**
|
||||||
- **twitch:vod**
|
- **twitch:vod**
|
||||||
- **twitter**
|
- **twitter**
|
||||||
- **twitter:amplify**
|
- **twitter:amplify**
|
||||||
@ -776,6 +835,7 @@
|
|||||||
- **udemy**
|
- **udemy**
|
||||||
- **udemy:course**
|
- **udemy:course**
|
||||||
- **UDNEmbed**: 聯合影音
|
- **UDNEmbed**: 聯合影音
|
||||||
|
- **UKTVPlay**
|
||||||
- **Unistra**
|
- **Unistra**
|
||||||
- **uol.com.br**
|
- **uol.com.br**
|
||||||
- **uplynk**
|
- **uplynk**
|
||||||
@ -804,6 +864,7 @@
|
|||||||
- **ViceShow**
|
- **ViceShow**
|
||||||
- **Vidbit**
|
- **Vidbit**
|
||||||
- **Viddler**
|
- **Viddler**
|
||||||
|
- **Videa**
|
||||||
- **video.google:search**: Google Video search
|
- **video.google:search**: Google Video search
|
||||||
- **video.mit.edu**
|
- **video.mit.edu**
|
||||||
- **VideoDetective**
|
- **VideoDetective**
|
||||||
@ -813,7 +874,7 @@
|
|||||||
- **videomore:season**
|
- **videomore:season**
|
||||||
- **videomore:video**
|
- **videomore:video**
|
||||||
- **VideoPremium**
|
- **VideoPremium**
|
||||||
- **VideoTt**: video.tt - Your True Tube (Currently broken)
|
- **VideoPress**
|
||||||
- **videoweed**: VideoWeed
|
- **videoweed**: VideoWeed
|
||||||
- **Vidio**
|
- **Vidio**
|
||||||
- **vidme**
|
- **vidme**
|
||||||
@ -840,20 +901,29 @@
|
|||||||
- **Vimple**: Vimple - one-click video hosting
|
- **Vimple**: Vimple - one-click video hosting
|
||||||
- **Vine**
|
- **Vine**
|
||||||
- **vine:user**
|
- **vine:user**
|
||||||
|
- **Viu**
|
||||||
|
- **viu:ott**
|
||||||
|
- **viu:playlist**
|
||||||
|
- **Vivo**: vivo.sx
|
||||||
- **vk**: VK
|
- **vk**: VK
|
||||||
- **vk:uservideos**: VK - User's Videos
|
- **vk:uservideos**: VK - User's Videos
|
||||||
- **vk:wallpost**
|
- **vk:wallpost**
|
||||||
- **vlive**
|
- **vlive**
|
||||||
|
- **vlive:channel**
|
||||||
- **Vodlocker**
|
- **Vodlocker**
|
||||||
|
- **VODPl**
|
||||||
- **VODPlatform**
|
- **VODPlatform**
|
||||||
- **VoiceRepublic**
|
- **VoiceRepublic**
|
||||||
- **VoxMedia**
|
- **VoxMedia**
|
||||||
- **Vporn**
|
- **Vporn**
|
||||||
- **vpro**: npo.nl and ntr.nl
|
- **vpro**: npo.nl and ntr.nl
|
||||||
|
- **Vrak**
|
||||||
- **VRT**
|
- **VRT**
|
||||||
- **vube**: Vube.com
|
- **vube**: Vube.com
|
||||||
- **VuClip**
|
- **VuClip**
|
||||||
|
- **VVVVID**
|
||||||
- **VyboryMos**
|
- **VyboryMos**
|
||||||
|
- **Vzaar**
|
||||||
- **Walla**
|
- **Walla**
|
||||||
- **washingtonpost**
|
- **washingtonpost**
|
||||||
- **washingtonpost:article**
|
- **washingtonpost:article**
|
||||||
@ -861,6 +931,8 @@
|
|||||||
- **WatchIndianPorn**: Watch Indian Porn
|
- **WatchIndianPorn**: Watch Indian Porn
|
||||||
- **WDR**
|
- **WDR**
|
||||||
- **wdr:mobile**
|
- **wdr:mobile**
|
||||||
|
- **Webcaster**
|
||||||
|
- **WebcasterFeed**
|
||||||
- **WebOfStories**
|
- **WebOfStories**
|
||||||
- **WebOfStoriesPlaylist**
|
- **WebOfStoriesPlaylist**
|
||||||
- **WeiqiTV**: WQTV
|
- **WeiqiTV**: WQTV
|
||||||
|
5
setup.py
5
setup.py
@ -107,8 +107,8 @@ setup(
|
|||||||
url='https://github.com/rg3/youtube-dl',
|
url='https://github.com/rg3/youtube-dl',
|
||||||
author='Ricardo Garcia',
|
author='Ricardo Garcia',
|
||||||
author_email='ytdl@yt-dl.org',
|
author_email='ytdl@yt-dl.org',
|
||||||
maintainer='Philipp Hagemeister',
|
maintainer='Sergey M.',
|
||||||
maintainer_email='phihag@phihag.de',
|
maintainer_email='dstftw@gmail.com',
|
||||||
packages=[
|
packages=[
|
||||||
'youtube_dl',
|
'youtube_dl',
|
||||||
'youtube_dl.extractor', 'youtube_dl.downloader',
|
'youtube_dl.extractor', 'youtube_dl.downloader',
|
||||||
@ -130,6 +130,7 @@ setup(
|
|||||||
'Programming Language :: Python :: 3.3',
|
'Programming Language :: Python :: 3.3',
|
||||||
'Programming Language :: Python :: 3.4',
|
'Programming Language :: Python :: 3.4',
|
||||||
'Programming Language :: Python :: 3.5',
|
'Programming Language :: Python :: 3.5',
|
||||||
|
'Programming Language :: Python :: 3.6',
|
||||||
],
|
],
|
||||||
|
|
||||||
cmdclass={'build_lazy_extractors': build_lazy_extractors},
|
cmdclass={'build_lazy_extractors': build_lazy_extractors},
|
||||||
|
@ -84,5 +84,6 @@ class TestInfoExtractor(unittest.TestCase):
|
|||||||
self.assertRaises(ExtractorError, self.ie._download_json, uri, None)
|
self.assertRaises(ExtractorError, self.ie._download_json, uri, None)
|
||||||
self.assertEqual(self.ie._download_json(uri, None, fatal=False), None)
|
self.assertEqual(self.ie._download_json(uri, None, fatal=False), None)
|
||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
unittest.main()
|
unittest.main()
|
||||||
|
@ -1,4 +1,5 @@
|
|||||||
#!/usr/bin/env python
|
#!/usr/bin/env python
|
||||||
|
# coding: utf-8
|
||||||
|
|
||||||
from __future__ import unicode_literals
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
@ -525,6 +526,7 @@ class TestYoutubeDL(unittest.TestCase):
|
|||||||
'id': '1234',
|
'id': '1234',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'width': None,
|
'width': None,
|
||||||
|
'height': 1080,
|
||||||
}
|
}
|
||||||
|
|
||||||
def fname(templ):
|
def fname(templ):
|
||||||
@ -534,16 +536,29 @@ class TestYoutubeDL(unittest.TestCase):
|
|||||||
self.assertEqual(fname('%(id)s-%(width)s.%(ext)s'), '1234-NA.mp4')
|
self.assertEqual(fname('%(id)s-%(width)s.%(ext)s'), '1234-NA.mp4')
|
||||||
# Replace missing fields with 'NA'
|
# Replace missing fields with 'NA'
|
||||||
self.assertEqual(fname('%(uploader_date)s-%(id)s.%(ext)s'), 'NA-1234.mp4')
|
self.assertEqual(fname('%(uploader_date)s-%(id)s.%(ext)s'), 'NA-1234.mp4')
|
||||||
|
self.assertEqual(fname('%(height)d.%(ext)s'), '1080.mp4')
|
||||||
|
self.assertEqual(fname('%(height)6d.%(ext)s'), ' 1080.mp4')
|
||||||
|
self.assertEqual(fname('%(height)-6d.%(ext)s'), '1080 .mp4')
|
||||||
|
self.assertEqual(fname('%(height)06d.%(ext)s'), '001080.mp4')
|
||||||
|
self.assertEqual(fname('%(height) 06d.%(ext)s'), ' 01080.mp4')
|
||||||
|
self.assertEqual(fname('%(height) 06d.%(ext)s'), ' 01080.mp4')
|
||||||
|
self.assertEqual(fname('%(height)0 6d.%(ext)s'), ' 01080.mp4')
|
||||||
|
self.assertEqual(fname('%(height)0 6d.%(ext)s'), ' 01080.mp4')
|
||||||
|
self.assertEqual(fname('%(height) 0 6d.%(ext)s'), ' 01080.mp4')
|
||||||
|
self.assertEqual(fname('%%(height)06d.%(ext)s'), '%(height)06d.mp4')
|
||||||
|
self.assertEqual(fname('%(width)06d.%(ext)s'), 'NA.mp4')
|
||||||
|
self.assertEqual(fname('%(width)06d.%%(ext)s'), 'NA.%(ext)s')
|
||||||
|
self.assertEqual(fname('%%(width)06d.%(ext)s'), '%(width)06d.mp4')
|
||||||
|
|
||||||
def test_format_note(self):
|
def test_format_note(self):
|
||||||
ydl = YoutubeDL()
|
ydl = YoutubeDL()
|
||||||
self.assertEqual(ydl._format_note({}), '')
|
self.assertEqual(ydl._format_note({}), '')
|
||||||
assertRegexpMatches(self, ydl._format_note({
|
assertRegexpMatches(self, ydl._format_note({
|
||||||
'vbr': 10,
|
'vbr': 10,
|
||||||
}), '^\s*10k$')
|
}), r'^\s*10k$')
|
||||||
assertRegexpMatches(self, ydl._format_note({
|
assertRegexpMatches(self, ydl._format_note({
|
||||||
'fps': 30,
|
'fps': 30,
|
||||||
}), '^30fps$')
|
}), r'^30fps$')
|
||||||
|
|
||||||
def test_postprocessors(self):
|
def test_postprocessors(self):
|
||||||
filename = 'post-processor-testfile.mp4'
|
filename = 'post-processor-testfile.mp4'
|
||||||
@ -605,6 +620,9 @@ class TestYoutubeDL(unittest.TestCase):
|
|||||||
'extractor': 'TEST',
|
'extractor': 'TEST',
|
||||||
'duration': 30,
|
'duration': 30,
|
||||||
'filesize': 10 * 1024,
|
'filesize': 10 * 1024,
|
||||||
|
'playlist_id': '42',
|
||||||
|
'uploader': "變態妍字幕版 太妍 тест",
|
||||||
|
'creator': "тест ' 123 ' тест--",
|
||||||
}
|
}
|
||||||
second = {
|
second = {
|
||||||
'id': '2',
|
'id': '2',
|
||||||
@ -614,6 +632,8 @@ class TestYoutubeDL(unittest.TestCase):
|
|||||||
'duration': 10,
|
'duration': 10,
|
||||||
'description': 'foo',
|
'description': 'foo',
|
||||||
'filesize': 5 * 1024,
|
'filesize': 5 * 1024,
|
||||||
|
'playlist_id': '43',
|
||||||
|
'uploader': "тест 123",
|
||||||
}
|
}
|
||||||
videos = [first, second]
|
videos = [first, second]
|
||||||
|
|
||||||
@ -650,6 +670,30 @@ class TestYoutubeDL(unittest.TestCase):
|
|||||||
res = get_videos(f)
|
res = get_videos(f)
|
||||||
self.assertEqual(res, ['1'])
|
self.assertEqual(res, ['1'])
|
||||||
|
|
||||||
|
f = match_filter_func('playlist_id = 42')
|
||||||
|
res = get_videos(f)
|
||||||
|
self.assertEqual(res, ['1'])
|
||||||
|
|
||||||
|
f = match_filter_func('uploader = "變態妍字幕版 太妍 тест"')
|
||||||
|
res = get_videos(f)
|
||||||
|
self.assertEqual(res, ['1'])
|
||||||
|
|
||||||
|
f = match_filter_func('uploader != "變態妍字幕版 太妍 тест"')
|
||||||
|
res = get_videos(f)
|
||||||
|
self.assertEqual(res, ['2'])
|
||||||
|
|
||||||
|
f = match_filter_func('creator = "тест \' 123 \' тест--"')
|
||||||
|
res = get_videos(f)
|
||||||
|
self.assertEqual(res, ['1'])
|
||||||
|
|
||||||
|
f = match_filter_func("creator = 'тест \\' 123 \\' тест--'")
|
||||||
|
res = get_videos(f)
|
||||||
|
self.assertEqual(res, ['1'])
|
||||||
|
|
||||||
|
f = match_filter_func(r"creator = 'тест \' 123 \' тест--' & duration > 30")
|
||||||
|
res = get_videos(f)
|
||||||
|
self.assertEqual(res, [])
|
||||||
|
|
||||||
def test_playlist_items_selection(self):
|
def test_playlist_items_selection(self):
|
||||||
entries = [{
|
entries = [{
|
||||||
'id': compat_str(i),
|
'id': compat_str(i),
|
||||||
|
@ -8,7 +8,7 @@ import sys
|
|||||||
import unittest
|
import unittest
|
||||||
sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
|
sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
|
||||||
|
|
||||||
from youtube_dl.aes import aes_decrypt, aes_encrypt, aes_cbc_decrypt, aes_decrypt_text
|
from youtube_dl.aes import aes_decrypt, aes_encrypt, aes_cbc_decrypt, aes_cbc_encrypt, aes_decrypt_text
|
||||||
from youtube_dl.utils import bytes_to_intlist, intlist_to_bytes
|
from youtube_dl.utils import bytes_to_intlist, intlist_to_bytes
|
||||||
import base64
|
import base64
|
||||||
|
|
||||||
@ -34,6 +34,13 @@ class TestAES(unittest.TestCase):
|
|||||||
decrypted = intlist_to_bytes(aes_cbc_decrypt(data, self.key, self.iv))
|
decrypted = intlist_to_bytes(aes_cbc_decrypt(data, self.key, self.iv))
|
||||||
self.assertEqual(decrypted.rstrip(b'\x08'), self.secret_msg)
|
self.assertEqual(decrypted.rstrip(b'\x08'), self.secret_msg)
|
||||||
|
|
||||||
|
def test_cbc_encrypt(self):
|
||||||
|
data = bytes_to_intlist(self.secret_msg)
|
||||||
|
encrypted = intlist_to_bytes(aes_cbc_encrypt(data, self.key, self.iv))
|
||||||
|
self.assertEqual(
|
||||||
|
encrypted,
|
||||||
|
b"\x97\x92+\xe5\x0b\xc3\x18\x91ky9m&\xb3\xb5@\xe6'\xc2\x96.\xc8u\x88\xab9-[\x9e|\xf1\xcd")
|
||||||
|
|
||||||
def test_decrypt_text(self):
|
def test_decrypt_text(self):
|
||||||
password = intlist_to_bytes(self.key).decode('utf-8')
|
password = intlist_to_bytes(self.key).decode('utf-8')
|
||||||
encrypted = base64.b64encode(
|
encrypted = base64.b64encode(
|
||||||
@ -51,5 +58,6 @@ class TestAES(unittest.TestCase):
|
|||||||
decrypted = (aes_decrypt_text(encrypted, password, 32))
|
decrypted = (aes_decrypt_text(encrypted, password, 32))
|
||||||
self.assertEqual(decrypted, self.secret_msg)
|
self.assertEqual(decrypted, self.secret_msg)
|
||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
unittest.main()
|
unittest.main()
|
||||||
|
@ -60,10 +60,15 @@ def _file_md5(fn):
|
|||||||
with open(fn, 'rb') as f:
|
with open(fn, 'rb') as f:
|
||||||
return hashlib.md5(f.read()).hexdigest()
|
return hashlib.md5(f.read()).hexdigest()
|
||||||
|
|
||||||
|
|
||||||
defs = gettestcases()
|
defs = gettestcases()
|
||||||
|
|
||||||
|
|
||||||
class TestDownload(unittest.TestCase):
|
class TestDownload(unittest.TestCase):
|
||||||
|
# Parallel testing in nosetests. See
|
||||||
|
# http://nose.readthedocs.org/en/latest/doc_tests/test_multiprocess/multiprocess.html
|
||||||
|
_multiprocess_shared_ = True
|
||||||
|
|
||||||
maxDiff = None
|
maxDiff = None
|
||||||
|
|
||||||
def setUp(self):
|
def setUp(self):
|
||||||
@ -72,7 +77,7 @@ class TestDownload(unittest.TestCase):
|
|||||||
# Dynamically generate tests
|
# Dynamically generate tests
|
||||||
|
|
||||||
|
|
||||||
def generator(test_case):
|
def generator(test_case, tname):
|
||||||
|
|
||||||
def test_template(self):
|
def test_template(self):
|
||||||
ie = youtube_dl.extractor.get_info_extractor(test_case['name'])
|
ie = youtube_dl.extractor.get_info_extractor(test_case['name'])
|
||||||
@ -101,6 +106,7 @@ def generator(test_case):
|
|||||||
return
|
return
|
||||||
|
|
||||||
params = get_params(test_case.get('params', {}))
|
params = get_params(test_case.get('params', {}))
|
||||||
|
params['outtmpl'] = tname + '_' + params['outtmpl']
|
||||||
if is_playlist and 'playlist' not in test_case:
|
if is_playlist and 'playlist' not in test_case:
|
||||||
params.setdefault('extract_flat', 'in_playlist')
|
params.setdefault('extract_flat', 'in_playlist')
|
||||||
params.setdefault('skip_download', True)
|
params.setdefault('skip_download', True)
|
||||||
@ -145,7 +151,7 @@ def generator(test_case):
|
|||||||
raise
|
raise
|
||||||
|
|
||||||
if try_num == RETRIES:
|
if try_num == RETRIES:
|
||||||
report_warning('Failed due to network errors, skipping...')
|
report_warning('%s failed due to network errors, skipping...' % tname)
|
||||||
return
|
return
|
||||||
|
|
||||||
print('Retrying: {0} failed tries\n\n##########\n\n'.format(try_num))
|
print('Retrying: {0} failed tries\n\n##########\n\n'.format(try_num))
|
||||||
@ -217,14 +223,15 @@ def generator(test_case):
|
|||||||
|
|
||||||
return test_template
|
return test_template
|
||||||
|
|
||||||
|
|
||||||
# And add them to TestDownload
|
# And add them to TestDownload
|
||||||
for n, test_case in enumerate(defs):
|
for n, test_case in enumerate(defs):
|
||||||
test_method = generator(test_case)
|
|
||||||
tname = 'test_' + str(test_case['name'])
|
tname = 'test_' + str(test_case['name'])
|
||||||
i = 1
|
i = 1
|
||||||
while hasattr(TestDownload, tname):
|
while hasattr(TestDownload, tname):
|
||||||
tname = 'test_%s_%d' % (test_case['name'], i)
|
tname = 'test_%s_%d' % (test_case['name'], i)
|
||||||
i += 1
|
i += 1
|
||||||
|
test_method = generator(test_case, tname)
|
||||||
test_method.__name__ = str(tname)
|
test_method.__name__ = str(tname)
|
||||||
setattr(TestDownload, test_method.__name__, test_method)
|
setattr(TestDownload, test_method.__name__, test_method)
|
||||||
del test_method
|
del test_method
|
||||||
|
@ -39,5 +39,6 @@ class TestExecution(unittest.TestCase):
|
|||||||
_, stderr = p.communicate()
|
_, stderr = p.communicate()
|
||||||
self.assertFalse(stderr)
|
self.assertFalse(stderr)
|
||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
unittest.main()
|
unittest.main()
|
||||||
|
@ -87,7 +87,7 @@ class TestHTTP(unittest.TestCase):
|
|||||||
|
|
||||||
ydl = YoutubeDL({'logger': FakeLogger()})
|
ydl = YoutubeDL({'logger': FakeLogger()})
|
||||||
r = ydl.extract_info('http://localhost:%d/302' % self.port)
|
r = ydl.extract_info('http://localhost:%d/302' % self.port)
|
||||||
self.assertEqual(r['url'], 'http://localhost:%d/vid.mp4' % self.port)
|
self.assertEqual(r['entries'][0]['url'], 'http://localhost:%d/vid.mp4' % self.port)
|
||||||
|
|
||||||
|
|
||||||
class TestHTTPS(unittest.TestCase):
|
class TestHTTPS(unittest.TestCase):
|
||||||
@ -111,7 +111,7 @@ class TestHTTPS(unittest.TestCase):
|
|||||||
|
|
||||||
ydl = YoutubeDL({'logger': FakeLogger(), 'nocheckcertificate': True})
|
ydl = YoutubeDL({'logger': FakeLogger(), 'nocheckcertificate': True})
|
||||||
r = ydl.extract_info('https://localhost:%d/video.html' % self.port)
|
r = ydl.extract_info('https://localhost:%d/video.html' % self.port)
|
||||||
self.assertEqual(r['url'], 'https://localhost:%d/vid.mp4' % self.port)
|
self.assertEqual(r['entries'][0]['url'], 'https://localhost:%d/vid.mp4' % self.port)
|
||||||
|
|
||||||
|
|
||||||
def _build_proxy_handler(name):
|
def _build_proxy_handler(name):
|
||||||
@ -169,5 +169,6 @@ class TestProxy(unittest.TestCase):
|
|||||||
# b'xn--fiq228c' is '中文'.encode('idna')
|
# b'xn--fiq228c' is '中文'.encode('idna')
|
||||||
self.assertEqual(response, 'normal: http://xn--fiq228c.tw/')
|
self.assertEqual(response, 'normal: http://xn--fiq228c.tw/')
|
||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
unittest.main()
|
unittest.main()
|
||||||
|
@ -43,5 +43,6 @@ class TestIqiyiSDKInterpreter(unittest.TestCase):
|
|||||||
ie._login()
|
ie._login()
|
||||||
self.assertTrue('unable to log in:' in logger.messages[0])
|
self.assertTrue('unable to log in:' in logger.messages[0])
|
||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
unittest.main()
|
unittest.main()
|
||||||
|
@ -104,6 +104,14 @@ class TestJSInterpreter(unittest.TestCase):
|
|||||||
}''')
|
}''')
|
||||||
self.assertEqual(jsi.call_function('x'), [20, 20, 30, 40, 50])
|
self.assertEqual(jsi.call_function('x'), [20, 20, 30, 40, 50])
|
||||||
|
|
||||||
|
def test_call(self):
|
||||||
|
jsi = JSInterpreter('''
|
||||||
|
function x() { return 2; }
|
||||||
|
function y(a) { return x() + a; }
|
||||||
|
function z() { return y(3); }
|
||||||
|
''')
|
||||||
|
self.assertEqual(jsi.call_function('z'), 5)
|
||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
unittest.main()
|
unittest.main()
|
||||||
|
@ -34,6 +34,9 @@ from youtube_dl.utils import (
|
|||||||
find_xpath_attr,
|
find_xpath_attr,
|
||||||
fix_xml_ampersands,
|
fix_xml_ampersands,
|
||||||
get_element_by_class,
|
get_element_by_class,
|
||||||
|
get_element_by_attribute,
|
||||||
|
get_elements_by_class,
|
||||||
|
get_elements_by_attribute,
|
||||||
InAdvancePagedList,
|
InAdvancePagedList,
|
||||||
intlist_to_bytes,
|
intlist_to_bytes,
|
||||||
is_html,
|
is_html,
|
||||||
@ -49,6 +52,7 @@ from youtube_dl.utils import (
|
|||||||
parse_filesize,
|
parse_filesize,
|
||||||
parse_count,
|
parse_count,
|
||||||
parse_iso8601,
|
parse_iso8601,
|
||||||
|
pkcs1pad,
|
||||||
read_batch_urls,
|
read_batch_urls,
|
||||||
sanitize_filename,
|
sanitize_filename,
|
||||||
sanitize_path,
|
sanitize_path,
|
||||||
@ -69,6 +73,8 @@ from youtube_dl.utils import (
|
|||||||
uppercase_escape,
|
uppercase_escape,
|
||||||
lowercase_escape,
|
lowercase_escape,
|
||||||
url_basename,
|
url_basename,
|
||||||
|
base_url,
|
||||||
|
urljoin,
|
||||||
urlencode_postdata,
|
urlencode_postdata,
|
||||||
urshift,
|
urshift,
|
||||||
update_url_query,
|
update_url_query,
|
||||||
@ -293,6 +299,9 @@ class TestUtil(unittest.TestCase):
|
|||||||
self.assertEqual(unified_strdate('27.02.2016 17:30'), '20160227')
|
self.assertEqual(unified_strdate('27.02.2016 17:30'), '20160227')
|
||||||
self.assertEqual(unified_strdate('UNKNOWN DATE FORMAT'), None)
|
self.assertEqual(unified_strdate('UNKNOWN DATE FORMAT'), None)
|
||||||
self.assertEqual(unified_strdate('Feb 7, 2016 at 6:35 pm'), '20160207')
|
self.assertEqual(unified_strdate('Feb 7, 2016 at 6:35 pm'), '20160207')
|
||||||
|
self.assertEqual(unified_strdate('July 15th, 2013'), '20130715')
|
||||||
|
self.assertEqual(unified_strdate('September 1st, 2013'), '20130901')
|
||||||
|
self.assertEqual(unified_strdate('Sep 2nd, 2013'), '20130902')
|
||||||
|
|
||||||
def test_unified_timestamps(self):
|
def test_unified_timestamps(self):
|
||||||
self.assertEqual(unified_timestamp('December 21, 2010'), 1292889600)
|
self.assertEqual(unified_timestamp('December 21, 2010'), 1292889600)
|
||||||
@ -437,6 +446,30 @@ class TestUtil(unittest.TestCase):
|
|||||||
url_basename('http://media.w3.org/2010/05/sintel/trailer.mp4'),
|
url_basename('http://media.w3.org/2010/05/sintel/trailer.mp4'),
|
||||||
'trailer.mp4')
|
'trailer.mp4')
|
||||||
|
|
||||||
|
def test_base_url(self):
|
||||||
|
self.assertEqual(base_url('http://foo.de/'), 'http://foo.de/')
|
||||||
|
self.assertEqual(base_url('http://foo.de/bar'), 'http://foo.de/')
|
||||||
|
self.assertEqual(base_url('http://foo.de/bar/'), 'http://foo.de/bar/')
|
||||||
|
self.assertEqual(base_url('http://foo.de/bar/baz'), 'http://foo.de/bar/')
|
||||||
|
self.assertEqual(base_url('http://foo.de/bar/baz?x=z/x/c'), 'http://foo.de/bar/')
|
||||||
|
|
||||||
|
def test_urljoin(self):
|
||||||
|
self.assertEqual(urljoin('http://foo.de/', '/a/b/c.txt'), 'http://foo.de/a/b/c.txt')
|
||||||
|
self.assertEqual(urljoin('//foo.de/', '/a/b/c.txt'), '//foo.de/a/b/c.txt')
|
||||||
|
self.assertEqual(urljoin('http://foo.de/', 'a/b/c.txt'), 'http://foo.de/a/b/c.txt')
|
||||||
|
self.assertEqual(urljoin('http://foo.de', '/a/b/c.txt'), 'http://foo.de/a/b/c.txt')
|
||||||
|
self.assertEqual(urljoin('http://foo.de', 'a/b/c.txt'), 'http://foo.de/a/b/c.txt')
|
||||||
|
self.assertEqual(urljoin('http://foo.de/', 'http://foo.de/a/b/c.txt'), 'http://foo.de/a/b/c.txt')
|
||||||
|
self.assertEqual(urljoin('http://foo.de/', '//foo.de/a/b/c.txt'), '//foo.de/a/b/c.txt')
|
||||||
|
self.assertEqual(urljoin(None, 'http://foo.de/a/b/c.txt'), 'http://foo.de/a/b/c.txt')
|
||||||
|
self.assertEqual(urljoin(None, '//foo.de/a/b/c.txt'), '//foo.de/a/b/c.txt')
|
||||||
|
self.assertEqual(urljoin('', 'http://foo.de/a/b/c.txt'), 'http://foo.de/a/b/c.txt')
|
||||||
|
self.assertEqual(urljoin(['foobar'], 'http://foo.de/a/b/c.txt'), 'http://foo.de/a/b/c.txt')
|
||||||
|
self.assertEqual(urljoin('http://foo.de/', None), None)
|
||||||
|
self.assertEqual(urljoin('http://foo.de/', ''), None)
|
||||||
|
self.assertEqual(urljoin('http://foo.de/', ['foobar']), None)
|
||||||
|
self.assertEqual(urljoin('http://foo.de/a/b/c.txt', '.././../d.txt'), 'http://foo.de/d.txt')
|
||||||
|
|
||||||
def test_parse_age_limit(self):
|
def test_parse_age_limit(self):
|
||||||
self.assertEqual(parse_age_limit(None), None)
|
self.assertEqual(parse_age_limit(None), None)
|
||||||
self.assertEqual(parse_age_limit(False), None)
|
self.assertEqual(parse_age_limit(False), None)
|
||||||
@ -481,6 +514,7 @@ class TestUtil(unittest.TestCase):
|
|||||||
self.assertEqual(parse_duration('1 hour 3 minutes'), 3780)
|
self.assertEqual(parse_duration('1 hour 3 minutes'), 3780)
|
||||||
self.assertEqual(parse_duration('87 Min.'), 5220)
|
self.assertEqual(parse_duration('87 Min.'), 5220)
|
||||||
self.assertEqual(parse_duration('PT1H0.040S'), 3600.04)
|
self.assertEqual(parse_duration('PT1H0.040S'), 3600.04)
|
||||||
|
self.assertEqual(parse_duration('PT00H03M30SZ'), 210)
|
||||||
|
|
||||||
def test_fix_xml_ampersands(self):
|
def test_fix_xml_ampersands(self):
|
||||||
self.assertEqual(
|
self.assertEqual(
|
||||||
@ -755,12 +789,27 @@ class TestUtil(unittest.TestCase):
|
|||||||
on = js_to_json('["abc", "def",]')
|
on = js_to_json('["abc", "def",]')
|
||||||
self.assertEqual(json.loads(on), ['abc', 'def'])
|
self.assertEqual(json.loads(on), ['abc', 'def'])
|
||||||
|
|
||||||
|
on = js_to_json('[/*comment\n*/"abc"/*comment\n*/,/*comment\n*/"def",/*comment\n*/]')
|
||||||
|
self.assertEqual(json.loads(on), ['abc', 'def'])
|
||||||
|
|
||||||
|
on = js_to_json('[//comment\n"abc" //comment\n,//comment\n"def",//comment\n]')
|
||||||
|
self.assertEqual(json.loads(on), ['abc', 'def'])
|
||||||
|
|
||||||
on = js_to_json('{"abc": "def",}')
|
on = js_to_json('{"abc": "def",}')
|
||||||
self.assertEqual(json.loads(on), {'abc': 'def'})
|
self.assertEqual(json.loads(on), {'abc': 'def'})
|
||||||
|
|
||||||
|
on = js_to_json('{/*comment\n*/"abc"/*comment\n*/:/*comment\n*/"def"/*comment\n*/,/*comment\n*/}')
|
||||||
|
self.assertEqual(json.loads(on), {'abc': 'def'})
|
||||||
|
|
||||||
on = js_to_json('{ 0: /* " \n */ ",]" , }')
|
on = js_to_json('{ 0: /* " \n */ ",]" , }')
|
||||||
self.assertEqual(json.loads(on), {'0': ',]'})
|
self.assertEqual(json.loads(on), {'0': ',]'})
|
||||||
|
|
||||||
|
on = js_to_json('{ /*comment\n*/0/*comment\n*/: /* " \n */ ",]" , }')
|
||||||
|
self.assertEqual(json.loads(on), {'0': ',]'})
|
||||||
|
|
||||||
|
on = js_to_json('{ 0: // comment\n1 }')
|
||||||
|
self.assertEqual(json.loads(on), {'0': 1})
|
||||||
|
|
||||||
on = js_to_json(r'["<p>x<\/p>"]')
|
on = js_to_json(r'["<p>x<\/p>"]')
|
||||||
self.assertEqual(json.loads(on), ['<p>x</p>'])
|
self.assertEqual(json.loads(on), ['<p>x</p>'])
|
||||||
|
|
||||||
@ -770,15 +819,27 @@ class TestUtil(unittest.TestCase):
|
|||||||
on = js_to_json("['a\\\nb']")
|
on = js_to_json("['a\\\nb']")
|
||||||
self.assertEqual(json.loads(on), ['ab'])
|
self.assertEqual(json.loads(on), ['ab'])
|
||||||
|
|
||||||
|
on = js_to_json("/*comment\n*/[/*comment\n*/'a\\\nb'/*comment\n*/]/*comment\n*/")
|
||||||
|
self.assertEqual(json.loads(on), ['ab'])
|
||||||
|
|
||||||
on = js_to_json('{0xff:0xff}')
|
on = js_to_json('{0xff:0xff}')
|
||||||
self.assertEqual(json.loads(on), {'255': 255})
|
self.assertEqual(json.loads(on), {'255': 255})
|
||||||
|
|
||||||
|
on = js_to_json('{/*comment\n*/0xff/*comment\n*/:/*comment\n*/0xff/*comment\n*/}')
|
||||||
|
self.assertEqual(json.loads(on), {'255': 255})
|
||||||
|
|
||||||
on = js_to_json('{077:077}')
|
on = js_to_json('{077:077}')
|
||||||
self.assertEqual(json.loads(on), {'63': 63})
|
self.assertEqual(json.loads(on), {'63': 63})
|
||||||
|
|
||||||
|
on = js_to_json('{/*comment\n*/077/*comment\n*/:/*comment\n*/077/*comment\n*/}')
|
||||||
|
self.assertEqual(json.loads(on), {'63': 63})
|
||||||
|
|
||||||
on = js_to_json('{42:42}')
|
on = js_to_json('{42:42}')
|
||||||
self.assertEqual(json.loads(on), {'42': 42})
|
self.assertEqual(json.loads(on), {'42': 42})
|
||||||
|
|
||||||
|
on = js_to_json('{/*comment\n*/42/*comment\n*/:/*comment\n*/42/*comment\n*/}')
|
||||||
|
self.assertEqual(json.loads(on), {'42': 42})
|
||||||
|
|
||||||
def test_extract_attributes(self):
|
def test_extract_attributes(self):
|
||||||
self.assertEqual(extract_attributes('<e x="y">'), {'x': 'y'})
|
self.assertEqual(extract_attributes('<e x="y">'), {'x': 'y'})
|
||||||
self.assertEqual(extract_attributes("<e x='y'>"), {'x': 'y'})
|
self.assertEqual(extract_attributes("<e x='y'>"), {'x': 'y'})
|
||||||
@ -1044,6 +1105,14 @@ The first line
|
|||||||
ohdave_rsa_encrypt(b'aa111222', e, N),
|
ohdave_rsa_encrypt(b'aa111222', e, N),
|
||||||
'726664bd9a23fd0c70f9f1b84aab5e3905ce1e45a584e9cbcf9bcc7510338fc1986d6c599ff990d923aa43c51c0d9013cd572e13bc58f4ae48f2ed8c0b0ba881')
|
'726664bd9a23fd0c70f9f1b84aab5e3905ce1e45a584e9cbcf9bcc7510338fc1986d6c599ff990d923aa43c51c0d9013cd572e13bc58f4ae48f2ed8c0b0ba881')
|
||||||
|
|
||||||
|
def test_pkcs1pad(self):
|
||||||
|
data = [1, 2, 3]
|
||||||
|
padded_data = pkcs1pad(data, 32)
|
||||||
|
self.assertEqual(padded_data[:2], [0, 2])
|
||||||
|
self.assertEqual(padded_data[28:], [0, 1, 2, 3])
|
||||||
|
|
||||||
|
self.assertRaises(ValueError, pkcs1pad, data, 8)
|
||||||
|
|
||||||
def test_encode_base_n(self):
|
def test_encode_base_n(self):
|
||||||
self.assertEqual(encode_base_n(0, 30), '0')
|
self.assertEqual(encode_base_n(0, 30), '0')
|
||||||
self.assertEqual(encode_base_n(80, 30), '2k')
|
self.assertEqual(encode_base_n(80, 30), '2k')
|
||||||
@ -1067,5 +1136,32 @@ The first line
|
|||||||
self.assertEqual(get_element_by_class('foo', html), 'nice')
|
self.assertEqual(get_element_by_class('foo', html), 'nice')
|
||||||
self.assertEqual(get_element_by_class('no-such-class', html), None)
|
self.assertEqual(get_element_by_class('no-such-class', html), None)
|
||||||
|
|
||||||
|
def test_get_element_by_attribute(self):
|
||||||
|
html = '''
|
||||||
|
<span class="foo bar">nice</span>
|
||||||
|
'''
|
||||||
|
|
||||||
|
self.assertEqual(get_element_by_attribute('class', 'foo bar', html), 'nice')
|
||||||
|
self.assertEqual(get_element_by_attribute('class', 'foo', html), None)
|
||||||
|
self.assertEqual(get_element_by_attribute('class', 'no-such-foo', html), None)
|
||||||
|
|
||||||
|
def test_get_elements_by_class(self):
|
||||||
|
html = '''
|
||||||
|
<span class="foo bar">nice</span><span class="foo bar">also nice</span>
|
||||||
|
'''
|
||||||
|
|
||||||
|
self.assertEqual(get_elements_by_class('foo', html), ['nice', 'also nice'])
|
||||||
|
self.assertEqual(get_elements_by_class('no-such-class', html), [])
|
||||||
|
|
||||||
|
def test_get_elements_by_attribute(self):
|
||||||
|
html = '''
|
||||||
|
<span class="foo bar">nice</span><span class="foo bar">also nice</span>
|
||||||
|
'''
|
||||||
|
|
||||||
|
self.assertEqual(get_elements_by_attribute('class', 'foo bar', html), ['nice', 'also nice'])
|
||||||
|
self.assertEqual(get_elements_by_attribute('class', 'foo', html), [])
|
||||||
|
self.assertEqual(get_elements_by_attribute('class', 'no-such-foo', html), [])
|
||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
unittest.main()
|
unittest.main()
|
||||||
|
@ -66,5 +66,6 @@ class TestVerboseOutput(unittest.TestCase):
|
|||||||
self.assertTrue(b'-p' in serr)
|
self.assertTrue(b'-p' in serr)
|
||||||
self.assertTrue(b'secret' not in serr)
|
self.assertTrue(b'secret' not in serr)
|
||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
unittest.main()
|
unittest.main()
|
||||||
|
@ -24,6 +24,7 @@ class YoutubeDL(youtube_dl.YoutubeDL):
|
|||||||
super(YoutubeDL, self).__init__(*args, **kwargs)
|
super(YoutubeDL, self).__init__(*args, **kwargs)
|
||||||
self.to_stderr = self.to_screen
|
self.to_stderr = self.to_screen
|
||||||
|
|
||||||
|
|
||||||
params = get_params({
|
params = get_params({
|
||||||
'writeannotations': True,
|
'writeannotations': True,
|
||||||
'skip_download': True,
|
'skip_download': True,
|
||||||
@ -74,5 +75,6 @@ class TestAnnotations(unittest.TestCase):
|
|||||||
def tearDown(self):
|
def tearDown(self):
|
||||||
try_rm(ANNOTATIONS_FILE)
|
try_rm(ANNOTATIONS_FILE)
|
||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
unittest.main()
|
unittest.main()
|
||||||
|
@ -66,5 +66,6 @@ class TestYoutubeLists(unittest.TestCase):
|
|||||||
for entry in result['entries']:
|
for entry in result['entries']:
|
||||||
self.assertTrue(entry.get('title'))
|
self.assertTrue(entry.get('title'))
|
||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
unittest.main()
|
unittest.main()
|
||||||
|
@ -114,6 +114,7 @@ def make_tfunc(url, stype, sig_input, expected_sig):
|
|||||||
test_func.__name__ = str('test_signature_' + stype + '_' + test_id)
|
test_func.__name__ = str('test_signature_' + stype + '_' + test_id)
|
||||||
setattr(TestSignature, test_func.__name__, test_func)
|
setattr(TestSignature, test_func.__name__, test_func)
|
||||||
|
|
||||||
|
|
||||||
for test_spec in _TESTS:
|
for test_spec in _TESTS:
|
||||||
make_tfunc(*test_spec)
|
make_tfunc(*test_spec)
|
||||||
|
|
||||||
|
@ -24,6 +24,7 @@ import sys
|
|||||||
import time
|
import time
|
||||||
import tokenize
|
import tokenize
|
||||||
import traceback
|
import traceback
|
||||||
|
import random
|
||||||
|
|
||||||
from .compat import (
|
from .compat import (
|
||||||
compat_basestring,
|
compat_basestring,
|
||||||
@ -32,6 +33,7 @@ from .compat import (
|
|||||||
compat_get_terminal_size,
|
compat_get_terminal_size,
|
||||||
compat_http_client,
|
compat_http_client,
|
||||||
compat_kwargs,
|
compat_kwargs,
|
||||||
|
compat_numeric_types,
|
||||||
compat_os_name,
|
compat_os_name,
|
||||||
compat_str,
|
compat_str,
|
||||||
compat_tokenize_tokenize,
|
compat_tokenize_tokenize,
|
||||||
@ -55,6 +57,8 @@ from .utils import (
|
|||||||
ExtractorError,
|
ExtractorError,
|
||||||
format_bytes,
|
format_bytes,
|
||||||
formatSeconds,
|
formatSeconds,
|
||||||
|
GeoRestrictedError,
|
||||||
|
ISO3166Utils,
|
||||||
locked_file,
|
locked_file,
|
||||||
make_HTTPS_handler,
|
make_HTTPS_handler,
|
||||||
MaxDownloadsReached,
|
MaxDownloadsReached,
|
||||||
@ -159,6 +163,7 @@ class YoutubeDL(object):
|
|||||||
playlistend: Playlist item to end at.
|
playlistend: Playlist item to end at.
|
||||||
playlist_items: Specific indices of playlist to download.
|
playlist_items: Specific indices of playlist to download.
|
||||||
playlistreverse: Download playlist items in reverse order.
|
playlistreverse: Download playlist items in reverse order.
|
||||||
|
playlistrandom: Download playlist items in random order.
|
||||||
matchtitle: Download only matching titles.
|
matchtitle: Download only matching titles.
|
||||||
rejecttitle: Reject downloads for matching titles.
|
rejecttitle: Reject downloads for matching titles.
|
||||||
logger: Log messages to a logging.Logger instance.
|
logger: Log messages to a logging.Logger instance.
|
||||||
@ -270,6 +275,12 @@ class YoutubeDL(object):
|
|||||||
If it returns None, the video is downloaded.
|
If it returns None, the video is downloaded.
|
||||||
match_filter_func in utils.py is one example for this.
|
match_filter_func in utils.py is one example for this.
|
||||||
no_color: Do not emit color codes in output.
|
no_color: Do not emit color codes in output.
|
||||||
|
geo_bypass: Bypass geographic restriction via faking X-Forwarded-For
|
||||||
|
HTTP header (experimental)
|
||||||
|
geo_bypass_country:
|
||||||
|
Two-letter ISO 3166-2 country code that will be used for
|
||||||
|
explicit geographic restriction bypassing via faking
|
||||||
|
X-Forwarded-For HTTP header (experimental)
|
||||||
|
|
||||||
The following options determine which downloader is picked:
|
The following options determine which downloader is picked:
|
||||||
external_downloader: Executable of the external downloader to call.
|
external_downloader: Executable of the external downloader to call.
|
||||||
@ -317,11 +328,21 @@ class YoutubeDL(object):
|
|||||||
self.params.update(params)
|
self.params.update(params)
|
||||||
self.cache = Cache(self)
|
self.cache = Cache(self)
|
||||||
|
|
||||||
if self.params.get('cn_verification_proxy') is not None:
|
def check_deprecated(param, option, suggestion):
|
||||||
self.report_warning('--cn-verification-proxy is deprecated. Use --geo-verification-proxy instead.')
|
if self.params.get(param) is not None:
|
||||||
|
self.report_warning(
|
||||||
|
'%s is deprecated. Use %s instead.' % (option, suggestion))
|
||||||
|
return True
|
||||||
|
return False
|
||||||
|
|
||||||
|
if check_deprecated('cn_verification_proxy', '--cn-verification-proxy', '--geo-verification-proxy'):
|
||||||
if self.params.get('geo_verification_proxy') is None:
|
if self.params.get('geo_verification_proxy') is None:
|
||||||
self.params['geo_verification_proxy'] = self.params['cn_verification_proxy']
|
self.params['geo_verification_proxy'] = self.params['cn_verification_proxy']
|
||||||
|
|
||||||
|
check_deprecated('autonumber_size', '--autonumber-size', 'output template with %(autonumber)0Nd, where N in the number of digits')
|
||||||
|
check_deprecated('autonumber', '--auto-number', '-o "%(autonumber)s-%(title)s.%(ext)s"')
|
||||||
|
check_deprecated('usetitle', '--title', '-o "%(title)s-%(id)s.%(ext)s"')
|
||||||
|
|
||||||
if params.get('bidi_workaround', False):
|
if params.get('bidi_workaround', False):
|
||||||
try:
|
try:
|
||||||
import pty
|
import pty
|
||||||
@ -583,10 +604,7 @@ class YoutubeDL(object):
|
|||||||
autonumber_size = self.params.get('autonumber_size')
|
autonumber_size = self.params.get('autonumber_size')
|
||||||
if autonumber_size is None:
|
if autonumber_size is None:
|
||||||
autonumber_size = 5
|
autonumber_size = 5
|
||||||
autonumber_templ = '%0' + str(autonumber_size) + 'd'
|
template_dict['autonumber'] = self.params.get('autonumber_start', 1) - 1 + self._num_downloads
|
||||||
template_dict['autonumber'] = autonumber_templ % self._num_downloads
|
|
||||||
if template_dict.get('playlist_index') is not None:
|
|
||||||
template_dict['playlist_index'] = '%0*d' % (len(str(template_dict['n_entries'])), template_dict['playlist_index'])
|
|
||||||
if template_dict.get('resolution') is None:
|
if template_dict.get('resolution') is None:
|
||||||
if template_dict.get('width') and template_dict.get('height'):
|
if template_dict.get('width') and template_dict.get('height'):
|
||||||
template_dict['resolution'] = '%dx%d' % (template_dict['width'], template_dict['height'])
|
template_dict['resolution'] = '%dx%d' % (template_dict['width'], template_dict['height'])
|
||||||
@ -598,13 +616,62 @@ class YoutubeDL(object):
|
|||||||
sanitize = lambda k, v: sanitize_filename(
|
sanitize = lambda k, v: sanitize_filename(
|
||||||
compat_str(v),
|
compat_str(v),
|
||||||
restricted=self.params.get('restrictfilenames'),
|
restricted=self.params.get('restrictfilenames'),
|
||||||
is_id=(k == 'id'))
|
is_id=(k == 'id' or k.endswith('_id')))
|
||||||
template_dict = dict((k, sanitize(k, v))
|
template_dict = dict((k, v if isinstance(v, compat_numeric_types) else sanitize(k, v))
|
||||||
for k, v in template_dict.items()
|
for k, v in template_dict.items()
|
||||||
if v is not None and not isinstance(v, (list, tuple, dict)))
|
if v is not None and not isinstance(v, (list, tuple, dict)))
|
||||||
template_dict = collections.defaultdict(lambda: 'NA', template_dict)
|
template_dict = collections.defaultdict(lambda: 'NA', template_dict)
|
||||||
|
|
||||||
outtmpl = self.params.get('outtmpl', DEFAULT_OUTTMPL)
|
outtmpl = self.params.get('outtmpl', DEFAULT_OUTTMPL)
|
||||||
|
|
||||||
|
# For fields playlist_index and autonumber convert all occurrences
|
||||||
|
# of %(field)s to %(field)0Nd for backward compatibility
|
||||||
|
field_size_compat_map = {
|
||||||
|
'playlist_index': len(str(template_dict['n_entries'])),
|
||||||
|
'autonumber': autonumber_size,
|
||||||
|
}
|
||||||
|
FIELD_SIZE_COMPAT_RE = r'(?<!%)%\((?P<field>autonumber|playlist_index)\)s'
|
||||||
|
mobj = re.search(FIELD_SIZE_COMPAT_RE, outtmpl)
|
||||||
|
if mobj:
|
||||||
|
outtmpl = re.sub(
|
||||||
|
FIELD_SIZE_COMPAT_RE,
|
||||||
|
r'%%(\1)0%dd' % field_size_compat_map[mobj.group('field')],
|
||||||
|
outtmpl)
|
||||||
|
|
||||||
|
NUMERIC_FIELDS = set((
|
||||||
|
'width', 'height', 'tbr', 'abr', 'asr', 'vbr', 'fps', 'filesize', 'filesize_approx',
|
||||||
|
'upload_year', 'upload_month', 'upload_day',
|
||||||
|
'duration', 'view_count', 'like_count', 'dislike_count', 'repost_count',
|
||||||
|
'average_rating', 'comment_count', 'age_limit',
|
||||||
|
'start_time', 'end_time',
|
||||||
|
'chapter_number', 'season_number', 'episode_number',
|
||||||
|
'track_number', 'disc_number', 'release_year',
|
||||||
|
'playlist_index',
|
||||||
|
))
|
||||||
|
|
||||||
|
# Missing numeric fields used together with integer presentation types
|
||||||
|
# in format specification will break the argument substitution since
|
||||||
|
# string 'NA' is returned for missing fields. We will patch output
|
||||||
|
# template for missing fields to meet string presentation type.
|
||||||
|
for numeric_field in NUMERIC_FIELDS:
|
||||||
|
if numeric_field not in template_dict:
|
||||||
|
# As of [1] format syntax is:
|
||||||
|
# %[mapping_key][conversion_flags][minimum_width][.precision][length_modifier]type
|
||||||
|
# 1. https://docs.python.org/2/library/stdtypes.html#string-formatting
|
||||||
|
FORMAT_RE = r'''(?x)
|
||||||
|
(?<!%)
|
||||||
|
%
|
||||||
|
\({0}\) # mapping key
|
||||||
|
(?:[#0\-+ ]+)? # conversion flags (optional)
|
||||||
|
(?:\d+)? # minimum field width (optional)
|
||||||
|
(?:\.\d+)? # precision (optional)
|
||||||
|
[hlL]? # length modifier (optional)
|
||||||
|
[diouxXeEfFgGcrs%] # conversion type
|
||||||
|
'''
|
||||||
|
outtmpl = re.sub(
|
||||||
|
FORMAT_RE.format(numeric_field),
|
||||||
|
r'%({0})s'.format(numeric_field), outtmpl)
|
||||||
|
|
||||||
tmpl = compat_expanduser(outtmpl)
|
tmpl = compat_expanduser(outtmpl)
|
||||||
filename = tmpl % template_dict
|
filename = tmpl % template_dict
|
||||||
# Temporary fix for #4787
|
# Temporary fix for #4787
|
||||||
@ -705,6 +772,14 @@ class YoutubeDL(object):
|
|||||||
return self.process_ie_result(ie_result, download, extra_info)
|
return self.process_ie_result(ie_result, download, extra_info)
|
||||||
else:
|
else:
|
||||||
return ie_result
|
return ie_result
|
||||||
|
except GeoRestrictedError as e:
|
||||||
|
msg = e.msg
|
||||||
|
if e.countries:
|
||||||
|
msg += '\nThis video is available in %s.' % ', '.join(
|
||||||
|
map(ISO3166Utils.short2full, e.countries))
|
||||||
|
msg += '\nYou might want to use a VPN or a proxy server (with --proxy) to workaround.'
|
||||||
|
self.report_error(msg)
|
||||||
|
break
|
||||||
except ExtractorError as e: # An error we somewhat expected
|
except ExtractorError as e: # An error we somewhat expected
|
||||||
self.report_error(compat_str(e), e.format_traceback())
|
self.report_error(compat_str(e), e.format_traceback())
|
||||||
break
|
break
|
||||||
@ -842,8 +917,17 @@ class YoutubeDL(object):
|
|||||||
if self.params.get('playlistreverse', False):
|
if self.params.get('playlistreverse', False):
|
||||||
entries = entries[::-1]
|
entries = entries[::-1]
|
||||||
|
|
||||||
|
if self.params.get('playlistrandom', False):
|
||||||
|
random.shuffle(entries)
|
||||||
|
|
||||||
|
x_forwarded_for = ie_result.get('__x_forwarded_for_ip')
|
||||||
|
|
||||||
for i, entry in enumerate(entries, 1):
|
for i, entry in enumerate(entries, 1):
|
||||||
self.to_screen('[download] Downloading video %s of %s' % (i, n_entries))
|
self.to_screen('[download] Downloading video %s of %s' % (i, n_entries))
|
||||||
|
# This __x_forwarded_for_ip thing is a bit ugly but requires
|
||||||
|
# minimal changes
|
||||||
|
if x_forwarded_for:
|
||||||
|
entry['__x_forwarded_for_ip'] = x_forwarded_for
|
||||||
extra = {
|
extra = {
|
||||||
'n_entries': n_entries,
|
'n_entries': n_entries,
|
||||||
'playlist': playlist,
|
'playlist': playlist,
|
||||||
@ -1228,6 +1312,11 @@ class YoutubeDL(object):
|
|||||||
if cookies:
|
if cookies:
|
||||||
res['Cookie'] = cookies
|
res['Cookie'] = cookies
|
||||||
|
|
||||||
|
if 'X-Forwarded-For' not in res:
|
||||||
|
x_forwarded_for_ip = info_dict.get('__x_forwarded_for_ip')
|
||||||
|
if x_forwarded_for_ip:
|
||||||
|
res['X-Forwarded-For'] = x_forwarded_for_ip
|
||||||
|
|
||||||
return res
|
return res
|
||||||
|
|
||||||
def _calc_cookies(self, info_dict):
|
def _calc_cookies(self, info_dict):
|
||||||
@ -1339,7 +1428,7 @@ class YoutubeDL(object):
|
|||||||
format['format_id'] = compat_str(i)
|
format['format_id'] = compat_str(i)
|
||||||
else:
|
else:
|
||||||
# Sanitize format_id from characters used in format selector expression
|
# Sanitize format_id from characters used in format selector expression
|
||||||
format['format_id'] = re.sub('[\s,/+\[\]()]', '_', format['format_id'])
|
format['format_id'] = re.sub(r'[\s,/+\[\]()]', '_', format['format_id'])
|
||||||
format_id = format['format_id']
|
format_id = format['format_id']
|
||||||
if format_id not in formats_dict:
|
if format_id not in formats_dict:
|
||||||
formats_dict[format_id] = []
|
formats_dict[format_id] = []
|
||||||
@ -1363,13 +1452,16 @@ class YoutubeDL(object):
|
|||||||
format['ext'] = determine_ext(format['url']).lower()
|
format['ext'] = determine_ext(format['url']).lower()
|
||||||
# Automatically determine protocol if missing (useful for format
|
# Automatically determine protocol if missing (useful for format
|
||||||
# selection purposes)
|
# selection purposes)
|
||||||
if 'protocol' not in format:
|
if format.get('protocol') is None:
|
||||||
format['protocol'] = determine_protocol(format)
|
format['protocol'] = determine_protocol(format)
|
||||||
# Add HTTP headers, so that external programs can use them from the
|
# Add HTTP headers, so that external programs can use them from the
|
||||||
# json output
|
# json output
|
||||||
full_format_info = info_dict.copy()
|
full_format_info = info_dict.copy()
|
||||||
full_format_info.update(format)
|
full_format_info.update(format)
|
||||||
format['http_headers'] = self._calc_headers(full_format_info)
|
format['http_headers'] = self._calc_headers(full_format_info)
|
||||||
|
# Remove private housekeeping stuff
|
||||||
|
if '__x_forwarded_for_ip' in info_dict:
|
||||||
|
del info_dict['__x_forwarded_for_ip']
|
||||||
|
|
||||||
# TODO Central sorting goes here
|
# TODO Central sorting goes here
|
||||||
|
|
||||||
@ -1658,7 +1750,7 @@ class YoutubeDL(object):
|
|||||||
video_ext, audio_ext = audio.get('ext'), video.get('ext')
|
video_ext, audio_ext = audio.get('ext'), video.get('ext')
|
||||||
if video_ext and audio_ext:
|
if video_ext and audio_ext:
|
||||||
COMPATIBLE_EXTS = (
|
COMPATIBLE_EXTS = (
|
||||||
('mp3', 'mp4', 'm4a', 'm4p', 'm4b', 'm4r', 'm4v'),
|
('mp3', 'mp4', 'm4a', 'm4p', 'm4b', 'm4r', 'm4v', 'ismv', 'isma'),
|
||||||
('webm')
|
('webm')
|
||||||
)
|
)
|
||||||
for exts in COMPATIBLE_EXTS:
|
for exts in COMPATIBLE_EXTS:
|
||||||
|
@ -95,8 +95,7 @@ def _real_main(argv=None):
|
|||||||
write_string('[debug] Batch file urls: ' + repr(batch_urls) + '\n')
|
write_string('[debug] Batch file urls: ' + repr(batch_urls) + '\n')
|
||||||
except IOError:
|
except IOError:
|
||||||
sys.exit('ERROR: batch file could not be read')
|
sys.exit('ERROR: batch file could not be read')
|
||||||
all_urls = batch_urls + args
|
all_urls = batch_urls + [url.strip() for url in args] # batch_urls are already striped in read_batch_urls
|
||||||
all_urls = [url.strip() for url in all_urls]
|
|
||||||
_enc = preferredencoding()
|
_enc = preferredencoding()
|
||||||
all_urls = [url.decode(_enc, 'ignore') if isinstance(url, bytes) else url for url in all_urls]
|
all_urls = [url.decode(_enc, 'ignore') if isinstance(url, bytes) else url for url in all_urls]
|
||||||
|
|
||||||
@ -134,6 +133,12 @@ def _real_main(argv=None):
|
|||||||
parser.error('TV Provider account username missing\n')
|
parser.error('TV Provider account username missing\n')
|
||||||
if opts.outtmpl is not None and (opts.usetitle or opts.autonumber or opts.useid):
|
if opts.outtmpl is not None and (opts.usetitle or opts.autonumber or opts.useid):
|
||||||
parser.error('using output template conflicts with using title, video ID or auto number')
|
parser.error('using output template conflicts with using title, video ID or auto number')
|
||||||
|
if opts.autonumber_size is not None:
|
||||||
|
if opts.autonumber_size <= 0:
|
||||||
|
parser.error('auto number size must be positive')
|
||||||
|
if opts.autonumber_start is not None:
|
||||||
|
if opts.autonumber_start < 0:
|
||||||
|
parser.error('auto number start must be positive or 0')
|
||||||
if opts.usetitle and opts.useid:
|
if opts.usetitle and opts.useid:
|
||||||
parser.error('using title conflicts with using video ID')
|
parser.error('using title conflicts with using video ID')
|
||||||
if opts.username is not None and opts.password is None:
|
if opts.username is not None and opts.password is None:
|
||||||
@ -322,6 +327,7 @@ def _real_main(argv=None):
|
|||||||
'listformats': opts.listformats,
|
'listformats': opts.listformats,
|
||||||
'outtmpl': outtmpl,
|
'outtmpl': outtmpl,
|
||||||
'autonumber_size': opts.autonumber_size,
|
'autonumber_size': opts.autonumber_size,
|
||||||
|
'autonumber_start': opts.autonumber_start,
|
||||||
'restrictfilenames': opts.restrictfilenames,
|
'restrictfilenames': opts.restrictfilenames,
|
||||||
'ignoreerrors': opts.ignoreerrors,
|
'ignoreerrors': opts.ignoreerrors,
|
||||||
'force_generic_extractor': opts.force_generic_extractor,
|
'force_generic_extractor': opts.force_generic_extractor,
|
||||||
@ -338,6 +344,7 @@ def _real_main(argv=None):
|
|||||||
'playliststart': opts.playliststart,
|
'playliststart': opts.playliststart,
|
||||||
'playlistend': opts.playlistend,
|
'playlistend': opts.playlistend,
|
||||||
'playlistreverse': opts.playlist_reverse,
|
'playlistreverse': opts.playlist_reverse,
|
||||||
|
'playlistrandom': opts.playlist_random,
|
||||||
'noplaylist': opts.noplaylist,
|
'noplaylist': opts.noplaylist,
|
||||||
'logtostderr': opts.outtmpl == '-',
|
'logtostderr': opts.outtmpl == '-',
|
||||||
'consoletitle': opts.consoletitle,
|
'consoletitle': opts.consoletitle,
|
||||||
@ -406,7 +413,12 @@ def _real_main(argv=None):
|
|||||||
'postprocessor_args': postprocessor_args,
|
'postprocessor_args': postprocessor_args,
|
||||||
'cn_verification_proxy': opts.cn_verification_proxy,
|
'cn_verification_proxy': opts.cn_verification_proxy,
|
||||||
'geo_verification_proxy': opts.geo_verification_proxy,
|
'geo_verification_proxy': opts.geo_verification_proxy,
|
||||||
|
'config_location': opts.config_location,
|
||||||
|
'geo_bypass': opts.geo_bypass,
|
||||||
|
'geo_bypass_country': opts.geo_bypass_country,
|
||||||
|
# just for deprecation check
|
||||||
|
'autonumber': opts.autonumber if opts.autonumber is True else None,
|
||||||
|
'usetitle': opts.usetitle if opts.usetitle is True else None,
|
||||||
}
|
}
|
||||||
|
|
||||||
with YoutubeDL(ydl_opts) as ydl:
|
with YoutubeDL(ydl_opts) as ydl:
|
||||||
@ -450,4 +462,5 @@ def main(argv=None):
|
|||||||
except KeyboardInterrupt:
|
except KeyboardInterrupt:
|
||||||
sys.exit('\nERROR: Interrupted by user')
|
sys.exit('\nERROR: Interrupted by user')
|
||||||
|
|
||||||
|
|
||||||
__all__ = ['main', 'YoutubeDL', 'gen_extractors', 'list_extractors']
|
__all__ = ['main', 'YoutubeDL', 'gen_extractors', 'list_extractors']
|
||||||
|
@ -60,6 +60,34 @@ def aes_cbc_decrypt(data, key, iv):
|
|||||||
return decrypted_data
|
return decrypted_data
|
||||||
|
|
||||||
|
|
||||||
|
def aes_cbc_encrypt(data, key, iv):
|
||||||
|
"""
|
||||||
|
Encrypt with aes in CBC mode. Using PKCS#7 padding
|
||||||
|
|
||||||
|
@param {int[]} data cleartext
|
||||||
|
@param {int[]} key 16/24/32-Byte cipher key
|
||||||
|
@param {int[]} iv 16-Byte IV
|
||||||
|
@returns {int[]} encrypted data
|
||||||
|
"""
|
||||||
|
expanded_key = key_expansion(key)
|
||||||
|
block_count = int(ceil(float(len(data)) / BLOCK_SIZE_BYTES))
|
||||||
|
|
||||||
|
encrypted_data = []
|
||||||
|
previous_cipher_block = iv
|
||||||
|
for i in range(block_count):
|
||||||
|
block = data[i * BLOCK_SIZE_BYTES: (i + 1) * BLOCK_SIZE_BYTES]
|
||||||
|
remaining_length = BLOCK_SIZE_BYTES - len(block)
|
||||||
|
block += [remaining_length] * remaining_length
|
||||||
|
mixed_block = xor(block, previous_cipher_block)
|
||||||
|
|
||||||
|
encrypted_block = aes_encrypt(mixed_block, expanded_key)
|
||||||
|
encrypted_data += encrypted_block
|
||||||
|
|
||||||
|
previous_cipher_block = encrypted_block
|
||||||
|
|
||||||
|
return encrypted_data
|
||||||
|
|
||||||
|
|
||||||
def key_expansion(data):
|
def key_expansion(data):
|
||||||
"""
|
"""
|
||||||
Generate key schedule
|
Generate key schedule
|
||||||
@ -174,6 +202,7 @@ def aes_decrypt_text(data, password, key_size_bytes):
|
|||||||
|
|
||||||
return plaintext
|
return plaintext
|
||||||
|
|
||||||
|
|
||||||
RCON = (0x8d, 0x01, 0x02, 0x04, 0x08, 0x10, 0x20, 0x40, 0x80, 0x1b, 0x36)
|
RCON = (0x8d, 0x01, 0x02, 0x04, 0x08, 0x10, 0x20, 0x40, 0x80, 0x1b, 0x36)
|
||||||
SBOX = (0x63, 0x7C, 0x77, 0x7B, 0xF2, 0x6B, 0x6F, 0xC5, 0x30, 0x01, 0x67, 0x2B, 0xFE, 0xD7, 0xAB, 0x76,
|
SBOX = (0x63, 0x7C, 0x77, 0x7B, 0xF2, 0x6B, 0x6F, 0xC5, 0x30, 0x01, 0x67, 0x2B, 0xFE, 0xD7, 0xAB, 0x76,
|
||||||
0xCA, 0x82, 0xC9, 0x7D, 0xFA, 0x59, 0x47, 0xF0, 0xAD, 0xD4, 0xA2, 0xAF, 0x9C, 0xA4, 0x72, 0xC0,
|
0xCA, 0x82, 0xC9, 0x7D, 0xFA, 0x59, 0x47, 0xF0, 0xAD, 0xD4, 0xA2, 0xAF, 0x9C, 0xA4, 0x72, 0xC0,
|
||||||
@ -328,4 +357,5 @@ def inc(data):
|
|||||||
break
|
break
|
||||||
return data
|
return data
|
||||||
|
|
||||||
|
|
||||||
__all__ = ['aes_encrypt', 'key_expansion', 'aes_ctr_decrypt', 'aes_cbc_decrypt', 'aes_decrypt_text']
|
__all__ = ['aes_encrypt', 'key_expansion', 'aes_ctr_decrypt', 'aes_cbc_decrypt', 'aes_decrypt_text']
|
||||||
|
@ -2344,7 +2344,7 @@ try:
|
|||||||
from urllib.parse import unquote_plus as compat_urllib_parse_unquote_plus
|
from urllib.parse import unquote_plus as compat_urllib_parse_unquote_plus
|
||||||
except ImportError: # Python 2
|
except ImportError: # Python 2
|
||||||
_asciire = (compat_urllib_parse._asciire if hasattr(compat_urllib_parse, '_asciire')
|
_asciire = (compat_urllib_parse._asciire if hasattr(compat_urllib_parse, '_asciire')
|
||||||
else re.compile('([\x00-\x7f]+)'))
|
else re.compile(r'([\x00-\x7f]+)'))
|
||||||
|
|
||||||
# HACK: The following are the correct unquote_to_bytes, unquote and unquote_plus
|
# HACK: The following are the correct unquote_to_bytes, unquote and unquote_plus
|
||||||
# implementations from cpython 3.4.3's stdlib. Python 2's version
|
# implementations from cpython 3.4.3's stdlib. Python 2's version
|
||||||
@ -2491,6 +2491,7 @@ class _TreeBuilder(etree.TreeBuilder):
|
|||||||
def doctype(self, name, pubid, system):
|
def doctype(self, name, pubid, system):
|
||||||
pass
|
pass
|
||||||
|
|
||||||
|
|
||||||
if sys.version_info[0] >= 3:
|
if sys.version_info[0] >= 3:
|
||||||
def compat_etree_fromstring(text):
|
def compat_etree_fromstring(text):
|
||||||
return etree.XML(text, parser=etree.XMLParser(target=_TreeBuilder()))
|
return etree.XML(text, parser=etree.XMLParser(target=_TreeBuilder()))
|
||||||
@ -2528,6 +2529,24 @@ else:
|
|||||||
el.text = el.text.decode('utf-8')
|
el.text = el.text.decode('utf-8')
|
||||||
return doc
|
return doc
|
||||||
|
|
||||||
|
if hasattr(etree, 'register_namespace'):
|
||||||
|
compat_etree_register_namespace = etree.register_namespace
|
||||||
|
else:
|
||||||
|
def compat_etree_register_namespace(prefix, uri):
|
||||||
|
"""Register a namespace prefix.
|
||||||
|
The registry is global, and any existing mapping for either the
|
||||||
|
given prefix or the namespace URI will be removed.
|
||||||
|
*prefix* is the namespace prefix, *uri* is a namespace uri. Tags and
|
||||||
|
attributes in this namespace will be serialized with prefix if possible.
|
||||||
|
ValueError is raised if prefix is reserved or is invalid.
|
||||||
|
"""
|
||||||
|
if re.match(r"ns\d+$", prefix):
|
||||||
|
raise ValueError("Prefix format reserved for internal use")
|
||||||
|
for k, v in list(etree._namespace_map.items()):
|
||||||
|
if k == uri or v == prefix:
|
||||||
|
del etree._namespace_map[k]
|
||||||
|
etree._namespace_map[uri] = prefix
|
||||||
|
|
||||||
if sys.version_info < (2, 7):
|
if sys.version_info < (2, 7):
|
||||||
# Here comes the crazy part: In 2.6, if the xpath is a unicode,
|
# Here comes the crazy part: In 2.6, if the xpath is a unicode,
|
||||||
# .//node does not match if a node is a direct child of . !
|
# .//node does not match if a node is a direct child of . !
|
||||||
@ -2741,6 +2760,12 @@ else:
|
|||||||
compat_kwargs = lambda kwargs: kwargs
|
compat_kwargs = lambda kwargs: kwargs
|
||||||
|
|
||||||
|
|
||||||
|
try:
|
||||||
|
compat_numeric_types = (int, float, long, complex)
|
||||||
|
except NameError: # Python 3
|
||||||
|
compat_numeric_types = (int, float, complex)
|
||||||
|
|
||||||
|
|
||||||
if sys.version_info < (2, 7):
|
if sys.version_info < (2, 7):
|
||||||
def compat_socket_create_connection(address, timeout, source_address=None):
|
def compat_socket_create_connection(address, timeout, source_address=None):
|
||||||
host, port = address
|
host, port = address
|
||||||
@ -2787,6 +2812,7 @@ def workaround_optparse_bug9161():
|
|||||||
return real_add_option(self, *bargs, **bkwargs)
|
return real_add_option(self, *bargs, **bkwargs)
|
||||||
optparse.OptionGroup.add_option = _compat_add_option
|
optparse.OptionGroup.add_option = _compat_add_option
|
||||||
|
|
||||||
|
|
||||||
if hasattr(shutil, 'get_terminal_size'): # Python >= 3.3
|
if hasattr(shutil, 'get_terminal_size'): # Python >= 3.3
|
||||||
compat_get_terminal_size = shutil.get_terminal_size
|
compat_get_terminal_size = shutil.get_terminal_size
|
||||||
else:
|
else:
|
||||||
@ -2863,6 +2889,7 @@ __all__ = [
|
|||||||
'compat_cookiejar',
|
'compat_cookiejar',
|
||||||
'compat_cookies',
|
'compat_cookies',
|
||||||
'compat_etree_fromstring',
|
'compat_etree_fromstring',
|
||||||
|
'compat_etree_register_namespace',
|
||||||
'compat_expanduser',
|
'compat_expanduser',
|
||||||
'compat_get_terminal_size',
|
'compat_get_terminal_size',
|
||||||
'compat_getenv',
|
'compat_getenv',
|
||||||
@ -2874,6 +2901,7 @@ __all__ = [
|
|||||||
'compat_input',
|
'compat_input',
|
||||||
'compat_itertools_count',
|
'compat_itertools_count',
|
||||||
'compat_kwargs',
|
'compat_kwargs',
|
||||||
|
'compat_numeric_types',
|
||||||
'compat_ord',
|
'compat_ord',
|
||||||
'compat_os_name',
|
'compat_os_name',
|
||||||
'compat_parse_qs',
|
'compat_parse_qs',
|
||||||
|
@ -7,6 +7,7 @@ from .http import HttpFD
|
|||||||
from .rtmp import RtmpFD
|
from .rtmp import RtmpFD
|
||||||
from .dash import DashSegmentsFD
|
from .dash import DashSegmentsFD
|
||||||
from .rtsp import RtspFD
|
from .rtsp import RtspFD
|
||||||
|
from .ism import IsmFD
|
||||||
from .external import (
|
from .external import (
|
||||||
get_external_downloader,
|
get_external_downloader,
|
||||||
FFmpegFD,
|
FFmpegFD,
|
||||||
@ -24,6 +25,7 @@ PROTOCOL_MAP = {
|
|||||||
'rtsp': RtspFD,
|
'rtsp': RtspFD,
|
||||||
'f4m': F4mFD,
|
'f4m': F4mFD,
|
||||||
'http_dash_segments': DashSegmentsFD,
|
'http_dash_segments': DashSegmentsFD,
|
||||||
|
'ism': IsmFD,
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
@ -346,9 +346,11 @@ class FileDownloader(object):
|
|||||||
min_sleep_interval = self.params.get('sleep_interval')
|
min_sleep_interval = self.params.get('sleep_interval')
|
||||||
if min_sleep_interval:
|
if min_sleep_interval:
|
||||||
max_sleep_interval = self.params.get('max_sleep_interval', min_sleep_interval)
|
max_sleep_interval = self.params.get('max_sleep_interval', min_sleep_interval)
|
||||||
print(min_sleep_interval, max_sleep_interval)
|
|
||||||
sleep_interval = random.uniform(min_sleep_interval, max_sleep_interval)
|
sleep_interval = random.uniform(min_sleep_interval, max_sleep_interval)
|
||||||
self.to_screen('[download] Sleeping %s seconds...' % sleep_interval)
|
self.to_screen(
|
||||||
|
'[download] Sleeping %s seconds...' % (
|
||||||
|
int(sleep_interval) if sleep_interval.is_integer()
|
||||||
|
else '%.2f' % sleep_interval))
|
||||||
time.sleep(sleep_interval)
|
time.sleep(sleep_interval)
|
||||||
|
|
||||||
return self.real_download(filename, info_dict)
|
return self.real_download(filename, info_dict)
|
||||||
|
@ -43,7 +43,10 @@ class DashSegmentsFD(FragmentFD):
|
|||||||
count = 0
|
count = 0
|
||||||
while count <= fragment_retries:
|
while count <= fragment_retries:
|
||||||
try:
|
try:
|
||||||
success = ctx['dl'].download(target_filename, {'url': segment_url})
|
success = ctx['dl'].download(target_filename, {
|
||||||
|
'url': segment_url,
|
||||||
|
'http_headers': info_dict.get('http_headers'),
|
||||||
|
})
|
||||||
if not success:
|
if not success:
|
||||||
return False
|
return False
|
||||||
down, target_sanitized = sanitize_open(target_filename, 'rb')
|
down, target_sanitized = sanitize_open(target_filename, 'rb')
|
||||||
|
@ -17,6 +17,7 @@ from ..utils import (
|
|||||||
encodeArgument,
|
encodeArgument,
|
||||||
handle_youtubedl_headers,
|
handle_youtubedl_headers,
|
||||||
check_executable,
|
check_executable,
|
||||||
|
is_outdated_version,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
@ -198,6 +199,15 @@ class FFmpegFD(ExternalFD):
|
|||||||
|
|
||||||
args = [ffpp.executable, '-y']
|
args = [ffpp.executable, '-y']
|
||||||
|
|
||||||
|
seekable = info_dict.get('_seekable')
|
||||||
|
if seekable is not None:
|
||||||
|
# setting -seekable prevents ffmpeg from guessing if the server
|
||||||
|
# supports seeking(by adding the header `Range: bytes=0-`), which
|
||||||
|
# can cause problems in some cases
|
||||||
|
# https://github.com/rg3/youtube-dl/issues/11800#issuecomment-275037127
|
||||||
|
# http://trac.ffmpeg.org/ticket/6125#comment:10
|
||||||
|
args += ['-seekable', '1' if seekable else '0']
|
||||||
|
|
||||||
args += self._configuration_args()
|
args += self._configuration_args()
|
||||||
|
|
||||||
# start_time = info_dict.get('start_time') or 0
|
# start_time = info_dict.get('start_time') or 0
|
||||||
@ -264,7 +274,9 @@ class FFmpegFD(ExternalFD):
|
|||||||
if self.params.get('hls_use_mpegts', False) or tmpfilename == '-':
|
if self.params.get('hls_use_mpegts', False) or tmpfilename == '-':
|
||||||
args += ['-f', 'mpegts']
|
args += ['-f', 'mpegts']
|
||||||
else:
|
else:
|
||||||
args += ['-f', 'mp4', '-bsf:a', 'aac_adtstoasc']
|
args += ['-f', 'mp4']
|
||||||
|
if (ffpp.basename == 'ffmpeg' and is_outdated_version(ffpp._versions['ffmpeg'], '3.2', False)) and (not info_dict.get('acodec') or info_dict['acodec'].split('.')[0] in ('aac', 'mp4a')):
|
||||||
|
args += ['-bsf:a', 'aac_adtstoasc']
|
||||||
elif protocol == 'rtmp':
|
elif protocol == 'rtmp':
|
||||||
args += ['-f', 'flv']
|
args += ['-f', 'flv']
|
||||||
else:
|
else:
|
||||||
@ -293,6 +305,7 @@ class FFmpegFD(ExternalFD):
|
|||||||
class AVconvFD(FFmpegFD):
|
class AVconvFD(FFmpegFD):
|
||||||
pass
|
pass
|
||||||
|
|
||||||
|
|
||||||
_BY_NAME = dict(
|
_BY_NAME = dict(
|
||||||
(klass.get_basename(), klass)
|
(klass.get_basename(), klass)
|
||||||
for name, klass in globals().items()
|
for name, klass in globals().items()
|
||||||
|
@ -314,7 +314,8 @@ class F4mFD(FragmentFD):
|
|||||||
man_url = info_dict['url']
|
man_url = info_dict['url']
|
||||||
requested_bitrate = info_dict.get('tbr')
|
requested_bitrate = info_dict.get('tbr')
|
||||||
self.to_screen('[%s] Downloading f4m manifest' % self.FD_NAME)
|
self.to_screen('[%s] Downloading f4m manifest' % self.FD_NAME)
|
||||||
urlh = self.ydl.urlopen(man_url)
|
|
||||||
|
urlh = self.ydl.urlopen(self._prepare_url(info_dict, man_url))
|
||||||
man_url = urlh.geturl()
|
man_url = urlh.geturl()
|
||||||
# Some manifests may be malformed, e.g. prosiebensat1 generated manifests
|
# Some manifests may be malformed, e.g. prosiebensat1 generated manifests
|
||||||
# (see https://github.com/rg3/youtube-dl/issues/6215#issuecomment-121704244
|
# (see https://github.com/rg3/youtube-dl/issues/6215#issuecomment-121704244
|
||||||
@ -387,7 +388,10 @@ class F4mFD(FragmentFD):
|
|||||||
url_parsed = base_url_parsed._replace(path=base_url_parsed.path + name, query='&'.join(query))
|
url_parsed = base_url_parsed._replace(path=base_url_parsed.path + name, query='&'.join(query))
|
||||||
frag_filename = '%s-%s' % (ctx['tmpfilename'], name)
|
frag_filename = '%s-%s' % (ctx['tmpfilename'], name)
|
||||||
try:
|
try:
|
||||||
success = ctx['dl'].download(frag_filename, {'url': url_parsed.geturl()})
|
success = ctx['dl'].download(frag_filename, {
|
||||||
|
'url': url_parsed.geturl(),
|
||||||
|
'http_headers': info_dict.get('http_headers'),
|
||||||
|
})
|
||||||
if not success:
|
if not success:
|
||||||
return False
|
return False
|
||||||
(down, frag_sanitized) = sanitize_open(frag_filename, 'rb')
|
(down, frag_sanitized) = sanitize_open(frag_filename, 'rb')
|
||||||
|
@ -9,6 +9,7 @@ from ..utils import (
|
|||||||
error_to_compat_str,
|
error_to_compat_str,
|
||||||
encodeFilename,
|
encodeFilename,
|
||||||
sanitize_open,
|
sanitize_open,
|
||||||
|
sanitized_Request,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
@ -37,6 +38,10 @@ class FragmentFD(FileDownloader):
|
|||||||
def report_skip_fragment(self, fragment_name):
|
def report_skip_fragment(self, fragment_name):
|
||||||
self.to_screen('[download] Skipping fragment %s...' % fragment_name)
|
self.to_screen('[download] Skipping fragment %s...' % fragment_name)
|
||||||
|
|
||||||
|
def _prepare_url(self, info_dict, url):
|
||||||
|
headers = info_dict.get('http_headers')
|
||||||
|
return sanitized_Request(url, None, headers) if headers else url
|
||||||
|
|
||||||
def _prepare_and_start_frag_download(self, ctx):
|
def _prepare_and_start_frag_download(self, ctx):
|
||||||
self._prepare_frag_download(ctx)
|
self._prepare_frag_download(ctx)
|
||||||
self._start_frag_download(ctx)
|
self._start_frag_download(ctx)
|
||||||
@ -56,6 +61,7 @@ class FragmentFD(FileDownloader):
|
|||||||
'noprogress': True,
|
'noprogress': True,
|
||||||
'ratelimit': self.params.get('ratelimit'),
|
'ratelimit': self.params.get('ratelimit'),
|
||||||
'retries': self.params.get('retries', 0),
|
'retries': self.params.get('retries', 0),
|
||||||
|
'nopart': self.params.get('nopart', False),
|
||||||
'test': self.params.get('test', False),
|
'test': self.params.get('test', False),
|
||||||
}
|
}
|
||||||
)
|
)
|
||||||
|
@ -59,11 +59,15 @@ class HlsFD(FragmentFD):
|
|||||||
def real_download(self, filename, info_dict):
|
def real_download(self, filename, info_dict):
|
||||||
man_url = info_dict['url']
|
man_url = info_dict['url']
|
||||||
self.to_screen('[%s] Downloading m3u8 manifest' % self.FD_NAME)
|
self.to_screen('[%s] Downloading m3u8 manifest' % self.FD_NAME)
|
||||||
manifest = self.ydl.urlopen(man_url).read()
|
|
||||||
|
manifest = self.ydl.urlopen(self._prepare_url(info_dict, man_url)).read()
|
||||||
|
|
||||||
s = manifest.decode('utf-8', 'ignore')
|
s = manifest.decode('utf-8', 'ignore')
|
||||||
|
|
||||||
if not self.can_download(s, info_dict):
|
if not self.can_download(s, info_dict):
|
||||||
|
if info_dict.get('extra_param_to_segment_url'):
|
||||||
|
self.report_error('pycrypto not found. Please install it.')
|
||||||
|
return False
|
||||||
self.report_warning(
|
self.report_warning(
|
||||||
'hlsnative has detected features it does not support, '
|
'hlsnative has detected features it does not support, '
|
||||||
'extraction will be delegated to ffmpeg')
|
'extraction will be delegated to ffmpeg')
|
||||||
@ -112,7 +116,10 @@ class HlsFD(FragmentFD):
|
|||||||
count = 0
|
count = 0
|
||||||
while count <= fragment_retries:
|
while count <= fragment_retries:
|
||||||
try:
|
try:
|
||||||
success = ctx['dl'].download(frag_filename, {'url': frag_url})
|
success = ctx['dl'].download(frag_filename, {
|
||||||
|
'url': frag_url,
|
||||||
|
'http_headers': info_dict.get('http_headers'),
|
||||||
|
})
|
||||||
if not success:
|
if not success:
|
||||||
return False
|
return False
|
||||||
down, frag_sanitized = sanitize_open(frag_filename, 'rb')
|
down, frag_sanitized = sanitize_open(frag_filename, 'rb')
|
||||||
|
274
youtube_dl/downloader/ism.py
Normal file
274
youtube_dl/downloader/ism.py
Normal file
@ -0,0 +1,274 @@
|
|||||||
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
|
import os
|
||||||
|
import time
|
||||||
|
import struct
|
||||||
|
import binascii
|
||||||
|
import io
|
||||||
|
|
||||||
|
from .fragment import FragmentFD
|
||||||
|
from ..compat import compat_urllib_error
|
||||||
|
from ..utils import (
|
||||||
|
sanitize_open,
|
||||||
|
encodeFilename,
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
|
u8 = struct.Struct(b'>B')
|
||||||
|
u88 = struct.Struct(b'>Bx')
|
||||||
|
u16 = struct.Struct(b'>H')
|
||||||
|
u1616 = struct.Struct(b'>Hxx')
|
||||||
|
u32 = struct.Struct(b'>I')
|
||||||
|
u64 = struct.Struct(b'>Q')
|
||||||
|
|
||||||
|
s88 = struct.Struct(b'>bx')
|
||||||
|
s16 = struct.Struct(b'>h')
|
||||||
|
s1616 = struct.Struct(b'>hxx')
|
||||||
|
s32 = struct.Struct(b'>i')
|
||||||
|
|
||||||
|
unity_matrix = (s32.pack(0x10000) + s32.pack(0) * 3) * 2 + s32.pack(0x40000000)
|
||||||
|
|
||||||
|
TRACK_ENABLED = 0x1
|
||||||
|
TRACK_IN_MOVIE = 0x2
|
||||||
|
TRACK_IN_PREVIEW = 0x4
|
||||||
|
|
||||||
|
SELF_CONTAINED = 0x1
|
||||||
|
|
||||||
|
|
||||||
|
def box(box_type, payload):
|
||||||
|
return u32.pack(8 + len(payload)) + box_type + payload
|
||||||
|
|
||||||
|
|
||||||
|
def full_box(box_type, version, flags, payload):
|
||||||
|
return box(box_type, u8.pack(version) + u32.pack(flags)[1:] + payload)
|
||||||
|
|
||||||
|
|
||||||
|
def write_piff_header(stream, params):
|
||||||
|
track_id = params['track_id']
|
||||||
|
fourcc = params['fourcc']
|
||||||
|
duration = params['duration']
|
||||||
|
timescale = params.get('timescale', 10000000)
|
||||||
|
language = params.get('language', 'und')
|
||||||
|
height = params.get('height', 0)
|
||||||
|
width = params.get('width', 0)
|
||||||
|
is_audio = width == 0 and height == 0
|
||||||
|
creation_time = modification_time = int(time.time())
|
||||||
|
|
||||||
|
ftyp_payload = b'isml' # major brand
|
||||||
|
ftyp_payload += u32.pack(1) # minor version
|
||||||
|
ftyp_payload += b'piff' + b'iso2' # compatible brands
|
||||||
|
stream.write(box(b'ftyp', ftyp_payload)) # File Type Box
|
||||||
|
|
||||||
|
mvhd_payload = u64.pack(creation_time)
|
||||||
|
mvhd_payload += u64.pack(modification_time)
|
||||||
|
mvhd_payload += u32.pack(timescale)
|
||||||
|
mvhd_payload += u64.pack(duration)
|
||||||
|
mvhd_payload += s1616.pack(1) # rate
|
||||||
|
mvhd_payload += s88.pack(1) # volume
|
||||||
|
mvhd_payload += u16.pack(0) # reserved
|
||||||
|
mvhd_payload += u32.pack(0) * 2 # reserved
|
||||||
|
mvhd_payload += unity_matrix
|
||||||
|
mvhd_payload += u32.pack(0) * 6 # pre defined
|
||||||
|
mvhd_payload += u32.pack(0xffffffff) # next track id
|
||||||
|
moov_payload = full_box(b'mvhd', 1, 0, mvhd_payload) # Movie Header Box
|
||||||
|
|
||||||
|
tkhd_payload = u64.pack(creation_time)
|
||||||
|
tkhd_payload += u64.pack(modification_time)
|
||||||
|
tkhd_payload += u32.pack(track_id) # track id
|
||||||
|
tkhd_payload += u32.pack(0) # reserved
|
||||||
|
tkhd_payload += u64.pack(duration)
|
||||||
|
tkhd_payload += u32.pack(0) * 2 # reserved
|
||||||
|
tkhd_payload += s16.pack(0) # layer
|
||||||
|
tkhd_payload += s16.pack(0) # alternate group
|
||||||
|
tkhd_payload += s88.pack(1 if is_audio else 0) # volume
|
||||||
|
tkhd_payload += u16.pack(0) # reserved
|
||||||
|
tkhd_payload += unity_matrix
|
||||||
|
tkhd_payload += u1616.pack(width)
|
||||||
|
tkhd_payload += u1616.pack(height)
|
||||||
|
trak_payload = full_box(b'tkhd', 1, TRACK_ENABLED | TRACK_IN_MOVIE | TRACK_IN_PREVIEW, tkhd_payload) # Track Header Box
|
||||||
|
|
||||||
|
mdhd_payload = u64.pack(creation_time)
|
||||||
|
mdhd_payload += u64.pack(modification_time)
|
||||||
|
mdhd_payload += u32.pack(timescale)
|
||||||
|
mdhd_payload += u64.pack(duration)
|
||||||
|
mdhd_payload += u16.pack(((ord(language[0]) - 0x60) << 10) | ((ord(language[1]) - 0x60) << 5) | (ord(language[2]) - 0x60))
|
||||||
|
mdhd_payload += u16.pack(0) # pre defined
|
||||||
|
mdia_payload = full_box(b'mdhd', 1, 0, mdhd_payload) # Media Header Box
|
||||||
|
|
||||||
|
hdlr_payload = u32.pack(0) # pre defined
|
||||||
|
hdlr_payload += b'soun' if is_audio else b'vide' # handler type
|
||||||
|
hdlr_payload += u32.pack(0) * 3 # reserved
|
||||||
|
hdlr_payload += (b'Sound' if is_audio else b'Video') + b'Handler\0' # name
|
||||||
|
mdia_payload += full_box(b'hdlr', 0, 0, hdlr_payload) # Handler Reference Box
|
||||||
|
|
||||||
|
if is_audio:
|
||||||
|
smhd_payload = s88.pack(0) # balance
|
||||||
|
smhd_payload = u16.pack(0) # reserved
|
||||||
|
media_header_box = full_box(b'smhd', 0, 0, smhd_payload) # Sound Media Header
|
||||||
|
else:
|
||||||
|
vmhd_payload = u16.pack(0) # graphics mode
|
||||||
|
vmhd_payload += u16.pack(0) * 3 # opcolor
|
||||||
|
media_header_box = full_box(b'vmhd', 0, 1, vmhd_payload) # Video Media Header
|
||||||
|
minf_payload = media_header_box
|
||||||
|
|
||||||
|
dref_payload = u32.pack(1) # entry count
|
||||||
|
dref_payload += full_box(b'url ', 0, SELF_CONTAINED, b'') # Data Entry URL Box
|
||||||
|
dinf_payload = full_box(b'dref', 0, 0, dref_payload) # Data Reference Box
|
||||||
|
minf_payload += box(b'dinf', dinf_payload) # Data Information Box
|
||||||
|
|
||||||
|
stsd_payload = u32.pack(1) # entry count
|
||||||
|
|
||||||
|
sample_entry_payload = u8.pack(0) * 6 # reserved
|
||||||
|
sample_entry_payload += u16.pack(1) # data reference index
|
||||||
|
if is_audio:
|
||||||
|
sample_entry_payload += u32.pack(0) * 2 # reserved
|
||||||
|
sample_entry_payload += u16.pack(params.get('channels', 2))
|
||||||
|
sample_entry_payload += u16.pack(params.get('bits_per_sample', 16))
|
||||||
|
sample_entry_payload += u16.pack(0) # pre defined
|
||||||
|
sample_entry_payload += u16.pack(0) # reserved
|
||||||
|
sample_entry_payload += u1616.pack(params['sampling_rate'])
|
||||||
|
|
||||||
|
if fourcc == 'AACL':
|
||||||
|
sample_entry_box = box(b'mp4a', sample_entry_payload)
|
||||||
|
else:
|
||||||
|
sample_entry_payload = sample_entry_payload
|
||||||
|
sample_entry_payload += u16.pack(0) # pre defined
|
||||||
|
sample_entry_payload += u16.pack(0) # reserved
|
||||||
|
sample_entry_payload += u32.pack(0) * 3 # pre defined
|
||||||
|
sample_entry_payload += u16.pack(width)
|
||||||
|
sample_entry_payload += u16.pack(height)
|
||||||
|
sample_entry_payload += u1616.pack(0x48) # horiz resolution 72 dpi
|
||||||
|
sample_entry_payload += u1616.pack(0x48) # vert resolution 72 dpi
|
||||||
|
sample_entry_payload += u32.pack(0) # reserved
|
||||||
|
sample_entry_payload += u16.pack(1) # frame count
|
||||||
|
sample_entry_payload += u8.pack(0) * 32 # compressor name
|
||||||
|
sample_entry_payload += u16.pack(0x18) # depth
|
||||||
|
sample_entry_payload += s16.pack(-1) # pre defined
|
||||||
|
|
||||||
|
codec_private_data = binascii.unhexlify(params['codec_private_data'])
|
||||||
|
if fourcc in ('H264', 'AVC1'):
|
||||||
|
sps, pps = codec_private_data.split(u32.pack(1))[1:]
|
||||||
|
avcc_payload = u8.pack(1) # configuration version
|
||||||
|
avcc_payload += sps[1:4] # avc profile indication + profile compatibility + avc level indication
|
||||||
|
avcc_payload += u8.pack(0xfc | (params.get('nal_unit_length_field', 4) - 1)) # complete represenation (1) + reserved (11111) + length size minus one
|
||||||
|
avcc_payload += u8.pack(1) # reserved (0) + number of sps (0000001)
|
||||||
|
avcc_payload += u16.pack(len(sps))
|
||||||
|
avcc_payload += sps
|
||||||
|
avcc_payload += u8.pack(1) # number of pps
|
||||||
|
avcc_payload += u16.pack(len(pps))
|
||||||
|
avcc_payload += pps
|
||||||
|
sample_entry_payload += box(b'avcC', avcc_payload) # AVC Decoder Configuration Record
|
||||||
|
sample_entry_box = box(b'avc1', sample_entry_payload) # AVC Simple Entry
|
||||||
|
stsd_payload += sample_entry_box
|
||||||
|
|
||||||
|
stbl_payload = full_box(b'stsd', 0, 0, stsd_payload) # Sample Description Box
|
||||||
|
|
||||||
|
stts_payload = u32.pack(0) # entry count
|
||||||
|
stbl_payload += full_box(b'stts', 0, 0, stts_payload) # Decoding Time to Sample Box
|
||||||
|
|
||||||
|
stsc_payload = u32.pack(0) # entry count
|
||||||
|
stbl_payload += full_box(b'stsc', 0, 0, stsc_payload) # Sample To Chunk Box
|
||||||
|
|
||||||
|
stco_payload = u32.pack(0) # entry count
|
||||||
|
stbl_payload += full_box(b'stco', 0, 0, stco_payload) # Chunk Offset Box
|
||||||
|
|
||||||
|
minf_payload += box(b'stbl', stbl_payload) # Sample Table Box
|
||||||
|
|
||||||
|
mdia_payload += box(b'minf', minf_payload) # Media Information Box
|
||||||
|
|
||||||
|
trak_payload += box(b'mdia', mdia_payload) # Media Box
|
||||||
|
|
||||||
|
moov_payload += box(b'trak', trak_payload) # Track Box
|
||||||
|
|
||||||
|
mehd_payload = u64.pack(duration)
|
||||||
|
mvex_payload = full_box(b'mehd', 1, 0, mehd_payload) # Movie Extends Header Box
|
||||||
|
|
||||||
|
trex_payload = u32.pack(track_id) # track id
|
||||||
|
trex_payload += u32.pack(1) # default sample description index
|
||||||
|
trex_payload += u32.pack(0) # default sample duration
|
||||||
|
trex_payload += u32.pack(0) # default sample size
|
||||||
|
trex_payload += u32.pack(0) # default sample flags
|
||||||
|
mvex_payload += full_box(b'trex', 0, 0, trex_payload) # Track Extends Box
|
||||||
|
|
||||||
|
moov_payload += box(b'mvex', mvex_payload) # Movie Extends Box
|
||||||
|
stream.write(box(b'moov', moov_payload)) # Movie Box
|
||||||
|
|
||||||
|
|
||||||
|
def extract_box_data(data, box_sequence):
|
||||||
|
data_reader = io.BytesIO(data)
|
||||||
|
while True:
|
||||||
|
box_size = u32.unpack(data_reader.read(4))[0]
|
||||||
|
box_type = data_reader.read(4)
|
||||||
|
if box_type == box_sequence[0]:
|
||||||
|
box_data = data_reader.read(box_size - 8)
|
||||||
|
if len(box_sequence) == 1:
|
||||||
|
return box_data
|
||||||
|
return extract_box_data(box_data, box_sequence[1:])
|
||||||
|
data_reader.seek(box_size - 8, 1)
|
||||||
|
|
||||||
|
|
||||||
|
class IsmFD(FragmentFD):
|
||||||
|
"""
|
||||||
|
Download segments in a ISM manifest
|
||||||
|
"""
|
||||||
|
|
||||||
|
FD_NAME = 'ism'
|
||||||
|
|
||||||
|
def real_download(self, filename, info_dict):
|
||||||
|
segments = info_dict['fragments'][:1] if self.params.get(
|
||||||
|
'test', False) else info_dict['fragments']
|
||||||
|
|
||||||
|
ctx = {
|
||||||
|
'filename': filename,
|
||||||
|
'total_frags': len(segments),
|
||||||
|
}
|
||||||
|
|
||||||
|
self._prepare_and_start_frag_download(ctx)
|
||||||
|
|
||||||
|
segments_filenames = []
|
||||||
|
|
||||||
|
fragment_retries = self.params.get('fragment_retries', 0)
|
||||||
|
skip_unavailable_fragments = self.params.get('skip_unavailable_fragments', True)
|
||||||
|
|
||||||
|
track_written = False
|
||||||
|
for i, segment in enumerate(segments):
|
||||||
|
segment_url = segment['url']
|
||||||
|
segment_name = 'Frag%d' % i
|
||||||
|
target_filename = '%s-%s' % (ctx['tmpfilename'], segment_name)
|
||||||
|
count = 0
|
||||||
|
while count <= fragment_retries:
|
||||||
|
try:
|
||||||
|
success = ctx['dl'].download(target_filename, {
|
||||||
|
'url': segment_url,
|
||||||
|
'http_headers': info_dict.get('http_headers'),
|
||||||
|
})
|
||||||
|
if not success:
|
||||||
|
return False
|
||||||
|
down, target_sanitized = sanitize_open(target_filename, 'rb')
|
||||||
|
down_data = down.read()
|
||||||
|
if not track_written:
|
||||||
|
tfhd_data = extract_box_data(down_data, [b'moof', b'traf', b'tfhd'])
|
||||||
|
info_dict['_download_params']['track_id'] = u32.unpack(tfhd_data[4:8])[0]
|
||||||
|
write_piff_header(ctx['dest_stream'], info_dict['_download_params'])
|
||||||
|
track_written = True
|
||||||
|
ctx['dest_stream'].write(down_data)
|
||||||
|
down.close()
|
||||||
|
segments_filenames.append(target_sanitized)
|
||||||
|
break
|
||||||
|
except compat_urllib_error.HTTPError as err:
|
||||||
|
count += 1
|
||||||
|
if count <= fragment_retries:
|
||||||
|
self.report_retry_fragment(err, segment_name, count, fragment_retries)
|
||||||
|
if count > fragment_retries:
|
||||||
|
if skip_unavailable_fragments:
|
||||||
|
self.report_skip_fragment(segment_name)
|
||||||
|
continue
|
||||||
|
self.report_error('giving up after %s fragment retries' % fragment_retries)
|
||||||
|
return False
|
||||||
|
|
||||||
|
self._finish_frag_download(ctx)
|
||||||
|
|
||||||
|
for segment_file in segments_filenames:
|
||||||
|
os.remove(encodeFilename(segment_file))
|
||||||
|
|
||||||
|
return True
|
@ -102,16 +102,16 @@ class ABCIViewIE(InfoExtractor):
|
|||||||
|
|
||||||
# ABC iview programs are normally available for 14 days only.
|
# ABC iview programs are normally available for 14 days only.
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'http://iview.abc.net.au/programs/gardening-australia/FA1505V024S00',
|
'url': 'http://iview.abc.net.au/programs/diaries-of-a-broken-mind/ZX9735A001S00',
|
||||||
'md5': '979d10b2939101f0d27a06b79edad536',
|
'md5': 'cde42d728b3b7c2b32b1b94b4a548afc',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': 'FA1505V024S00',
|
'id': 'ZX9735A001S00',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Series 27 Ep 24',
|
'title': 'Diaries Of A Broken Mind',
|
||||||
'description': 'md5:b28baeae7504d1148e1d2f0e3ed3c15d',
|
'description': 'md5:7de3903874b7a1be279fe6b68718fc9e',
|
||||||
'upload_date': '20160820',
|
'upload_date': '20161010',
|
||||||
'uploader_id': 'abc1',
|
'uploader_id': 'abc2',
|
||||||
'timestamp': 1471719600,
|
'timestamp': 1476064920,
|
||||||
},
|
},
|
||||||
'skip': 'Video gone',
|
'skip': 'Video gone',
|
||||||
}]
|
}]
|
||||||
@ -121,7 +121,7 @@ class ABCIViewIE(InfoExtractor):
|
|||||||
webpage = self._download_webpage(url, video_id)
|
webpage = self._download_webpage(url, video_id)
|
||||||
video_params = self._parse_json(self._search_regex(
|
video_params = self._parse_json(self._search_regex(
|
||||||
r'videoParams\s*=\s*({.+?});', webpage, 'video params'), video_id)
|
r'videoParams\s*=\s*({.+?});', webpage, 'video params'), video_id)
|
||||||
title = video_params['title']
|
title = video_params.get('title') or video_params['seriesTitle']
|
||||||
stream = next(s for s in video_params['playlist'] if s.get('type') == 'program')
|
stream = next(s for s in video_params['playlist'] if s.get('type') == 'program')
|
||||||
|
|
||||||
formats = self._extract_akamai_formats(stream['hds-unmetered'], video_id)
|
formats = self._extract_akamai_formats(stream['hds-unmetered'], video_id)
|
||||||
@ -144,8 +144,8 @@ class ABCIViewIE(InfoExtractor):
|
|||||||
'timestamp': parse_iso8601(video_params.get('pubDate'), ' '),
|
'timestamp': parse_iso8601(video_params.get('pubDate'), ' '),
|
||||||
'series': video_params.get('seriesTitle'),
|
'series': video_params.get('seriesTitle'),
|
||||||
'series_id': video_params.get('seriesHouseNumber') or video_id[:7],
|
'series_id': video_params.get('seriesHouseNumber') or video_id[:7],
|
||||||
'episode_number': int_or_none(self._html_search_meta('episodeNumber', webpage)),
|
'episode_number': int_or_none(self._html_search_meta('episodeNumber', webpage, default=None)),
|
||||||
'episode': self._html_search_meta('episode_title', webpage),
|
'episode': self._html_search_meta('episode_title', webpage, default=None),
|
||||||
'uploader_id': video_params.get('channel'),
|
'uploader_id': video_params.get('channel'),
|
||||||
'formats': formats,
|
'formats': formats,
|
||||||
'subtitles': subtitles,
|
'subtitles': subtitles,
|
||||||
|
@ -23,7 +23,7 @@ class AbcNewsVideoIE(AMPIE):
|
|||||||
'title': '\'This Week\' Exclusive: Iran\'s Foreign Minister Zarif',
|
'title': '\'This Week\' Exclusive: Iran\'s Foreign Minister Zarif',
|
||||||
'description': 'George Stephanopoulos goes one-on-one with Iranian Foreign Minister Dr. Javad Zarif.',
|
'description': 'George Stephanopoulos goes one-on-one with Iranian Foreign Minister Dr. Javad Zarif.',
|
||||||
'duration': 180,
|
'duration': 180,
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
},
|
},
|
||||||
'params': {
|
'params': {
|
||||||
# m3u8 download
|
# m3u8 download
|
||||||
@ -59,7 +59,7 @@ class AbcNewsIE(InfoExtractor):
|
|||||||
'display_id': 'dramatic-video-rare-death-job-america',
|
'display_id': 'dramatic-video-rare-death-job-america',
|
||||||
'title': 'Occupational Hazards',
|
'title': 'Occupational Hazards',
|
||||||
'description': 'Nightline investigates the dangers that lurk at various jobs.',
|
'description': 'Nightline investigates the dangers that lurk at various jobs.',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
'upload_date': '20100428',
|
'upload_date': '20100428',
|
||||||
'timestamp': 1272412800,
|
'timestamp': 1272412800,
|
||||||
},
|
},
|
||||||
|
@ -23,7 +23,7 @@ class ABCOTVSIE(InfoExtractor):
|
|||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'East Bay museum celebrates vintage synthesizers',
|
'title': 'East Bay museum celebrates vintage synthesizers',
|
||||||
'description': 'md5:a4f10fb2f2a02565c1749d4adbab4b10',
|
'description': 'md5:a4f10fb2f2a02565c1749d4adbab4b10',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
'timestamp': 1421123075,
|
'timestamp': 1421123075,
|
||||||
'upload_date': '20150113',
|
'upload_date': '20150113',
|
||||||
'uploader': 'Jonathan Bloom',
|
'uploader': 'Jonathan Bloom',
|
||||||
|
@ -8,6 +8,7 @@ from .common import InfoExtractor
|
|||||||
from ..compat import compat_str
|
from ..compat import compat_str
|
||||||
from ..utils import (
|
from ..utils import (
|
||||||
int_or_none,
|
int_or_none,
|
||||||
|
parse_iso8601,
|
||||||
OnDemandPagedList,
|
OnDemandPagedList,
|
||||||
)
|
)
|
||||||
|
|
||||||
@ -15,18 +16,33 @@ from ..utils import (
|
|||||||
class ACastIE(InfoExtractor):
|
class ACastIE(InfoExtractor):
|
||||||
IE_NAME = 'acast'
|
IE_NAME = 'acast'
|
||||||
_VALID_URL = r'https?://(?:www\.)?acast\.com/(?P<channel>[^/]+)/(?P<id>[^/#?]+)'
|
_VALID_URL = r'https?://(?:www\.)?acast\.com/(?P<channel>[^/]+)/(?P<id>[^/#?]+)'
|
||||||
_TEST = {
|
_TESTS = [{
|
||||||
|
# test with one bling
|
||||||
'url': 'https://www.acast.com/condenasttraveler/-where-are-you-taipei-101-taiwan',
|
'url': 'https://www.acast.com/condenasttraveler/-where-are-you-taipei-101-taiwan',
|
||||||
'md5': 'ada3de5a1e3a2a381327d749854788bb',
|
'md5': 'ada3de5a1e3a2a381327d749854788bb',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '57de3baa-4bb0-487e-9418-2692c1277a34',
|
'id': '57de3baa-4bb0-487e-9418-2692c1277a34',
|
||||||
'ext': 'mp3',
|
'ext': 'mp3',
|
||||||
'title': '"Where Are You?": Taipei 101, Taiwan',
|
'title': '"Where Are You?": Taipei 101, Taiwan',
|
||||||
'timestamp': 1196172000000,
|
'timestamp': 1196172000,
|
||||||
|
'upload_date': '20071127',
|
||||||
'description': 'md5:a0b4ef3634e63866b542e5b1199a1a0e',
|
'description': 'md5:a0b4ef3634e63866b542e5b1199a1a0e',
|
||||||
'duration': 211,
|
'duration': 211,
|
||||||
}
|
}
|
||||||
|
}, {
|
||||||
|
# test with multiple blings
|
||||||
|
'url': 'https://www.acast.com/sparpodcast/2.raggarmordet-rosterurdetforflutna',
|
||||||
|
'md5': '55c0097badd7095f494c99a172f86501',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '2a92b283-1a75-4ad8-8396-499c641de0d9',
|
||||||
|
'ext': 'mp3',
|
||||||
|
'title': '2. Raggarmordet - Röster ur det förflutna',
|
||||||
|
'timestamp': 1477346700,
|
||||||
|
'upload_date': '20161024',
|
||||||
|
'description': 'md5:4f81f6d8cf2e12ee21a321d8bca32db4',
|
||||||
|
'duration': 2797,
|
||||||
}
|
}
|
||||||
|
}]
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
channel, display_id = re.match(self._VALID_URL, url).groups()
|
channel, display_id = re.match(self._VALID_URL, url).groups()
|
||||||
@ -35,11 +51,11 @@ class ACastIE(InfoExtractor):
|
|||||||
return {
|
return {
|
||||||
'id': compat_str(cast_data['id']),
|
'id': compat_str(cast_data['id']),
|
||||||
'display_id': display_id,
|
'display_id': display_id,
|
||||||
'url': cast_data['blings'][0]['audio'],
|
'url': [b['audio'] for b in cast_data['blings'] if b['type'] == 'BlingAudio'][0],
|
||||||
'title': cast_data['name'],
|
'title': cast_data['name'],
|
||||||
'description': cast_data.get('description'),
|
'description': cast_data.get('description'),
|
||||||
'thumbnail': cast_data.get('image'),
|
'thumbnail': cast_data.get('image'),
|
||||||
'timestamp': int_or_none(cast_data.get('publishingDate')),
|
'timestamp': parse_iso8601(cast_data.get('publishingDate')),
|
||||||
'duration': int_or_none(cast_data.get('duration')),
|
'duration': int_or_none(cast_data.get('duration')),
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -26,6 +26,21 @@ MSO_INFO = {
|
|||||||
'username_field': 'UserName',
|
'username_field': 'UserName',
|
||||||
'password_field': 'UserPassword',
|
'password_field': 'UserPassword',
|
||||||
},
|
},
|
||||||
|
'Comcast_SSO': {
|
||||||
|
'name': 'Comcast XFINITY',
|
||||||
|
'username_field': 'user',
|
||||||
|
'password_field': 'passwd',
|
||||||
|
},
|
||||||
|
'TWC': {
|
||||||
|
'name': 'Time Warner Cable | Spectrum',
|
||||||
|
'username_field': 'Ecom_User_ID',
|
||||||
|
'password_field': 'Ecom_Password',
|
||||||
|
},
|
||||||
|
'Charter_Direct': {
|
||||||
|
'name': 'Charter Spectrum',
|
||||||
|
'username_field': 'IDToken1',
|
||||||
|
'password_field': 'IDToken2',
|
||||||
|
},
|
||||||
'thr030': {
|
'thr030': {
|
||||||
'name': '3 Rivers Communications'
|
'name': '3 Rivers Communications'
|
||||||
},
|
},
|
||||||
@ -1364,6 +1379,45 @@ class AdobePassIE(InfoExtractor):
|
|||||||
'domain_name': 'adobe.com',
|
'domain_name': 'adobe.com',
|
||||||
'redirect_url': url,
|
'redirect_url': url,
|
||||||
})
|
})
|
||||||
|
|
||||||
|
if mso_id == 'Comcast_SSO':
|
||||||
|
# Comcast page flow varies by video site and whether you
|
||||||
|
# are on Comcast's network.
|
||||||
|
provider_redirect_page, urlh = provider_redirect_page_res
|
||||||
|
# Check for Comcast auto login
|
||||||
|
if 'automatically signing you in' in provider_redirect_page:
|
||||||
|
oauth_redirect_url = self._html_search_regex(
|
||||||
|
r'window\.location\s*=\s*[\'"]([^\'"]+)',
|
||||||
|
provider_redirect_page, 'oauth redirect')
|
||||||
|
# Just need to process the request. No useful data comes back
|
||||||
|
self._download_webpage(
|
||||||
|
oauth_redirect_url, video_id, 'Confirming auto login')
|
||||||
|
else:
|
||||||
|
if '<form name="signin"' in provider_redirect_page:
|
||||||
|
# already have the form, just fill it
|
||||||
|
provider_login_page_res = provider_redirect_page_res
|
||||||
|
elif 'http-equiv="refresh"' in provider_redirect_page:
|
||||||
|
# redirects to the login page
|
||||||
|
oauth_redirect_url = self._html_search_regex(
|
||||||
|
r'content="0;\s*url=([^\'"]+)',
|
||||||
|
provider_redirect_page, 'meta refresh redirect')
|
||||||
|
provider_login_page_res = self._download_webpage_handle(
|
||||||
|
oauth_redirect_url,
|
||||||
|
video_id, 'Downloading Provider Login Page')
|
||||||
|
else:
|
||||||
|
provider_login_page_res = post_form(
|
||||||
|
provider_redirect_page_res, 'Downloading Provider Login Page')
|
||||||
|
|
||||||
|
mvpd_confirm_page_res = post_form(provider_login_page_res, 'Logging in', {
|
||||||
|
mso_info.get('username_field', 'username'): username,
|
||||||
|
mso_info.get('password_field', 'password'): password,
|
||||||
|
})
|
||||||
|
mvpd_confirm_page, urlh = mvpd_confirm_page_res
|
||||||
|
if '<button class="submit" value="Resume">Resume</button>' in mvpd_confirm_page:
|
||||||
|
post_form(mvpd_confirm_page_res, 'Confirming Login')
|
||||||
|
|
||||||
|
else:
|
||||||
|
# Normal, non-Comcast flow
|
||||||
provider_login_page_res = post_form(
|
provider_login_page_res = post_form(
|
||||||
provider_redirect_page_res, 'Downloading Provider Login Page')
|
provider_redirect_page_res, 'Downloading Provider Login Page')
|
||||||
mvpd_confirm_page_res = post_form(provider_login_page_res, 'Logging in', {
|
mvpd_confirm_page_res = post_form(provider_login_page_res, 'Logging in', {
|
||||||
|
@ -30,7 +30,7 @@ class AdobeTVIE(AdobeTVBaseIE):
|
|||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Quick Tip - How to Draw a Circle Around an Object in Photoshop',
|
'title': 'Quick Tip - How to Draw a Circle Around an Object in Photoshop',
|
||||||
'description': 'md5:99ec318dc909d7ba2a1f2b038f7d2311',
|
'description': 'md5:99ec318dc909d7ba2a1f2b038f7d2311',
|
||||||
'thumbnail': 're:https?://.*\.jpg$',
|
'thumbnail': r're:https?://.*\.jpg$',
|
||||||
'upload_date': '20110914',
|
'upload_date': '20110914',
|
||||||
'duration': 60,
|
'duration': 60,
|
||||||
'view_count': int,
|
'view_count': int,
|
||||||
|
@ -96,6 +96,27 @@ class AdultSwimIE(TurnerBaseIE):
|
|||||||
'skip_download': True,
|
'skip_download': True,
|
||||||
},
|
},
|
||||||
'expected_warnings': ['Unable to download f4m manifest'],
|
'expected_warnings': ['Unable to download f4m manifest'],
|
||||||
|
}, {
|
||||||
|
'url': 'http://www.adultswim.com/videos/toonami/friday-october-14th-2016/',
|
||||||
|
'info_dict': {
|
||||||
|
'id': 'eYiLsKVgQ6qTC6agD67Sig',
|
||||||
|
'title': 'Toonami - Friday, October 14th, 2016',
|
||||||
|
'description': 'md5:99892c96ffc85e159a428de85c30acde',
|
||||||
|
},
|
||||||
|
'playlist': [{
|
||||||
|
'md5': '',
|
||||||
|
'info_dict': {
|
||||||
|
'id': 'eYiLsKVgQ6qTC6agD67Sig',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'Toonami - Friday, October 14th, 2016',
|
||||||
|
'description': 'md5:99892c96ffc85e159a428de85c30acde',
|
||||||
|
},
|
||||||
|
}],
|
||||||
|
'params': {
|
||||||
|
# m3u8 download
|
||||||
|
'skip_download': True,
|
||||||
|
},
|
||||||
|
'expected_warnings': ['Unable to download f4m manifest'],
|
||||||
}]
|
}]
|
||||||
|
|
||||||
@staticmethod
|
@staticmethod
|
||||||
@ -163,6 +184,8 @@ class AdultSwimIE(TurnerBaseIE):
|
|||||||
segment_ids = [clip['videoPlaybackID'] for clip in video_info['clips']]
|
segment_ids = [clip['videoPlaybackID'] for clip in video_info['clips']]
|
||||||
elif video_info.get('videoPlaybackID'):
|
elif video_info.get('videoPlaybackID'):
|
||||||
segment_ids = [video_info['videoPlaybackID']]
|
segment_ids = [video_info['videoPlaybackID']]
|
||||||
|
elif video_info.get('id'):
|
||||||
|
segment_ids = [video_info['id']]
|
||||||
else:
|
else:
|
||||||
if video_info.get('auth') is True:
|
if video_info.get('auth') is True:
|
||||||
raise ExtractorError(
|
raise ExtractorError(
|
||||||
|
@ -23,10 +23,10 @@ class AENetworksBaseIE(ThePlatformIE):
|
|||||||
class AENetworksIE(AENetworksBaseIE):
|
class AENetworksIE(AENetworksBaseIE):
|
||||||
IE_NAME = 'aenetworks'
|
IE_NAME = 'aenetworks'
|
||||||
IE_DESC = 'A+E Networks: A&E, Lifetime, History.com, FYI Network'
|
IE_DESC = 'A+E Networks: A&E, Lifetime, History.com, FYI Network'
|
||||||
_VALID_URL = r'https?://(?:www\.)?(?P<domain>(?:history|aetv|mylifetime)\.com|fyi\.tv)/(?:shows/(?P<show_path>[^/]+(?:/[^/]+){0,2})|movies/(?P<movie_display_id>[^/]+)/full-movie)'
|
_VALID_URL = r'https?://(?:www\.)?(?P<domain>(?:history|aetv|mylifetime|lifetimemovieclub)\.com|fyi\.tv)/(?:shows/(?P<show_path>[^/]+(?:/[^/]+){0,2})|movies/(?P<movie_display_id>[^/]+)(?:/full-movie)?)'
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'http://www.history.com/shows/mountain-men/season-1/episode-1',
|
'url': 'http://www.history.com/shows/mountain-men/season-1/episode-1',
|
||||||
'md5': '8ff93eb073449f151d6b90c0ae1ef0c7',
|
'md5': 'a97a65f7e823ae10e9244bc5433d5fe6',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '22253814',
|
'id': '22253814',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
@ -62,11 +62,15 @@ class AENetworksIE(AENetworksBaseIE):
|
|||||||
}, {
|
}, {
|
||||||
'url': 'http://www.mylifetime.com/movies/center-stage-on-pointe/full-movie',
|
'url': 'http://www.mylifetime.com/movies/center-stage-on-pointe/full-movie',
|
||||||
'only_matching': True
|
'only_matching': True
|
||||||
|
}, {
|
||||||
|
'url': 'https://www.lifetimemovieclub.com/movies/a-killer-among-us',
|
||||||
|
'only_matching': True
|
||||||
}]
|
}]
|
||||||
_DOMAIN_TO_REQUESTOR_ID = {
|
_DOMAIN_TO_REQUESTOR_ID = {
|
||||||
'history.com': 'HISTORY',
|
'history.com': 'HISTORY',
|
||||||
'aetv.com': 'AETV',
|
'aetv.com': 'AETV',
|
||||||
'mylifetime.com': 'LIFETIME',
|
'mylifetime.com': 'LIFETIME',
|
||||||
|
'lifetimemovieclub.com': 'LIFETIMEMOVIECLUB',
|
||||||
'fyi.tv': 'FYI',
|
'fyi.tv': 'FYI',
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -87,7 +91,7 @@ class AENetworksIE(AENetworksBaseIE):
|
|||||||
self._html_search_meta('aetn:SeriesTitle', webpage))
|
self._html_search_meta('aetn:SeriesTitle', webpage))
|
||||||
elif url_parts_len == 2:
|
elif url_parts_len == 2:
|
||||||
entries = []
|
entries = []
|
||||||
for episode_item in re.findall(r'(?s)<div[^>]+class="[^"]*episode-item[^"]*"[^>]*>', webpage):
|
for episode_item in re.findall(r'(?s)<[^>]+class="[^"]*(?:episode|program)-item[^"]*"[^>]*>', webpage):
|
||||||
episode_attributes = extract_attributes(episode_item)
|
episode_attributes = extract_attributes(episode_item)
|
||||||
episode_url = compat_urlparse.urljoin(
|
episode_url = compat_urlparse.urljoin(
|
||||||
url, episode_attributes['data-canonical'])
|
url, episode_attributes['data-canonical'])
|
||||||
@ -99,7 +103,7 @@ class AENetworksIE(AENetworksBaseIE):
|
|||||||
|
|
||||||
query = {
|
query = {
|
||||||
'mbr': 'true',
|
'mbr': 'true',
|
||||||
'assetTypes': 'medium_video_s3'
|
'assetTypes': 'high_video_s3'
|
||||||
}
|
}
|
||||||
video_id = self._html_search_meta('aetn:VideoID', webpage)
|
video_id = self._html_search_meta('aetn:VideoID', webpage)
|
||||||
media_url = self._search_regex(
|
media_url = self._search_regex(
|
||||||
@ -155,7 +159,7 @@ class HistoryTopicIE(AENetworksBaseIE):
|
|||||||
'id': 'world-war-i-history',
|
'id': 'world-war-i-history',
|
||||||
'title': 'World War I History',
|
'title': 'World War I History',
|
||||||
},
|
},
|
||||||
'playlist_mincount': 24,
|
'playlist_mincount': 23,
|
||||||
}, {
|
}, {
|
||||||
'url': 'http://www.history.com/topics/world-war-i-history/videos',
|
'url': 'http://www.history.com/topics/world-war-i-history/videos',
|
||||||
'only_matching': True,
|
'only_matching': True,
|
||||||
@ -193,7 +197,8 @@ class HistoryTopicIE(AENetworksBaseIE):
|
|||||||
return self.theplatform_url_result(
|
return self.theplatform_url_result(
|
||||||
release_url, video_id, {
|
release_url, video_id, {
|
||||||
'mbr': 'true',
|
'mbr': 'true',
|
||||||
'switch': 'hls'
|
'switch': 'hls',
|
||||||
|
'assetTypes': 'high_video_ak',
|
||||||
})
|
})
|
||||||
else:
|
else:
|
||||||
webpage = self._download_webpage(url, topic_id)
|
webpage = self._download_webpage(url, topic_id)
|
||||||
@ -203,6 +208,7 @@ class HistoryTopicIE(AENetworksBaseIE):
|
|||||||
entries.append(self.theplatform_url_result(
|
entries.append(self.theplatform_url_result(
|
||||||
video_attributes['data-release-url'], video_attributes['data-id'], {
|
video_attributes['data-release-url'], video_attributes['data-id'], {
|
||||||
'mbr': 'true',
|
'mbr': 'true',
|
||||||
'switch': 'hls'
|
'switch': 'hls',
|
||||||
|
'assetTypes': 'high_video_ak',
|
||||||
}))
|
}))
|
||||||
return self.playlist_result(entries, topic_id, get_element_by_attribute('class', 'show-title', webpage))
|
return self.playlist_result(entries, topic_id, get_element_by_attribute('class', 'show-title', webpage))
|
||||||
|
@ -11,19 +11,27 @@ from ..compat import (
|
|||||||
from ..utils import (
|
from ..utils import (
|
||||||
ExtractorError,
|
ExtractorError,
|
||||||
int_or_none,
|
int_or_none,
|
||||||
|
update_url_query,
|
||||||
xpath_element,
|
xpath_element,
|
||||||
xpath_text,
|
xpath_text,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
class AfreecaTVIE(InfoExtractor):
|
class AfreecaTVIE(InfoExtractor):
|
||||||
|
IE_NAME = 'afreecatv'
|
||||||
IE_DESC = 'afreecatv.com'
|
IE_DESC = 'afreecatv.com'
|
||||||
_VALID_URL = r'''(?x)^
|
_VALID_URL = r'''(?x)
|
||||||
https?://(?:(live|afbbs|www)\.)?afreeca(?:tv)?\.com(?::\d+)?
|
https?://
|
||||||
|
(?:
|
||||||
|
(?:(?:live|afbbs|www)\.)?afreeca(?:tv)?\.com(?::\d+)?
|
||||||
(?:
|
(?:
|
||||||
/app/(?:index|read_ucc_bbs)\.cgi|
|
/app/(?:index|read_ucc_bbs)\.cgi|
|
||||||
/player/[Pp]layer\.(?:swf|html))
|
/player/[Pp]layer\.(?:swf|html)
|
||||||
\?.*?\bnTitleNo=(?P<id>\d+)'''
|
)\?.*?\bnTitleNo=|
|
||||||
|
vod\.afreecatv\.com/PLAYER/STATION/
|
||||||
|
)
|
||||||
|
(?P<id>\d+)
|
||||||
|
'''
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'http://live.afreecatv.com:8079/app/index.cgi?szType=read_ucc_bbs&szBjId=dailyapril&nStationNo=16711924&nBbsNo=18605867&nTitleNo=36164052&szSkin=',
|
'url': 'http://live.afreecatv.com:8079/app/index.cgi?szType=read_ucc_bbs&szBjId=dailyapril&nStationNo=16711924&nBbsNo=18605867&nTitleNo=36164052&szSkin=',
|
||||||
'md5': 'f72c89fe7ecc14c1b5ce506c4996046e',
|
'md5': 'f72c89fe7ecc14c1b5ce506c4996046e',
|
||||||
@ -66,6 +74,9 @@ class AfreecaTVIE(InfoExtractor):
|
|||||||
}, {
|
}, {
|
||||||
'url': 'http://www.afreecatv.com/player/Player.swf?szType=szBjId=djleegoon&nStationNo=11273158&nBbsNo=13161095&nTitleNo=36327652',
|
'url': 'http://www.afreecatv.com/player/Player.swf?szType=szBjId=djleegoon&nStationNo=11273158&nBbsNo=13161095&nTitleNo=36327652',
|
||||||
'only_matching': True,
|
'only_matching': True,
|
||||||
|
}, {
|
||||||
|
'url': 'http://vod.afreecatv.com/PLAYER/STATION/15055030',
|
||||||
|
'only_matching': True,
|
||||||
}]
|
}]
|
||||||
|
|
||||||
@staticmethod
|
@staticmethod
|
||||||
@ -83,7 +94,9 @@ class AfreecaTVIE(InfoExtractor):
|
|||||||
info_url = compat_urlparse.urlunparse(parsed_url._replace(
|
info_url = compat_urlparse.urlunparse(parsed_url._replace(
|
||||||
netloc='afbbs.afreecatv.com:8080',
|
netloc='afbbs.afreecatv.com:8080',
|
||||||
path='/api/video/get_video_info.php'))
|
path='/api/video/get_video_info.php'))
|
||||||
video_xml = self._download_xml(info_url, video_id)
|
|
||||||
|
video_xml = self._download_xml(
|
||||||
|
update_url_query(info_url, {'nTitleNo': video_id}), video_id)
|
||||||
|
|
||||||
if xpath_element(video_xml, './track/video/file') is None:
|
if xpath_element(video_xml, './track/video/file') is None:
|
||||||
raise ExtractorError('Specified AfreecaTV video does not exist',
|
raise ExtractorError('Specified AfreecaTV video does not exist',
|
||||||
@ -131,3 +144,107 @@ class AfreecaTVIE(InfoExtractor):
|
|||||||
expected=True)
|
expected=True)
|
||||||
|
|
||||||
return info
|
return info
|
||||||
|
|
||||||
|
|
||||||
|
class AfreecaTVGlobalIE(AfreecaTVIE):
|
||||||
|
IE_NAME = 'afreecatv:global'
|
||||||
|
_VALID_URL = r'https?://(?:www\.)?afreeca\.tv/(?P<channel_id>\d+)(?:/v/(?P<video_id>\d+))?'
|
||||||
|
_TESTS = [{
|
||||||
|
'url': 'http://afreeca.tv/36853014/v/58301',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '58301',
|
||||||
|
'title': 'tryhard top100',
|
||||||
|
'uploader_id': '36853014',
|
||||||
|
'uploader': 'makgi Hearthstone Live!',
|
||||||
|
},
|
||||||
|
'playlist_count': 3,
|
||||||
|
}]
|
||||||
|
|
||||||
|
def _real_extract(self, url):
|
||||||
|
channel_id, video_id = re.match(self._VALID_URL, url).groups()
|
||||||
|
video_type = 'video' if video_id else 'live'
|
||||||
|
query = {
|
||||||
|
'pt': 'view',
|
||||||
|
'bid': channel_id,
|
||||||
|
}
|
||||||
|
if video_id:
|
||||||
|
query['vno'] = video_id
|
||||||
|
video_data = self._download_json(
|
||||||
|
'http://api.afreeca.tv/%s/view_%s.php' % (video_type, video_type),
|
||||||
|
video_id or channel_id, query=query)['channel']
|
||||||
|
|
||||||
|
if video_data.get('result') != 1:
|
||||||
|
raise ExtractorError('%s said: %s' % (self.IE_NAME, video_data['remsg']))
|
||||||
|
|
||||||
|
title = video_data['title']
|
||||||
|
|
||||||
|
info = {
|
||||||
|
'thumbnail': video_data.get('thumb'),
|
||||||
|
'view_count': int_or_none(video_data.get('vcnt')),
|
||||||
|
'age_limit': int_or_none(video_data.get('grade')),
|
||||||
|
'uploader_id': channel_id,
|
||||||
|
'uploader': video_data.get('cname'),
|
||||||
|
}
|
||||||
|
|
||||||
|
if video_id:
|
||||||
|
entries = []
|
||||||
|
for i, f in enumerate(video_data.get('flist', [])):
|
||||||
|
video_key = self.parse_video_key(f.get('key', ''))
|
||||||
|
f_url = f.get('file')
|
||||||
|
if not video_key or not f_url:
|
||||||
|
continue
|
||||||
|
entries.append({
|
||||||
|
'id': '%s_%s' % (video_id, video_key.get('part', i + 1)),
|
||||||
|
'title': title,
|
||||||
|
'upload_date': video_key.get('upload_date'),
|
||||||
|
'duration': int_or_none(f.get('length')),
|
||||||
|
'url': f_url,
|
||||||
|
'protocol': 'm3u8_native',
|
||||||
|
'ext': 'mp4',
|
||||||
|
})
|
||||||
|
|
||||||
|
info.update({
|
||||||
|
'id': video_id,
|
||||||
|
'title': title,
|
||||||
|
'duration': int_or_none(video_data.get('length')),
|
||||||
|
})
|
||||||
|
if len(entries) > 1:
|
||||||
|
info['_type'] = 'multi_video'
|
||||||
|
info['entries'] = entries
|
||||||
|
elif len(entries) == 1:
|
||||||
|
i = entries[0].copy()
|
||||||
|
i.update(info)
|
||||||
|
info = i
|
||||||
|
else:
|
||||||
|
formats = []
|
||||||
|
for s in video_data.get('strm', []):
|
||||||
|
s_url = s.get('purl')
|
||||||
|
if not s_url:
|
||||||
|
continue
|
||||||
|
stype = s.get('stype')
|
||||||
|
if stype == 'HLS':
|
||||||
|
formats.extend(self._extract_m3u8_formats(
|
||||||
|
s_url, channel_id, 'mp4', m3u8_id=stype, fatal=False))
|
||||||
|
elif stype == 'RTMP':
|
||||||
|
format_id = [stype]
|
||||||
|
label = s.get('label')
|
||||||
|
if label:
|
||||||
|
format_id.append(label)
|
||||||
|
formats.append({
|
||||||
|
'format_id': '-'.join(format_id),
|
||||||
|
'url': s_url,
|
||||||
|
'tbr': int_or_none(s.get('bps')),
|
||||||
|
'height': int_or_none(s.get('brt')),
|
||||||
|
'ext': 'flv',
|
||||||
|
'rtmp_live': True,
|
||||||
|
})
|
||||||
|
self._sort_formats(formats)
|
||||||
|
|
||||||
|
info.update({
|
||||||
|
'id': channel_id,
|
||||||
|
'title': self._live_title(title),
|
||||||
|
'is_live': True,
|
||||||
|
'formats': formats,
|
||||||
|
})
|
||||||
|
|
||||||
|
return info
|
||||||
|
@ -20,7 +20,7 @@ class AirMozillaIE(InfoExtractor):
|
|||||||
'id': '6x4q2w',
|
'id': '6x4q2w',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Privacy Lab - a meetup for privacy minded people in San Francisco',
|
'title': 'Privacy Lab - a meetup for privacy minded people in San Francisco',
|
||||||
'thumbnail': 're:https?://vid\.ly/(?P<id>[0-9a-z-]+)/poster',
|
'thumbnail': r're:https?://vid\.ly/(?P<id>[0-9a-z-]+)/poster',
|
||||||
'description': 'Brings together privacy professionals and others interested in privacy at for-profits, non-profits, and NGOs in an effort to contribute to the state of the ecosystem...',
|
'description': 'Brings together privacy professionals and others interested in privacy at for-profits, non-profits, and NGOs in an effort to contribute to the state of the ecosystem...',
|
||||||
'timestamp': 1422487800,
|
'timestamp': 1422487800,
|
||||||
'upload_date': '20150128',
|
'upload_date': '20150128',
|
||||||
|
@ -1,94 +1,109 @@
|
|||||||
# coding: utf-8
|
# coding: utf-8
|
||||||
from __future__ import unicode_literals
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
import re
|
|
||||||
import json
|
|
||||||
|
|
||||||
from .common import InfoExtractor
|
from .common import InfoExtractor
|
||||||
from ..compat import compat_str
|
|
||||||
from ..utils import (
|
from ..utils import (
|
||||||
|
remove_end,
|
||||||
qualities,
|
qualities,
|
||||||
unescapeHTML,
|
url_basename,
|
||||||
xpath_element,
|
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
class AllocineIE(InfoExtractor):
|
class AllocineIE(InfoExtractor):
|
||||||
_VALID_URL = r'https?://(?:www\.)?allocine\.fr/(?P<typ>article|video|film)/(fichearticle_gen_carticle=|player_gen_cmedia=|fichefilm_gen_cfilm=|video-)(?P<id>[0-9]+)(?:\.html)?'
|
_VALID_URL = r'https?://(?:www\.)?allocine\.fr/(?:article|video|film)/(?:fichearticle_gen_carticle=|player_gen_cmedia=|fichefilm_gen_cfilm=|video-)(?P<id>[0-9]+)(?:\.html)?'
|
||||||
|
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'http://www.allocine.fr/article/fichearticle_gen_carticle=18635087.html',
|
'url': 'http://www.allocine.fr/article/fichearticle_gen_carticle=18635087.html',
|
||||||
'md5': '0c9fcf59a841f65635fa300ac43d8269',
|
'md5': '0c9fcf59a841f65635fa300ac43d8269',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '19546517',
|
'id': '19546517',
|
||||||
|
'display_id': '18635087',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Astérix - Le Domaine des Dieux Teaser VF',
|
'title': 'Astérix - Le Domaine des Dieux Teaser VF',
|
||||||
'description': 'md5:abcd09ce503c6560512c14ebfdb720d2',
|
'description': 'md5:4a754271d9c6f16c72629a8a993ee884',
|
||||||
'thumbnail': 're:http://.*\.jpg',
|
'thumbnail': r're:http://.*\.jpg',
|
||||||
},
|
},
|
||||||
}, {
|
}, {
|
||||||
'url': 'http://www.allocine.fr/video/player_gen_cmedia=19540403&cfilm=222257.html',
|
'url': 'http://www.allocine.fr/video/player_gen_cmedia=19540403&cfilm=222257.html',
|
||||||
'md5': 'd0cdce5d2b9522ce279fdfec07ff16e0',
|
'md5': 'd0cdce5d2b9522ce279fdfec07ff16e0',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '19540403',
|
'id': '19540403',
|
||||||
|
'display_id': '19540403',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Planes 2 Bande-annonce VF',
|
'title': 'Planes 2 Bande-annonce VF',
|
||||||
'description': 'Regardez la bande annonce du film Planes 2 (Planes 2 Bande-annonce VF). Planes 2, un film de Roberts Gannaway',
|
'description': 'Regardez la bande annonce du film Planes 2 (Planes 2 Bande-annonce VF). Planes 2, un film de Roberts Gannaway',
|
||||||
'thumbnail': 're:http://.*\.jpg',
|
'thumbnail': r're:http://.*\.jpg',
|
||||||
},
|
},
|
||||||
}, {
|
}, {
|
||||||
'url': 'http://www.allocine.fr/film/fichefilm_gen_cfilm=181290.html',
|
'url': 'http://www.allocine.fr/video/player_gen_cmedia=19544709&cfilm=181290.html',
|
||||||
'md5': '101250fb127ef9ca3d73186ff22a47ce',
|
'md5': '101250fb127ef9ca3d73186ff22a47ce',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '19544709',
|
'id': '19544709',
|
||||||
|
'display_id': '19544709',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Dragons 2 - Bande annonce finale VF',
|
'title': 'Dragons 2 - Bande annonce finale VF',
|
||||||
'description': 'md5:601d15393ac40f249648ef000720e7e3',
|
'description': 'md5:6cdd2d7c2687d4c6aafe80a35e17267a',
|
||||||
'thumbnail': 're:http://.*\.jpg',
|
'thumbnail': r're:http://.*\.jpg',
|
||||||
},
|
},
|
||||||
}, {
|
}, {
|
||||||
'url': 'http://www.allocine.fr/video/video-19550147/',
|
'url': 'http://www.allocine.fr/video/video-19550147/',
|
||||||
'only_matching': True,
|
'md5': '3566c0668c0235e2d224fd8edb389f67',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '19550147',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'Faux Raccord N°123 - Les gaffes de Cliffhanger',
|
||||||
|
'description': 'md5:bc734b83ffa2d8a12188d9eb48bb6354',
|
||||||
|
'thumbnail': r're:http://.*\.jpg',
|
||||||
|
},
|
||||||
}]
|
}]
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
mobj = re.match(self._VALID_URL, url)
|
display_id = self._match_id(url)
|
||||||
typ = mobj.group('typ')
|
|
||||||
display_id = mobj.group('id')
|
|
||||||
|
|
||||||
webpage = self._download_webpage(url, display_id)
|
webpage = self._download_webpage(url, display_id)
|
||||||
|
|
||||||
if typ == 'film':
|
formats = []
|
||||||
video_id = self._search_regex(r'href="/video/player_gen_cmedia=([0-9]+).+"', webpage, 'video id')
|
|
||||||
else:
|
|
||||||
player = self._search_regex(r'data-player=\'([^\']+)\'>', webpage, 'data player', default=None)
|
|
||||||
if player:
|
|
||||||
player_data = json.loads(player)
|
|
||||||
video_id = compat_str(player_data['refMedia'])
|
|
||||||
else:
|
|
||||||
model = self._search_regex(r'data-model="([^"]+)">', webpage, 'data model')
|
|
||||||
model_data = self._parse_json(unescapeHTML(model), display_id)
|
|
||||||
video_id = compat_str(model_data['id'])
|
|
||||||
|
|
||||||
xml = self._download_xml('http://www.allocine.fr/ws/AcVisiondataV4.ashx?media=%s' % video_id, display_id)
|
|
||||||
|
|
||||||
video = xpath_element(xml, './/AcVisionVideo').attrib
|
|
||||||
quality = qualities(['ld', 'md', 'hd'])
|
quality = qualities(['ld', 'md', 'hd'])
|
||||||
|
|
||||||
formats = []
|
model = self._html_search_regex(
|
||||||
for k, v in video.items():
|
r'data-model="([^"]+)"', webpage, 'data model', default=None)
|
||||||
if re.match(r'.+_path', k):
|
if model:
|
||||||
format_id = k.split('_')[0]
|
model_data = self._parse_json(model, display_id)
|
||||||
|
|
||||||
|
for video_url in model_data['sources'].values():
|
||||||
|
video_id, format_id = url_basename(video_url).split('_')[:2]
|
||||||
formats.append({
|
formats.append({
|
||||||
'format_id': format_id,
|
'format_id': format_id,
|
||||||
'quality': quality(format_id),
|
'quality': quality(format_id),
|
||||||
'url': v,
|
'url': video_url,
|
||||||
})
|
})
|
||||||
|
|
||||||
|
title = model_data['title']
|
||||||
|
else:
|
||||||
|
video_id = display_id
|
||||||
|
media_data = self._download_json(
|
||||||
|
'http://www.allocine.fr/ws/AcVisiondataV5.ashx?media=%s' % video_id, display_id)
|
||||||
|
for key, value in media_data['video'].items():
|
||||||
|
if not key.endswith('Path'):
|
||||||
|
continue
|
||||||
|
|
||||||
|
format_id = key[:-len('Path')]
|
||||||
|
formats.append({
|
||||||
|
'format_id': format_id,
|
||||||
|
'quality': quality(format_id),
|
||||||
|
'url': value,
|
||||||
|
})
|
||||||
|
|
||||||
|
title = remove_end(self._html_search_regex(
|
||||||
|
r'(?s)<title>(.+?)</title>', webpage, 'title'
|
||||||
|
).strip(), ' - AlloCiné')
|
||||||
|
|
||||||
self._sort_formats(formats)
|
self._sort_formats(formats)
|
||||||
|
|
||||||
return {
|
return {
|
||||||
'id': video_id,
|
'id': video_id,
|
||||||
'title': video['videoTitle'],
|
'display_id': display_id,
|
||||||
|
'title': title,
|
||||||
'thumbnail': self._og_search_thumbnail(webpage),
|
'thumbnail': self._og_search_thumbnail(webpage),
|
||||||
'formats': formats,
|
'formats': formats,
|
||||||
'description': self._og_search_description(webpage),
|
'description': self._og_search_description(webpage),
|
||||||
|
@ -19,7 +19,7 @@ class AlphaPornoIE(InfoExtractor):
|
|||||||
'display_id': 'sensual-striptease-porn-with-samantha-alexandra',
|
'display_id': 'sensual-striptease-porn-with-samantha-alexandra',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Sensual striptease porn with Samantha Alexandra',
|
'title': 'Sensual striptease porn with Samantha Alexandra',
|
||||||
'thumbnail': 're:https?://.*\.jpg$',
|
'thumbnail': r're:https?://.*\.jpg$',
|
||||||
'timestamp': 1418694611,
|
'timestamp': 1418694611,
|
||||||
'upload_date': '20141216',
|
'upload_date': '20141216',
|
||||||
'duration': 387,
|
'duration': 387,
|
||||||
|
@ -10,7 +10,7 @@ from ..utils import (
|
|||||||
|
|
||||||
|
|
||||||
class AMCNetworksIE(ThePlatformIE):
|
class AMCNetworksIE(ThePlatformIE):
|
||||||
_VALID_URL = r'https?://(?:www\.)?(?:amc|bbcamerica|ifc|wetv)\.com/(?:movies/|shows/[^/]+/(?:full-episodes/)?season-\d+/episode-\d+(?:-(?:[^/]+/)?|/))(?P<id>[^/?#]+)'
|
_VALID_URL = r'https?://(?:www\.)?(?:amc|bbcamerica|ifc|wetv)\.com/(?:movies|shows(?:/[^/]+)+)/(?P<id>[^/?#]+)'
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'http://www.ifc.com/shows/maron/season-04/episode-01/step-1',
|
'url': 'http://www.ifc.com/shows/maron/season-04/episode-01/step-1',
|
||||||
'md5': '',
|
'md5': '',
|
||||||
@ -41,6 +41,15 @@ class AMCNetworksIE(ThePlatformIE):
|
|||||||
}, {
|
}, {
|
||||||
'url': 'http://www.ifc.com/movies/chaos',
|
'url': 'http://www.ifc.com/movies/chaos',
|
||||||
'only_matching': True,
|
'only_matching': True,
|
||||||
|
}, {
|
||||||
|
'url': 'http://www.bbcamerica.com/shows/doctor-who/full-episodes/the-power-of-the-daleks/episode-01-episode-1-color-version',
|
||||||
|
'only_matching': True,
|
||||||
|
}, {
|
||||||
|
'url': 'http://www.wetv.com/shows/mama-june-from-not-to-hot/full-episode/season-01/thin-tervention',
|
||||||
|
'only_matching': True,
|
||||||
|
}, {
|
||||||
|
'url': 'http://www.wetv.com/shows/la-hair/videos/season-05/episode-09-episode-9-2/episode-9-sneak-peek-3',
|
||||||
|
'only_matching': True,
|
||||||
}]
|
}]
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
@ -50,20 +59,30 @@ class AMCNetworksIE(ThePlatformIE):
|
|||||||
'mbr': 'true',
|
'mbr': 'true',
|
||||||
'manifest': 'm3u',
|
'manifest': 'm3u',
|
||||||
}
|
}
|
||||||
media_url = self._search_regex(r'window\.platformLinkURL\s*=\s*[\'"]([^\'"]+)', webpage, 'media url')
|
media_url = self._search_regex(
|
||||||
|
r'window\.platformLinkURL\s*=\s*[\'"]([^\'"]+)',
|
||||||
|
webpage, 'media url')
|
||||||
theplatform_metadata = self._download_theplatform_metadata(self._search_regex(
|
theplatform_metadata = self._download_theplatform_metadata(self._search_regex(
|
||||||
r'https?://link.theplatform.com/s/([^?]+)', media_url, 'theplatform_path'), display_id)
|
r'link\.theplatform\.com/s/([^?]+)',
|
||||||
|
media_url, 'theplatform_path'), display_id)
|
||||||
info = self._parse_theplatform_metadata(theplatform_metadata)
|
info = self._parse_theplatform_metadata(theplatform_metadata)
|
||||||
video_id = theplatform_metadata['pid']
|
video_id = theplatform_metadata['pid']
|
||||||
title = theplatform_metadata['title']
|
title = theplatform_metadata['title']
|
||||||
rating = theplatform_metadata['ratings'][0]['rating']
|
rating = theplatform_metadata['ratings'][0]['rating']
|
||||||
auth_required = self._search_regex(r'window\.authRequired\s*=\s*(true|false);', webpage, 'auth required')
|
auth_required = self._search_regex(
|
||||||
|
r'window\.authRequired\s*=\s*(true|false);',
|
||||||
|
webpage, 'auth required')
|
||||||
if auth_required == 'true':
|
if auth_required == 'true':
|
||||||
requestor_id = self._search_regex(r'window\.requestor_id\s*=\s*[\'"]([^\'"]+)', webpage, 'requestor id')
|
requestor_id = self._search_regex(
|
||||||
resource = self._get_mvpd_resource(requestor_id, title, video_id, rating)
|
r'window\.requestor_id\s*=\s*[\'"]([^\'"]+)',
|
||||||
query['auth'] = self._extract_mvpd_auth(url, video_id, requestor_id, resource)
|
webpage, 'requestor id')
|
||||||
|
resource = self._get_mvpd_resource(
|
||||||
|
requestor_id, title, video_id, rating)
|
||||||
|
query['auth'] = self._extract_mvpd_auth(
|
||||||
|
url, video_id, requestor_id, resource)
|
||||||
media_url = update_url_query(media_url, query)
|
media_url = update_url_query(media_url, query)
|
||||||
formats, subtitles = self._extract_theplatform_smil(media_url, video_id)
|
formats, subtitles = self._extract_theplatform_smil(
|
||||||
|
media_url, video_id)
|
||||||
self._sort_formats(formats)
|
self._sort_formats(formats)
|
||||||
info.update({
|
info.update({
|
||||||
'id': video_id,
|
'id': video_id,
|
||||||
@ -75,9 +94,11 @@ class AMCNetworksIE(ThePlatformIE):
|
|||||||
if ns_keys:
|
if ns_keys:
|
||||||
ns = list(ns_keys)[0]
|
ns = list(ns_keys)[0]
|
||||||
series = theplatform_metadata.get(ns + '$show')
|
series = theplatform_metadata.get(ns + '$show')
|
||||||
season_number = int_or_none(theplatform_metadata.get(ns + '$season'))
|
season_number = int_or_none(
|
||||||
|
theplatform_metadata.get(ns + '$season'))
|
||||||
episode = theplatform_metadata.get(ns + '$episodeTitle')
|
episode = theplatform_metadata.get(ns + '$episodeTitle')
|
||||||
episode_number = int_or_none(theplatform_metadata.get(ns + '$episode'))
|
episode_number = int_or_none(
|
||||||
|
theplatform_metadata.get(ns + '$episode'))
|
||||||
if season_number:
|
if season_number:
|
||||||
title = 'Season %d - %s' % (season_number, title)
|
title = 'Season %d - %s' % (season_number, title)
|
||||||
if series:
|
if series:
|
||||||
|
@ -157,22 +157,16 @@ class AnvatoIE(InfoExtractor):
|
|||||||
video_data_url, video_id, transform_source=strip_jsonp,
|
video_data_url, video_id, transform_source=strip_jsonp,
|
||||||
data=json.dumps(payload).encode('utf-8'))
|
data=json.dumps(payload).encode('utf-8'))
|
||||||
|
|
||||||
def _extract_anvato_videos(self, webpage, video_id):
|
def _get_anvato_videos(self, access_key, video_id):
|
||||||
anvplayer_data = self._parse_json(self._html_search_regex(
|
|
||||||
r'<script[^>]+data-anvp=\'([^\']+)\'', webpage,
|
|
||||||
'Anvato player data'), video_id)
|
|
||||||
|
|
||||||
video_id = anvplayer_data['video']
|
|
||||||
access_key = anvplayer_data['accessKey']
|
|
||||||
|
|
||||||
video_data = self._get_video_json(access_key, video_id)
|
video_data = self._get_video_json(access_key, video_id)
|
||||||
|
|
||||||
formats = []
|
formats = []
|
||||||
for published_url in video_data['published_urls']:
|
for published_url in video_data['published_urls']:
|
||||||
video_url = published_url['embed_url']
|
video_url = published_url['embed_url']
|
||||||
|
media_format = published_url.get('format')
|
||||||
ext = determine_ext(video_url)
|
ext = determine_ext(video_url)
|
||||||
|
|
||||||
if ext == 'smil':
|
if ext == 'smil' or media_format == 'smil':
|
||||||
formats.extend(self._extract_smil_formats(video_url, video_id))
|
formats.extend(self._extract_smil_formats(video_url, video_id))
|
||||||
continue
|
continue
|
||||||
|
|
||||||
@ -183,7 +177,7 @@ class AnvatoIE(InfoExtractor):
|
|||||||
'tbr': tbr if tbr != 0 else None,
|
'tbr': tbr if tbr != 0 else None,
|
||||||
}
|
}
|
||||||
|
|
||||||
if ext == 'm3u8':
|
if ext == 'm3u8' or media_format in ('m3u8', 'm3u8-variant'):
|
||||||
# Not using _extract_m3u8_formats here as individual media
|
# Not using _extract_m3u8_formats here as individual media
|
||||||
# playlists are also included in published_urls.
|
# playlists are also included in published_urls.
|
||||||
if tbr is None:
|
if tbr is None:
|
||||||
@ -194,7 +188,7 @@ class AnvatoIE(InfoExtractor):
|
|||||||
'format_id': '-'.join(filter(None, ['hls', compat_str(tbr)])),
|
'format_id': '-'.join(filter(None, ['hls', compat_str(tbr)])),
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
})
|
})
|
||||||
elif ext == 'mp3':
|
elif ext == 'mp3' or media_format == 'mp3':
|
||||||
a_format['vcodec'] = 'none'
|
a_format['vcodec'] = 'none'
|
||||||
else:
|
else:
|
||||||
a_format.update({
|
a_format.update({
|
||||||
@ -218,7 +212,19 @@ class AnvatoIE(InfoExtractor):
|
|||||||
'formats': formats,
|
'formats': formats,
|
||||||
'title': video_data.get('def_title'),
|
'title': video_data.get('def_title'),
|
||||||
'description': video_data.get('def_description'),
|
'description': video_data.get('def_description'),
|
||||||
|
'tags': video_data.get('def_tags', '').split(','),
|
||||||
'categories': video_data.get('categories'),
|
'categories': video_data.get('categories'),
|
||||||
'thumbnail': video_data.get('thumbnail'),
|
'thumbnail': video_data.get('thumbnail'),
|
||||||
|
'timestamp': int_or_none(video_data.get(
|
||||||
|
'ts_published') or video_data.get('ts_added')),
|
||||||
|
'uploader': video_data.get('mcp_id'),
|
||||||
|
'duration': int_or_none(video_data.get('duration')),
|
||||||
'subtitles': subtitles,
|
'subtitles': subtitles,
|
||||||
}
|
}
|
||||||
|
|
||||||
|
def _extract_anvato_videos(self, webpage, video_id):
|
||||||
|
anvplayer_data = self._parse_json(self._html_search_regex(
|
||||||
|
r'<script[^>]+data-anvp=\'([^\']+)\'', webpage,
|
||||||
|
'Anvato player data'), video_id)
|
||||||
|
return self._get_anvato_videos(
|
||||||
|
anvplayer_data['accessKey'], anvplayer_data['video'])
|
||||||
|
@ -12,7 +12,7 @@ from ..utils import (
|
|||||||
|
|
||||||
class AolIE(InfoExtractor):
|
class AolIE(InfoExtractor):
|
||||||
IE_NAME = 'on.aol.com'
|
IE_NAME = 'on.aol.com'
|
||||||
_VALID_URL = r'(?:aol-video:|https?://on\.aol\.com/(?:[^/]+/)*(?:[^/?#&]+-)?)(?P<id>[^/?#&]+)'
|
_VALID_URL = r'(?:aol-video:|https?://(?:(?:www|on)\.)?aol\.com/(?:[^/]+/)*(?:[^/?#&]+-)?)(?P<id>[^/?#&]+)'
|
||||||
|
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
# video with 5min ID
|
# video with 5min ID
|
||||||
@ -33,7 +33,7 @@ class AolIE(InfoExtractor):
|
|||||||
}
|
}
|
||||||
}, {
|
}, {
|
||||||
# video with vidible ID
|
# video with vidible ID
|
||||||
'url': 'http://on.aol.com/video/netflix-is-raising-rates-5707d6b8e4b090497b04f706?context=PC:homepage:PL1944:1460189336183',
|
'url': 'http://www.aol.com/video/view/netflix-is-raising-rates/5707d6b8e4b090497b04f706/',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '5707d6b8e4b090497b04f706',
|
'id': '5707d6b8e4b090497b04f706',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
@ -108,30 +108,3 @@ class AolIE(InfoExtractor):
|
|||||||
'uploader': video_data.get('videoOwner'),
|
'uploader': video_data.get('videoOwner'),
|
||||||
'formats': formats,
|
'formats': formats,
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
class AolFeaturesIE(InfoExtractor):
|
|
||||||
IE_NAME = 'features.aol.com'
|
|
||||||
_VALID_URL = r'https?://features\.aol\.com/video/(?P<id>[^/?#]+)'
|
|
||||||
|
|
||||||
_TESTS = [{
|
|
||||||
'url': 'http://features.aol.com/video/behind-secret-second-careers-late-night-talk-show-hosts',
|
|
||||||
'md5': '7db483bb0c09c85e241f84a34238cc75',
|
|
||||||
'info_dict': {
|
|
||||||
'id': '519507715',
|
|
||||||
'ext': 'mp4',
|
|
||||||
'title': 'What To Watch - February 17, 2016',
|
|
||||||
},
|
|
||||||
'add_ie': ['FiveMin'],
|
|
||||||
'params': {
|
|
||||||
# encrypted m3u8 download
|
|
||||||
'skip_download': True,
|
|
||||||
},
|
|
||||||
}]
|
|
||||||
|
|
||||||
def _real_extract(self, url):
|
|
||||||
display_id = self._match_id(url)
|
|
||||||
webpage = self._download_webpage(url, display_id)
|
|
||||||
return self.url_result(self._search_regex(
|
|
||||||
r'<script type="text/javascript" src="(https?://[^/]*?5min\.com/Scripts/PlayerSeed\.js[^"]+)"',
|
|
||||||
webpage, '5min embed url'), 'FiveMin')
|
|
||||||
|
@ -1,13 +1,13 @@
|
|||||||
from __future__ import unicode_literals
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
from .jwplatform import JWPlatformBaseIE
|
from .common import InfoExtractor
|
||||||
from ..utils import (
|
from ..utils import (
|
||||||
unified_strdate,
|
unified_strdate,
|
||||||
clean_html,
|
clean_html,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
class ArchiveOrgIE(JWPlatformBaseIE):
|
class ArchiveOrgIE(InfoExtractor):
|
||||||
IE_NAME = 'archive.org'
|
IE_NAME = 'archive.org'
|
||||||
IE_DESC = 'archive.org videos'
|
IE_DESC = 'archive.org videos'
|
||||||
_VALID_URL = r'https?://(?:www\.)?archive\.org/(?:details|embed)/(?P<id>[^/?#]+)(?:[?].*)?$'
|
_VALID_URL = r'https?://(?:www\.)?archive\.org/(?:details|embed)/(?P<id>[^/?#]+)(?:[?].*)?$'
|
||||||
|
@ -174,11 +174,15 @@ class ARDMediathekIE(InfoExtractor):
|
|||||||
|
|
||||||
webpage = self._download_webpage(url, video_id)
|
webpage = self._download_webpage(url, video_id)
|
||||||
|
|
||||||
if '>Der gewünschte Beitrag ist nicht mehr verfügbar.<' in webpage:
|
ERRORS = (
|
||||||
raise ExtractorError('Video %s is no longer available' % video_id, expected=True)
|
('>Leider liegt eine Störung vor.', 'Video %s is unavailable'),
|
||||||
|
('>Der gewünschte Beitrag ist nicht mehr verfügbar.<',
|
||||||
|
'Video %s is no longer available'),
|
||||||
|
)
|
||||||
|
|
||||||
if 'Diese Sendung ist für Jugendliche unter 12 Jahren nicht geeignet. Der Clip ist deshalb nur von 20 bis 6 Uhr verfügbar.' in webpage:
|
for pattern, message in ERRORS:
|
||||||
raise ExtractorError('This program is only suitable for those aged 12 and older. Video %s is therefore only available between 20 pm and 6 am.' % video_id, expected=True)
|
if pattern in webpage:
|
||||||
|
raise ExtractorError(message % video_id, expected=True)
|
||||||
|
|
||||||
if re.search(r'[\?&]rss($|[=&])', url):
|
if re.search(r'[\?&]rss($|[=&])', url):
|
||||||
doc = compat_etree_fromstring(webpage.encode('utf-8'))
|
doc = compat_etree_fromstring(webpage.encode('utf-8'))
|
||||||
@ -249,7 +253,7 @@ class ARDIE(InfoExtractor):
|
|||||||
'duration': 2600,
|
'duration': 2600,
|
||||||
'title': 'Die Story im Ersten: Mission unter falscher Flagge',
|
'title': 'Die Story im Ersten: Mission unter falscher Flagge',
|
||||||
'upload_date': '20140804',
|
'upload_date': '20140804',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
},
|
},
|
||||||
'skip': 'HTTP Error 404: Not Found',
|
'skip': 'HTTP Error 404: Not Found',
|
||||||
}
|
}
|
||||||
|
@ -4,8 +4,10 @@ from __future__ import unicode_literals
|
|||||||
import re
|
import re
|
||||||
|
|
||||||
from .common import InfoExtractor
|
from .common import InfoExtractor
|
||||||
|
from ..compat import compat_urlparse
|
||||||
from ..utils import (
|
from ..utils import (
|
||||||
determine_ext,
|
determine_ext,
|
||||||
|
ExtractorError,
|
||||||
float_or_none,
|
float_or_none,
|
||||||
int_or_none,
|
int_or_none,
|
||||||
mimetype2ext,
|
mimetype2ext,
|
||||||
@ -15,7 +17,13 @@ from ..utils import (
|
|||||||
|
|
||||||
|
|
||||||
class ArkenaIE(InfoExtractor):
|
class ArkenaIE(InfoExtractor):
|
||||||
_VALID_URL = r'https?://play\.arkena\.com/(?:config|embed)/avp/v\d/player/media/(?P<id>[^/]+)/[^/]+/(?P<account_id>\d+)'
|
_VALID_URL = r'''(?x)
|
||||||
|
https?://
|
||||||
|
(?:
|
||||||
|
video\.arkena\.com/play2/embed/player\?|
|
||||||
|
play\.arkena\.com/(?:config|embed)/avp/v\d/player/media/(?P<id>[^/]+)/[^/]+/(?P<account_id>\d+)
|
||||||
|
)
|
||||||
|
'''
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'https://play.arkena.com/embed/avp/v2/player/media/b41dda37-d8e7-4d3f-b1b5-9a9db578bdfe/1/129411',
|
'url': 'https://play.arkena.com/embed/avp/v2/player/media/b41dda37-d8e7-4d3f-b1b5-9a9db578bdfe/1/129411',
|
||||||
'md5': 'b96f2f71b359a8ecd05ce4e1daa72365',
|
'md5': 'b96f2f71b359a8ecd05ce4e1daa72365',
|
||||||
@ -37,6 +45,9 @@ class ArkenaIE(InfoExtractor):
|
|||||||
}, {
|
}, {
|
||||||
'url': 'http://play.arkena.com/embed/avp/v1/player/media/327336/darkmatter/131064/',
|
'url': 'http://play.arkena.com/embed/avp/v1/player/media/327336/darkmatter/131064/',
|
||||||
'only_matching': True,
|
'only_matching': True,
|
||||||
|
}, {
|
||||||
|
'url': 'http://video.arkena.com/play2/embed/player?accountId=472718&mediaId=35763b3b-00090078-bf604299&pageStyling=styled',
|
||||||
|
'only_matching': True,
|
||||||
}]
|
}]
|
||||||
|
|
||||||
@staticmethod
|
@staticmethod
|
||||||
@ -53,6 +64,14 @@ class ArkenaIE(InfoExtractor):
|
|||||||
video_id = mobj.group('id')
|
video_id = mobj.group('id')
|
||||||
account_id = mobj.group('account_id')
|
account_id = mobj.group('account_id')
|
||||||
|
|
||||||
|
# Handle http://video.arkena.com/play2/embed/player URL
|
||||||
|
if not video_id:
|
||||||
|
qs = compat_urlparse.parse_qs(compat_urlparse.urlparse(url).query)
|
||||||
|
video_id = qs.get('mediaId', [None])[0]
|
||||||
|
account_id = qs.get('accountId', [None])[0]
|
||||||
|
if not video_id or not account_id:
|
||||||
|
raise ExtractorError('Invalid URL', expected=True)
|
||||||
|
|
||||||
playlist = self._download_json(
|
playlist = self._download_json(
|
||||||
'https://play.arkena.com/config/avp/v2/player/media/%s/0/%s/?callbackMethod=_'
|
'https://play.arkena.com/config/avp/v2/player/media/%s/0/%s/?callbackMethod=_'
|
||||||
% (video_id, account_id),
|
% (video_id, account_id),
|
||||||
|
@ -410,6 +410,22 @@ class ArteTVEmbedIE(ArteTVPlus7IE):
|
|||||||
return self._extract_from_json_url(json_url, video_id, lang)
|
return self._extract_from_json_url(json_url, video_id, lang)
|
||||||
|
|
||||||
|
|
||||||
|
class TheOperaPlatformIE(ArteTVPlus7IE):
|
||||||
|
IE_NAME = 'theoperaplatform'
|
||||||
|
_VALID_URL = r'https?://(?:www\.)?theoperaplatform\.eu/(?P<lang>fr|de|en|es)/(?P<id>[^/?#&]+)'
|
||||||
|
|
||||||
|
_TESTS = [{
|
||||||
|
'url': 'http://www.theoperaplatform.eu/de/opera/verdi-otello',
|
||||||
|
'md5': '970655901fa2e82e04c00b955e9afe7b',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '060338-009-A',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'Verdi - OTELLO',
|
||||||
|
'upload_date': '20160927',
|
||||||
|
},
|
||||||
|
}]
|
||||||
|
|
||||||
|
|
||||||
class ArteTVPlaylistIE(ArteTVBaseIE):
|
class ArteTVPlaylistIE(ArteTVBaseIE):
|
||||||
IE_NAME = 'arte.tv:playlist'
|
IE_NAME = 'arte.tv:playlist'
|
||||||
_VALID_URL = r'https?://(?:www\.)?arte\.tv/guide/(?P<lang>fr|de|en|es)/[^#]*#collection/(?P<id>PL-\d+)'
|
_VALID_URL = r'https?://(?:www\.)?arte\.tv/guide/(?P<lang>fr|de|en|es)/[^#]*#collection/(?P<id>PL-\d+)'
|
||||||
|
@ -30,7 +30,7 @@ class AtresPlayerIE(InfoExtractor):
|
|||||||
'title': 'Especial Solidario de Nochebuena',
|
'title': 'Especial Solidario de Nochebuena',
|
||||||
'description': 'md5:e2d52ff12214fa937107d21064075bf1',
|
'description': 'md5:e2d52ff12214fa937107d21064075bf1',
|
||||||
'duration': 5527.6,
|
'duration': 5527.6,
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
},
|
},
|
||||||
'skip': 'This video is only available for registered users'
|
'skip': 'This video is only available for registered users'
|
||||||
},
|
},
|
||||||
@ -43,7 +43,7 @@ class AtresPlayerIE(InfoExtractor):
|
|||||||
'title': 'David Bustamante',
|
'title': 'David Bustamante',
|
||||||
'description': 'md5:f33f1c0a05be57f6708d4dd83a3b81c6',
|
'description': 'md5:f33f1c0a05be57f6708d4dd83a3b81c6',
|
||||||
'duration': 1439.0,
|
'duration': 1439.0,
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
},
|
},
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
|
@ -14,7 +14,7 @@ class ATTTechChannelIE(InfoExtractor):
|
|||||||
'ext': 'flv',
|
'ext': 'flv',
|
||||||
'title': 'AT&T Archives : The UNIX System: Making Computers Easier to Use',
|
'title': 'AT&T Archives : The UNIX System: Making Computers Easier to Use',
|
||||||
'description': 'A 1982 film about UNIX is the foundation for software in use around Bell Labs and AT&T.',
|
'description': 'A 1982 film about UNIX is the foundation for software in use around Bell Labs and AT&T.',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
'upload_date': '20140127',
|
'upload_date': '20140127',
|
||||||
},
|
},
|
||||||
'params': {
|
'params': {
|
||||||
|
@ -6,8 +6,8 @@ from ..utils import float_or_none
|
|||||||
|
|
||||||
|
|
||||||
class AudioBoomIE(InfoExtractor):
|
class AudioBoomIE(InfoExtractor):
|
||||||
_VALID_URL = r'https?://(?:www\.)?audioboom\.com/boos/(?P<id>[0-9]+)'
|
_VALID_URL = r'https?://(?:www\.)?audioboom\.com/(?:boos|posts)/(?P<id>[0-9]+)'
|
||||||
_TEST = {
|
_TESTS = [{
|
||||||
'url': 'https://audioboom.com/boos/4279833-3-09-2016-czaban-hour-3?t=0',
|
'url': 'https://audioboom.com/boos/4279833-3-09-2016-czaban-hour-3?t=0',
|
||||||
'md5': '63a8d73a055c6ed0f1e51921a10a5a76',
|
'md5': '63a8d73a055c6ed0f1e51921a10a5a76',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
@ -17,9 +17,12 @@ class AudioBoomIE(InfoExtractor):
|
|||||||
'description': 'Guest: Nate Davis - NFL free agency, Guest: Stan Gans',
|
'description': 'Guest: Nate Davis - NFL free agency, Guest: Stan Gans',
|
||||||
'duration': 2245.72,
|
'duration': 2245.72,
|
||||||
'uploader': 'Steve Czaban',
|
'uploader': 'Steve Czaban',
|
||||||
'uploader_url': 're:https?://(?:www\.)?audioboom\.com/channel/steveczabanyahoosportsradio',
|
'uploader_url': r're:https?://(?:www\.)?audioboom\.com/channel/steveczabanyahoosportsradio',
|
||||||
}
|
|
||||||
}
|
}
|
||||||
|
}, {
|
||||||
|
'url': 'https://audioboom.com/posts/4279833-3-09-2016-czaban-hour-3?t=0',
|
||||||
|
'only_matching': True,
|
||||||
|
}]
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
video_id = self._match_id(url)
|
video_id = self._match_id(url)
|
||||||
|
213
youtube_dl/extractor/azmedien.py
Normal file
213
youtube_dl/extractor/azmedien.py
Normal file
@ -0,0 +1,213 @@
|
|||||||
|
# coding: utf-8
|
||||||
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
|
import re
|
||||||
|
|
||||||
|
from .common import InfoExtractor
|
||||||
|
from .kaltura import KalturaIE
|
||||||
|
from ..utils import (
|
||||||
|
get_element_by_class,
|
||||||
|
get_element_by_id,
|
||||||
|
strip_or_none,
|
||||||
|
urljoin,
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
|
class AZMedienBaseIE(InfoExtractor):
|
||||||
|
def _kaltura_video(self, partner_id, entry_id):
|
||||||
|
return self.url_result(
|
||||||
|
'kaltura:%s:%s' % (partner_id, entry_id), ie=KalturaIE.ie_key(),
|
||||||
|
video_id=entry_id)
|
||||||
|
|
||||||
|
|
||||||
|
class AZMedienIE(AZMedienBaseIE):
|
||||||
|
IE_DESC = 'AZ Medien videos'
|
||||||
|
_VALID_URL = r'''(?x)
|
||||||
|
https?://
|
||||||
|
(?:www\.)?
|
||||||
|
(?:
|
||||||
|
telezueri\.ch|
|
||||||
|
telebaern\.tv|
|
||||||
|
telem1\.ch
|
||||||
|
)/
|
||||||
|
[0-9]+-show-[^/\#]+
|
||||||
|
(?:
|
||||||
|
/[0-9]+-episode-[^/\#]+
|
||||||
|
(?:
|
||||||
|
/[0-9]+-segment-(?:[^/\#]+\#)?|
|
||||||
|
\#
|
||||||
|
)|
|
||||||
|
\#
|
||||||
|
)
|
||||||
|
(?P<id>[^\#]+)
|
||||||
|
'''
|
||||||
|
|
||||||
|
_TESTS = [{
|
||||||
|
# URL with 'segment'
|
||||||
|
'url': 'http://www.telezueri.ch/62-show-zuerinews/13772-episode-sonntag-18-dezember-2016/32419-segment-massenabweisungen-beim-hiltl-club-wegen-pelzboom',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '1_2444peh4',
|
||||||
|
'ext': 'mov',
|
||||||
|
'title': 'Massenabweisungen beim Hiltl Club wegen Pelzboom',
|
||||||
|
'description': 'md5:9ea9dd1b159ad65b36ddcf7f0d7c76a8',
|
||||||
|
'uploader_id': 'TeleZ?ri',
|
||||||
|
'upload_date': '20161218',
|
||||||
|
'timestamp': 1482084490,
|
||||||
|
},
|
||||||
|
'params': {
|
||||||
|
'skip_download': True,
|
||||||
|
},
|
||||||
|
}, {
|
||||||
|
# URL with 'segment' and fragment:
|
||||||
|
'url': 'http://www.telebaern.tv/118-show-news/14240-episode-dienstag-17-januar-2017/33666-segment-achtung-gefahr#zu-wenig-pflegerinnen-und-pfleger',
|
||||||
|
'only_matching': True
|
||||||
|
}, {
|
||||||
|
# URL with 'episode' and fragment:
|
||||||
|
'url': 'http://www.telem1.ch/47-show-sonntalk/13986-episode-soldaten-fuer-grenzschutz-energiestrategie-obama-bilanz#soldaten-fuer-grenzschutz-energiestrategie-obama-bilanz',
|
||||||
|
'only_matching': True
|
||||||
|
}, {
|
||||||
|
# URL with 'show' and fragment:
|
||||||
|
'url': 'http://www.telezueri.ch/66-show-sonntalk#burka-plakate-trump-putin-china-besuch',
|
||||||
|
'only_matching': True
|
||||||
|
}]
|
||||||
|
|
||||||
|
def _real_extract(self, url):
|
||||||
|
video_id = self._match_id(url)
|
||||||
|
|
||||||
|
webpage = self._download_webpage(url, video_id)
|
||||||
|
|
||||||
|
partner_id = self._search_regex(
|
||||||
|
r'<script[^>]+src=["\'](?:https?:)?//(?:[^/]+\.)?kaltura\.com(?:/[^/]+)*/(?:p|partner_id)/([0-9]+)',
|
||||||
|
webpage, 'kaltura partner id')
|
||||||
|
entry_id = self._html_search_regex(
|
||||||
|
r'<a[^>]+data-id=(["\'])(?P<id>(?:(?!\1).)+)\1[^>]+data-slug=["\']%s'
|
||||||
|
% re.escape(video_id), webpage, 'kaltura entry id', group='id')
|
||||||
|
|
||||||
|
return self._kaltura_video(partner_id, entry_id)
|
||||||
|
|
||||||
|
|
||||||
|
class AZMedienPlaylistIE(AZMedienBaseIE):
|
||||||
|
IE_DESC = 'AZ Medien playlists'
|
||||||
|
_VALID_URL = r'''(?x)
|
||||||
|
https?://
|
||||||
|
(?:www\.)?
|
||||||
|
(?:
|
||||||
|
telezueri\.ch|
|
||||||
|
telebaern\.tv|
|
||||||
|
telem1\.ch
|
||||||
|
)/
|
||||||
|
(?P<id>[0-9]+-
|
||||||
|
(?:
|
||||||
|
show|
|
||||||
|
topic|
|
||||||
|
themen
|
||||||
|
)-[^/\#]+
|
||||||
|
(?:
|
||||||
|
/[0-9]+-episode-[^/\#]+
|
||||||
|
)?
|
||||||
|
)$
|
||||||
|
'''
|
||||||
|
|
||||||
|
_TESTS = [{
|
||||||
|
# URL with 'episode'
|
||||||
|
'url': 'http://www.telebaern.tv/118-show-news/13735-episode-donnerstag-15-dezember-2016',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '118-show-news/13735-episode-donnerstag-15-dezember-2016',
|
||||||
|
'title': 'News - Donnerstag, 15. Dezember 2016',
|
||||||
|
},
|
||||||
|
'playlist_count': 9,
|
||||||
|
}, {
|
||||||
|
# URL with 'themen'
|
||||||
|
'url': 'http://www.telem1.ch/258-themen-tele-m1-classics',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '258-themen-tele-m1-classics',
|
||||||
|
'title': 'Tele M1 Classics',
|
||||||
|
},
|
||||||
|
'playlist_mincount': 15,
|
||||||
|
}, {
|
||||||
|
# URL with 'topic', contains nested playlists
|
||||||
|
'url': 'http://www.telezueri.ch/219-topic-aera-trump-hat-offiziell-begonnen',
|
||||||
|
'only_matching': True,
|
||||||
|
}, {
|
||||||
|
# URL with 'show' only
|
||||||
|
'url': 'http://www.telezueri.ch/86-show-talktaeglich',
|
||||||
|
'only_matching': True
|
||||||
|
}]
|
||||||
|
|
||||||
|
def _real_extract(self, url):
|
||||||
|
show_id = self._match_id(url)
|
||||||
|
webpage = self._download_webpage(url, show_id)
|
||||||
|
|
||||||
|
entries = []
|
||||||
|
|
||||||
|
partner_id = self._search_regex(
|
||||||
|
r'src=["\'](?:https?:)?//(?:[^/]+\.)kaltura\.com/(?:[^/]+/)*(?:p|partner_id)/(\d+)',
|
||||||
|
webpage, 'kaltura partner id', default=None)
|
||||||
|
|
||||||
|
if partner_id:
|
||||||
|
entries = [
|
||||||
|
self._kaltura_video(partner_id, m.group('id'))
|
||||||
|
for m in re.finditer(
|
||||||
|
r'data-id=(["\'])(?P<id>(?:(?!\1).)+)\1', webpage)]
|
||||||
|
|
||||||
|
if not entries:
|
||||||
|
entries = [
|
||||||
|
self.url_result(m.group('url'), ie=AZMedienIE.ie_key())
|
||||||
|
for m in re.finditer(
|
||||||
|
r'<a[^>]+data-real=(["\'])(?P<url>http.+?)\1', webpage)]
|
||||||
|
|
||||||
|
if not entries:
|
||||||
|
entries = [
|
||||||
|
# May contain nested playlists (e.g. [1]) thus no explicit
|
||||||
|
# ie_key
|
||||||
|
# 1. http://www.telezueri.ch/219-topic-aera-trump-hat-offiziell-begonnen)
|
||||||
|
self.url_result(urljoin(url, m.group('url')))
|
||||||
|
for m in re.finditer(
|
||||||
|
r'<a[^>]+name=[^>]+href=(["\'])(?P<url>/.+?)\1', webpage)]
|
||||||
|
|
||||||
|
title = self._search_regex(
|
||||||
|
r'episodeShareTitle\s*=\s*(["\'])(?P<title>(?:(?!\1).)+)\1',
|
||||||
|
webpage, 'title',
|
||||||
|
default=strip_or_none(get_element_by_id(
|
||||||
|
'video-title', webpage)), group='title')
|
||||||
|
|
||||||
|
return self.playlist_result(entries, show_id, title)
|
||||||
|
|
||||||
|
|
||||||
|
class AZMedienShowPlaylistIE(AZMedienBaseIE):
|
||||||
|
IE_DESC = 'AZ Medien show playlists'
|
||||||
|
_VALID_URL = r'''(?x)
|
||||||
|
https?://
|
||||||
|
(?:www\.)?
|
||||||
|
(?:
|
||||||
|
telezueri\.ch|
|
||||||
|
telebaern\.tv|
|
||||||
|
telem1\.ch
|
||||||
|
)/
|
||||||
|
(?:
|
||||||
|
all-episodes|
|
||||||
|
alle-episoden
|
||||||
|
)/
|
||||||
|
(?P<id>[^/?#&]+)
|
||||||
|
'''
|
||||||
|
|
||||||
|
_TEST = {
|
||||||
|
'url': 'http://www.telezueri.ch/all-episodes/astrotalk',
|
||||||
|
'info_dict': {
|
||||||
|
'id': 'astrotalk',
|
||||||
|
'title': 'TeleZüri: AstroTalk - alle episoden',
|
||||||
|
'description': 'md5:4c0f7e7d741d906004266e295ceb4a26',
|
||||||
|
},
|
||||||
|
'playlist_mincount': 13,
|
||||||
|
}
|
||||||
|
|
||||||
|
def _real_extract(self, url):
|
||||||
|
playlist_id = self._match_id(url)
|
||||||
|
webpage = self._download_webpage(url, playlist_id)
|
||||||
|
episodes = get_element_by_class('search-mobile-box', webpage)
|
||||||
|
entries = [self.url_result(
|
||||||
|
urljoin(url, m.group('url'))) for m in re.finditer(
|
||||||
|
r'<a[^>]+href=(["\'])(?P<url>(?:(?!\1).)+)\1', episodes)]
|
||||||
|
title = self._og_search_title(webpage, fatal=False)
|
||||||
|
description = self._og_search_description(webpage)
|
||||||
|
return self.playlist_result(entries, playlist_id, title, description)
|
@ -11,7 +11,7 @@ from ..utils import (
|
|||||||
|
|
||||||
|
|
||||||
class AzubuIE(InfoExtractor):
|
class AzubuIE(InfoExtractor):
|
||||||
_VALID_URL = r'https?://(?:www\.)?azubu\.tv/[^/]+#!/play/(?P<id>\d+)'
|
_VALID_URL = r'https?://(?:www\.)?azubu\.(?:tv|uol.com.br)/[^/]+#!/play/(?P<id>\d+)'
|
||||||
_TESTS = [
|
_TESTS = [
|
||||||
{
|
{
|
||||||
'url': 'http://www.azubu.tv/GSL#!/play/15575/2014-hot6-cup-last-big-match-ro8-day-1',
|
'url': 'http://www.azubu.tv/GSL#!/play/15575/2014-hot6-cup-last-big-match-ro8-day-1',
|
||||||
@ -21,7 +21,7 @@ class AzubuIE(InfoExtractor):
|
|||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': '2014 HOT6 CUP LAST BIG MATCH Ro8 Day 1',
|
'title': '2014 HOT6 CUP LAST BIG MATCH Ro8 Day 1',
|
||||||
'description': 'md5:d06bdea27b8cc4388a90ad35b5c66c01',
|
'description': 'md5:d06bdea27b8cc4388a90ad35b5c66c01',
|
||||||
'thumbnail': 're:^https?://.*\.jpe?g',
|
'thumbnail': r're:^https?://.*\.jpe?g',
|
||||||
'timestamp': 1417523507.334,
|
'timestamp': 1417523507.334,
|
||||||
'upload_date': '20141202',
|
'upload_date': '20141202',
|
||||||
'duration': 9988.7,
|
'duration': 9988.7,
|
||||||
@ -38,7 +38,7 @@ class AzubuIE(InfoExtractor):
|
|||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Fnatic at Worlds 2014: Toyz - "I love Rekkles, he has amazing mechanics"',
|
'title': 'Fnatic at Worlds 2014: Toyz - "I love Rekkles, he has amazing mechanics"',
|
||||||
'description': 'md5:4a649737b5f6c8b5c5be543e88dc62af',
|
'description': 'md5:4a649737b5f6c8b5c5be543e88dc62af',
|
||||||
'thumbnail': 're:^https?://.*\.jpe?g',
|
'thumbnail': r're:^https?://.*\.jpe?g',
|
||||||
'timestamp': 1410530893.320,
|
'timestamp': 1410530893.320,
|
||||||
'upload_date': '20140912',
|
'upload_date': '20140912',
|
||||||
'duration': 172.385,
|
'duration': 172.385,
|
||||||
@ -103,12 +103,15 @@ class AzubuIE(InfoExtractor):
|
|||||||
|
|
||||||
|
|
||||||
class AzubuLiveIE(InfoExtractor):
|
class AzubuLiveIE(InfoExtractor):
|
||||||
_VALID_URL = r'https?://(?:www\.)?azubu\.tv/(?P<id>[^/]+)$'
|
_VALID_URL = r'https?://(?:www\.)?azubu\.(?:tv|uol.com.br)/(?P<id>[^/]+)$'
|
||||||
|
|
||||||
_TEST = {
|
_TESTS = [{
|
||||||
'url': 'http://www.azubu.tv/MarsTVMDLen',
|
'url': 'http://www.azubu.tv/MarsTVMDLen',
|
||||||
'only_matching': True,
|
'only_matching': True,
|
||||||
}
|
}, {
|
||||||
|
'url': 'http://azubu.uol.com.br/adolfz',
|
||||||
|
'only_matching': True,
|
||||||
|
}]
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
user = self._match_id(url)
|
user = self._match_id(url)
|
||||||
|
@ -1,7 +1,9 @@
|
|||||||
from __future__ import unicode_literals
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
import json
|
import json
|
||||||
|
import random
|
||||||
import re
|
import re
|
||||||
|
import time
|
||||||
|
|
||||||
from .common import InfoExtractor
|
from .common import InfoExtractor
|
||||||
from ..compat import (
|
from ..compat import (
|
||||||
@ -12,6 +14,9 @@ from ..utils import (
|
|||||||
ExtractorError,
|
ExtractorError,
|
||||||
float_or_none,
|
float_or_none,
|
||||||
int_or_none,
|
int_or_none,
|
||||||
|
parse_filesize,
|
||||||
|
unescapeHTML,
|
||||||
|
update_url_query,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
@ -81,35 +86,68 @@ class BandcampIE(InfoExtractor):
|
|||||||
r'(?ms)var TralbumData = .*?[{,]\s*id: (?P<id>\d+),?$',
|
r'(?ms)var TralbumData = .*?[{,]\s*id: (?P<id>\d+),?$',
|
||||||
webpage, 'video id')
|
webpage, 'video id')
|
||||||
|
|
||||||
download_webpage = self._download_webpage(download_link, video_id, 'Downloading free downloads page')
|
download_webpage = self._download_webpage(
|
||||||
# We get the dictionary of the track from some javascript code
|
download_link, video_id, 'Downloading free downloads page')
|
||||||
all_info = self._parse_json(self._search_regex(
|
|
||||||
r'(?sm)items: (.*?),$', download_webpage, 'items'), video_id)
|
blob = self._parse_json(
|
||||||
info = all_info[0]
|
self._search_regex(
|
||||||
# We pick mp3-320 for now, until format selection can be easily implemented.
|
r'data-blob=(["\'])(?P<blob>{.+?})\1', download_webpage,
|
||||||
mp3_info = info['downloads']['mp3-320']
|
'blob', group='blob'),
|
||||||
# If we try to use this url it says the link has expired
|
video_id, transform_source=unescapeHTML)
|
||||||
initial_url = mp3_info['url']
|
|
||||||
m_url = re.match(
|
info = blob['digital_items'][0]
|
||||||
r'(?P<server>http://(.*?)\.bandcamp\.com)/download/track\?enc=mp3-320&fsig=(?P<fsig>.*?)&id=(?P<id>.*?)&ts=(?P<ts>.*)$',
|
|
||||||
initial_url)
|
downloads = info['downloads']
|
||||||
# We build the url we will use to get the final track url
|
track = info['title']
|
||||||
# This url is build in Bandcamp in the script download_bunde_*.js
|
|
||||||
request_url = '%s/statdownload/track?enc=mp3-320&fsig=%s&id=%s&ts=%s&.rand=665028774616&.vrs=1' % (m_url.group('server'), m_url.group('fsig'), video_id, m_url.group('ts'))
|
artist = info.get('artist')
|
||||||
final_url_webpage = self._download_webpage(request_url, video_id, 'Requesting download url')
|
title = '%s - %s' % (artist, track) if artist else track
|
||||||
# If we could correctly generate the .rand field the url would be
|
|
||||||
# in the "download_url" key
|
download_formats = {}
|
||||||
final_url = self._proto_relative_url(self._search_regex(
|
for f in blob['download_formats']:
|
||||||
r'"retry_url":"(.+?)"', final_url_webpage, 'final video URL'), 'http:')
|
name, ext = f.get('name'), f.get('file_extension')
|
||||||
|
if all(isinstance(x, compat_str) for x in (name, ext)):
|
||||||
|
download_formats[name] = ext.strip('.')
|
||||||
|
|
||||||
|
formats = []
|
||||||
|
for format_id, f in downloads.items():
|
||||||
|
format_url = f.get('url')
|
||||||
|
if not format_url:
|
||||||
|
continue
|
||||||
|
# Stat URL generation algorithm is reverse engineered from
|
||||||
|
# download_*_bundle_*.js
|
||||||
|
stat_url = update_url_query(
|
||||||
|
format_url.replace('/download/', '/statdownload/'), {
|
||||||
|
'.rand': int(time.time() * 1000 * random.random()),
|
||||||
|
})
|
||||||
|
format_id = f.get('encoding_name') or format_id
|
||||||
|
stat = self._download_json(
|
||||||
|
stat_url, video_id, 'Downloading %s JSON' % format_id,
|
||||||
|
transform_source=lambda s: s[s.index('{'):s.rindex('}') + 1],
|
||||||
|
fatal=False)
|
||||||
|
if not stat:
|
||||||
|
continue
|
||||||
|
retry_url = stat.get('retry_url')
|
||||||
|
if not isinstance(retry_url, compat_str):
|
||||||
|
continue
|
||||||
|
formats.append({
|
||||||
|
'url': self._proto_relative_url(retry_url, 'http:'),
|
||||||
|
'ext': download_formats.get(format_id),
|
||||||
|
'format_id': format_id,
|
||||||
|
'format_note': f.get('description'),
|
||||||
|
'filesize': parse_filesize(f.get('size_mb')),
|
||||||
|
'vcodec': 'none',
|
||||||
|
})
|
||||||
|
self._sort_formats(formats)
|
||||||
|
|
||||||
return {
|
return {
|
||||||
'id': video_id,
|
'id': video_id,
|
||||||
'title': info['title'],
|
'title': title,
|
||||||
'ext': 'mp3',
|
|
||||||
'vcodec': 'none',
|
|
||||||
'url': final_url,
|
|
||||||
'thumbnail': info.get('thumb_url'),
|
'thumbnail': info.get('thumb_url'),
|
||||||
'uploader': info.get('artist'),
|
'uploader': info.get('artist'),
|
||||||
|
'artist': artist,
|
||||||
|
'track': track,
|
||||||
|
'formats': formats,
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
@ -171,6 +209,15 @@ class BandcampAlbumIE(InfoExtractor):
|
|||||||
'id': 'entropy-ep',
|
'id': 'entropy-ep',
|
||||||
},
|
},
|
||||||
'playlist_mincount': 3,
|
'playlist_mincount': 3,
|
||||||
|
}, {
|
||||||
|
# not all tracks have songs
|
||||||
|
'url': 'https://insulters.bandcamp.com/album/we-are-the-plague',
|
||||||
|
'info_dict': {
|
||||||
|
'id': 'we-are-the-plague',
|
||||||
|
'title': 'WE ARE THE PLAGUE',
|
||||||
|
'uploader_id': 'insulters',
|
||||||
|
},
|
||||||
|
'playlist_count': 2,
|
||||||
}]
|
}]
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
@ -179,12 +226,16 @@ class BandcampAlbumIE(InfoExtractor):
|
|||||||
album_id = mobj.group('album_id')
|
album_id = mobj.group('album_id')
|
||||||
playlist_id = album_id or uploader_id
|
playlist_id = album_id or uploader_id
|
||||||
webpage = self._download_webpage(url, playlist_id)
|
webpage = self._download_webpage(url, playlist_id)
|
||||||
tracks_paths = re.findall(r'<a href="(.*?)" itemprop="url">', webpage)
|
track_elements = re.findall(
|
||||||
if not tracks_paths:
|
r'(?s)<div[^>]*>(.*?<a[^>]+href="([^"]+?)"[^>]+itemprop="url"[^>]*>.*?)</div>', webpage)
|
||||||
|
if not track_elements:
|
||||||
raise ExtractorError('The page doesn\'t contain any tracks')
|
raise ExtractorError('The page doesn\'t contain any tracks')
|
||||||
|
# Only tracks with duration info have songs
|
||||||
entries = [
|
entries = [
|
||||||
self.url_result(compat_urlparse.urljoin(url, t_path), ie=BandcampIE.ie_key())
|
self.url_result(compat_urlparse.urljoin(url, t_path), ie=BandcampIE.ie_key())
|
||||||
for t_path in tracks_paths]
|
for elem_content, t_path in track_elements
|
||||||
|
if self._html_search_meta('duration', elem_content, default=None)]
|
||||||
|
|
||||||
title = self._html_search_regex(
|
title = self._html_search_regex(
|
||||||
r'album_title\s*:\s*"((?:\\.|[^"\\])+?)"',
|
r'album_title\s*:\s*"((?:\\.|[^"\\])+?)"',
|
||||||
webpage, 'title', fatal=False)
|
webpage, 'title', fatal=False)
|
||||||
|
@ -225,6 +225,8 @@ class BBCCoUkIE(InfoExtractor):
|
|||||||
}
|
}
|
||||||
]
|
]
|
||||||
|
|
||||||
|
_USP_RE = r'/([^/]+?)\.ism(?:\.hlsv2\.ism)?/[^/]+\.m3u8'
|
||||||
|
|
||||||
class MediaSelectionError(Exception):
|
class MediaSelectionError(Exception):
|
||||||
def __init__(self, id):
|
def __init__(self, id):
|
||||||
self.id = id
|
self.id = id
|
||||||
@ -336,6 +338,15 @@ class BBCCoUkIE(InfoExtractor):
|
|||||||
formats.extend(self._extract_m3u8_formats(
|
formats.extend(self._extract_m3u8_formats(
|
||||||
href, programme_id, ext='mp4', entry_protocol='m3u8_native',
|
href, programme_id, ext='mp4', entry_protocol='m3u8_native',
|
||||||
m3u8_id=format_id, fatal=False))
|
m3u8_id=format_id, fatal=False))
|
||||||
|
if re.search(self._USP_RE, href):
|
||||||
|
usp_formats = self._extract_m3u8_formats(
|
||||||
|
re.sub(self._USP_RE, r'/\1.ism/\1.m3u8', href),
|
||||||
|
programme_id, ext='mp4', entry_protocol='m3u8_native',
|
||||||
|
m3u8_id=format_id, fatal=False)
|
||||||
|
for f in usp_formats:
|
||||||
|
if f.get('height') and f['height'] > 720:
|
||||||
|
continue
|
||||||
|
formats.append(f)
|
||||||
elif transfer_format == 'hds':
|
elif transfer_format == 'hds':
|
||||||
formats.extend(self._extract_f4m_formats(
|
formats.extend(self._extract_f4m_formats(
|
||||||
href, programme_id, f4m_id=format_id, fatal=False))
|
href, programme_id, f4m_id=format_id, fatal=False))
|
||||||
|
73
youtube_dl/extractor/beampro.py
Normal file
73
youtube_dl/extractor/beampro.py
Normal file
@ -0,0 +1,73 @@
|
|||||||
|
# coding: utf-8
|
||||||
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
|
from .common import InfoExtractor
|
||||||
|
from ..utils import (
|
||||||
|
ExtractorError,
|
||||||
|
clean_html,
|
||||||
|
compat_str,
|
||||||
|
int_or_none,
|
||||||
|
parse_iso8601,
|
||||||
|
try_get,
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
|
class BeamProLiveIE(InfoExtractor):
|
||||||
|
IE_NAME = 'Beam:live'
|
||||||
|
_VALID_URL = r'https?://(?:\w+\.)?beam\.pro/(?P<id>[^/?#&]+)'
|
||||||
|
_RATINGS = {'family': 0, 'teen': 13, '18+': 18}
|
||||||
|
_TEST = {
|
||||||
|
'url': 'http://www.beam.pro/niterhayven',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '261562',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'Introducing The Witcher 3 // The Grind Starts Now!',
|
||||||
|
'description': 'md5:0b161ac080f15fe05d18a07adb44a74d',
|
||||||
|
'thumbnail': r're:https://.*\.jpg$',
|
||||||
|
'timestamp': 1483477281,
|
||||||
|
'upload_date': '20170103',
|
||||||
|
'uploader': 'niterhayven',
|
||||||
|
'uploader_id': '373396',
|
||||||
|
'age_limit': 18,
|
||||||
|
'is_live': True,
|
||||||
|
'view_count': int,
|
||||||
|
},
|
||||||
|
'skip': 'niterhayven is offline',
|
||||||
|
'params': {
|
||||||
|
'skip_download': True,
|
||||||
|
},
|
||||||
|
}
|
||||||
|
|
||||||
|
def _real_extract(self, url):
|
||||||
|
channel_name = self._match_id(url)
|
||||||
|
|
||||||
|
chan = self._download_json(
|
||||||
|
'https://beam.pro/api/v1/channels/%s' % channel_name, channel_name)
|
||||||
|
|
||||||
|
if chan.get('online') is False:
|
||||||
|
raise ExtractorError(
|
||||||
|
'{0} is offline'.format(channel_name), expected=True)
|
||||||
|
|
||||||
|
channel_id = chan['id']
|
||||||
|
|
||||||
|
formats = self._extract_m3u8_formats(
|
||||||
|
'https://beam.pro/api/v1/channels/%s/manifest.m3u8' % channel_id,
|
||||||
|
channel_name, ext='mp4', m3u8_id='hls', fatal=False)
|
||||||
|
self._sort_formats(formats)
|
||||||
|
|
||||||
|
user_id = chan.get('userId') or try_get(chan, lambda x: x['user']['id'])
|
||||||
|
|
||||||
|
return {
|
||||||
|
'id': compat_str(chan.get('id') or channel_name),
|
||||||
|
'title': self._live_title(chan.get('name') or channel_name),
|
||||||
|
'description': clean_html(chan.get('description')),
|
||||||
|
'thumbnail': try_get(chan, lambda x: x['thumbnail']['url'], compat_str),
|
||||||
|
'timestamp': parse_iso8601(chan.get('updatedAt')),
|
||||||
|
'uploader': chan.get('token') or try_get(
|
||||||
|
chan, lambda x: x['user']['username'], compat_str),
|
||||||
|
'uploader_id': compat_str(user_id) if user_id else None,
|
||||||
|
'age_limit': self._RATINGS.get(chan.get('audience')),
|
||||||
|
'is_live': True,
|
||||||
|
'view_count': int_or_none(chan.get('viewersTotal')),
|
||||||
|
'formats': formats,
|
||||||
|
}
|
@ -8,10 +8,10 @@ from ..compat import compat_str
|
|||||||
from ..utils import int_or_none
|
from ..utils import int_or_none
|
||||||
|
|
||||||
|
|
||||||
class BeatportProIE(InfoExtractor):
|
class BeatportIE(InfoExtractor):
|
||||||
_VALID_URL = r'https?://pro\.beatport\.com/track/(?P<display_id>[^/]+)/(?P<id>[0-9]+)'
|
_VALID_URL = r'https?://(?:www\.|pro\.)?beatport\.com/track/(?P<display_id>[^/]+)/(?P<id>[0-9]+)'
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'https://pro.beatport.com/track/synesthesia-original-mix/5379371',
|
'url': 'https://beatport.com/track/synesthesia-original-mix/5379371',
|
||||||
'md5': 'b3c34d8639a2f6a7f734382358478887',
|
'md5': 'b3c34d8639a2f6a7f734382358478887',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '5379371',
|
'id': '5379371',
|
||||||
@ -20,7 +20,7 @@ class BeatportProIE(InfoExtractor):
|
|||||||
'title': 'Froxic - Synesthesia (Original Mix)',
|
'title': 'Froxic - Synesthesia (Original Mix)',
|
||||||
},
|
},
|
||||||
}, {
|
}, {
|
||||||
'url': 'https://pro.beatport.com/track/love-and-war-original-mix/3756896',
|
'url': 'https://beatport.com/track/love-and-war-original-mix/3756896',
|
||||||
'md5': 'e44c3025dfa38c6577fbaeb43da43514',
|
'md5': 'e44c3025dfa38c6577fbaeb43da43514',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '3756896',
|
'id': '3756896',
|
||||||
@ -29,7 +29,7 @@ class BeatportProIE(InfoExtractor):
|
|||||||
'title': 'Wolfgang Gartner - Love & War (Original Mix)',
|
'title': 'Wolfgang Gartner - Love & War (Original Mix)',
|
||||||
},
|
},
|
||||||
}, {
|
}, {
|
||||||
'url': 'https://pro.beatport.com/track/birds-original-mix/4991738',
|
'url': 'https://beatport.com/track/birds-original-mix/4991738',
|
||||||
'md5': 'a1fd8e8046de3950fd039304c186c05f',
|
'md5': 'a1fd8e8046de3950fd039304c186c05f',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '4991738',
|
'id': '4991738',
|
@ -46,19 +46,19 @@ class BeegIE(InfoExtractor):
|
|||||||
self._proto_relative_url(cpl_url), video_id,
|
self._proto_relative_url(cpl_url), video_id,
|
||||||
'Downloading cpl JS', fatal=False)
|
'Downloading cpl JS', fatal=False)
|
||||||
if cpl:
|
if cpl:
|
||||||
beeg_version = self._search_regex(
|
beeg_version = int_or_none(self._search_regex(
|
||||||
r'beeg_version\s*=\s*(\d+)', cpl,
|
r'beeg_version\s*=\s*([^\b]+)', cpl,
|
||||||
'beeg version', default=None) or self._search_regex(
|
'beeg version', default=None)) or self._search_regex(
|
||||||
r'/(\d+)\.js', cpl_url, 'beeg version', default=None)
|
r'/(\d+)\.js', cpl_url, 'beeg version', default=None)
|
||||||
beeg_salt = self._search_regex(
|
beeg_salt = self._search_regex(
|
||||||
r'beeg_salt\s*=\s*(["\'])(?P<beeg_salt>.+?)\1', cpl, 'beeg beeg_salt',
|
r'beeg_salt\s*=\s*(["\'])(?P<beeg_salt>.+?)\1', cpl, 'beeg salt',
|
||||||
default=None, group='beeg_salt')
|
default=None, group='beeg_salt')
|
||||||
|
|
||||||
beeg_version = beeg_version or '1750'
|
beeg_version = beeg_version or '2000'
|
||||||
beeg_salt = beeg_salt or 'MIDtGaw96f0N1kMMAM1DE46EC9pmFr'
|
beeg_salt = beeg_salt or 'pmweAkq8lAYKdfWcFCUj0yoVgoPlinamH5UE1CB3H'
|
||||||
|
|
||||||
video = self._download_json(
|
video = self._download_json(
|
||||||
'http://api.beeg.com/api/v6/%s/video/%s' % (beeg_version, video_id),
|
'https://api.beeg.com/api/v6/%s/video/%s' % (beeg_version, video_id),
|
||||||
video_id)
|
video_id)
|
||||||
|
|
||||||
def split(o, e):
|
def split(o, e):
|
||||||
|
@ -24,7 +24,7 @@ class BellMediaIE(InfoExtractor):
|
|||||||
space
|
space
|
||||||
)\.ca|
|
)\.ca|
|
||||||
much\.com
|
much\.com
|
||||||
)/.*?(?:\bvid=|-vid|~|%7E|/(?:episode)?)(?P<id>[0-9]{6})'''
|
)/.*?(?:\bvid=|-vid|~|%7E|/(?:episode)?)(?P<id>[0-9]{6,})'''
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'http://www.ctv.ca/video/player?vid=706966',
|
'url': 'http://www.ctv.ca/video/player?vid=706966',
|
||||||
'md5': 'ff2ebbeae0aa2dcc32a830c3fd69b7b0',
|
'md5': 'ff2ebbeae0aa2dcc32a830c3fd69b7b0',
|
||||||
@ -55,6 +55,9 @@ class BellMediaIE(InfoExtractor):
|
|||||||
}, {
|
}, {
|
||||||
'url': 'http://www.much.com/shows/the-almost-impossible-gameshow/928979/episode-6',
|
'url': 'http://www.much.com/shows/the-almost-impossible-gameshow/928979/episode-6',
|
||||||
'only_matching': True,
|
'only_matching': True,
|
||||||
|
}, {
|
||||||
|
'url': 'http://www.ctv.ca/DCs-Legends-of-Tomorrow/Video/S2E11-Turncoat-vid1051430',
|
||||||
|
'only_matching': True,
|
||||||
}]
|
}]
|
||||||
_DOMAINS = {
|
_DOMAINS = {
|
||||||
'thecomedynetwork': 'comedy',
|
'thecomedynetwork': 'comedy',
|
||||||
|
@ -17,7 +17,7 @@ class BetIE(MTVServicesInfoExtractor):
|
|||||||
'description': 'President Obama urges persistence in confronting racism and bias.',
|
'description': 'President Obama urges persistence in confronting racism and bias.',
|
||||||
'duration': 1534,
|
'duration': 1534,
|
||||||
'upload_date': '20141208',
|
'upload_date': '20141208',
|
||||||
'thumbnail': 're:(?i)^https?://.*\.jpg$',
|
'thumbnail': r're:(?i)^https?://.*\.jpg$',
|
||||||
'subtitles': {
|
'subtitles': {
|
||||||
'en': 'mincount:2',
|
'en': 'mincount:2',
|
||||||
}
|
}
|
||||||
@ -37,7 +37,7 @@ class BetIE(MTVServicesInfoExtractor):
|
|||||||
'description': 'A BET News special.',
|
'description': 'A BET News special.',
|
||||||
'duration': 1696,
|
'duration': 1696,
|
||||||
'upload_date': '20141125',
|
'upload_date': '20141125',
|
||||||
'thumbnail': 're:(?i)^https?://.*\.jpg$',
|
'thumbnail': r're:(?i)^https?://.*\.jpg$',
|
||||||
'subtitles': {
|
'subtitles': {
|
||||||
'en': 'mincount:2',
|
'en': 'mincount:2',
|
||||||
}
|
}
|
||||||
|
@ -19,7 +19,7 @@ class BildIE(InfoExtractor):
|
|||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Das können die neuen iPads',
|
'title': 'Das können die neuen iPads',
|
||||||
'description': 'md5:a4058c4fa2a804ab59c00d7244bbf62f',
|
'description': 'md5:a4058c4fa2a804ab59c00d7244bbf62f',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
'duration': 196,
|
'duration': 196,
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -5,19 +5,27 @@ import hashlib
|
|||||||
import re
|
import re
|
||||||
|
|
||||||
from .common import InfoExtractor
|
from .common import InfoExtractor
|
||||||
from ..compat import compat_parse_qs
|
from ..compat import (
|
||||||
|
compat_parse_qs,
|
||||||
|
compat_urlparse,
|
||||||
|
)
|
||||||
from ..utils import (
|
from ..utils import (
|
||||||
|
ExtractorError,
|
||||||
int_or_none,
|
int_or_none,
|
||||||
float_or_none,
|
float_or_none,
|
||||||
|
parse_iso8601,
|
||||||
|
smuggle_url,
|
||||||
|
strip_jsonp,
|
||||||
unified_timestamp,
|
unified_timestamp,
|
||||||
|
unsmuggle_url,
|
||||||
urlencode_postdata,
|
urlencode_postdata,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
class BiliBiliIE(InfoExtractor):
|
class BiliBiliIE(InfoExtractor):
|
||||||
_VALID_URL = r'https?://(?:www\.|bangumi\.|)bilibili\.(?:tv|com)/(?:video/av|anime/v/)(?P<id>\d+)'
|
_VALID_URL = r'https?://(?:www\.|bangumi\.|)bilibili\.(?:tv|com)/(?:video/av|anime/(?P<anime_id>\d+)/play#)(?P<id>\d+)'
|
||||||
|
|
||||||
_TEST = {
|
_TESTS = [{
|
||||||
'url': 'http://www.bilibili.tv/video/av1074402/',
|
'url': 'http://www.bilibili.tv/video/av1074402/',
|
||||||
'md5': '9fa226fe2b8a9a4d5a69b4c6a183417e',
|
'md5': '9fa226fe2b8a9a4d5a69b4c6a183417e',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
@ -28,29 +36,65 @@ class BiliBiliIE(InfoExtractor):
|
|||||||
'duration': 308.315,
|
'duration': 308.315,
|
||||||
'timestamp': 1398012660,
|
'timestamp': 1398012660,
|
||||||
'upload_date': '20140420',
|
'upload_date': '20140420',
|
||||||
'thumbnail': 're:^https?://.+\.jpg',
|
'thumbnail': r're:^https?://.+\.jpg',
|
||||||
'uploader': '菊子桑',
|
'uploader': '菊子桑',
|
||||||
'uploader_id': '156160',
|
'uploader_id': '156160',
|
||||||
},
|
},
|
||||||
}
|
}, {
|
||||||
|
# Tested in BiliBiliBangumiIE
|
||||||
|
'url': 'http://bangumi.bilibili.com/anime/1869/play#40062',
|
||||||
|
'only_matching': True,
|
||||||
|
}, {
|
||||||
|
'url': 'http://bangumi.bilibili.com/anime/5802/play#100643',
|
||||||
|
'md5': '3f721ad1e75030cc06faf73587cfec57',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '100643',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'CHAOS;CHILD',
|
||||||
|
'description': '如果你是神明,并且能够让妄想成为现实。那你会进行怎么样的妄想?是淫靡的世界?独裁社会?毁灭性的制裁?还是……2015年,涩谷。从6年前发生的大灾害“涩谷地震”之后复兴了的这个街区里新设立的私立高中...',
|
||||||
|
},
|
||||||
|
'skip': 'Geo-restricted to China',
|
||||||
|
}]
|
||||||
|
|
||||||
_APP_KEY = '6f90a59ac58a4123'
|
_APP_KEY = '84956560bc028eb7'
|
||||||
_BILIBILI_KEY = '0bfd84cc3940035173f35e6777508326'
|
_BILIBILI_KEY = '94aba54af9065f71de72f5508f1cd42e'
|
||||||
|
|
||||||
|
def _report_error(self, result):
|
||||||
|
if 'message' in result:
|
||||||
|
raise ExtractorError('%s said: %s' % (self.IE_NAME, result['message']), expected=True)
|
||||||
|
elif 'code' in result:
|
||||||
|
raise ExtractorError('%s returns error %d' % (self.IE_NAME, result['code']), expected=True)
|
||||||
|
else:
|
||||||
|
raise ExtractorError('Can\'t extract Bangumi episode ID')
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
video_id = self._match_id(url)
|
url, smuggled_data = unsmuggle_url(url, {})
|
||||||
|
|
||||||
|
mobj = re.match(self._VALID_URL, url)
|
||||||
|
video_id = mobj.group('id')
|
||||||
|
anime_id = mobj.group('anime_id')
|
||||||
webpage = self._download_webpage(url, video_id)
|
webpage = self._download_webpage(url, video_id)
|
||||||
|
|
||||||
if 'anime/v' not in url:
|
if 'anime/' not in url:
|
||||||
cid = compat_parse_qs(self._search_regex(
|
cid = compat_parse_qs(self._search_regex(
|
||||||
[r'EmbedPlayer\([^)]+,\s*"([^"]+)"\)',
|
[r'EmbedPlayer\([^)]+,\s*"([^"]+)"\)',
|
||||||
r'<iframe[^>]+src="https://secure\.bilibili\.com/secure,([^"]+)"'],
|
r'<iframe[^>]+src="https://secure\.bilibili\.com/secure,([^"]+)"'],
|
||||||
webpage, 'player parameters'))['cid'][0]
|
webpage, 'player parameters'))['cid'][0]
|
||||||
else:
|
else:
|
||||||
|
if 'no_bangumi_tip' not in smuggled_data:
|
||||||
|
self.to_screen('Downloading episode %s. To download all videos in anime %s, re-run youtube-dl with %s' % (
|
||||||
|
video_id, anime_id, compat_urlparse.urljoin(url, '//bangumi.bilibili.com/anime/%s' % anime_id)))
|
||||||
|
headers = {
|
||||||
|
'Content-Type': 'application/x-www-form-urlencoded; charset=UTF-8',
|
||||||
|
}
|
||||||
|
headers.update(self.geo_verification_headers())
|
||||||
|
|
||||||
js = self._download_json(
|
js = self._download_json(
|
||||||
'http://bangumi.bilibili.com/web_api/get_source', video_id,
|
'http://bangumi.bilibili.com/web_api/get_source', video_id,
|
||||||
data=urlencode_postdata({'episode_id': video_id}),
|
data=urlencode_postdata({'episode_id': video_id}),
|
||||||
headers={'Content-Type': 'application/x-www-form-urlencoded; charset=UTF-8'})
|
headers=headers)
|
||||||
|
if 'result' not in js:
|
||||||
|
self._report_error(js)
|
||||||
cid = js['result']['cid']
|
cid = js['result']['cid']
|
||||||
|
|
||||||
payload = 'appkey=%s&cid=%s&otype=json&quality=2&type=mp4' % (self._APP_KEY, cid)
|
payload = 'appkey=%s&cid=%s&otype=json&quality=2&type=mp4' % (self._APP_KEY, cid)
|
||||||
@ -58,7 +102,11 @@ class BiliBiliIE(InfoExtractor):
|
|||||||
|
|
||||||
video_info = self._download_json(
|
video_info = self._download_json(
|
||||||
'http://interface.bilibili.com/playurl?%s&sign=%s' % (payload, sign),
|
'http://interface.bilibili.com/playurl?%s&sign=%s' % (payload, sign),
|
||||||
video_id, note='Downloading video info page')
|
video_id, note='Downloading video info page',
|
||||||
|
headers=self.geo_verification_headers())
|
||||||
|
|
||||||
|
if 'durl' not in video_info:
|
||||||
|
self._report_error(video_info)
|
||||||
|
|
||||||
entries = []
|
entries = []
|
||||||
|
|
||||||
@ -85,7 +133,7 @@ class BiliBiliIE(InfoExtractor):
|
|||||||
title = self._html_search_regex('<h1[^>]+title="([^"]+)">', webpage, 'title')
|
title = self._html_search_regex('<h1[^>]+title="([^"]+)">', webpage, 'title')
|
||||||
description = self._html_search_meta('description', webpage)
|
description = self._html_search_meta('description', webpage)
|
||||||
timestamp = unified_timestamp(self._html_search_regex(
|
timestamp = unified_timestamp(self._html_search_regex(
|
||||||
r'<time[^>]+datetime="([^"]+)"', webpage, 'upload time', fatal=False))
|
r'<time[^>]+datetime="([^"]+)"', webpage, 'upload time', default=None))
|
||||||
thumbnail = self._html_search_meta(['og:image', 'thumbnailUrl'], webpage)
|
thumbnail = self._html_search_meta(['og:image', 'thumbnailUrl'], webpage)
|
||||||
|
|
||||||
# TODO 'view_count' requires deobfuscating Javascript
|
# TODO 'view_count' requires deobfuscating Javascript
|
||||||
@ -99,7 +147,7 @@ class BiliBiliIE(InfoExtractor):
|
|||||||
}
|
}
|
||||||
|
|
||||||
uploader_mobj = re.search(
|
uploader_mobj = re.search(
|
||||||
r'<a[^>]+href="https?://space\.bilibili\.com/(?P<id>\d+)"[^>]+title="(?P<name>[^"]+)"',
|
r'<a[^>]+href="(?:https?:)?//space\.bilibili\.com/(?P<id>\d+)"[^>]+title="(?P<name>[^"]+)"',
|
||||||
webpage)
|
webpage)
|
||||||
if uploader_mobj:
|
if uploader_mobj:
|
||||||
info.update({
|
info.update({
|
||||||
@ -123,3 +171,70 @@ class BiliBiliIE(InfoExtractor):
|
|||||||
'description': description,
|
'description': description,
|
||||||
'entries': entries,
|
'entries': entries,
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
class BiliBiliBangumiIE(InfoExtractor):
|
||||||
|
_VALID_URL = r'https?://bangumi\.bilibili\.com/anime/(?P<id>\d+)'
|
||||||
|
|
||||||
|
IE_NAME = 'bangumi.bilibili.com'
|
||||||
|
IE_DESC = 'BiliBili番剧'
|
||||||
|
|
||||||
|
_TESTS = [{
|
||||||
|
'url': 'http://bangumi.bilibili.com/anime/1869',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '1869',
|
||||||
|
'title': '混沌武士',
|
||||||
|
'description': 'md5:6a9622b911565794c11f25f81d6a97d2',
|
||||||
|
},
|
||||||
|
'playlist_count': 26,
|
||||||
|
}, {
|
||||||
|
'url': 'http://bangumi.bilibili.com/anime/1869',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '1869',
|
||||||
|
'title': '混沌武士',
|
||||||
|
'description': 'md5:6a9622b911565794c11f25f81d6a97d2',
|
||||||
|
},
|
||||||
|
'playlist': [{
|
||||||
|
'md5': '91da8621454dd58316851c27c68b0c13',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '40062',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': '混沌武士',
|
||||||
|
'description': '故事发生在日本的江户时代。风是一个小酒馆的打工女。一日,酒馆里来了一群恶霸,虽然他们的举动令风十分不满,但是毕竟风只是一届女流,无法对他们采取什么行动,只能在心里嘟哝。这时,酒家里又进来了个“不良份子...',
|
||||||
|
'timestamp': 1414538739,
|
||||||
|
'upload_date': '20141028',
|
||||||
|
'episode': '疾风怒涛 Tempestuous Temperaments',
|
||||||
|
'episode_number': 1,
|
||||||
|
},
|
||||||
|
}],
|
||||||
|
'params': {
|
||||||
|
'playlist_items': '1',
|
||||||
|
},
|
||||||
|
}]
|
||||||
|
|
||||||
|
@classmethod
|
||||||
|
def suitable(cls, url):
|
||||||
|
return False if BiliBiliIE.suitable(url) else super(BiliBiliBangumiIE, cls).suitable(url)
|
||||||
|
|
||||||
|
def _real_extract(self, url):
|
||||||
|
bangumi_id = self._match_id(url)
|
||||||
|
|
||||||
|
# Sometimes this API returns a JSONP response
|
||||||
|
season_info = self._download_json(
|
||||||
|
'http://bangumi.bilibili.com/jsonp/seasoninfo/%s.ver' % bangumi_id,
|
||||||
|
bangumi_id, transform_source=strip_jsonp)['result']
|
||||||
|
|
||||||
|
entries = [{
|
||||||
|
'_type': 'url_transparent',
|
||||||
|
'url': smuggle_url(episode['webplay_url'], {'no_bangumi_tip': 1}),
|
||||||
|
'ie_key': BiliBiliIE.ie_key(),
|
||||||
|
'timestamp': parse_iso8601(episode.get('update_time'), delimiter=' '),
|
||||||
|
'episode': episode.get('index_title'),
|
||||||
|
'episode_number': int_or_none(episode.get('index')),
|
||||||
|
} for episode in season_info['episodes']]
|
||||||
|
|
||||||
|
entries = sorted(entries, key=lambda entry: entry.get('episode_number'))
|
||||||
|
|
||||||
|
return self.playlist_result(
|
||||||
|
entries, bangumi_id,
|
||||||
|
season_info.get('bangumi_title'), season_info.get('evaluate'))
|
||||||
|
@ -19,7 +19,7 @@ class BioBioChileTVIE(InfoExtractor):
|
|||||||
'id': 'sobre-camaras-y-camarillas-parlamentarias',
|
'id': 'sobre-camaras-y-camarillas-parlamentarias',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Sobre Cámaras y camarillas parlamentarias',
|
'title': 'Sobre Cámaras y camarillas parlamentarias',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
'uploader': 'Fernando Atria',
|
'uploader': 'Fernando Atria',
|
||||||
},
|
},
|
||||||
'skip': 'URL expired and redirected to http://www.biobiochile.cl/portada/bbtv/index.html',
|
'skip': 'URL expired and redirected to http://www.biobiochile.cl/portada/bbtv/index.html',
|
||||||
@ -31,7 +31,7 @@ class BioBioChileTVIE(InfoExtractor):
|
|||||||
'id': 'natalia-valdebenito-repasa-a-diputado-hasbun-paso-a-la-categoria-de-hablar-brutalidades',
|
'id': 'natalia-valdebenito-repasa-a-diputado-hasbun-paso-a-la-categoria-de-hablar-brutalidades',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Natalia Valdebenito repasa a diputado Hasbún: Pasó a la categoría de hablar brutalidades',
|
'title': 'Natalia Valdebenito repasa a diputado Hasbún: Pasó a la categoría de hablar brutalidades',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
'uploader': 'Piangella Obrador',
|
'uploader': 'Piangella Obrador',
|
||||||
},
|
},
|
||||||
'params': {
|
'params': {
|
||||||
|
@ -33,6 +33,10 @@ class BloombergIE(InfoExtractor):
|
|||||||
'params': {
|
'params': {
|
||||||
'format': 'best[format_id^=hds]',
|
'format': 'best[format_id^=hds]',
|
||||||
},
|
},
|
||||||
|
}, {
|
||||||
|
# data-bmmrid=
|
||||||
|
'url': 'https://www.bloomberg.com/politics/articles/2017-02-08/le-pen-aide-briefed-french-central-banker-on-plan-to-print-money',
|
||||||
|
'only_matching': True,
|
||||||
}, {
|
}, {
|
||||||
'url': 'http://www.bloomberg.com/news/articles/2015-11-12/five-strange-things-that-have-been-happening-in-financial-markets',
|
'url': 'http://www.bloomberg.com/news/articles/2015-11-12/five-strange-things-that-have-been-happening-in-financial-markets',
|
||||||
'only_matching': True,
|
'only_matching': True,
|
||||||
@ -45,8 +49,10 @@ class BloombergIE(InfoExtractor):
|
|||||||
name = self._match_id(url)
|
name = self._match_id(url)
|
||||||
webpage = self._download_webpage(url, name)
|
webpage = self._download_webpage(url, name)
|
||||||
video_id = self._search_regex(
|
video_id = self._search_regex(
|
||||||
r'["\']bmmrId["\']\s*:\s*(["\'])(?P<url>.+?)\1',
|
(r'["\']bmmrId["\']\s*:\s*(["\'])(?P<id>(?:(?!\1).)+)\1',
|
||||||
webpage, 'id', group='url', default=None)
|
r'videoId\s*:\s*(["\'])(?P<id>(?:(?!\1).)+)\1',
|
||||||
|
r'data-bmmrid=(["\'])(?P<id>(?:(?!\1).)+)\1'),
|
||||||
|
webpage, 'id', group='id', default=None)
|
||||||
if not video_id:
|
if not video_id:
|
||||||
bplayer_data = self._parse_json(self._search_regex(
|
bplayer_data = self._parse_json(self._search_regex(
|
||||||
r'BPlayer\(null,\s*({[^;]+})\);', webpage, 'id'), name)
|
r'BPlayer\(null,\s*({[^;]+})\);', webpage, 'id'), name)
|
||||||
|
@ -1,9 +1,9 @@
|
|||||||
from __future__ import unicode_literals
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
import re
|
import re
|
||||||
import json
|
|
||||||
|
|
||||||
from .common import InfoExtractor
|
from .common import InfoExtractor
|
||||||
|
from ..compat import compat_str
|
||||||
from ..utils import (
|
from ..utils import (
|
||||||
int_or_none,
|
int_or_none,
|
||||||
parse_age_limit,
|
parse_age_limit,
|
||||||
@ -11,7 +11,7 @@ from ..utils import (
|
|||||||
|
|
||||||
|
|
||||||
class BreakIE(InfoExtractor):
|
class BreakIE(InfoExtractor):
|
||||||
_VALID_URL = r'https?://(?:www\.)?break\.com/video/(?:[^/]+/)*.+-(?P<id>\d+)'
|
_VALID_URL = r'https?://(?:www\.)?(?P<site>break|screenjunkies)\.com/video/(?P<display_id>[^/]+?)(?:-(?P<id>\d+))?(?:[/?#&]|$)'
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'http://www.break.com/video/when-girls-act-like-guys-2468056',
|
'url': 'http://www.break.com/video/when-girls-act-like-guys-2468056',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
@ -20,45 +20,124 @@ class BreakIE(InfoExtractor):
|
|||||||
'title': 'When Girls Act Like D-Bags',
|
'title': 'When Girls Act Like D-Bags',
|
||||||
'age_limit': 13,
|
'age_limit': 13,
|
||||||
}
|
}
|
||||||
|
}, {
|
||||||
|
'url': 'http://www.screenjunkies.com/video/best-quentin-tarantino-movie-2841915',
|
||||||
|
'md5': '5c2b686bec3d43de42bde9ec047536b0',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '2841915',
|
||||||
|
'display_id': 'best-quentin-tarantino-movie',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'Best Quentin Tarantino Movie',
|
||||||
|
'thumbnail': r're:^https?://.*\.jpg',
|
||||||
|
'duration': 3671,
|
||||||
|
'age_limit': 13,
|
||||||
|
'tags': list,
|
||||||
|
},
|
||||||
|
}, {
|
||||||
|
'url': 'http://www.screenjunkies.com/video/honest-trailers-the-dark-knight',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '2348808',
|
||||||
|
'display_id': 'honest-trailers-the-dark-knight',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'Honest Trailers - The Dark Knight',
|
||||||
|
'thumbnail': r're:^https?://.*\.(?:jpg|png)',
|
||||||
|
'age_limit': 10,
|
||||||
|
'tags': list,
|
||||||
|
},
|
||||||
|
}, {
|
||||||
|
# requires subscription but worked around
|
||||||
|
'url': 'http://www.screenjunkies.com/video/knocking-dead-ep-1-the-show-so-far-3003285',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '3003285',
|
||||||
|
'display_id': 'knocking-dead-ep-1-the-show-so-far',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'State of The Dead Recap: Knocking Dead Pilot',
|
||||||
|
'thumbnail': r're:^https?://.*\.jpg',
|
||||||
|
'duration': 3307,
|
||||||
|
'age_limit': 13,
|
||||||
|
'tags': list,
|
||||||
|
},
|
||||||
}, {
|
}, {
|
||||||
'url': 'http://www.break.com/video/ugc/baby-flex-2773063',
|
'url': 'http://www.break.com/video/ugc/baby-flex-2773063',
|
||||||
'only_matching': True,
|
'only_matching': True,
|
||||||
}]
|
}]
|
||||||
|
|
||||||
def _real_extract(self, url):
|
_DEFAULT_BITRATES = (48, 150, 320, 496, 864, 2240, 3264)
|
||||||
video_id = self._match_id(url)
|
|
||||||
webpage = self._download_webpage(
|
|
||||||
'http://www.break.com/embed/%s' % video_id, video_id)
|
|
||||||
info = json.loads(self._search_regex(
|
|
||||||
r'var embedVars = ({.*})\s*?</script>',
|
|
||||||
webpage, 'info json', flags=re.DOTALL))
|
|
||||||
|
|
||||||
youtube_id = info.get('youtubeId')
|
def _real_extract(self, url):
|
||||||
|
site, display_id, video_id = re.match(self._VALID_URL, url).groups()
|
||||||
|
|
||||||
|
if not video_id:
|
||||||
|
webpage = self._download_webpage(url, display_id)
|
||||||
|
video_id = self._search_regex(
|
||||||
|
(r'src=["\']/embed/(\d+)', r'data-video-content-id=["\'](\d+)'),
|
||||||
|
webpage, 'video id')
|
||||||
|
|
||||||
|
webpage = self._download_webpage(
|
||||||
|
'http://www.%s.com/embed/%s' % (site, video_id),
|
||||||
|
display_id, 'Downloading video embed page')
|
||||||
|
embed_vars = self._parse_json(
|
||||||
|
self._search_regex(
|
||||||
|
r'(?s)embedVars\s*=\s*({.+?})\s*</script>', webpage, 'embed vars'),
|
||||||
|
display_id)
|
||||||
|
|
||||||
|
youtube_id = embed_vars.get('youtubeId')
|
||||||
if youtube_id:
|
if youtube_id:
|
||||||
return self.url_result(youtube_id, 'Youtube')
|
return self.url_result(youtube_id, 'Youtube')
|
||||||
|
|
||||||
formats = [{
|
title = embed_vars['contentName']
|
||||||
'url': media['uri'] + '?' + info['AuthToken'],
|
|
||||||
'tbr': media['bitRate'],
|
|
||||||
'width': media['width'],
|
|
||||||
'height': media['height'],
|
|
||||||
} for media in info['media'] if media.get('mediaPurpose') == 'play']
|
|
||||||
|
|
||||||
if not formats:
|
formats = []
|
||||||
|
bitrates = []
|
||||||
|
for f in embed_vars.get('media', []):
|
||||||
|
if not f.get('uri') or f.get('mediaPurpose') != 'play':
|
||||||
|
continue
|
||||||
|
bitrate = int_or_none(f.get('bitRate'))
|
||||||
|
if bitrate:
|
||||||
|
bitrates.append(bitrate)
|
||||||
formats.append({
|
formats.append({
|
||||||
'url': info['videoUri']
|
'url': f['uri'],
|
||||||
|
'format_id': 'http-%d' % bitrate if bitrate else 'http',
|
||||||
|
'width': int_or_none(f.get('width')),
|
||||||
|
'height': int_or_none(f.get('height')),
|
||||||
|
'tbr': bitrate,
|
||||||
|
'format': 'mp4',
|
||||||
})
|
})
|
||||||
|
|
||||||
self._sort_formats(formats)
|
if not bitrates:
|
||||||
|
# When subscriptionLevel > 0, i.e. plus subscription is required
|
||||||
|
# media list will be empty. However, hds and hls uris are still
|
||||||
|
# available. We can grab them assuming bitrates to be default.
|
||||||
|
bitrates = self._DEFAULT_BITRATES
|
||||||
|
|
||||||
duration = int_or_none(info.get('videoLengthInSeconds'))
|
auth_token = embed_vars.get('AuthToken')
|
||||||
age_limit = parse_age_limit(info.get('audienceRating'))
|
|
||||||
|
def construct_manifest_url(base_url, ext):
|
||||||
|
pieces = [base_url]
|
||||||
|
pieces.extend([compat_str(b) for b in bitrates])
|
||||||
|
pieces.append('_kbps.mp4.%s?%s' % (ext, auth_token))
|
||||||
|
return ','.join(pieces)
|
||||||
|
|
||||||
|
if bitrates and auth_token:
|
||||||
|
hds_url = embed_vars.get('hdsUri')
|
||||||
|
if hds_url:
|
||||||
|
formats.extend(self._extract_f4m_formats(
|
||||||
|
construct_manifest_url(hds_url, 'f4m'),
|
||||||
|
display_id, f4m_id='hds', fatal=False))
|
||||||
|
hls_url = embed_vars.get('hlsUri')
|
||||||
|
if hls_url:
|
||||||
|
formats.extend(self._extract_m3u8_formats(
|
||||||
|
construct_manifest_url(hls_url, 'm3u8'),
|
||||||
|
display_id, 'mp4', entry_protocol='m3u8_native', m3u8_id='hls', fatal=False))
|
||||||
|
self._sort_formats(formats)
|
||||||
|
|
||||||
return {
|
return {
|
||||||
'id': video_id,
|
'id': video_id,
|
||||||
'title': info['contentName'],
|
'display_id': display_id,
|
||||||
'thumbnail': info['thumbUri'],
|
'title': title,
|
||||||
'duration': duration,
|
'thumbnail': embed_vars.get('thumbUri'),
|
||||||
'age_limit': age_limit,
|
'duration': int_or_none(embed_vars.get('videoLengthInSeconds')) or None,
|
||||||
|
'age_limit': parse_age_limit(embed_vars.get('audienceRating')),
|
||||||
|
'tags': embed_vars.get('tags', '').split(','),
|
||||||
'formats': formats,
|
'formats': formats,
|
||||||
}
|
}
|
||||||
|
@ -179,7 +179,7 @@ class BrightcoveLegacyIE(InfoExtractor):
|
|||||||
|
|
||||||
params = {}
|
params = {}
|
||||||
|
|
||||||
playerID = find_param('playerID')
|
playerID = find_param('playerID') or find_param('playerId')
|
||||||
if playerID is None:
|
if playerID is None:
|
||||||
raise ExtractorError('Cannot find player ID')
|
raise ExtractorError('Cannot find player ID')
|
||||||
params['playerID'] = playerID
|
params['playerID'] = playerID
|
||||||
@ -191,6 +191,10 @@ class BrightcoveLegacyIE(InfoExtractor):
|
|||||||
# These fields hold the id of the video
|
# These fields hold the id of the video
|
||||||
videoPlayer = find_param('@videoPlayer') or find_param('videoId') or find_param('videoID') or find_param('@videoList')
|
videoPlayer = find_param('@videoPlayer') or find_param('videoId') or find_param('videoID') or find_param('@videoList')
|
||||||
if videoPlayer is not None:
|
if videoPlayer is not None:
|
||||||
|
if isinstance(videoPlayer, list):
|
||||||
|
videoPlayer = videoPlayer[0]
|
||||||
|
if not (videoPlayer.isdigit() or videoPlayer.startswith('ref:')):
|
||||||
|
return None
|
||||||
params['@videoPlayer'] = videoPlayer
|
params['@videoPlayer'] = videoPlayer
|
||||||
linkBase = find_param('linkBaseURL')
|
linkBase = find_param('linkBaseURL')
|
||||||
if linkBase is not None:
|
if linkBase is not None:
|
||||||
@ -204,7 +208,7 @@ class BrightcoveLegacyIE(InfoExtractor):
|
|||||||
# // build Brightcove <object /> XML
|
# // build Brightcove <object /> XML
|
||||||
# }
|
# }
|
||||||
m = re.search(
|
m = re.search(
|
||||||
r'''(?x)customBC.\createVideo\(
|
r'''(?x)customBC\.createVideo\(
|
||||||
.*? # skipping width and height
|
.*? # skipping width and height
|
||||||
["\'](?P<playerID>\d+)["\']\s*,\s* # playerID
|
["\'](?P<playerID>\d+)["\']\s*,\s* # playerID
|
||||||
["\'](?P<playerKey>AQ[^"\']{48})[^"\']*["\']\s*,\s* # playerKey begins with AQ and is 50 characters
|
["\'](?P<playerKey>AQ[^"\']{48})[^"\']*["\']\s*,\s* # playerKey begins with AQ and is 50 characters
|
||||||
@ -232,13 +236,16 @@ class BrightcoveLegacyIE(InfoExtractor):
|
|||||||
"""Return a list of all Brightcove URLs from the webpage """
|
"""Return a list of all Brightcove URLs from the webpage """
|
||||||
|
|
||||||
url_m = re.search(
|
url_m = re.search(
|
||||||
r'<meta\s+property=[\'"]og:video[\'"]\s+content=[\'"](https?://(?:secure|c)\.brightcove.com/[^\'"]+)[\'"]',
|
r'''(?x)
|
||||||
webpage)
|
<meta\s+
|
||||||
|
(?:property|itemprop)=([\'"])(?:og:video|embedURL)\1[^>]+
|
||||||
|
content=([\'"])(?P<url>https?://(?:secure|c)\.brightcove.com/(?:(?!\2).)+)\2
|
||||||
|
''', webpage)
|
||||||
if url_m:
|
if url_m:
|
||||||
url = unescapeHTML(url_m.group(1))
|
url = unescapeHTML(url_m.group('url'))
|
||||||
# Some sites don't add it, we can't download with this url, for example:
|
# Some sites don't add it, we can't download with this url, for example:
|
||||||
# http://www.ktvu.com/videos/news/raw-video-caltrain-releases-video-of-man-almost/vCTZdY/
|
# http://www.ktvu.com/videos/news/raw-video-caltrain-releases-video-of-man-almost/vCTZdY/
|
||||||
if 'playerKey' in url or 'videoId' in url:
|
if 'playerKey' in url or 'videoId' in url or 'idVideo' in url:
|
||||||
return [url]
|
return [url]
|
||||||
|
|
||||||
matches = re.findall(
|
matches = re.findall(
|
||||||
@ -259,7 +266,7 @@ class BrightcoveLegacyIE(InfoExtractor):
|
|||||||
url, smuggled_data = unsmuggle_url(url, {})
|
url, smuggled_data = unsmuggle_url(url, {})
|
||||||
|
|
||||||
# Change the 'videoId' and others field to '@videoPlayer'
|
# Change the 'videoId' and others field to '@videoPlayer'
|
||||||
url = re.sub(r'(?<=[?&])(videoI(d|D)|bctid)', '%40videoPlayer', url)
|
url = re.sub(r'(?<=[?&])(videoI(d|D)|idVideo|bctid)', '%40videoPlayer', url)
|
||||||
# Change bckey (used by bcove.me urls) to playerKey
|
# Change bckey (used by bcove.me urls) to playerKey
|
||||||
url = re.sub(r'(?<=[?&])bckey', 'playerKey', url)
|
url = re.sub(r'(?<=[?&])bckey', 'playerKey', url)
|
||||||
mobj = re.match(self._VALID_URL, url)
|
mobj = re.match(self._VALID_URL, url)
|
||||||
@ -508,6 +515,9 @@ class BrightcoveNewIE(InfoExtractor):
|
|||||||
return entries
|
return entries
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
|
url, smuggled_data = unsmuggle_url(url, {})
|
||||||
|
self._initialize_geo_bypass(smuggled_data.get('geo_countries'))
|
||||||
|
|
||||||
account_id, player_id, embed, video_id = re.match(self._VALID_URL, url).groups()
|
account_id, player_id, embed, video_id = re.match(self._VALID_URL, url).groups()
|
||||||
|
|
||||||
webpage = self._download_webpage(
|
webpage = self._download_webpage(
|
||||||
@ -537,8 +547,10 @@ class BrightcoveNewIE(InfoExtractor):
|
|||||||
except ExtractorError as e:
|
except ExtractorError as e:
|
||||||
if isinstance(e.cause, compat_HTTPError) and e.cause.code == 403:
|
if isinstance(e.cause, compat_HTTPError) and e.cause.code == 403:
|
||||||
json_data = self._parse_json(e.cause.read().decode(), video_id)[0]
|
json_data = self._parse_json(e.cause.read().decode(), video_id)[0]
|
||||||
raise ExtractorError(
|
message = json_data.get('message') or json_data['error_code']
|
||||||
json_data.get('message') or json_data['error_code'], expected=True)
|
if json_data.get('error_subcode') == 'CLIENT_GEO':
|
||||||
|
self.raise_geo_restricted(msg=message)
|
||||||
|
raise ExtractorError(message, expected=True)
|
||||||
raise
|
raise
|
||||||
|
|
||||||
title = json_data['name'].strip()
|
title = json_data['name'].strip()
|
||||||
@ -548,7 +560,7 @@ class BrightcoveNewIE(InfoExtractor):
|
|||||||
container = source.get('container')
|
container = source.get('container')
|
||||||
ext = mimetype2ext(source.get('type'))
|
ext = mimetype2ext(source.get('type'))
|
||||||
src = source.get('src')
|
src = source.get('src')
|
||||||
if ext == 'ism':
|
if ext == 'ism' or container == 'WVM':
|
||||||
continue
|
continue
|
||||||
elif ext == 'm3u8' or container == 'M2TS':
|
elif ext == 'm3u8' or container == 'M2TS':
|
||||||
if not src:
|
if not src:
|
||||||
|
@ -16,7 +16,7 @@ class BYUtvIE(InfoExtractor):
|
|||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Season 5 Episode 5',
|
'title': 'Season 5 Episode 5',
|
||||||
'description': 'md5:e07269172baff037f8e8bf9956bc9747',
|
'description': 'md5:e07269172baff037f8e8bf9956bc9747',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
'duration': 1486.486,
|
'duration': 1486.486,
|
||||||
},
|
},
|
||||||
'params': {
|
'params': {
|
||||||
|
@ -26,7 +26,7 @@ class CamdemyIE(InfoExtractor):
|
|||||||
'id': '5181',
|
'id': '5181',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Ch1-1 Introduction, Signals (02-23-2012)',
|
'title': 'Ch1-1 Introduction, Signals (02-23-2012)',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
'creator': 'ss11spring',
|
'creator': 'ss11spring',
|
||||||
'duration': 1591,
|
'duration': 1591,
|
||||||
'upload_date': '20130114',
|
'upload_date': '20130114',
|
||||||
@ -41,7 +41,7 @@ class CamdemyIE(InfoExtractor):
|
|||||||
'id': '13885',
|
'id': '13885',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'EverCam + Camdemy QuickStart',
|
'title': 'EverCam + Camdemy QuickStart',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
'description': 'md5:2a9f989c2b153a2342acee579c6e7db6',
|
'description': 'md5:2a9f989c2b153a2342acee579c6e7db6',
|
||||||
'creator': 'evercam',
|
'creator': 'evercam',
|
||||||
'duration': 318,
|
'duration': 318,
|
||||||
|
@ -6,11 +6,13 @@ import re
|
|||||||
from .common import InfoExtractor
|
from .common import InfoExtractor
|
||||||
from ..compat import compat_urllib_parse_urlparse
|
from ..compat import compat_urllib_parse_urlparse
|
||||||
from ..utils import (
|
from ..utils import (
|
||||||
|
dict_get,
|
||||||
ExtractorError,
|
ExtractorError,
|
||||||
HEADRequest,
|
HEADRequest,
|
||||||
unified_strdate,
|
|
||||||
qualities,
|
|
||||||
int_or_none,
|
int_or_none,
|
||||||
|
qualities,
|
||||||
|
remove_end,
|
||||||
|
unified_strdate,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
@ -25,6 +27,7 @@ class CanalplusIE(InfoExtractor):
|
|||||||
(?:www\.)?d8\.tv|
|
(?:www\.)?d8\.tv|
|
||||||
(?:www\.)?c8\.fr|
|
(?:www\.)?c8\.fr|
|
||||||
(?:www\.)?d17\.tv|
|
(?:www\.)?d17\.tv|
|
||||||
|
(?:(?:football|www)\.)?cstar\.fr|
|
||||||
(?:www\.)?itele\.fr
|
(?:www\.)?itele\.fr
|
||||||
)/(?:(?:[^/]+/)*(?P<display_id>[^/?#&]+))?(?:\?.*\bvid=(?P<vid>\d+))?|
|
)/(?:(?:[^/]+/)*(?P<display_id>[^/?#&]+))?(?:\?.*\bvid=(?P<vid>\d+))?|
|
||||||
player\.canalplus\.fr/#/(?P<id>\d+)
|
player\.canalplus\.fr/#/(?P<id>\d+)
|
||||||
@ -38,49 +41,62 @@ class CanalplusIE(InfoExtractor):
|
|||||||
'd8': 'd8',
|
'd8': 'd8',
|
||||||
'c8': 'd8',
|
'c8': 'd8',
|
||||||
'd17': 'd17',
|
'd17': 'd17',
|
||||||
|
'cstar': 'd17',
|
||||||
'itele': 'itele',
|
'itele': 'itele',
|
||||||
}
|
}
|
||||||
|
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'http://www.canalplus.fr/c-emissions/pid1830-c-zapping.html?vid=1192814',
|
'url': 'http://www.canalplus.fr/c-emissions/pid1830-c-zapping.html?vid=1192814',
|
||||||
'md5': '41f438a4904f7664b91b4ed0dec969dc',
|
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '1192814',
|
'id': '1405510',
|
||||||
|
'display_id': 'pid1830-c-zapping',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': "L'Année du Zapping 2014 - L'Année du Zapping 2014",
|
'title': 'Zapping - 02/07/2016',
|
||||||
'description': "Toute l'année 2014 dans un Zapping exceptionnel !",
|
'description': 'Le meilleur de toutes les chaînes, tous les jours',
|
||||||
'upload_date': '20150105',
|
'upload_date': '20160702',
|
||||||
},
|
},
|
||||||
}, {
|
}, {
|
||||||
'url': 'http://www.piwiplus.fr/videos-piwi/pid1405-le-labyrinthe-boing-super-ranger.html?vid=1108190',
|
'url': 'http://www.piwiplus.fr/videos-piwi/pid1405-le-labyrinthe-boing-super-ranger.html?vid=1108190',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '1108190',
|
'id': '1108190',
|
||||||
'ext': 'flv',
|
'display_id': 'pid1405-le-labyrinthe-boing-super-ranger',
|
||||||
'title': 'Le labyrinthe - Boing super ranger',
|
'ext': 'mp4',
|
||||||
|
'title': 'BOING SUPER RANGER - Ep : Le labyrinthe',
|
||||||
'description': 'md5:4cea7a37153be42c1ba2c1d3064376ff',
|
'description': 'md5:4cea7a37153be42c1ba2c1d3064376ff',
|
||||||
'upload_date': '20140724',
|
'upload_date': '20140724',
|
||||||
},
|
},
|
||||||
'skip': 'Only works from France',
|
'skip': 'Only works from France',
|
||||||
}, {
|
}, {
|
||||||
'url': 'http://www.d8.tv/d8-docs-mags/pid5198-d8-en-quete-d-actualite.html?vid=1390231',
|
'url': 'http://www.c8.fr/c8-divertissement/ms-touche-pas-a-mon-poste/pid6318-videos-integrales.html',
|
||||||
|
'md5': '4b47b12b4ee43002626b97fad8fb1de5',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '1390231',
|
'id': '1420213',
|
||||||
|
'display_id': 'pid6318-videos-integrales',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': "Vacances pas chères : prix discount ou grosses dépenses ? - En quête d'actualité",
|
'title': 'TPMP ! Même le matin - Les 35H de Baba - 14/10/2016',
|
||||||
'description': 'md5:edb6cf1cb4a1e807b5dd089e1ac8bfc6',
|
'description': 'md5:f96736c1b0ffaa96fd5b9e60ad871799',
|
||||||
'upload_date': '20160512',
|
'upload_date': '20161014',
|
||||||
},
|
},
|
||||||
'params': {
|
'skip': 'Only works from France',
|
||||||
'skip_download': True,
|
}, {
|
||||||
|
'url': 'http://www.itele.fr/chroniques/invite-michael-darmon/rachida-dati-nicolas-sarkozy-est-le-plus-en-phase-avec-les-inquietudes-des-francais-171510',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '1420176',
|
||||||
|
'display_id': 'rachida-dati-nicolas-sarkozy-est-le-plus-en-phase-avec-les-inquietudes-des-francais-171510',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'L\'invité de Michaël Darmon du 14/10/2016 - ',
|
||||||
|
'description': 'Chaque matin du lundi au vendredi, Michaël Darmon reçoit un invité politique à 8h25.',
|
||||||
|
'upload_date': '20161014',
|
||||||
},
|
},
|
||||||
}, {
|
}, {
|
||||||
'url': 'http://www.itele.fr/chroniques/invite-bruce-toussaint/thierry-solere-nicolas-sarkozy-officialisera-sa-candidature-a-la-primaire-quand-il-le-voudra-167224',
|
'url': 'http://football.cstar.fr/cstar-minisite-foot/pid7566-feminines-videos.html?vid=1416769',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '1398334',
|
'id': '1416769',
|
||||||
|
'display_id': 'pid7566-feminines-videos',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': "L'invité de Bruce Toussaint du 07/06/2016 - ",
|
'title': 'France - Albanie : les temps forts de la soirée - 20/09/2016',
|
||||||
'description': 'md5:40ac7c9ad0feaeb6f605bad986f61324',
|
'description': 'md5:c3f30f2aaac294c1c969b3294de6904e',
|
||||||
'upload_date': '20160607',
|
'upload_date': '20160921',
|
||||||
},
|
},
|
||||||
'params': {
|
'params': {
|
||||||
'skip_download': True,
|
'skip_download': True,
|
||||||
@ -95,18 +111,18 @@ class CanalplusIE(InfoExtractor):
|
|||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
mobj = re.match(self._VALID_URL, url)
|
mobj = re.match(self._VALID_URL, url)
|
||||||
video_id = mobj.groupdict().get('id') or mobj.groupdict().get('vid')
|
|
||||||
|
|
||||||
site_id = self._SITE_ID_MAP[compat_urllib_parse_urlparse(url).netloc.rsplit('.', 2)[-2]]
|
site_id = self._SITE_ID_MAP[compat_urllib_parse_urlparse(url).netloc.rsplit('.', 2)[-2]]
|
||||||
|
|
||||||
# Beware, some subclasses do not define an id group
|
# Beware, some subclasses do not define an id group
|
||||||
display_id = mobj.group('display_id') or video_id
|
display_id = remove_end(dict_get(mobj.groupdict(), ('display_id', 'id', 'vid')), '.html')
|
||||||
|
|
||||||
if video_id is None:
|
|
||||||
webpage = self._download_webpage(url, display_id)
|
webpage = self._download_webpage(url, display_id)
|
||||||
video_id = self._search_regex(
|
video_id = self._search_regex(
|
||||||
[r'<canal:player[^>]+?videoId=(["\'])(?P<id>\d+)', r'id=["\']canal_video_player(?P<id>\d+)'],
|
[r'<canal:player[^>]+?videoId=(["\'])(?P<id>\d+)',
|
||||||
webpage, 'video id', group='id')
|
r'id=["\']canal_video_player(?P<id>\d+)',
|
||||||
|
r'data-video=["\'](?P<id>\d+)'],
|
||||||
|
webpage, 'video id', default=mobj.group('vid'), group='id')
|
||||||
|
|
||||||
info_url = self._VIDEO_INFO_TEMPLATE % (site_id, video_id)
|
info_url = self._VIDEO_INFO_TEMPLATE % (site_id, video_id)
|
||||||
video_data = self._download_json(info_url, video_id, 'Downloading video JSON')
|
video_data = self._download_json(info_url, video_id, 'Downloading video JSON')
|
||||||
|
@ -17,7 +17,7 @@ class CanvasIE(InfoExtractor):
|
|||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'De afspraak veilt voor de Warmste Week',
|
'title': 'De afspraak veilt voor de Warmste Week',
|
||||||
'description': 'md5:24cb860c320dc2be7358e0e5aa317ba6',
|
'description': 'md5:24cb860c320dc2be7358e0e5aa317ba6',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
'duration': 49.02,
|
'duration': 49.02,
|
||||||
}
|
}
|
||||||
}, {
|
}, {
|
||||||
@ -29,7 +29,7 @@ class CanvasIE(InfoExtractor):
|
|||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Pieter 0167',
|
'title': 'Pieter 0167',
|
||||||
'description': 'md5:943cd30f48a5d29ba02c3a104dc4ec4e',
|
'description': 'md5:943cd30f48a5d29ba02c3a104dc4ec4e',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
'duration': 2553.08,
|
'duration': 2553.08,
|
||||||
'subtitles': {
|
'subtitles': {
|
||||||
'nl': [{
|
'nl': [{
|
||||||
@ -48,7 +48,7 @@ class CanvasIE(InfoExtractor):
|
|||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Herbekijk Sorry voor alles',
|
'title': 'Herbekijk Sorry voor alles',
|
||||||
'description': 'md5:8bb2805df8164e5eb95d6a7a29dc0dd3',
|
'description': 'md5:8bb2805df8164e5eb95d6a7a29dc0dd3',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
'duration': 3788.06,
|
'duration': 3788.06,
|
||||||
},
|
},
|
||||||
'params': {
|
'params': {
|
||||||
@ -89,6 +89,9 @@ class CanvasIE(InfoExtractor):
|
|||||||
elif format_type == 'HDS':
|
elif format_type == 'HDS':
|
||||||
formats.extend(self._extract_f4m_formats(
|
formats.extend(self._extract_f4m_formats(
|
||||||
format_url, display_id, f4m_id=format_type, fatal=False))
|
format_url, display_id, f4m_id=format_type, fatal=False))
|
||||||
|
elif format_type == 'MPEG_DASH':
|
||||||
|
formats.extend(self._extract_mpd_formats(
|
||||||
|
format_url, display_id, mpd_id=format_type, fatal=False))
|
||||||
else:
|
else:
|
||||||
formats.append({
|
formats.append({
|
||||||
'format_id': format_type,
|
'format_id': format_type,
|
||||||
|
@ -9,6 +9,8 @@ from ..utils import (
|
|||||||
try_get,
|
try_get,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
from .videomore import VideomoreIE
|
||||||
|
|
||||||
|
|
||||||
class CarambaTVIE(InfoExtractor):
|
class CarambaTVIE(InfoExtractor):
|
||||||
_VALID_URL = r'(?:carambatv:|https?://video1\.carambatv\.ru/v/)(?P<id>\d+)'
|
_VALID_URL = r'(?:carambatv:|https?://video1\.carambatv\.ru/v/)(?P<id>\d+)'
|
||||||
@ -19,7 +21,7 @@ class CarambaTVIE(InfoExtractor):
|
|||||||
'id': '191910501',
|
'id': '191910501',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': '[BadComedian] - Разборка в Маниле (Абсолютный обзор)',
|
'title': '[BadComedian] - Разборка в Маниле (Абсолютный обзор)',
|
||||||
'thumbnail': 're:^https?://.*\.jpg',
|
'thumbnail': r're:^https?://.*\.jpg',
|
||||||
'duration': 2678.31,
|
'duration': 2678.31,
|
||||||
},
|
},
|
||||||
}, {
|
}, {
|
||||||
@ -62,14 +64,16 @@ class CarambaTVPageIE(InfoExtractor):
|
|||||||
_VALID_URL = r'https?://carambatv\.ru/(?:[^/]+/)+(?P<id>[^/?#&]+)'
|
_VALID_URL = r'https?://carambatv\.ru/(?:[^/]+/)+(?P<id>[^/?#&]+)'
|
||||||
_TEST = {
|
_TEST = {
|
||||||
'url': 'http://carambatv.ru/movie/bad-comedian/razborka-v-manile/',
|
'url': 'http://carambatv.ru/movie/bad-comedian/razborka-v-manile/',
|
||||||
'md5': '',
|
'md5': 'a49fb0ec2ad66503eeb46aac237d3c86',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '191910501',
|
'id': '475222',
|
||||||
'ext': 'mp4',
|
'ext': 'flv',
|
||||||
'title': '[BadComedian] - Разборка в Маниле (Абсолютный обзор)',
|
'title': '[BadComedian] - Разборка в Маниле (Абсолютный обзор)',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg',
|
||||||
'duration': 2678.31,
|
# duration reported by videomore is incorrect
|
||||||
|
'duration': int,
|
||||||
},
|
},
|
||||||
|
'add_ie': [VideomoreIE.ie_key()],
|
||||||
}
|
}
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
@ -77,6 +81,16 @@ class CarambaTVPageIE(InfoExtractor):
|
|||||||
|
|
||||||
webpage = self._download_webpage(url, video_id)
|
webpage = self._download_webpage(url, video_id)
|
||||||
|
|
||||||
|
videomore_url = VideomoreIE._extract_url(webpage)
|
||||||
|
if videomore_url:
|
||||||
|
title = self._og_search_title(webpage)
|
||||||
|
return {
|
||||||
|
'_type': 'url_transparent',
|
||||||
|
'url': videomore_url,
|
||||||
|
'ie_key': VideomoreIE.ie_key(),
|
||||||
|
'title': title,
|
||||||
|
}
|
||||||
|
|
||||||
video_url = self._og_search_property('video:iframe', webpage, default=None)
|
video_url = self._og_search_property('video:iframe', webpage, default=None)
|
||||||
|
|
||||||
if not video_url:
|
if not video_url:
|
||||||
|
@ -90,19 +90,21 @@ class CBCIE(InfoExtractor):
|
|||||||
},
|
},
|
||||||
}],
|
}],
|
||||||
'skip': 'Geo-restricted to Canada',
|
'skip': 'Geo-restricted to Canada',
|
||||||
|
}, {
|
||||||
|
# multiple CBC.APP.Caffeine.initInstance(...)
|
||||||
|
'url': 'http://www.cbc.ca/news/canada/calgary/dog-indoor-exercise-winter-1.3928238',
|
||||||
|
'info_dict': {
|
||||||
|
'title': 'Keep Rover active during the deep freeze with doggie pushups and other fun indoor tasks',
|
||||||
|
'id': 'dog-indoor-exercise-winter-1.3928238',
|
||||||
|
},
|
||||||
|
'playlist_mincount': 6,
|
||||||
}]
|
}]
|
||||||
|
|
||||||
@classmethod
|
@classmethod
|
||||||
def suitable(cls, url):
|
def suitable(cls, url):
|
||||||
return False if CBCPlayerIE.suitable(url) else super(CBCIE, cls).suitable(url)
|
return False if CBCPlayerIE.suitable(url) else super(CBCIE, cls).suitable(url)
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _extract_player_init(self, player_init, display_id):
|
||||||
display_id = self._match_id(url)
|
|
||||||
webpage = self._download_webpage(url, display_id)
|
|
||||||
player_init = self._search_regex(
|
|
||||||
r'CBC\.APP\.Caffeine\.initInstance\(({.+?})\);', webpage, 'player init',
|
|
||||||
default=None)
|
|
||||||
if player_init:
|
|
||||||
player_info = self._parse_json(player_init, display_id, js_to_json)
|
player_info = self._parse_json(player_init, display_id, js_to_json)
|
||||||
media_id = player_info.get('mediaId')
|
media_id = player_info.get('mediaId')
|
||||||
if not media_id:
|
if not media_id:
|
||||||
@ -117,9 +119,20 @@ class CBCIE(InfoExtractor):
|
|||||||
'http://feed.theplatform.com/f/h9dtGB/punlNGjMlc1F?fields=id&byContent=byReleases%3DbyId%253D' + clip_id,
|
'http://feed.theplatform.com/f/h9dtGB/punlNGjMlc1F?fields=id&byContent=byReleases%3DbyId%253D' + clip_id,
|
||||||
clip_id)['entries'][0]['id'].split('/')[-1]
|
clip_id)['entries'][0]['id'].split('/')[-1]
|
||||||
return self.url_result('cbcplayer:%s' % media_id, 'CBCPlayer', media_id)
|
return self.url_result('cbcplayer:%s' % media_id, 'CBCPlayer', media_id)
|
||||||
else:
|
|
||||||
entries = [self.url_result('cbcplayer:%s' % media_id, 'CBCPlayer', media_id) for media_id in re.findall(r'<iframe[^>]+src="[^"]+?mediaId=(\d+)"', webpage)]
|
def _real_extract(self, url):
|
||||||
return self.playlist_result(entries)
|
display_id = self._match_id(url)
|
||||||
|
webpage = self._download_webpage(url, display_id)
|
||||||
|
entries = [
|
||||||
|
self._extract_player_init(player_init, display_id)
|
||||||
|
for player_init in re.findall(r'CBC\.APP\.Caffeine\.initInstance\(({.+?})\);', webpage)]
|
||||||
|
entries.extend([
|
||||||
|
self.url_result('cbcplayer:%s' % media_id, 'CBCPlayer', media_id)
|
||||||
|
for media_id in re.findall(r'<iframe[^>]+src="[^"]+?mediaId=(\d+)"', webpage)])
|
||||||
|
return self.playlist_result(
|
||||||
|
entries, display_id,
|
||||||
|
self._og_search_title(webpage, fatal=False),
|
||||||
|
self._og_search_description(webpage))
|
||||||
|
|
||||||
|
|
||||||
class CBCPlayerIE(InfoExtractor):
|
class CBCPlayerIE(InfoExtractor):
|
||||||
@ -283,11 +296,12 @@ class CBCWatchVideoIE(CBCWatchBaseIE):
|
|||||||
formats = self._extract_m3u8_formats(re.sub(r'/([^/]+)/[^/?]+\.m3u8', r'/\1/\1.m3u8', m3u8_url), video_id, 'mp4', fatal=False)
|
formats = self._extract_m3u8_formats(re.sub(r'/([^/]+)/[^/?]+\.m3u8', r'/\1/\1.m3u8', m3u8_url), video_id, 'mp4', fatal=False)
|
||||||
if len(formats) < 2:
|
if len(formats) < 2:
|
||||||
formats = self._extract_m3u8_formats(m3u8_url, video_id, 'mp4')
|
formats = self._extract_m3u8_formats(m3u8_url, video_id, 'mp4')
|
||||||
# Despite metadata in m3u8 all video+audio formats are
|
|
||||||
# actually video-only (no audio)
|
|
||||||
for f in formats:
|
for f in formats:
|
||||||
if f.get('acodec') != 'none' and f.get('vcodec') != 'none':
|
format_id = f.get('format_id')
|
||||||
f['acodec'] = 'none'
|
if format_id.startswith('AAC'):
|
||||||
|
f['acodec'] = 'aac'
|
||||||
|
elif format_id.startswith('AC3'):
|
||||||
|
f['acodec'] = 'ac-3'
|
||||||
self._sort_formats(formats)
|
self._sort_formats(formats)
|
||||||
|
|
||||||
info = {
|
info = {
|
||||||
|
@ -63,7 +63,7 @@ class CBSInteractiveIE(ThePlatformIE):
|
|||||||
webpage = self._download_webpage(url, display_id)
|
webpage = self._download_webpage(url, display_id)
|
||||||
|
|
||||||
data_json = self._html_search_regex(
|
data_json = self._html_search_regex(
|
||||||
r"data-(?:cnet|zdnet)-video(?:-uvp)?-options='([^']+)'",
|
r"data-(?:cnet|zdnet)-video(?:-uvp(?:js)?)?-options='([^']+)'",
|
||||||
webpage, 'data json')
|
webpage, 'data json')
|
||||||
data = self._parse_json(data_json, display_id)
|
data = self._parse_json(data_json, display_id)
|
||||||
vdata = data.get('video') or data['videos'][0]
|
vdata = data.get('video') or data['videos'][0]
|
||||||
|
@ -4,11 +4,14 @@ from __future__ import unicode_literals
|
|||||||
from .anvato import AnvatoIE
|
from .anvato import AnvatoIE
|
||||||
from .sendtonews import SendtoNewsIE
|
from .sendtonews import SendtoNewsIE
|
||||||
from ..compat import compat_urlparse
|
from ..compat import compat_urlparse
|
||||||
from ..utils import unified_timestamp
|
from ..utils import (
|
||||||
|
parse_iso8601,
|
||||||
|
unified_timestamp,
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
class CBSLocalIE(AnvatoIE):
|
class CBSLocalIE(AnvatoIE):
|
||||||
_VALID_URL = r'https?://[a-z]+\.cbslocal\.com/\d+/\d+/\d+/(?P<id>[0-9a-z-]+)'
|
_VALID_URL = r'https?://[a-z]+\.cbslocal\.com/(?:\d+/\d+/\d+|video)/(?P<id>[0-9a-z-]+)'
|
||||||
|
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
# Anvato backend
|
# Anvato backend
|
||||||
@ -22,6 +25,7 @@ class CBSLocalIE(AnvatoIE):
|
|||||||
'thumbnail': 're:^https?://.*',
|
'thumbnail': 're:^https?://.*',
|
||||||
'timestamp': 1463440500,
|
'timestamp': 1463440500,
|
||||||
'upload_date': '20160516',
|
'upload_date': '20160516',
|
||||||
|
'uploader': 'CBS',
|
||||||
'subtitles': {
|
'subtitles': {
|
||||||
'en': 'mincount:5',
|
'en': 'mincount:5',
|
||||||
},
|
},
|
||||||
@ -35,6 +39,7 @@ class CBSLocalIE(AnvatoIE):
|
|||||||
'Syndication\\Curb.tv',
|
'Syndication\\Curb.tv',
|
||||||
'Content\\News'
|
'Content\\News'
|
||||||
],
|
],
|
||||||
|
'tags': ['CBS 2 News Evening'],
|
||||||
},
|
},
|
||||||
}, {
|
}, {
|
||||||
# SendtoNews embed
|
# SendtoNews embed
|
||||||
@ -47,6 +52,31 @@ class CBSLocalIE(AnvatoIE):
|
|||||||
# m3u8 download
|
# m3u8 download
|
||||||
'skip_download': True,
|
'skip_download': True,
|
||||||
},
|
},
|
||||||
|
}, {
|
||||||
|
'url': 'http://newyork.cbslocal.com/video/3580809-a-very-blue-anniversary/',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '3580809',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'A Very Blue Anniversary',
|
||||||
|
'description': 'CBS2’s Cindy Hsu has more.',
|
||||||
|
'thumbnail': 're:^https?://.*',
|
||||||
|
'timestamp': 1479962220,
|
||||||
|
'upload_date': '20161124',
|
||||||
|
'uploader': 'CBS',
|
||||||
|
'subtitles': {
|
||||||
|
'en': 'mincount:5',
|
||||||
|
},
|
||||||
|
'categories': [
|
||||||
|
'Stations\\Spoken Word\\WCBSTV',
|
||||||
|
'Syndication\\AOL',
|
||||||
|
'Syndication\\MSN',
|
||||||
|
'Syndication\\NDN',
|
||||||
|
'Syndication\\Yahoo',
|
||||||
|
'Content\\News',
|
||||||
|
'Content\\News\\Local News',
|
||||||
|
],
|
||||||
|
'tags': ['CBS 2 News Weekends', 'Cindy Hsu', 'Blue Man Group'],
|
||||||
|
},
|
||||||
}]
|
}]
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
@ -62,8 +92,11 @@ class CBSLocalIE(AnvatoIE):
|
|||||||
info_dict = self._extract_anvato_videos(webpage, display_id)
|
info_dict = self._extract_anvato_videos(webpage, display_id)
|
||||||
|
|
||||||
time_str = self._html_search_regex(
|
time_str = self._html_search_regex(
|
||||||
r'class="entry-date">([^<]+)<', webpage, 'released date', fatal=False)
|
r'class="entry-date">([^<]+)<', webpage, 'released date', default=None)
|
||||||
|
if time_str:
|
||||||
timestamp = unified_timestamp(time_str)
|
timestamp = unified_timestamp(time_str)
|
||||||
|
else:
|
||||||
|
timestamp = parse_iso8601(self._html_search_meta('uploadDate', webpage))
|
||||||
|
|
||||||
info_dict.update({
|
info_dict.update({
|
||||||
'display_id': display_id,
|
'display_id': display_id,
|
||||||
|
@ -39,7 +39,7 @@ class CBSNewsIE(CBSIE):
|
|||||||
'upload_date': '20140404',
|
'upload_date': '20140404',
|
||||||
'timestamp': 1396650660,
|
'timestamp': 1396650660,
|
||||||
'uploader': 'CBSI-NEW',
|
'uploader': 'CBSI-NEW',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
'duration': 205,
|
'duration': 205,
|
||||||
'subtitles': {
|
'subtitles': {
|
||||||
'en': [{
|
'en': [{
|
||||||
|
@ -19,7 +19,7 @@ class CCCIE(InfoExtractor):
|
|||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Introduction to Processor Design',
|
'title': 'Introduction to Processor Design',
|
||||||
'description': 'md5:df55f6d073d4ceae55aae6f2fd98a0ac',
|
'description': 'md5:df55f6d073d4ceae55aae6f2fd98a0ac',
|
||||||
'thumbnail': 're:^https?://.*\.jpg$',
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
'upload_date': '20131228',
|
'upload_date': '20131228',
|
||||||
'timestamp': 1388188800,
|
'timestamp': 1388188800,
|
||||||
'duration': 3710,
|
'duration': 3710,
|
||||||
@ -32,7 +32,7 @@ class CCCIE(InfoExtractor):
|
|||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
display_id = self._match_id(url)
|
display_id = self._match_id(url)
|
||||||
webpage = self._download_webpage(url, display_id)
|
webpage = self._download_webpage(url, display_id)
|
||||||
event_id = self._search_regex("data-id='(\d+)'", webpage, 'event id')
|
event_id = self._search_regex(r"data-id='(\d+)'", webpage, 'event id')
|
||||||
event_data = self._download_json('https://media.ccc.de/public/events/%s' % event_id, event_id)
|
event_data = self._download_json('https://media.ccc.de/public/events/%s' % event_id, event_id)
|
||||||
|
|
||||||
formats = []
|
formats = []
|
||||||
|
99
youtube_dl/extractor/ccma.py
Normal file
99
youtube_dl/extractor/ccma.py
Normal file
@ -0,0 +1,99 @@
|
|||||||
|
# coding: utf-8
|
||||||
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
|
import re
|
||||||
|
|
||||||
|
from .common import InfoExtractor
|
||||||
|
from ..utils import (
|
||||||
|
int_or_none,
|
||||||
|
parse_duration,
|
||||||
|
parse_iso8601,
|
||||||
|
clean_html,
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
|
class CCMAIE(InfoExtractor):
|
||||||
|
_VALID_URL = r'https?://(?:www\.)?ccma\.cat/(?:[^/]+/)*?(?P<type>video|audio)/(?P<id>\d+)'
|
||||||
|
_TESTS = [{
|
||||||
|
'url': 'http://www.ccma.cat/tv3/alacarta/lespot-de-la-marato-de-tv3/lespot-de-la-marato-de-tv3/video/5630208/',
|
||||||
|
'md5': '7296ca43977c8ea4469e719c609b0871',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '5630208',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'L\'espot de La Marató de TV3',
|
||||||
|
'description': 'md5:f12987f320e2f6e988e9908e4fe97765',
|
||||||
|
'timestamp': 1470918540,
|
||||||
|
'upload_date': '20160811',
|
||||||
|
}
|
||||||
|
}, {
|
||||||
|
'url': 'http://www.ccma.cat/catradio/alacarta/programa/el-consell-de-savis-analitza-el-derbi/audio/943685/',
|
||||||
|
'md5': 'fa3e38f269329a278271276330261425',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '943685',
|
||||||
|
'ext': 'mp3',
|
||||||
|
'title': 'El Consell de Savis analitza el derbi',
|
||||||
|
'description': 'md5:e2a3648145f3241cb9c6b4b624033e53',
|
||||||
|
'upload_date': '20171205',
|
||||||
|
'timestamp': 1512507300,
|
||||||
|
}
|
||||||
|
}]
|
||||||
|
|
||||||
|
def _real_extract(self, url):
|
||||||
|
media_type, media_id = re.match(self._VALID_URL, url).groups()
|
||||||
|
media_data = {}
|
||||||
|
formats = []
|
||||||
|
profiles = ['pc'] if media_type == 'audio' else ['mobil', 'pc']
|
||||||
|
for i, profile in enumerate(profiles):
|
||||||
|
md = self._download_json('http://dinamics.ccma.cat/pvideo/media.jsp', media_id, query={
|
||||||
|
'media': media_type,
|
||||||
|
'idint': media_id,
|
||||||
|
'profile': profile,
|
||||||
|
}, fatal=False)
|
||||||
|
if md:
|
||||||
|
media_data = md
|
||||||
|
media_url = media_data.get('media', {}).get('url')
|
||||||
|
if media_url:
|
||||||
|
formats.append({
|
||||||
|
'format_id': profile,
|
||||||
|
'url': media_url,
|
||||||
|
'quality': i,
|
||||||
|
})
|
||||||
|
self._sort_formats(formats)
|
||||||
|
|
||||||
|
informacio = media_data['informacio']
|
||||||
|
title = informacio['titol']
|
||||||
|
durada = informacio.get('durada', {})
|
||||||
|
duration = int_or_none(durada.get('milisegons'), 1000) or parse_duration(durada.get('text'))
|
||||||
|
timestamp = parse_iso8601(informacio.get('data_emissio', {}).get('utc'))
|
||||||
|
|
||||||
|
subtitles = {}
|
||||||
|
subtitols = media_data.get('subtitols', {})
|
||||||
|
if subtitols:
|
||||||
|
sub_url = subtitols.get('url')
|
||||||
|
if sub_url:
|
||||||
|
subtitles.setdefault(
|
||||||
|
subtitols.get('iso') or subtitols.get('text') or 'ca', []).append({
|
||||||
|
'url': sub_url,
|
||||||
|
})
|
||||||
|
|
||||||
|
thumbnails = []
|
||||||
|
imatges = media_data.get('imatges', {})
|
||||||
|
if imatges:
|
||||||
|
thumbnail_url = imatges.get('url')
|
||||||
|
if thumbnail_url:
|
||||||
|
thumbnails = [{
|
||||||
|
'url': thumbnail_url,
|
||||||
|
'width': int_or_none(imatges.get('amplada')),
|
||||||
|
'height': int_or_none(imatges.get('alcada')),
|
||||||
|
}]
|
||||||
|
|
||||||
|
return {
|
||||||
|
'id': media_id,
|
||||||
|
'title': title,
|
||||||
|
'description': clean_html(informacio.get('descripcio')),
|
||||||
|
'duration': duration,
|
||||||
|
'timestamp': timestamp,
|
||||||
|
'thumnails': thumbnails,
|
||||||
|
'subtitles': subtitles,
|
||||||
|
'formats': formats,
|
||||||
|
}
|
@ -4,50 +4,188 @@ from __future__ import unicode_literals
|
|||||||
import re
|
import re
|
||||||
|
|
||||||
from .common import InfoExtractor
|
from .common import InfoExtractor
|
||||||
from ..utils import float_or_none
|
from ..compat import compat_str
|
||||||
|
from ..utils import (
|
||||||
|
float_or_none,
|
||||||
|
try_get,
|
||||||
|
unified_timestamp,
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
class CCTVIE(InfoExtractor):
|
class CCTVIE(InfoExtractor):
|
||||||
_VALID_URL = r'''(?x)https?://(?:.+?\.)?
|
IE_DESC = '央视网'
|
||||||
(?:
|
_VALID_URL = r'https?://(?:(?:[^/]+)\.(?:cntv|cctv)\.(?:com|cn)|(?:www\.)?ncpa-classic\.com)/(?:[^/]+/)*?(?P<id>[^/?#&]+?)(?:/index)?(?:\.s?html|[?#&]|$)'
|
||||||
cctv\.(?:com|cn)|
|
|
||||||
cntv\.cn
|
|
||||||
)/
|
|
||||||
(?:
|
|
||||||
video/[^/]+/(?P<id>[0-9a-f]{32})|
|
|
||||||
\d{4}/\d{2}/\d{2}/(?P<display_id>VID[0-9A-Za-z]+)
|
|
||||||
)'''
|
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'http://english.cntv.cn/2016/09/03/VIDEhnkB5y9AgHyIEVphCEz1160903.shtml',
|
# fo.addVariable("videoCenterId","id")
|
||||||
'md5': '819c7b49fc3927d529fb4cd555621823',
|
'url': 'http://sports.cntv.cn/2016/02/12/ARTIaBRxv4rTT1yWf1frW2wi160212.shtml',
|
||||||
|
'md5': 'd61ec00a493e09da810bf406a078f691',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '454368eb19ad44a1925bf1eb96140a61',
|
'id': '5ecdbeab623f4973b40ff25f18b174e8',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Portrait of Real Current Life 09/03/2016 Modern Inventors Part 1',
|
'title': '[NBA]二少联手砍下46分 雷霆主场击败鹈鹕(快讯)',
|
||||||
}
|
'description': 'md5:7e14a5328dc5eb3d1cd6afbbe0574e95',
|
||||||
|
'duration': 98,
|
||||||
|
'uploader': 'songjunjie',
|
||||||
|
'timestamp': 1455279956,
|
||||||
|
'upload_date': '20160212',
|
||||||
|
},
|
||||||
|
}, {
|
||||||
|
# var guid = "id"
|
||||||
|
'url': 'http://tv.cctv.com/2016/02/05/VIDEUS7apq3lKrHG9Dncm03B160205.shtml',
|
||||||
|
'info_dict': {
|
||||||
|
'id': 'efc5d49e5b3b4ab2b34f3a502b73d3ae',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': '[赛车]“车王”舒马赫恢复情况成谜(快讯)',
|
||||||
|
'description': '2月4日,蒙特泽莫罗透露了关于“车王”舒马赫恢复情况,但情况是否属实遭到了质疑。',
|
||||||
|
'duration': 37,
|
||||||
|
'uploader': 'shujun',
|
||||||
|
'timestamp': 1454677291,
|
||||||
|
'upload_date': '20160205',
|
||||||
|
},
|
||||||
|
'params': {
|
||||||
|
'skip_download': True,
|
||||||
|
},
|
||||||
|
}, {
|
||||||
|
# changePlayer('id')
|
||||||
|
'url': 'http://english.cntv.cn/special/four_comprehensives/index.shtml',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '4bb9bb4db7a6471ba85fdeda5af0381e',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'NHnews008 ANNUAL POLITICAL SEASON',
|
||||||
|
'description': 'Four Comprehensives',
|
||||||
|
'duration': 60,
|
||||||
|
'uploader': 'zhangyunlei',
|
||||||
|
'timestamp': 1425385521,
|
||||||
|
'upload_date': '20150303',
|
||||||
|
},
|
||||||
|
'params': {
|
||||||
|
'skip_download': True,
|
||||||
|
},
|
||||||
|
}, {
|
||||||
|
# loadvideo('id')
|
||||||
|
'url': 'http://cctv.cntv.cn/lm/tvseries_russian/yilugesanghua/index.shtml',
|
||||||
|
'info_dict': {
|
||||||
|
'id': 'b15f009ff45c43968b9af583fc2e04b2',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': 'Путь,усыпанный космеями Серия 1',
|
||||||
|
'description': 'Путь, усыпанный космеями',
|
||||||
|
'duration': 2645,
|
||||||
|
'uploader': 'renxue',
|
||||||
|
'timestamp': 1477479241,
|
||||||
|
'upload_date': '20161026',
|
||||||
|
},
|
||||||
|
'params': {
|
||||||
|
'skip_download': True,
|
||||||
|
},
|
||||||
|
}, {
|
||||||
|
# var initMyAray = 'id'
|
||||||
|
'url': 'http://www.ncpa-classic.com/2013/05/22/VIDE1369219508996867.shtml',
|
||||||
|
'info_dict': {
|
||||||
|
'id': 'a194cfa7f18c426b823d876668325946',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'title': '小泽征尔音乐塾 音乐梦想无国界',
|
||||||
|
'duration': 2173,
|
||||||
|
'timestamp': 1369248264,
|
||||||
|
'upload_date': '20130522',
|
||||||
|
},
|
||||||
|
'params': {
|
||||||
|
'skip_download': True,
|
||||||
|
},
|
||||||
|
}, {
|
||||||
|
# var ids = ["id"]
|
||||||
|
'url': 'http://www.ncpa-classic.com/clt/more/416/index.shtml',
|
||||||
|
'info_dict': {
|
||||||
|
'id': 'a8606119a4884588a79d81c02abecc16',
|
||||||
|
'ext': 'mp3',
|
||||||
|
'title': '来自维也纳的新年贺礼',
|
||||||
|
'description': 'md5:f13764ae8dd484e84dd4b39d5bcba2a7',
|
||||||
|
'duration': 1578,
|
||||||
|
'uploader': 'djy',
|
||||||
|
'timestamp': 1482942419,
|
||||||
|
'upload_date': '20161228',
|
||||||
|
},
|
||||||
|
'params': {
|
||||||
|
'skip_download': True,
|
||||||
|
},
|
||||||
|
'expected_warnings': ['Failed to download m3u8 information'],
|
||||||
|
}, {
|
||||||
|
'url': 'http://ent.cntv.cn/2016/01/18/ARTIjprSSJH8DryTVr5Bx8Wb160118.shtml',
|
||||||
|
'only_matching': True,
|
||||||
|
}, {
|
||||||
|
'url': 'http://tv.cntv.cn/video/C39296/e0210d949f113ddfb38d31f00a4e5c44',
|
||||||
|
'only_matching': True,
|
||||||
|
}, {
|
||||||
|
'url': 'http://english.cntv.cn/2016/09/03/VIDEhnkB5y9AgHyIEVphCEz1160903.shtml',
|
||||||
|
'only_matching': True,
|
||||||
}, {
|
}, {
|
||||||
'url': 'http://tv.cctv.com/2016/09/07/VIDE5C1FnlX5bUywlrjhxXOV160907.shtml',
|
'url': 'http://tv.cctv.com/2016/09/07/VIDE5C1FnlX5bUywlrjhxXOV160907.shtml',
|
||||||
'only_matching': True,
|
'only_matching': True,
|
||||||
}, {
|
}, {
|
||||||
'url': 'http://tv.cntv.cn/video/C39296/95cfac44cabd3ddc4a9438780a4e5c44',
|
'url': 'http://tv.cntv.cn/video/C39296/95cfac44cabd3ddc4a9438780a4e5c44',
|
||||||
'only_matching': True
|
'only_matching': True,
|
||||||
}]
|
}]
|
||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
video_id, display_id = re.match(self._VALID_URL, url).groups()
|
video_id = self._match_id(url)
|
||||||
if not video_id:
|
webpage = self._download_webpage(url, video_id)
|
||||||
webpage = self._download_webpage(url, display_id)
|
|
||||||
video_id = self._search_regex(
|
video_id = self._search_regex(
|
||||||
r'(?:fo\.addVariable\("videoCenterId",\s*|guid\s*=\s*)"([0-9a-f]{32})',
|
[r'var\s+guid\s*=\s*["\']([\da-fA-F]+)',
|
||||||
webpage, 'video_id')
|
r'videoCenterId["\']\s*,\s*["\']([\da-fA-F]+)',
|
||||||
api_data = self._download_json(
|
r'changePlayer\s*\(\s*["\']([\da-fA-F]+)',
|
||||||
'http://vdn.apps.cntv.cn/api/getHttpVideoInfo.do?pid=' + video_id, video_id)
|
r'load[Vv]ideo\s*\(\s*["\']([\da-fA-F]+)',
|
||||||
m3u8_url = re.sub(r'maxbr=\d+&?', '', api_data['hls_url'])
|
r'var\s+initMyAray\s*=\s*["\']([\da-fA-F]+)',
|
||||||
|
r'var\s+ids\s*=\s*\[["\']([\da-fA-F]+)'],
|
||||||
|
webpage, 'video id')
|
||||||
|
|
||||||
|
data = self._download_json(
|
||||||
|
'http://vdn.apps.cntv.cn/api/getHttpVideoInfo.do', video_id,
|
||||||
|
query={
|
||||||
|
'pid': video_id,
|
||||||
|
'url': url,
|
||||||
|
'idl': 32,
|
||||||
|
'idlr': 32,
|
||||||
|
'modifyed': 'false',
|
||||||
|
})
|
||||||
|
|
||||||
|
title = data['title']
|
||||||
|
|
||||||
|
formats = []
|
||||||
|
|
||||||
|
video = data.get('video')
|
||||||
|
if isinstance(video, dict):
|
||||||
|
for quality, chapters_key in enumerate(('lowChapters', 'chapters')):
|
||||||
|
video_url = try_get(
|
||||||
|
video, lambda x: x[chapters_key][0]['url'], compat_str)
|
||||||
|
if video_url:
|
||||||
|
formats.append({
|
||||||
|
'url': video_url,
|
||||||
|
'format_id': 'http',
|
||||||
|
'quality': quality,
|
||||||
|
'preference': -1,
|
||||||
|
})
|
||||||
|
|
||||||
|
hls_url = try_get(data, lambda x: x['hls_url'], compat_str)
|
||||||
|
if hls_url:
|
||||||
|
hls_url = re.sub(r'maxbr=\d+&?', '', hls_url)
|
||||||
|
formats.extend(self._extract_m3u8_formats(
|
||||||
|
hls_url, video_id, 'mp4', entry_protocol='m3u8_native',
|
||||||
|
m3u8_id='hls', fatal=False))
|
||||||
|
|
||||||
|
self._sort_formats(formats)
|
||||||
|
|
||||||
|
uploader = data.get('editer_name')
|
||||||
|
description = self._html_search_meta(
|
||||||
|
'description', webpage, default=None)
|
||||||
|
timestamp = unified_timestamp(data.get('f_pgmtime'))
|
||||||
|
duration = float_or_none(try_get(video, lambda x: x['totalLength']))
|
||||||
|
|
||||||
return {
|
return {
|
||||||
'id': video_id,
|
'id': video_id,
|
||||||
'title': api_data['title'],
|
'title': title,
|
||||||
'formats': self._extract_m3u8_formats(
|
'description': description,
|
||||||
m3u8_url, video_id, 'mp4', 'm3u8_native', fatal=False),
|
'uploader': uploader,
|
||||||
'duration': float_or_none(api_data.get('video', {}).get('totalLength')),
|
'timestamp': timestamp,
|
||||||
|
'duration': duration,
|
||||||
|
'formats': formats,
|
||||||
}
|
}
|
||||||
|
@ -1,18 +1,21 @@
|
|||||||
# coding: utf-8
|
# coding: utf-8
|
||||||
from __future__ import unicode_literals
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
|
import codecs
|
||||||
import re
|
import re
|
||||||
|
|
||||||
from .common import InfoExtractor
|
from .common import InfoExtractor
|
||||||
from ..utils import (
|
from ..utils import (
|
||||||
decode_packed_codes,
|
|
||||||
ExtractorError,
|
ExtractorError,
|
||||||
parse_duration
|
float_or_none,
|
||||||
|
int_or_none,
|
||||||
|
parse_duration,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
class CDAIE(InfoExtractor):
|
class CDAIE(InfoExtractor):
|
||||||
_VALID_URL = r'https?://(?:(?:www\.)?cda\.pl/video|ebd\.cda\.pl/[0-9]+x[0-9]+)/(?P<id>[0-9a-z]+)'
|
_VALID_URL = r'https?://(?:(?:www\.)?cda\.pl/video|ebd\.cda\.pl/[0-9]+x[0-9]+)/(?P<id>[0-9a-z]+)'
|
||||||
|
_BASE_URL = 'http://www.cda.pl/'
|
||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'http://www.cda.pl/video/5749950c',
|
'url': 'http://www.cda.pl/video/5749950c',
|
||||||
'md5': '6f844bf51b15f31fae165365707ae970',
|
'md5': '6f844bf51b15f31fae165365707ae970',
|
||||||
@ -21,6 +24,9 @@ class CDAIE(InfoExtractor):
|
|||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'height': 720,
|
'height': 720,
|
||||||
'title': 'Oto dlaczego przed zakrętem należy zwolnić.',
|
'title': 'Oto dlaczego przed zakrętem należy zwolnić.',
|
||||||
|
'description': 'md5:269ccd135d550da90d1662651fcb9772',
|
||||||
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
|
'average_rating': float,
|
||||||
'duration': 39
|
'duration': 39
|
||||||
}
|
}
|
||||||
}, {
|
}, {
|
||||||
@ -30,6 +36,11 @@ class CDAIE(InfoExtractor):
|
|||||||
'id': '57413289',
|
'id': '57413289',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Lądowanie na lotnisku na Maderze',
|
'title': 'Lądowanie na lotnisku na Maderze',
|
||||||
|
'description': 'md5:60d76b71186dcce4e0ba6d4bbdb13e1a',
|
||||||
|
'thumbnail': r're:^https?://.*\.jpg$',
|
||||||
|
'uploader': 'crash404',
|
||||||
|
'view_count': int,
|
||||||
|
'average_rating': float,
|
||||||
'duration': 137
|
'duration': 137
|
||||||
}
|
}
|
||||||
}, {
|
}, {
|
||||||
@ -39,31 +50,59 @@ class CDAIE(InfoExtractor):
|
|||||||
|
|
||||||
def _real_extract(self, url):
|
def _real_extract(self, url):
|
||||||
video_id = self._match_id(url)
|
video_id = self._match_id(url)
|
||||||
webpage = self._download_webpage('http://ebd.cda.pl/0x0/' + video_id, video_id)
|
self._set_cookie('cda.pl', 'cda.player', 'html5')
|
||||||
|
webpage = self._download_webpage(
|
||||||
|
self._BASE_URL + '/video/' + video_id, video_id)
|
||||||
|
|
||||||
if 'Ten film jest dostępny dla użytkowników premium' in webpage:
|
if 'Ten film jest dostępny dla użytkowników premium' in webpage:
|
||||||
raise ExtractorError('This video is only available for premium users.', expected=True)
|
raise ExtractorError('This video is only available for premium users.', expected=True)
|
||||||
|
|
||||||
title = self._html_search_regex(r'<title>(.+?)</title>', webpage, 'title')
|
|
||||||
|
|
||||||
formats = []
|
formats = []
|
||||||
|
|
||||||
|
uploader = self._search_regex(r'''(?x)
|
||||||
|
<(span|meta)[^>]+itemprop=(["\'])author\2[^>]*>
|
||||||
|
(?:<\1[^>]*>[^<]*</\1>|(?!</\1>)(?:.|\n))*?
|
||||||
|
<(span|meta)[^>]+itemprop=(["\'])name\4[^>]*>(?P<uploader>[^<]+)</\3>
|
||||||
|
''', webpage, 'uploader', default=None, group='uploader')
|
||||||
|
view_count = self._search_regex(
|
||||||
|
r'Odsłony:(?:\s| )*([0-9]+)', webpage,
|
||||||
|
'view_count', default=None)
|
||||||
|
average_rating = self._search_regex(
|
||||||
|
r'<(?:span|meta)[^>]+itemprop=(["\'])ratingValue\1[^>]*>(?P<rating_value>[0-9.]+)',
|
||||||
|
webpage, 'rating', fatal=False, group='rating_value')
|
||||||
|
|
||||||
info_dict = {
|
info_dict = {
|
||||||
'id': video_id,
|
'id': video_id,
|
||||||
'title': title,
|
'title': self._og_search_title(webpage),
|
||||||
|
'description': self._og_search_description(webpage),
|
||||||
|
'uploader': uploader,
|
||||||
|
'view_count': int_or_none(view_count),
|
||||||
|
'average_rating': float_or_none(average_rating),
|
||||||
|
'thumbnail': self._og_search_thumbnail(webpage),
|
||||||
'formats': formats,
|
'formats': formats,
|
||||||
'duration': None,
|
'duration': None,
|
||||||
}
|
}
|
||||||
|
|
||||||
def extract_format(page, version):
|
def extract_format(page, version):
|
||||||
unpacked = decode_packed_codes(page)
|
json_str = self._search_regex(
|
||||||
format_url = self._search_regex(
|
r'player_data=(\\?["\'])(?P<player_data>.+?)\1', page,
|
||||||
r"(?:file|url)\s*:\s*(\\?[\"'])(?P<url>http.+?)\1", unpacked,
|
'%s player_json' % version, fatal=False, group='player_data')
|
||||||
'%s url' % version, fatal=False, group='url')
|
if not json_str:
|
||||||
if not format_url:
|
|
||||||
return
|
return
|
||||||
|
player_data = self._parse_json(
|
||||||
|
json_str, '%s player_data' % version, fatal=False)
|
||||||
|
if not player_data:
|
||||||
|
return
|
||||||
|
video = player_data.get('video')
|
||||||
|
if not video or 'file' not in video:
|
||||||
|
self.report_warning('Unable to extract %s version information' % version)
|
||||||
|
return
|
||||||
|
if video['file'].startswith('uggc'):
|
||||||
|
video['file'] = codecs.decode(video['file'], 'rot_13')
|
||||||
|
if video['file'].endswith('adc.mp4'):
|
||||||
|
video['file'] = video['file'].replace('adc.mp4', '.mp4')
|
||||||
f = {
|
f = {
|
||||||
'url': format_url,
|
'url': video['file'],
|
||||||
}
|
}
|
||||||
m = re.search(
|
m = re.search(
|
||||||
r'<a[^>]+data-quality="(?P<format_id>[^"]+)"[^>]+href="[^"]+"[^>]+class="[^"]*quality-btn-active[^"]*">(?P<height>[0-9]+)p',
|
r'<a[^>]+data-quality="(?P<format_id>[^"]+)"[^>]+href="[^"]+"[^>]+class="[^"]*quality-btn-active[^"]*">(?P<height>[0-9]+)p',
|
||||||
@ -75,9 +114,7 @@ class CDAIE(InfoExtractor):
|
|||||||
})
|
})
|
||||||
info_dict['formats'].append(f)
|
info_dict['formats'].append(f)
|
||||||
if not info_dict['duration']:
|
if not info_dict['duration']:
|
||||||
info_dict['duration'] = parse_duration(self._search_regex(
|
info_dict['duration'] = parse_duration(video.get('duration'))
|
||||||
r"duration\s*:\s*(\\?[\"'])(?P<duration>.+?)\1",
|
|
||||||
unpacked, 'duration', fatal=False, group='duration'))
|
|
||||||
|
|
||||||
extract_format(webpage, 'default')
|
extract_format(webpage, 'default')
|
||||||
|
|
||||||
@ -85,7 +122,8 @@ class CDAIE(InfoExtractor):
|
|||||||
r'<a[^>]+data-quality="[^"]+"[^>]+href="([^"]+)"[^>]+class="quality-btn"[^>]*>([0-9]+p)',
|
r'<a[^>]+data-quality="[^"]+"[^>]+href="([^"]+)"[^>]+class="quality-btn"[^>]*>([0-9]+p)',
|
||||||
webpage):
|
webpage):
|
||||||
webpage = self._download_webpage(
|
webpage = self._download_webpage(
|
||||||
href, video_id, 'Downloading %s version information' % resolution, fatal=False)
|
self._BASE_URL + href, video_id,
|
||||||
|
'Downloading %s version information' % resolution, fatal=False)
|
||||||
if not webpage:
|
if not webpage:
|
||||||
# Manually report warning because empty page is returned when
|
# Manually report warning because empty page is returned when
|
||||||
# invalid version is requested.
|
# invalid version is requested.
|
||||||
|
@ -13,6 +13,7 @@ from ..utils import (
|
|||||||
float_or_none,
|
float_or_none,
|
||||||
sanitized_Request,
|
sanitized_Request,
|
||||||
urlencode_postdata,
|
urlencode_postdata,
|
||||||
|
USER_AGENTS,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
@ -21,11 +22,11 @@ class CeskaTelevizeIE(InfoExtractor):
|
|||||||
_TESTS = [{
|
_TESTS = [{
|
||||||
'url': 'http://www.ceskatelevize.cz/ivysilani/ivysilani/10441294653-hyde-park-civilizace/214411058091220',
|
'url': 'http://www.ceskatelevize.cz/ivysilani/ivysilani/10441294653-hyde-park-civilizace/214411058091220',
|
||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': '61924494876951776',
|
'id': '61924494877246241',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Hyde Park Civilizace',
|
'title': 'Hyde Park Civilizace: Život v Grónsku',
|
||||||
'description': 'md5:fe93f6eda372d150759d11644ebbfb4a',
|
'description': 'md5:3fec8f6bb497be5cdb0c9e8781076626',
|
||||||
'thumbnail': 're:^https?://.*\.jpg',
|
'thumbnail': r're:^https?://.*\.jpg',
|
||||||
'duration': 3350,
|
'duration': 3350,
|
||||||
},
|
},
|
||||||
'params': {
|
'params': {
|
||||||
@ -39,7 +40,7 @@ class CeskaTelevizeIE(InfoExtractor):
|
|||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Hyde Park Civilizace: Bonus 01 - En',
|
'title': 'Hyde Park Civilizace: Bonus 01 - En',
|
||||||
'description': 'English Subtittles',
|
'description': 'English Subtittles',
|
||||||
'thumbnail': 're:^https?://.*\.jpg',
|
'thumbnail': r're:^https?://.*\.jpg',
|
||||||
'duration': 81.3,
|
'duration': 81.3,
|
||||||
},
|
},
|
||||||
'params': {
|
'params': {
|
||||||
@ -52,7 +53,7 @@ class CeskaTelevizeIE(InfoExtractor):
|
|||||||
'info_dict': {
|
'info_dict': {
|
||||||
'id': 402,
|
'id': 402,
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 're:^ČT Sport \d{4}-\d{2}-\d{2} \d{2}:\d{2}$',
|
'title': r're:^ČT Sport \d{4}-\d{2}-\d{2} \d{2}:\d{2}$',
|
||||||
'is_live': True,
|
'is_live': True,
|
||||||
},
|
},
|
||||||
'params': {
|
'params': {
|
||||||
@ -80,7 +81,7 @@ class CeskaTelevizeIE(InfoExtractor):
|
|||||||
'id': '61924494877068022',
|
'id': '61924494877068022',
|
||||||
'ext': 'mp4',
|
'ext': 'mp4',
|
||||||
'title': 'Queer: Bogotart (Queer)',
|
'title': 'Queer: Bogotart (Queer)',
|
||||||
'thumbnail': 're:^https?://.*\.jpg',
|
'thumbnail': r're:^https?://.*\.jpg',
|
||||||
'duration': 1558.3,
|
'duration': 1558.3,
|
||||||
},
|
},
|
||||||
}],
|
}],
|
||||||
@ -114,6 +115,9 @@ class CeskaTelevizeIE(InfoExtractor):
|
|||||||
'requestSource': 'iVysilani',
|
'requestSource': 'iVysilani',
|
||||||
}
|
}
|
||||||
|
|
||||||
|
entries = []
|
||||||
|
|
||||||
|
for user_agent in (None, USER_AGENTS['Safari']):
|
||||||
req = sanitized_Request(
|
req = sanitized_Request(
|
||||||
'http://www.ceskatelevize.cz/ivysilani/ajax/get-client-playlist',
|
'http://www.ceskatelevize.cz/ivysilani/ajax/get-client-playlist',
|
||||||
data=urlencode_postdata(data))
|
data=urlencode_postdata(data))
|
||||||
@ -121,9 +125,14 @@ class CeskaTelevizeIE(InfoExtractor):
|
|||||||
req.add_header('Content-type', 'application/x-www-form-urlencoded')
|
req.add_header('Content-type', 'application/x-www-form-urlencoded')
|
||||||
req.add_header('x-addr', '127.0.0.1')
|
req.add_header('x-addr', '127.0.0.1')
|
||||||
req.add_header('X-Requested-With', 'XMLHttpRequest')
|
req.add_header('X-Requested-With', 'XMLHttpRequest')
|
||||||
|
if user_agent:
|
||||||
|
req.add_header('User-Agent', user_agent)
|
||||||
req.add_header('Referer', url)
|
req.add_header('Referer', url)
|
||||||
|
|
||||||
playlistpage = self._download_json(req, playlist_id)
|
playlistpage = self._download_json(req, playlist_id, fatal=False)
|
||||||
|
|
||||||
|
if not playlistpage:
|
||||||
|
continue
|
||||||
|
|
||||||
playlist_url = playlistpage['url']
|
playlist_url = playlistpage['url']
|
||||||
if playlist_url == 'error_region':
|
if playlist_url == 'error_region':
|
||||||
@ -135,19 +144,38 @@ class CeskaTelevizeIE(InfoExtractor):
|
|||||||
playlist_title = self._og_search_title(webpage, default=None)
|
playlist_title = self._og_search_title(webpage, default=None)
|
||||||
playlist_description = self._og_search_description(webpage, default=None)
|
playlist_description = self._og_search_description(webpage, default=None)
|
||||||
|
|
||||||
playlist = self._download_json(req, playlist_id)['playlist']
|
playlist = self._download_json(req, playlist_id, fatal=False)
|
||||||
|
if not playlist:
|
||||||
|
continue
|
||||||
|
|
||||||
|
playlist = playlist.get('playlist')
|
||||||
|
if not isinstance(playlist, list):
|
||||||
|
continue
|
||||||
|
|
||||||
playlist_len = len(playlist)
|
playlist_len = len(playlist)
|
||||||
|
|
||||||
entries = []
|
for num, item in enumerate(playlist):
|
||||||
for item in playlist:
|
|
||||||
is_live = item.get('type') == 'LIVE'
|
is_live = item.get('type') == 'LIVE'
|
||||||
formats = []
|
formats = []
|
||||||
for format_id, stream_url in item['streamUrls'].items():
|
for format_id, stream_url in item.get('streamUrls', {}).items():
|
||||||
formats.extend(self._extract_m3u8_formats(
|
if 'playerType=flash' in stream_url:
|
||||||
|
stream_formats = self._extract_m3u8_formats(
|
||||||
stream_url, playlist_id, 'mp4',
|
stream_url, playlist_id, 'mp4',
|
||||||
entry_protocol='m3u8' if is_live else 'm3u8_native',
|
entry_protocol='m3u8' if is_live else 'm3u8_native',
|
||||||
fatal=False))
|
m3u8_id='hls-%s' % format_id, fatal=False)
|
||||||
self._sort_formats(formats)
|
else:
|
||||||
|
stream_formats = self._extract_mpd_formats(
|
||||||
|
stream_url, playlist_id,
|
||||||
|
mpd_id='dash-%s' % format_id, fatal=False)
|
||||||
|
# See https://github.com/rg3/youtube-dl/issues/12119#issuecomment-280037031
|
||||||
|
if format_id == 'audioDescription':
|
||||||
|
for f in stream_formats:
|
||||||
|
f['source_preference'] = -10
|
||||||
|
formats.extend(stream_formats)
|
||||||
|
|
||||||
|
if user_agent and len(entries) == playlist_len:
|
||||||
|
entries[num]['formats'].extend(formats)
|
||||||
|
continue
|
||||||
|
|
||||||
item_id = item.get('id') or item['assetId']
|
item_id = item.get('id') or item['assetId']
|
||||||
title = item['title']
|
title = item['title']
|
||||||
@ -179,6 +207,9 @@ class CeskaTelevizeIE(InfoExtractor):
|
|||||||
'is_live': is_live,
|
'is_live': is_live,
|
||||||
})
|
})
|
||||||
|
|
||||||
|
for e in entries:
|
||||||
|
self._sort_formats(e['formats'])
|
||||||
|
|
||||||
return self.playlist_result(entries, playlist_id, playlist_title, playlist_description)
|
return self.playlist_result(entries, playlist_id, playlist_title, playlist_description)
|
||||||
|
|
||||||
def _get_subtitles(self, episode_id, subs):
|
def _get_subtitles(self, episode_id, subs):
|
||||||
|
Some files were not shown because too many files have changed in this diff Show More
Loading…
x
Reference in New Issue
Block a user