]> jfr.im git - yt-dlp.git/blame - test/test_subtitles.py
[lynda] Convert to new subtitles system
[yt-dlp.git] / test / test_subtitles.py
CommitLineData
ae84f879 1#!/usr/bin/env python
a0f59cdc 2from __future__ import unicode_literals
ae84f879
JMF
3
4# Allow direct execution
5import os
6import sys
7import unittest
8sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
9
d0efb9ec 10from test.helper import FakeYDL, md5
ae84f879
JMF
11
12
13from youtube_dl.extractor import (
b4bcffef 14 BlipTVIE,
ae84f879
JMF
15 YoutubeIE,
16 DailymotionIE,
17 TEDIE,
4edff4cf 18 VimeoIE,
7bc8780c 19 WallaIE,
0b54a5b1 20 CeskaTelevizeIE,
311c3938 21 LyndaIE,
ae84f879
JMF
22)
23
24
25class BaseTestSubtitles(unittest.TestCase):
26 url = None
27 IE = None
5f6a1245 28
ae84f879
JMF
29 def setUp(self):
30 self.DL = FakeYDL()
a504ced0
JMF
31 self.ie = self.IE()
32 self.DL.add_info_extractor(self.ie)
ae84f879
JMF
33
34 def getInfoDict(self):
a504ced0 35 info_dict = self.DL.extract_info(self.url, download=False)
ae84f879
JMF
36 return info_dict
37
38 def getSubtitles(self):
39 info_dict = self.getInfoDict()
c84dd8a9 40 subtitles = info_dict['requested_subtitles']
a504ced0
JMF
41 if not subtitles:
42 return subtitles
43 for sub_info in subtitles.values():
44 if sub_info.get('data') is None:
45 uf = self.DL.urlopen(sub_info['url'])
46 sub_info['data'] = uf.read().decode('utf-8')
47 return dict((l, sub_info['data']) for l, sub_info in subtitles.items())
ae84f879
JMF
48
49
50class TestYoutubeSubtitles(BaseTestSubtitles):
51 url = 'QRS8MkLhQmM'
52 IE = YoutubeIE
53
ae84f879
JMF
54 def test_youtube_subtitles(self):
55 self.DL.params['writesubtitles'] = True
56 subtitles = self.getSubtitles()
57 self.assertEqual(md5(subtitles['en']), '4cd9278a35ba2305f47354ee13472260')
58
59 def test_youtube_subtitles_lang(self):
60 self.DL.params['writesubtitles'] = True
61 self.DL.params['subtitleslangs'] = ['it']
62 subtitles = self.getSubtitles()
63 self.assertEqual(md5(subtitles['it']), '164a51f16f260476a05b50fe4c2f161d')
64
65 def test_youtube_allsubtitles(self):
66 self.DL.params['writesubtitles'] = True
67 self.DL.params['allsubtitles'] = True
68 subtitles = self.getSubtitles()
69 self.assertEqual(len(subtitles.keys()), 13)
70
71 def test_youtube_subtitles_sbv_format(self):
72 self.DL.params['writesubtitles'] = True
73 self.DL.params['subtitlesformat'] = 'sbv'
74 subtitles = self.getSubtitles()
75 self.assertEqual(md5(subtitles['en']), '13aeaa0c245a8bed9a451cb643e3ad8b')
76
77 def test_youtube_subtitles_vtt_format(self):
78 self.DL.params['writesubtitles'] = True
79 self.DL.params['subtitlesformat'] = 'vtt'
80 subtitles = self.getSubtitles()
4e0084d9 81 self.assertEqual(md5(subtitles['en']), '3cb210999d3e021bd6c7f0ea751eab06')
ae84f879
JMF
82
83 def test_youtube_list_subtitles(self):
a0f59cdc 84 self.DL.expect_warning('Video doesn\'t have automatic captions')
ae84f879
JMF
85 self.DL.params['listsubtitles'] = True
86 info_dict = self.getInfoDict()
87 self.assertEqual(info_dict, None)
88
89 def test_youtube_automatic_captions(self):
90 self.url = '8YoUxe5ncPo'
91 self.DL.params['writeautomaticsub'] = True
92 self.DL.params['subtitleslangs'] = ['it']
93 subtitles = self.getSubtitles()
94 self.assertTrue(subtitles['it'] is not None)
95
7d900ef1
JMF
96 def test_youtube_translated_subtitles(self):
97 # This video has a subtitles track, which can be translated
98 self.url = 'Ky9eprVWzlI'
99 self.DL.params['writeautomaticsub'] = True
100 self.DL.params['subtitleslangs'] = ['it']
101 subtitles = self.getSubtitles()
102 self.assertTrue(subtitles['it'] is not None)
103
ae84f879 104 def test_youtube_nosubtitles(self):
a0f59cdc 105 self.DL.expect_warning('video doesn\'t have subtitles')
345e3783 106 self.url = 'n5BB19UTcdA'
ae84f879
JMF
107 self.DL.params['writesubtitles'] = True
108 self.DL.params['allsubtitles'] = True
109 subtitles = self.getSubtitles()
110 self.assertEqual(len(subtitles), 0)
111
112 def test_youtube_multiple_langs(self):
113 self.url = 'QRS8MkLhQmM'
114 self.DL.params['writesubtitles'] = True
115 langs = ['it', 'fr', 'de']
116 self.DL.params['subtitleslangs'] = langs
117 subtitles = self.getSubtitles()
118 for lang in langs:
a0f59cdc 119 self.assertTrue(subtitles.get(lang) is not None, 'Subtitles for \'%s\' not extracted' % lang)
ae84f879
JMF
120
121
122class TestDailymotionSubtitles(BaseTestSubtitles):
123 url = 'http://www.dailymotion.com/video/xczg00'
124 IE = DailymotionIE
125
ae84f879
JMF
126 def test_subtitles(self):
127 self.DL.params['writesubtitles'] = True
128 subtitles = self.getSubtitles()
129 self.assertEqual(md5(subtitles['en']), '976553874490cba125086bbfea3ff76f')
130
131 def test_subtitles_lang(self):
132 self.DL.params['writesubtitles'] = True
133 self.DL.params['subtitleslangs'] = ['fr']
134 subtitles = self.getSubtitles()
135 self.assertEqual(md5(subtitles['fr']), '594564ec7d588942e384e920e5341792')
136
137 def test_allsubtitles(self):
138 self.DL.params['writesubtitles'] = True
139 self.DL.params['allsubtitles'] = True
140 subtitles = self.getSubtitles()
8fb474fb 141 self.assertTrue(len(subtitles.keys()) >= 6)
ae84f879 142
ae84f879 143 def test_nosubtitles(self):
a0f59cdc 144 self.DL.expect_warning('video doesn\'t have subtitles')
ae84f879
JMF
145 self.url = 'http://www.dailymotion.com/video/x12u166_le-zapping-tele-star-du-08-aout-2013_tv'
146 self.DL.params['writesubtitles'] = True
147 self.DL.params['allsubtitles'] = True
148 subtitles = self.getSubtitles()
149 self.assertEqual(len(subtitles), 0)
150
151 def test_multiple_langs(self):
152 self.DL.params['writesubtitles'] = True
153 langs = ['es', 'fr', 'de']
154 self.DL.params['subtitleslangs'] = langs
155 subtitles = self.getSubtitles()
156 for lang in langs:
a0f59cdc 157 self.assertTrue(subtitles.get(lang) is not None, 'Subtitles for \'%s\' not extracted' % lang)
ae84f879
JMF
158
159
160class TestTedSubtitles(BaseTestSubtitles):
161 url = 'http://www.ted.com/talks/dan_dennett_on_our_consciousness.html'
162 IE = TEDIE
163
164 def test_no_writesubtitles(self):
165 subtitles = self.getSubtitles()
a504ced0 166 self.assertFalse(subtitles)
ae84f879
JMF
167
168 def test_subtitles(self):
169 self.DL.params['writesubtitles'] = True
170 subtitles = self.getSubtitles()
26dca166 171 self.assertEqual(md5(subtitles['en']), '4262c1665ff928a2dada178f62cb8d14')
ae84f879
JMF
172
173 def test_subtitles_lang(self):
174 self.DL.params['writesubtitles'] = True
175 self.DL.params['subtitleslangs'] = ['fr']
176 subtitles = self.getSubtitles()
26dca166 177 self.assertEqual(md5(subtitles['fr']), '66a63f7f42c97a50f8c0e90bc7797bb5')
ae84f879
JMF
178
179 def test_allsubtitles(self):
180 self.DL.params['writesubtitles'] = True
181 self.DL.params['allsubtitles'] = True
182 subtitles = self.getSubtitles()
0321213c 183 self.assertTrue(len(subtitles.keys()) >= 28)
ae84f879
JMF
184
185 def test_list_subtitles(self):
ae84f879
JMF
186 self.DL.params['listsubtitles'] = True
187 info_dict = self.getInfoDict()
188 self.assertEqual(info_dict, None)
189
ae84f879
JMF
190 def test_multiple_langs(self):
191 self.DL.params['writesubtitles'] = True
192 langs = ['es', 'fr', 'de']
193 self.DL.params['subtitleslangs'] = langs
194 subtitles = self.getSubtitles()
195 for lang in langs:
a0f59cdc 196 self.assertTrue(subtitles.get(lang) is not None, 'Subtitles for \'%s\' not extracted' % lang)
ae84f879 197
b4bcffef
PH
198
199class TestBlipTVSubtitles(BaseTestSubtitles):
200 url = 'http://blip.tv/a/a-6603250'
201 IE = BlipTVIE
202
203 def test_list_subtitles(self):
b4bcffef
PH
204 self.DL.params['listsubtitles'] = True
205 info_dict = self.getInfoDict()
206 self.assertEqual(info_dict, None)
207
208 def test_allsubtitles(self):
b4bcffef
PH
209 self.DL.params['writesubtitles'] = True
210 self.DL.params['allsubtitles'] = True
211 subtitles = self.getSubtitles()
212 self.assertEqual(set(subtitles.keys()), set(['en']))
213 self.assertEqual(md5(subtitles['en']), '5b75c300af65fe4476dff79478bb93e4')
214
215
4edff4cf
S
216class TestVimeoSubtitles(BaseTestSubtitles):
217 url = 'http://vimeo.com/76979871'
218 IE = VimeoIE
b0268cb6 219
4edff4cf
S
220 def test_subtitles(self):
221 self.DL.params['writesubtitles'] = True
222 subtitles = self.getSubtitles()
36e7a4ca 223 self.assertEqual(md5(subtitles['en']), '8062383cf4dec168fc40a088aa6d5888')
4edff4cf
S
224
225 def test_subtitles_lang(self):
226 self.DL.params['writesubtitles'] = True
227 self.DL.params['subtitleslangs'] = ['fr']
228 subtitles = self.getSubtitles()
229 self.assertEqual(md5(subtitles['fr']), 'b6191146a6c5d3a452244d853fde6dc8')
230
231 def test_allsubtitles(self):
232 self.DL.params['writesubtitles'] = True
233 self.DL.params['allsubtitles'] = True
234 subtitles = self.getSubtitles()
235 self.assertEqual(set(subtitles.keys()), set(['de', 'en', 'es', 'fr']))
236
4edff4cf 237 def test_nosubtitles(self):
a0f59cdc 238 self.DL.expect_warning('video doesn\'t have subtitles')
4edff4cf
S
239 self.url = 'http://vimeo.com/56015672'
240 self.DL.params['writesubtitles'] = True
241 self.DL.params['allsubtitles'] = True
242 subtitles = self.getSubtitles()
243 self.assertEqual(len(subtitles), 0)
244
245 def test_multiple_langs(self):
246 self.DL.params['writesubtitles'] = True
247 langs = ['es', 'fr', 'de']
248 self.DL.params['subtitleslangs'] = langs
249 subtitles = self.getSubtitles()
250 for lang in langs:
a0f59cdc 251 self.assertTrue(subtitles.get(lang) is not None, 'Subtitles for \'%s\' not extracted' % lang)
4edff4cf
S
252
253
0ca41c3d 254class TestWallaSubtitles(BaseTestSubtitles):
7bc8780c
S
255 url = 'http://vod.walla.co.il/movie/2705958/the-yes-men'
256 IE = WallaIE
257
258 def test_list_subtitles(self):
a0f59cdc 259 self.DL.expect_warning('Automatic Captions not supported by this server')
7bc8780c
S
260 self.DL.params['listsubtitles'] = True
261 info_dict = self.getInfoDict()
262 self.assertEqual(info_dict, None)
263
264 def test_allsubtitles(self):
a0f59cdc 265 self.DL.expect_warning('Automatic Captions not supported by this server')
7bc8780c
S
266 self.DL.params['writesubtitles'] = True
267 self.DL.params['allsubtitles'] = True
268 subtitles = self.getSubtitles()
269 self.assertEqual(set(subtitles.keys()), set(['heb']))
270 self.assertEqual(md5(subtitles['heb']), 'e758c5d7cb982f6bef14f377ec7a3920')
271
272 def test_nosubtitles(self):
a0f59cdc 273 self.DL.expect_warning('video doesn\'t have subtitles')
7bc8780c
S
274 self.url = 'http://vod.walla.co.il/movie/2642630/one-direction-all-for-one'
275 self.DL.params['writesubtitles'] = True
276 self.DL.params['allsubtitles'] = True
277 subtitles = self.getSubtitles()
278 self.assertEqual(len(subtitles), 0)
279
280
0b54a5b1
S
281class TestCeskaTelevizeSubtitles(BaseTestSubtitles):
282 url = 'http://www.ceskatelevize.cz/ivysilani/10600540290-u6-uzasny-svet-techniky'
283 IE = CeskaTelevizeIE
284
285 def test_list_subtitles(self):
286 self.DL.expect_warning('Automatic Captions not supported by this server')
287 self.DL.params['listsubtitles'] = True
288 info_dict = self.getInfoDict()
289 self.assertEqual(info_dict, None)
290
291 def test_allsubtitles(self):
292 self.DL.expect_warning('Automatic Captions not supported by this server')
293 self.DL.params['writesubtitles'] = True
294 self.DL.params['allsubtitles'] = True
295 subtitles = self.getSubtitles()
296 self.assertEqual(set(subtitles.keys()), set(['cs']))
8fb474fb 297 self.assertTrue(len(subtitles['cs']) > 20000)
0b54a5b1
S
298
299 def test_nosubtitles(self):
300 self.DL.expect_warning('video doesn\'t have subtitles')
301 self.url = 'http://www.ceskatelevize.cz/ivysilani/ivysilani/10441294653-hyde-park-civilizace/214411058091220'
302 self.DL.params['writesubtitles'] = True
303 self.DL.params['allsubtitles'] = True
304 subtitles = self.getSubtitles()
305 self.assertEqual(len(subtitles), 0)
306
307
311c3938
JMF
308class TestLyndaSubtitles(BaseTestSubtitles):
309 url = 'http://www.lynda.com/Bootstrap-tutorials/Using-exercise-files/110885/114408-4.html'
310 IE = LyndaIE
311
312 def test_allsubtitles(self):
313 self.DL.params['writesubtitles'] = True
314 self.DL.params['allsubtitles'] = True
315 subtitles = self.getSubtitles()
316 self.assertEqual(set(subtitles.keys()), set(['en']))
317 self.assertEqual(md5(subtitles['en']), '09bbe67222259bed60deaa26997d73a7')
318
319
ae84f879
JMF
320if __name__ == '__main__':
321 unittest.main()