File: youtube.lua

package info (click to toggle)
libquvi-scripts 0.9.20131130-3
  • links: PTS, VCS
  • area: main
  • in suites: bookworm, forky, sid, trixie
  • size: 2,828 kB
  • sloc: sh: 11,744; ansic: 2,587; makefile: 226
file content (126 lines) | stat: -rw-r--r-- 3,510 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
-- libquvi-scripts v0.9.20131130
-- Copyright (C) 2013  Toni Gundogdu <legatvs@gmail.com>
--
-- This file is part of libquvi-scripts <http://quvi.sourceforge.net/>.
--
-- This program is free software: you can redistribute it and/or
-- modify it under the terms of the GNU Affero General Public
-- License as published by the Free Software Foundation, either
-- version 3 of the License, or (at your option) any later version.
--
-- This program is distributed in the hope that it will be useful,
-- but WITHOUT ANY WARRANTY; without even the implied warranty of
-- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-- GNU Affero General Public License for more details.
--
-- You should have received a copy of the GNU Affero General
-- Public License along with this program.  If not, see
-- <http://www.gnu.org/licenses/>.
--

local YouTube = {} -- Utility functions unique to this script

-- Identify the script.
function ident(qargs)
  local Y = require 'quvi/youtube'
  return Y.ident(qargs)
end

-- Parse subtitle properties.
function parse(qargs)
  local Y = require 'quvi/youtube'
  local C = require 'quvi/const'

  local u = Y.normalize(qargs.input_url)
  local v = u:match('v=([%w-_]+)') or error('no match: media ID')

  qargs.subtitles = {}

  YouTube.tts_get(qargs, v, u, C)
  YouTube.cc_get(qargs, v, C)

  return qargs
end

--
-- Utility functions
--

-- Extract the TTS (text-to-speech, or transcript).
function YouTube.tts_get(qargs, v, u, C)
  local u_fmt = "%s&tlang=%s&type=trackformat=1,&lang=en&kind=asr"
  local p = quvi.http.fetch(u).data

  local tts_url = p:match('[\'"]TTS_URL[\'"]:%s+[\'"](.-)[\'"]')
  if not tts_url then return end

  p = nil

  tts_url = tts_url:gsub('\\u0026','&')
  local U = require 'quvi/util'
  tts_url = U.slash_unescape(tts_url)
  tts_url = U.unescape(tts_url)

  local langs = tts_url:match('asr_langs=(.-)&')
  if not langs then return end

  local r = {}
  for c in langs:gmatch('(%w+)') do
    table.insert(r, {
      url = string.format(u_fmt, tts_url, c),
      translated = '',
      id = 'tts_'..c,
      original = '',
      code = c
    })
  end

  table.insert(qargs.subtitles, {format=C.sif_tt, type=C.st_tts, lang=r})
end

-- Return a new timed-text track URL.
function YouTube.tt_track_new(scheme, v, name, lang)
  local t = {
    scheme, '://youtube.com/api/timedtext?hl=en&type=track',
    '&v=', v, '&name=', name, '&lang=', lang
  }
  return table.concat(t)
end

-- Return a new timed-text list URL.
function YouTube.tt_list_new(scheme, v)
  local t = {scheme, '://video.google.com/timedtext?hl=en&type=list&v=', v}
  return table.concat(t)
end

-- Extract the CC (closed-captions) data.
function YouTube.cc_get(qargs, v, C)
  local U = require 'socket.url'
  local u = U.parse(qargs.input_url)

  local l = YouTube.tt_list_new(u.scheme, v)
  local x = quvi.http.fetch(l).data

  local L = require 'lxp.lom'
  local t = L.parse(x)

  local r = {}
  for i=1, #t do
    if t[i].tag == 'track' then
      local lang = t[i].attr['lang_code']
      if lang then
        local name = t[i].attr['name'] or ''
        table.insert(r, {
          translated = t[i].attr['lang_translated'] or '',
          url = YouTube.tt_track_new(u.scheme, v, name, lang),
          original = t[i].attr['lang_original'] or '',
          id = table.concat({'cc_', lang}),
          code = lang
        })
      end
    end
  end
  table.insert(qargs.subtitles, {format=C.sif_tt, type=C.st_cc, lang=r})
end

-- vim: set ts=2 sw=2 tw=72 expandtab: