Update rotana.net guide.

Test

```shell
npm test -- rotana.net

> test
> run-script-os rotana.net

> test:win32
> SET "TZ=Pacific/Nauru" && npx jest --runInBand rotana.net

 PASS  sites/rotana.net/rotana.net.test.js (6.081 s)
  √ can use defined user agent (3 ms)
  √ can generate valid english url (1 ms)
  √ can generate valid arabic url
  √ can parse english response (630 ms)
  √ can parse arabic response (560 ms)
  √ can handle empty guide (3 ms)

Test Suites: 1 passed, 1 total
Tests:       6 passed, 6 total
Snapshots:   0 total
Time:        6.406 s, estimated 8 s
Ran all test suites matching /rotana.net/i.
```

Grab

```shell
npm run grab -- --site=rotana.net --lang=en

> grab
> npx tsx scripts/commands/epg/grab.ts --site=rotana.net --lang=en

starting...
config:
  output: guide.xml
  maxConnections: 1
  gzip: false
  site: rotana.net
  lang: en
loading channels...
  found 16 channel(s)
run #1:
  [1/32] rotana.net (en) - 432 - Nov 26, 2024 (24 programs)
  [2/32] rotana.net (en) - 432 - Nov 27, 2024 (23 programs)
  [3/32] rotana.net (en) - 433 - Nov 27, 2024 (14 programs)
  [4/32] rotana.net (en) - LBC.sa - Nov 27, 2024 (19 programs)
  [5/32] rotana.net (en) - LBC.sa - Nov 26, 2024 (20 programs)
  [6/32] rotana.net (en) - 433 - Nov 26, 2024 (14 programs)
  [7/32] rotana.net (en) - AlResalah.sa - Nov 27, 2024 (54 programs)
  [8/32] rotana.net (en) - RotanaAflam.sa - Nov 26, 2024 (16 programs)
  [9/32] rotana.net (en) - AlResalah.sa - Nov 26, 2024 (57 programs)
  [10/32] rotana.net (en) - MPlusHD.sa - Nov 27, 2024 (2 programs)
  [11/32] rotana.net (en) - MPlusHD.sa - Nov 26, 2024 (240 programs)
  [12/32] rotana.net (en) - RotanaComedy.sa - Nov 26, 2024 (13 programs)
  [13/32] rotana.net (en) - RotanaClip.sa - Nov 27, 2024 (2 programs)
  [14/32] rotana.net (en) - RotanaClip.sa - Nov 26, 2024 (246 programs)
  [15/32] rotana.net (en) - RotanaClassic.sa - Nov 27, 2024 (18 programs)
  [16/32] rotana.net (en) - RotanaClassic.sa - Nov 26, 2024 (18 programs)
  [17/32] rotana.net (en) - RotanaCinemaKSA.sa - Nov 27, 2024 (13 programs)
  [18/32] rotana.net (en) - RotanaCinemaKSA.sa - Nov 26, 2024 (14 programs)
  [19/32] rotana.net (en) - RotanaCinemaEgypt.eg - Nov 27, 2024 (12 programs)
  [20/32] rotana.net (en) - RotanaCinemaEgypt.eg - Nov 26, 2024 (13 programs)
  [21/32] rotana.net (en) - RotanaAmerica.sa - Nov 27, 2024 (18 programs)
  [22/32] rotana.net (en) - RotanaAmerica.sa - Nov 26, 2024 (15 programs)
  [23/32] rotana.net (en) - RotanaAflam.sa - Nov 27, 2024 (16 programs)
  [24/32] rotana.net (en) - RotanaKids.sa - Nov 26, 2024 (83 programs)
  [25/32] rotana.net (en) - RotanaKhalijia.sa - Nov 26, 2024 (23 programs)
  [26/32] rotana.net (en) - RotanaDrama.sa - Nov 27, 2024 (26 programs)
  [27/32] rotana.net (en) - RotanaMusic.sa - Nov 27, 2024 (0 programs)
  [28/32] rotana.net (en) - RotanaMusic.sa - Nov 26, 2024 (0 programs)
  [29/32] rotana.net (en) - RotanaKhalijia.sa - Nov 27, 2024 (24 programs)
  [30/32] rotana.net (en) - RotanaDrama.sa - Nov 26, 2024 (26 programs)
  [31/32] rotana.net (en) - RotanaKids.sa - Nov 27, 2024 (83 programs)
  [32/32] rotana.net (en) - RotanaComedy.sa - Nov 27, 2024 (13 programs)
  saving to "guide.xml"...
  done in 00h 00m 49s
```

Signed-off-by: Toha <tohenk@yahoo.com>
This commit is contained in:
Toha
2024-11-27 03:48:25 +07:00
parent b311572748
commit e09316dc63
8 changed files with 833 additions and 606 deletions

View File

@@ -10,6 +10,9 @@ dayjs.extend(timezone)
dayjs.extend(utc)
dayjs.extend(customParseFormat)
const tz = 'Asia/Riyadh'
const nworker = 25
const headers = {
'User-Agent':
'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/118.0.0.0 Safari/537.36 OPR/104.0.0.0'
@@ -33,11 +36,33 @@ module.exports = {
}
const items = parseItems(content, date)
for (const item of items) {
const program = await parseProgram(item, channel)
if (program) {
programs.push(program)
if (items.length) {
const workers = []
const n = Math.min(nworker, items.length)
while (workers.length < n) {
const worker = () => {
if (items.length) {
const item = items.shift()
parseProgram(item, channel)
.then(() => {
programs.push(item)
worker()
})
} else {
workers.splice(workers.indexOf(worker), 1)
}
}
workers.push(worker)
worker()
}
await new Promise(resolve => {
const interval = setInterval(() => {
if (workers.length === 0) {
clearInterval(interval)
resolve()
}
}, 500)
})
}
return programs
@@ -58,85 +83,116 @@ module.exports = {
}
}
async function parseProgram(item, channel, options = {}) {
options = options || {}
const deep = options.deep !== undefined ? options.deep : true
const raw = options.raw !== undefined ? options.raw : false
const top = item.find('.iq-accordion-block')
const info = top.find('.iq-accordion-title .big-title span')
if (info.length) {
const [time, title] = info.text().split('\n')
const [d, m, y] = item._date.split('-')
const start = dayjs.tz(`${y}-${m}-${d} ${time.trim()}`, 'YYYY-MM-DD HH:mm', 'Asia/Riyadh')
let description, image, stop
if (deep) {
const pid = top.attr('id').split('-')[1]
if (pid) {
const url = `https://rotana.net/${channel.lang}/streams?channel=${channel.site_id}&itemId=${pid}`
const params = {
headers: Object.assign({}, headers, { 'X-Requested-With': 'XMLHttpRequest' }),
Cookie: cookies[channel.lang]
}
debug(`fetching description ${url}`)
const result = await axios
.get(url, params)
.then(response => response.data)
.catch(console.error)
async function parseProgram(item, channel) {
if (item.program) {
const url = `https://rotana.net/${channel.lang}/streams?channel=${channel.site_id}&itemId=${item.program}`
const params = {
headers: Object.assign({}, headers, { 'X-Requested-With': 'XMLHttpRequest' }),
Cookie: cookies[channel.lang]
}
debug(`fetching description ${url}`)
const result = await axios
.get(url, params)
.then(response => response.data)
.catch(console.error)
const $ = cheerio.load(result)
const details = $('.trending-info div > span')
if (details.length) {
description = details.text().split('\n')[3].trim()
}
const img = $('.row > div > img')
if (img.length) {
image = img.attr('src')
}
}
if (item._next) {
const next = await parseProgram(item._next, channel, { deep: false, raw: true })
if (next.start) {
stop = next.start
const $ = cheerio.load(result)
const details = $('.trending-info .row div > span')
if (details.length) {
for (const el of details[0].children) {
switch (el.constructor.name) {
case 'Text':
if (item.description === undefined) {
const desc = $(el).text().trim()
if (desc) {
item.description = desc
}
}
break;
case 'Element':
if (el.name === 'span') {
const [k, v] = $(el).text().split(':').map(a => a.trim())
switch (k) {
case 'Category':
case 'التصنيف':
item.category = v;
break;
case 'Country':
case 'البلد':
item.country = v;
break;
case 'Director':
case 'المخرج':
item.director = v;
break;
case 'Language':
case 'اللغة':
item.language = v;
break;
case 'Release Year':
case 'سنة الإصدار':
item.date = v;
break;
}
}
break;
}
}
}
return {
title: title?.trim(),
description: description?.trim(),
image,
start: raw ? start : start?.toISOString(),
stop: raw ? stop : stop?.toISOString()
const img = $('.row > div > img')
if (img.length) {
item.image = img.attr('src')
}
delete item.program
}
}
function parseItems(content, date) {
const result = []
const $ = cheerio.load(content)
const expectedId = `item-${date.format('DD-MM-YYYY')}`
let lastId
const items = []
let curDate
$('.hour > div').each((_, item) => {
const $item = $(item)
if ($item.hasClass('bg')) {
lastId = $item.attr('id')
curDate = $item.attr('id')
curDate = curDate.substr(curDate.indexOf('-') + 1).split('-')
} else if ($item.hasClass('iq-accordion')) {
$item._date = lastId.substr(lastId.indexOf('-') + 1)
// is date match?
if (lastId === expectedId) {
// set next item
if (result.length) {
result[result.length - 1]._next = $item
}
result.push($item)
} else if (result.length && !result[result.length - 1]._next) {
// set next item
result[result.length - 1]._next = $item
const top = $item.find('.iq-accordion-block')
const heading = top.find('.iq-accordion-title .big-title')
if (heading.length) {
const progId = top.attr('id')
const title = heading.find('span:eq(1)').text()
.split('\n')
.map(a => a.trim())
.join(' ')
const time = heading.find('span:eq(0)').text()
const [d, m, y] = curDate
items.push({
program: progId.substr(progId.indexOf('-') + 1),
title: title ? title.trim() : title,
start: `${y}-${m}-${d} ${time.trim()}`,
})
}
}
})
return result
items.sort((a, b) => a.start.localeCompare(b.start))
for (let i = 0; i < items.length; i++) {
if (i < items.length - 2) {
items[i].stop = items[i + 1].start
} else {
const dt = dayjs.tz(items[i].start).add(1, 'd')
items[i].stop = `${dt.format('YYYY-MM-DD')} 00:00`
}
}
const expectedDate = `${date.format('YYYY-MM-DD')}`
return items
.filter(a => a.start.startsWith(expectedDate) || a.stop.startsWith(expectedDate))
.map(a => {
a.start = dayjs.tz(a.start, tz)
a.stop = dayjs.tz(a.stop, tz)
return a
})
}
function parseCookies(headers) {