Files
einundzwanzig.space/tasks/fetch_feed.js
Dennis Reimann bdc9e708c9 Trim feed size
Link to shownotes for older episodes
2023-08-02 16:32:36 +02:00

239 lines
6.2 KiB
JavaScript

const { writeFileSync } = require('fs')
const { join, resolve } = require('path')
const { replacements, slugify, stripHTML } = require('../helpers')
const { masterFeedUrl, publicFeedUrl } = require('../content/meta.json')
const team = require('../content/team.json')
const nodes = require('../content/nodes.json')
const request = require('sync-request')
const { XMLParser, XMLBuilder, XMLValidator } = require('fast-xml-parser')
const xmlFormat = require('xml-formatter')
const debug = process.env.CI
const dir = resolve(__dirname, '..')
const write = (name, data) => writeFileSync(join(dir, name), data)
const writeJSON = (name, data) =>
write(`generated/${name}.json`, JSON.stringify(data, null, 2))
const commonOpts = {
attributeNamePrefix: '',
attributesGroupName: '__attr',
ignoreAttributes: false,
cdataPropName: '__cdata'
}
const xml2jsonOpts = {
...commonOpts,
parseTagValue: true,
parseAttributeValue: false,
trimValues: true,
parseTrueNumberOnly: false,
arrayMode: false
}
const json2xmlOpts = {
...commonOpts,
indentBy: ' '
}
const parser = new XMLParser(xml2jsonOpts, true)
const builder = new XMLBuilder(json2xmlOpts)
const parseEpisode = e => {
const guid = e.guid['#text']
const title = e.title.__cdata.trim()
const content = replacements(e.description.__cdata).trim()
const description = stripHTML(content)
let [, categoryName = 'News', number, titlePlain] = title.match(
/([\w\s]+?)?\s?#(\d+) - (.*)/
) || [, , , title]
if (!number) categoryName = 'Verschiedenes'
if (categoryName === 'Der-Weg') categoryName = 'Der Weg'
if (categoryName === 'Buchclub') categoryName = 'Lesestunde'
const firstLine = description.split('\n')[0]
const blockMatch = firstLine.match(/Blockzeit\s(\d+)/)
const block = blockMatch ? parseInt(blockMatch[1]) : null
const category = slugify(categoryName)
const slug = slugify(`${categoryName} ${number || ''} ${titlePlain}`)
const date = new Date(e.pubDate)
const img = e['itunes:image'].__attr.href
const image = ['interview', 'lesestunde', 'verschiedenes'].includes(category)
? img
: `/img/cover/${category}.png`
const duration = e['itunes:duration']
const enclosure = e.enclosure.__attr
const [, participantsString] =
firstLine.match(/ - (?:(?:von und )?mit )([^.]*)/i) || []
const participants = participantsString
? participantsString
.replace(/(\s*,\s*|\s*und\s*|\s*&\s*)/gi, '%')
.trim()
.split('%')
: []
return {
block,
category,
categoryName,
number,
title,
titlePlain,
description,
content,
duration,
slug,
image,
guid,
date,
enclosure,
participants
}
}
;(async () => {
// Load and adapt feed
const anchorXML = request('GET', masterFeedUrl).getBody('utf8')
const xml = anchorXML
.replace(`"${masterFeedUrl}"`, `"${publicFeedUrl}"`)
.replace(
'xmlns:anchor="https://anchor.fm/xmlns"',
'xmlns:anchor="https://anchor.fm/xmlns" xmlns:podcast="https://podcastindex.org/namespace/1.0"'
)
.replace('<channel>', '<channel><podcast:value></podcast:value>')
const feed = parser.parse(xml)
const episodes = []
const _noParticipants = [],
_noNode = []
const members = [
{ name: 'Dennis', ...nodes.dennis },
{ name: 'Fab', ...nodes.fab },
{ name: 'Gigi', ...nodes.gigi },
{ name: 'Markus', ...nodes.markus },
{ name: 'Daniel', ...nodes.daniel }
]
// remove invalid tag
delete feed.rss.channel.author
// podcast
feed.rss.channel['podcast:value'] = {
__attr: {
type: 'lightning',
method: 'keysend'
},
'podcast:valueRecipient': members.map(p => ({
__attr: {
...p,
type: 'node',
split: Math.round(100 / members.length)
}
}))
}
// episodes
feed.rss.channel.item = feed.rss.channel.item.map((item, index) => {
const episode = parseEpisode(item)
episodes.push(episode)
const link = `https://einundzwanzig.space/podcast/${episode.slug}`
let description = episode.description
if (index > 20) {
description = `Shownotes: ${link}`
}
const updated = {
...item,
link, // replace Anchor link
description,
'itunes:summary': description // please the validator, Anchor's itunes:summary contains HTML
}
if (episode.number) {
updated['podcast:episode'] = {
__attr: {
display: `${episode.categoryName} #${episode.number}`
},
'#text': episode.number
}
}
const value = episode.participants.reduce((result, name) => {
const id = name.toLowerCase()
const node = nodes[id]
if (node) {
result.push({ name, ...node })
} else if (debug) {
_noNode.push({ episode: episode.slug, name })
}
return result
}, [])
if (value.length) {
updated['podcast:value'] = {
__attr: {
type: 'lightning',
method: 'keysend'
},
'podcast:valueRecipient': value.map(p => ({
__attr: {
...p,
type: 'node',
split: Math.round(100 / value.length)
}
}))
}
} else if (debug) {
_noParticipants.push({ episode: episode.slug })
}
const people = episode.participants.reduce((result, name) => {
const id = name.toLowerCase()
const person = team[id]
if (person) {
result.push(person)
}
return result
}, [])
if (people.length) {
updated['podcast:person'] = []
people.forEach(p => {
updated['podcast:person'].push({
__attr: {
href: `https://twitter.com/${p.twitter}`
},
'#text': p.name
})
})
}
return updated
})
const outputXML = builder.build(feed)
writeJSON('episodes', episodes)
const validation = XMLValidator.validate(outputXML)
if (validation) {
write(
'dist/feed.xml',
xmlFormat(outputXML, {
indentation: json2xmlOpts.indentBy,
collapseContent: true
})
)
} else {
console.error(validation.err)
}
if (_noParticipants.length) {
console.log('Keine Teilnehmerliste')
console.table(_noParticipants)
}
if (_noNode.length) {
console.log('Teilnehmer ohne Node')
console.table(_noNode)
}
})()