Files
einundzwanzig.space/tasks/fetch_feed.js
Dennis Reimann d6bcb7b771 Customize feed
2021-09-20 14:04:31 +02:00

110 lines
4.5 KiB
JavaScript

const { writeFileSync } = require('fs')
const { join, resolve } = require('path')
const { replacements, slugify, stripHTML } = require('../helpers')
const { masterFeedUrl, publicFeedUrl } = require('../content/meta.json')
const request = require('sync-request')
const parser = require('fast-xml-parser')
const JSON2XMLParser = require("fast-xml-parser").j2xParser;
const he = require('he')
const dir = resolve(__dirname, '..')
const write = (name, data) => writeFileSync(join(dir, name), data)
const writeJSON = (name, data) => write(`generated/${name}.json`, JSON.stringify(data, null, 2))
const commonOpts = {
attributeNamePrefix: "",
attrNodeName: "__attr",
textNodeName: "#text",
ignoreAttributes: false,
cdataTagName: "__cdata",
cdataPositionChar: "\\c"
}
const xml2jsonOpts = {
...commonOpts,
ignoreNameSpace: false,
parseNodeValue: true,
parseAttributeValue: false,
trimValues: true,
parseTrueNumberOnly: false,
arrayMode: false,
numParseOptions: {
hex: true,
leadingZeros: true,
},
tagValueProcessor: val => he.decode(val),
attrValueProcessor: val => he.decode(val, { isAttributeValue: true })
}
var json2xmlOpts = {
...commonOpts,
format: false,
indentBy: " ",
supressEmptyNode: false,
tagValueProcessor: a => a,
attrValueProcessor: a => he.encode(a, { isAttributeValue: true, useNamedReferences: true })
};
const parseEpisode = e => {
const guid = e.guid['#text']
const title = e.title.__cdata.trim()
const content = replacements(e.description.__cdata).trim()
const description = stripHTML(content)
let [, categoryName = 'News', number, titlePlain] = title.match(/([\w\s]+?)?\s?#(\d+) - (.*)/) || [, , , title]
if (!number) categoryName = 'Verschiedenes'
if (categoryName === 'Der-Weg') categoryName = 'Der Weg'
const firstLine = description.split('\n')[0]
const blockMatch = firstLine.match(/Blockzeit\s(\d+)/)
const block = blockMatch ? parseInt(blockMatch[1]) : null
const category = slugify(categoryName)
const slug = slugify(`${categoryName} ${number || ''} ${titlePlain}`)
const date = new Date(e.pubDate)
const img = e['itunes:image'].__attr.href
const image = ['interview', 'lesestunde', 'verschiedenes'].includes(category) ? img : `/img/cover/${category}.png`
const duration = e['itunes:duration']
const enclosure = e.enclosure.__attr
const [, participantsString] = firstLine.match(/ - (?:(?:von und )?mit )(.*)/i) || []
const participants = participantsString ? participantsString.replace(/(\s*,\s*|\s*und\s*)/ig, '%').split('%') : []
return { block, category, categoryName, number, title, titlePlain, description, content, duration, slug, image, guid , date, enclosure, participants }
}
;(async () => {
// Load and adapt feed
const anchorXML = request('GET', masterFeedUrl).getBody('utf8')
const xml = anchorXML
.replace(`"${masterFeedUrl}"`, `"${publicFeedUrl}"`)
.replace('xmlns:anchor="https://anchor.fm/xmlns"', 'xmlns:anchor="https://anchor.fm/xmlns" xmlns:podcast="https://podcastindex.org/namespace/1.0"')
.replace('<channel>', `<channel>
<podcast:value type="lightning" method="keysend">
<podcast:valueRecipient name="Dennis" type="node" address="0231f73aef9bbdbf69e840640255946264026b56e17701f2d410b08b8b6e5d637a" split="1" />
<podcast:valueRecipient name="Fab" type="node" address="03f14237bb08f0afcb1ea07eff6b0b41e79294e66888971cccf1f585f5e21bf8f9" split="1" />
<podcast:valueRecipient name="Gigi" type="node" address="02e12fea95f576a680ec1938b7ed98ef0855eadeced493566877d404e404bfbf52" split="1" />
<podcast:valueRecipient name="Markus" type="node" address="0286e50ebeaafdf7dc321f6c8cb7e964e236b03ed67494b6337215c5c3c42252f2" split="1" />
<podcast:valueRecipient name="Daniel" type="node" address="0201d14101401add234ebe3bc0e3020a39726daadf82bc3fa6b9871c4f5b17ab3f" split="1" />
</podcast:value>`)
const feed = parser.parse(xml, xml2jsonOpts, true)
const episodes = []
delete feed.rss.channel.author // remove invalid tag
feed.rss.channel.item = feed.rss.channel.item.map(item => {
const episode = parseEpisode(item)
episodes.push(episode)
return {
...item,
link: `https://einundzwanzig.space/podcast/${episode.slug}`, // replace Anchor link
'itunes:summary': episode.description // please the validator, Anchor's itunes:summary contains HTML
}
})
writeJSON('feed', feed)
const JSON2XML = new JSON2XMLParser(json2xmlOpts)
const outputXML = JSON2XML.parse(feed)
writeJSON('episodes', episodes)
write('dist/feed.xml', outputXML)
write('dist/anchor.xml', anchorXML)
})()