Rewrite DAAI feed, close #87
This commit is contained in:
parent
aa26c36bc9
commit
eb431dc9bf
9
itsb.xml
9
itsb.xml
|
@ -820,9 +820,14 @@
|
|||
<frequency>3-5 reports/year</frequency>
|
||||
<feed format="rss" lang="English" id="daai-rss">
|
||||
<curl>
|
||||
<url verify-ssl="false">https://mwt.gov.na/published-daai-report/-/document_library/PVB0Gp2amxBo/view/1344073?_com_liferay_document_library_web_portlet_DLPortlet_INSTANCE_PVB0Gp2amxBo_displayStyle=list</url>
|
||||
<url>https://mwt.gov.na/published-daai-report</url>
|
||||
</curl>
|
||||
<pup>tr[data-title]</pup>
|
||||
<!--
|
||||
We would need both :not(:first-child) and :not(:nth-child(2)) to
|
||||
properly remove all the header rows since there are two of them,
|
||||
but pup does not allow that, so the jq script ignores the first row it gets.
|
||||
-->
|
||||
<pup>#our-content tr:not(:first-child)</pup>
|
||||
<jq path="daai.jq" />
|
||||
<json2xml />
|
||||
<output>daai.xml</output>
|
||||
|
|
22
jq/daai.jq
22
jq/daai.jq
|
@ -9,22 +9,28 @@ import "./helpers" as helpers;
|
|||
"channel": {
|
||||
"title": "DAAI",
|
||||
"description": "Namibian Directorate of Aircraft Accidents and Investigation reports",
|
||||
"link": "https://mwt.gov.na/web/mwt/published-reports",
|
||||
"link": "https://mwt.gov.na/published-daai-report",
|
||||
"language": "en-na",
|
||||
"pubDate": (now | strftime("%a, %d %b %Y %T %z")),
|
||||
"docs": "https://www.rssboard.org/rss-specification",
|
||||
"ttl": 1440,
|
||||
"generator": "ITSB",
|
||||
"item": [
|
||||
.[]
|
||||
.[1:][].children
|
||||
| {
|
||||
"title": .["data-title"],
|
||||
"link": (.children[0].children[0].href | sub("\\?.*$"; "")),
|
||||
"pubDate": (.children[3].children[0].onmouseover | match("'(.*)'").captures[0].string | strptime("%e/%m/%y %I:%M %p") | mktime | strftime("%a, %d %b %Y %T %z")),
|
||||
"guid": {
|
||||
"@isPermaLink": "true",
|
||||
"#text": (.children[0].children[0].href | sub("\\?.*$"; ""))
|
||||
"title": "\(.[1].children[0].text) - \(.[2].children[0].text) \(.[3].children[0].children[0].text) - \(.[-1].children[-1].text)",
|
||||
"link": (.[3].children[0].children[0].href | helpers::urlresolve("https://mwt.gov.na/published-daai-report")),
|
||||
"category": [
|
||||
[.[1].children[0].text, .[-1].children[-1].text][]
|
||||
| {
|
||||
"@domain": "https://mwt.gov.na",
|
||||
"#text": .
|
||||
}
|
||||
]
|
||||
}
|
||||
| .guid = {
|
||||
"@isPermaLink": "true",
|
||||
"#text": .link
|
||||
}
|
||||
]
|
||||
}
|
||||
|
|
Loading…
Reference in New Issue