Status: Open — cnrdh opened this issue 1 year ago
$ cat data/news/**/**/*.md | grep -E '\]\(https?:' | grep -v mynewsdesk |grep '!' | nd-map -t 'u=d.split("(").at(1),url = URL.canParse(u) ? new URL(u): u, url.origin' | nd-map '{hostname:d}' | nd-count
{"hostname":"https://norargo.hi.no","count":1}
{"hostname":"https://framsenteret.no","count":20}
{"hostname":"https://blogg.uit.no","count":5}
{"hostname":"http://www.akvaplan.niva.no","count":1}
{"hostname":"https://arvenetternansen.com","count":2}
{"hostname":"https://image.forskning.no","count":9}
{"hostname":"https://image.forskersonen.no","count":2}
{"hostname":"https://www.nilu.no","count":3}
{"hostname":"https://mrfylke.no","count":1}
{"hostname":"https://uit.no","count":14}
{"hostname":"https://recruiterprod.blob.core.windows.net","count":1}