diff options
author | Petter Reinholdtsen <pere@hungry.com> | 2014-12-08 08:23:47 +0100 |
---|---|---|
committer | Petter Reinholdtsen <pere@hungry.com> | 2014-12-08 08:23:47 +0100 |
commit | 7c4cd08f1a031b564ad62d8aa75c4f44ca16b3c4 (patch) | |
tree | cb132210b13f97edfc84bacad8944915776b6b47 | |
parent | 3ac6eb2db52f6423700ce59dd0e703c41ce71c3a (diff) |
Add meta-info about some scrapers.
-rw-r--r-- | scrapersources/postliste-arendal | 8 |
-rw-r--r-- | scrapersources/postliste-bioforsk | 11 |
-rw-r--r-- | scrapersources/postliste-ntnu | 12 |
-rw-r--r-- | scrapersources/postliste-oep-deliverydates | 10 |
-rw-r--r-- | scrapersources/postliste-stortinget | 10 |
5 files changed, 49 insertions, 2 deletions
```diff
diff --git a/scrapersources/postliste-arendal b/scrapersources/postliste-arendal
index a952b63..ed64507 100644
--- a/scrapersources/postliste-arendal
+++ b/scrapersources/postliste-arendal
@@ -1,4 +1,12 @@
 # coding=utf-8
+# YAML-tagger:
+# Type: kommune
+# Status: unfinished
+# Name: Arendal kommune
+# Format: HTML
+# Datatype: ?
+# Vendor: ?
+# Missingfields: caseid, casedesc, etc
 import scraperwiki
diff --git a/scrapersources/postliste-bioforsk b/scrapersources/postliste-bioforsk
index b41b30f..4aac9f0 100644
--- a/scrapersources/postliste-bioforsk
+++ b/scrapersources/postliste-bioforsk
@@ -1,4 +1,13 @@
-# -*- coding: UTF-8 -*-
+# -*- coding: utf-8 -*-
+# FIXME: This source uses an unsupported PDF format.
+# YAML-tagger:
+# Type: unknown
+# Status: unfinished
+# Name: Bioforsk
+# Format: PDF
+# Datatype: ?
+# Vendor: ?
+# Run: daily
 import scraperwiki
 import json
diff --git a/scrapersources/postliste-ntnu b/scrapersources/postliste-ntnu
index d6c6695..f78af9d 100644
--- a/scrapersources/postliste-ntnu
+++ b/scrapersources/postliste-ntnu
@@ -1,4 +1,14 @@
-# -*- coding: UTF-8 -*-
+# -*- coding: utf-8 -*-
+# YAML-tagger:
+# Type: university
+# Status: unfinished
+# Name: Norges Teknisk-Naturvitenskaplige universitet
+# Format: HTML
+# Datatype: ?
+# Vendor: ?
+# Run: daily
+#
+# Tidligere ble det publisert PDF-er
 import scraperwiki
 import json
diff --git a/scrapersources/postliste-oep-deliverydates b/scrapersources/postliste-oep-deliverydates
index ebce253..97b1536 100644
--- a/scrapersources/postliste-oep-deliverydates
+++ b/scrapersources/postliste-oep-deliverydates
@@ -1,3 +1,13 @@
+# -*- coding: utf-8 -*-
+# YAML-tagger:
+# Type: statlig
+# Status: finished
+# Name: Offentlig Elektronisk postjournal delivery dates
+# Format: HTML
+# Datatype: ?
+# Vendor: ?
+# Run: hourly
+
 import scraperwiki
 import lxml.html
 import datetime
diff --git a/scrapersources/postliste-stortinget b/scrapersources/postliste-stortinget
index 98fd7d6..8fd48fe 100644
--- a/scrapersources/postliste-stortinget
+++ b/scrapersources/postliste-stortinget
@@ -1,3 +1,13 @@
+# -*- coding: utf-8 -*-
+# YAML-tagger:
+# Type: statlig
+# Status: finished
+# Name: Stortinget
+# Format: PDF
+# Datatype: ePhorte
+# Vendor: Ergo
+# Run: daily
+
 # Based on the scraper advanced-scraping-pdf
 # See also
 # https://views.scraperwiki.com/run/pdf-to-html-preview-1/?url=http%3A%2F%2Fwww.stortinget.no%2FGlobal%2Fpdf%2Fpostjournal%2Fpj-2012-05-09.pdf
```