about | summary | refs | log | tree | commit | diff | stats
diff options
context:
space:
mode:
author: Petter Reinholdtsen <pere@hungry.com> 2014-12-08 08:23:47 +0100
committer: Petter Reinholdtsen <pere@hungry.com> 2014-12-08 08:23:47 +0100
commit: 7c4cd08f1a031b564ad62d8aa75c4f44ca16b3c4 (patch)
tree: cb132210b13f97edfc84bacad8944915776b6b47
parent: 3ac6eb2db52f6423700ce59dd0e703c41ce71c3a (diff)
Add meta-info about some scrapers.
-rw-r--r-- scrapersources/postliste-arendal 8
-rw-r--r-- scrapersources/postliste-bioforsk 11
-rw-r--r-- scrapersources/postliste-ntnu 12
-rw-r--r-- scrapersources/postliste-oep-deliverydates 10
-rw-r--r-- scrapersources/postliste-stortinget 10
5 files changed, 49 insertions, 2 deletions
diff --git a/scrapersources/postliste-arendal b/scrapersources/postliste-arendal
index a952b63..ed64507 100644
--- a/scrapersources/postliste-arendal
+++ b/scrapersources/postliste-arendal
@@ -1,4 +1,12 @@
# coding=utf-8
+# YAML-tagger:
+# Type: kommune
+# Status: unfinished
+# Name: Arendal kommune
+# Format: HTML
+# Datatype: ?
+# Vendor: ?
+# Missingfields: caseid, casedesc, etc
import scraperwiki
diff --git a/scrapersources/postliste-bioforsk b/scrapersources/postliste-bioforsk
index b41b30f..4aac9f0 100644
--- a/scrapersources/postliste-bioforsk
+++ b/scrapersources/postliste-bioforsk
@@ -1,4 +1,13 @@
-# -*- coding: UTF-8 -*-
+# -*- coding: utf-8 -*-
+# FIXME: This source uses an unsupported PDF format.
+# YAML-tagger:
+# Type: unknown
+# Status: unfinished
+# Name: Bioforsk
+# Format: PDF
+# Datatype: ?
+# Vendor: ?
+# Run: daily
import scraperwiki
import json
diff --git a/scrapersources/postliste-ntnu b/scrapersources/postliste-ntnu
index d6c6695..f78af9d 100644
--- a/scrapersources/postliste-ntnu
+++ b/scrapersources/postliste-ntnu
@@ -1,4 +1,14 @@
-# -*- coding: UTF-8 -*-
+# -*- coding: utf-8 -*-
+# YAML-tagger:
+# Type: university
+# Status: unfinished
+# Name: Norges teknisk-naturvitenskapelige universitet
+# Format: HTML
+# Datatype: ?
+# Vendor: ?
+# Run: daily
+#
+# Tidligere ble det publisert PDF-er
import scraperwiki
import json
diff --git a/scrapersources/postliste-oep-deliverydates b/scrapersources/postliste-oep-deliverydates
index ebce253..97b1536 100644
--- a/scrapersources/postliste-oep-deliverydates
+++ b/scrapersources/postliste-oep-deliverydates
@@ -1,3 +1,13 @@
+# -*- coding: utf-8 -*-
+# YAML-tagger:
+# Type: statlig
+# Status: finished
+# Name: Offentlig Elektronisk postjournal delivery dates
+# Format: HTML
+# Datatype: ?
+# Vendor: ?
+# Run: hourly
+
import scraperwiki
import lxml.html
import datetime
diff --git a/scrapersources/postliste-stortinget b/scrapersources/postliste-stortinget
index 98fd7d6..8fd48fe 100644
--- a/scrapersources/postliste-stortinget
+++ b/scrapersources/postliste-stortinget
@@ -1,3 +1,13 @@
+# -*- coding: utf-8 -*-
+# YAML-tagger:
+# Type: statlig
+# Status: finished
+# Name: Stortinget
+# Format: PDF
+# Datatype: ePhorte
+# Vendor: Ergo
+# Run: daily
+
# Based on the scraper advanced-scraping-pdf
# See also
# https://views.scraperwiki.com/run/pdf-to-html-preview-1/?url=http%3A%2F%2Fwww.stortinget.no%2FGlobal%2Fpdf%2Fpostjournal%2Fpj-2012-05-09.pdf