Skip to content

Commit ea9ae64

Browse files
committed
Added award, fund and quality
1 parent a943fef commit ea9ae64

File tree

3 files changed

+36
-3
lines changed

3 files changed

+36
-3
lines changed

Makefile

+4-1
Original file line numberDiff line numberDiff line change
@@ -96,6 +96,9 @@ specification::
9696
curl -qfsL '$(SOURCE_URL)/specification/main/specification/provision.csv' > specification/provision.csv
9797
curl -qfsL '$(SOURCE_URL)/specification/main/specification/provision-rule.csv' > specification/provision-rule.csv
9898
curl -qfsL '$(SOURCE_URL)/specification/main/specification/provision-reason.csv' > specification/provision-reason.csv
99+
curl -qfsL '$(SOURCE_URL)/specification/main/specification/fund.csv' > specification/fund.csv
100+
curl -qfsL '$(SOURCE_URL)/specification/main/specification/award.csv' > specification/award.csv
101+
curl -qfsL '$(SOURCE_URL)/specification/main/specification/quality.csv' > specification/quality.csv
99102

100103
check-performance::
101-
python check/performance.py
104+
python check/performance.py

bin/guess-lpa.py

+28
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,28 @@
1+
#!/usr/bin/env python3
"""Print the organisations in collection/source.csv that look like LPAs.

An organisation is reported when its identifier starts with one of
``LPA_PREFIXES``. Matching identifiers are printed one per line, sorted.
"""

import csv

# Path is relative to the current working directory, as in the original script.
SOURCE_PATH = "collection/source.csv"

# Organisation identifier prefixes that are reported by this script.
LPA_PREFIXES = ("local-authority", "development-corporation", "national-park")


def index_sources(rows):
    """Build organisation -> datasets and dataset -> organisations indexes.

    Args:
        rows: iterable of mappings with an "organisation" key and a
            semicolon-separated "datasets" (preferred) or "pipelines" value.

    Returns:
        A tuple ``(organisations, datasets)`` of dicts mapping each key to a
        set of the related names.

    Raises:
        KeyError: if a row has no "organisation" key.
    """
    organisations = {}
    datasets = {}

    for row in rows:
        organisation = row["organisation"]
        # csv.DictReader fills missing trailing columns with None, so fall
        # back to "" rather than calling .split on None.
        names = row.get("datasets") or row.get("pipelines") or ""

        # Register the organisation even when it lists no datasets, so it is
        # still considered for output.
        organisations.setdefault(organisation, set())

        for dataset in names.split(";"):
            # "".split(";") yields [""]; don't index an empty dataset name.
            if not dataset:
                continue
            organisations[organisation].add(dataset)
            datasets.setdefault(dataset, set()).add(organisation)

    return organisations, datasets


def guess_lpas(organisations):
    """Return the sorted organisation names that start with an LPA prefix."""
    return sorted(name for name in organisations if name.startswith(LPA_PREFIXES))


def main():
    """Read SOURCE_PATH and print each matching organisation on its own line."""
    # newline="" is what the csv module expects for files it parses; the
    # context manager closes the handle the original left open.
    with open(SOURCE_PATH, newline="") as source:
        organisations, _ = index_sources(csv.DictReader(source))

    for organisation in guess_lpas(organisations):
        print(organisation)


if __name__ == "__main__":
    main()

bin/load.py

+4-2
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,6 @@
44

55
import os
66
import sys
7-
import csv
87
import logging
98
import sqlite3
109

@@ -23,12 +22,14 @@
2322
"old-resource": "collection",
2423
"log": "collection",
2524

25+
"award": "specification",
2626
"collection": "specification",
2727
"theme": "specification",
2828
"typology": "specification",
2929
"dataset": "specification",
3030
"dataset-field": "specification",
3131
"field": "specification",
32+
"fund": "specification",
3233
"datatype": "specification",
3334
"prefix": "specification",
3435
"severity": "specification",
@@ -46,6 +47,8 @@
4647
"provision": "specification",
4748
"provision-rule": "specification",
4849
"provision-reason": "specification",
50+
"quality": "specification",
51+
"datatype": "specification",
4952
"specification": "specification",
5053
"specification-status": "specification",
5154

@@ -206,4 +209,3 @@ def create_parquet_from_table(df, name, output_dir):
206209
where t1.rn = 1
207210
""")
208211
conn.close()
209-

0 commit comments

Comments
 (0)