Skip to content

Commit 5754535

Browse files
committed
update prioritized tools to use metadata csv
1 parent 3832c80 commit 5754535

File tree

2 files changed

+8
-18
lines changed

2 files changed

+8
-18
lines changed

data/prioritized-tool-urls.txt

Lines changed: 1 addition & 14 deletions
Original file line number | Diff line number | Diff line change
@@ -18,18 +18,11 @@
1818
//creativecommons.org/licenses/by-nc-sa/2.5
1919
//creativecommons.org/licenses/by-nd/2.5
2020
//creativecommons.org/licenses/by-sa/2.5
21-
//creativecommons.org/licenses/by/2.1
22-
//creativecommons.org/licenses/by-nc/2.1
23-
//creativecommons.org/licenses/by-nc-nd/2.1
24-
//creativecommons.org/licenses/by-nc-sa/2.1
25-
//creativecommons.org/licenses/by-nd/2.1
26-
//creativecommons.org/licenses/by-sa/2.1
2721
//creativecommons.org/licenses/by/2.0
2822
//creativecommons.org/licenses/by-nc/2.0
2923
//creativecommons.org/licenses/by-nc-nd/2.0
3024
//creativecommons.org/licenses/by-nc-sa/2.0
3125
//creativecommons.org/licenses/by-nd/2.0
32-
//creativecommons.org/licenses/by-nd-nc/2.0
3326
//creativecommons.org/licenses/by-sa/2.0
3427
//creativecommons.org/licenses/by/1.0
3528
//creativecommons.org/licenses/by-nc/1.0
@@ -558,7 +551,6 @@
558551
//creativecommons.org/licenses/by-nc-nd/2.0/jp
559552
//creativecommons.org/licenses/by-nc-sa/2.0/jp
560553
//creativecommons.org/licenses/by-nd/2.0/jp
561-
//creativecommons.org/licenses/by-nd-nc/2.0/jp
562554
//creativecommons.org/licenses/by-sa/2.0/jp
563555
//creativecommons.org/licenses/by/2.0/kr
564556
//creativecommons.org/licenses/by-nc/2.0/kr
@@ -615,11 +607,6 @@
615607
//creativecommons.org/licenses/by-nd-nc/1.0/nl
616608
//creativecommons.org/licenses/by-sa/1.0/nl
617609
//creativecommons.org/licenses/devnations/2.0
618-
//creativecommons.org/licenses/nc/2.0
619-
//creativecommons.org/licenses/nc-sa/2.0
620-
//creativecommons.org/licenses/nd/2.0
621-
//creativecommons.org/licenses/nd-nc/2.0
622-
//creativecommons.org/licenses/sa/2.0
623610
//creativecommons.org/licenses/nc/1.0
624611
//creativecommons.org/licenses/nc-sa/1.0
625612
//creativecommons.org/licenses/nc-sampling+/1.0
@@ -649,4 +636,4 @@
649636
//creativecommons.org/licenses/nc-sampling+/1.0/tw
650637
//creativecommons.org/licenses/sampling/1.0/tw
651638
//creativecommons.org/licenses/sampling+/1.0/tw
652-
//creativecommons.org/licenses/publicdomain
639+
//creativecommons.org/publicdomain/certification/1.0/us

dev/prioritize_tools.py

Lines changed: 7 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -14,6 +14,7 @@
1414
4. Save prioritized CC Legal Tool URLs
1515
"""
1616
# Standard library
17+
import csv
1718
import os
1819
import sys
1920
import textwrap
@@ -39,12 +40,14 @@
3940

4041
def get_tool_urls():
4142
LOGGER.info("Loading CC Legal Tool paths and adding prefix")
42-
file_path = shared.path_join(PATHS["data"], "legal-tool-paths.txt")
43-
prefix = "//creativecommons.org/"
43+
file_path = shared.path_join(PATHS["data"], "cc-legal-tools.csv")
4444
tool_urls = []
4545
with open(file_path, "r", encoding="utf-8") as file_obj:
46-
for line in file_obj:
47-
tool_urls.append(f"{prefix}{line.strip()}")
46+
rows = csv.DictReader(file_obj, dialect="unix")
47+
for row in rows:
48+
tool_urls.append(
49+
row["CANONICAL_URL"].replace("https:", "").rstrip("/")
50+
)
4851
return tool_urls
4952

5053

0 commit comments

Comments
 (0)