From 5dd850d1cb24eba2ec38dc85e8a4c8319acac926 Mon Sep 17 00:00:00 2001 From: tim Date: Sat, 2 Dec 2023 00:17:58 +0200 Subject: [PATCH] Add reminder about old categories --- africat/aa_create_dataset.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/africat/aa_create_dataset.py b/africat/aa_create_dataset.py index dcaf528..6bf7ee2 100755 --- a/africat/aa_create_dataset.py +++ b/africat/aa_create_dataset.py @@ -96,6 +96,8 @@ def parse_and_extract(input_dir, verbose): cats = list() for cat in doc.findall('./category'): + # TODO check against a list of current categories, + # and strip any non-current categories cats.append(cat.text) #entry["categories"] = cats # if you want a list entry["categories"] = ";".join(cats) # if you want a string