Skip to content

Commit 160e484

Browse files
committed
Regex adjustments - see HEA-809
1 parent ecef5bd commit 160e484

2 files changed

Lines changed: 5 additions & 29 deletions

File tree

pipelines/assets/livelihood_activity_regexes.json

Lines changed: 3 additions & 27 deletions
Original file line number | Diff line number | Diff line change
@@ -92,43 +92,19 @@
9292
"people_per_household"
9393
],
9494
[
95-
"(?P<product_id>{label_pattern}{separator_pattern}{label_pattern}) {age_gender_pattern}{separator_pattern}\\({unit_of_measure_pattern}(?: collectés?|gathered)?\\)",
95+
"{product_pattern}{separator_pattern} {age_gender_pattern} ?\\(?{unit_of_measure_pattern}(?: collectés?|gathered)?\\)?",
9696
null,
9797
true,
9898
"quantity_produced"
9999
],
100100
[
101-
"{product_pattern}{separator_pattern} {age_gender_pattern} ?\\({unit_of_measure_pattern}(?: collectés?|gathered)?\\)",
102-
null,
103-
true,
104-
"quantity_produced"
105-
],
106-
[
107-
"{product_pattern}: {label_pattern} {age_gender_pattern} \\({unit_of_measure_pattern}(?: collectés?|gathered)?\\)",
108-
null,
109-
true,
110-
"quantity_produced"
111-
],
112-
[
113-
"{product_pattern}{separator_pattern} {age_gender_pattern}{separator_pattern} (?:no\\.|nbr?\\.) people per hh",
101+
"{product_pattern}{separator_pattern} {age_gender_pattern}{separator_pattern} {nbr_pattern} (?:de )?(?:pers|personnes|people)(?: ?/ ?| par | per )(?:ménage|mènage|hh)",
114102
null,
115103
true,
116104
"people_per_household"
117105
],
118106
[
119-
"{product_pattern} *: *{age_gender_pattern}",
120-
null,
121-
true,
122-
null
123-
],
124-
[
125-
"{product_pattern} +{age_gender_pattern}",
126-
null,
127-
true,
128-
null
129-
],
130-
[
131-
"{age_gender_pattern} {product_pattern}",
107+
"{product_pattern}{separator_pattern} {age_gender_pattern}",
132108
null,
133109
true,
134110
null

pipelines_tests/test_assets/test_livelihood_activity_regexes.json

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1087,9 +1087,9 @@
10871087
"product_id": "threshing, harvesting",
10881088
"household_labor_provider": "women"
10891089
},
1090-
"poisson : peche homme (kg collectés)": {
1090+
"poisson/peche homme (kg collectés)": {
10911091
"is_start": true,
1092-
"product_id": "poisson : peche",
1092+
"product_id": "poisson/peche",
10931093
"household_labor_provider": "men",
10941094
"unit_of_measure_id": "kg",
10951095
"attribute": "quantity_produced"

0 commit comments

Comments
 (0)