From 5b5608711a79eb48e61f31eca2cbee4170ac86f1 Mon Sep 17 00:00:00 2001 From: Anna Shamray Date: Fri, 29 Nov 2024 17:20:32 +0100 Subject: [PATCH 1/8] :test_tube: [#472] add regression tests if filter with icontains have value with comma --- src/objects/tests/v2/test_filters.py | 57 ++++++++++++++++++++++++++++ 1 file changed, 57 insertions(+) diff --git a/src/objects/tests/v2/test_filters.py b/src/objects/tests/v2/test_filters.py index f0e6eaa1..339adbae 100644 --- a/src/objects/tests/v2/test_filters.py +++ b/src/objects/tests/v2/test_filters.py @@ -359,6 +359,63 @@ def test_filter_icontains_numeric(self): f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", ) + def test_filter_icontains_string_with_comma(self): + """ + regression test for https://github.com/maykinmedia/objects-api/issues/472 + """ + record = ObjectRecordFactory.create( + data={"name": "Something important"}, object__object_type=self.object_type + ) + ObjectRecordFactory.create( + data={"name": "Advies, support en kennis om te weten"}, + object__object_type=self.object_type, + ) + ObjectRecordFactory.create(data={}, object__object_type=self.object_type) + + response = self.client.get( + self.url, {"data_attrs": "name__icontains__Advies, support en kennis"} + ) + + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + + self.assertEqual(len(data), 1) + self.assertEqual( + data[0]["url"], + f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", + ) + + def test_filter_two_icontains_with_comma(self): + """ + regression test for https://github.com/maykinmedia/objects-api/issues/472 + """ + record = ObjectRecordFactory.create( + data={"name": "Something important"}, object__object_type=self.object_type + ) + ObjectRecordFactory.create( + data={"name": "Advies, support en kennis om te weten"}, + object__object_type=self.object_type, + ) + ObjectRecordFactory.create(data={}, object__object_type=self.object_type) + + response = self.client.get( + self.url, + { + "data_attrs": "name__icontains__Advies, support en kennis,name__icontains__om" + }, + ) + + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + + self.assertEqual(len(data), 1) + self.assertEqual( + data[0]["url"], + f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", + ) + def test_filter_exclude_old_records(self): record_old = ObjectRecordFactory.create( data={"diameter": 45}, From 47bd81fdd5db734c673e95b31c3c0ac62a4ab178 Mon Sep 17 00:00:00 2001 From: Anna Shamray Date: Wed, 11 Dec 2024 17:07:14 +0100 Subject: [PATCH 2/8] :sparkles: [#472] add 'data_attr' query param --- src/objects/api/v2/filters.py | 116 ++++++++++++++++-------- src/objects/tests/v2/test_filters.py | 130 +++++++++++++++------------ src/objects/utils/filters.py | 22 +++++ 3 files changed, 175 insertions(+), 93 deletions(-) diff --git a/src/objects/api/v2/filters.py b/src/objects/api/v2/filters.py index 442dfa18..8af36773 100644 --- a/src/objects/api/v2/filters.py +++ b/src/objects/api/v2/filters.py @@ -1,6 +1,7 @@ from datetime import date as date_ from django import forms +from django.db.models import QuerySet from django.utils.translation import gettext_lazy as _ from django_filters import filters @@ -8,12 +9,51 @@ from vng_api_common.filtersets import FilterSet from objects.core.models import ObjectRecord, ObjectType -from objects.utils.filters import ObjectTypeFilter +from objects.utils.filters import ManyCharFilter, ObjectTypeFilter from ..constants import Operators from ..utils import display_choice_values_for_help_text, string_to_value from ..validators import validate_data_attrs +DATA_ATTR_VALUE_HELP_TEXT = f"""A valid parameter value has the form `key__operator__value`. +`key` is the attribute name, `operator` is the comparison operator to be used and `value` is the attribute value. +Note: Values can be string, numeric, or dates (ISO format; YYYY-MM-DD). + +Valid operator values are: +{display_choice_values_for_help_text(Operators)} + +`value` may not contain double underscore or comma characters. +`key` may not contain comma characters and includes double underscore only if it indicates nested attributes. + +""" + + +def filter_data_attr_value_part(value_part: str, queryset: QuerySet) -> QuerySet: + """ + filter one value part for data_attr and data_attrs filters + """ + variable, operator, str_value = value_part.rsplit("__", 2) + real_value = string_to_value(str_value) + + if operator == "exact": + # for exact operator try to filter on string and numeric values + in_vals = [str_value] + if real_value != str_value: + in_vals.append(real_value) + queryset = queryset.filter(**{f"data__{variable}__in": in_vals}) + elif operator == "icontains": + # icontains treats everything like strings + queryset = queryset.filter(**{f"data__{variable}__icontains": str_value}) + elif operator == "in": + # in must be a list + values = str_value.split("|") + queryset = queryset.filter(**{f"data__{variable}__in": values}) + + else: + # gt, gte, lt, lte operators + queryset = queryset.filter(**{f"data__{variable}__{operator}": real_value}) + return queryset + class ObjectRecordFilterForm(forms.Form): def clean(self): @@ -62,25 +102,46 @@ class ObjectRecordFilterSet(FilterSet): method="filter_data_attrs", validators=[validate_data_attrs], help_text=_( - """Only include objects that have attributes with certain values. + """**DEPRECATED**: Only include objects that have attributes with certain values. Data filtering expressions are comma-separated and are structured as follows: -A valid parameter value has the form `key__operator__value`. -`key` is the attribute name, `operator` is the comparison operator to be used and `value` is the attribute value. -Note: Values can be string, numeric, or dates (ISO format; YYYY-MM-DD). - -Valid operator values are: -%(operator_choices)s -`value` may not contain double underscore or comma characters. -`key` may not contain comma characters and includes double underscore only if it indicates nested attributes. +%(value_part_help_text)s Example: in order to display only objects with `height` equal to 100, query `data_attrs=height__exact__100` should be used. If `height` is nested inside `dimensions` attribute, query should look like `data_attrs=dimensions__height__exact__100` + +`value` may not contain comma, since commas are used as separator between filtering expressions. +If you want to use commas in `value` you can use `data_attr` query parameter. +""" + ) + % {"value_part_help_text": DATA_ATTR_VALUE_HELP_TEXT}, + ) + + data_attr = ManyCharFilter( + method="filter_data_attr", + # validators=[validate_data_attrs], + help_text=_( + """Only include objects that have attributes with certain values. + +%(value_part_help_text)s + +Example: in order to display only objects with `height` equal to 100, query `data_attr=height__exact__100` +should be used. If `height` is nested inside `dimensions` attribute, query should look like +`data_attr=dimensions__height__exact__100` + +This filter is very similar to the old `data_attrs` filter, but it has two differences: + +* `value` may contain commas +* only one filtering expression is allowed + +If you want to use several filtering expressions, just use this `data_attr` several times in the query string. +Example: `data_attr=height__exact__100&data_attr=naam__icontains__boom` """ ) - % {"operator_choices": display_choice_values_for_help_text(Operators)}, + % {"value_part_help_text": DATA_ATTR_VALUE_HELP_TEXT}, ) + data_icontains = filters.CharFilter( method="filter_data_icontains", help_text=_("Search in all `data` values of string properties."), @@ -88,37 +149,20 @@ class ObjectRecordFilterSet(FilterSet): class Meta: model = ObjectRecord - fields = ("type", "data_attrs", "date", "registrationDate") + fields = ("type", "data_attrs", "data_attr", "date", "registrationDate") form = ObjectRecordFilterForm def filter_data_attrs(self, queryset, name, value: str): parts = value.split(",") for value_part in parts: - variable, operator, str_value = value_part.rsplit("__", 2) - real_value = string_to_value(str_value) - - if operator == "exact": - # for exact operator try to filter on string and numeric values - in_vals = [str_value] - if real_value != value: - in_vals.append(real_value) - queryset = queryset.filter(**{f"data__{variable}__in": in_vals}) - elif operator == "icontains": - # icontains treats everything like strings - queryset = queryset.filter( - **{f"data__{variable}__icontains": str_value} - ) - elif operator == "in": - # in must be a list - values = str_value.split("|") - queryset = queryset.filter(**{f"data__{variable}__in": values}) - - else: - # gt, gte, lt, lte operators - queryset = queryset.filter( - **{f"data__{variable}__{operator}": real_value} - ) + queryset = filter_data_attr_value_part(value_part, queryset) + + return queryset + + def filter_data_attr(self, queryset, name, value: list): + for value_part in value: + queryset = filter_data_attr_value_part(value_part, queryset) return queryset diff --git a/src/objects/tests/v2/test_filters.py b/src/objects/tests/v2/test_filters.py index 339adbae..684b3da8 100644 --- a/src/objects/tests/v2/test_filters.py +++ b/src/objects/tests/v2/test_filters.py @@ -3,6 +3,7 @@ from django.db.utils import ProgrammingError +from furl import furl from rest_framework import status from rest_framework.test import APITestCase @@ -359,63 +360,6 @@ def test_filter_icontains_numeric(self): f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", ) - def test_filter_icontains_string_with_comma(self): - """ - regression test for https://github.com/maykinmedia/objects-api/issues/472 - """ - record = ObjectRecordFactory.create( - data={"name": "Something important"}, object__object_type=self.object_type - ) - ObjectRecordFactory.create( - data={"name": "Advies, support en kennis om te weten"}, - object__object_type=self.object_type, - ) - ObjectRecordFactory.create(data={}, object__object_type=self.object_type) - - response = self.client.get( - self.url, {"data_attrs": "name__icontains__Advies, support en kennis"} - ) - - self.assertEqual(response.status_code, status.HTTP_200_OK) - - data = response.json()["results"] - - self.assertEqual(len(data), 1) - self.assertEqual( - data[0]["url"], - f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", - ) - - def test_filter_two_icontains_with_comma(self): - """ - regression test for https://github.com/maykinmedia/objects-api/issues/472 - """ - record = ObjectRecordFactory.create( - data={"name": "Something important"}, object__object_type=self.object_type - ) - ObjectRecordFactory.create( - data={"name": "Advies, support en kennis om te weten"}, - object__object_type=self.object_type, - ) - ObjectRecordFactory.create(data={}, object__object_type=self.object_type) - - response = self.client.get( - self.url, - { - "data_attrs": "name__icontains__Advies, support en kennis,name__icontains__om" - }, - ) - - self.assertEqual(response.status_code, status.HTTP_200_OK) - - data = response.json()["results"] - - self.assertEqual(len(data), 1) - self.assertEqual( - data[0]["url"], - f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", - ) - def test_filter_exclude_old_records(self): record_old = ObjectRecordFactory.create( data={"diameter": 45}, @@ -485,6 +429,78 @@ def test_filter_in_string(self): ) +class FilterDataAttrTests(TokenAuthMixin, APITestCase): + url = reverse_lazy("object-list") + + @classmethod + def setUpTestData(cls): + super().setUpTestData() + + cls.object_type = ObjectTypeFactory(service__api_root=OBJECT_TYPES_API) + PermissionFactory.create( + object_type=cls.object_type, + mode=PermissionModes.read_only, + token_auth=cls.token_auth, + ) + + def test_filter_icontains_string_with_comma(self): + """ + regression test for https://github.com/maykinmedia/objects-api/issues/472 + """ + ObjectRecordFactory.create( + data={"name": "Something important"}, object__object_type=self.object_type + ) + record = ObjectRecordFactory.create( + data={"name": "Advies, support en kennis om te weten"}, + object__object_type=self.object_type, + ) + + response = self.client.get( + self.url, {"data_attr": "name__icontains__Advies, support en kennis"} + ) + + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + + self.assertEqual(len(data), 1) + self.assertEqual( + data[0]["url"], + f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", + ) + + def test_filter_two_icontains_with_comma(self): + """ + regression test for https://github.com/maykinmedia/objects-api/issues/472 + """ + ObjectRecordFactory.create( + data={"name": "Something important"}, object__object_type=self.object_type + ) + record = ObjectRecordFactory.create( + data={"name": "Advies, support en kennis om te weten"}, + object__object_type=self.object_type, + ) + url = ( + furl(self.url) + .add({"data_attr": "name__icontains__Advies, support en kennis"}) + .add({"data_attr": "name__icontains__om"}) + .url + ) + + response = self.client.get(url) + + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + + self.assertEqual(len(data), 1) + self.assertEqual( + data[0]["url"], + f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", + ) + + + class FilterDateTests(TokenAuthMixin, APITestCase): @classmethod def setUpTestData(cls): diff --git a/src/objects/utils/filters.py b/src/objects/utils/filters.py index 61364a6a..14555b76 100644 --- a/src/objects/utils/filters.py +++ b/src/objects/utils/filters.py @@ -1,3 +1,4 @@ +from django import forms from django.core.exceptions import ValidationError from django.utils.translation import gettext_lazy as _ @@ -48,3 +49,24 @@ def to_python(self, value): class ObjectTypeFilter(URLModelChoiceFilter): field_class = ObjectTypeField + + +class ManyWidget(forms.Widget): + def value_from_datadict(self, data, files, name): + return data.getlist(name) + + +class ManyCharField(forms.CharField): + widget = ManyWidget + + def to_python(self, value): + if not value: + return [] + + # todo validator if it's list + return value + + +class ManyCharFilter(filters.CharFilter): + # django-filter doesn't support several uses of the same query param out of the box + field_class = ManyCharField From 7eba5fd51ff13cb627f9ae8b07ea06e5ca33bfe6 Mon Sep 17 00:00:00 2001 From: Anna Shamray Date: Thu, 12 Dec 2024 14:40:45 +0100 Subject: [PATCH 3/8] :construction_worker: [#472] update OAS check GH workflow --- .github/workflows/oas-check.yml | 7 +------ 1 file changed, 1 insertion(+), 6 deletions(-) diff --git a/.github/workflows/oas-check.yml b/.github/workflows/oas-check.yml index 334ca86f..0df85f2d 100644 --- a/.github/workflows/oas-check.yml +++ b/.github/workflows/oas-check.yml @@ -12,13 +12,8 @@ on: jobs: open-api-workflow-check-oas: uses: maykinmedia/open-api-workflows/.github/workflows/oas-check.yml@v1 - strategy: - matrix: - version: - - v2 with: - schema-path: 'src/objects/api/${{ matrix.version }}/openapi.yaml' - schema-options: "--api-version ${{ matrix.version }}" + schema-path: 'src/objects/api/v2/openapi.yaml' python-version: '3.11' django-settings-module: 'objects.conf.ci' apt-packages: 'libgdal-dev gdal-bin' From 12635f310ad1f47a9199dc6b6df8fa6d0a9a1572 Mon Sep 17 00:00:00 2001 From: Anna Shamray Date: Thu, 12 Dec 2024 14:45:57 +0100 Subject: [PATCH 4/8] :memo: [#472] update OAS with 'data_attr' filter --- src/objects/api/v2/openapi.yaml | 88 +++++++++++++++++++++++++++++++-- 1 file changed, 85 insertions(+), 3 deletions(-) diff --git a/src/objects/api/v2/openapi.yaml b/src/objects/api/v2/openapi.yaml index a3274cbd..3d84125b 100644 --- a/src/objects/api/v2/openapi.yaml +++ b/src/objects/api/v2/openapi.yaml @@ -1,7 +1,7 @@ openapi: 3.0.3 info: title: Objects API - version: 2.4.3 (v2) + version: 2.4.3 description: | An API to manage Objects. @@ -89,12 +89,49 @@ paths: data. According to the GeoJSON spec, WGS84 is the default (EPSG: 4326 is the same as WGS84).' - in: query - name: data_attrs + name: data_attr schema: type: string description: | Only include objects that have attributes with certain values. + + A valid parameter value has the form `key__operator__value`. + `key` is the attribute name, `operator` is the comparison operator to be used and `value` is the attribute value. + Note: Values can be string, numeric, or dates (ISO format; YYYY-MM-DD). + + Valid operator values are: + * `exact` - equal to + * `gt` - greater than + * `gte` - greater than or equal to + * `lt` - lower than + * `lte` - lower than or equal to + * `icontains` - case-insensitive partial match + * `in` - in a list of values separated by `|` + + `value` may not contain double underscore or comma characters. + `key` may not contain comma characters and includes double underscore only if it indicates nested attributes. + + + + Example: in order to display only objects with `height` equal to 100, query `data_attr=height__exact__100` + should be used. If `height` is nested inside `dimensions` attribute, query should look like + `data_attr=dimensions__height__exact__100` + + This filter is very similar to the old `data_attrs` filter, but it has two differences: + + * `value` may contain commas + * only one filtering expression is allowed + + If you want to use several filtering expressions, just use this `data_attr` several times in the query string. + Example: `data_attr=height__exact__100&data_attr=naam__icontains__boom` + - in: query + name: data_attrs + schema: + type: string + description: | + **DEPRECATED**: Only include objects that have attributes with certain values. Data filtering expressions are comma-separated and are structured as follows: + A valid parameter value has the form `key__operator__value`. `key` is the attribute name, `operator` is the comparison operator to be used and `value` is the attribute value. Note: Values can be string, numeric, or dates (ISO format; YYYY-MM-DD). @@ -111,9 +148,14 @@ paths: `value` may not contain double underscore or comma characters. `key` may not contain comma characters and includes double underscore only if it indicates nested attributes. + + Example: in order to display only objects with `height` equal to 100, query `data_attrs=height__exact__100` should be used. If `height` is nested inside `dimensions` attribute, query should look like `data_attrs=dimensions__height__exact__100` + + `value` may not contain comma, since commas are used as separator between filtering expressions. + If you want to use commas in `value` you can use `data_attr` query parameter. - in: query name: data_icontains schema: @@ -620,8 +662,9 @@ paths: data_attrs: type: string description: | - Only include objects that have attributes with certain values. + **DEPRECATED**: Only include objects that have attributes with certain values. Data filtering expressions are comma-separated and are structured as follows: + A valid parameter value has the form `key__operator__value`. `key` is the attribute name, `operator` is the comparison operator to be used and `value` is the attribute value. Note: Values can be string, numeric, or dates (ISO format; YYYY-MM-DD). @@ -638,9 +681,48 @@ paths: `value` may not contain double underscore or comma characters. `key` may not contain comma characters and includes double underscore only if it indicates nested attributes. + + Example: in order to display only objects with `height` equal to 100, query `data_attrs=height__exact__100` should be used. If `height` is nested inside `dimensions` attribute, query should look like `data_attrs=dimensions__height__exact__100` + + `value` may not contain comma, since commas are used as separator between filtering expressions. + If you want to use commas in `value` you can use `data_attr` query parameter. + data_attr: + type: string + description: | + Only include objects that have attributes with certain values. + + A valid parameter value has the form `key__operator__value`. + `key` is the attribute name, `operator` is the comparison operator to be used and `value` is the attribute value. + Note: Values can be string, numeric, or dates (ISO format; YYYY-MM-DD). + + Valid operator values are: + * `exact` - equal to + * `gt` - greater than + * `gte` - greater than or equal to + * `lt` - lower than + * `lte` - lower than or equal to + * `icontains` - case-insensitive partial match + * `in` - in a list of values separated by `|` + + `value` may not contain double underscore or comma characters. + `key` may not contain comma characters and includes double underscore only if it indicates nested attributes. + + + + Example: in order to display only objects with `height` equal to 100, query `data_attr=height__exact__100` + should be used. If `height` is nested inside `dimensions` attribute, query should look like + `data_attr=dimensions__height__exact__100` + + This filter is very similar to the old `data_attrs` filter, but it has two differences: + + * `value` may contain commas + * only one filtering expression is allowed + + If you want to use several filtering expressions, just use this `data_attr` several times in the query string. + Example: `data_attr=height__exact__100&data_attr=naam__icontains__boom` date: type: string format: date From 3676052ed384a3b8b8fe894849efaa9c7f5f1340 Mon Sep 17 00:00:00 2001 From: Anna Shamray Date: Thu, 12 Dec 2024 14:46:44 +0100 Subject: [PATCH 5/8] :green_heart: [#472] fix new filter field widget --- src/objects/tests/v2/test_filters.py | 1 - src/objects/utils/filters.py | 4 ++++ 2 files changed, 4 insertions(+), 1 deletion(-) diff --git a/src/objects/tests/v2/test_filters.py b/src/objects/tests/v2/test_filters.py index 684b3da8..19c714fe 100644 --- a/src/objects/tests/v2/test_filters.py +++ b/src/objects/tests/v2/test_filters.py @@ -500,7 +500,6 @@ def test_filter_two_icontains_with_comma(self): ) - class FilterDateTests(TokenAuthMixin, APITestCase): @classmethod def setUpTestData(cls): diff --git a/src/objects/utils/filters.py b/src/objects/utils/filters.py index 14555b76..0f19187c 100644 --- a/src/objects/utils/filters.py +++ b/src/objects/utils/filters.py @@ -53,6 +53,9 @@ class ObjectTypeFilter(URLModelChoiceFilter): class ManyWidget(forms.Widget): def value_from_datadict(self, data, files, name): + if name not in data: + return [] + return data.getlist(name) @@ -69,4 +72,5 @@ def to_python(self, value): class ManyCharFilter(filters.CharFilter): # django-filter doesn't support several uses of the same query param out of the box + # so we need to do it ourselves field_class = ManyCharField From 052359f6e5de34157ddb12e8aa172d0f436c310d Mon Sep 17 00:00:00 2001 From: Anna Shamray Date: Thu, 12 Dec 2024 15:33:54 +0100 Subject: [PATCH 6/8] :sparkles: [#472] add validation for 'data_attr' filter --- src/objects/api/v2/filters.py | 7 +++-- src/objects/api/v2/openapi.yaml | 6 ++-- src/objects/api/validators.py | 56 +++++++++++++++++++++++---------- src/objects/utils/filters.py | 1 - 4 files changed, 47 insertions(+), 23 deletions(-) diff --git a/src/objects/api/v2/filters.py b/src/objects/api/v2/filters.py index 8af36773..f962787c 100644 --- a/src/objects/api/v2/filters.py +++ b/src/objects/api/v2/filters.py @@ -13,7 +13,7 @@ from ..constants import Operators from ..utils import display_choice_values_for_help_text, string_to_value -from ..validators import validate_data_attrs +from ..validators import validate_data_attr, validate_data_attrs DATA_ATTR_VALUE_HELP_TEXT = f"""A valid parameter value has the form `key__operator__value`. `key` is the attribute name, `operator` is the comparison operator to be used and `value` is the attribute value. @@ -102,7 +102,8 @@ class ObjectRecordFilterSet(FilterSet): method="filter_data_attrs", validators=[validate_data_attrs], help_text=_( - """**DEPRECATED**: Only include objects that have attributes with certain values. + """**DEPRECATED: Use 'data_attr' instead**. +Only include objects that have attributes with certain values. Data filtering expressions are comma-separated and are structured as follows: %(value_part_help_text)s @@ -120,7 +121,7 @@ class ObjectRecordFilterSet(FilterSet): data_attr = ManyCharFilter( method="filter_data_attr", - # validators=[validate_data_attrs], + validators=[validate_data_attr], help_text=_( """Only include objects that have attributes with certain values. diff --git a/src/objects/api/v2/openapi.yaml b/src/objects/api/v2/openapi.yaml index 3d84125b..13bd3b3b 100644 --- a/src/objects/api/v2/openapi.yaml +++ b/src/objects/api/v2/openapi.yaml @@ -129,7 +129,8 @@ paths: schema: type: string description: | - **DEPRECATED**: Only include objects that have attributes with certain values. + **DEPRECATED: Use 'data_attr' instead**. + Only include objects that have attributes with certain values. Data filtering expressions are comma-separated and are structured as follows: A valid parameter value has the form `key__operator__value`. @@ -662,7 +663,8 @@ paths: data_attrs: type: string description: | - **DEPRECATED**: Only include objects that have attributes with certain values. + **DEPRECATED: Use 'data_attr' instead**. + Only include objects that have attributes with certain values. Data filtering expressions are comma-separated and are structured as follows: A valid parameter value has the form `key__operator__value`. diff --git a/src/objects/api/validators.py b/src/objects/api/validators.py index 11b86567..68f25593 100644 --- a/src/objects/api/validators.py +++ b/src/objects/api/validators.py @@ -68,32 +68,54 @@ def __call__(self, new_value, serializer_field): raise serializers.ValidationError(self.message, code=self.code) +def validate_data_attr_value_part(value_part: str, code: str): + try: + variable, operator, val = value_part.rsplit("__", 2) + except ValueError: + message = _( + "Filter expression '%(value_part)s' doesn't have the shape 'key__operator__value'" + ) % {"value_part": value_part} + raise serializers.ValidationError(message, code=code) + + if operator not in Operators.values: + message = _("Comparison operator `%(operator)s` is unknown") % { + "operator": operator + } + raise serializers.ValidationError(message, code=code) + + if operator not in ( + Operators.exact, + Operators.icontains, + Operators.in_list, + ) and isinstance(string_to_value(val), str): + message = _( + "Operator `%(operator)s` supports only dates and/or numeric values" + ) % {"operator": operator} + raise serializers.ValidationError(message, code=code) + + def validate_data_attrs(value: str): + # todo remove when 'data_attrs' filter is removed code = "invalid-data-attrs-query" parts = value.split(",") for value_part in parts: - try: - variable, operator, val = value_part.rsplit("__", 2) - except ValueError as exc: - raise serializers.ValidationError(exc.args[0], code=code) from exc - - if operator not in Operators.values: - message = _("Comparison operator `%(operator)s` is unknown") % { - "operator": operator - } - raise serializers.ValidationError(message, code=code) + validate_data_attr_value_part(value_part, code) - if operator not in ( - Operators.exact, - Operators.icontains, - Operators.in_list, - ) and isinstance(string_to_value(val), str): + +def validate_data_attr(value: list): + code = "invalid-data-attr-query" + + for value_part in value: + # check that comma can be only in the value part + if "," in value_part.rsplit("__", 1)[0]: message = _( - "Operator `%(operator)s` supports only dates and/or numeric values" - ) % {"operator": operator} + "Filter expression '%(value_part)s' doesn't have the shape 'key__operator__value'" + ) % {"value_part": value_part} raise serializers.ValidationError(message, code=code) + validate_data_attr_value_part(value_part, code) + class GeometryValidator: code = "geometry-not-allowed" diff --git a/src/objects/utils/filters.py b/src/objects/utils/filters.py index 0f19187c..421c0a2c 100644 --- a/src/objects/utils/filters.py +++ b/src/objects/utils/filters.py @@ -66,7 +66,6 @@ def to_python(self, value): if not value: return [] - # todo validator if it's list return value From 2e3ac54700663c1a779d8e0b1390db0a1872c35b Mon Sep 17 00:00:00 2001 From: Anna Shamray Date: Thu, 12 Dec 2024 16:12:35 +0100 Subject: [PATCH 7/8] :white_check_mark: [#472] add more tests for 'data_attr' filter --- src/objects/tests/v2/test_filters.py | 321 ++++++++++++++++++++++++++- 1 file changed, 320 insertions(+), 1 deletion(-) diff --git a/src/objects/tests/v2/test_filters.py b/src/objects/tests/v2/test_filters.py index 19c714fe..9c3e2318 100644 --- a/src/objects/tests/v2/test_filters.py +++ b/src/objects/tests/v2/test_filters.py @@ -261,7 +261,10 @@ def test_filter_invalid_param(self): self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST) self.assertEqual( - response.json(), ["not enough values to unpack (expected 3, got 2)"] + response.json(), + [ + "Filter expression 'diameter__exact' doesn't have the shape 'key__operator__value'" + ], ) def test_filter_nested_attr(self): @@ -443,6 +446,308 @@ def setUpTestData(cls): token_auth=cls.token_auth, ) + def test_filter_exact_string(self): + record = ObjectRecordFactory.create( + data={"name": "demo"}, object__object_type=self.object_type + ) + ObjectRecordFactory.create( + data={"name": "demo2"}, object__object_type=self.object_type + ) + ObjectRecordFactory.create(data={}, object__object_type=self.object_type) + + response = self.client.get(self.url, {"data_attr": "name__exact__demo"}) + + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + + self.assertEqual(len(data), 1) + self.assertEqual( + data[0]["url"], + f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", + ) + + def test_filter_exact_number(self): + record = ObjectRecordFactory.create( + data={"diameter": 4}, object__object_type=self.object_type + ) + ObjectRecordFactory.create( + data={"diameter": 6}, object__object_type=self.object_type + ) + ObjectRecordFactory.create(data={}, object__object_type=self.object_type) + + response = self.client.get(self.url, {"data_attr": "diameter__exact__4"}) + + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + + self.assertEqual(len(data), 1) + self.assertEqual( + data[0]["url"], + f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", + ) + + def test_filter_exact_date(self): + record = ObjectRecordFactory.create( + data={"date": "2000-11-01"}, object__object_type=self.object_type + ) + + response = self.client.get(self.url, {"data_attr": "date__exact__2000-11-01"}) + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + self.assertEqual(len(data), 1) + self.assertEqual( + data[0]["url"], + f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", + ) + + def test_filter_lte(self): + record1 = ObjectRecordFactory.create( + data={"diameter": 4}, object__object_type=self.object_type + ) + record2 = ObjectRecordFactory.create( + data={"diameter": 5}, object__object_type=self.object_type + ) + ObjectRecordFactory.create( + data={"diameter": 6}, object__object_type=self.object_type + ) + ObjectRecordFactory.create(data={}, object__object_type=self.object_type) + + response = self.client.get(self.url, {"data_attr": "diameter__lte__5"}) + + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + data = sorted(data, key=lambda x: x["record"]["data"]["diameter"]) + + self.assertEqual(len(data), 2) + self.assertEqual( + data[0]["url"], + f"http://testserver{reverse('object-detail', args=[record1.object.uuid])}", + ) + self.assertEqual( + data[1]["url"], + f"http://testserver{reverse('object-detail', args=[record2.object.uuid])}", + ) + + def test_filter_lt(self): + record = ObjectRecordFactory.create( + data={"diameter": 4}, object__object_type=self.object_type + ) + ObjectRecordFactory.create( + data={"diameter": 5}, object__object_type=self.object_type + ) + ObjectRecordFactory.create( + data={"diameter": 6}, object__object_type=self.object_type + ) + ObjectRecordFactory.create(data={}, object__object_type=self.object_type) + + response = self.client.get(self.url, {"data_attr": "diameter__lt__5"}) + + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + + self.assertEqual(len(data), 1) + self.assertEqual( + data[0]["url"], + f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", + ) + + def test_filter_lte_not_numerical(self): + response = self.client.get(self.url, {"data_attr": "diameter__lt__value"}) + + self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST) + self.assertEqual( + response.json(), ["Operator `lt` supports only dates and/or numeric values"] + ) + + def test_filter_lte_date(self): + record = ObjectRecordFactory.create( + data={"date": "2000-11-01"}, object__object_type=self.object_type + ) + + response = self.client.get(self.url, {"data_attr": "date__lte__2000-12-01"}) + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + self.assertEqual(len(data), 1) + self.assertEqual( + data[0]["url"], + f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", + ) + + response = self.client.get(self.url, {"data_attr": "date__lte__2000-10-01"}) + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + self.assertEqual(len(data), 0) + + response = self.client.get(self.url, {"data_attr": "date__lte__2000-11-01"}) + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + self.assertEqual(len(data), 1) + self.assertEqual( + data[0]["url"], + f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", + ) + + def test_filter_invalid_operator(self): + response = self.client.get(self.url, {"data_attr": "diameter__not__value"}) + + self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST) + self.assertEqual(response.json(), ["Comparison operator `not` is unknown"]) + + def test_filter_invalid_param(self): + response = self.client.get(self.url, {"data_attr": "diameter__exact"}) + + self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST) + self.assertEqual( + response.json(), + [ + "Filter expression 'diameter__exact' doesn't have the shape 'key__operator__value'" + ], + ) + + def test_filter_nested_attr(self): + record = ObjectRecordFactory.create( + data={"dimensions": {"diameter": 4}}, object__object_type=self.object_type + ) + ObjectRecordFactory.create( + data={"dimensions": {"diameter": 5}}, object__object_type=self.object_type + ) + ObjectRecordFactory.create( + data={"diameter": 4}, object__object_type=self.object_type + ) + ObjectRecordFactory.create(data={}, object__object_type=self.object_type) + + response = self.client.get( + self.url, {"data_attr": "dimensions__diameter__exact__4"} + ) + + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + + self.assertEqual(len(data), 1) + self.assertEqual( + data[0]["url"], + f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", + ) + + def test_filter_icontains_string(self): + record = ObjectRecordFactory.create( + data={"name": "Something important"}, object__object_type=self.object_type + ) + ObjectRecordFactory.create( + data={"name": "Nothing important"}, object__object_type=self.object_type + ) + ObjectRecordFactory.create(data={}, object__object_type=self.object_type) + + response = self.client.get(self.url, {"data_attr": "name__icontains__some"}) + + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + + self.assertEqual(len(data), 1) + self.assertEqual( + data[0]["url"], + f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", + ) + + def test_filter_icontains_numeric(self): + record = ObjectRecordFactory.create( + data={"diameter": 45}, object__object_type=self.object_type + ) + ObjectRecordFactory.create( + data={"diameter": 6}, object__object_type=self.object_type + ) + ObjectRecordFactory.create(data={}, object__object_type=self.object_type) + + response = self.client.get(self.url, {"data_attr": "diameter__icontains__4"}) + + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + + self.assertEqual(len(data), 1) + self.assertEqual( + data[0]["url"], + f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", + ) + + def test_filter_exclude_old_records(self): + record_old = ObjectRecordFactory.create( + data={"diameter": 45}, + object__object_type=self.object_type, + start_at=date.today() - timedelta(days=10), + end_at=date.today() - timedelta(days=1), + ) + ObjectRecordFactory.create( + data={"diameter": 50}, object=record_old.object, start_at=record_old.end_at + ) + + response = self.client.get(self.url, {"data_attr": "diameter__exact__45"}) + + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + self.assertEqual(len(data), 0) + + def test_filter_date_field_gte(self): + ObjectRecordFactory.create( + data={"dateField": "2000-10-10"}, object__object_type=self.object_type + ) + + response = self.client.get( + self.url, {"data_attr": "dateField__gte__2000-10-10"} + ) + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + + self.assertEqual(len(data), 1) + + response = self.client.get( + self.url, {"data_attr": "dateField__gte__2000-10-11"} + ) + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + + self.assertEqual(len(data), 0) + + def test_filter_in_string(self): + record = ObjectRecordFactory.create( + data={"name": "demo1"}, object__object_type=self.object_type + ) + record2 = ObjectRecordFactory.create( + data={"name": "demo2"}, object__object_type=self.object_type + ) + ObjectRecordFactory.create( + data={"name": "demo3"}, object__object_type=self.object_type + ) + + response = self.client.get(self.url, {"data_attr": "name__in__demo1|demo2"}) + + self.assertEqual(response.status_code, status.HTTP_200_OK) + + data = response.json()["results"] + + self.assertEqual(len(data), 2) + self.assertEqual( + data[0]["url"], + f"http://testserver{reverse('object-detail', args=[record2.object.uuid])}", + ) + self.assertEqual( + data[1]["url"], + f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", + ) + def test_filter_icontains_string_with_comma(self): """ regression test for https://github.com/maykinmedia/objects-api/issues/472 @@ -499,6 +804,20 @@ def test_filter_two_icontains_with_comma(self): f"http://testserver{reverse('object-detail', args=[record.object.uuid])}", ) + def test_filter_comma_separated_invalid(self): + response = self.client.get( + self.url, {"data_attr": "dimensions__diameter__exact__4,name__exact__demo"} + ) + + self.assertEqual(response.status_code, status.HTTP_400_BAD_REQUEST) + self.assertEqual( + response.json(), + [ + "Filter expression 'dimensions__diameter__exact__4,name__exact__demo' " + "doesn't have the shape 'key__operator__value'" + ], + ) + class FilterDateTests(TokenAuthMixin, APITestCase): @classmethod From 5ee5e7e0e480d37c7b370d345e90be652b523ca6 Mon Sep 17 00:00:00 2001 From: Anna Shamray Date: Wed, 18 Dec 2024 17:52:37 +0100 Subject: [PATCH 8/8] :ok_hand: [#472] process PR feedback --- src/objects/api/v2/filters.py | 79 ++++++++++++++++------------ src/objects/api/v2/openapi.yaml | 2 + src/objects/api/v2/views.py | 31 +++++++++-- src/objects/api/validators.py | 3 +- src/objects/tests/v2/test_filters.py | 7 ++- 5 files changed, 81 insertions(+), 41 deletions(-) diff --git a/src/objects/api/v2/filters.py b/src/objects/api/v2/filters.py index f962787c..6ed36484 100644 --- a/src/objects/api/v2/filters.py +++ b/src/objects/api/v2/filters.py @@ -27,6 +27,47 @@ """ +DATA_ATTRS_HELP_TEXT = ( + _( + """**DEPRECATED: Use 'data_attr' instead**. +Only include objects that have attributes with certain values. +Data filtering expressions are comma-separated and are structured as follows: + +%(value_part_help_text)s + +Example: in order to display only objects with `height` equal to 100, query `data_attrs=height__exact__100` +should be used. If `height` is nested inside `dimensions` attribute, query should look like +`data_attrs=dimensions__height__exact__100` + +`value` may not contain comma, since commas are used as separator between filtering expressions. +If you want to use commas in `value` you can use `data_attr` query parameter. +""" + ) + % {"value_part_help_text": DATA_ATTR_VALUE_HELP_TEXT} +) + +DATA_ATTR_HELP_TEXT = ( + _( + """Only include objects that have attributes with certain values. + +%(value_part_help_text)s + +Example: in order to display only objects with `height` equal to 100, query `data_attr=height__exact__100` +should be used. If `height` is nested inside `dimensions` attribute, query should look like +`data_attr=dimensions__height__exact__100` + +This filter is very similar to the old `data_attrs` filter, but it has two differences: + +* `value` may contain commas +* only one filtering expression is allowed + +If you want to use several filtering expressions, just use this `data_attr` several times in the query string. +Example: `data_attr=height__exact__100&data_attr=naam__icontains__boom` +""" + ) + % {"value_part_help_text": DATA_ATTR_VALUE_HELP_TEXT} +) + def filter_data_attr_value_part(value_part: str, queryset: QuerySet) -> QuerySet: """ @@ -98,49 +139,17 @@ class ObjectRecordFilterSet(FilterSet): "date would be between `registrationAt` attributes of different records" ), ) + data_attrs = filters.CharFilter( method="filter_data_attrs", validators=[validate_data_attrs], - help_text=_( - """**DEPRECATED: Use 'data_attr' instead**. -Only include objects that have attributes with certain values. -Data filtering expressions are comma-separated and are structured as follows: - -%(value_part_help_text)s - -Example: in order to display only objects with `height` equal to 100, query `data_attrs=height__exact__100` -should be used. If `height` is nested inside `dimensions` attribute, query should look like -`data_attrs=dimensions__height__exact__100` - -`value` may not contain comma, since commas are used as separator between filtering expressions. -If you want to use commas in `value` you can use `data_attr` query parameter. -""" - ) - % {"value_part_help_text": DATA_ATTR_VALUE_HELP_TEXT}, + help_text=DATA_ATTRS_HELP_TEXT, ) data_attr = ManyCharFilter( method="filter_data_attr", validators=[validate_data_attr], - help_text=_( - """Only include objects that have attributes with certain values. - -%(value_part_help_text)s - -Example: in order to display only objects with `height` equal to 100, query `data_attr=height__exact__100` -should be used. If `height` is nested inside `dimensions` attribute, query should look like -`data_attr=dimensions__height__exact__100` - -This filter is very similar to the old `data_attrs` filter, but it has two differences: - -* `value` may contain commas -* only one filtering expression is allowed - -If you want to use several filtering expressions, just use this `data_attr` several times in the query string. -Example: `data_attr=height__exact__100&data_attr=naam__icontains__boom` -""" - ) - % {"value_part_help_text": DATA_ATTR_VALUE_HELP_TEXT}, + help_text=DATA_ATTR_HELP_TEXT, ) data_icontains = filters.CharFilter( diff --git a/src/objects/api/v2/openapi.yaml b/src/objects/api/v2/openapi.yaml index 13bd3b3b..7fa40c26 100644 --- a/src/objects/api/v2/openapi.yaml +++ b/src/objects/api/v2/openapi.yaml @@ -124,6 +124,7 @@ paths: If you want to use several filtering expressions, just use this `data_attr` several times in the query string. Example: `data_attr=height__exact__100&data_attr=naam__icontains__boom` + explode: true - in: query name: data_attrs schema: @@ -157,6 +158,7 @@ paths: `value` may not contain comma, since commas are used as separator between filtering expressions. If you want to use commas in `value` you can use `data_attr` query parameter. + deprecated: true - in: query name: data_icontains schema: diff --git a/src/objects/api/v2/views.py b/src/objects/api/v2/views.py index 9a73f420..ab2e4245 100644 --- a/src/objects/api/v2/views.py +++ b/src/objects/api/v2/views.py @@ -4,8 +4,12 @@ from django.db import models from django.utils.dateparse import parse_date -from drf_spectacular.types import OpenApiTypes -from drf_spectacular.utils import OpenApiParameter, extend_schema, extend_schema_view +from drf_spectacular.utils import ( + OpenApiParameter, + OpenApiTypes, + extend_schema, + extend_schema_view, +) from rest_framework import mixins, viewsets from rest_framework.decorators import action from rest_framework.generics import get_object_or_404 @@ -28,13 +32,32 @@ PermissionSerializer, ) from ..utils import is_date -from .filters import ObjectRecordFilterSet +from .filters import DATA_ATTR_HELP_TEXT, DATA_ATTRS_HELP_TEXT, ObjectRecordFilterSet + +# manually override OAS because of "deprecated" attribute +data_attrs_parameter = OpenApiParameter( + name="data_attrs", + type=OpenApiTypes.STR, + location=OpenApiParameter.QUERY, + description=DATA_ATTRS_HELP_TEXT, + deprecated=True, +) + +# manually override OAS because of "explode" attribute +data_attr_parameter = OpenApiParameter( + name="data_attr", + location=OpenApiParameter.QUERY, + type=OpenApiTypes.STR, + description=DATA_ATTR_HELP_TEXT, + explode=True, +) @extend_schema_view( list=extend_schema( description="Retrieve a list of OBJECTs and their actual RECORD. " - "The actual record is defined as if the query parameter `date=` was given." + "The actual record is defined as if the query parameter `date=` was given.", + parameters=[data_attrs_parameter, data_attr_parameter], ), retrieve=extend_schema( description="Retrieve a single OBJECT and its actual RECORD. " diff --git a/src/objects/api/validators.py b/src/objects/api/validators.py index 68f25593..f0d49797 100644 --- a/src/objects/api/validators.py +++ b/src/objects/api/validators.py @@ -110,7 +110,8 @@ def validate_data_attr(value: list): # check that comma can be only in the value part if "," in value_part.rsplit("__", 1)[0]: message = _( - "Filter expression '%(value_part)s' doesn't have the shape 'key__operator__value'" + "Filter expression '%(value_part)s' must have the shape 'key__operator__value', " + "commas can only be present in the 'value'" ) % {"value_part": value_part} raise serializers.ValidationError(message, code=code) diff --git a/src/objects/tests/v2/test_filters.py b/src/objects/tests/v2/test_filters.py index 9c3e2318..4b30c381 100644 --- a/src/objects/tests/v2/test_filters.py +++ b/src/objects/tests/v2/test_filters.py @@ -492,6 +492,10 @@ def test_filter_exact_date(self): record = ObjectRecordFactory.create( data={"date": "2000-11-01"}, object__object_type=self.object_type ) + ObjectRecordFactory.create( + data={"date": "2020-11-01"}, object__object_type=self.object_type + ) + ObjectRecordFactory.create(data={}, object__object_type=self.object_type) response = self.client.get(self.url, {"data_attr": "date__exact__2000-11-01"}) self.assertEqual(response.status_code, status.HTTP_200_OK) @@ -814,7 +818,8 @@ def test_filter_comma_separated_invalid(self): response.json(), [ "Filter expression 'dimensions__diameter__exact__4,name__exact__demo' " - "doesn't have the shape 'key__operator__value'" + "must have the shape 'key__operator__value', commas can only be present in " + "the 'value'" ], )