diff --git a/.env-devel b/.env-devel index 32facad8357..7703fa8082a 100644 --- a/.env-devel +++ b/.env-devel @@ -90,8 +90,8 @@ EFS_GROUP_NAME=efs-group EFS_DNS_NAME=fs-xxx.efs.us-east-1.amazonaws.com EFS_MOUNTED_PATH=/tmp/efs EFS_PROJECT_SPECIFIC_DATA_DIRECTORY=project-specific-data -EFS_ONLY_ENABLED_FOR_USERIDS=[] EFS_GUARDIAN_TRACING={} +EFS_DEFAULT_USER_SERVICE_SIZE_BYTES=10000 # DATCORE_ADAPTER DATCORE_ADAPTER_TRACING={} diff --git a/packages/settings-library/src/settings_library/efs.py b/packages/settings-library/src/settings_library/efs.py index 34c48f9dca6..d8ad2b7395d 100644 --- a/packages/settings-library/src/settings_library/efs.py +++ b/packages/settings-library/src/settings_library/efs.py @@ -14,10 +14,6 @@ class AwsEfsSettings(BaseCustomSettings): EFS_MOUNTED_PATH: Path = Field( description="This is the path where EFS is mounted to the EC2 machine", ) - EFS_ONLY_ENABLED_FOR_USERIDS: list[int] = Field( - description="This is temporary solution so we can enable it for specific users for testing purpose", - examples=[[1]], - ) NFS_PROTOCOL = "4.1" diff --git a/services/clusters-keeper/src/simcore_service_clusters_keeper/core/settings.py b/services/clusters-keeper/src/simcore_service_clusters_keeper/core/settings.py index 3e85015ee4a..c4f656c68fb 100644 --- a/services/clusters-keeper/src/simcore_service_clusters_keeper/core/settings.py +++ b/services/clusters-keeper/src/simcore_service_clusters_keeper/core/settings.py @@ -381,15 +381,6 @@ def LOG_LEVEL(self) -> LogLevel: # noqa: N802 def _valid_log_level(cls, value: str) -> str: return cls.validate_log_level(value) - @field_validator("SERVICE_TRACKING_HEARTBEAT", mode="before") - @classmethod - def _validate_interval( - cls, value: str | datetime.timedelta - ) -> int | datetime.timedelta: - if isinstance(value, str): - return int(value) - return value - def get_application_settings(app: FastAPI) -> ApplicationSettings: return cast(ApplicationSettings, app.state.settings) diff --git a/services/clusters-keeper/tests/unit/test_modules_clusters_management_core.py b/services/clusters-keeper/tests/unit/test_modules_clusters_management_core.py index 438e69ee72e..d06a6aaeedd 100644 --- a/services/clusters-keeper/tests/unit/test_modules_clusters_management_core.py +++ b/services/clusters-keeper/tests/unit/test_modules_clusters_management_core.py @@ -4,6 +4,7 @@ import asyncio import dataclasses +import datetime from collections.abc import Awaitable, Callable from typing import Final from unittest.mock import MagicMock @@ -36,7 +37,9 @@ def wallet_id(faker: Faker, request: pytest.FixtureRequest) -> WalletID | None: return faker.pyint(min_value=1) if request.param == "with_wallet" else None -_FAST_TIME_BEFORE_TERMINATION_SECONDS: Final[int] = 10 +_FAST_TIME_BEFORE_TERMINATION_SECONDS: Final[datetime.timedelta] = datetime.timedelta( + seconds=10 +) @pytest.fixture @@ -149,7 +152,7 @@ async def test_cluster_management_core_properly_removes_unused_instances( mocked_dask_ping_scheduler.is_scheduler_busy.reset_mock() # running the cluster management task after the heartbeat came in shall not remove anything - await asyncio.sleep(_FAST_TIME_BEFORE_TERMINATION_SECONDS + 1) + await asyncio.sleep(_FAST_TIME_BEFORE_TERMINATION_SECONDS.total_seconds() + 1) await cluster_heartbeat(initialized_app, user_id=user_id, wallet_id=wallet_id) await check_clusters(initialized_app) await _assert_cluster_exist_and_state( @@ -161,7 +164,7 @@ async def test_cluster_management_core_properly_removes_unused_instances( mocked_dask_ping_scheduler.is_scheduler_busy.reset_mock() # after waiting the termination time, running the task shall remove the cluster - await asyncio.sleep(_FAST_TIME_BEFORE_TERMINATION_SECONDS + 1) + await asyncio.sleep(_FAST_TIME_BEFORE_TERMINATION_SECONDS.total_seconds() + 1) await check_clusters(initialized_app) await _assert_cluster_exist_and_state( ec2_client, instances=created_clusters, state="terminated" @@ -201,7 +204,7 @@ async def test_cluster_management_core_properly_removes_workers_on_shutdown( ec2_client, instance_ids=worker_instance_ids, state="running" ) # after waiting the termination time, running the task shall remove the cluster - await asyncio.sleep(_FAST_TIME_BEFORE_TERMINATION_SECONDS + 1) + await asyncio.sleep(_FAST_TIME_BEFORE_TERMINATION_SECONDS.total_seconds() + 1) await check_clusters(initialized_app) await _assert_cluster_exist_and_state( ec2_client, instances=created_clusters, state="terminated" @@ -314,7 +317,7 @@ async def test_cluster_management_core_removes_broken_clusters_after_some_delay( mocked_dask_ping_scheduler.is_scheduler_busy.reset_mock() # waiting for the termination time will now terminate the cluster - await asyncio.sleep(_FAST_TIME_BEFORE_TERMINATION_SECONDS + 1) + await asyncio.sleep(_FAST_TIME_BEFORE_TERMINATION_SECONDS.total_seconds() + 1) await check_clusters(initialized_app) await _assert_cluster_exist_and_state( ec2_client, instances=created_clusters, state="terminated" diff --git a/services/director-v2/src/simcore_service_director_v2/modules/comp_scheduler/_scheduler_base.py b/services/director-v2/src/simcore_service_director_v2/modules/comp_scheduler/_scheduler_base.py index a16821d0fba..d8fdccc1663 100644 --- a/services/director-v2/src/simcore_service_director_v2/modules/comp_scheduler/_scheduler_base.py +++ b/services/director-v2/src/simcore_service_director_v2/modules/comp_scheduler/_scheduler_base.py @@ -540,11 +540,7 @@ async def apply( project_id: ProjectID, iteration: Iteration, ) -> None: - """schedules a pipeline for a given user, project and iteration. - - Arguments: - wake_up_callback -- a callback function that is called in a separate thread everytime a pipeline node is completed - """ + """apply the scheduling of a pipeline for a given user, project and iteration.""" with log_context( _logger, level=logging.INFO, diff --git a/services/director-v2/src/simcore_service_director_v2/modules/db/repositories/comp_runs.py b/services/director-v2/src/simcore_service_director_v2/modules/db/repositories/comp_runs.py index b746407a8aa..13e01a4276f 100644 --- a/services/director-v2/src/simcore_service_director_v2/modules/db/repositories/comp_runs.py +++ b/services/director-v2/src/simcore_service_director_v2/modules/db/repositories/comp_runs.py @@ -143,7 +143,9 @@ async def list( return [ CompRunsAtDB.model_validate(row) async for row in conn.execute( - sa.select(comp_runs).where(sa.and_(*conditions)) + sa.select(comp_runs).where( + sa.and_(True, *conditions) # noqa: FBT003 + ) ) ] diff --git a/services/director-v2/src/simcore_service_director_v2/modules/db/repositories/comp_tasks/_utils.py b/services/director-v2/src/simcore_service_director_v2/modules/db/repositories/comp_tasks/_utils.py index 51082b698f1..c5fd0819fcd 100644 --- a/services/director-v2/src/simcore_service_director_v2/modules/db/repositories/comp_tasks/_utils.py +++ b/services/director-v2/src/simcore_service_director_v2/modules/db/repositories/comp_tasks/_utils.py @@ -89,9 +89,7 @@ async def _get_service_details( node.version, product_name, ) - obj: ServiceMetaDataPublished = ServiceMetaDataPublished.model_construct( - **service_details - ) + obj: ServiceMetaDataPublished = ServiceMetaDataPublished(**service_details) return obj @@ -105,7 +103,7 @@ def _compute_node_requirements( node_defined_resources[resource_name] = node_defined_resources.get( resource_name, 0 ) + min(resource_value.limit, resource_value.reservation) - return NodeRequirements.model_validate(node_defined_resources) + return NodeRequirements(**node_defined_resources) def _compute_node_boot_mode(node_resources: ServiceResourcesDict) -> BootMode: @@ -146,12 +144,12 @@ async def _get_node_infos( None, ) - result: tuple[ServiceMetaDataPublished, ServiceExtras, SimcoreServiceLabels] = ( - await asyncio.gather( - _get_service_details(catalog_client, user_id, product_name, node), - director_client.get_service_extras(node.key, node.version), - director_client.get_service_labels(node), - ) + result: tuple[ + ServiceMetaDataPublished, ServiceExtras, SimcoreServiceLabels + ] = await asyncio.gather( + _get_service_details(catalog_client, user_id, product_name, node), + director_client.get_service_extras(node.key, node.version), + director_client.get_service_labels(node), ) return result @@ -189,7 +187,7 @@ async def _generate_task_image( data.update(envs=_compute_node_envs(node_labels)) if node_extras and node_extras.container_spec: data.update(command=node_extras.container_spec.command) - return Image.model_validate(data) + return Image(**data) async def _get_pricing_and_hardware_infos( @@ -247,9 +245,9 @@ async def _get_pricing_and_hardware_infos( return pricing_info, hardware_info -_RAM_SAFE_MARGIN_RATIO: Final[float] = ( - 0.1 # NOTE: machines always have less available RAM than advertised -) +_RAM_SAFE_MARGIN_RATIO: Final[ + float +] = 0.1 # NOTE: machines always have less available RAM than advertised _CPUS_SAFE_MARGIN: Final[float] = 0.1 @@ -267,11 +265,11 @@ async def _update_project_node_resources_from_hardware_info( if not hardware_info.aws_ec2_instances: return try: - unordered_list_ec2_instance_types: list[EC2InstanceTypeGet] = ( - await get_instance_type_details( - rabbitmq_rpc_client, - instance_type_names=set(hardware_info.aws_ec2_instances), - ) + unordered_list_ec2_instance_types: list[ + EC2InstanceTypeGet + ] = await get_instance_type_details( + rabbitmq_rpc_client, + instance_type_names=set(hardware_info.aws_ec2_instances), ) assert unordered_list_ec2_instance_types # nosec @@ -347,7 +345,7 @@ async def generate_tasks_list_from_project( list_comp_tasks = [] unique_service_key_versions: set[ServiceKeyVersion] = { - ServiceKeyVersion.model_construct( + ServiceKeyVersion( key=node.key, version=node.version ) # the service key version is frozen for node in project.workbench.values() @@ -366,9 +364,7 @@ async def generate_tasks_list_from_project( for internal_id, node_id in enumerate(project.workbench, 1): node: Node = project.workbench[node_id] - node_key_version = ServiceKeyVersion.model_construct( - key=node.key, version=node.version - ) + node_key_version = ServiceKeyVersion(key=node.key, version=node.version) node_details, node_extras, node_labels = key_version_to_node_infos.get( node_key_version, (None, None, None), @@ -434,8 +430,8 @@ async def generate_tasks_list_from_project( task_db = CompTaskAtDB( project_id=project.uuid, node_id=NodeID(node_id), - schema=NodeSchema.model_validate( - node_details.model_dump( + schema=NodeSchema( + **node_details.model_dump( exclude_unset=True, by_alias=True, include={"inputs", "outputs"} ) ), diff --git a/services/director-v2/tests/unit/with_dbs/test_api_route_computations.py b/services/director-v2/tests/unit/with_dbs/comp_scheduler/test_api_route_computations.py similarity index 99% rename from services/director-v2/tests/unit/with_dbs/test_api_route_computations.py rename to services/director-v2/tests/unit/with_dbs/comp_scheduler/test_api_route_computations.py index 2e75b18c009..4381c9311d4 100644 --- a/services/director-v2/tests/unit/with_dbs/test_api_route_computations.py +++ b/services/director-v2/tests/unit/with_dbs/comp_scheduler/test_api_route_computations.py @@ -88,6 +88,8 @@ def minimal_configuration( redis_service: RedisSettings, monkeypatch: pytest.MonkeyPatch, faker: Faker, + with_disabled_auto_scheduling: mock.Mock, + with_disabled_scheduler_publisher: mock.Mock, ): monkeypatch.setenv("DIRECTOR_V2_DYNAMIC_SIDECAR_ENABLED", "false") monkeypatch.setenv("COMPUTATIONAL_BACKEND_DASK_CLIENT_ENABLED", "1") @@ -588,11 +590,7 @@ async def test_create_computation_with_wallet( @pytest.mark.parametrize( "default_pricing_plan", - [ - PricingPlanGet.model_construct( - **PricingPlanGet.model_config["json_schema_extra"]["examples"][0] - ) - ], + [PricingPlanGet(**PricingPlanGet.model_config["json_schema_extra"]["examples"][0])], ) async def test_create_computation_with_wallet_with_invalid_pricing_unit_name_raises_422( minimal_configuration: None, @@ -631,7 +629,7 @@ async def test_create_computation_with_wallet_with_invalid_pricing_unit_name_rai @pytest.mark.parametrize( "default_pricing_plan", [ - PricingPlanGet.model_construct( + PricingPlanGet( **PricingPlanGet.model_config["json_schema_extra"]["examples"][0] # type: ignore ) ], diff --git a/services/director-v2/tests/unit/with_dbs/test_api_route_computations_tasks.py b/services/director-v2/tests/unit/with_dbs/comp_scheduler/test_api_route_computations_tasks.py similarity index 100% rename from services/director-v2/tests/unit/with_dbs/test_api_route_computations_tasks.py rename to services/director-v2/tests/unit/with_dbs/comp_scheduler/test_api_route_computations_tasks.py diff --git a/services/director-v2/tests/unit/with_dbs/comp_scheduler/test_scheduler_dask.py b/services/director-v2/tests/unit/with_dbs/comp_scheduler/test_scheduler_dask.py index f6a041b934e..7609f6e956e 100644 --- a/services/director-v2/tests/unit/with_dbs/comp_scheduler/test_scheduler_dask.py +++ b/services/director-v2/tests/unit/with_dbs/comp_scheduler/test_scheduler_dask.py @@ -1606,7 +1606,9 @@ async def _return_random_task_result(job_id) -> TaskOutputData: @pytest.fixture def with_fast_service_heartbeat_s(monkeypatch: pytest.MonkeyPatch) -> int: seconds = 1 - monkeypatch.setenv("SERVICE_TRACKING_HEARTBEAT", f"{seconds}") + monkeypatch.setenv( + "SERVICE_TRACKING_HEARTBEAT", f"{datetime.timedelta(seconds=seconds)}" + ) return seconds diff --git a/services/director-v2/tests/unit/with_dbs/conftest.py b/services/director-v2/tests/unit/with_dbs/conftest.py index ee8259f9f5b..56784acba13 100644 --- a/services/director-v2/tests/unit/with_dbs/conftest.py +++ b/services/director-v2/tests/unit/with_dbs/conftest.py @@ -278,9 +278,9 @@ async def _(user: dict[str, Any], **cluster_kwargs) -> Cluster: .where(clusters.c.id == created_cluster.id) ): access_rights_in_db[row.gid] = { - "read": row[cluster_to_groups.c.read], - "write": row[cluster_to_groups.c.write], - "delete": row[cluster_to_groups.c.delete], + "read": row.read, + "write": row.write, + "delete": row.delete, } return Cluster( diff --git a/services/docker-compose.yml b/services/docker-compose.yml index e31261ca20c..691e544b0c0 100644 --- a/services/docker-compose.yml +++ b/services/docker-compose.yml @@ -345,7 +345,6 @@ services: EFS_DNS_NAME: ${EFS_DNS_NAME} EFS_MOUNTED_PATH: ${EFS_MOUNTED_PATH} - EFS_ONLY_ENABLED_FOR_USERIDS: ${EFS_ONLY_ENABLED_FOR_USERIDS} EFS_PROJECT_SPECIFIC_DATA_DIRECTORY: ${EFS_PROJECT_SPECIFIC_DATA_DIRECTORY} RABBIT_HOST: ${RABBIT_HOST} @@ -433,8 +432,8 @@ services: EFS_GROUP_ID: ${EFS_GROUP_ID} EFS_GROUP_NAME: ${EFS_GROUP_NAME} EFS_DNS_NAME: ${EFS_DNS_NAME} + EFS_DEFAULT_USER_SERVICE_SIZE_BYTES: ${EFS_DEFAULT_USER_SERVICE_SIZE_BYTES} EFS_MOUNTED_PATH: ${EFS_MOUNTED_PATH} - EFS_ONLY_ENABLED_FOR_USERIDS: ${EFS_ONLY_ENABLED_FOR_USERIDS} EFS_PROJECT_SPECIFIC_DATA_DIRECTORY: ${EFS_PROJECT_SPECIFIC_DATA_DIRECTORY} EFS_GUARDIAN_TRACING: ${EFS_GUARDIAN_TRACING} TRACING_OPENTELEMETRY_COLLECTOR_ENDPOINT: ${TRACING_OPENTELEMETRY_COLLECTOR_ENDPOINT} diff --git a/services/efs-guardian/tests/conftest.py b/services/efs-guardian/tests/conftest.py index 260e5a74026..96585f4c87b 100644 --- a/services/efs-guardian/tests/conftest.py +++ b/services/efs-guardian/tests/conftest.py @@ -72,7 +72,6 @@ def app_environment( "EFS_DNS_NAME": "fs-xxx.efs.us-east-1.amazonaws.com", "EFS_MOUNTED_PATH": "/tmp/efs", "EFS_PROJECT_SPECIFIC_DATA_DIRECTORY": "project-specific-data", - "EFS_ONLY_ENABLED_FOR_USERIDS": "[]", "EFS_GUARDIAN_TRACING": "null", "SC_USER_ID": "8004", "SC_USER_NAME": "scu",