From 03406036275b9e692bd1a64ee4a7026e31764541 Mon Sep 17 00:00:00 2001 From: Hasan Ramezani Date: Tue, 3 Dec 2024 14:23:27 +0100 Subject: [PATCH 1/3] Improve field value parsing by adding `NoDecode` and `ForceDecode` annotations --- docs/index.md | 82 +++++++++++++++++++++++++++++++++++ pydantic_settings/__init__.py | 4 ++ pydantic_settings/main.py | 2 + pydantic_settings/sources.py | 14 ++++++ tests/test_settings.py | 70 ++++++++++++++++++++++++++++++ 5 files changed, 172 insertions(+) diff --git a/docs/index.md b/docs/index.md index 5e02981..425522f 100644 --- a/docs/index.md +++ b/docs/index.md @@ -371,6 +371,88 @@ print(Settings().model_dump()) #> {'numbers': [1, 2, 3]} ``` +### Disabling JSON parsing + +pydatnic-settings by default parses complex types from environment variables as JSON strings. If you want to disable +this behavior for a field and parse the value by your own, you can annotate the field with `NoDecode`: + +```py +import os +from typing import List + +from pydantic import field_validator +from typing_extensions import Annotated + +from pydantic_settings import BaseSettings, NoDecode + + +class Settings(BaseSettings): + numbers: Annotated[List[int], NoDecode] # (1)! + + @field_validator('numbers', mode='before') + @classmethod + def decode_numbers(cls, v: str) -> List[int]: + return [int(x) for x in v.split(',')] + + +os.environ['numbers'] = '1,2,3' +print(Settings().model_dump()) +#> {'numbers': [1, 2, 3]} +``` + +1. The `NoDecode` annotation disables JSON parsing for the `numbers` field. The `decode_numbers` field validator + will be called to parse the value. + +You can also disable JSON parsing for all fields by setting the `enable_decoding` config setting to `False`: + +```py +import os +from typing import List + +from pydantic import field_validator + +from pydantic_settings import BaseSettings, SettingsConfigDict + + +class Settings(BaseSettings): + model_config = SettingsConfigDict(enable_decoding=False) + + numbers: List[int] + + @field_validator('numbers', mode='before') + @classmethod + def decode_numbers(cls, v: str) -> List[int]: + return [int(x) for x in v.split(',')] + + +os.environ['numbers'] = '1,2,3' +print(Settings().model_dump()) +#> {'numbers': [1, 2, 3]} +``` + +You can force JSON parsing for a field by annotating it with `ForceDecode`. This will bypass +the the `enable_decoding` config setting: + +```py +import os +from typing import List + +from typing_extensions import Annotated + +from pydantic_settings import BaseSettings, ForceDecode, SettingsConfigDict + + +class Settings(BaseSettings): + model_config = SettingsConfigDict(enable_decoding=False) + + numbers: Annotated[List[int], ForceDecode] + + +os.environ['numbers'] = '["1","2","3"]' +print(Settings().model_dump()) +#> {'numbers': [1, 2, 3]} +``` + ## Nested model default partial updates By default, Pydantic settings does not allow partial updates to nested model default objects. This behavior can be diff --git a/pydantic_settings/__init__.py b/pydantic_settings/__init__.py index 5b3aa9f..0a02868 100644 --- a/pydantic_settings/__init__.py +++ b/pydantic_settings/__init__.py @@ -11,8 +11,10 @@ CliSuppress, DotEnvSettingsSource, EnvSettingsSource, + ForceDecode, InitSettingsSource, JsonConfigSettingsSource, + NoDecode, PydanticBaseSettingsSource, PyprojectTomlConfigSettingsSource, SecretsSettingsSource, @@ -38,6 +40,8 @@ 'CliMutuallyExclusiveGroup', 'InitSettingsSource', 'JsonConfigSettingsSource', + 'NoDecode', + 'ForceDecode', 'PyprojectTomlConfigSettingsSource', 'PydanticBaseSettingsSource', 'SecretsSettingsSource', diff --git a/pydantic_settings/main.py b/pydantic_settings/main.py index 8f6fdbc..f376361 100644 --- a/pydantic_settings/main.py +++ b/pydantic_settings/main.py @@ -79,6 +79,7 @@ class SettingsConfigDict(ConfigDict, total=False): """ toml_file: PathType | None + enable_decoding: bool # Extend `config_keys` by pydantic settings config keys to @@ -433,6 +434,7 @@ def _settings_build_values( toml_file=None, secrets_dir=None, protected_namespaces=('model_validate', 'model_dump', 'settings_customise_sources'), + enable_decoding=True, ) diff --git a/pydantic_settings/sources.py b/pydantic_settings/sources.py index 2bf870b..4a37192 100644 --- a/pydantic_settings/sources.py +++ b/pydantic_settings/sources.py @@ -118,6 +118,14 @@ def import_azure_key_vault() -> None: ENV_FILE_SENTINEL: DotenvType = Path('') +class NoDecode: + pass + + +class ForceDecode: + pass + + class SettingsError(ValueError): pass @@ -312,6 +320,12 @@ def decode_complex_value(self, field_name: str, field: FieldInfo, value: Any) -> Returns: The decoded value for further preparation """ + if field and ( + NoDecode in field.metadata + or (self.config.get('enable_decoding') is False and ForceDecode not in field.metadata) + ): + return value + return json.loads(value) @abstractmethod diff --git a/tests/test_settings.py b/tests/test_settings.py index 143b285..2a6578b 100644 --- a/tests/test_settings.py +++ b/tests/test_settings.py @@ -1,4 +1,5 @@ import dataclasses +import json import os import pathlib import sys @@ -26,6 +27,7 @@ SecretStr, Tag, ValidationError, + field_validator, ) from pydantic import ( dataclasses as pydantic_dataclasses, @@ -37,7 +39,9 @@ BaseSettings, DotEnvSettingsSource, EnvSettingsSource, + ForceDecode, InitSettingsSource, + NoDecode, PydanticBaseSettingsSource, SecretsSettingsSource, SettingsConfigDict, @@ -2873,3 +2877,69 @@ class Settings(BaseSettings): s = Settings() assert s.foo.get_secret_value() == 123 assert s.bar.get_secret_value() == PostgresDsn('postgres://user:password@localhost/dbname') + + +def test_field_annotated_no_decode(env): + class Settings(BaseSettings): + a: List[str] # this field will be decoded because of default `enable_decoding=True` + b: Annotated[List[str], NoDecode] + + # decode the value here. the field value won't be decoded because of NoDecode + @field_validator('b', mode='before') + @classmethod + def decode_b(cls, v: str) -> List[str]: + return json.loads(v) + + env.set('a', '["one", "two"]') + env.set('b', '["1", "2"]') + + s = Settings() + assert s.model_dump() == {'a': ['one', 'two'], 'b': ['1', '2']} + + +def test_field_annotated_no_decode_and_disable_decoding(env): + class Settings(BaseSettings): + model_config = SettingsConfigDict(enable_decoding=False) + + a: Annotated[List[str], NoDecode] + + # decode the value here. the field value won't be decoded because of NoDecode + @field_validator('a', mode='before') + @classmethod + def decode_b(cls, v: str) -> List[str]: + return json.loads(v) + + env.set('a', '["one", "two"]') + + s = Settings() + assert s.model_dump() == {'a': ['one', 'two']} + + +def test_field_annotated_disable_decoding(env): + class Settings(BaseSettings): + model_config = SettingsConfigDict(enable_decoding=False) + + a: List[str] + + # decode the value here. the field value won't be decoded because of `enable_decoding=False` + @field_validator('a', mode='before') + @classmethod + def decode_b(cls, v: str) -> List[str]: + return json.loads(v) + + env.set('a', '["one", "two"]') + + s = Settings() + assert s.model_dump() == {'a': ['one', 'two']} + + +def test_field_annotated_force_decode_disable_decoding(env): + class Settings(BaseSettings): + model_config = SettingsConfigDict(enable_decoding=False) + + a: Annotated[List[str], ForceDecode] + + env.set('a', '["one", "two"]') + + s = Settings() + assert s.model_dump() == {'a': ['one', 'two']} From 5748f0669dc486b24fcf4ca5f557532250e20ced Mon Sep 17 00:00:00 2001 From: Hasan Ramezani Date: Wed, 4 Dec 2024 09:52:13 +0100 Subject: [PATCH 2/3] Address comments --- docs/index.md | 22 +++++++++++++++++----- pydantic_settings/sources.py | 4 ++++ 2 files changed, 21 insertions(+), 5 deletions(-) diff --git a/docs/index.md b/docs/index.md index 425522f..e19009d 100644 --- a/docs/index.md +++ b/docs/index.md @@ -373,8 +373,9 @@ print(Settings().model_dump()) ### Disabling JSON parsing -pydatnic-settings by default parses complex types from environment variables as JSON strings. If you want to disable -this behavior for a field and parse the value by your own, you can annotate the field with `NoDecode`: +pydantic-settings by default parses complex types from environment variables as JSON strings. If you want to disable +this behavior for a field and parse the value in your own validator, you can annotate the field with +[`NoDecode`](../api/pydantic_settings.md#pydantic_settings.NoDecode): ```py import os @@ -430,13 +431,14 @@ print(Settings().model_dump()) #> {'numbers': [1, 2, 3]} ``` -You can force JSON parsing for a field by annotating it with `ForceDecode`. This will bypass -the the `enable_decoding` config setting: +You can force JSON parsing for a field by annotating it with [`ForceDecode`](../api/pydantic_settings.md#pydantic_settings.ForceDecode). +This will bypass the the `enable_decoding` config setting: ```py import os from typing import List +from pydantic import field_validator from typing_extensions import Annotated from pydantic_settings import BaseSettings, ForceDecode, SettingsConfigDict @@ -446,13 +448,23 @@ class Settings(BaseSettings): model_config = SettingsConfigDict(enable_decoding=False) numbers: Annotated[List[int], ForceDecode] + numbers1: List[int] # (1)! + + @field_validator('numbers1', mode='before') + @classmethod + def decode_numbers1(cls, v: str) -> List[int]: + return [int(x) for x in v.split(',')] os.environ['numbers'] = '["1","2","3"]' +os.environ['numbers1'] = '1,2,3' print(Settings().model_dump()) -#> {'numbers': [1, 2, 3]} +#> {'numbers': [1, 2, 3], 'numbers1': [1, 2, 3]} ``` +1. The `numbers1` field is not annotated with `ForceDecode`, so it will not be parsed as JSON. + and we have to provide a custom validator to parse the value. + ## Nested model default partial updates By default, Pydantic settings does not allow partial updates to nested model default objects. This behavior can be diff --git a/pydantic_settings/sources.py b/pydantic_settings/sources.py index 4a37192..6b292e1 100644 --- a/pydantic_settings/sources.py +++ b/pydantic_settings/sources.py @@ -119,10 +119,14 @@ def import_azure_key_vault() -> None: class NoDecode: + """Annotation to prevent decoding of a field value.""" + pass class ForceDecode: + """Annotation to force decoding of a field value.""" + pass From cdf72c4003c87ba4382c021761df06287d4fcaf9 Mon Sep 17 00:00:00 2001 From: Hasan Ramezani Date: Wed, 4 Dec 2024 09:53:37 +0100 Subject: [PATCH 3/3] Update docs/index.md Co-authored-by: hyperlint-ai[bot] <154288675+hyperlint-ai[bot]@users.noreply.github.com> --- docs/index.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/index.md b/docs/index.md index e19009d..20151b2 100644 --- a/docs/index.md +++ b/docs/index.md @@ -432,7 +432,7 @@ print(Settings().model_dump()) ``` You can force JSON parsing for a field by annotating it with [`ForceDecode`](../api/pydantic_settings.md#pydantic_settings.ForceDecode). -This will bypass the the `enable_decoding` config setting: +This will bypass the `enable_decoding` config setting: ```py import os