Pydantic

Less boilerplate
More semantics
Composable models

Alexandre René

PyMoTW – 29 May 2020

Slides & examples: https://github.com/INM-6/Python-Module-of-the-Week/tree/master/session32_pydantic

Less boilerplate

class A:
  def __init__(self, x:int):
    self.x = x
class B(A):
  def __init__(self, x:int, y:int):
    super().__init__(x)
      # Remove y from signature
    self.y

class A(BaseModel):
  x: int
class B(A):
  y: int

Normal python

Pydantized python

More semantics

class Vector:
  def __init__(self, r:float, θ:float):
    if r <= 0:
      raise ValueError(
        "Negative radius")
    if θ < 0 or 2*np.pi < θ:
      raise ValueError(
        "Angle outside [0,2π]")
    self.r = r
    self.θ = θ

class Vector(BaseModel):
  r: PositiveFloat
  θ: confloat(gt=0, lt=2*np.pi)

Normal python

Pydantized python

{'title': 'Vector',
 'type': 'object',
 'properties': {
  'r': {'title': 'R', 'type': 'number',
        'exclusiveMinimum': 0},
  'θ': {'title': 'Θ',
   'type': 'number',
   'exclusiveMinimum': 0,
   'exclusiveMaximum': 6.283185307179586}},
 'required': ['r', 'θ']}

Vector.schema()

What is it's for

TODO: Example real-world application

Pydantic Less boilerplate More semantics Composable models Alexandre René PyMoTW – 29 May 2020 Slides & examples: https://github.com/INM-6/Python-Module-of-the-Week/tree/master/session32_pydantic

Pydantic intro

By alexrene

Pydantic intro

An introduction to Pydantic for scientific applications

5 years ago
143

	from typing import List
	Vector = List[float]

	def scale(scalar: float, vector: Vector) -> Vector:
	return [scalar * num for num in vector]

	class A(BaseModel):
	x: int
	s: str
	@validator('x', pre=True)
	def check_x(cls, v):
	if v < 0: # See PositiveInt
	raise ValueError(
	"`x` must be positive")
	return v
	@validator('s')
	def check_s(cls, v):
	if len(v) > 10: # See min_length
	raise ValueError(
	"`s` must not be longer than 10")
	return v
	def __new__(cls, **kwargs):
	super().__new__(cls)
	def __init__(self, **kwargs):
	super().__init__(**kwargs)

	class Foo(BaseModel):
	a: int
	b: int
	@root_validator
	def root_val_post(cls, values):
	print("root val post")
	return values
	@root_validator(pre=True)
	def root_val_pre(cls, values):
	print("root val pre")
	return values
	@validator('a')
	def val_post_a(cls, a):
	print("val post a")
	return a
	@validator('b', pre=True)
	def val_pre_b(cls, b):
	print("val pre b")
	return b
	@validator('a', pre=True)
	def val_pre_a(cls, a):
	print("val pre a")
	return a
	@validator('b')
	def val_post_b(cls, b):
	print("val post b")
	return b

	class Foo(BaseModel):
	a: int
	b: int
	@root_validator
	def root_val_post(cls, values):
	print("root val post")
	return values
	@root_validator(pre=True)
	def root_val_pre(cls, values):
	print("root val pre")
	return values
	@validator('a')
	def val_post_a(cls, a):
	print("val post a")
	return a
	@validator('b', pre=True)
	def val_pre_b(cls, b):
	print("val pre b")
	return b
	@validator('a', pre=True)
	def val_pre_a(cls, a):
	print("val pre a")
	return a
	@validator('b')
	def val_post_b(cls, b):
	print("val post b")
	return b

	class Foo(BaseModel):
	a: int
	b: int
	@root_validator
	def root_val_post(cls, values):
	print("root val post")
	return values
	@root_validator(pre=True)
	def root_val_pre(cls, values):
	print("root val pre")
	return values
	@validator('a')
	def val_post_a(cls, a):
	print("val post a")
	return a
	@validator('b', pre=True)
	def val_pre_b(cls, b):
	print("val pre b")
	return b
	@validator('a', pre=True)
	def val_pre_a(cls, a):
	print("val pre a")
	return a
	@validator('b')
	def val_post_b(cls, b):
	print("val post b")
	return b

	class _ArrayType(np.ndarray):
	@classmethod
	def __get_validators__(cls):
	yield cls.validate_type

	@classmethod
	def validate_type(cls, value, field):
	if isinstance(value, typing.NotCastableToArray):
	raise TypeError(f"Values of type {type(value)} cannot be casted "
	"to a numpy array.")
	if isinstance(value, np.ndarray):
	# Don't create a new array unless necessary
	if cls._ndim is not None and value.ndim != cls._ndim:
	raise TypeError(f"{field.name} expects a variable with "
	f"{cls._ndim} dimensions.")
	# Issubdtype allows specifying abstract dtypes like 'number', 'floating'
	if np.issubdtype(value.dtype, cls.dtype):
	result = value
	elif np.can_cast(value, cls.dtype):
	result = value.astype(cls.dtype)
	else:
	raise TypeError(f"Cannot safely cast '{field.name}' type "
	f"({value.dtype}) to type {cls.dtype}.")
	else:
	result = np.array(value)
	# Issubdtype allows specifying abstract dtypes like 'number', 'floating'
	if np.issubdtype(result.dtype, cls.dtype):
	pass
	elif np.can_cast(result, cls.dtype):
	if cls._ndim is not None and result.ndim != cls._ndim:
	raise TypeError(
	f"The shape of the data ({result.shape}) does not " "correspond to the expected of dimensions "
	f"({cls._ndim} for '{field.name}').")
	elif result.dtype != cls.dtype:
	result = result.astype(cls.dtype)
	else:
	raise TypeError(f"Cannot1 safely cast '{field.name}' (type "
	f"{result.dtype}) to type {cls.dtype}.")
	return result

	@classmethod
	def __modify_schema__(cls, field_schema):
	# FIXME: Figure out how to use get schema of subfield
	field_schema.update(type ='array',
	items={'type': 'number'})
	@classmethod
	def json_encoder(cls, v):
	"""See typing.json_encoders."""
	return v.tolist()

	class _ArrayMeta(type):
	def __getitem__(self, args):
	if isinstance(args, tuple):
	T = args[0]
	ndim = args[1] if len(args) > 1 else None
	extraargs = args[2:] # For catching errors only
	else:
	T = args
	ndim = None
	extraargs = []
	if (not isinstance(T, type) or len(extraargs) > 0
	or not isinstance(ndim, (int, type(None)))):
	raise TypeError(
	"`Array` must be specified as either `Array[T]`"
	"or `Array[T, n], where `T` is a type and `n` is an int. "
	f"(received: {', '.join((str(a) for a in args))}]).")
	dtype=typing.convert_dtype(T)
	specifier = str(dtype)
	if ndim is not None:
	specifier += f",{ndim}"
	return type(f'Array[{specifier}]', (_ArrayType,),
	{'dtype': dtype, '_ndim': ndim})

	class Array(np.ndarray, metaclass=_ArrayMeta):
	"""
	Use this to specify a NumPy array type annotation; `pydantic` will
	recognize the type and execute appropriate validation/parsing.

	This may become obsolete, or need to be updated, when NumPy officially
	supports type hints (see https://github.com/numpy/numpy-stubs).

	- `Array[T]` specifies an array with dtype `T`. Any expression for which
	`np.dtype(T)` is valid is accepted.
	- `Array[T,n]` specifies an array with dtype `T`, that must have exactly
	`n` dimensions.

	Example
	-------
	>>> from pydantic.dataclasses import dataclass
	>>> from mackelab_toolbox.typing import Array
	>>>
	>>> @dataclass
	>>> class Model:
	>>> x: Array[np.float64] # Array of 64-bit floats, any number of dimensions
	>>> v: Array['float64', 1] # 1-D array of 64-bit floats


	"""
	pass

Pydantic

Less boilerplate

More semantics

Composable models

Pydantic intro

More from alexrene