peft.SimulateQuantizedDense

peft.SimulateQuantizedDense

class gemma.peft.SimulateQuantizedDense(
*,
wrapped: flax.linen.linear.Dense,
method: gemma.peft._quantization_utils.QuantizationMethod = QuantizationMethod.NONE,
parent: flax.linen.module.Module | flax.core.scope.Scope | flax.linen.module._Sentinel | None = <flax.linen.module._Sentinel object>,
name: str | None = None,
)[source]

Bases: flax.linen.module.Module

Wrapper around nn.Dense that adds a quantized adapter.

wrapped: flax.linen.linear.Dense
method: gemma.peft._quantization_utils.QuantizationMethod = 'none'
name: str | None = None
parent: flax.linen.module.Module | flax.core.scope.Scope | flax.linen.module._Sentinel | None = None
scope: Scope | None = None