discriminativelrs.jl

FastAI/training/discriminativelrs.jl is a source file in module FastAI

			
			
			
			
			
"""
    DiscriminativeLRs(paramgroups, factors)

Use different learning rates based on `paramgroups`. `factors` maps
each group to a factor that the learning rate is multiplied by, so
for a parameter `x` the factor is
`get(factors, getgroup(paramgroups, x), 1)`.

See [`ParamGroups`](#).

## Examples

Combining with regular gradient descent, but only training a part of
the model.

```julia
using Flux.Optimise: Descent, Optimiser

model = Chain(Dense(3, 5), Dense(5, 3))
paramgroups = ParamGroups(IndexGrouper([1, 2]), model)

dlro = DiscriminativeLRs(paramgroups, Dict(1 => 0., 2 => 1.))
o = Optimiser(dlro, Descent(0.1))
```
"""
struct DiscriminativeLRs <: Flux.Optimise.AbstractOptimiser
    # Assigns each parameter array to a group; see `ParamGroups`.
    pg::ParamGroups
    # Callable `group -> factor` used to scale the gradient in `apply!`.
    # `::Any` so any closure/functor works; not performance-critical here.
    factorfn::Any
end
			

			

			
			function
			 
			

	
			DiscriminativeLRs
			(
			
			pg
			::

	
			ParamGroups
			,
			 
			
			factors
			::
			Dict
			)
			
			
    
			
			return
			 
			

	
			DiscriminativeLRs
			(
			pg
			,
			 
			

	
			group
			 
			->
			 
			
			get
			(
			factors
			,
			 

	
			group
			,
			 
			1
			)
			)
			

			end
			

			

			
			function
			 
			
			

	
			apply!
			(
			
			o
			::

	
			DiscriminativeLRs
			,
			 
			x
			,
			 
			
			Δ
			::
			
			AbstractArray
			{
			T
			}
			)
			 
			where
			 
			{
			T
			}
			
			
    
			
			factor
			 
			=
			 
			
			convert
			(
			T
			,
			 
			
			
			o
			.
			
			factorfn
			(
			

	
			getgroup
			(
			
			o
			.
			
			pg
			,
			 
			x
			)
			)
			)
			

			
    
			
			if
			
			 
			factor
			 
			==
			 
			
			one
			(
			T
			)
			
			
        
			
			return
			 
			Δ
			
    
			else
			
			
        
			
			@
			.
			
			 
			Δ
			 
			*=
			 
			factor
			
    
			end
			

			end
			

			

			
			function
			 
			
			

	
			FluxTraining
			.
			
			setlearningrate!
			(
			
			optimizer
			::

	
			Optimiser
			,
			 
			value
			)
			
			
    
			
			

	
			FluxTraining
			.
			
			setlearningrate!
			(
			
			
			optimizer
			.
			
			os
			[
			end
			]
			,
			 
			value
			)
			

			end

Tests


			
			
			
			@
			testset
			 
			
			"
			DiscriminativeLRs
			"
			 
			
			begin
			
    
			
			model
			 
			=
			 
			

	
			Chain
			(
			

	
			Dense
			(
			3
			,
			 
			5
			)
			,
			 
			

	
			Dense
			(
			5
			,
			 
			3
			)
			)
			
    
			
			pg
			 
			=
			 
			
			
			FastAI
			.
			

	
			ParamGroups
			(
			
			
			FastAI
			.
			

	
			IndexGrouper
			(
			
			[
			1
			,
			 
			2
			]
			)
			,
			 
			model
			)
			
    
			
			o
			 
			=
			 
			

	
			Optimiser
			(
			
			
			FastAI
			.
			

	
			DiscriminativeLRs
			(
			pg
			,
			 
			
			Dict
			(
			
			1
			 
			=>
			 
			0.0
			,
			 
			
			2
			 
			=>
			 
			1.0
			)
			)
			,
			
                  
			
			Descent
			(
			0.1
			)
			)
			
    
			
			x1
			 
			=
			 
			
			
			model
			[
			1
			]
			.
			
			weight
			
    
			
			x2
			 
			=
			 
			
			
			model
			[
			2
			]
			.
			
			weight
			
    
			# Weight of layer 1 has zeroed gradient
			
    
			
			@
			test
			
			 
			

	
			apply!
			(
			o
			,
			 
			x1
			,
			 
			
			ones
			(
			
			size
			(
			x1
			)
			)
			)
			 
			==
			 
			
			zeros
			(
			
			size
			(
			x1
			)
			)
			
    
			# Weight of layer 2 has regular gradient
			
    
			
			@
			test
			
			 
			

	
			apply!
			(
			o
			,
			 
			x2
			,
			 
			
			ones
			(
			
			size
			(
			x2
			)
			)
			)
			 
			!=
			 
			
			fill
			(
			0.1
			,
			 
			
			size
			(
			x1
			)
			)
			

			end