
Commit 11ea2b7

Add LRP model checks and support unknown layers via AD fallback (#26)
* Add LRP model checks
* Add registration mechanism to support custom layers
* Deprecate `flatten_chain` in favor of `flatten_model`
* Add more rules tests
1 parent 614bdb7 commit 11ea2b7

25 files changed: +356 −50 lines changed

Project.toml

Lines changed: 5 additions & 2 deletions

@@ -8,22 +8,25 @@ ColorSchemes = "35d6a980-a343-548e-a6ea-1d62b119f2f4"
 Flux = "587475ba-b771-5e3f-ad9e-33799f191a9c"
 ImageCore = "a09fc81d-aa75-5fe9-8630-4744c3626534"
 LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
+Markdown = "d6f4376e-aef5-505a-96c1-9c027394607a"
+PrettyTables = "08abe8d2-0d0c-5749-adfa-8a2ac140af0d"
 Statistics = "10745b16-79ce-11e8-11f9-7d13ad32a3b2"
 Zygote = "e88e6eb3-aa80-5325-afca-941959d7151f"

 [compat]
 ColorSchemes = "3"
 Flux = "0.12"
 ImageCore = "0.8, 0.9"
-JLD2 = "0.4"
+PrettyTables = "1"
 Zygote = "0.6"
 julia = "1.6"

 [extras]
 JLD2 = "033835bb-8acc-5ee8-8aae-3f567f8a3819"
 Random = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c"
 ReferenceTests = "324d217c-45ce-50fc-942e-d289b448e8cf"
+Suppressor = "fd094767-a336-5f1f-9728-57cf17d0bbfb"
 Test = "8dfed614-e22c-5e08-85e1-65c5234f0b40"

 [targets]
-test = ["JLD2", "Random", "ReferenceTests", "Test"]
+test = ["JLD2", "Random", "ReferenceTests", "Suppressor", "Test"]

benchmark/Project.toml

Lines changed: 1 addition & 0 deletions

@@ -1,4 +1,5 @@
 [deps]
 BenchmarkTools = "6e4b80f9-dd63-53aa-95a3-0cdb28fa8baf"
+ExplainabilityMethods = "cd722a4f-8d55-446b-8550-a4aabc9151ab"
 Flux = "587475ba-b771-5e3f-ad9e-33799f191a9c"
 PkgBenchmark = "32113eaa-f34f-5b0d-bd6c-c81e245fc73d"

benchmark/benchmarks.jl

Lines changed: 45 additions & 6 deletions

@@ -1,12 +1,12 @@
-using ExplainabilityMethods
-using ExplainabilityMethods: ANALYZERS
+using BenchmarkTools
 using Flux
+using ExplainabilityMethods

 on_CI = haskey(ENV, "GITHUB_ACTIONS")

 include("../test/vgg19.jl")
 vgg19 = VGG19(; pretrain=false)
-model = flatten_chain(strip_softmax(vgg19.layers))
+model = flatten_model(strip_softmax(vgg19.layers))
 img = rand(MersenneTwister(123), Float32, (224, 224, 3, 1))

 # Benchmark custom LRP composite
@@ -24,10 +24,49 @@ algs = Dict(

 # Define benchmark
 SUITE = BenchmarkGroup()
+SUITE["VGG"] = BenchmarkGroup([k for k in keys(algs)])
 for (name, alg) in algs
-    SUITE[name] = BenchmarkGroup(["construct analyzer", "analyze"])
-    SUITE[name]["construct analyzer"] = @benchmarkable alg($(model))
+    SUITE["VGG"][name] = BenchmarkGroup(["construct analyzer", "analyze"])
+    SUITE["VGG"][name]["construct analyzer"] = @benchmarkable alg($(model))

     analyzer = alg(model)
-    SUITE[name]["analyze"] = @benchmarkable analyze($(img), $(analyzer))
+    SUITE["VGG"][name]["analyze"] = @benchmarkable analyze($(img), $(analyzer))
+end
+
+# Rules benchmarks – use wrapper to trigger AD fallback
+struct TestWrapper{T}
+    layer::T
+end
+(l::TestWrapper)(x) = l.layer(x)
+
+# generate input for conv layers
+insize = (128, 128, 3, 1)
+aₖ = randn(Float32, insize)
+
+layers = Dict(
+    "MaxPool" => (MaxPool((3, 3); pad=0), aₖ),
+    "MeanPool" => (MeanPool((3, 3); pad=0), aₖ),
+    "Conv" => (Conv((3, 3), 3 => 6), aₖ),
+    "flatten" => (flatten, aₖ),
+    "Dense" => (Dense(1000, 200, relu), randn(Float32, 1000)),
+)
+rules = Dict(
+    "ZeroRule" => ZeroRule(),
+    "EpsilonRule" => EpsilonRule(),
+    "GammaRule" => GammaRule(),
+    "ZBoxRule" => ZBoxRule(),
+)
+rulenames = [k for k in keys(rules)]
+
+for (layername, (layer, aₖ)) in layers
+    SUITE[layername] = BenchmarkGroup(rulenames)
+
+    for (rulename, ruletype) in rules
+        Rₖ₊₁ = layer(aₖ)
+        SUITE[layername][rulename] = BenchmarkGroup(["dispatch", "AD fallback"])
+        SUITE[layername][rulename]["dispatch"] = @benchmarkable rule($layer, $aₖ, $Rₖ₊₁)
+        SUITE[layername][rulename]["AD fallback"] = @benchmarkable rule(
+            $TestWrapper(layer), $aₖ, $Rₖ₊₁
+        )
+    end
 end
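For readers who want to run this suite locally, the standard PkgBenchmark workflow would look roughly like the sketch below (the output file name is an arbitrary choice, not part of this commit):

```julia
using PkgBenchmark

# Execute benchmark/benchmarks.jl and collect the timings stored in SUITE.
results = benchmarkpkg("ExplainabilityMethods")

# Write a human-readable summary of the results to disk.
export_markdown("benchmark_results.md", results)
```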

docs/literate/example.jl

Lines changed: 2 additions & 2 deletions

@@ -66,8 +66,8 @@ heatmap(expl)
 # ## Custom composites
 # If our model is a "flat" chain of Flux layers, we can assign LRP rules
 # to each layer individually. For this purpose,
-# ExplainabilityMethods exports the method [`flatten_chain`](@ref):
-model = flatten_chain(model)
+# ExplainabilityMethods exports the method [`flatten_model`](@ref):
+model = flatten_model(model)

 #md # !!! warning "Flattening models"
 #md #     Not all models can be flattened, e.g. those using
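To make the "custom composites" idea from this documentation change concrete, assigning one rule per layer of a flattened chain could look like the following sketch (the three-layer model and the rule choice are made up for illustration and not taken from the docs):

```julia
using Flux
using ExplainabilityMethods

model = Chain(
    Conv((3, 3), 3 => 8, relu),
    Flux.flatten,
    Dense(7200, 10),  # assuming 32×32×3 inputs
)
model = flatten_model(model)

# One rule per layer, in the same order as the layers of the flattened chain.
rules = [ZBoxRule(), ZeroRule(), EpsilonRule()]
analyzer = LRP(model, rules)
```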

docs/src/api.md

Lines changed: 1 addition & 1 deletion

@@ -33,7 +33,7 @@ modify_denominator
 # Utilities
 ```@docs
 strip_softmax
-flatten_chain
+flatten_model
 ```

 # Index

src/ExplainabilityMethods.jl

Lines changed: 7 additions & 1 deletion

@@ -7,11 +7,15 @@ using ColorSchemes
 using ImageCore
 using Base.Iterators

+using Markdown
+using PrettyTables
+
 include("analyze_api.jl")
 include("flux.jl")
 include("utils.jl")
 include("neuron_selection.jl")
 include("gradient.jl")
+include("lrp_checks.jl")
 include("lrp_rules.jl")
 include("lrp.jl")
 include("heatmap.jl")
@@ -25,13 +29,15 @@ export LRP, LRPZero, LRPEpsilon, LRPGamma

 # LRP rules
 export AbstractLRPRule
+export LRP_CONFIG
 export ZeroRule, EpsilonRule, GammaRule, ZBoxRule
 export modify_layer, modify_params, modify_denominator
+export check_model

 # heatmapping
 export heatmap

 # utils
-export strip_softmax, flatten_chain
+export strip_softmax, flatten_model, flatten_chain

 end # module

src/flux.jl

Lines changed: 22 additions & 13 deletions

@@ -1,30 +1,39 @@
 ## Group layers by type:
-const ConvLayers = Union{Conv,DepthwiseConv,ConvTranspose,CrossCor}
-const DropoutLayers = Union{Dropout,typeof(Flux.dropout),AlphaDropout}
-const ReshapingLayers = Union{typeof(Flux.flatten)}
+const ConvLayer = Union{Conv,DepthwiseConv,ConvTranspose,CrossCor}
+const DropoutLayer = Union{Dropout,typeof(Flux.dropout),AlphaDropout}
+const ReshapingLayer = Union{typeof(Flux.flatten)}
 # Pooling layers
-const MaxPoolLayers = Union{MaxPool,AdaptiveMaxPool,GlobalMaxPool}
-const MeanPoolLayers = Union{MeanPool,AdaptiveMeanPool,GlobalMeanPool}
-const PoolingLayers = Union{MaxPoolLayers,MeanPoolLayers}
+const MaxPoolLayer = Union{MaxPool,AdaptiveMaxPool,GlobalMaxPool}
+const MeanPoolLayer = Union{MeanPool,AdaptiveMeanPool,GlobalMeanPool}
+const PoolingLayer = Union{MaxPoolLayer,MeanPoolLayer}
+# Activation functions that are similar to ReLU
+const ReluLikeActivation = Union{
+    typeof(relu),typeof(gelu),typeof(swish),typeof(softplus),typeof(mish)
+}
+# Layers & activation functions supported by LRP
+const LRPSupportedLayer = Union{Dense,ConvLayer,DropoutLayer,ReshapingLayer,PoolingLayer}
+const LRPSupportedActivation = Union{typeof(identity),ReluLikeActivation}

-_flatten_chain(x) = x
-_flatten_chain(c::Chain) = [c.layers...]
+_flatten_model(x) = x
+_flatten_model(c::Chain) = [c.layers...]
 """
-    flatten_chain(c)
+    flatten_model(c)

 Flatten a Flux chain containing Flux chains.
 """
-function flatten_chain(chain::Chain)
+function flatten_model(chain::Chain)
     if any(isa.(chain.layers, Chain))
-        flatchain = Chain(vcat(_flatten_chain.(chain.layers)...)...)
-        return flatten_chain(flatchain)
+        flatchain = Chain(vcat(_flatten_model.(chain.layers)...)...)
+        return flatten_model(flatchain)
     end
     return chain
 end
+@deprecate flatten_chain(c) flatten_model(c)

 is_softmax(layer) = layer isa Union{typeof(softmax),typeof(softmax!)}
 has_output_softmax(x) = is_softmax(x)
 has_output_softmax(model::Chain) = has_output_softmax(model[end])
+
 """
     check_ouput_softmax(model)

@@ -46,7 +55,7 @@ Remove softmax activation on model output if it exists.
 """
 function strip_softmax(model::Chain)
     if has_output_softmax(model)
-        model = flatten_chain(model)
+        model = flatten_model(model)
         return Chain(model.layers[1:(end - 1)]...)
     end
     return model
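As a quick illustration of the renamed helper (a sketch; the layer sizes are made up and not taken from the commit):

```julia
using Flux
using ExplainabilityMethods

# A chain that nests another chain, e.g. a feature extractor plus a classifier head.
model = Chain(Chain(Dense(4, 8, relu), Dense(8, 8, relu)), Dense(8, 2))

flat = flatten_model(model)  # Chain(Dense(4, 8, relu), Dense(8, 8, relu), Dense(8, 2))
length(flat.layers)          # 3 – the nesting is gone

flatten_chain(model)         # still works, but now emits a deprecation warning
```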

src/lrp.jl

Lines changed: 25 additions & 14 deletions

@@ -1,10 +1,13 @@
 """
     LRP(c::Chain, r::AbstractLRPRule)
     LRP(c::Chain, rs::AbstractVector{<:AbstractLRPRule})
-    LRP(layers::AbstractVector{LRPLayer})

 Analyze model by applying Layer-Wise Relevance Propagation.

+# Keyword arguments
+- `skip_checks::Bool`: Skip checks whether model is compatible with LRP and contains output softmax. Default is `false`.
+- `verbose::Bool`: Select whether the model checks should print a summary on failure. Default is `true`.
+
 # References
 [1] G. Montavon et al., Layer-Wise Relevance Propagation: An Overview
 [2] W. Samek et al., Explaining Deep Neural Networks and Beyond: A Review of Methods and Applications
@@ -14,26 +17,34 @@ struct LRP{R<:AbstractVector{<:AbstractLRPRule}} <: AbstractXAIMethod
     rules::R

     # Construct LRP analyzer by manually assigning a rule to each layer
-    function LRP(model::Chain, rules::AbstractVector{<:AbstractLRPRule})
-        check_ouput_softmax(model)
-        model = flatten_chain(model)
+    function LRP(
+        model::Chain,
+        rules::AbstractVector{<:AbstractLRPRule};
+        skip_checks=false,
+        verbose=true,
+    )
+        model = flatten_model(model)
+        if !skip_checks
+            check_ouput_softmax(model)
+            check_model(Val(:LRP), model; verbose=verbose)
+        end
        if length(model.layers) != length(rules)
            throw(ArgumentError("Length of rules doesn't match length of Flux chain."))
        end
        return new{typeof(rules)}(model, rules)
    end
-    # Construct LRP analyzer by assigning a single rule to all layers
-    function LRP(model::Chain, r::AbstractLRPRule)
-        check_ouput_softmax(model)
-        model = flatten_chain(model)
-        rules = repeat([r], length(model.layers))
-        return new{typeof(rules)}(model, rules)
-    end
+end
+
+# Construct LRP analyzer by assigning a single rule to all layers
+function LRP(model::Chain, r::AbstractLRPRule; kwargs...)
+    model = flatten_model(model)
+    rules = repeat([r], length(model.layers))
+    return LRP(model, rules; kwargs...)
 end
 # Additional constructors for convenience:
-LRPZero(model::Chain) = LRP(model, ZeroRule())
-LRPEpsilon(model::Chain) = LRP(model, EpsilonRule())
-LRPGamma(model::Chain) = LRP(model, GammaRule())
+LRPZero(model::Chain; kwargs...) = LRP(model, ZeroRule(); kwargs...)
+LRPEpsilon(model::Chain; kwargs...) = LRP(model, EpsilonRule(); kwargs...)
+LRPGamma(model::Chain; kwargs...) = LRP(model, GammaRule(); kwargs...)

 # The call to the LRP analyzer.
 function (analyzer::LRP)(input, ns::AbstractNeuronSelector; layerwise_relevances=false)
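To sketch how the new keyword arguments are meant to be used (the toy two-layer model here is made up, not part of the commit):

```julia
using Flux
using ExplainabilityMethods

model = Chain(Dense(784, 100, relu), Dense(100, 10))

analyzer = LRPZero(model)                             # model checks run by default
analyzer = LRPEpsilon(model; verbose=false)           # checks run, but stay silent on failure
analyzer = LRP(model, GammaRule(); skip_checks=true)  # opt out of the checks entirely
```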

src/lrp_checks.jl

Lines changed: 116 additions & 0 deletions

@@ -0,0 +1,116 @@
+module LRP_CONFIG
+using ExplainabilityMethods
+using ExplainabilityMethods: LRPSupportedLayer, LRPSupportedActivation
+"""
+    LRP_CONFIG.supports_layer(layer)
+
+Check whether LRP can be used on a layer or a Chain.
+To extend LRP to your own layers, define:
+```julia
+LRP_CONFIG.supports_layer(::MyLayer) = true
+```
+"""
+supports_layer(l) = false
+supports_layer(::LRPSupportedLayer) = true
+"""
+    LRP_CONFIG.supports_activation(σ)
+
+Check whether LRP can be used on a given activation function.
+To extend LRP to your own activation functions, define:
+```julia
+LRP_CONFIG.supports_activation(::MyActivation) = true
+```
+"""
+supports_activation(σ) = false
+supports_activation(::LRPSupportedActivation) = true
+end # LRP_CONFIG module
+
+_check_layer(::Val{:LRP}, layer) = LRP_CONFIG.supports_layer(layer)
+_check_layer(::Val{:LRP}, c::Chain) = all(_check_layer(Val(:LRP), l) for l in c)
+
+function _check_activation(::Val{:LRP}, layer)
+    hasproperty(layer, :σ) && return LRP_CONFIG.supports_activation(layer.σ)
+    return true
+end
+_check_activation(::Val{:LRP}, c::Chain) = all(_check_activation(Val(:LRP), l) for l in c)
+
+"""
+    check_model(method::Symbol, model; verbose=true)
+
+Check whether the given method can be used on the model.
+Currently, model checks are only implemented for LRP, using the symbol `:LRP`.
+
+# Example
+julia> check_model(:LRP, model)
+"""
+check_model(method::Symbol, model; kwargs...) = check_model(Val(method), model; kwargs...)
+function check_model(::Val{:LRP}, c::Chain; verbose=true)
+    layer_checks = collect(_check_layer.(Val(:LRP), c.layers))
+    activation_checks = collect(_check_activation.(Val(:LRP), c.layers))
+    passed_layer_checks = all(layer_checks)
+    passed_activation_checks = all(activation_checks)
+
+    passed_layer_checks && passed_activation_checks && return true
+
+    layer_names = [_print_name(l) for l in c]
+    activation_names = [_print_activation(l) for l in c]
+
+    verbose && _show_check_summary(
+        c, layer_names, layer_checks, activation_names, activation_checks
+    )
+    if !passed_layer_checks
+        verbose && display(
+            Markdown.parse(
+                """# Layers failed model check
+Found unknown layers `$(join(unique(layer_names[.!layer_checks]), ", "))`
+that are not supported by ExplainabilityMethods' LRP implementation yet.
+
+If you think the missing layer should be supported by default, please [submit an issue](https://github.com/adrhill/ExplainabilityMethods.jl/issues).
+
+These model checks can be skipped at your own risk by setting the LRP-analyzer keyword argument `skip_checks=true`.
+
+## Using custom layers
+If you implemented custom layers, register them via
+```julia
+LRP_CONFIG.supports_layer(::MyLayer) = true # for structs
+LRP_CONFIG.supports_activation(::typeof(mylayer)) = true # for functions
+```
+The default fallback for this layer will use Automatic Differentiation according to "Layer-Wise Relevance Propagation: An Overview".
+You can also define a fully LRP-custom rule for your layer by using the interface
+```julia
+function (rule::AbstractLRPRule)(layer::MyLayer, aₖ, Rₖ₊₁)
+    # ...
+    return Rₖ
+end
+```
+This pattern can also be used to dispatch on specific rules.
+""",
+            ),
+        )
+        throw(ArgumentError("Unknown layers found in model"))
+    end
+    if !passed_activation_checks
+        verbose && display(
+            Markdown.parse(
+                """ # Activations failed model check
+Found layers with unknown or unsupported activation functions
+`$(join(unique(activation_names[.!activation_checks]), ", "))`.
+LRP assumes that the model is a "deep rectifier network" that only contains ReLU-like activation functions.
+
+If you think the missing activation function should be supported by default, please [submit an issue](https://github.com/adrhill/ExplainabilityMethods.jl/issues).
+
+These model checks can be skipped at your own risk by setting the LRP-analyzer keyword argument `skip_checks=true`.
+
+## Using custom activation functions
+If you use custom ReLU-like activation functions, register them via
+```julia
+LRP_CONFIG.supports_activation(::typeof(myfunction)) = true # for functions
+LRP_CONFIG.supports_activation(::MyActivation) = true # for structs
+```
+""",
+            ),
+        )
+        throw(ArgumentError("Unknown or unsupported activation functions found in model"))
+    end
+    return false
+end
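Putting the registration mechanism together, a minimal sketch (the `MyDoubler` layer is a made-up example, not part of the commit):

```julia
using Flux
using ExplainabilityMethods

# A custom layer that ExplainabilityMethods does not know about.
struct MyDoubler end
(::MyDoubler)(x) = 2 .* x

model = Chain(Dense(10, 5, relu), MyDoubler(), Dense(5, 2))

# check_model(:LRP, model)  # would throw an ArgumentError and print a summary

# Register the layer; relevance is then propagated through it via the AD fallback.
LRP_CONFIG.supports_layer(::MyDoubler) = true

check_model(:LRP, model)    # now returns true
analyzer = LRPZero(model)   # the model checks pass during construction
```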
