diff --git a/LICENSE.txt b/LICENSE.txt
index 2f8ed18..d645695 100644
--- a/LICENSE.txt
+++ b/LICENSE.txt
@@ -1,374 +1,202 @@
-Mozilla Public License Version 2.0
-==================================
-
-1. Definitions
---------------
-
-1.1. "Contributor"
- means each individual or legal entity that creates, contributes to
- the creation of, or owns Covered Software.
-
-1.2. "Contributor Version"
- means the combination of the Contributions of others (if any) used
- by a Contributor and that particular Contributor's Contribution.
-
-1.3. "Contribution"
- means Covered Software of a particular Contributor.
-
-1.4. "Covered Software"
- means Source Code Form to which the initial Contributor has attached
- the notice in Exhibit A, the Executable Form of such Source Code
- Form, and Modifications of such Source Code Form, in each case
- including portions thereof.
-
-1.5. "Incompatible With Secondary Licenses"
- means
-
- (a) that the initial Contributor has attached the notice described
- in Exhibit B to the Covered Software; or
-
- (b) that the Covered Software was made available under the terms of
- version 1.1 or earlier of the License, but not also under the
- terms of a Secondary License.
-
-1.6. "Executable Form"
- means any form of the work other than Source Code Form.
-
-1.7. "Larger Work"
- means a work that combines Covered Software with other material, in
- a separate file or files, that is not Covered Software.
-
-1.8. "License"
- means this document.
-
-1.9. "Licensable"
- means having the right to grant, to the maximum extent possible,
- whether at the time of the initial grant or subsequently, any and
- all of the rights conveyed by this License.
-
-1.10. "Modifications"
- means any of the following:
-
- (a) any file in Source Code Form that results from an addition to,
- deletion from, or modification of the contents of Covered
- Software; or
-
- (b) any new file in Source Code Form that contains any Covered
- Software.
-
-1.11. "Patent Claims" of a Contributor
- means any patent claim(s), including without limitation, method,
- process, and apparatus claims, in any patent Licensable by such
- Contributor that would be infringed, but for the grant of the
- License, by the making, using, selling, offering for sale, having
- made, import, or transfer of either its Contributions or its
- Contributor Version.
-
-1.12. "Secondary License"
- means either the GNU General Public License, Version 2.0, the GNU
- Lesser General Public License, Version 2.1, the GNU Affero General
- Public License, Version 3.0, or any later versions of those
- licenses.
-
-1.13. "Source Code Form"
- means the form of the work preferred for making modifications.
-
-1.14. "You" (or "Your")
- means an individual or a legal entity exercising rights under this
- License. For legal entities, "You" includes any entity that
- controls, is controlled by, or is under common control with You. For
- purposes of this definition, "control" means (a) the power, direct
- or indirect, to cause the direction or management of such entity,
- whether by contract or otherwise, or (b) ownership of more than
- fifty percent (50%) of the outstanding shares or beneficial
- ownership of such entity.
-
-2. License Grants and Conditions
---------------------------------
-
-2.1. Grants
-
-Each Contributor hereby grants You a world-wide, royalty-free,
-non-exclusive license:
-
-(a) under intellectual property rights (other than patent or trademark)
- Licensable by such Contributor to use, reproduce, make available,
- modify, display, perform, distribute, and otherwise exploit its
- Contributions, either on an unmodified basis, with Modifications, or
- as part of a Larger Work; and
-
-(b) under Patent Claims of such Contributor to make, use, sell, offer
- for sale, have made, import, and otherwise transfer either its
- Contributions or its Contributor Version.
-
-2.2. Effective Date
-
-The licenses granted in Section 2.1 with respect to any Contribution
-become effective for each Contribution on the date the Contributor first
-distributes such Contribution.
-
-2.3. Limitations on Grant Scope
-
-The licenses granted in this Section 2 are the only rights granted under
-this License. No additional rights or licenses will be implied from the
-distribution or licensing of Covered Software under this License.
-Notwithstanding Section 2.1(b) above, no patent license is granted by a
-Contributor:
-
-(a) for any code that a Contributor has removed from Covered Software;
- or
-
-(b) for infringements caused by: (i) Your and any other third party's
- modifications of Covered Software, or (ii) the combination of its
- Contributions with other software (except as part of its Contributor
- Version); or
-
-(c) under Patent Claims infringed by Covered Software in the absence of
- its Contributions.
-
-This License does not grant any rights in the trademarks, service marks,
-or logos of any Contributor (except as may be necessary to comply with
-the notice requirements in Section 3.4).
-
-2.4. Subsequent Licenses
-
-No Contributor makes additional grants as a result of Your choice to
-distribute the Covered Software under a subsequent version of this
-License (see Section 10.2) or under the terms of a Secondary License (if
-permitted under the terms of Section 3.3).
-
-2.5. Representation
-
-Each Contributor represents that the Contributor believes its
-Contributions are its original creation(s) or it has sufficient rights
-to grant the rights to its Contributions conveyed by this License.
-
-2.6. Fair Use
-
-This License is not intended to limit any rights You have under
-applicable copyright doctrines of fair use, fair dealing, or other
-equivalents.
-
-2.7. Conditions
-
-Sections 3.1, 3.2, 3.3, and 3.4 are conditions of the licenses granted
-in Section 2.1.
-
-3. Responsibilities
--------------------
-
-3.1. Distribution of Source Form
-
-All distribution of Covered Software in Source Code Form, including any
-Modifications that You create or to which You contribute, must be under
-the terms of this License. You must inform recipients that the Source
-Code Form of the Covered Software is governed by the terms of this
-License, and how they can obtain a copy of this License. You may not
-attempt to alter or restrict the recipients' rights in the Source Code
-Form.
-
-3.2. Distribution of Executable Form
-
-If You distribute Covered Software in Executable Form then:
-
-(a) such Covered Software must also be made available in Source Code
- Form, as described in Section 3.1, and You must inform recipients of
- the Executable Form how they can obtain a copy of such Source Code
- Form by reasonable means in a timely manner, at a charge no more
- than the cost of distribution to the recipient; and
-
-(b) You may distribute such Executable Form under the terms of this
- License, or sublicense it under different terms, provided that the
- license for the Executable Form does not attempt to limit or alter
- the recipients' rights in the Source Code Form under this License.
-
-3.3. Distribution of a Larger Work
-
-You may create and distribute a Larger Work under terms of Your choice,
-provided that You also comply with the requirements of this License for
-the Covered Software. If the Larger Work is a combination of Covered
-Software with a work governed by one or more Secondary Licenses, and the
-Covered Software is not Incompatible With Secondary Licenses, this
-License permits You to additionally distribute such Covered Software
-under the terms of such Secondary License(s), so that the recipient of
-the Larger Work may, at their option, further distribute the Covered
-Software under the terms of either this License or such Secondary
-License(s).
-
-3.4. Notices
-
-You may not remove or alter the substance of any license notices
-(including copyright notices, patent notices, disclaimers of warranty,
-or limitations of liability) contained within the Source Code Form of
-the Covered Software, except that You may alter any license notices to
-the extent required to remedy known factual inaccuracies.
-
-3.5. Application of Additional Terms
-
-You may choose to offer, and to charge a fee for, warranty, support,
-indemnity or liability obligations to one or more recipients of Covered
-Software. However, You may do so only on Your own behalf, and not on
-behalf of any Contributor. You must make it absolutely clear that any
-such warranty, support, indemnity, or liability obligation is offered by
-You alone, and You hereby agree to indemnify every Contributor for any
-liability incurred by such Contributor as a result of warranty, support,
-indemnity or liability terms You offer. You may include additional
-disclaimers of warranty and limitations of liability specific to any
-jurisdiction.
-
-4. Inability to Comply Due to Statute or Regulation
----------------------------------------------------
-
-If it is impossible for You to comply with any of the terms of this
-License with respect to some or all of the Covered Software due to
-statute, judicial order, or regulation then You must: (a) comply with
-the terms of this License to the maximum extent possible; and (b)
-describe the limitations and the code they affect. Such description must
-be placed in a text file included with all distributions of the Covered
-Software under this License. Except to the extent prohibited by statute
-or regulation, such description must be sufficiently detailed for a
-recipient of ordinary skill to be able to understand it.
-
-5. Termination
---------------
-
-5.1. The rights granted under this License will terminate automatically
-if You fail to comply with any of its terms. However, if You become
-compliant, then the rights granted under this License from a particular
-Contributor are reinstated (a) provisionally, unless and until such
-Contributor explicitly and finally terminates Your grants, and (b) on an
-ongoing basis, if such Contributor fails to notify You of the
-non-compliance by some reasonable means prior to 60 days after You have
-come back into compliance. Moreover, Your grants from a particular
-Contributor are reinstated on an ongoing basis if such Contributor
-notifies You of the non-compliance by some reasonable means, this is the
-first time You have received notice of non-compliance with this License
-from such Contributor, and You become compliant prior to 30 days after
-Your receipt of the notice.
-
-5.2. If You initiate litigation against any entity by asserting a patent
-infringement claim (excluding declaratory judgment actions,
-counter-claims, and cross-claims) alleging that a Contributor Version
-directly or indirectly infringes any patent, then the rights granted to
-You by any and all Contributors for the Covered Software under Section
-2.1 of this License shall terminate.
-
-5.3. In the event of termination under Sections 5.1 or 5.2 above, all
-end user license agreements (excluding distributors and resellers) which
-have been validly granted by You or Your distributors under this License
-prior to termination shall survive termination.
-
-************************************************************************
-* *
-* 6. Disclaimer of Warranty *
-* ------------------------- *
-* *
-* Covered Software is provided under this License on an "as is" *
-* basis, without warranty of any kind, either expressed, implied, or *
-* statutory, including, without limitation, warranties that the *
-* Covered Software is free of defects, merchantable, fit for a *
-* particular purpose or non-infringing. The entire risk as to the *
-* quality and performance of the Covered Software is with You. *
-* Should any Covered Software prove defective in any respect, You *
-* (not any Contributor) assume the cost of any necessary servicing, *
-* repair, or correction. This disclaimer of warranty constitutes an *
-* essential part of this License. No use of any Covered Software is *
-* authorized under this License except under this disclaimer. *
-* *
-************************************************************************
-
-************************************************************************
-* *
-* 7. Limitation of Liability *
-* -------------------------- *
-* *
-* Under no circumstances and under no legal theory, whether tort *
-* (including negligence), contract, or otherwise, shall any *
-* Contributor, or anyone who distributes Covered Software as *
-* permitted above, be liable to You for any direct, indirect, *
-* special, incidental, or consequential damages of any character *
-* including, without limitation, damages for lost profits, loss of *
-* goodwill, work stoppage, computer failure or malfunction, or any *
-* and all other commercial damages or losses, even if such party *
-* shall have been informed of the possibility of such damages. This *
-* limitation of liability shall not apply to liability for death or *
-* personal injury resulting from such party's negligence to the *
-* extent applicable law prohibits such limitation. Some *
-* jurisdictions do not allow the exclusion or limitation of *
-* incidental or consequential damages, so this exclusion and *
-* limitation may not apply to You. *
-* *
-************************************************************************
-
-8. Litigation
--------------
-
-Any litigation relating to this License may be brought only in the
-courts of a jurisdiction where the defendant maintains its principal
-place of business and such litigation shall be governed by laws of that
-jurisdiction, without reference to its conflict-of-law provisions.
-Nothing in this Section shall prevent a party's ability to bring
-cross-claims or counter-claims.
-
-9. Miscellaneous
-----------------
-
-This License represents the complete agreement concerning the subject
-matter hereof. If any provision of this License is held to be
-unenforceable, such provision shall be reformed only to the extent
-necessary to make it enforceable. Any law or regulation which provides
-that the language of a contract shall be construed against the drafter
-shall not be used to construe this License against a Contributor.
-
-10. Versions of the License
----------------------------
-
-10.1. New Versions
-
-Mozilla Foundation is the license steward. Except as provided in Section
-10.3, no one other than the license steward has the right to modify or
-publish new versions of this License. Each version will be given a
-distinguishing version number.
-
-10.2. Effect of New Versions
-
-You may distribute the Covered Software under the terms of the version
-of the License under which You originally received the Covered Software,
-or under the terms of any subsequent version published by the license
-steward.
-
-10.3. Modified Versions
-
-If you create software not governed by this License, and you want to
-create a new license for such software, you may create and use a
-modified version of this License if you rename the license and remove
-any references to the name of the license steward (except to note that
-such modified license differs from this License).
-
-10.4. Distributing Source Code Form that is Incompatible With Secondary
-Licenses
-
-If You choose to distribute Source Code Form that is Incompatible With
-Secondary Licenses under the terms of this version of the License, the
-notice described in Exhibit B of this License must be attached.
-
-Exhibit A - Source Code Form License Notice
--------------------------------------------
-
- This Source Code Form is subject to the terms of the Mozilla Public
- License, v. 2.0. If a copy of the MPL was not distributed with this
- file, You can obtain one at http://mozilla.org/MPL/2.0/.
-
-If it is not possible or desirable to put the notice in a particular
-file, then You may include the notice in a location (such as a LICENSE
-file in a relevant directory) where a recipient would be likely to look
-for such a notice.
-
-You may add additional accurate notices of copyright ownership.
-
-Exhibit B - "Incompatible With Secondary Licenses" Notice
----------------------------------------------------------
-
- This Source Code Form is "Incompatible With Secondary Licenses", as
- defined by the Mozilla Public License, v. 2.0.
+ Apache License
+ Version 2.0, January 2004
+ http://www.apache.org/licenses/
+
+ TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+ 1. Definitions.
+
+ "License" shall mean the terms and conditions for use, reproduction,
+ and distribution as defined by Sections 1 through 9 of this document.
+
+ "Licensor" shall mean the copyright owner or entity authorized by
+ the copyright owner that is granting the License.
+
+ "Legal Entity" shall mean the union of the acting entity and all
+ other entities that control, are controlled by, or are under common
+ control with that entity. For the purposes of this definition,
+ "control" means (i) the power, direct or indirect, to cause the
+ direction or management of such entity, whether by contract or
+ otherwise, or (ii) ownership of fifty percent (50%) or more of the
+ outstanding shares, or (iii) beneficial ownership of such entity.
+
+ "You" (or "Your") shall mean an individual or Legal Entity
+ exercising permissions granted by this License.
+
+ "Source" form shall mean the preferred form for making modifications,
+ including but not limited to software source code, documentation
+ source, and configuration files.
+
+ "Object" form shall mean any form resulting from mechanical
+ transformation or translation of a Source form, including but
+ not limited to compiled object code, generated documentation,
+ and conversions to other media types.
+
+ "Work" shall mean the work of authorship, whether in Source or
+ Object form, made available under the License, as indicated by a
+ copyright notice that is included in or attached to the work
+ (an example is provided in the Appendix below).
+
+ "Derivative Works" shall mean any work, whether in Source or Object
+ form, that is based on (or derived from) the Work and for which the
+ editorial revisions, annotations, elaborations, or other modifications
+ represent, as a whole, an original work of authorship. For the purposes
+ of this License, Derivative Works shall not include works that remain
+ separable from, or merely link (or bind by name) to the interfaces of,
+ the Work and Derivative Works thereof.
+
+ "Contribution" shall mean any work of authorship, including
+ the original version of the Work and any modifications or additions
+ to that Work or Derivative Works thereof, that is intentionally
+ submitted to Licensor for inclusion in the Work by the copyright owner
+ or by an individual or Legal Entity authorized to submit on behalf of
+ the copyright owner. For the purposes of this definition, "submitted"
+ means any form of electronic, verbal, or written communication sent
+ to the Licensor or its representatives, including but not limited to
+ communication on electronic mailing lists, source code control systems,
+ and issue tracking systems that are managed by, or on behalf of, the
+ Licensor for the purpose of discussing and improving the Work, but
+ excluding communication that is conspicuously marked or otherwise
+ designated in writing by the copyright owner as "Not a Contribution."
+
+ "Contributor" shall mean Licensor and any individual or Legal Entity
+ on behalf of whom a Contribution has been received by Licensor and
+ subsequently incorporated within the Work.
+
+ 2. Grant of Copyright License. Subject to the terms and conditions of
+ this License, each Contributor hereby grants to You a perpetual,
+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+ copyright license to reproduce, prepare Derivative Works of,
+ publicly display, publicly perform, sublicense, and distribute the
+ Work and such Derivative Works in Source or Object form.
+
+ 3. Grant of Patent License. Subject to the terms and conditions of
+ this License, each Contributor hereby grants to You a perpetual,
+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+ (except as stated in this section) patent license to make, have made,
+ use, offer to sell, sell, import, and otherwise transfer the Work,
+ where such license applies only to those patent claims licensable
+ by such Contributor that are necessarily infringed by their
+ Contribution(s) alone or by combination of their Contribution(s)
+ with the Work to which such Contribution(s) was submitted. If You
+ institute patent litigation against any entity (including a
+ cross-claim or counterclaim in a lawsuit) alleging that the Work
+ or a Contribution incorporated within the Work constitutes direct
+ or contributory patent infringement, then any patent licenses
+ granted to You under this License for that Work shall terminate
+ as of the date such litigation is filed.
+
+ 4. Redistribution. You may reproduce and distribute copies of the
+ Work or Derivative Works thereof in any medium, with or without
+ modifications, and in Source or Object form, provided that You
+ meet the following conditions:
+
+ (a) You must give any other recipients of the Work or
+ Derivative Works a copy of this License; and
+
+ (b) You must cause any modified files to carry prominent notices
+ stating that You changed the files; and
+
+ (c) You must retain, in the Source form of any Derivative Works
+ that You distribute, all copyright, patent, trademark, and
+ attribution notices from the Source form of the Work,
+ excluding those notices that do not pertain to any part of
+ the Derivative Works; and
+
+ (d) If the Work includes a "NOTICE" text file as part of its
+ distribution, then any Derivative Works that You distribute must
+ include a readable copy of the attribution notices contained
+ within such NOTICE file, excluding those notices that do not
+ pertain to any part of the Derivative Works, in at least one
+ of the following places: within a NOTICE text file distributed
+ as part of the Derivative Works; within the Source form or
+ documentation, if provided along with the Derivative Works; or,
+ within a display generated by the Derivative Works, if and
+ wherever such third-party notices normally appear. The contents
+ of the NOTICE file are for informational purposes only and
+ do not modify the License. You may add Your own attribution
+ notices within Derivative Works that You distribute, alongside
+ or as an addendum to the NOTICE text from the Work, provided
+ that such additional attribution notices cannot be construed
+ as modifying the License.
+
+ You may add Your own copyright statement to Your modifications and
+ may provide additional or different license terms and conditions
+ for use, reproduction, or distribution of Your modifications, or
+ for any such Derivative Works as a whole, provided Your use,
+ reproduction, and distribution of the Work otherwise complies with
+ the conditions stated in this License.
+
+ 5. Submission of Contributions. Unless You explicitly state otherwise,
+ any Contribution intentionally submitted for inclusion in the Work
+ by You to the Licensor shall be under the terms and conditions of
+ this License, without any additional terms or conditions.
+ Notwithstanding the above, nothing herein shall supersede or modify
+ the terms of any separate license agreement you may have executed
+ with Licensor regarding such Contributions.
+
+ 6. Trademarks. This License does not grant permission to use the trade
+ names, trademarks, service marks, or product names of the Licensor,
+ except as required for reasonable and customary use in describing the
+ origin of the Work and reproducing the content of the NOTICE file.
+
+ 7. Disclaimer of Warranty. Unless required by applicable law or
+ agreed to in writing, Licensor provides the Work (and each
+ Contributor provides its Contributions) on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+ implied, including, without limitation, any warranties or conditions
+ of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+ PARTICULAR PURPOSE. You are solely responsible for determining the
+ appropriateness of using or redistributing the Work and assume any
+ risks associated with Your exercise of permissions under this License.
+
+ 8. Limitation of Liability. In no event and under no legal theory,
+ whether in tort (including negligence), contract, or otherwise,
+ unless required by applicable law (such as deliberate and grossly
+ negligent acts) or agreed to in writing, shall any Contributor be
+ liable to You for damages, including any direct, indirect, special,
+ incidental, or consequential damages of any character arising as a
+ result of this License or out of the use or inability to use the
+ Work (including but not limited to damages for loss of goodwill,
+ work stoppage, computer failure or malfunction, or any and all
+ other commercial damages or losses), even if such Contributor
+ has been advised of the possibility of such damages.
+
+ 9. Accepting Warranty or Additional Liability. While redistributing
+ the Work or Derivative Works thereof, You may choose to offer,
+ and charge a fee for, acceptance of support, warranty, indemnity,
+ or other liability obligations and/or rights consistent with this
+ License. However, in accepting such obligations, You may act only
+ on Your own behalf and on Your sole responsibility, not on behalf
+ of any other Contributor, and only if You agree to indemnify,
+ defend, and hold each Contributor harmless for any liability
+ incurred by, or claims asserted against, such Contributor by reason
+ of your accepting any such warranty or additional liability.
+
+ END OF TERMS AND CONDITIONS
+
+ APPENDIX: How to apply the Apache License to your work.
+
+ To apply the Apache License to your work, attach the following
+ boilerplate notice, with the fields enclosed by brackets "[]"
+ replaced with your own identifying information. (Don't include
+ the brackets!) The text should be enclosed in the appropriate
+ comment syntax for the file format. We also recommend that a
+ file or class name and description of purpose be included on the
+ same "printed page" as the copyright notice for easier
+ identification within third-party archives.
+
+ Copyright [yyyy] [name of copyright owner]
+
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
diff --git a/README.rst b/README.rst
index a44546a..bb761a0 100644
--- a/README.rst
+++ b/README.rst
@@ -6,11 +6,11 @@ For full API reference documentation, visit https://fabiankueppers.github.io/cal
Copyright (C) 2019-2021 Ruhr West University of Applied Sciences, Bottrop, Germany
AND Elektronische Fahrwerksysteme GmbH, Gaimersheim, Germany
-This Source Code Form is subject to the terms of the Mozilla Public
-License, v. 2.0. If a copy of the MPL was not distributed with this
-file, You can obtain one at http://mozilla.org/MPL/2.0/.
+This Source Code Form is subject to the terms of the Apache License,
+Version 2.0. If a copy of the license was not distributed with this
+file, You can obtain one at https://www.apache.org/licenses/LICENSE-2.0.txt.
-If you use this framework or parts of it for your research, please cite it by::
+**Important: updated references!** If you use this framework (*classification or detection*) or parts of it for your research, please cite it by::
@InProceedings{Kueppers_2020_CVPR_Workshops,
author = {Küppers, Fabian and Kronenberger, Jan and Shantia, Amirhossein and Haselhoff, Anselm},
@@ -20,6 +20,16 @@ If you use this framework or parts of it for your research, please cite it by::
year = {2020}
}
+*If you use Bayesian calibration methods with uncertainty, please cite it by*::
+
+ @InProceedings{Kueppers_2021_IV,
+ author = {Küppers, Fabian and Kronenberger, Jan and Schneider, Jonas and Haselhoff, Anselm},
+ title = {Bayesian Confidence Calibration for Epistemic Uncertainty Modelling},
+ booktitle = {Proceedings of the IEEE Intelligent Vehicles Symposium (IV)},
+ month = {July},
+ year = {2021},
+ }
+
.. contents:: Table of Contents
:depth: 2
@@ -30,6 +40,21 @@ This framework is designed to calibrate the confidence estimates of classifiers
For example: given 100 predictions with a confidence of 80% of each prediction, the observed accuracy should also match 80% (neither more nor less). This behaviour is achievable with several calibration methods.
+Update on version 1.2
+---------------------
+TL;DR:
+- Bayesian confidence calibration: train and infer scaling methods using variational inference (VI) and MCMC sampling
+- New metrics: MMCE [13]_ and PICP [14]_ (*netcal.metrics.MMCE* and *netcal.metrics.PICP*)
+- New regularization methods: MMCE [13]_ and DCA [15]_ (*netcal.regularization.MMCEPenalty* and *netcal.regularization.DCAPenalty*)
+- Updated examples
+- Switched license from MPL 2.0 to Apache License 2.0
+
+Now you can also use Bayesian methods to obtain uncertainty estimates within a calibration mapping, mainly in the *netcal.scaling* package. We adapted Markov-Chain Monte-Carlo (MCMC) sampling as well as Variational Inference (VI) to common calibration methods.
+It is also possible to run the scaling methods on CUDA in order to speed up the computations. We further provide new metrics to evaluate confidence calibration (MMCE) and to evaluate the quality of prediction intervals (PICP).
+Finally, we extended our framework with new regularization methods that can be used during model training (MMCE and DCA).
+
+Update on version 1.1
+---------------------
This framework can also be used to calibrate object detection models. It has recently been shown that calibration on object detection also depends on the position and/or scale of a predicted object [12]_. We provide calibration methods to perform confidence calibration w.r.t. the additional box regression branch.
For this purpose, we extended the commonly used Histogram Binning [3]_, Logistic Calibration alias Platt scaling [10]_ and the Beta Calibration method [2]_ to also include the bounding box information into a calibration mapping.
Furthermore, we provide two new methods called the *Dependent Logistic Calibration* and the *Dependent Beta Calibration* that are not only able to perform a calibration mapping
@@ -58,12 +83,16 @@ Or simply invoke the following command to install the calibration suite::
Requirements
------------
-- numpy>=1.15
+- numpy>=1.17
- scipy>=1.3
- matplotlib>=3.1
-- scikit-learn>=0.20.0
-- torch>=1.1
-- tqdm
+- scikit-learn>=0.21
+- torch>=1.4
+- torchvision>=0.5.0
+- tqdm>=4.40
+- pyro-ppl>=1.3
+- tikzplotlib>=0.9.8
+- tensorboard>=2.2
Calibration Metrics
@@ -74,10 +103,12 @@ For object detection, we implemented the *Detection Calibration Error* (D-ECE) [
- (Detection) Expected Calibration Error [1]_, [12]_ (*netcal.metrics.ECE*)
- (Detection) Maximum Calibration Error [1]_, [12]_ (*netcal.metrics.MCE*)
- (Detection) Average Calibration Error [11]_, [12]_ (*netcal.metrics.ACE*)
+- Maximum Mean Calibration Error (MMCE) [13]_ (*netcal.metrics.MMCE*) (no position-dependency)
+- Prediction Interval Coverage Probability (PICP) [14]_ (*netcal.metrics.PICP*) - this score is not a direct measure of confidence calibration but rather measures the quality of uncertainty prediction intervals.
Methods
-==========
-The calibration methods are separated into binning and scaling methods. The binning methods divide the available information into several bins (like ECE or D-ECE) and perform calibration on each bin. The scaling methods scale the confidence estimates or logits directly to calibrated confidence estimates - on detection calibration, this is done w.r.t. the additional regression branch of a network.
+=======
+The post-hoc calibration methods are separated into binning and scaling methods. The binning methods divide the available information into several bins (like ECE or D-ECE) and perform calibration on each bin. The scaling methods scale the confidence estimates or logits directly to calibrated confidence estimates - on detection calibration, this is done w.r.t. the additional regression branch of a network.
Important: if you use the detection mode, you need to specify the flag "detection=True" in the constructor of the corresponding method (this is not necessary for *netcal.scaling.LogisticCalibrationDependent* and *netcal.scaling.BetaCalibrationDependent*).
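To make the binning idea concrete, classical Histogram Binning [3]_ can be sketched in a few lines of NumPy (a toy version with illustrative function names, not the *netcal.binning.HistogramBinning* implementation):

```python
import numpy as np

def fit_histogram_binning(conf, y, n_bins=10):
    """Estimate the average accuracy per equally spaced confidence bin."""
    edges = np.linspace(0.0, 1.0, n_bins + 1)
    idx = np.clip(np.digitize(conf, edges[1:-1]), 0, n_bins - 1)
    calib = np.array([y[idx == b].mean() if np.any(idx == b) else 0.0
                      for b in range(n_bins)])
    return edges, calib

def apply_histogram_binning(conf, edges, calib):
    """Map each confidence to the accuracy of its bin."""
    idx = np.clip(np.digitize(conf, edges[1:-1]), 0, len(calib) - 1)
    return calib[idx]
```

Scaling methods instead fit a parametric function on the confidences (or logits), which avoids the discontinuities of such a binning scheme.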
@@ -106,14 +137,22 @@ Implemented scaling methods are:
- Beta Calibration for classification [2]_ and object detection [12]_ (*netcal.scaling.BetaCalibration*)
- Dependent Beta Calibration for object detection [12]_ (*netcal.scaling.BetaCalibrationDependent*) - on detection, this method is able to capture correlations between all input quantities and should be preferred over Beta Calibration for object detection
+**New in version 1.2:** you can provide a parameter named "method" to the constructor of each scaling method. This parameter may be one of the following:
+- 'mle': feed-forward with maximum likelihood estimates of the calibration parameters (default)
+- 'momentum': use non-convex momentum optimization (e.g. the default for dependent beta calibration)
+- 'mcmc': use Markov-Chain Monte-Carlo sampling to obtain multiple parameter sets in order to quantify uncertainty in the calibration
+- 'variational': use Variational Inference to obtain multiple parameter sets in order to quantify uncertainty in the calibration
+
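For intuition on the 'mle' option: Platt scaling [10]_, for instance, fits its parameters by maximizing the likelihood of the labels given the logit of the confidence. A self-contained NumPy sketch via gradient descent on the negative log-likelihood (simplified; the actual netcal optimizers differ):

```python
import numpy as np

def fit_platt(conf, y, lr=0.1, epochs=2000):
    """MLE for p(y=1|c) = sigmoid(a * logit(c) + b) via gradient descent."""
    z = np.log(conf / (1.0 - conf))   # logit of the uncalibrated confidence
    a, b = 1.0, 0.0
    for _ in range(epochs):
        p = 1.0 / (1.0 + np.exp(-(a * z + b)))
        grad = p - y                  # gradient of the NLL w.r.t. the logit
        a -= lr * float(np.mean(grad * z))
        b -= lr * float(np.mean(grad))
    return a, b
```

The 'mcmc' and 'variational' options replace this single point estimate by a distribution over (a, b), which is what enables the uncertainty quantification described below.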
Regularization
--------------
-Implemented regularization methods are:
+With some effort, it is also possible to push the model training towards calibrated confidences by regularization. Implemented regularization methods are:
-- Confidence Penalty [8]_ (*netcal.regularization.confidence_penalty*)
+- Confidence Penalty [8]_ (*netcal.regularization.confidence_penalty* and *netcal.regularization.ConfidencePenalty* - the latter is a PyTorch module that can be used as a regularization term)
+- Maximum Mean Calibration Error (MMCE) [13]_ (*netcal.regularization.MMCEPenalty* - PyTorch regularization module)
+- DCA [15]_ (*netcal.regularization.DCAPenalty* - PyTorch regularization module)
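The confidence penalty of [8]_ adds the negative weighted entropy of the predictive distribution to the training loss, L = NLL - β·H(p), which penalizes overconfident (low-entropy) outputs. A minimal NumPy sketch of the penalty term (illustrative; *netcal.regularization.ConfidencePenalty* is the PyTorch counterpart):

```python
import numpy as np

def confidence_penalty(probs, beta=0.1, eps=1e-12):
    """Negative weighted entropy of each predicted distribution, averaged over
    the batch; adding it to the loss rewards higher-entropy (less peaky) outputs."""
    entropy = -np.sum(probs * np.log(probs + eps), axis=1)
    return float(-beta * np.mean(entropy))
```

A uniform prediction yields the most negative penalty (largest loss reduction), while a one-hot prediction contributes a penalty near zero.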
Visualization
-================
+=============
For visualization of miscalibration, one can use Confidence Histograms and Reliability Diagrams. Similar to the ECE, the output space is divided into equally spaced bins, and the calibration gap between bin accuracy and bin confidence is visualized as a histogram.
On detection calibration, the miscalibration can be visualized either along one additional box dimension (e.g. the x-position of the predictions) or over two additional box dimensions as a heatmap.
@@ -121,7 +160,7 @@ On detection calibration, the miscalibration can be visualized either along one
- Reliability Diagram [1]_, [12]_ (*netcal.presentation.ReliabilityDiagram*)
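The data behind a reliability diagram is straightforward to compute. A NumPy sketch of the per-bin confidence and accuracy it plots (illustrative names; the plotting itself is what *netcal.presentation.ReliabilityDiagram* provides):

```python
import numpy as np

def reliability_bins(conf, correct, n_bins=10):
    """Per-bin mean confidence and accuracy; their gap is the miscalibration."""
    edges = np.linspace(0.0, 1.0, n_bins + 1)
    idx = np.clip(np.digitize(conf, edges[1:-1]), 0, n_bins - 1)
    bin_conf = np.array([conf[idx == b].mean() if np.any(idx == b) else np.nan
                         for b in range(n_bins)])
    bin_acc = np.array([correct[idx == b].mean() if np.any(idx == b) else np.nan
                        for b in range(n_bins)])
    return bin_conf, bin_acc
```

A perfectly calibrated model has bin_acc equal to bin_conf in every non-empty bin.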
Examples
-===========
+========
The calibration methods work with the predicted confidence estimates of a neural network and on detection also with the bounding box regression branch.
Classification
@@ -170,7 +209,7 @@ The miscalibration can be visualized with a Reliability Diagram:
Detection
---------
-This is a basic example which uses softmax predictions of a classification task with 10 classes and the given NumPy arrays:
+In this example we use the confidence predictions of an object detection model together with the corresponding x-position of the predicted bounding boxes. The ground truth provided to the calibration algorithm denotes whether a bounding box matched a ground-truth box at a certain IoU with the correct class label.
.. code-block:: python
@@ -187,11 +226,11 @@ This is an example for *netcal.scaling.LogisticCalibration* and *netcal.scaling.
input = np.stack((confidences, relative_x_position), axis=1)
- lr = LogisticCalibration(detection=True) # flag 'detection=True' is mandatory for this method
+ lr = LogisticCalibration(detection=True, use_cuda=False) # flag 'detection=True' is mandatory for this method
lr.fit(input, matched)
calibrated = lr.transform(input)
- lr_dependent = LogisticCalibrationDependent() # flag 'detection=True' is not necessary as this method is only defined for detection
+ lr_dependent = LogisticCalibrationDependent(use_cuda=False) # flag 'detection=True' is not necessary as this method is only defined for detection
lr_dependent.fit(input, matched)
calibrated = lr_dependent.transform(input)
@@ -220,6 +259,89 @@ The miscalibration can be visualized with a Reliability Diagram:
diagram.plot(input, matched) # visualize miscalibration of uncalibrated
diagram.plot(input_calibrated, matched) # visualize miscalibration of calibrated
+Uncertainty in Calibration
+--------------------------
+We can also quantify the uncertainty in a calibration mapping if we use a Bayesian view on the calibration models. We can sample multiple parameter sets using MCMC sampling or VI. In this example, we reuse the data of the previous detection example.
+
+.. code-block:: python
+
+ matched # binary NumPy 1-D array (0, 1) that indicates if a bounding box has matched a ground truth at a certain IoU with the right label - shape: (n_samples,)
+ confidences # NumPy 1-D array with confidence estimates between 0-1 - shape: (n_samples,)
+ relative_x_position # NumPy 1-D array with relative center-x position between 0-1 of each prediction - shape: (n_samples,)
+
+This is an example for *netcal.scaling.LogisticCalibration* and *netcal.scaling.LogisticCalibrationDependent* but also works for every calibration method (note the different constructor parameters):
+
+.. code-block:: python
+
+ import numpy as np
+ from netcal.scaling import LogisticCalibration, LogisticCalibrationDependent
+
+ input = np.stack((confidences, relative_x_position), axis=1)
+
+ # flag 'detection=True' is mandatory for this method
+ # use Variational Inference with 2000 optimization steps for creating this calibration mapping
+ lr = LogisticCalibration(detection=True, method='variational', vi_epochs=2000, use_cuda=False)
+ lr.fit(input, matched)
+
+ # 'num_samples=1000': sample 1000 parameter sets from VI
+ # thus, 'calibrated' has shape [1000, n_samples]
+ calibrated = lr.transform(input, num_samples=1000)
+
+ # flag 'detection=True' is not necessary as this method is only defined for detection
+ # this time, use Markov-Chain Monte-Carlo sampling with 250 warm-up steps, 250 parameter samples and one chain
+ lr_dependent = LogisticCalibrationDependent(method='mcmc',
+ mcmc_warmup_steps=250, mcmc_steps=250, mcmc_chains=1,
+ use_cuda=False)
+ lr_dependent.fit(input, matched)
+
+ # 'num_samples=1000': although we have only sampled 250 different parameter sets,
+ # we can randomly sample 1000 parameter sets from MCMC
+ calibrated = lr_dependent.transform(input, num_samples=1000)
+
+You can directly pass the output to the D-ECE and PICP instances to measure miscalibration and uncertainty quality:
+
+.. code-block:: python
+
+ from netcal.metrics import ECE
+ from netcal.metrics import PICP
+
+ n_bins = 10
+ ece = ECE(n_bins, detection=True)
+ picp = PICP(n_bins, detection=True)
+
+ # the following function calls are equivalent:
+ miscalibration = ece.measure(calibrated, matched, uncertainty="mean")
+ miscalibration = ece.measure(np.mean(calibrated, axis=0), matched)
+
+ # now determine uncertainty quality
+ uncertainty = picp.measure(calibrated, matched, uncertainty="mean")
+
+ print("D-ECE:", miscalibration)
+ print("PICP:", uncertainty.picp) # prediction coverage probability
+ print("MPIW:", uncertainty.mpiw) # mean prediction interval width
+
+If we want to measure miscalibration and uncertainty quality as a function of the relative x-position, we need to broadcast the corresponding information:
+
+.. code-block:: python
+
+ # broadcast and stack x information to calibrated information
+ broadcasted = np.broadcast_to(relative_x_position, calibrated.shape)
+ calibrated = np.stack((calibrated, broadcasted), axis=2)
+
+ n_bins = [10, 10]
+ ece = ECE(n_bins, detection=True)
+ picp = PICP(n_bins, detection=True)
+
+ # the following function calls are equivalent:
+ miscalibration = ece.measure(calibrated, matched, uncertainty="mean")
+ miscalibration = ece.measure(np.mean(calibrated, axis=0), matched)
+
+ # now determine uncertainty quality
+ uncertainty = picp.measure(calibrated, matched, uncertainty="mean")
+
+ print("D-ECE:", miscalibration)
+ print("PICP:", uncertainty.picp) # prediction coverage probability
+ print("MPIW:", uncertainty.mpiw) # mean prediction interval width
+
References
==========
.. [1] Naeini, Mahdi Pakdaman, Gregory Cooper, and Milos Hauskrecht: "Obtaining well calibrated probabilities using bayesian binning." Twenty-Ninth AAAI Conference on Artificial Intelligence, 2015.
@@ -234,3 +356,6 @@ References
.. [10] Platt, John: "Probabilistic outputs for support vector machines and comparisons to regularized likelihood methods." Advances in large margin classifiers, 10(3): 61–74, 1999.
.. [11] Neumann, Lukas, Andrew Zisserman, and Andrea Vedaldi: "Relaxed Softmax: Efficient Confidence Auto-Calibration for Safe Pedestrian Detection." Conference on Neural Information Processing Systems (NIPS) Workshop MLITS, 2018.
.. [12] Fabian Küppers, Jan Kronenberger, Amirhossein Shantia and Anselm Haselhoff: "Multivariate Confidence Calibration for Object Detection." The IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops, 2020.
+.. [13] Kumar, Aviral, Sunita Sarawagi, and Ujjwal Jain: "Trainable calibration measures for neural networks from kernel mean embeddings." International Conference on Machine Learning, 2018.
+.. [14] Jiayu Yao, Weiwei Pan, Soumya Ghosh, and Finale Doshi-Velez: "Quality of Uncertainty Quantification for Bayesian Neural Network Inference." Workshop on Uncertainty and Robustness in Deep Learning, ICML, 2019.
+.. [15] Liang, Gongbo, et al.: "Improved trainable calibration method for neural networks on medical imaging classification." arXiv preprint arXiv:2009.04057, 2020.
diff --git a/docs/build/html/.buildinfo b/docs/build/html/.buildinfo
index 515f083..299fd67 100644
--- a/docs/build/html/.buildinfo
+++ b/docs/build/html/.buildinfo
@@ -1,4 +1,4 @@
# Sphinx build info version 1
# This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done.
-config: 78e6332c97a52e1ea66f816824406211
+config: e4be416fe1fade80beef75b5aa42bfc9
tags: 645f666f9bcd5a90fca523b33c5a78b7
diff --git a/docs/build/html/_autosummary/_autosummary_binning/netcal.binning.BBQ.html b/docs/build/html/_autosummary/_autosummary_binning/netcal.binning.BBQ.html
index 16e9055..7bc505e 100644
--- a/docs/build/html/_autosummary/_autosummary_binning/netcal.binning.BBQ.html
+++ b/docs/build/html/_autosummary/_autosummary_binning/netcal.binning.BBQ.html
@@ -4,7 +4,7 @@
Bayesian Binning into Quantiles (BBQ). This method is originally proposed by 1. This method utilizes multiple HistogramBinning
+
Bayesian Binning into Quantiles (BBQ) 1. This method utilizes multiple HistogramBinning
instances with different amounts of bins and computes a weighted sum of all methods to obtain a
well-calibrated confidence estimate. The scoring function “BDeu”, which is proposed in the original paper,
is currently not supported.
@@ -82,6 +82,8 @@
netcal.binning.BBQ
-
__init__([score_function, detection, …])
+
__init__([score_function, equal_intervals, …])
Constructor.
clear()
@@ -124,10 +126,10 @@
netcal.binning.BBQ
load_model(filename)
-
Load model from saved Pickle instance.
+
Load model from saved torch dump.
save_model(filename)
-
Save model instance as Pickle Object.
+
Save model instance with torch’s save function as this is safer for torch tensors.
Ensemble of Near Isotonic Regression (ENIR) models. This method is originally proposed by 1. These models allow - in contrast to standard
+
Ensemble of Near Isotonic Regression (ENIR) models 1. These models allow - in contrast to the standard
IsotonicRegression method - a violation of the monotonicity restrictions. Using the modified
Pool-Adjacent-Violators Algorithm (mPAVA), this method builds multiple Near Isotonic Regression models
and weights them by a certain score function.
@@ -125,10 +125,10 @@
netcal.binning.ENIR
load_model(filename)
-
Load model from saved Pickle instance.
+
Load model from saved torch dump.
save_model(filename)
-
Save model instance as Pickle Object.
+
Save model instance with torch’s save function as this is safer for torch tensors.
Simple Histogram Binning calibration method. This method is originally proposed by 1. Each prediction is sorted into a bin
+
Simple Histogram Binning calibration method 1. Each prediction is sorted into a bin
and assigned its calibrated confidence estimate. This method normally works for binary
classification. For multiclass classification, this method is applied in a one-vs-all manner 2.
-
The bin boundaries are either chosen to be
-equal length intervals or to equalize the number of samples in each bin.
+
The bin boundaries are either chosen to be equal length intervals or to equalize the number of samples in each bin.
On object detection, use a multidimensional binning to include additional information of the box
regression branch 3.
@@ -109,7 +108,7 @@
netcal.binning.HistogramBinning
clear()
Clear model parameters.
-
fit(X, y)
+
fit(X, y[, random_state, tensorboard, log_dir])
Function call to build the calibration model.
fit_transform(X[, y])
@@ -122,10 +121,10 @@
netcal.binning.HistogramBinning
load_model(filename)
-
Load model from saved Pickle instance.
+
Load model from saved torch dump.
save_model(filename)
-
Save model instance as Pickle Object.
+
Save model instance with torch’s save function as this is safer for torch tensors.
set_params(**params)
Set the parameters of this estimator.
@@ -133,7 +132,7 @@
netcal.binning.HistogramBinning
squeeze_generic(a, axes_to_keep)
Squeeze input array a but keep axes defined by parameter ‘axes_to_keep’ even if the dimension is of size 1.
-
transform(X)
+
transform(X[, num_samples, random_state])
After model calibration, this function is used to get calibrated outputs of uncalibrated confidence estimates.
+transform(X: numpy.ndarray, num_samples: int = 1, random_state: int = None) → numpy.ndarray
After model calibration, this function is used to get calibrated outputs of uncalibrated
confidence estimates.
Parameters
-
X (np.ndarray, shape=(n_samples, [n_classes])) – NumPy array with uncalibrated confidence estimates.
-1-D for binary classification, 2-D for multi class (softmax).
+
+
X (np.ndarray, shape=(n_samples, [n_classes])) – NumPy array with uncalibrated confidence estimates.
+1-D for binary classification, 2-D for multi class (softmax).
+
num_samples (int, optional, default: 1000) – Number of samples generated on MCMC sampling or Variational Inference - only for compatibility and
+not used by Histogram Binning!
+
random_state (int, optional, default: None) – Fix the random seed for the random number generator.
+
Returns
NumPy array with calibrated confidence estimates.
@@ -362,7 +367,7 @@
Isotonic Regression method. This method is originally proposed by 1. This method is similar to HistogramBinning but with dynamic bin sizes
+
Isotonic Regression method 1. This method is similar to HistogramBinning but with dynamic bin sizes
and boundaries. A piecewise constant function gets fit to ground truth labels sorted by
given confidence estimates.
@@ -99,10 +99,10 @@
netcal.binning.IsotonicRegression
load_model(filename)
-
Load model from saved Pickle instance.
+
Load model from saved torch dump.
save_model(filename)
-
Save model instance as Pickle Object.
+
Save model instance with torch’s save function as this is safer for torch tensors.
Perform binning on value (and all additional values passed) based on samples.
+
+
Parameters
+
+
bin_bounds (list, length=samples.shape[1]) – Binning boundaries used for each dimension given in ‘samples’ parameter.
+
samples (np.ndarray of shape (n_samples, n_features)) – Array used to group all samples into bins.
+
*values (instances np.ndarray of shape (n_samples, 1)) – Arrays whose values are binned.
+
nan (float, optional, default: 0.0) – If a bin has no samples or fewer than the defined sample_threshold, the corresponding bin is marked as
+NaN. Specify a fill float to insert instead of NaN.
+
+
+
Returns
+
+
tuple of length equal to the amount of passed value arrays with binning schemes and an additional histogram
+
with number of samples in each bin as well as an index tuple containing the bin indices.
Measure calibration by given predictions with confidence and the according ground truth.
Assume binary predictions with y=1.
Parameters
-
X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction on classification with shapes
+
X (iterable of np.ndarray, or np.ndarray of shape=([n_bayes], n_samples, [n_classes/n_box_features])) – NumPy array with confidence values for each prediction on classification with shapes
1-D for binary classification, 2-D for multi class (softmax).
+If 3-D, interpret the first dimension as samples from a Bayesian estimator with multiple data points
+for a single sample (e.g. variational inference or MC dropout samples).
+If this is an iterable over multiple instances of np.ndarray and parameter batched=True,
+interpret this parameter as multiple predictions that should be averaged.
On detection, this array must have 2 dimensions with number of additional box features in last dim.
-
y (np.ndarray, shape=(n_samples, [n_classes])) – NumPy array with ground truth labels.
-Either as label vector (1-D) or as one-hot encoded ground truth array (2-D).
+
y (iterable of np.ndarray with same length as X or np.ndarray of shape=([n_bayes], n_samples, [n_classes])) – NumPy array with ground truth labels.
+Either as label vector (1-D) or as one-hot encoded ground truth array (2-D).
+If 3-D, interpret the first dimension as samples from a Bayesian estimator with multiple data points
+for a single sample (e.g. variational inference or MC dropout samples).
+If iterable over multiple instances of np.ndarray and parameter batched=True,
+interpret this parameter as multiple predictions that should be averaged.
+
batched (bool, optional, default: False) – Multiple predictions can be evaluated at once (e.g. cross-validation examinations) using batched-mode.
+All predictions given by X and y are separately evaluated and their results are averaged afterwards
+for visualization.
+
uncertainty (str, optional, default: False) –
Define uncertainty handling if input X has been sampled e.g. by Monte-Carlo dropout or similar methods
+that output an ensemble of predictions per sample. Choose one of the following options:
+- flatten: treat everything as a separate prediction - this option will yield a slightly better
+calibration performance but without the visualization of a prediction interval.
+- mean: compute Monte-Carlo integration to obtain a simple confidence estimate for a sample
+(mean) with a standard deviation that is visualized.
return_map (bool, optional, default: False) – If True, return map with miscalibration metric separated into all remaining dimension bins.
return_num_samples (bool, optional, default: False) – If True, also return the number of samples in each bin.
+
return_uncertainty_map (bool, optional, default: False) – If True, also return the average deviation of the confidence within each bin.
Returns
-
Always returns miscalibration metric.
-If ‘return_map’ is False, return ACE only (or num_samples map).
-If ‘return_map’ is True, return tuple with ACE and map over all bins.
-If ‘return_num_samples’ is False, ACE only (or ACE map).
-If ‘return_num_samples’ is True, return tuple with ACE and number of samples in each bin.
+
Always returns Average Calibration Error.
+If ‘return_map’ is True, return tuple and append miscalibration map over all bins.
+If ‘return_num_samples’ is True, return tuple and append the number of samples in each bin (excluding confidence dimension).
+If ‘return_uncertainty_map’ is True, return tuple and append the average standard deviation of confidence within each bin (excluding confidence dimension).
Return type
-
float or tuple of (float, np.ndarray) or tuple of (float, np.ndarray, np.ndarray)
+
float or tuple of (float, np.ndarray, [np.ndarray, [np.ndarray]])
Determine miscalibration based on passed histograms.
Parameters
-
a (np.ndarray) – NumPy array that should be squeezed.
-
axes_to_keep (int or iterable) – Axes that should be kept even if they have a size of 1.
+
metric (str) – Identifier to specify the used metric. Must be one of ‘ace’, ‘ece’ or ‘mce’.
+
acc_hist (np.ndarray of shape (n_bins, [n_bins, [n_bins, [..]]])) – Histogram with average accuracy in each bin.
+
conf_hist (np.ndarray of shape (n_bins, [n_bins, [n_bins, [..]]])) – Histogram with average confidence in each bin.
+
variance_hist (np.ndarray of shape (n_bins, [n_bins, [n_bins, [..]]])) – Histogram with average variance in each bin. This array is currently not used but
+might be utilized in the future.
+
num_samples_hist (np.ndarray of shape (n_bins, [n_bins, [n_bins, [..]]])) – Histogram with number of samples in each bin.
Returns
-
Squeezed array.
-
-
Return type
-
np.ndarray
+
+
tuple of length 6 (miscalibration score, miscalibration map, accuracy map, confidence map, variance map, num samples map)
Calculate the weighted mean on a given histogram based on a dedicated data distribution.
+If ‘reduce_result’ is given, reuse the data distribution of the previous result instead of the distribution
+given by ‘distribution’ parameter.
Perform binning on value (and all additional values passed) based on samples.
+
+
Parameters
+
+
bin_bounds (list, length=samples.shape[1]) – Binning boundaries used for each dimension given in ‘samples’ parameter.
+
samples (np.ndarray of shape (n_samples, n_features)) – Array used to group all samples into bins.
+
*values (instances np.ndarray of shape (n_samples, 1)) – Arrays whose values are binned.
+
nan (float, optional, default: 0.0) – If a bin has no samples or fewer than the defined sample_threshold, the corresponding bin is marked as
+NaN. Specify a fill float to insert instead of NaN.
+
+
+
Returns
+
+
tuple of length equal to the amount of passed value arrays with binning schemes and an additional histogram
+
with number of samples in each bin as well as an index tuple containing the bin indices.
Measure calibration by given predictions with confidence and the according ground truth.
Assume binary predictions with y=1.
Parameters
-
X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction on classification with shapes
+
X (iterable of np.ndarray, or np.ndarray of shape=([n_bayes], n_samples, [n_classes/n_box_features])) – NumPy array with confidence values for each prediction on classification with shapes
1-D for binary classification, 2-D for multi class (softmax).
+If 3-D, interpret the first dimension as samples from a Bayesian estimator with multiple data points
+for a single sample (e.g. variational inference or MC dropout samples).
+If this is an iterable over multiple instances of np.ndarray and parameter batched=True,
+interpret this parameter as multiple predictions that should be averaged.
On detection, this array must have 2 dimensions with number of additional box features in last dim.
-
y (np.ndarray, shape=(n_samples, [n_classes])) – NumPy array with ground truth labels.
-Either as label vector (1-D) or as one-hot encoded ground truth array (2-D).
+
y (iterable of np.ndarray with same length as X or np.ndarray of shape=([n_bayes], n_samples, [n_classes])) – NumPy array with ground truth labels.
+Either as label vector (1-D) or as one-hot encoded ground truth array (2-D).
+If 3-D, interpret the first dimension as samples from a Bayesian estimator with multiple data points
+for a single sample (e.g. variational inference or MC dropout samples).
+If iterable over multiple instances of np.ndarray and parameter batched=True,
+interpret this parameter as multiple predictions that should be averaged.
+
batched (bool, optional, default: False) – Multiple predictions can be evaluated at once (e.g. cross-validation examinations) using batched-mode.
+All predictions given by X and y are separately evaluated and their results are averaged afterwards
+for visualization.
+
uncertainty (str, optional, default: False) –
Define uncertainty handling if input X has been sampled e.g. by Monte-Carlo dropout or similar methods
+that output an ensemble of predictions per sample. Choose one of the following options:
+- flatten: treat everything as a separate prediction - this option will yield a slightly better
+calibration performance but without the visualization of a prediction interval.
+- mean: compute Monte-Carlo integration to obtain a simple confidence estimate for a sample
+(mean) with a standard deviation that is visualized.
return_map (bool, optional, default: False) – If True, return map with miscalibration metric separated into all remaining dimension bins.
return_num_samples (bool, optional, default: False) – If True, also return the number of samples in each bin.
+
return_uncertainty_map (bool, optional, default: False) – If True, also return the average deviation of the confidence within each bin.
Returns
-
Always returns miscalibration metric.
-If ‘return_map’ is False, return ECE only (or num_samples map).
-If ‘return_map’ is True, return tuple with ECE and map over all bins.
-If ‘return_num_samples’ is False, ECE only (or ECE map).
-If ‘return_num_samples’ is True, return tuple with ECE and number of samples in each bin.
+
Always returns Expected Calibration Error.
+If ‘return_map’ is True, return tuple and append miscalibration map over all bins.
+If ‘return_num_samples’ is True, return tuple and append the number of samples in each bin (excluding confidence dimension).
+If ‘return_uncertainty_map’ is True, return tuple and append the average standard deviation of confidence within each bin (excluding confidence dimension).
Return type
-
float or tuple of (float, np.ndarray) or tuple of (float, np.ndarray, np.ndarray)
+
float or tuple of (float, np.ndarray, [np.ndarray, [np.ndarray]])
Determine miscalibration based on passed histograms.
Parameters
-
a (np.ndarray) – NumPy array that should be squeezed.
-
axes_to_keep (int or iterable) – Axes that should be kept even if they have a size of 1.
+
metric (str) – Identifier to specify the used metric. Must be one of ‘ace’, ‘ece’ or ‘mce’.
+
acc_hist (np.ndarray of shape (n_bins, [n_bins, [n_bins, [..]]])) – Histogram with average accuracy in each bin.
+
conf_hist (np.ndarray of shape (n_bins, [n_bins, [n_bins, [..]]])) – Histogram with average confidence in each bin.
+
variance_hist (np.ndarray of shape (n_bins, [n_bins, [n_bins, [..]]])) – Histogram with average variance in each bin. This array is currently not used but
+might be utilized in the future.
+
num_samples_hist (np.ndarray of shape (n_bins, [n_bins, [n_bins, [..]]])) – Histogram with number of samples in each bin.
Returns
-
Squeezed array.
-
-
Return type
-
np.ndarray
+
+
tuple of length 6 (miscalibration score, miscalibration map, accuracy map, confidence map, variance map, num samples map)
Calculate the weighted mean on a given histogram based on a dedicated data distribution.
+If ‘reduce_result’ is given, reuse the data distribution of the previous result instead of the distribution
+given by ‘distribution’ parameter.
Perform binning on value (and all additional values passed) based on samples.
+
+
Parameters
+
+
bin_bounds (list, length=samples.shape[1]) – Binning boundaries used for each dimension given in ‘samples’ parameter.
+
samples (np.ndarray of shape (n_samples, n_features)) – Array used to group all samples into bins.
+
*values (instances np.ndarray of shape (n_samples, 1)) – Arrays whose values are binned.
+
nan (float, optional, default: 0.0) – If a bin has no samples or fewer than the defined sample_threshold, the corresponding bin is marked as
+NaN. Specify a fill float to insert instead of NaN.
+
+
+
Returns
+
+
tuple of length equal to the amount of passed value arrays with binning schemes and an additional histogram
+
with number of samples in each bin as well as an index tuple containing the bin indices.
Measure calibration by given predictions with confidence and the according ground truth.
+Assume binary predictions with y=1.
+
Parameters
-
X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction on classification with shapes
+
X (iterable of np.ndarray, or np.ndarray of shape=([n_bayes], n_samples, [n_classes/n_box_features])) – NumPy array with confidence values for each prediction on classification with shapes
1-D for binary classification, 2-D for multi class (softmax).
+If 3-D, interpret the first dimension as samples from a Bayesian estimator with multiple data points
+for a single sample (e.g. variational inference or MC dropout samples).
+If this is an iterable over multiple instances of np.ndarray and parameter batched=True,
+interpret this parameter as multiple predictions that should be averaged.
On detection, this array must have 2 dimensions with number of additional box features in last dim.
-
y (np.ndarray, shape=(n_samples, [n_classes])) – NumPy array with ground truth labels.
-Either as label vector (1-D) or as one-hot encoded ground truth array (2-D).
+
y (iterable of np.ndarray with same length as X or np.ndarray of shape=([n_bayes], n_samples, [n_classes])) – NumPy array with ground truth labels.
+Either as label vector (1-D) or as one-hot encoded ground truth array (2-D).
+If 3-D, interpret the first dimension as samples from a Bayesian estimator with multiple data points
+for a single sample (e.g. variational inference or MC dropout samples).
+If iterable over multiple instances of np.ndarray and parameter batched=True,
+interpret this parameter as multiple predictions that should be averaged.
+
batched (bool, optional, default: False) – Multiple predictions can be evaluated at once (e.g. cross-validation examinations) using batched-mode.
+All predictions given by X and y are separately evaluated and their results are averaged afterwards
+for visualization.
+
uncertainty (str, optional, default: False) –
Define uncertainty handling if input X has been sampled e.g. by Monte-Carlo dropout or similar methods
+that output an ensemble of predictions per sample. Choose one of the following options:
+- flatten: treat everything as a separate prediction - this option will yield a slightly better
+calibration performance but without the visualization of a prediction interval.
+- mean: compute Monte-Carlo integration to obtain a simple confidence estimate for a sample
+(mean) with a standard deviation that is visualized.
return_map (bool, optional, default: False) – If True, return map with miscalibration metric separated into all remaining dimension bins.
return_num_samples (bool, optional, default: False) – If True, also return the number of samples in each bin.
+
return_uncertainty_map (bool, optional, default: False) – If True, also return the average deviation of the confidence within each bin.
Returns
Always returns the Maximum Calibration Error.
If ‘return_map’ is True, return a tuple and append the miscalibration map over all bins.
If ‘return_num_samples’ is True, return a tuple and append the number of samples in each bin (excluding the confidence dimension).
If ‘return_uncertainty_map’ is True, return a tuple and append the average standard deviation of the confidence within each bin (excluding the confidence dimension).
Return type
float or tuple of (float, np.ndarray, [np.ndarray, [np.ndarray]])
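To make the returned score concrete, here is a minimal NumPy sketch of the Maximum Calibration Error: the largest per-bin gap between average confidence and observed accuracy. This is an illustrative re-derivation of the metric definition, not the library's implementation; bin handling (e.g. empty-bin treatment) may differ.

```python
import numpy as np

def mce(confidences, correct, n_bins=10):
    # Maximum Calibration Error: max over bins of |accuracy - confidence|.
    edges = np.linspace(0.0, 1.0, n_bins + 1)
    # assign each sample to a bin; clip so that confidence 1.0 lands in the last bin
    idx = np.clip(np.digitize(confidences, edges) - 1, 0, n_bins - 1)
    gaps = []
    for b in range(n_bins):
        mask = idx == b
        if mask.any():
            gaps.append(abs(correct[mask].mean() - confidences[mask].mean()))
    return max(gaps)

conf = np.array([0.9, 0.8, 0.75, 0.3])
correct = np.array([1.0, 1.0, 0.0, 0.0])
score = mce(conf, correct)  # largest gap comes from the 0.75-confidence miss
```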
Determine miscalibration based on passed histograms.
Parameters
metric (str) – Identifier to specify the used metric. Must be one of ‘ace’, ‘ece’ or ‘mce’.
acc_hist (np.ndarray of shape (n_bins, [n_bins, [n_bins, [..]]])) – Histogram with average accuracy in each bin.
conf_hist (np.ndarray of shape (n_bins, [n_bins, [n_bins, [..]]])) – Histogram with average confidence in each bin.
variance_hist (np.ndarray of shape (n_bins, [n_bins, [n_bins, [..]]])) – Histogram with average variance in each bin. This array is currently not used but might be utilized in the future.
num_samples_hist (np.ndarray of shape (n_bins, [n_bins, [n_bins, [..]]])) – Histogram with number of samples in each bin.
Returns
tuple of length 6 (miscalibration score, miscalibration map, accuracy map, confidence map, variance map, num samples map)
Calculate the weighted mean on a given histogram based on a dedicated data distribution.
If ‘reduce_result’ is given, reuse the data distribution of the previous result instead of the distribution
given by the ‘distribution’ parameter.
Maximum Mean Calibration Error (MMCE) 1.
A differentiable approximation to the Expected Calibration Error (ECE) using a
reproducing kernel Hilbert space (RKHS).
Using a dataset \(\mathcal{D}\) of size \(N\) consisting of the ground truth labels \(\hat{y} \in \{1, ..., K \}\)
with input \(x \in \mathcal{X}\), the MMCE is calculated by using a scoring classifier \(\hat{p}=h(x)\)
that returns the highest probability for a certain class in conjunction with the predicted label
information \(y \in \{1, ..., K \}\) and is defined by
detection (bool, default: False) – Detection mode is currently not supported for MMCE!
If False, the input array ‘X’ is treated as multi-class confidence input (softmax)
with shape (n_samples, [n_classes]).
If True, the input array ‘X’ is treated as box predictions with several box features (at least
the box confidence must be present) with shape (n_samples, [n_box_features]).
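As a rough illustration of the MMCE idea, the following sketch follows the formulation of Kumar et al. (2018): a kernel-weighted sum of the per-sample calibration residuals \((c_i - r_i)\), where \(c_i\) is correctness and \(r_i\) confidence. The Laplacian kernel and its width 0.4 are the choices reported in that paper, not necessarily this library's defaults.

```python
import numpy as np

def mmce_squared(confidences, correct, kernel_width=0.4):
    # Squared MMCE sketch: (1/m^2) * sum_ij (c_i - r_i)(c_j - r_j) k(r_i, r_j)
    residual = correct.astype(float) - confidences
    # Laplacian kernel k(r_i, r_j) = exp(-|r_i - r_j| / width)
    k = np.exp(-np.abs(confidences[:, None] - confidences[None, :]) / kernel_width)
    m = len(confidences)
    return float(residual @ k @ residual) / (m * m)

conf = np.array([0.9, 0.6, 0.8])
correct = np.array([1, 0, 1])
val = mmce_squared(conf, correct)  # non-negative since the kernel is positive semi-definite
```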
Measure calibration by given predictions with confidence and the according ground truth.
Parameters
X (iterable of np.ndarray, or np.ndarray of shape=(n_samples, [n_classes])) – NumPy array with confidence values for each prediction on classification with shapes
1-D for binary classification, 2-D for multi class (softmax).
If this is an iterable over multiple instances of np.ndarray and parameter batched=True,
interpret this parameter as multiple predictions that should be averaged.
y (iterable of np.ndarray with same length as X or np.ndarray of shape=(n_samples, [n_classes])) – NumPy array with ground truth labels.
Either as label vector (1-D) or as one-hot encoded ground truth array (2-D).
If iterable over multiple instances of np.ndarray and parameter batched=True,
interpret this parameter as multiple predictions that should be averaged.
batched (bool, optional, default: False) – Multiple predictions can be evaluated at once (e.g. cross-validation examinations) using batched mode.
All predictions given by X and y are evaluated separately and their results are averaged afterwards
for visualization.
Compute Prediction Interval Coverage Probability (PICP) 1,[2]_ and Mean Prediction Interval Width (MPIW) 2.
This metric is used for Bayesian models to determine the quality of the uncertainty estimates.
In Bayesian mode, an uncertainty estimate is attached to each sample. The PICP measures the probability that
the true (observed) accuracy falls into the p% prediction interval. The uncertainty is well calibrated if
the PICP is equal to p%. Simultaneously, the MPIW measures the mean width of all prediction intervals to evaluate
the sharpness of the uncertainty estimates.
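The two quantities above can be sketched in a few lines of NumPy. This toy example assumes hypothetical Gaussian predictions with a fixed 95% interval for every observation; it only demonstrates the coverage/width arithmetic, not the library's Bayesian-mode pipeline.

```python
import numpy as np

# PICP: fraction of observations inside their predicted intervals.
# MPIW: mean width of those intervals (sharpness).
rng = np.random.default_rng(0)
y_true = rng.normal(size=1000)

# hypothetical prediction: N(0, 1) for every sample, central 95% interval
lower, upper = -1.96, 1.96
inside = (y_true >= lower) & (y_true <= upper)
picp = inside.mean()          # should be close to 0.95 for calibrated uncertainty
mpiw = upper - lower          # identical width 3.92 for every sample here
```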
Parameters
bins (int or iterable, default: 10) – Number of bins used by the Histogram Binning.
In detection mode: if int, use the same number of bins for each dimension (nx1 = nx2 = … = bins).
If iterable, use a different number of bins for each dimension (nx1, nx2, … = bins).
equal_intervals (bool, optional, default: True) – If True, the bins have the same width. If False, the bins are split to equalize
the number of samples in each bin.
detection (bool, default: False) – If False, the input array ‘X’ is treated as multi-class confidence input (softmax)
with shape (n_samples, [n_classes]).
If True, the input array ‘X’ is treated as box predictions with several box features (at least
the box confidence must be present) with shape (n_samples, [n_box_features]).
sample_threshold (int, optional, default: 1) – Bins with a number of samples below this threshold are not included in the computed metrics.
Kuleshov, V.; Fenner, N. & Ermon, S.:
“Accurate Uncertainties for Deep Learning Using Calibrated Regression.”
International Conference on Machine Learning (ICML), 2018
Get source online
Jiayu Yao, Weiwei Pan, Soumya Ghosh, and Finale Doshi-Velez:
“Quality of Uncertainty Quantification for Bayesian Neural Network Inference.”
Workshop on Uncertainty and Robustness in Deep Learning, ICML, 2019
Get source online
Methods

__init__([bins, equal_intervals, detection, …]) – Constructor.
accuracy(X, y[, batched, uncertainty]) – Measure the accuracy of each point by binning.
binning(bin_bounds, samples, *values[, nan]) – Perform binning on value (and all additional values passed) based on samples.
measure(X, y[, p, use_hpd, batched, …]) – Measure calibration by given predictions with confidence and the according ground truth.
prepare(X, y[, batched, uncertainty]) – Check input data.
process(metric, acc_hist, conf_hist, …) – Determine miscalibration based on passed histograms.
reduce(histogram, distribution, axis[, …]) – Calculate the weighted mean on a given histogram based on a dedicated data distribution.
squeeze_generic(a, axes_to_keep) – Squeeze input array a but keep axes defined by parameter ‘axes_to_keep’ even if the dimension is of size 1.
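The squeeze_generic behavior can be sketched directly from its description. The function below is a hypothetical re-implementation written only to illustrate the semantics (drop all size-1 axes except the listed ones); the library's actual code may differ.

```python
import numpy as np

def squeeze_generic(a, axes_to_keep):
    # Remove all size-1 axes except those explicitly listed in 'axes_to_keep'.
    if isinstance(axes_to_keep, int):
        axes_to_keep = (axes_to_keep,)
    shape = [s for i, s in enumerate(a.shape) if s != 1 or i in axes_to_keep]
    return a.reshape(shape)

x = np.zeros((1, 5, 1))
# plain np.squeeze(x) would give shape (5,); keeping axis 0 preserves (1, 5)
kept = squeeze_generic(x, axes_to_keep=0)
```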
Perform binning on value (and all additional values passed) based on samples.
Parameters
bin_bounds (list, length=samples.shape[1]) – Binning boundaries used for each dimension given in the ‘samples’ parameter.
samples (np.ndarray of shape (n_samples, n_features)) – Array used to group all samples into bins.
*values (instances of np.ndarray of shape (n_samples, 1)) – Arrays whose values are binned.
nan (float, optional, default: 0.0) – If a bin has no samples or fewer than the defined sample_threshold, the corresponding bin is marked as
NaN. Specify a fill value to insert instead of NaN.
Returns
tuple of length equal to the number of passed value arrays with binning schemes and an additional histogram
with the number of samples in each bin as well as an index tuple containing the bin indices.
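A 1-D version of this binning step can be sketched with np.digitize: group samples by bin boundaries, average an associated value array per bin, and fill empty bins as described by the ‘nan’ parameter. This is a simplified illustration, not the multi-dimensional library routine.

```python
import numpy as np

bin_bounds = np.linspace(0.0, 1.0, 6)        # 5 equally wide bins
samples = np.array([0.05, 0.15, 0.17, 0.95])
values = np.array([1.0, 0.0, 1.0, 1.0])

# assign each sample to a bin index in [0, 4]
idx = np.clip(np.digitize(samples, bin_bounds) - 1, 0, 4)

binned = np.full(5, np.nan)
for b in range(5):
    mask = idx == b
    if mask.any():
        binned[b] = values[mask].mean()

# empty bins were marked NaN; replace with the fill value (cf. 'nan' parameter)
binned = np.nan_to_num(binned, nan=0.0)
```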
Measure calibration by given predictions with confidence and the according ground truth.
Assume binary predictions with y=1.
Parameters
X (iterable of np.ndarray, or np.ndarray of shape=([n_bayes], n_samples, [n_classes/n_box_features])) – NumPy array with confidence values for each prediction on classification with shapes
1-D for binary classification, 2-D for multi class (softmax).
If 3-D, interpret the first dimension as samples from a Bayesian estimator with multiple data points
for a single sample (e.g. variational inference or MC dropout samples).
If this is an iterable over multiple instances of np.ndarray and parameter batched=True,
interpret this parameter as multiple predictions that should be averaged.
On detection, this array must have 2 dimensions with the number of additional box features in the last dim.
y (iterable of np.ndarray with same length as X or np.ndarray of shape=([n_bayes], n_samples, [n_classes])) – NumPy array with ground truth labels.
Either as label vector (1-D) or as one-hot encoded ground truth array (2-D).
If 3-D, interpret the first dimension as samples from a Bayesian estimator with multiple data points
for a single sample (e.g. variational inference or MC dropout samples).
If iterable over multiple instances of np.ndarray and parameter batched=True,
interpret this parameter as multiple predictions that should be averaged.
p (float, optional, default: 0.05) – Confidence level.
use_hpd (bool, optional, default: True) – If True, use the highest posterior density (HPD) interval to determine the prediction interval width.
Use the variance with a Gaussian assumption otherwise.
batched (bool, optional, default: False) – Multiple predictions can be evaluated at once (e.g. cross-validation examinations) using batched mode.
All predictions given by X and y are evaluated separately and their results are averaged afterwards
for visualization.
uncertainty (str, optional, default: "mean") – Mode to measure the mean estimate and uncertainty of the samples in Bayesian mode. Must be one
of “mean” (mean of all samples), “mode” (mode of all samples), “median” (median of all samples) or
“flatten” (no uncertainty will be computed, all samples are seen as independent predictions).
return_map (bool, optional, default: False) – If True, return map with PICP and MPIW metric separated into all remaining dimension bins.
Returns
Namedtuple PICPResult with fields “picp” and “mpiw”, where each field either holds the PICP/MPIW score
or a tuple of (float, np.ndarray) – Always returns a named tuple with PICP (prediction interval coverage probability) and MPIW
(mean prediction interval width).
If ‘return_map’ is True, each field holds a tuple of the metric itself and the PICP/MPIW distribution
over all bins.
Determine miscalibration based on passed histograms.
Parameters
metric (str) – Identifier to specify the used metric. Must be one of ‘ace’, ‘ece’ or ‘mce’.
acc_hist (np.ndarray of shape (n_bins, [n_bins, [n_bins, [..]]])) – Histogram with average accuracy in each bin.
conf_hist (np.ndarray of shape (n_bins, [n_bins, [n_bins, [..]]])) – Histogram with average confidence in each bin.
variance_hist (np.ndarray of shape (n_bins, [n_bins, [n_bins, [..]]])) – Histogram with average variance in each bin. This array is currently not used but might be utilized in the future.
num_samples_hist (np.ndarray of shape (n_bins, [n_bins, [n_bins, [..]]])) – Histogram with number of samples in each bin.
Returns
tuple of length 6 (miscalibration score, miscalibration map, accuracy map, confidence map, variance map, num samples map)
Calculate the weighted mean on a given histogram based on a dedicated data distribution.
If ‘reduce_result’ is given, reuse the data distribution of the previous result instead of the distribution
given by the ‘distribution’ parameter.
Plot Confidence Histogram and Reliability Diagram to visualize miscalibration.
On classification, plot the gaps between average confidence and observed accuracy bin-wise over the confidence
Reliability diagram to visualize miscalibration. This could be either in the classical way for confidences only
or w.r.t. additional properties (like x/y-coordinates of detection boxes, width, height, etc.). The additional
properties get binned. Afterwards, the miscalibration will be calculated for each bin. This is
visualized as (multiple) 2-D plots.
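The data behind a classical reliability diagram can be computed in a few lines: per confidence bin, the gap between average confidence and observed accuracy. The sketch below illustrates only this bin-wise computation, not the plotting itself.

```python
import numpy as np

conf = np.array([0.55, 0.65, 0.62, 0.95, 0.91])
correct = np.array([0, 1, 1, 1, 1])

edges = np.linspace(0.0, 1.0, 11)            # 10 confidence bins
idx = np.clip(np.digitize(conf, edges) - 1, 0, 9)

# positive gap = overconfident, negative gap = underconfident
gaps = {}
for b in np.unique(idx):
    mask = idx == b
    gaps[int(b)] = conf[mask].mean() - correct[mask].mean()
```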
Parameters
X (iterable of np.ndarray, or np.ndarray of shape=([n_bayes], n_samples, [n_classes/n_box_features])) – NumPy array with confidence values for each prediction on classification with shapes
1-D for binary classification, 2-D for multi class (softmax).
If 3-D, interpret the first dimension as samples from a Bayesian estimator with multiple data points
for a single sample (e.g. variational inference or MC dropout samples).
If this is an iterable over multiple instances of np.ndarray and parameter batched=True,
interpret this parameter as multiple predictions that should be averaged.
On detection, this array must have 2 dimensions with the number of additional box features in the last dim.
y (iterable of np.ndarray with same length as X or np.ndarray of shape=([n_bayes], n_samples, [n_classes])) – NumPy array with ground truth labels.
Either as label vector (1-D) or as one-hot encoded ground truth array (2-D).
If 3-D, interpret the first dimension as samples from a Bayesian estimator with multiple data points
for a single sample (e.g. variational inference or MC dropout samples).
If iterable over multiple instances of np.ndarray and parameter batched=True,
interpret this parameter as multiple predictions that should be averaged.
batched (bool, optional, default: False) – Multiple predictions can be evaluated at once (e.g. cross-validation examinations) using batched mode.
All predictions given by X and y are evaluated separately and their results are averaged afterwards
for visualization.
uncertainty (str, optional, default: False) –
Define uncertainty handling if input X has been sampled e.g. by Monte-Carlo dropout or similar methods
that output an ensemble of predictions per sample. Choose one of the following options:
- flatten: treat each ensemble member as a separate prediction. This option yields slightly better
calibration performance but without the visualization of a prediction interval.
- mean: compute Monte-Carlo integration to obtain a simple confidence estimate for a sample
(mean) with a standard deviation that is visualized.
filename (str, optional, default: None) – Optional filename to save the plotted figure.
tikz (bool, optional, default: False) – If True, use the ‘tikzplotlib’ package to return tikz code for LaTeX rather than a Matplotlib figure.
title_suffix (str, optional, default: None) – Suffix for the plot title.
feature_names (list, optional, default: None) – Names of the additional features that are attached to the axes of a reliability diagram.
**save_args (args) – Additional arguments passed to the ‘matplotlib.pyplot.Figure.savefig’ function if ‘tikz’ is False.
If ‘tikz’ is True, the arguments are passed to the ‘tikzplotlib.get_tikz_code’ function.
Returns
Return type
matplotlib.pyplot.Figure if ‘tikz’ is False, else str with tikz code.
G. Pereyra, G. Tucker, J. Chorowski, Lukasz Kaiser, and G. Hinton:
“Regularizing neural networks by penalizing confident output distributions.”
CoRR, 2017.
Get source online
Copies parameters and buffers from state_dict into only
this module, but not its descendants. This is called on every submodule
in load_state_dict(). Metadata saved for this
module in the input state_dict is provided as local_metadata.
For state dicts without metadata, local_metadata is empty.
Subclasses can achieve class-specific backward compatible loading using
the version number at local_metadata.get("version", None).

Note
state_dict is not the same object as the input
state_dict to load_state_dict(). So
it can be modified.

Parameters
state_dict (dict) – a dict containing parameters and
persistent buffers.
prefix (str) – the prefix for parameters and buffers used in this
module
local_metadata (dict) – a dict containing the metadata for this module.
strict (bool) – whether to strictly enforce that the keys in
state_dict with prefix match the names of
parameters and buffers in this module
missing_keys (list of str) – if strict=True, add missing keys to
this list
unexpected_keys (list of str) – if strict=True, add unexpected
keys to this list
error_msgs (list of str) – error messages should be added to this
list, and will be reported together in
load_state_dict()
These hooks will be called with arguments: state_dict, prefix,
local_metadata, strict, missing_keys, unexpected_keys,
error_msgs, before loading state_dict into self. These arguments
are exactly the same as those of _load_from_state_dict.
These hooks will be called with arguments: self, state_dict,
prefix, local_metadata, after the state_dict of self is set.
Note that only parameters and buffers of self or its children are
guaranteed to exist in state_dict. The hooks may modify state_dict
inplace or return a new one.
Saves module state to the destination dictionary, containing a state
of the module, but not its descendants. This is called on every
submodule in state_dict().
In rare cases, subclasses can achieve class-specific behavior by
overriding this method with custom logic.

Parameters
destination (dict) – a dict where state will be stored
prefix (str) – the prefix for parameters and buffers used in this
module
Applies fn recursively to every submodule (as returned by .children())
as well as self. Typical use includes initializing the parameters of a model
(see also nn-init-doc).

Parameters
fn (Module -> None) – function to be applied to each submodule
recurse (bool) – if True, then yields buffers of this module
and all submodules. Otherwise, yields only buffers that
are direct members of this module.
Moves all model parameters and buffers to the GPU.
This also makes associated parameters and buffers different objects. So
it should be called before constructing optimizer if the module will
live on GPU while being optimized.

Parameters
device (int, optional) – if specified, all parameters will be
copied to that device
This has any effect only on certain modules. See documentations of
particular modules for details of their behaviors in training/evaluation
mode, if they are affected, e.g. Dropout, BatchNorm,
etc.
To print customized extra information, you should reimplement
this method in your own modules. Both single-line and multi-line
strings are acceptable.
Copies parameters and buffers from state_dict into
this module and its descendants. If strict is True, then
the keys of state_dict must exactly match the keys returned
by this module’s state_dict() function.

Parameters
state_dict (dict) – a dict containing parameters and
persistent buffers.
strict (bool, optional) – whether to strictly enforce that the keys
in state_dict match the keys returned by this module’s
state_dict() function. Default: True

Returns
missing_keys is a list of str containing the missing keys
unexpected_keys is a list of str containing the unexpected keys

Return type
NamedTuple with missing_keys and unexpected_keys fields
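The returned named tuple is most useful with strict=False, where mismatched keys are reported instead of raising. A minimal example with a standard torch.nn module:

```python
import torch
import torch.nn as nn

model = nn.Linear(4, 2)

# checkpoint deliberately lacks the 'bias' entry
ckpt = {"weight": torch.zeros(2, 4)}

# with strict=False, loading succeeds and the mismatches are reported
result = model.load_state_dict(ckpt, strict=False)
# result.missing_keys -> ['bias'], result.unexpected_keys -> []
```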
Returns an iterator over module buffers, yielding both the
name of the buffer as well as the buffer itself.

Parameters
prefix (str) – prefix to prepend to all buffer names.
recurse (bool) – if True, then yields buffers of this module
and all submodules. Otherwise, yields only buffers that
are direct members of this module.

Yields
(string, torch.Tensor) – Tuple containing the name and buffer
Returns an iterator over module parameters, yielding both the
name of the parameter as well as the parameter itself.

Parameters
prefix (str) – prefix to prepend to all parameter names.
recurse (bool) – if True, then yields parameters of this module
and all submodules. Otherwise, yields only parameters that
are direct members of this module.

Yields
(string, Parameter) – Tuple containing the name and parameter
recurse (bool) – if True, then yields parameters of this module
and all submodules. Otherwise, yields only parameters that
are direct members of this module.
The grad_input and grad_output may be tuples if the
module has multiple inputs or outputs. The hook should not modify its
arguments, but it can optionally return a new gradient with respect to
input that will be used in place of grad_input in subsequent
computations.

Returns
a handle that can be used to remove the added hook by calling
handle.remove()

Return type
torch.utils.hooks.RemovableHandle

Warning
The current implementation will not have the presented behavior
for complex Module that perform many operations.
In some failure cases, grad_input and grad_output will only
contain the gradients for a subset of the inputs and outputs.
For such Module, you should use torch.Tensor.register_hook()
directly on a specific input or output to get the required gradients.
This is typically used to register a buffer that should not be
considered a model parameter. For example, BatchNorm’s running_mean
is not a parameter, but is part of the persistent state.
Buffers can be accessed as attributes using given names.

Parameters
name (string) – name of the buffer. The buffer can be accessed
from this module using the given name
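A short example of the behavior described above: a registered buffer appears in state_dict() (so it is saved and moved with the module) but is not yielded by parameters(), so an optimizer never updates it.

```python
import torch
import torch.nn as nn

class RunningStats(nn.Module):
    def __init__(self):
        super().__init__()
        # part of persistent state, but not a trainable parameter
        self.register_buffer("running_mean", torch.zeros(3))

m = RunningStats()
has_buffer = "running_mean" in m.state_dict()   # True: saved with the module
n_params = len(list(m.parameters()))            # 0: invisible to the optimizer
```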
The hook will be called every time after forward() has computed an output.
It should have the following signature:

hook(module, input, output) -> None or modified output

The hook can modify the output. It can modify the input inplace but
it will not have effect on forward since this is called after
forward() is called.

Returns
a handle that can be used to remove the added hook by calling
handle.remove()
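A minimal usage example of a forward hook capturing a module's output, with the handle removed afterwards:

```python
import torch
import torch.nn as nn

layer = nn.ReLU()
captured = {}

def hook(module, inputs, output):
    # called after forward(); stash the output for inspection
    captured["out"] = output.detach()

handle = layer.register_forward_hook(hook)
y = layer(torch.tensor([-1.0, 2.0]))
handle.remove()  # the hook no longer fires on subsequent forwards
```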
The hook will be called every time before forward() is invoked.
It should have the following signature:

hook(module, input) -> None or modified input

The hook can modify the input. The user can either return a tuple or a
single modified value in the hook. We will wrap the value into a tuple
if a single value is returned (unless that value is already a tuple).

Returns
a handle that can be used to remove the added hook by calling
handle.remove()
Its signature is similar to torch.Tensor.to(), but only accepts
floating point desired dtypes. In addition, this method will
only cast the floating point parameters and buffers to dtype
(if given). The integral parameters and buffers will be moved to
device, if that is given, but with dtypes unchanged. When
non_blocking is set, it tries to convert/move asynchronously
with respect to the host if possible, e.g., moving CPU Tensors with
pinned memory to CUDA devices.
See below for examples.

Note
This method modifies the module in-place.

Parameters
device (torch.device) – the desired device of the parameters
and buffers in this module
dtype (torch.dtype) – the desired floating point type of
the floating point parameters and buffers in this module
tensor (torch.Tensor) – Tensor whose dtype and device are the desired
dtype and device for all parameters and buffers in this module
memory_format (torch.memory_format) – the desired memory
format for 4D parameters and buffers in this module (keyword
only argument)
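For example, casting a module to double precision converts its floating point parameters in-place:

```python
import torch
import torch.nn as nn

linear = nn.Linear(2, 2)
# .to(dtype) casts only floating point parameters/buffers, in-place
linear.to(torch.double)
```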
This has any effect only on certain modules. See documentations of
particular modules for details of their behaviors in training/evaluation
mode, if they are affected, e.g. Dropout, BatchNorm,
etc.

Parameters
mode (bool) – whether to set training mode (True) or evaluation
mode (False). Default: True.
Difference between Confidence and Accuracy (DCA) 1. This regularization returns a single scalar indicating
the difference between mean confidence and accuracy within a single batch.
Liang, Gongbo, et al.:
“Improved trainable calibration method for neural networks on medical imaging classification.”
arXiv preprint arXiv:2009.04057 (2020).
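The penalty can be sketched as follows. This is a hedged re-derivation of the idea from Liang et al. (2020), namely the absolute difference between mean confidence and accuracy within one batch; it is not this library's implementation.

```python
import torch

def dca_loss(logits, targets):
    # sketch of the DCA penalty: |mean confidence - batch accuracy|
    probs = torch.softmax(logits, dim=1)
    conf, pred = probs.max(dim=1)            # winning-class confidence per sample
    acc = (pred == targets).float().mean()   # batch accuracy
    return torch.abs(conf.mean() - acc)

logits = torch.tensor([[4.0, -4.0], [3.0, -3.0]])
targets = torch.tensor([0, 1])  # second prediction is wrong, so the net is overconfident
loss = dca_loss(logits, targets)
```

Because the term is differentiable in the logits, it can simply be added to the cross-entropy loss with a weighting factor during training.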
Copies parameters and buffers from state_dict into only
+this module, but not its descendants. This is called on every submodule
+in load_state_dict(). Metadata saved for this
+module in input state_dict is provided as local_metadata.
+For state dicts without metadata, local_metadata is empty.
+Subclasses can achieve class-specific backward compatible loading using
+the version number at local_metadata.get(“version”, None).
+
+
Note
+
state_dict is not the same object as the input
+state_dict to load_state_dict(). So
+it can be modified.
+
+
+
Parameters
+
+
state_dict (dict) – a dict containing parameters and
+persistent buffers.
+
prefix (str) – the prefix for parameters and buffers used in this
+module
+
local_metadata (dict) – a dict containing the metadata for this module.
+See
+
strict (bool) – whether to strictly enforce that the keys in
+state_dict with prefix match the names of
+parameters and buffers in this module
+
missing_keys (list of str) – if strict=True, add missing keys to
+this list
+
unexpected_keys (list of str) – if strict=True, add unexpected
+keys to this list
+
error_msgs (list of str) – error messages should be added to this
+list, and will be reported together in
+load_state_dict()
These hooks will be called with arguments: state_dict, prefix,
+local_metadata, strict, missing_keys, unexpected_keys,
+error_msgs, before loading state_dict into self. These arguments
+are exactly the same as those of _load_from_state_dict.
These hooks will be called with arguments: self, state_dict,
+prefix, local_metadata, after the state_dict of self is set.
+Note that only parameters and buffers of self or its children are
+guaranteed to exist in state_dict. The hooks may modify state_dict
+inplace or return a new one.
Saves module state to destination dictionary, containing a state
+of the module, but not its descendants. This is called on every
+submodule in state_dict().
+
In rare cases, subclasses can achieve class-specific behavior by
+overriding this method with custom logic.
+
+
Parameters
+
+
destination (dict) – a dict where state will be stored
+
prefix (str) – the prefix for parameters and buffers used in this
+module
Applies fn recursively to every submodule (as returned by .children())
+as well as self. Typical use includes initializing the parameters of a model
+(see also nn-init-doc).
+
+
Parameters
+
fn (Module -> None) – function to be applied to each submodule
recurse (bool) – if True, then yields buffers of this module
+and all submodules. Otherwise, yields only buffers that
+are direct members of this module.
Moves all model parameters and buffers to the GPU.
+
This also makes associated parameters and buffers different objects. So
+it should be called before constructing optimizer if the module will
+live on GPU while being optimized.
+
+
Parameters
+
device (int, optional) – if specified, all parameters will be
+copied to that device
This has any effect only on certain modules. See documentations of
+particular modules for details of their behaviors in training/evaluation
+mode, if they are affected, e.g. Dropout, BatchNorm,
+etc.
To print customized extra information, you should reimplement
+this method in your own modules. Both single-line and multi-line
+strings are acceptable.
Copies parameters and buffers from state_dict into
+this module and its descendants. If strict is True, then
+the keys of state_dict must exactly match the keys returned
+by this module’s state_dict() function.
+
+
Parameters
+
+
state_dict (dict) – a dict containing parameters and
+persistent buffers.
+
strict (bool, optional) – whether to strictly enforce that the keys
+in state_dict match the keys returned by this module’s
+state_dict() function. Default: True
+
+
+
Returns
+
+
missing_keys is a list of str containing the missing keys
+
unexpected_keys is a list of str containing the unexpected keys
+
+
+
+
Return type
+
NamedTuple with missing_keys and unexpected_keys fields
Returns an iterator over module buffers, yielding both the
+name of the buffer as well as the buffer itself.
+
+
Parameters
+
+
prefix (str) – prefix to prepend to all buffer names.
+
recurse (bool) – if True, then yields buffers of this module
+and all submodules. Otherwise, yields only buffers that
+are direct members of this module.
+
+
+
Yields
+
(string, torch.Tensor) – Tuple containing the name and buffer
Returns an iterator over module parameters, yielding both the
+name of the parameter as well as the parameter itself.
+
+
Parameters
+
+
prefix (str) – prefix to prepend to all parameter names.
+
recurse (bool) – if True, then yields parameters of this module
+and all submodules. Otherwise, yields only parameters that
+are direct members of this module.
+
+
+
Yields
+
(string, Parameter) – Tuple containing the name and parameter
recurse (bool) – if True, then yields parameters of this module
+and all submodules. Otherwise, yields only parameters that
+are direct members of this module.
The grad_input and grad_output may be tuples if the
+module has multiple inputs or outputs. The hook should not modify its
+arguments, but it can optionally return a new gradient with respect to
+input that will be used in place of grad_input in subsequent
+computations.
+
+
Returns
+
a handle that can be used to remove the added hook by calling
+handle.remove()
+
+
Return type
+
torch.utils.hooks.RemovableHandle
+
+
+
+
Warning
+
The current implementation will not have the presented behavior
+for complex Module that perform many operations.
+In some failure cases, grad_input and grad_output will only
+contain the gradients for a subset of the inputs and outputs.
+For such Module, you should use torch.Tensor.register_hook()
+directly on a specific input or output to get the required gradients.
This is typically used to register a buffer that should not to be
+considered a model parameter. For example, BatchNorm’s running_mean
+is not a parameter, but is part of the persistent state.
+
Buffers can be accessed as attributes using given names.
+
+
Parameters
+
+
name (string) – name of the buffer. The buffer can be accessed
+from this module using the given name
The hook will be called every time after forward() has computed an output.
+It should have the following signature:
+
hook(module,input,output)->Noneormodifiedoutput
+
+
+
The hook can modify the output. It can modify the input inplace but
+it will not have effect on forward since this is called after
+forward() is called.
+
+
Returns
+
a handle that can be used to remove the added hook by calling
+handle.remove()
The hook will be called every time before forward() is invoked.
+It should have the following signature:
+
hook(module,input)->Noneormodifiedinput
+
+
+
The hook can modify the input. User can either return a tuple or a
+single modified value in the hook. We will wrap the value into a tuple
+if a single value is returned(unless that value is already a tuple).
+
+
Returns
+
a handle that can be used to remove the added hook by calling
+handle.remove()
Its signature is similar to torch.Tensor.to(), but only accepts
+floating point desired dtype s. In addition, this method will
+only cast the floating point parameters and buffers to dtype
+(if given). The integral parameters and buffers will be moved
+device, if that is given, but with dtypes unchanged. When
+non_blocking is set, it tries to convert/move asynchronously
+with respect to the host if possible, e.g., moving CPU Tensors with
+pinned memory to CUDA devices.
+
See below for examples.
+
+
Note
+
This method modifies the module in-place.
+
+
+
Parameters
+
+
device (torch.device) – the desired device of the parameters
+and buffers in this module
+
dtype (torch.dtype) – the desired floating point type of
+the floating point parameters and buffers in this module
+
tensor (torch.Tensor) – Tensor whose dtype and device are the desired
+dtype and device for all parameters and buffers in this module
+
memory_format (torch.memory_format) – the desired memory
+format for 4D parameters and buffers in this module (keyword
+only argument)
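A small sketch of the casting rules (illustrative buffer name): only floating point tensors follow the requested dtype, integral ones keep theirs:

```python
import torch
import torch.nn as nn

net = nn.Linear(4, 2)
net.register_buffer("step", torch.zeros(1, dtype=torch.long))

# In-place: floating point parameters/buffers are cast, integral ones are not.
net.to(torch.float64)
print(net.weight.dtype)   # floating point parameter follows the dtype
print(net.step.dtype)     # integral buffer keeps torch.int64
```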
This has an effect only on certain modules. See the documentation of the
+particular modules for details of their behavior in training/evaluation
+mode, if they are affected, e.g. Dropout, BatchNorm,
+etc.
+
+
Parameters
+
mode (bool) – whether to set training mode (True) or evaluation
+mode (False). Default: True.
Copies parameters and buffers from state_dict into only
+this module, but not its descendants. This is called on every submodule
+in load_state_dict(). Metadata saved for this
+module in the input state_dict is provided as local_metadata.
+For state dicts without metadata, local_metadata is empty.
+Subclasses can achieve class-specific backward-compatible loading using
+the version number at local_metadata.get("version", None).
+
+
Note
+
state_dict is not the same object as the input
+state_dict to load_state_dict(). So
+it can be modified.
+
+
+
Parameters
+
+
state_dict (dict) – a dict containing parameters and
+persistent buffers.
+
prefix (str) – the prefix for parameters and buffers used in this
+module
+
local_metadata (dict) – a dict containing the metadata for this module.
+See
+
strict (bool) – whether to strictly enforce that the keys in
+state_dict with prefix match the names of
+parameters and buffers in this module
+
missing_keys (list of str) – if strict=True, add missing keys to
+this list
+
unexpected_keys (list of str) – if strict=True, add unexpected
+keys to this list
+
error_msgs (list of str) – error messages should be added to this
+list, and will be reported together in
+load_state_dict()
These hooks will be called with arguments: state_dict, prefix,
+local_metadata, strict, missing_keys, unexpected_keys,
+error_msgs, before loading state_dict into self. These arguments
+are exactly the same as those of _load_from_state_dict.
These hooks will be called with arguments: self, state_dict,
+prefix, local_metadata, after the state_dict of self is set.
+Note that only parameters and buffers of self or its children are
+guaranteed to exist in state_dict. The hooks may modify state_dict
+inplace or return a new one.
Saves this module's state to the destination dictionary, containing the
+state of the module but not of its descendants. This is called on every
+submodule in state_dict().
+
In rare cases, subclasses can achieve class-specific behavior by
+overriding this method with custom logic.
+
+
Parameters
+
+
destination (dict) – a dict where state will be stored
+
prefix (str) – the prefix for parameters and buffers used in this
+module
Applies fn recursively to every submodule (as returned by .children())
+as well as self. Typical use includes initializing the parameters of a model
+(see also nn-init-doc).
+
+
Parameters
+
fn (Module -> None) – function to be applied to each submodule
recurse (bool) – if True, then yields buffers of this module
+and all submodules. Otherwise, yields only buffers that
+are direct members of this module.
Moves all model parameters and buffers to the GPU.
+
+This also makes the associated parameters and buffers different objects.
+It should therefore be called before constructing the optimizer if the
+module will live on the GPU while being optimized.
+
+
Parameters
+
device (int, optional) – if specified, all parameters will be
+copied to that device
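A sketch of the ordering this implies (the device choice is hedged to fall back to CPU, so the snippet runs without a GPU):

```python
import torch
import torch.nn as nn

model = nn.Linear(8, 1)

# Move first, then build the optimizer; otherwise the optimizer keeps
# references to the old, pre-move parameter objects.
device = "cuda" if torch.cuda.is_available() else "cpu"
model = model.to(device)
optimizer = torch.optim.SGD(model.parameters(), lr=0.1)

# The optimizer now tracks exactly the (possibly moved) parameters.
print(optimizer.param_groups[0]["params"][0] is model.weight)
```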
This has an effect only on certain modules. See the documentation of the
+particular modules for details of their behavior in training/evaluation
+mode, if they are affected, e.g. Dropout, BatchNorm,
+etc.
To print customized extra information, you should reimplement
+this method in your own modules. Both single-line and multi-line
+strings are acceptable.
Copies parameters and buffers from state_dict into
+this module and its descendants. If strict is True, then
+the keys of state_dict must exactly match the keys returned
+by this module’s state_dict() function.
+
+
Parameters
+
+
state_dict (dict) – a dict containing parameters and
+persistent buffers.
+
strict (bool, optional) – whether to strictly enforce that the keys
+in state_dict match the keys returned by this module’s
+state_dict() function. Default: True
+
+
+
Returns
+
+
missing_keys is a list of str containing the missing keys
+
unexpected_keys is a list of str containing the unexpected keys
+
+
+
+
Return type
+
NamedTuple with missing_keys and unexpected_keys fields
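A minimal sketch of the returned NamedTuple with strict=False (the modules here are illustrative):

```python
import torch
import torch.nn as nn

src = nn.Linear(3, 3)
dst = nn.Sequential(nn.Linear(3, 3))   # expects keys prefixed with "0."

result = dst.load_state_dict(src.state_dict(), strict=False)
# Keys expected by dst but absent from the loaded dict, and vice versa.
print(result.missing_keys)
print(result.unexpected_keys)
```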
Returns an iterator over module buffers, yielding both the
+name of the buffer as well as the buffer itself.
+
+
Parameters
+
+
prefix (str) – prefix to prepend to all buffer names.
+
recurse (bool) – if True, then yields buffers of this module
+and all submodules. Otherwise, yields only buffers that
+are direct members of this module.
+
+
+
Yields
+
(string, torch.Tensor) – Tuple containing the name and buffer
Returns an iterator over module parameters, yielding both the
+name of the parameter as well as the parameter itself.
+
+
Parameters
+
+
prefix (str) – prefix to prepend to all parameter names.
+
recurse (bool) – if True, then yields parameters of this module
+and all submodules. Otherwise, yields only parameters that
+are direct members of this module.
+
+
+
Yields
+
(string, Parameter) – Tuple containing the name and parameter
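For example (a hedged sketch), names are dot-joined paths when recursing into submodules:

```python
import torch
import torch.nn as nn

model = nn.Sequential(nn.Linear(2, 2), nn.BatchNorm1d(2))

# recurse=True (the default) also yields members of submodules.
param_names = [name for name, _ in model.named_parameters()]
buffer_names = [name for name, _ in model.named_buffers()]
print(param_names)    # e.g. ['0.weight', '0.bias', '1.weight', '1.bias']
print(buffer_names)   # BatchNorm's running statistics show up here
```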
recurse (bool) – if True, then yields parameters of this module
+and all submodules. Otherwise, yields only parameters that
+are direct members of this module.
The grad_input and grad_output may be tuples if the
+module has multiple inputs or outputs. The hook should not modify its
+arguments, but it can optionally return a new gradient with respect to
+input that will be used in place of grad_input in subsequent
+computations.
+
+
Returns
+
a handle that can be used to remove the added hook by calling
+handle.remove()
+
+
Return type
+
torch.utils.hooks.RemovableHandle
+
+
+
+
Warning
+
+The current implementation will not have the presented behavior
+for complex Modules that perform many operations.
+In some failure cases, grad_input and grad_output will only
+contain the gradients for a subset of the inputs and outputs.
+For such Modules, you should use torch.Tensor.register_hook()
+directly on a specific input or output to get the required gradients.
Abstract class for all calibration methods that are based on logistic regression. We extend common
+scaling calibration methods with Bayesian epistemic uncertainty modelling [1].
+On the one hand, this class supports Maximum Likelihood (MLE) estimates without uncertainty.
+This method is commonly solved by negative log likelihood optimization given by
+
+\[\theta_{\text{MLE}} = \underset{\theta}{\mathrm{argmin}} \; -\log p(y | X, \theta),\]
+
with samples \(X\), label \(y\), weights \(\theta\) and likelihood \(p(y|X, \theta)\).
+See the implementations of the methods for more details.
+
On the other hand, methods to obtain uncertainty in calibration are currently Variational Inference (VI) and
+Markov-Chain Monte-Carlo (MCMC) sampling. Instead of estimating the weights \(\theta\) of the logistic
+regression directly, we place a probability distribution over the weights by
+
+\[p(\theta | X, y) = \frac{p(y | X, \theta) \, p(\theta)}{\int p(y | X, \theta) \, p(\theta) \, d\theta}.\]
+
Since the marginal likelihood cannot be evaluated analytically for logistic regression, we need to approximate the
+posterior by either MCMC sampling or Variational Inference. Using several techniques, we sample multiple times from
+the posterior in order to obtain multiple related calibration results with a mean and a deviation for each sample.
+
MCMC sampling allows sampling from a posterior without knowing the marginal likelihood. This method is unbiased
+but computationally expensive. In contrast, Variational Inference defines a simple variational
+distribution \(q_\Phi(\theta)\) (e.g. a normal distribution) for each weight, parametrized by \(\Phi\).
+The optimization objective is then the minimization of the Kullback-Leibler divergence between the
+variational distribution \(q_\Phi(\theta)\) and the true posterior \(p(\theta | X, y)\).
+This can be solved using the ELBO method [2]. Variational Inference is faster than MCMC but also biased.
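The MLE path boils down to minimizing the negative log likelihood of a logistic model on the logit of the confidences. A minimal NumPy/SciPy sketch of that idea (classic Platt scaling; this is illustrative, not netcal's actual implementation, and fit_platt is a hypothetical name):

```python
import numpy as np
from scipy.optimize import minimize

def fit_platt(confidences, labels):
    """Minimize the negative log likelihood -log p(y | X, theta) of a
    logistic model sigmoid(a * logit(p) + b). Illustrative sketch only."""
    eps = 1e-12
    z = np.log(confidences + eps) - np.log(1.0 - confidences + eps)

    def nll(theta):
        a, b = theta
        p = 1.0 / (1.0 + np.exp(-(a * z + b)))
        return -np.mean(labels * np.log(p + eps)
                        + (1.0 - labels) * np.log(1.0 - p + eps))

    return minimize(nll, x0=np.array([1.0, 0.0])).x

rng = np.random.default_rng(0)
conf = rng.uniform(0.05, 0.95, size=500)
y = (rng.uniform(size=500) < conf ** 2).astype(float)  # overconfident data
a, b = fit_platt(conf, y)
```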
+
+
Parameters
+
+
method (str, default: "mle") – Method that is used to obtain a calibration mapping:
+- ‘mle’: Maximum likelihood estimate without uncertainty using a convex optimizer.
+- ‘momentum’: MLE estimate using Momentum optimizer for non-convex optimization.
+- ‘variational’: Variational Inference with uncertainty.
+- ‘mcmc’: Markov-Chain Monte-Carlo sampling with uncertainty.
+
momentum_epochs (int, optional, default: 1000) – Number of epochs used by momentum optimizer.
+
mcmc_steps (int, optional, default: 20) – Number of weight samples obtained by MCMC sampling.
+
mcmc_chains (int, optional, default: 1) – Number of Markov-chains used in parallel for MCMC sampling (this will result
+in mcmc_steps * mcmc_chains samples).
+
mcmc_warmup_steps (int, optional, default: 100) – Warmup steps used for MCMC sampling.
+
vi_epochs (int, optional, default: 1000) – Number of epochs used for ELBO optimization.
+
detection (bool, default: False) – If False, the input array ‘X’ is treated as multi-class confidence input (softmax)
+with shape (n_samples, [n_classes]).
+If True, the input array ‘X’ is treated as box predictions with several box features (at least
+box confidence must be present) with shape (n_samples, [n_box_features]).
+
independent_probabilities (bool, optional, default: False) – Boolean for multi class probabilities.
+If set to True, the probability estimates for each
+class are treated as independent of each other (sigmoid).
+
use_cuda (str or bool, optional, default: False) – Specify if CUDA should be used. If str, you can also specify the device
+number like ‘cuda:0’, etc.
Michael I Jordan, Zoubin Ghahramani, Tommi S Jaakkola, and Lawrence K Saul:
+“An introduction to variational methods for graphical models.” Machine learning, 37(2): 183–233, 1999.
+
+
+
Methods
+
+
+
+
+
+
+
__init__([method, momentum_epochs, …])
+
Create an instance of AbstractLogisticRegression.
+
+
clear()
+
Clear model parameters.
+
+
convex(data, y, tensorboard, log_dir)
+
Convex optimization to find the global optimum of current parameter search.
+
+
fit(X, y[, random_state, tensorboard, log_dir])
+
Build logistic calibration model either conventionally with a single MLE estimate or with Variational Inference (VI) or Markov-Chain Monte-Carlo (MCMC) algorithm to also obtain uncertainty estimates.
+
+
fit_transform(X[, y])
+
Fit to data, then transform it.
+
+
get_params([deep])
+
Get parameters for this estimator.
+
+
guide([X, y])
+
Variational substitution definition for each parameter.
+
+
load_model(filename)
+
Load model from saved torch dump.
+
+
mask()
+
+Search for all relevant weights whose values are negative.
+
+
mcmc(data, y, tensorboard, log_dir)
+
Perform Markov-Chain Monte-Carlo sampling on the (unknown) posterior.
+
+
model([X, y])
+
Definition of the log regression model.
+
+
momentum(data, y, tensorboard, log_dir)
+
Momentum optimization to find the global optimum of current parameter search.
+
+
prepare(X)
+
+Preprocessing of input data; called at the beginning of the fit function.
+
+
prior()
+
Prior definition of the weights and intercept used for log regression.
+
+
save_model(filename)
+
+Save the model instance with torch’s save function, as this is safer for torch tensors.
+
+
set_params(**params)
+
Set the parameters of this estimator.
+
+
squeeze_generic(a, axes_to_keep)
+
Squeeze input array a but keep axes defined by parameter ‘axes_to_keep’ even if the dimension is of size 1.
+
+
to(device)
+
Set distribution parameters to the desired device in order to compute either on CPU or GPU.
+
+
transform(X[, num_samples, random_state, …])
+
After model calibration, this function is used to get calibrated outputs of uncalibrated confidence estimates.
Build logistic calibration model either conventionally with a single MLE estimate or with
+Variational Inference (VI) or Markov-Chain Monte-Carlo (MCMC) algorithm to also obtain uncertainty estimates.
+
+
Parameters
+
+
X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction on classification with shapes
+1-D for binary classification, 2-D for multi class (softmax).
+On detection, this array must have 2 dimensions with number of additional box features in last dim.
+
y (np.ndarray, shape=(n_samples, [n_classes])) – NumPy array with ground truth labels.
+Either as label vector (1-D) or as one-hot encoded ground truth array (2-D).
+
random_state (int, optional, default: None) – Fix the random seed for the random number generator.
Variational substitution definition for each parameter. The signature is the same as for the
+“self.model” function but the variables are not used.
+
+
Parameters
+
+
X (torch.Tensor, shape=(n_samples, n_log_regression_features)) – Input data that has been prepared by “self.prepare” function call.
+
y (torch.Tensor, shape=(n_samples, [n_classes])) – Torch tensor with ground truth labels.
+Either as label vector (1-D) or as one-hot encoded ground truth array (2-D) (for multiclass MLE only).
Search for all relevant weights whose values are negative. Mask those values with optimization constraints
+in the interval [0, 0].
+Constraints on the intercepts might also be set.
+
+
Returns
+
Indices of masked values and list of boundary constraints for optimization.
X (torch.Tensor, shape=(n_samples, n_log_regression_features)) – Input data that has been prepared by “self.prepare” function call.
+
y (torch.Tensor, shape=(n_samples, [n_classes])) – Torch tensor with ground truth labels.
+Either as label vector (1-D) or as one-hot encoded ground truth array (2-D) (for multiclass MLE only).
Momentum optimization to find the global optimum of current parameter search.
+This method is slow but tends to find the global optimum for non-convex optimization.
+
+
Parameters
+
+
data_input (np.ndarray, shape=(n_samples, n_features)) – NumPy 2-D array with data input.
+
y (np.ndarray, shape=(n_samples,)) – NumPy array with ground truth labels as 1-D vector (binary).
Preprocessing of input data; called at the beginning of the fit function.
+
+
Parameters
+
X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction on classification with shapes
+1-D for binary classification, 2-D for multi class (softmax).
+On detection, this array must have 2 dimensions with number of additional box features in last dim.
The method works on simple estimators as well as on nested objects
+(such as pipelines). The latter have parameters of the form
+<component>__<parameter> so that it’s possible to update each
+component of a nested object.
Set distribution parameters to the desired device in order to compute either on CPU or GPU.
+
+
+
+
+transform(X: numpy.ndarray, num_samples: int = 1000, random_state: int = None, mean_estimate: bool = False) → numpy.ndarray
+
After model calibration, this function is used to get calibrated outputs of uncalibrated
+confidence estimates.
+
+
Parameters
+
+
X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction on classification with shapes
+1-D for binary classification, 2-D for multi class (softmax).
+On detection, this array must have 2 dimensions with number of additional box features in last dim.
+
num_samples (int, optional, default: 1000) – Number of samples generated on MCMC sampling or Variational Inference.
+
+random_state (int, optional, default: None) – Fix the random seed for the random number generator.
+
mean_estimate (bool, optional, default: False) – If True, directly return the mean on probabilistic methods like MCMC or VI instead of the full
+distribution. This parameter has no effect on MLE.
+
+
+
Returns
+
+
np.ndarray, shape=(n_samples, [n_classes]) on MLE or on MCMC/VI if ‘mean_estimate’ is True
+
or shape=(n_parameters, n_samples, [n_classes]) on VI, MCMC if ‘mean_estimate’ is False – On MLE without uncertainty, return NumPy array with calibrated confidence estimates.
+1-D for binary classification, 2-D for multi class (softmax).
+On VI or MCMC, return NumPy array with leading dimension as the number of sampled parameters from the
+log regression parameter distribution obtained by VI or MCMC.
On classification, apply the beta calibration method to obtain a calibration mapping. The original method was
proposed by [1].
For the multiclass case, we extended this method to work with multinomial logistic regression instead of a
@@ -58,7 +58,8 @@
netcal.scaling.BetaCalibration2. This calibration scheme
assumes independence between all variables.
-
It is necessary to provide all data in input parameter X as an NumPy array of shape (n_samples,n_features),
+
On detection, it is necessary to provide all data in input parameter X as an NumPy array
+of shape (n_samples,n_features),
whereas the confidence must be the first feature given in the input array. The ground-truth samples y
must be an array of shape (n_samples,) consisting of binary labels \(y \in \{0, 1\}\). Those
labels indicate if the according sample has matched a ground truth box \(\text{m}=1\) or is a false
@@ -97,7 +98,17 @@
Convex optimization to find the global optimum of current parameter search.
+
+
fit(X, y[, random_state, tensorboard, log_dir])
+
Build logistic calibration model either conventionally with a single MLE estimate or with Variational Inference (VI) or Markov-Chain Monte-Carlo (MCMC) algorithm to also obtain uncertainty estimates.
-
fit_transform(X[, y])
+
fit_transform(X[, y])
Fit to data, then transform it.
-
get_params([deep])
+
get_params([deep])
Get parameters for this estimator.
+
guide([X, y])
+
Variational substitution definition for each parameter.
+
load_model(filename)
-
Load model from saved Pickle instance.
+
Load model from saved torch dump.
+
+
mask()
+
Search for all relevant weights whose values are negative.
+
+
mcmc(data, y, tensorboard, log_dir)
+
Perform Markov-Chain Monte-Carlo sampling on the (unknown) posterior.
+
+
model([X, y])
+
Definition of the log regression model.
+
+
momentum(data, y, tensorboard, log_dir)
+
Momentum optimization to find the global optimum of current parameter search.
+
+
prepare(X)
+
Preprocessing of input data; called at the beginning of the fit function.
+
+
prior()
+
Prior definition of the weights used for log regression.
save_model(filename)
-
Save model instance as Pickle Object.
+
Save the model instance with torch’s save function, as this is safer for torch tensors.
set_params(**params)
Set the parameters of this estimator.
@@ -156,9 +198,15 @@
netcal.scaling.BetaCalibration
squeeze_generic(a, axes_to_keep)
Squeeze input array a but keep axes defined by parameter ‘axes_to_keep’ even if the dimension is of size 1.
-
transform(X)
+
to(device)
+
Set distribution parameters to the desired device in order to compute either on CPU or GPU.
+
+
transform(X[, num_samples, random_state, …])
After model calibration, this function is used to get calibrated outputs of uncalibrated confidence estimates.
Build logistic calibration model either conventionally with a single MLE estimate or with
+Variational Inference (VI) or Markov-Chain Monte-Carlo (MCMC) algorithm to also obtain uncertainty estimates.
Variational substitution definition for each parameter. The signature is the same as for the
+“self.model” function but the variables are not used.
+
+
Parameters
+
+
X (torch.Tensor, shape=(n_samples, n_log_regression_features)) – Input data that has been prepared by “self.prepare” function call.
+
y (torch.Tensor, shape=(n_samples, [n_classes])) – Torch tensor with ground truth labels.
+Either as label vector (1-D) or as one-hot encoded ground truth array (2-D) (for multiclass MLE only).
X (torch.Tensor, shape=(n_samples, n_log_regression_features)) – Input data that has been prepared by “self.prepare” function call.
+
y (torch.Tensor, shape=(n_samples, [n_classes])) – Torch tensor with ground truth labels.
+Either as label vector (1-D) or as one-hot encoded ground truth array (2-D) (for multiclass MLE only).
Momentum optimization to find the global optimum of current parameter search.
+This method is slow but tends to find the global optimum for non-convex optimization.
+
+
Parameters
+
+
data_input (np.ndarray, shape=(n_samples, n_features)) – NumPy 2-D array with data input.
+
y (np.ndarray, shape=(n_samples,)) – NumPy array with ground truth labels as 1-D vector (binary).
Preprocessing of input data; called at the beginning of the fit function.
+
+
Parameters
+
X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction on classification with shapes
+1-D for binary classification, 2-D for multi class (softmax).
+On detection, this array must have 2 dimensions with number of additional box features in last dim.
Prior definition of the weights used for log regression. This function has to set the
+variables ‘self.weight_prior_dist’, ‘self.weight_mean_init’ and ‘self.weight_stddev_init’.
+transform(X: numpy.ndarray, num_samples: int = 1000, random_state: int = None, mean_estimate: bool = False) → numpy.ndarray
After model calibration, this function is used to get calibrated outputs of uncalibrated
confidence estimates.
Parameters
-
X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction on classification with shapes
+
+
X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction on classification with shapes
1-D for binary classification, 2-D for multi class (softmax).
-On detection, this array must have 2 dimensions with number of additional box features in last dim.
+On detection, this array must have 2 dimensions with number of additional box features in last dim.
+
num_samples (int, optional, default: 1000) – Number of samples generated on MCMC sampling or Variational Inference.
+
random_state (int, optional, default: None) – Fix the random seed for the random number generator.
+
mean_estimate (bool, optional, default: False) – If True, directly return the mean on probabilistic methods like MCMC or VI instead of the full
+distribution. This parameter has no effect on MLE.
+
Returns
-
NumPy array with calibrated confidence estimates.
-1-D for binary classification, 2-D for multi class (softmax).
+
+
np.ndarray, shape=(n_samples, [n_classes]) on MLE or on MCMC/VI if ‘mean_estimate’ is True
+
or shape=(n_parameters, n_samples, [n_classes]) on VI, MCMC if ‘mean_estimate’ is False – On MLE without uncertainty, return NumPy array with calibrated confidence estimates.
+1-D for binary classification, 2-D for multi class (softmax).
+On VI or MCMC, return NumPy array with leading dimension as the number of sampled parameters from the
+log regression parameter distribution obtained by VI or MCMC.
This calibration method uses a multivariate variant of a Beta distribution to obtain a
calibration mapping by means of the confidence as well as additional features. This method is originally
proposed by [1]. This calibration scheme
@@ -102,13 +102,22 @@
Build dependent Beta Calibration model for multivariate Beta distributions.
+
convex(data, y, tensorboard, log_dir)
+
Convex optimization to find the global optimum of current parameter search.
+
+
fit(X, y[, random_state, tensorboard, log_dir])
+
Build logistic calibration model either conventionally with a single MLE estimate or with Variational Inference (VI) or Markov-Chain Monte-Carlo (MCMC) algorithm to also obtain uncertainty estimates.
-
fit_transform(X[, y])
+
fit_transform(X[, y])
Fit to data, then transform it.
-
get_params([deep])
+
get_params([deep])
Get parameters for this estimator.
+
guide([X, y])
+
Variational substitution definition for each parameter.
+
load_model(filename)
-
Load model from saved Pickle instance.
+
Load model from saved torch dump.
+
+
mask()
+
Search for all relevant weights whose values are negative.
+
+
mcmc(data, y, tensorboard, log_dir)
+
Perform Markov-Chain Monte-Carlo sampling on the (unknown) posterior.
+
+
model([X, y])
+
Definition of the log regression model.
+
+
momentum(data, y, tensorboard, log_dir)
+
Momentum optimization to find the global optimum of current parameter search.
+
+
prepare(X)
+
Preprocessing of input data; called at the beginning of the fit function.
+
+
prior()
+
Prior definition of the weights used for log regression.
save_model(filename)
-
Save model instance as Pickle Object.
+
Save the model instance with torch’s save function, as this is safer for torch tensors.
set_params(**params)
Set the parameters of this estimator.
@@ -159,21 +197,54 @@
netcal.scaling.BetaCalibrationDependent
squeeze_generic(a, axes_to_keep)
Squeeze input array a but keep axes defined by parameter ‘axes_to_keep’ even if the dimension is of size 1.
-
transform(X)
+
to(device)
+
Set distribution parameters to the desired device in order to compute either on CPU or GPU.
+
+
transform(X[, num_samples, random_state, …])
After model calibration, this function is used to get calibrated outputs of uncalibrated confidence estimates.
Build logistic calibration model either conventionally with a single MLE estimate or with
+Variational Inference (VI) or Markov-Chain Monte-Carlo (MCMC) algorithm to also obtain uncertainty estimates.
Variational substitution definition for each parameter. The signature is the same as for the
+“self.model” function but the variables are not used.
+
+
Parameters
+
+
X (torch.Tensor, shape=(n_samples, n_log_regression_features)) – Input data that has been prepared by “self.prepare” function call.
+
y (torch.Tensor, shape=(n_samples, [n_classes])) – Torch tensor with ground truth labels.
+Either as label vector (1-D) or as one-hot encoded ground truth array (2-D) (for multiclass MLE only).
Search for all relevant weights whose values are negative. Mask those values with optimization constraints
+in the interval [0, 0].
+Constraints on the intercepts might also be set.
+
+
Returns
+
Indices of masked values and list of boundary constraints for optimization.
X (torch.Tensor, shape=(n_samples, n_log_regression_features)) – Input data that has been prepared by “self.prepare” function call.
+
y (torch.Tensor, shape=(n_samples, [n_classes])) – Torch tensor with ground truth labels.
+Either as label vector (1-D) or as one-hot encoded ground truth array (2-D) (for multiclass MLE only).
Momentum optimization to find the global optimum of current parameter search.
+This method is slow but tends to find the global optimum for non-convex optimization.
+
+
Parameters
+
+
data_input (np.ndarray, shape=(n_samples, n_features)) – NumPy 2-D array with data input.
+
y (np.ndarray, shape=(n_samples,)) – NumPy array with ground truth labels as 1-D vector (binary).
Preprocessing of input data; called at the beginning of the fit function.
+
+
Parameters
+
X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction on classification with shapes
+1-D for binary classification, 2-D for multi class (softmax).
+On detection, this array must have 2 dimensions with number of additional box features in last dim.
Prior definition of the weights used for log regression. This function has to set the
+variables ‘self.weight_prior_dist’, ‘self.weight_mean_init’ and ‘self.weight_stddev_init’.
+transform(X: numpy.ndarray, num_samples: int = 1000, random_state: int = None, mean_estimate: bool = False) → numpy.ndarray
After model calibration, this function is used to get calibrated outputs of uncalibrated
confidence estimates.
Parameters
-
X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction on classification with shapes
+
+
X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction on classification with shapes
1-D for binary classification, 2-D for multi class (softmax).
-On detection, this array must have 2 dimensions with number of additional box features in last dim.
+On detection, this array must have 2 dimensions with number of additional box features in last dim.
+
num_samples (int, optional, default: 1000) – Number of samples generated on MCMC sampling or Variational Inference.
+
random_state (int, optional, default: None) – Fix the random seed for the random number generator.
+
mean_estimate (bool, optional, default: False) – If True, directly return the mean on probabilistic methods like MCMC or VI instead of the full
+distribution. This parameter has no effect on MLE.
+
Returns
-
NumPy array with calibrated confidence estimates.
-1-D for binary classification, 2-D for multi class (softmax).
+
+
np.ndarray, shape=(n_samples, [n_classes]) on MLE or on MCMC/VI if ‘mean_estimate’ is True
+
or shape=(n_parameters, n_samples, [n_classes]) on VI, MCMC if ‘mean_estimate’ is False – On MLE without uncertainty, return NumPy array with calibrated confidence estimates.
+1-D for binary classification, 2-D for multi class (softmax).
+On VI or MCMC, return NumPy array with leading dimension as the number of sampled parameters from the
+log regression parameter distribution obtained by VI or MCMC.
On classification, apply the logistic calibration method, aka Platt scaling, to obtain a calibration mapping. This method was originally proposed by 1. For the multiclass case, we use the Vector scaling proposed in 2.
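As a sketch of the underlying mapping (pure NumPy, assuming a 1-D binary-confidence input; the helper name is hypothetical, and netcal estimates the scale and bias itself via the optimizers listed in the Methods table), Platt scaling maps a confidence \(\hat{p}\) to \(\hat{q} = \text{sigmoid}(a \cdot \text{logit}(\hat{p}) + b)\):

```python
import numpy as np

def sigmoid(z):
    return 1.0 / (1.0 + np.exp(-z))

def platt_transform(p, a=1.0, b=0.0, eps=1e-12):
    """Apply a logistic (Platt) mapping to binary confidences.

    p: uncalibrated confidences in (0, 1); a, b: learned scale and bias
    (fixed here for illustration only).
    """
    p = np.clip(p, eps, 1.0 - eps)
    logit = np.log(p / (1.0 - p))
    return sigmoid(a * logit + b)

# With identity parameters (a=1, b=0) the mapping leaves confidences unchanged.
calibrated = platt_transform(np.array([0.1, 0.5, 0.9]))
```

Fitting then amounts to choosing a and b that minimize the negative log-likelihood on held-out data.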
Convex optimization to find the global optimum of current parameter search.

fit(X, y[, random_state, tensorboard, log_dir])
Build logistic calibration model either conventionally with a single MLE estimate or with Variational Inference (VI) or Markov-Chain Monte-Carlo (MCMC) sampling to also obtain uncertainty estimates.

fit_transform(X[, y])
Fit to data, then transform it.

get_params([deep])
Get parameters for this estimator.

guide([X, y])
Variational substitution definition for each parameter.

load_model(filename)
Load model from saved torch dump.

mask()
Seek all relevant weights whose values are negative.

mcmc(data, y, tensorboard, log_dir)
Perform Markov-Chain Monte-Carlo sampling on the (unknown) posterior.

model([X, y])
Definition of the log regression model.

momentum(data, y, tensorboard, log_dir)
Momentum optimization to find the global optimum of current parameter search.

prepare(X)
Preprocessing of input data, called at the beginning of the fit-function.

prior()
Prior definition of the weights used for log regression.

save_model(filename)
Save model instance with torch’s save function, as this is safer for torch tensors.

set_params(**params)
Set the parameters of this estimator.
netcal.scaling.LogisticCalibration

squeeze_generic(a, axes_to_keep)
Squeeze input array a but keep axes defined by parameter ‘axes_to_keep’ even if the dimension is of size 1.

to(device)
Set distribution parameters to the desired device in order to compute either on CPU or GPU.

transform(X[, num_samples, random_state, …])
After model calibration, this function is used to get calibrated outputs of uncalibrated confidence estimates.
Build logistic calibration model either conventionally with a single MLE estimate or with Variational Inference (VI) or Markov-Chain Monte-Carlo (MCMC) sampling to also obtain uncertainty estimates.

Variational substitution definition for each parameter. The signature is the same as for the “self.model” function, but the variables are not used.

Parameters

X (torch.Tensor, shape=(n_samples, n_log_regression_features)) – Input data that has been prepared by the “self.prepare” function call.

y (torch.Tensor, shape=(n_samples, [n_classes])) – Torch tensor with ground-truth labels, either as a label vector (1-D) or as a one-hot encoded ground-truth array (2-D, for multiclass MLE only).

Seek all relevant weights whose values are negative. Mask those values with optimization constraints in the interval [0, 0]. Constraints on the intercepts might also be set.

Returns
Indices of masked values and list of boundary constraints for optimization.
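The masking idea can be sketched in plain NumPy (a hypothetical helper, not netcal’s actual implementation): negative weights are located, and each receives the degenerate bound [0, 0] so the optimizer clamps it to zero, while all other weights stay unconstrained.

```python
import numpy as np

def mask_negative_weights(weights: np.ndarray):
    """Return indices of negative weights and per-weight bounds.

    Negative weights get the degenerate interval (0, 0); all others
    stay unconstrained, expressed as (None, None) as accepted by
    common optimizers such as scipy.optimize.minimize.
    """
    masked = np.where(weights < 0)[0]
    bounds = [(0.0, 0.0) if w < 0 else (None, None) for w in weights]
    return masked, bounds

idx, bounds = mask_negative_weights(np.array([0.5, -0.2, 1.3, -0.7]))
# idx contains the positions of the negative weights (here 1 and 3).
```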
X (torch.Tensor, shape=(n_samples, n_log_regression_features)) – Input data that has been prepared by the “self.prepare” function call.

y (torch.Tensor, shape=(n_samples, [n_classes])) – Torch tensor with ground-truth labels, either as a label vector (1-D) or as a one-hot encoded ground-truth array (2-D, for multiclass MLE only).
Momentum optimization to find the global optimum of current parameter search. This method is slow but tends to find the global optimum for non-convex optimization.

Parameters

data_input (np.ndarray, shape=(n_samples, n_features)) – NumPy 2-D array with data input.

y (np.ndarray, shape=(n_samples,)) – NumPy array with ground-truth labels as a 1-D vector (binary).

Preprocessing of input data, called at the beginning of the fit-function.

Parameters

X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction: 1-D for binary classification, 2-D for multi-class (softmax). On detection, this array must have 2 dimensions with the number of additional box features in the last dim.

Prior definition of the weights used for log regression. This function has to set the variables ‘self.weight_prior_dist’, ‘self.weight_mean_init’ and ‘self.weight_stddev_init’.
transform(X: numpy.ndarray, num_samples: int = 1000, random_state: int = None, mean_estimate: bool = False) → numpy.ndarray

After model calibration, this function is used to get calibrated outputs of uncalibrated confidence estimates.

Parameters

X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction: 1-D for binary classification, 2-D for multi-class (softmax). On detection, this array must have 2 dimensions with the number of additional box features in the last dim.

num_samples (int, optional, default: 1000) – Number of samples generated on MCMC sampling or Variational Inference.

random_state (int, optional, default: None) – Fix the random seed for the random number generator.

mean_estimate (bool, optional, default: False) – If True, directly return the mean on probabilistic methods like MCMC or VI instead of the full distribution. This parameter has no effect on MLE.

Returns

np.ndarray, shape=(n_samples, [n_classes]) on MLE, or on MCMC/VI if ‘mean_estimate’ is True; shape=(n_parameters, n_samples, [n_classes]) on VI/MCMC if ‘mean_estimate’ is False – On MLE without uncertainty, returns a NumPy array with calibrated confidence estimates: 1-D for binary classification, 2-D for multi-class (softmax). On VI or MCMC, returns a NumPy array whose leading dimension is the number of parameter sets sampled from the log-regression parameter distribution obtained by VI or MCMC.
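The return-shape convention can be illustrated with a toy NumPy example (hypothetical values, not actual netcal output): on VI or MCMC, one calibrated array is produced per sampled parameter set, and ‘mean_estimate’ corresponds to collapsing the leading parameter dimension.

```python
import numpy as np

rng = np.random.default_rng(0)
n_parameters, n_samples = 5, 8

# Stack of calibrated outputs, one row per sampled parameter set
# (shape (n_parameters, n_samples) in the binary 1-D case).
full_distribution = rng.uniform(size=(n_parameters, n_samples))

# 'mean_estimate=True' corresponds to averaging over the parameter axis,
# yielding the plain (n_samples,) shape that MLE also returns.
mean_estimate = full_distribution.mean(axis=0)

assert full_distribution.shape == (5, 8)
assert mean_estimate.shape == (8,)
```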
This calibration method is for detection only and uses multivariate normal distributions to obtain a calibration mapping by means of the confidence as well as additional features. This calibration scheme tries to model several dependencies in the variables given by the input X. This method was originally proposed by 1.
It is necessary to provide all data in input parameter X as a NumPy array of shape (n_samples, n_features),
whereas the confidence must be the first feature given in the input array. The ground-truth samples y
must be an array of shape (n_samples,) consisting of binary labels \(y \in \{0, 1\}\). Those
@@ -71,7 +70,7 @@
Fabian Küppers, Jan Kronenberger, Amirhossein Shantia and Anselm Haselhoff:
“Multivariate Confidence Calibration for Object Detection.”
The IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops, 2020.
Kull, Meelis, Telmo Silva Filho, and Peter Flach:
“Beta calibration: a well-founded and easily implemented improvement on logistic calibration for binary classifiers.”
Artificial Intelligence and Statistics, PMLR 54:623-631, 2017.
Get source online

3
Fabian Küppers, Jan Kronenberger, Jonas Schneider and Anselm Haselhoff:
“Bayesian Confidence Calibration for Epistemic Uncertainty Modelling.”
2021 IEEE Intelligent Vehicles Symposium (IV), 2021.
Methods
netcal.scaling.LogisticCalibrationDependent

__init__(*args, **kwargs)
Create an instance of LogisticCalibrationDependent.

clear()
Clear model parameters.

convex(data, y, tensorboard, log_dir)
Convex optimization to find the global optimum of current parameter search.

fit(X, y[, random_state, tensorboard, log_dir])
Build logistic calibration model either conventionally with a single MLE estimate or with Variational Inference (VI) or Markov-Chain Monte-Carlo (MCMC) sampling to also obtain uncertainty estimates.

fit_transform(X[, y])
Fit to data, then transform it.

get_params([deep])
Get parameters for this estimator.

guide([X, y])
Variational substitution definition for each parameter.

load_model(filename)
Load model from saved torch dump.

mask()
Seek all relevant weights whose values are negative.

mcmc(data, y, tensorboard, log_dir)
Perform Markov-Chain Monte-Carlo sampling on the (unknown) posterior.

model([X, y])
Definition of the log regression model.

momentum(data, y, tensorboard, log_dir)
Momentum optimization to find the global optimum of current parameter search.

prepare(X)
Preprocessing of input data, called at the beginning of the fit-function.

prior()
Prior definition of the weights used for log regression.

save_model(filename)
Save model instance with torch’s save function, as this is safer for torch tensors.

set_params(**params)
Set the parameters of this estimator.
netcal.scaling.LogisticCalibrationDependent

squeeze_generic(a, axes_to_keep)
Squeeze input array a but keep axes defined by parameter ‘axes_to_keep’ even if the dimension is of size 1.

to(device)
Set distribution parameters to the desired device in order to compute either on CPU or GPU.

transform(X[, num_samples, random_state, …])
After model calibration, this function is used to get calibrated outputs of uncalibrated confidence estimates.
Build logistic calibration model either conventionally with a single MLE estimate or with Variational Inference (VI) or Markov-Chain Monte-Carlo (MCMC) sampling to also obtain uncertainty estimates.

Variational substitution definition for each parameter. The signature is the same as for the “self.model” function, but the variables are not used.

Parameters

X (torch.Tensor, shape=(n_samples, n_log_regression_features)) – Input data that has been prepared by the “self.prepare” function call.

y (torch.Tensor, shape=(n_samples, [n_classes])) – Torch tensor with ground-truth labels, either as a label vector (1-D) or as a one-hot encoded ground-truth array (2-D, for multiclass MLE only).

Seek all relevant weights whose values are negative. Mask those values with optimization constraints in the interval [0, 0]. Constraints on the intercepts might also be set.

Returns

Indices of masked values and list of boundary constraints for optimization.

X (torch.Tensor, shape=(n_samples, n_log_regression_features)) – Input data that has been prepared by the “self.prepare” function call.

y (torch.Tensor, shape=(n_samples, [n_classes])) – Torch tensor with ground-truth labels, either as a label vector (1-D) or as a one-hot encoded ground-truth array (2-D, for multiclass MLE only).
Momentum optimization to find the global optimum of current parameter search. This method is slow but tends to find the global optimum for non-convex optimization.

Parameters

data_input (np.ndarray, shape=(n_samples, n_features)) – NumPy 2-D array with data input.

y (np.ndarray, shape=(n_samples,)) – NumPy array with ground-truth labels as a 1-D vector (binary).

Preprocessing of input data, called at the beginning of the fit-function.

Parameters

X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction: 1-D for binary classification, 2-D for multi-class (softmax). On detection, this array must have 2 dimensions with the number of additional box features in the last dim.

Prior definition of the weights used for log regression. This function has to set the variables ‘self.weight_prior_dist’, ‘self.weight_mean_init’ and ‘self.weight_stddev_init’.
transform(X: numpy.ndarray, num_samples: int = 1000, random_state: int = None, mean_estimate: bool = False) → numpy.ndarray

After model calibration, this function is used to get calibrated outputs of uncalibrated confidence estimates.

Parameters

X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction: 1-D for binary classification, 2-D for multi-class (softmax). On detection, this array must have 2 dimensions with the number of additional box features in the last dim.

num_samples (int, optional, default: 1000) – Number of samples generated on MCMC sampling or Variational Inference.

random_state (int, optional, default: None) – Fix the random seed for the random number generator.

mean_estimate (bool, optional, default: False) – If True, directly return the mean on probabilistic methods like MCMC or VI instead of the full distribution. This parameter has no effect on MLE.

Returns

np.ndarray, shape=(n_samples, [n_classes]) on MLE, or on MCMC/VI if ‘mean_estimate’ is True; shape=(n_parameters, n_samples, [n_classes]) on VI/MCMC if ‘mean_estimate’ is False – On MLE without uncertainty, returns a NumPy array with calibrated confidence estimates: 1-D for binary classification, 2-D for multi-class (softmax). On VI or MCMC, returns a NumPy array whose leading dimension is the number of parameter sets sampled from the log-regression parameter distribution obtained by VI or MCMC.
Perform temperature scaling on the logits of a NN. This method was originally proposed by 1.

On classification or detection, apply the temperature scaling method described in 1 to obtain a calibration mapping. For confidence calibration in classification tasks, a confidence mapping \(g\) is applied on top of a miscalibrated scoring classifier \(\hat{p} = h(x)\) to deliver a calibrated confidence score \(\hat{q} = g(h(x))\).

For detection calibration, we can also use the additional box regression output, which we denote as \(\hat{r} \in [0, 1]^J\) with \(J\) as the number of dimensions used for the box encoding (e.g. \(J=4\) for x position, y position, width and height). Therefore, the calibration map is not only a function of the confidence score, but also of \(\hat{r}\). To define a general calibration map, we use the combined input \(s = (\hat{p}, \hat{r})\) of size \(K\) and perform a temperature scaling defined by

\[\hat{q} = \sigma(s / T)\]

with the temperature \(T \in \mathbb{R}\) as a single scalar value. The function \(\sigma(*)\) is either the sigmoid (on detection or binary classification) or the softmax operator (multiclass classification).

We utilize standard optimization methods to determine the calibration mapping \(g(s)\).
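The scaling itself is a one-parameter operation; a minimal NumPy sketch for the multiclass case (T fixed here for illustration; netcal estimates T during fitting):

```python
import numpy as np

def softmax(z, axis=-1):
    z = z - z.max(axis=axis, keepdims=True)  # numerical stability
    e = np.exp(z)
    return e / e.sum(axis=axis, keepdims=True)

def temperature_scale(logits, T):
    """Apply q = softmax(z / T). T > 1 softens the distribution
    (lower confidence), T < 1 sharpens it; T = 1 leaves it unchanged.
    Note that scaling by T never changes the argmax, so accuracy is
    preserved while confidence is recalibrated."""
    return softmax(logits / T)

z = np.array([[2.0, 1.0, 0.1]])
assert np.allclose(temperature_scale(z, 1.0), softmax(z))
# A larger temperature lowers the top-class confidence:
assert temperature_scale(z, 2.0).max() < temperature_scale(z, 1.0).max()
```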
Parameters

method (str, default: “mle”) – Method that is used to obtain a calibration mapping:
- ‘mle’: Maximum likelihood estimate without uncertainty using a convex optimizer.
- ‘momentum’: MLE estimate using Momentum optimizer for non-convex optimization.
- ‘variational’: Variational Inference with uncertainty.
- ‘mcmc’: Markov-Chain Monte-Carlo sampling with uncertainty.

momentum_epochs (int, optional, default: 1000) – Number of epochs used by Momentum optimizer.

mcmc_steps (int, optional, default: 20) – Number of weight samples obtained by MCMC sampling.

mcmc_chains (int, optional, default: 1) – Number of Markov chains used in parallel for MCMC sampling (this will result in mcmc_steps * mcmc_chains samples).

mcmc_warmup_steps (int, optional, default: 100) – Warmup steps used for MCMC sampling.

vi_epochs (int, optional, default: 1000) – Number of epochs used for ELBO optimization.

detection (bool, default: False) – If False, the input array ‘X’ is treated as multi-class confidence input (softmax) with shape (n_samples, [n_classes]). If True, the input array ‘X’ is treated as box predictions with several box features (at least
Chuan Guo, Geoff Pleiss, Yu Sun and Kilian Q. Weinberger:
“On Calibration of Modern Neural Networks.”
Proceedings of the 34th International Conference on Machine Learning, Volume 70. JMLR.org, 2017.
Get source online

Fabian Küppers, Jan Kronenberger, Amirhossein Shantia and Anselm Haselhoff:
“Multivariate Confidence Calibration for Object Detection.”
The IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops, 2020.

3
Fabian Küppers, Jan Kronenberger, Jonas Schneider and Anselm Haselhoff:
“Bayesian Confidence Calibration for Epistemic Uncertainty Modelling.”
2021 IEEE Intelligent Vehicles Symposium (IV), 2021.
Methods
netcal.scaling.TemperatureScaling

__init__(*args, **kwargs)
Create an instance of TemperatureScaling.

clear()
Clear model parameters.

convex(data, y, tensorboard, log_dir)
Convex optimization to find the global optimum of current parameter search.

fit(X, y[, random_state, tensorboard, log_dir])
Build logistic calibration model either conventionally with a single MLE estimate or with Variational Inference (VI) or Markov-Chain Monte-Carlo (MCMC) sampling to also obtain uncertainty estimates.

fit_transform(X[, y])
Fit to data, then transform it.

get_params([deep])
Get parameters for this estimator.

guide([X, y])
Variational substitution definition for each parameter.

load_model(filename)
Load model from saved torch dump.

mask()
Seek all relevant weights whose values are negative.

mcmc(data, y, tensorboard, log_dir)
Perform Markov-Chain Monte-Carlo sampling on the (unknown) posterior.

model([X, y])
Definition of the log regression model.

momentum(data, y, tensorboard, log_dir)
Momentum optimization to find the global optimum of current parameter search.

prepare(X)
Preprocessing of input data, called at the beginning of the fit-function.

prior()
Prior definition of the weights used for log regression.

save_model(filename)
Save model instance with torch’s save function, as this is safer for torch tensors.

set_params(**params)
Set the parameters of this estimator.
netcal.scaling.TemperatureScaling

squeeze_generic(a, axes_to_keep)
Squeeze input array a but keep axes defined by parameter ‘axes_to_keep’ even if the dimension is of size 1.

to(device)
Set distribution parameters to the desired device in order to compute either on CPU or GPU.

transform(X[, num_samples, random_state, …])
After model calibration, this function is used to get calibrated outputs of uncalibrated confidence estimates.
Build logistic calibration model either conventionally with a single MLE estimate or with Variational Inference (VI) or Markov-Chain Monte-Carlo (MCMC) sampling to also obtain uncertainty estimates.

Variational substitution definition for each parameter. The signature is the same as for the “self.model” function, but the variables are not used.

Parameters

X (torch.Tensor, shape=(n_samples, n_log_regression_features)) – Input data that has been prepared by the “self.prepare” function call.

y (torch.Tensor, shape=(n_samples, [n_classes])) – Torch tensor with ground-truth labels, either as a label vector (1-D) or as a one-hot encoded ground-truth array (2-D, for multiclass MLE only).

Seek all relevant weights whose values are negative. Mask those values with optimization constraints in the interval [0, 0]. Constraints on the intercepts might also be set.

Returns

Indices of masked values and list of boundary constraints for optimization.

X (torch.Tensor, shape=(n_samples, n_log_regression_features)) – Input data that has been prepared by the “self.prepare” function call.

y (torch.Tensor, shape=(n_samples, [n_classes])) – Torch tensor with ground-truth labels, either as a label vector (1-D) or as a one-hot encoded ground-truth array (2-D, for multiclass MLE only).
Momentum optimization to find the global optimum of current parameter search. This method is slow but tends to find the global optimum for non-convex optimization.

Parameters

data_input (np.ndarray, shape=(n_samples, n_features)) – NumPy 2-D array with data input.

y (np.ndarray, shape=(n_samples,)) – NumPy array with ground-truth labels as a 1-D vector (binary).

Preprocessing of input data, called at the beginning of the fit-function.

Parameters

X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction: 1-D for binary classification, 2-D for multi-class (softmax). On detection, this array must have 2 dimensions with the number of additional box features in the last dim.

Prior definition of the weights used for log regression. This function has to set the variables ‘self.weight_prior_dist’, ‘self.weight_mean_init’ and ‘self.weight_stddev_init’.
transform(X: numpy.ndarray, num_samples: int = 1000, random_state: int = None, mean_estimate: bool = False) → numpy.ndarray

After model calibration, this function is used to get calibrated outputs of uncalibrated confidence estimates.

Parameters

X (np.ndarray, shape=(n_samples, [n_classes]) or (n_samples, [n_box_features])) – NumPy array with confidence values for each prediction: 1-D for binary classification, 2-D for multi-class (softmax). On detection, this array must have 2 dimensions with the number of additional box features in the last dim.

num_samples (int, optional, default: 1000) – Number of samples generated on MCMC sampling or Variational Inference.

random_state (int, optional, default: None) – Fix the random seed for the random number generator.

mean_estimate (bool, optional, default: False) – If True, directly return the mean on probabilistic methods like MCMC or VI instead of the full distribution. This parameter has no effect on MLE.

Returns

np.ndarray, shape=(n_samples, [n_classes]) on MLE, or on MCMC/VI if ‘mean_estimate’ is True; shape=(n_parameters, n_samples, [n_classes]) on VI/MCMC if ‘mean_estimate’ is False – On MLE without uncertainty, returns a NumPy array with calibrated confidence estimates: 1-D for binary classification, 2-D for multi-class (softmax). On VI or MCMC, returns a NumPy array whose leading dimension is the number of parameter sets sampled from the log-regression parameter distribution obtained by VI or MCMC.