Skip to content

Commit 8238497

Browse files
Integrating bayesian layer into n3fit
1 parent a470562 commit 8238497

39 files changed

+1634
-62
lines changed

n3fit/runcards/examples/Basic_runcard_qed.yml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -27,11 +27,11 @@ trvlseed: 1551864071
2727
nnseed: 676150632
2828
mcseed: 619859729
2929
save: false
30-
genrep: true # true = generate MC replicas, false = use real data
30+
genrep: false # true = generate MC replicas, false = use real data
3131

3232
parameters: # This defines the parameter dictionary that is passed to the Model Trainer
33-
nodes_per_layer: [25, 20, 8]
34-
activation_per_layer: [tanh, tanh, linear]
33+
nodes_per_layer: [15, 10, 8]
34+
activation_per_layer: ['gelu', 'gelu', 'gelu']
3535
initializer: glorot_normal
3636
optimizer:
3737
clipnorm: 6.073e-6
@@ -45,7 +45,7 @@ parameters: # This defines the parameter dictionary that is passed to the Model
4545
initial: 10
4646
multiplier:
4747
stopping_patience: 0.1
48-
layer_type: dense
48+
layer_type: ["dense", "dense", "VBDense"]
4949
dropout: 0.0
5050
threshold_chi2: 3.5
5151

Lines changed: 96 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,96 @@
1+
#
2+
# Configuration file for n3fit
3+
#
4+
############################################################
5+
description: Basic runcard with extra options such as debugging and tensorboard
6+
7+
############################################################
8+
# frac: training fraction
9+
# ewk: apply ewk k-factors
10+
# sys: systematics treatment (see systypes)
11+
dataset_inputs:
12+
- {dataset: NMC_NC_NOTFIXED_EM-F2, variant: legacy_dw}
13+
#- {dataset: SLAC_NC_NOTFIXED_D_EM-F2, variant: legacy_dw}
14+
#- {dataset: ATLAS_Z0J_8TEV_PT-M }
15+
16+
diagonal_frac: 0.75
17+
18+
############################################################
19+
datacuts:
20+
t0pdfset : NNPDF40_nnlo_as_01180 # PDF set to generate t0 covmat
21+
q2min : 3.49 # Q2 minimum
22+
w2min : 12.5 # W2 minimum
23+
24+
############################################################
25+
theory:
26+
theoryid: 41_000_000 # database id
27+
28+
parameters: # This defines the parameter dictionary that is passed to the Model Trainer
29+
nodes_per_layer: [15, 10, 8]
30+
activation_per_layer: ['gelu', 'gelu', 'gelu']
31+
initializer: 'glorot_normal'
32+
optimizer:
33+
optimizer_name: 'RMSprop'
34+
learning_rate: 0.01
35+
clipnorm: 1.0
36+
epochs: 900
37+
positivity:
38+
multiplier: 1.05 # When any of the multiplier and/or the initial is not set
39+
initial: # the maxlambda will be used instead to compute these values per dataset
40+
threshold: 1e-5
41+
stopping_patience: 0.30 # percentage of the number of epochs
42+
layer_type: ['dense','dense','VBDense']
43+
dropout: 0.0
44+
threshold_chi2: 5.0
45+
46+
############################################################
47+
trvlseed: 1
48+
nnseed: 2
49+
mcseed: 3
50+
genrep: True # true = generate MC replicas, false = use real data
51+
52+
fitting:
53+
# NN23(QED) = sng=0,g=1,v=2,t3=3,ds=4,sp=5,sm=6,(pht=7)
54+
# EVOL(QED) = sng=0,g=1,v=2,v3=3,v8=4,t3=5,t8=6,(pht=7)
55+
# EVOLS(QED)= sng=0,g=1,v=2,v8=4,t3=4,t8=5,ds=6,(pht=7)
56+
# FLVR(QED) = g=0, u=1, ubar=2, d=3, dbar=4, s=5, sbar=6, (pht=7)
57+
fitbasis: NN31IC # EVOL (7), EVOLQED (8), etc.
58+
basis:
59+
# remeber to change the name of PDF accordingly with fitbasis
60+
- { fl: sng, smallx: [1.05,1.19], largex: [1.47,2.70], trainable: False }
61+
- { fl: g, smallx: [0.94,1.25], largex: [0.11,5.87], trainable: False }
62+
- { fl: v, smallx: [0.54,0.75], largex: [1.15,2.76], trainable: False }
63+
- { fl: v3, smallx: [0.21,0.57], largex: [1.35,3.08] }
64+
- { fl: v8, smallx: [0.52,0.76], largex: [0.77,3.56], trainable: True }
65+
- { fl: t3, smallx: [-0.37,1.52], largex: [1.74,3.39] }
66+
- { fl: t8, smallx: [0.56,1.29], largex: [1.45,3.03] }
67+
- { fl: cp, smallx: [0.12,1.19], largex: [1.83,6.70] }
68+
69+
############################################################
70+
positivity:
71+
posdatasets:
72+
#- {dataset: NNPDF_POS_2P24GEV_F2U, maxlambda: 1e6} # Positivity Lagrange Multiplier
73+
#- {dataset: NNPDF_POS_2P24GEV_FLL, maxlambda: 1e6}
74+
#- {dataset: NNPDF_POS_2P24GEV_XGL, maxlambda: 1e6}
75+
76+
############################################################
77+
integrability:
78+
integdatasets:
79+
- {dataset: NNPDF_INTEG_3GEV_XT3, maxlambda: 1e2}
80+
81+
# Apply a cut to a dataset or process type, in this case to the positivity dataset `NNPDF_POS_2P24GEV_XGL` which has process type: POS_XPDF
82+
added_filter_rules:
83+
- process_type: POS_XPDF
84+
rule: "x > 0.1"
85+
86+
############################################################
87+
debug: True
88+
maxcores: 8
89+
parallel_models: false
90+
91+
tensorboard:
92+
weight_freq: 100
93+
profiling: False
94+
95+
save: 'weights.h5'
96+
# load: '/path/to/weights.h5/file'
Lines changed: 96 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,96 @@
1+
#
2+
# Configuration file for n3fit
3+
#
4+
############################################################
5+
description: Basic runcard with extra options such as debugging and tensorboard
6+
7+
############################################################
8+
# frac: training fraction
9+
# ewk: apply ewk k-factors
10+
# sys: systematics treatment (see systypes)
11+
dataset_inputs:
12+
- {dataset: NMC_NC_NOTFIXED_EM-F2, variant: legacy_dw}
13+
#- {dataset: SLAC_NC_NOTFIXED_D_EM-F2, variant: legacy_dw}
14+
#- {dataset: ATLAS_Z0J_8TEV_PT-M }
15+
16+
diagonal_frac: 0.75
17+
18+
############################################################
19+
datacuts:
20+
t0pdfset : NNPDF40_nnlo_as_01180 # PDF set to generate t0 covmat
21+
q2min : 3.49 # Q2 minimum
22+
w2min : 12.5 # W2 minimum
23+
24+
############################################################
25+
theory:
26+
theoryid: 41_000_000 # database id
27+
28+
parameters: # This defines the parameter dictionary that is passed to the Model Trainer
29+
nodes_per_layer: [15, 10, 8]
30+
activation_per_layer: ['gelu', 'gelu', 'gelu']
31+
initializer: 'glorot_normal'
32+
optimizer:
33+
optimizer_name: 'RMSprop'
34+
learning_rate: 0.01
35+
clipnorm: 1.0
36+
epochs: 900
37+
positivity:
38+
multiplier: 1.05 # When any of the multiplier and/or the initial is not set
39+
initial: # the maxlambda will be used instead to compute these values per dataset
40+
threshold: 1e-5
41+
stopping_patience: 0.30 # percentage of the number of epochs
42+
layer_type: ['dense','dense','dense']
43+
dropout: 0.0
44+
threshold_chi2: 5.0
45+
46+
############################################################
47+
trvlseed: 1
48+
nnseed: 2
49+
mcseed: 3
50+
genrep: True # true = generate MC replicas, false = use real data
51+
52+
fitting:
53+
# NN23(QED) = sng=0,g=1,v=2,t3=3,ds=4,sp=5,sm=6,(pht=7)
54+
# EVOL(QED) = sng=0,g=1,v=2,v3=3,v8=4,t3=5,t8=6,(pht=7)
55+
# EVOLS(QED)= sng=0,g=1,v=2,v8=4,t3=4,t8=5,ds=6,(pht=7)
56+
# FLVR(QED) = g=0, u=1, ubar=2, d=3, dbar=4, s=5, sbar=6, (pht=7)
57+
fitbasis: NN31IC # EVOL (7), EVOLQED (8), etc.
58+
basis:
59+
# remeber to change the name of PDF accordingly with fitbasis
60+
- { fl: sng, smallx: [1.05,1.19], largex: [1.47,2.70], trainable: False }
61+
- { fl: g, smallx: [0.94,1.25], largex: [0.11,5.87], trainable: False }
62+
- { fl: v, smallx: [0.54,0.75], largex: [1.15,2.76], trainable: False }
63+
- { fl: v3, smallx: [0.21,0.57], largex: [1.35,3.08] }
64+
- { fl: v8, smallx: [0.52,0.76], largex: [0.77,3.56], trainable: True }
65+
- { fl: t3, smallx: [-0.37,1.52], largex: [1.74,3.39] }
66+
- { fl: t8, smallx: [0.56,1.29], largex: [1.45,3.03] }
67+
- { fl: cp, smallx: [0.12,1.19], largex: [1.83,6.70] }
68+
69+
############################################################
70+
positivity:
71+
posdatasets:
72+
#- {dataset: NNPDF_POS_2P24GEV_F2U, maxlambda: 1e6} # Positivity Lagrange Multiplier
73+
#- {dataset: NNPDF_POS_2P24GEV_FLL, maxlambda: 1e6}
74+
#- {dataset: NNPDF_POS_2P24GEV_XGL, maxlambda: 1e6}
75+
76+
############################################################
77+
integrability:
78+
integdatasets:
79+
- {dataset: NNPDF_INTEG_3GEV_XT3, maxlambda: 1e2}
80+
81+
# Apply a cut to a dataset or process type, in this case to the positivity dataset `NNPDF_POS_2P24GEV_XGL` which has process type: POS_XPDF
82+
added_filter_rules:
83+
- process_type: POS_XPDF
84+
rule: "x > 0.1"
85+
86+
############################################################
87+
debug: True
88+
maxcores: 8
89+
parallel_models: false
90+
91+
tensorboard:
92+
weight_freq: 100
93+
profiling: False
94+
95+
save: 'weights.h5'
96+
# load: '/path/to/weights.h5/file'

n3fit/src/n3fit/backends/keras_backend/base_layers.py

Lines changed: 106 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -16,15 +16,21 @@
1616
1717
The names of the layer and the activation function are the ones to be used in the n3fit runcard.
1818
"""
19+
import numpy as np
20+
import keras.backend as K
21+
import tensorflow as tf
22+
import math
23+
from scipy.stats import norm
1924

2025
from keras.layers import Dense as KerasDense
21-
from keras.layers import Dropout, Lambda
26+
from keras.layers import Dropout, Lambda, Layer
2227
from keras.layers import Input # pylint: disable=unused-import
2328
from keras.layers import LSTM, Concatenate
2429
from keras.regularizers import l1_l2
2530

2631
from . import operations as ops
2732
from .MetaLayer import MetaLayer
33+
from contextlib import contextmanager
2834

2935

3036
# Custom activation functions
@@ -74,14 +80,101 @@ def ReshapedLSTM(input_tensor):
7480

7581
return ReshapedLSTM
7682

83+
class VBDense(Layer):
    """Variational Bayesian dense layer.

    Keeps a factorized Gaussian posterior over the kernel: a per-weight mean
    ``mu_w`` and log-variance ``logsig2_w``, plus a deterministic bias.
    In training mode the forward pass uses the local reparameterization
    trick: it propagates the mean and variance of the pre-activation and adds
    Gaussian noise scaled by the resulting standard deviation.  In inference
    mode it returns the deterministic mean output (posterior mean / MAP).

    Parameters
    ----------
    out_features: int
        number of output units
    in_features: int
        number of input features
    prior_prec: float
        precision of the Gaussian prior over the weights, used by ``kl_loss``
    map: bool
        MAP-estimation flag (kept for interface compatibility; ``call`` only
        branches on the training flag)
    std_init: float
        initial value for every entry of ``logsig2_w``
    lbound, ubound: float
        clipping bounds applied to ``logsig2_w`` before exponentiation
    training: bool
        default mode used when ``call`` does not receive a ``training`` flag
    """

    def __init__(self, out_features: int, in_features: int, prior_prec: float = 0.01,
                 map: bool = False, std_init: float = -9, lbound=-30, ubound=11, training=True):
        super().__init__()
        self.output_dim = out_features
        self.input_dim = in_features
        self.map = map
        self.prior_prec = tf.cast(prior_prec, tf.float64)
        self.random = None
        # Numerical floor added to the output variance before the sqrt
        self.eps = 1e-12 if K.floatx() == 'float64' else 1e-8
        # Keep as a plain float: it is only used to fill logsig2_w at reset time
        self.std_init = float(std_init)
        self.lbound = lbound
        self.ubound = ubound
        # The runcard defaults may pass this flag as a string (e.g. "False"),
        # which is truthy and would silently keep the layer stochastic;
        # coerce it to a real boolean.
        if isinstance(training, str):
            training = training.strip().lower() not in ("false", "0", "no", "")
        self.training = bool(training)

    def build(self, input_shape):
        """Create the variational parameters (all in double precision)."""
        # Deterministic bias (no posterior over the bias)
        self.bias = self.add_weight(
            name='bias',
            shape=(self.output_dim,),
            initializer='glorot_normal',
            trainable=True,
            dtype=tf.float64,
        )

        # Posterior mean of the kernel; stored transposed (out, in), hence the
        # transpose_b=True in call()
        self.mu_w = self.add_weight(
            name='mu_w',
            shape=(self.output_dim, self.input_dim),
            initializer='glorot_normal',
            trainable=True,
            dtype=tf.float64,
        )

        # Posterior log-variance of the kernel
        self.logsig2_w = self.add_weight(
            name='logsig2_w',
            shape=(self.output_dim, self.input_dim),
            initializer='glorot_normal',
            trainable=True,
            dtype=tf.float64,
        )

        # Overwrite the generic initializers with the layer's own scheme
        self.reset_parameters()

    def reset_parameters(self):
        """Reinitialize bias to zero, mu_w ~ N(0, 1/sqrt(in)), logsig2_w to std_init."""
        stdv = 1.0 / tf.math.sqrt(tf.cast(self.input_dim, dtype=tf.float64))
        self.bias.assign(tf.zeros_like(self.bias))
        self.mu_w.assign(tf.random.normal(tf.shape(self.mu_w), mean=0, stddev=stdv, dtype=tf.float64))
        # Constant fill: every weight starts with the same (small) variance
        initial_logsig2 = tf.constant(self.std_init, dtype=tf.float64)
        self.logsig2_w.assign(tf.fill(tf.shape(self.logsig2_w), initial_logsig2))

    def reset_random(self):
        """Clear the cached noise and leave MAP mode."""
        # NOTE(review): this also flips self.map off permanently — confirm intended
        self.random = None
        self.map = False

    def kl_loss(self) -> tf.Tensor:
        """Return the KL divergence between the factorized Gaussian posterior
        N(mu_w, exp(logsig2_w)) and the zero-mean Gaussian prior with
        precision ``prior_prec``, summed over all kernel weights."""
        logsig2_w = tf.clip_by_value(self.logsig2_w, self.lbound, self.ubound)
        kl = 0.5 * tf.reduce_sum((self.prior_prec*(tf.math.pow(self.mu_w,2)+tf.math.exp(logsig2_w))
                - logsig2_w - tf.constant(1.0, dtype=tf.float64) - tf.math.log(self.prior_prec)))
        return kl

    def call(self, input: tf.Tensor, training=None) -> tf.Tensor:
        """Forward pass: stochastic in training mode, deterministic otherwise.

        ``training`` follows the Keras convention (passed by the framework);
        when it is None the layer falls back to the flag given at construction.
        """
        # The whole layer works in double precision
        input = tf.cast(input, tf.float64)
        if training is None:
            training = self.training

        # Mean of the pre-activation — also the deterministic inference output
        mu_out = tf.matmul(input, tf.cast(self.mu_w, input.dtype), transpose_b=True) + tf.cast(self.bias, input.dtype)
        if not training:
            return mu_out

        # Local reparameterization: sample the pre-activation directly,
        # var(out) = (input^2) @ sigma^2_w + eps
        logsig2_w = tf.clip_by_value(self.logsig2_w, self.lbound, self.ubound)
        s2_w = tf.math.exp(logsig2_w)
        input2 = tf.math.pow(input, 2)
        var_out = tf.matmul(input2, s2_w, transpose_b=True) + tf.cast(self.eps, input.dtype)

        return mu_out + tf.math.sqrt(var_out) * tf.random.normal(shape=tf.shape(mu_out), dtype=input.dtype)
77162

78163
class Dense(KerasDense, MetaLayer):
    """Thin wrapper around Keras' Dense.

    Resolves the merge conflict that was left in this block: keeps BOTH the
    upstream int-cast of ``units`` and the stashed float64 default dtype.
    """

    def __init__(self, *args, **kwargs):
        # In Keras == 3.13, np.int() is not accepted by Dense
        if "units" in kwargs:
            kwargs["units"] = int(kwargs["units"])
        # Default to double precision so this layer matches VBDense,
        # which works entirely in tf.float64
        if "dtype" not in kwargs:
            kwargs["dtype"] = tf.float64
        super().__init__(*args, **kwargs)
85178

86179

87180
def dense_per_flavour(basis_size=8, kernel_initializer="glorot_normal", **dense_kwargs):
@@ -133,7 +226,6 @@ def apply_dense(xinput):
133226

134227
return apply_dense
135228

136-
137229
layers = {
138230
"dense": (
139231
Dense,
@@ -142,6 +234,7 @@ def apply_dense(xinput):
142234
"units": 5,
143235
"activation": "sigmoid",
144236
"kernel_regularizer": None,
237+
"dtype": tf.float64,
145238
},
146239
),
147240
"dense_per_flavour": (
@@ -151,12 +244,21 @@ def apply_dense(xinput):
151244
"units": 5,
152245
"activation": "sigmoid",
153246
"basis_size": 8,
247+
"dtype": tf.float64,
154248
},
155249
),
156250
"LSTM": (
157251
LSTM_modified,
158252
{"kernel_initializer": "glorot_normal", "units": 5, "activation": "sigmoid"},
159253
),
254+
"VBDense": (
255+
VBDense,
256+
{
257+
"in_features" : 10,
258+
"out_features" : 8,
259+
"training": "False",
260+
},
261+
),
160262
"dropout": (Dropout, {"rate": 0.0}),
161263
"concatenate": (Concatenate, {}),
162264
}
@@ -173,7 +275,7 @@ def base_layer_selector(layer_name, **kwargs):
173275
174276
Parameters
175277
----------
176-
`layer_name
278+
`layer_name`
177279
str with the name of the layer
178280
`**kwargs`
179281
extra optional arguments to pass to the layer (beyond their defaults)
@@ -232,4 +334,4 @@ def regularizer_selector(reg_name, **kwargs):
232334
if key in reg_args.keys():
233335
reg_args[key] = value
234336

235-
return reg_class(**reg_args)
337+
return reg_class(**reg_args)

0 commit comments

Comments
 (0)