Skip to content

Commit

Permalink
added filter and filter utils for Z TOT, unc are correlated with WPWM
Browse files Browse the repository at this point in the history
  • Loading branch information
comane committed Dec 8, 2024
1 parent 155fd8e commit a24b6e0
Show file tree
Hide file tree
Showing 6 changed files with 289 additions and 22 deletions.
96 changes: 96 additions & 0 deletions nnpdf_data/nnpdf_data/commondata/ATLAS_Z0_13TEV/filter.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,96 @@
"""
filter.py module for ATLAS_WPWM_13TEV dataset
When running `python filter.py` the relevant uncertainties , data and kinematics yaml
file will be created in the `nnpdf_data/commondata/ATLAS_WPWM_13TEV` directory.
"""

import yaml
from filter_utils import get_data_values, get_systematics
from nnpdf_data.filter_utils.utils import prettify_float

yaml.add_representer(float, prettify_float)

MZ2 = 91.1876**2


def filter_ATLAS_Z0_13TEV_TOT_data_kinetic():
"""
This function writes the central values and kinematics to yaml files.
"""

kin = [
{
'm_Z2': {'min': None, 'mid': MZ2, 'max': None},
'sqrts': {'min': None, 'mid': 13000.0, 'max': None},
}
]

# only keep the last entry corresponding to Z observable
central_values = [get_data_values()[-1]]

data_central_yaml = {"data_central": central_values}

kinematics_yaml = {"bins": kin}

# write central values and kinematics to yaml file
with open("data.yaml", "w") as file:
yaml.dump(data_central_yaml, file, sort_keys=False)

with open("kinematics.yaml", "w") as file:
yaml.dump(kinematics_yaml, file, sort_keys=False)


def filter_ATLAS_Z0_13TEV_TOT_systematics():
"""
This function writes the systematics to a yaml file.
"""

with open("metadata.yaml", "r") as file:
metadata = yaml.safe_load(file)

systematics = get_systematics()

# error definition
error_definitions = {}
errors = []

for sys in systematics:
if sys[0]['name'] == 'stat':
error_definitions[sys[0]['name']] = {
"description": f"{sys[0]['name']}",
"treatment": "ADD",
"type": "UNCORR",
}

elif sys[0]['name'] == 'ATLAS_LUMI':
error_definitions["ATLASLUMI13"] = {
"description": f"ATLASLUMI13",
"treatment": "ADD",
"type": "ATLASLUMI13",
}

else:
error_definitions[sys[0]['name']] = {
"description": f"{sys[0]['name']}",
"treatment": "ADD",
"type": f"{sys[0]['name']}",
}

for i in range(metadata['implemented_observables'][0]['ndata']):
error_value = {}

for sys in systematics:
error_value[sys[0]['name']] = float(sys[0]['values'][i])

errors.append(error_value)

uncertainties_yaml = {"definitions": error_definitions, "bins": errors}

# write uncertainties
with open(f"uncertainties.yaml", 'w') as file:
yaml.dump(uncertainties_yaml, file, sort_keys=False)


if __name__ == "__main__":
filter_ATLAS_Z0_13TEV_TOT_data_kinetic()
filter_ATLAS_Z0_13TEV_TOT_systematics()
115 changes: 115 additions & 0 deletions nnpdf_data/nnpdf_data/commondata/ATLAS_Z0_13TEV/filter_utils.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,115 @@
"""
This module contains helper functions that are used to extract the uncertainties, kinematics and data values
from the rawdata files.
"""

import yaml
import numpy as np
from nnpdf_data.filter_utils.utils import decompose_covmat


UNIT_CONVERSION = 1000000
TABLES = [9, 8, 11] # order is W-, W+, Z


def get_data_values():
"""
returns the central data values in the form of a list.
"""
name_data = lambda tab: f"rawdata/HEPData-ins1436497-v1-Table_{tab}.yaml"

data_central = []

for tab in TABLES:
with open(name_data(tab), 'r') as file:
input = yaml.safe_load(file)
values = input['dependent_variables'][0]['values']
data_central.append(values[0]['value'] * UNIT_CONVERSION)

return data_central


def get_uncertainties():
"""
Returns array of shape (3,3)
Each row corresponds to a different observable: (W-, W+, Z)
Each column corresponds to a different systematic: (stat, sys, lumi)
See table 3 of paper: https://arxiv.org/abs/1603.09222
"""

name_data = lambda tab: f"rawdata/HEPData-ins1436497-v1-Table_{tab}.yaml"

uncertainties = []

for tab in TABLES:
with open(name_data(tab), 'r') as file:
input = yaml.safe_load(file)
errors = input['dependent_variables'][0]['values'][0]['errors']
uncertainties.append(
np.array([errors[0]['symerror'], errors[1]['symerror'], errors[2]['symerror']])
)

return np.array(uncertainties) * UNIT_CONVERSION


def get_correlation_matrix():
"""
See extra material page: https://atlas.web.cern.ch/Atlas/GROUPS/PHYSICS/PAPERS/STDM-2015-03/tabaux_03.pdf
Note that this does not include the normalisation uncertainty due to the luminosity.
"""

correlation_matrix = np.ones((3, 3))
correlation_matrix[0, 1] = 0.93
correlation_matrix[1, 0] = correlation_matrix[0, 1]
correlation_matrix[0, 2] = 0.18
correlation_matrix[2, 0] = correlation_matrix[0, 2]
correlation_matrix[1, 2] = 0.19
correlation_matrix[2, 1] = correlation_matrix[1, 2]

return correlation_matrix


def get_covariance_matrices():
"""
For the systematics see Table 3 of paper: https://arxiv.org/abs/1603.09222
Returns:
--------
tuple: (cov_matrix_no_lumi, lumi_cov)
cov_matrix_no_lumi: np.array, the sum of stat and syst covmats -> to be decomposed into artificial systematics
lumi_cov: np.array, the lumi covmat. This is correlated between experiments so needs to be saved with type: SPECIAL
"""
corr_matrix = get_correlation_matrix()
uncertainties = get_uncertainties()

# build correlated systematics covariance
sys = np.array([uncertainties[i, 1] for i in range(3)])
cov_sys = corr_matrix * np.outer(sys, sys)

# array of lumi uncertainties
lumi_unc = np.array([uncertainties[i, 2] for i in range(3)])

# array of stat uncertainties
stat = np.array([uncertainties[i, 0] for i in range(3)])

return stat, cov_sys, lumi_unc


def get_systematics():
stat, cov_sys, lumi_unc = get_covariance_matrices()

# decompose sys covmat
syst_unc = decompose_covmat(cov_sys)

uncertainties = []

# store only systematics for W+ and W-
for i in range(3):
uncertainties.append([{"name": f"ATLAS_WZ_TOT_13TEV_{i}", "values": [syst_unc[2, i]]}])

uncertainties.append([{"name": "stat", "values": [stat[2]]}])
uncertainties.append([{"name": "ATLAS_LUMI", "values": [lumi_unc[2]]}])

return uncertainties
40 changes: 18 additions & 22 deletions nnpdf_data/nnpdf_data/commondata/ATLAS_Z0_13TEV/metadata.yaml
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
setname: ATLAS_Z0_13TEV
version: 1
version_comment: Port of old commondata
version_comment: New implementation, as for the old one, data is taken from Table 3 of the paper
nnpdf_metadata:
nnpdf31_process: DY NC
experiment: ATLAS
Expand All @@ -19,11 +19,11 @@ implemented_observables:
label: ATLAS $Z$ inclusive 13 TeV
units: ''
process_type: INC
tables: []
npoints: []
tables: [9, 8, 11]
npoints: [1]
ndata: 1
plotting:
kinematics_override: inc_sqrt_scale
kinematics_override: identity
dataset_label: ATLAS $Z$ inclusive 13 TeV
y_label: $\sigma^{fid}$ (fb)
figure_by:
Expand All @@ -35,33 +35,29 @@ implemented_observables:
- Z
plot_x: ' '
kinematic_coverage:
- k1
- k2
- k3
- m_Z2
- sqrts
kinematics:
variables:
k1:
description: Variable k1
label: k1
units: ''
k2:
description: Variable k2
label: k2
units: ''
k3:
description: Variable k3
label: k3
units: ''
file: kinematics_TOT.yaml
m_Z2:
description: Z boson mass squared
label: '$m_{Z}^2$'
units: '$GeV^2$'
sqrts:
description: center of mass energy
label: '$\sqrt{s}$'
units: 'GeV'
file: kinematics.yaml
theory:
conversion_factor: 1.0
operation: 'null'
FK_tables:
- - ATLAS_WZ_TOT_13TEV-ATLASWZTOT13TEV81PB_Z_tot
data_uncertainties: []
data_uncertainties:
- uncertainties.yaml
variants:
legacy:
data_uncertainties:
- uncertainties_legacy_TOT.yaml
data_central: data_legacy_TOT.yaml
data_central: data.yaml
ported_from: ATLAS_Z_TOT_13TEV
Original file line number Diff line number Diff line change
@@ -0,0 +1,20 @@
dependent_variables:
- header: {name: SIG, units: NB}
qualifiers:
- {name: ABS(ETARAP(C=ELECTRON)), value: < 2.5}
- {name: ABS(ETARAP(C=MUON)), value: < 2.5}
- {name: MZ, units: GEV, value: 66-116}
- {name: PT(C=ELECTRON), units: GEV, value: '> 25'}
- {name: PT(C=MUON), units: GEV, value: '> 25'}
- {name: RE, value: P P --> ( Z0 < E+ E- + MU+ MU- > + GAMMA* < E+ E- + MU+ MU-
> ) X}
values:
- errors:
- {label: stat, symerror: 0.003}
- {label: sys, symerror: 0.006}
- {label: sys, symerror: 0.016}
value: 0.779
independent_variables:
- header: {name: SQRT(S), units: GEV}
values:
- {value: 13000.0}
Original file line number Diff line number Diff line change
@@ -0,0 +1,20 @@
dependent_variables:
- header: {name: SIG, units: NB}
qualifiers:
- {name: ABS(ETARAP(C=ELECTRON)), value: < 2.5}
- {name: ABS(ETARAP(C=MUON)), value: < 2.5}
- {name: MT, units: GEV, value: '> 50'}
- {name: PT(C=ELECTRON), units: GEV, value: '> 25'}
- {name: PT(C=MUON), units: GEV, value: '> 25'}
- {name: PT(C=NU), units: GEV, value: '> 25'}
- {name: RE, value: P P --> W+ < E+ NUE + MU+ NUMU > X}
values:
- errors:
- {label: stat, symerror: 0.01}
- {label: sys, symerror: 0.09}
- {label: sys, symerror: 0.1}
value: 4.53
independent_variables:
- header: {name: SQRT(S), units: GEV}
values:
- {value: 13000.0}
Original file line number Diff line number Diff line change
@@ -0,0 +1,20 @@
dependent_variables:
- header: {name: SIG, units: NB}
qualifiers:
- {name: 'ABS(ETARAP(C=ELECTRON)}', value: < 2.5}
- {name: ABS(ETARAP(C=MUON)), value: < 2.5}
- {name: MT, units: GEV, value: '> 50'}
- {name: PT(C=ELECTRON), units: GEV, value: '> 25'}
- {name: PT(C=MUON), units: GEV, value: '> 25'}
- {name: PT(C=NU), units: GEV, value: '> 25'}
- {name: RE, value: P P --> W- < E- NUEBAR + MU- NUMUBAR > X}
values:
- errors:
- {label: stat, symerror: 0.01}
- {label: sys, symerror: 0.07}
- {label: sys, symerror: 0.07}
value: 3.5
independent_variables:
- header: {name: SQRT(S), units: GEV}
values:
- {value: 13000.0}

0 comments on commit a24b6e0

Please sign in to comment.