Skip to content

Instantly share code, notes, and snippets.

@andrzejnovak
Created October 13, 2020 09:25
Show Gist options
  • Save andrzejnovak/72269a260323a18ffcac740cfe7778c8 to your computer and use it in GitHub Desktop.
Save andrzejnovak/72269a260323a18ffcac740cfe7778c8 to your computer and use it in GitHub Desktop.
Display the source blob
Display the rendered blob
Raw
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"metadata": {
"ExecuteTime": {
"end_time": "2020-10-12T13:23:07.128698Z",
"start_time": "2020-10-12T13:23:06.871336Z"
}
},
"outputs": [],
"source": [
"import uproot4 as uproot"
]
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {
"ExecuteTime": {
"end_time": "2020-10-12T13:23:38.673412Z",
"start_time": "2020-10-12T13:23:38.670438Z"
}
},
"outputs": [],
"source": [
"# Global CMS XRootD endpoint and the path of a single PFNano sample file.\n",
"# NOTE(review): xrd ends with '/' and fname starts with '//', so the joined URL\n",
"# has three slashes after the host -- confirm this is intended.\n",
"xrd = 'root://cms-xrd-global.cern.ch/'\n",
"fname = '//store/user/anovak/PFNano/106X_v1/QCD_Pt-300to470_MuEnrichedPt5_TuneCP5_13TeV_pythia8/RunIISummer19UL17PFNanoAOD-106X_mc2017_realistic_v6-v2/200730_105451/0000/nano106X_on_mini106X_2017_mc_NANO_1.root'"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {
"ExecuteTime": {
"end_time": "2020-10-12T13:23:51.872190Z",
"start_time": "2020-10-12T13:23:50.950522Z"
}
},
"outputs": [],
"source": [
"# Open the file at the full URL (endpoint prefix + file path).\n",
"f = uproot.open(xrd + fname)"
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {
"ExecuteTime": {
"end_time": "2020-10-12T13:23:54.518624Z",
"start_time": "2020-10-12T13:23:54.510247Z"
}
},
"outputs": [
{
"data": {
"text/plain": [
"['tag;1',\n",
" 'Events;1',\n",
" 'LuminosityBlocks;1',\n",
" 'Runs;1',\n",
" 'MetaData;1',\n",
" 'ParameterSets;1']"
]
},
"execution_count": 4,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Show the keys available in the opened file.\n",
"f.keys()"
]
},
{
"cell_type": "code",
"execution_count": 10,
"metadata": {
"ExecuteTime": {
"end_time": "2020-10-12T13:24:48.203457Z",
"start_time": "2020-10-12T13:24:48.189621Z"
}
},
"outputs": [
{
"data": {
"text/plain": [
"['JetPFCands_d0',\n",
" 'JetPFCands_d0Err',\n",
" 'JetPFCands_dz',\n",
" 'JetPFCands_dzErr',\n",
" 'JetPFCands_eta',\n",
" 'JetPFCands_mass',\n",
" 'JetPFCands_phi',\n",
" 'JetPFCands_pt',\n",
" 'JetPFCands_puppiWeight',\n",
" 'JetPFCands_puppiWeightNoLep',\n",
" 'JetPFCands_trkChi2',\n",
" 'JetPFCands_vtxChi2',\n",
" 'JetPFCands_charge',\n",
" 'JetPFCands_lostInnerHits',\n",
" 'JetPFCands_pdgId',\n",
" 'JetPFCands_pvAssocQuality',\n",
" 'JetPFCands_trkQuality']"
]
},
"execution_count": 10,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Keep only the 'Events' keys that carry the JetPFCands_ prefix.\n",
"feature_names = [\n",
"    name for name in f['Events'].keys()\n",
"    if name.startswith('JetPFCands_')\n",
"]\n",
"feature_names"
]
},
{
"cell_type": "code",
"execution_count": 18,
"metadata": {
"ExecuteTime": {
"end_time": "2020-10-12T13:30:16.390580Z",
"start_time": "2020-10-12T13:30:16.230964Z"
}
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
" JetPFCands_d0 JetPFCands_d0Err JetPFCands_dz \\\n",
"entry subentry \n",
"0 0 0.007652 0.016571 -0.055542 \n",
" 1 0.018799 0.009842 -0.000535 \n",
" 2 0.050323 0.021469 -0.046265 \n",
" 3 -0.005287 0.009094 0.010147 \n",
" 4 0.011551 0.034607 -3.470703 \n",
"... ... ... ... \n",
"9 235 -1.000000 -1.000000 -1.000000 \n",
" 236 -1.000000 -1.000000 -1.000000 \n",
" 237 -1.000000 -1.000000 -1.000000 \n",
" 238 -1.000000 -1.000000 -1.000000 \n",
" 239 -1.000000 -1.000000 -1.000000 \n",
"\n",
" JetPFCands_dzErr JetPFCands_eta JetPFCands_mass \\\n",
"entry subentry \n",
"0 0 0.013168 1.756348 1.395264e-01 \n",
" 1 0.011269 0.630249 1.395264e-01 \n",
" 2 0.019623 -0.810791 1.395264e-01 \n",
" 3 0.008598 -1.575684 1.395264e-01 \n",
" 4 0.022461 2.704590 1.282959e-01 \n",
"... ... ... ... \n",
"9 235 -1.000000 -1.780518 0.000000e+00 \n",
" 236 -1.000000 -1.868896 0.000000e+00 \n",
" 237 -1.000000 -1.876465 0.000000e+00 \n",
" 238 -1.000000 -1.938477 0.000000e+00 \n",
" 239 -1.000000 -2.285645 1.192093e-07 \n",
"\n",
" JetPFCands_phi JetPFCands_pt JetPFCands_puppiWeight \\\n",
"entry subentry \n",
"0 0 -0.977417 0.710938 1.000000 \n",
" 1 2.015137 0.521484 1.000000 \n",
" 2 -1.237305 0.654785 1.000000 \n",
" 3 -2.247559 0.865234 1.000000 \n",
" 4 0.629150 0.721680 0.000000 \n",
"... ... ... ... \n",
"9 235 -2.030273 1.375000 0.996094 \n",
" 236 0.288696 0.353516 0.000000 \n",
" 237 -0.261353 0.438232 0.000000 \n",
" 238 3.061523 0.152466 0.000000 \n",
" 239 -3.040039 1.911133 0.996094 \n",
"\n",
" JetPFCands_puppiWeightNoLep JetPFCands_trkChi2 \\\n",
"entry subentry \n",
"0 0 1.000000 0.0 \n",
" 1 1.000000 0.0 \n",
" 2 1.000000 0.0 \n",
" 3 1.000000 0.0 \n",
" 4 0.000000 0.0 \n",
"... ... ... \n",
"9 235 0.996094 -1.0 \n",
" 236 0.000000 -1.0 \n",
" 237 0.000000 -1.0 \n",
" 238 0.000000 -1.0 \n",
" 239 0.996094 -1.0 \n",
"\n",
" JetPFCands_vtxChi2 JetPFCands_charge \\\n",
"entry subentry \n",
"0 0 0.0 1 \n",
" 1 0.0 1 \n",
" 2 0.0 1 \n",
" 3 0.0 1 \n",
" 4 0.0 1 \n",
"... ... ... \n",
"9 235 -1.0 0 \n",
" 236 -1.0 0 \n",
" 237 -1.0 0 \n",
" 238 -1.0 0 \n",
" 239 -1.0 0 \n",
"\n",
" JetPFCands_lostInnerHits JetPFCands_pdgId \\\n",
"entry subentry \n",
"0 0 -1 211 \n",
" 1 -1 211 \n",
" 2 0 211 \n",
" 3 -1 211 \n",
" 4 -1 211 \n",
"... ... ... \n",
"9 235 -1 22 \n",
" 236 -1 22 \n",
" 237 -1 22 \n",
" 238 -1 22 \n",
" 239 -1 22 \n",
"\n",
" JetPFCands_pvAssocQuality JetPFCands_trkQuality \n",
"entry subentry \n",
"0 0 7 5 \n",
" 1 7 5 \n",
" 2 6 5 \n",
" 3 7 5 \n",
" 4 1 5 \n",
"... ... ... \n",
"9 235 7 0 \n",
" 236 7 0 \n",
" 237 7 0 \n",
" 238 7 0 \n",
" 239 7 0 \n",
"\n",
"[1877 rows x 17 columns]\n"
]
}
],
"source": [
"# Request the selected columns as pandas DataFrames, 10 entries per step.\n",
"for data in f['Events'].iterate(feature_names, step_size=10, library='pd'):\n",
"    # operate on a batch of data in the loop\n",
"    print(data)\n",
"    break  # stop after the first batch"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python (def)",
"language": "python",
"name": "def"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.7.3"
}
},
"nbformat": 4,
"nbformat_minor": 4
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment