Created
October 13, 2020 09:25
-
-
Save andrzejnovak/72269a260323a18ffcac740cfe7778c8 to your computer and use it in GitHub Desktop.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
{ | |
"cells": [ | |
{ | |
"cell_type": "code", | |
"execution_count": 1, | |
"metadata": { | |
"ExecuteTime": { | |
"end_time": "2020-10-12T13:23:07.128698Z", | |
"start_time": "2020-10-12T13:23:06.871336Z" | |
} | |
}, | |
"outputs": [], | |
"source": [ | |
"import uproot4 as uproot" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 2, | |
"metadata": { | |
"ExecuteTime": { | |
"end_time": "2020-10-12T13:23:38.673412Z", | |
"start_time": "2020-10-12T13:23:38.670438Z" | |
} | |
}, | |
"outputs": [], | |
"source": [ | |
"xrd = 'root://cms-xrd-global.cern.ch/'\n", | |
"fname = '//store/user/anovak/PFNano/106X_v1/QCD_Pt-300to470_MuEnrichedPt5_TuneCP5_13TeV_pythia8/RunIISummer19UL17PFNanoAOD-106X_mc2017_realistic_v6-v2/200730_105451/0000/nano106X_on_mini106X_2017_mc_NANO_1.root'" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 3, | |
"metadata": { | |
"ExecuteTime": { | |
"end_time": "2020-10-12T13:23:51.872190Z", | |
"start_time": "2020-10-12T13:23:50.950522Z" | |
} | |
}, | |
"outputs": [], | |
"source": [ | |
"f= uproot.open(xrd+fname)" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 4, | |
"metadata": { | |
"ExecuteTime": { | |
"end_time": "2020-10-12T13:23:54.518624Z", | |
"start_time": "2020-10-12T13:23:54.510247Z" | |
} | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/plain": [ | |
"['tag;1',\n", | |
" 'Events;1',\n", | |
" 'LuminosityBlocks;1',\n", | |
" 'Runs;1',\n", | |
" 'MetaData;1',\n", | |
" 'ParameterSets;1']" | |
] | |
}, | |
"execution_count": 4, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"f.keys()" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 10, | |
"metadata": { | |
"ExecuteTime": { | |
"end_time": "2020-10-12T13:24:48.203457Z", | |
"start_time": "2020-10-12T13:24:48.189621Z" | |
} | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/plain": [ | |
"['JetPFCands_d0',\n", | |
" 'JetPFCands_d0Err',\n", | |
" 'JetPFCands_dz',\n", | |
" 'JetPFCands_dzErr',\n", | |
" 'JetPFCands_eta',\n", | |
" 'JetPFCands_mass',\n", | |
" 'JetPFCands_phi',\n", | |
" 'JetPFCands_pt',\n", | |
" 'JetPFCands_puppiWeight',\n", | |
" 'JetPFCands_puppiWeightNoLep',\n", | |
" 'JetPFCands_trkChi2',\n", | |
" 'JetPFCands_vtxChi2',\n", | |
" 'JetPFCands_charge',\n", | |
" 'JetPFCands_lostInnerHits',\n", | |
" 'JetPFCands_pdgId',\n", | |
" 'JetPFCands_pvAssocQuality',\n", | |
" 'JetPFCands_trkQuality']" | |
] | |
}, | |
"execution_count": 10, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"feature_names = [k for k in f['Events'].keys() if k.startswith('JetPFCands_')]\n", | |
"feature_names" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 18, | |
"metadata": { | |
"ExecuteTime": { | |
"end_time": "2020-10-12T13:30:16.390580Z", | |
"start_time": "2020-10-12T13:30:16.230964Z" | |
} | |
}, | |
"outputs": [ | |
{ | |
"name": "stdout", | |
"output_type": "stream", | |
"text": [ | |
" JetPFCands_d0 JetPFCands_d0Err JetPFCands_dz \\\n", | |
"entry subentry \n", | |
"0 0 0.007652 0.016571 -0.055542 \n", | |
" 1 0.018799 0.009842 -0.000535 \n", | |
" 2 0.050323 0.021469 -0.046265 \n", | |
" 3 -0.005287 0.009094 0.010147 \n", | |
" 4 0.011551 0.034607 -3.470703 \n", | |
"... ... ... ... \n", | |
"9 235 -1.000000 -1.000000 -1.000000 \n", | |
" 236 -1.000000 -1.000000 -1.000000 \n", | |
" 237 -1.000000 -1.000000 -1.000000 \n", | |
" 238 -1.000000 -1.000000 -1.000000 \n", | |
" 239 -1.000000 -1.000000 -1.000000 \n", | |
"\n", | |
" JetPFCands_dzErr JetPFCands_eta JetPFCands_mass \\\n", | |
"entry subentry \n", | |
"0 0 0.013168 1.756348 1.395264e-01 \n", | |
" 1 0.011269 0.630249 1.395264e-01 \n", | |
" 2 0.019623 -0.810791 1.395264e-01 \n", | |
" 3 0.008598 -1.575684 1.395264e-01 \n", | |
" 4 0.022461 2.704590 1.282959e-01 \n", | |
"... ... ... ... \n", | |
"9 235 -1.000000 -1.780518 0.000000e+00 \n", | |
" 236 -1.000000 -1.868896 0.000000e+00 \n", | |
" 237 -1.000000 -1.876465 0.000000e+00 \n", | |
" 238 -1.000000 -1.938477 0.000000e+00 \n", | |
" 239 -1.000000 -2.285645 1.192093e-07 \n", | |
"\n", | |
" JetPFCands_phi JetPFCands_pt JetPFCands_puppiWeight \\\n", | |
"entry subentry \n", | |
"0 0 -0.977417 0.710938 1.000000 \n", | |
" 1 2.015137 0.521484 1.000000 \n", | |
" 2 -1.237305 0.654785 1.000000 \n", | |
" 3 -2.247559 0.865234 1.000000 \n", | |
" 4 0.629150 0.721680 0.000000 \n", | |
"... ... ... ... \n", | |
"9 235 -2.030273 1.375000 0.996094 \n", | |
" 236 0.288696 0.353516 0.000000 \n", | |
" 237 -0.261353 0.438232 0.000000 \n", | |
" 238 3.061523 0.152466 0.000000 \n", | |
" 239 -3.040039 1.911133 0.996094 \n", | |
"\n", | |
" JetPFCands_puppiWeightNoLep JetPFCands_trkChi2 \\\n", | |
"entry subentry \n", | |
"0 0 1.000000 0.0 \n", | |
" 1 1.000000 0.0 \n", | |
" 2 1.000000 0.0 \n", | |
" 3 1.000000 0.0 \n", | |
" 4 0.000000 0.0 \n", | |
"... ... ... \n", | |
"9 235 0.996094 -1.0 \n", | |
" 236 0.000000 -1.0 \n", | |
" 237 0.000000 -1.0 \n", | |
" 238 0.000000 -1.0 \n", | |
" 239 0.996094 -1.0 \n", | |
"\n", | |
" JetPFCands_vtxChi2 JetPFCands_charge \\\n", | |
"entry subentry \n", | |
"0 0 0.0 1 \n", | |
" 1 0.0 1 \n", | |
" 2 0.0 1 \n", | |
" 3 0.0 1 \n", | |
" 4 0.0 1 \n", | |
"... ... ... \n", | |
"9 235 -1.0 0 \n", | |
" 236 -1.0 0 \n", | |
" 237 -1.0 0 \n", | |
" 238 -1.0 0 \n", | |
" 239 -1.0 0 \n", | |
"\n", | |
" JetPFCands_lostInnerHits JetPFCands_pdgId \\\n", | |
"entry subentry \n", | |
"0 0 -1 211 \n", | |
" 1 -1 211 \n", | |
" 2 0 211 \n", | |
" 3 -1 211 \n", | |
" 4 -1 211 \n", | |
"... ... ... \n", | |
"9 235 -1 22 \n", | |
" 236 -1 22 \n", | |
" 237 -1 22 \n", | |
" 238 -1 22 \n", | |
" 239 -1 22 \n", | |
"\n", | |
" JetPFCands_pvAssocQuality JetPFCands_trkQuality \n", | |
"entry subentry \n", | |
"0 0 7 5 \n", | |
" 1 7 5 \n", | |
" 2 6 5 \n", | |
" 3 7 5 \n", | |
" 4 1 5 \n", | |
"... ... ... \n", | |
"9 235 7 0 \n", | |
" 236 7 0 \n", | |
" 237 7 0 \n", | |
" 238 7 0 \n", | |
" 239 7 0 \n", | |
"\n", | |
"[1877 rows x 17 columns]\n" | |
] | |
} | |
], | |
"source": [ | |
"for data in f['Events'].iterate(feature_names, step_size=10, library='pd'):\n", | |
" print(data)\n", | |
" break\n", | |
" # operate on a batch of data in the loop" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": null, | |
"metadata": {}, | |
"outputs": [], | |
"source": [] | |
} | |
], | |
"metadata": { | |
"kernelspec": { | |
"display_name": "Python (def)", | |
"language": "python", | |
"name": "def" | |
}, | |
"language_info": { | |
"codemirror_mode": { | |
"name": "ipython", | |
"version": 3 | |
}, | |
"file_extension": ".py", | |
"mimetype": "text/x-python", | |
"name": "python", | |
"nbconvert_exporter": "python", | |
"pygments_lexer": "ipython3", | |
"version": "3.7.3" | |
} | |
}, | |
"nbformat": 4, | |
"nbformat_minor": 4 | |
} |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment