Commit 3ab2d38f authored by Sylvester Joosten
Browse files

Add script to sanitize HepMC3 so it can be read properly by npsim

parent a0855d91
Pipeline #22202 passed with stages
in 1 minute and 1 second
......@@ -112,3 +112,7 @@ install(FILES
scripts/ DESTINATION bin RENAME sanitize_hepmc3
#!/usr/bin/env python3
import sys
import argparse
class InvalidHepmc3Error(Exception):
    """Raised when the input is not well-formed HepMC3 ASCII.

    The message parts are printed to stderr, prefixed with
    ``InvalidHepmc3Error:``, at the moment the exception is constructed.
    They are also passed on to ``Exception`` so they remain available
    through ``args`` and ``str()``.
    """

    def __init__(self, *msg):
        """Store and report the message.

        Args:
            *msg: Message fragments; they are printed space-separated.
        """
        # Chain to the base class so standard exception initialisation runs.
        super().__init__(*msg)
        print('InvalidHepmc3Error:', *msg, file=sys.stderr)
class EventHeader:
    """Bookkeeping for a single HepMC3 event (``E``) record.

    Keeps the raw header line, the vertex and particle counts announced by
    it, running counts of the vertices/particles seen so far, and the vertex
    info (the text following ``@``) taken from the header itself or, failing
    that, from the first vertex line that carries one.
    """

    def __init__(self, line):
        """Parse an event header line.

        Args:
            line: The raw ``E`` line as read from the input.

        Raises:
            InvalidHepmc3Error: If ``line`` does not start with ``E``.
        """
        # startswith() also rejects an empty string, where line[0] would
        # have raised IndexError instead of the intended error.
        if not line.startswith('E'):
            raise InvalidHepmc3Error('Expected event record, but found:', line)
        self.raw = line
        self.vertex = self._get_vertex_if_present(line)
        # Whitespace-agnostic split so repeated blanks or tabs cannot shift
        # the field positions; fields 2 and 3 are the announced counts.
        fields = line.split()
        self.n_vertices = int(fields[2])
        self.n_particles = int(fields[3])
        self.vert_cnt = 0
        self.part_cnt = 0

    def get_record(self):
        """Return the header line to emit for this event.

        If vertex info is known and the original header has no ``@`` part,
        the info is appended to the header; otherwise the raw header is
        returned unchanged.

        Raises:
            InvalidHepmc3Error: If fewer vertices or particles were processed
                than the header announced.
        """
        if self.vert_cnt != self.n_vertices:
            raise InvalidHepmc3Error('Not all vertices found for event:',
                                     self.raw)
        if self.part_cnt != self.n_particles:
            raise InvalidHepmc3Error('Not all particles found for event:',
                                     self.raw)
        if self.vertex and '@' not in self.raw:
            # Drop the header's last character (its line ending); the vertex
            # string is the tail of its source line and keeps that line's
            # own ending.
            return '{} @{}'.format(self.raw[:-1], self.vertex)
        return self.raw

    def process_vertex(self, line):
        """Count a vertex line and pick up its vertex info if still unknown.

        Args:
            line: The raw ``V`` line.

        Raises:
            InvalidHepmc3Error: If more vertices are seen than announced.
        """
        self.vert_cnt += 1
        if self.vert_cnt > self.n_vertices:
            raise InvalidHepmc3Error('Too many vertices for event:', self.raw)
        # Only the first vertex info encountered is kept.
        if not self.vertex and '@' in line:
            self.vertex = self._get_vertex_if_present(line)

    def process_particle(self, line):
        """Count a particle line.

        Args:
            line: The raw ``P`` line (its content is not inspected).

        Raises:
            InvalidHepmc3Error: If more particles are seen than announced.
        """
        self.part_cnt += 1
        if self.part_cnt > self.n_particles:
            raise InvalidHepmc3Error('Too many particles for event:', self.raw)

    def _get_vertex_if_present(self, line):
        """Return the text following the first ``@`` in ``line``, else None."""
        if '@' not in line:
            return None
        return line.split('@')[1]
def flush_buffer(header, buffer):
    """Write one buffered event to stdout.

    NOTE(review): the body of this function was truncated in the version
    under review (the ``for`` loop had no statements). The writes below are
    reconstructed from the script's stated purpose of writing the sanitized
    output to stdout -- confirm against the upstream script.

    Args:
        header: Object providing ``get_record()`` for the event, or a falsy
            value (e.g. None) when no event has been started yet.
        buffer: The raw lines belonging to the event, in input order.
    """
    if header:
        # The header goes first; get_record() validates the counts and may
        # append the vertex info collected while the event was buffered.
        sys.stdout.write(header.get_record())
        sys.stdout.writelines(buffer)
if __name__ == '__main__':
    parser = argparse.ArgumentParser(
        description='Read HepMC3 input from stdin and sanitize the '
                    'output (e.g. add vertex info to the event header '
                    'if the event has a displaced starting vertex). '
                    'Output is written to stdout.')
    # No options are defined; parsing still provides -h/--help.
    args = parser.parse_args()

    header = None            # EventHeader of the event being buffered
    buffer = []              # raw lines following the current event header
    have_first_line = False  # seen the 'HepMC::Version' line
    have_second_line = False  # seen the START_EVENT_LISTING line
    end_reached = False      # seen the END_EVENT_LISTING line

    # NOTE(review): several statements were missing from this block in the
    # version under review (the body of the skip branch, the `else:` ahead of
    # the per-field handling, the bodies of the 'V'/'P' branches, and any
    # output of the file header/footer). They are reconstructed here;
    # echoing the two file-header lines and the end marker in particular is
    # an assumption -- confirm against the upstream script.

    ## read line-by-line, fill the event buffer, and then
    ## write the sanitized output to stdout
    for line in sys.stdin:
        # Lines read from a stream keep their newline, so a length check can
        # never detect a blank line; test the stripped content instead.
        if end_reached or not line.strip():
            continue
        if not have_first_line:
            if 'HepMC::Version' not in line:
                raise InvalidHepmc3Error('Not a valid HepMC3 file header:', line)
            have_first_line = True
            sys.stdout.write(line)
        elif not have_second_line:
            if line != 'HepMC::Asciiv3-START_EVENT_LISTING\n':
                raise InvalidHepmc3Error('Not a valid HepMC3 file header:', line)
            have_second_line = True
            sys.stdout.write(line)
        elif line == 'HepMC::Asciiv3-END_EVENT_LISTING\n':
            end_reached = True
        elif line[0] == 'E':
            # A new event starts: emit the previous one, then start afresh.
            flush_buffer(header, buffer)
            header = EventHeader(line)
            buffer = []
        else:
            if header is None:
                raise InvalidHepmc3Error('Encountered field before the Event header:', line)
            if line[0] == 'V':
                header.process_vertex(line)
            elif line[0] == 'P':
                header.process_particle(line)
            elif line[0] not in ('W', 'A', 'U'):
                raise InvalidHepmc3Error('Encountered unknown field:', line)
            # Hold the line back until the event is complete, because the
            # header may still need vertex info from a later line.
            buffer.append(line)

    # final buffer flush at the end
    flush_buffer(header, buffer)
    if end_reached:
        # Written after the last event so the marker stays at the end.
        sys.stdout.write('HepMC::Asciiv3-END_EVENT_LISTING\n')
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment