16 auto delta_x = x1 - x2;
17 auto delta_y = y1 - y2;
18 auto r_square = delta_x * delta_x + delta_y * delta_y;
19 return std::sqrt(r_square);
24T
CLUE::dist(T x1, T y1, T z1, T x2, T y2, T z2) {
25 auto delta_x = x1 - x2;
26 auto delta_y = y1 - y2;
27 auto delta_z = z1 - z2;
28 auto r_square = delta_x * delta_x + delta_y * delta_y + delta_z * delta_z;
29 return std::sqrt(r_square);
37void CLUE::electronSeparation(std::vector<ldmx::EcalHit> hits) {
38 std::vector<double> layer_thickness = {2., 3.5, 5.3, 5.3, 5.3, 5.3,
39 5.3, 5.3, 5.3, 5.3, 5.3, 10.5,
40 10.5, 10.5, 10.5, 10.5};
43 std::sort(hits.begin(), hits.end(),
45 return a.getZPos() < b.getZPos();
48 std::vector<ldmx::EcalHit> first_layers;
49 std::vector<IntermediateCluster> first_layer_clusters;
51 double layer_z = hits[0].getZPos();
52 for (
const auto& hit : hits) {
53 if (hit.getZPos() > layer_z + layer_thickness[layer_tag] + air) {
58 first_layers.push_back(hit);
60 cluster.setLayer(layer_tag);
61 first_layer_clusters.push_back(cluster);
66 for (
int i = 0; i < first_layer_clusters.size(); i++) {
67 if (first_layer_clusters[i].empty())
continue;
69 for (
int j = i + 1; j < first_layer_clusters.size(); j++) {
70 if (first_layer_clusters[j].empty())
continue;
71 if (
dist(first_layer_clusters[i].centroidX(),
72 first_layer_clusters[i].centroidY(),
73 first_layer_clusters[j].centroidX(),
74 first_layer_clusters[j].centroidY()) < 8.) {
75 first_layer_clusters[i].add(first_layer_clusters[j]);
76 first_layer_clusters[j].clear();
83 ldmx_log(trace) <<
"--- ELECTRON SEPARATION ---";
84 for (
int i = 0; i < first_layer_clusters.size(); i++) {
85 if (first_layer_clusters[i].empty())
continue;
86 ldmx_log(trace) <<
" Cluster " << i
87 <<
" x: " << first_layer_clusters[i].centroidX()
88 <<
" y: " << first_layer_clusters[i].centroidY();
89 for (
int j = i + 1; j < first_layer_clusters.size(); j++) {
90 if (first_layer_clusters[j].empty())
continue;
91 auto d =
dist(first_layer_clusters[i].centroidX(),
92 first_layer_clusters[i].centroidY(),
93 first_layer_clusters[j].centroidX(),
94 first_layer_clusters[j].centroidY());
95 ldmx_log(trace) <<
"Dist to cluster " << j <<
": " << d;
101std::vector<std::vector<const ldmx::EcalHit*>> CLUE::createLayers(
102 const std::vector<const ldmx::EcalHit*>& hits) {
103 ldmx_log(trace) <<
"--- LAYER CREATION ---";
104 ldmx_log(trace) <<
"Number of layers: " << nbr_of_layers_;
108 std::vector<std::vector<const ldmx::EcalHit*>> hits_per_layer(nbr_of_layers_);
111 std::vector<double> layer_max_energies(nbr_of_layers_, 0.0);
114 layer_rho_c_.clear();
117 double rhoc_factor = rhoc_ / 250.;
119 for (
const auto& hit : hits) {
122 int layer = ecal_id.layer();
124 if (layer >= nbr_of_layers_) {
125 ldmx_log(trace) <<
"Skipping hit in layer " << layer
126 <<
" (beyond nbr_of_layers_ = " << nbr_of_layers_ <<
")";
131 if (hit->getEnergy() > layer_max_energies[layer]) {
132 layer_max_energies[layer] = hit->getEnergy();
135 ldmx_log(trace) <<
" Adding hit with energy " << hit->getEnergy()
136 <<
" to layer " << layer;
137 hits_per_layer[layer].push_back(hit);
141 for (
int i = 0; i < nbr_of_layers_; i++) {
142 double rho_c = layer_max_energies[i] / rhoc_factor;
143 layer_rho_c_.push_back(rho_c);
144 ldmx_log(trace) <<
"Layer " << i <<
" has " << hits_per_layer[i].size()
145 <<
" hits, max energy " << layer_max_energies[i]
146 <<
", rho_c " << rho_c;
149 ldmx_log(trace) <<
"Created " << hits_per_layer.size() <<
" layers";
150 return hits_per_layer;
153float CLUE::roundToDecimal(
float x_,
int num_decimal_precision_digits) {
154 float power_of_10 = std::pow(10, num_decimal_precision_digits);
155 return std::round(x_ * power_of_10) / power_of_10;
158std::vector<std::shared_ptr<CLUE::Density>> CLUE::setup(
159 const std::vector<const ldmx::EcalHit*>& hits) {
160 std::vector<std::shared_ptr<Density>> densities;
161 std::map<std::pair<float, float>, std::shared_ptr<Density>> density_map;
163 ldmx_log(trace) <<
"--- SETUP ---";
164 ldmx_log(trace) <<
"Building densities";
165 for (
const auto& hit : hits) {
167 float x = roundToDecimal(hit->getXPos(), 4);
168 float y = roundToDecimal(hit->getYPos(), 4);
169 float z = roundToDecimal(hit->getZPos(), 4);
170 ldmx_log(trace) <<
" New hit { x: " << x <<
" y: " << y <<
"}"
171 <<
" (and z: " << z <<
")";
172 std::pair<float, float> coords;
173 if (dc_ != 0 && nbr_of_layers_ > 1) {
175 double i = std::ceil(std::abs(x) / dc_);
176 double j = std::ceil(std::abs(y) / dc_);
190 ldmx_log(trace) <<
" Index " << i <<
", " << j <<
"; x: " << x
198 if (density_map.find(coords) == density_map.end()) {
199 density_map.emplace(coords, std::make_shared<CLUE::Density>(x, y));
200 ldmx_log(trace) <<
" * New density created";
202 ldmx_log(trace) <<
" --> Found density with x: "
203 << density_map[coords]->x_
204 <<
" y: " << density_map[coords]->y_;
206 density_map[coords]->hits_.push_back(hit);
207 density_map[coords]->total_energy_ += hit->getEnergy();
208 density_map[coords]->z_ += hit->getZPos();
210 event_centroid_.
add(hit);
213 densities.reserve(density_map.size());
214 for (
const auto& entry : density_map) {
215 densities.push_back(std::move(entry.second));
218 std::sort(densities.begin(), densities.end(),
219 [](
const std::shared_ptr<CLUE::Density>& a,
220 const std::shared_ptr<CLUE::Density>& b) {
221 return a->total_energy_ > b->total_energy_;
224 ldmx_log(trace) <<
"Decide parents";
227 for (
int i = 0; i < densities.size(); i++) {
228 densities[i]->index_ = i;
230 densities[i]->z_ = densities[i]->z_ / densities[i]->hits_.size();
231 ldmx_log(trace) <<
" Index: " << i <<
"; x: " << densities[i]->x_
232 <<
"; y: " << densities[i]->y_
233 <<
"; Energy: " << densities[i]->total_energy_;
235 for (
int j = 0; j < i; j++) {
236 float distance_2d =
dist(densities[i]->x_, densities[i]->y_,
237 densities[j]->x_, densities[j]->y_);
240 if ((distance_2d < dm_) && (distance_2d < densities[i]->delta_)) {
241 densities[i]->delta_ = distance_2d;
242 densities[i]->follower_of_ = j;
243 ldmx_log(trace) <<
" New parent, index " << j
244 <<
"; delta_2d: " << std::setprecision(4)
255std::vector<std::vector<const ldmx::EcalHit*>> CLUE::clustering(
256 std::vector<std::shared_ptr<CLUE::Density>>& densities,
257 bool connecting_layers,
int layer_index) {
258 ldmx_log(trace) <<
"--- CLUSTERING ---";
259 ldmx_log(trace) <<
"Number of densities: " << densities.size()
260 <<
"; connecting_layers: " << connecting_layers
261 <<
"; layer_index: " << layer_index;
262 if (!connecting_layers && nbr_of_layers_ > 1) {
264 rhoc_ = layer_rho_c_[layer_index];
265 ldmx_log(trace) <<
"Setting rho_c on layer " << layer_index <<
" to "
267 if (layer_index * 2 - 1 < radius_.size()) {
268 deltac_ = radius_[layer_index * 2 - 1];
269 ldmx_log(trace) <<
"Setting delta_c on layer " << layer_index <<
" to "
272 }
else if (connecting_layers) {
282 bool energy_overload =
false;
283 double max_energy = 10000.;
284 clustering_loops_ = 0;
285 double delta_c_mod = deltac_;
286 double centroid_radius = 10.;
289 std::vector<std::shared_ptr<Density>>& layer_seeds = seeds_[layer_index];
292 std::vector<std::vector<const ldmx::EcalHit*>> clusters;
294 std::vector<bool> merged_densities;
295 merged_densities.resize(densities.size());
297 std::vector<double> cluster_energies;
300 if (energy_overload) {
302 delta_c_mod = delta_c_mod / 1.1;
303 ldmx_log(trace) <<
"Energy overload, new delta_cmod: " << delta_c_mod;
304 energy_overload =
false;
308 ldmx_log(trace) <<
"Clustering loop " << clustering_loops_;
314 layer_seeds.reserve(densities.size());
316 clusters.reserve(densities.size());
317 cluster_energies.clear();
318 cluster_energies.reserve(densities.size());
320 std::stack<int> cluster_stack;
322 std::vector<std::vector<int>> followers;
323 followers.resize(densities.size());
326 for (
auto& density : densities) {
328 ldmx_log(trace) <<
" Index: " << density->index_
329 <<
"; x: " << density->x_ <<
"; y: " << density->y_
330 <<
"; Energy: " << density->total_energy_
331 <<
" Parent ID: " << density->follower_of_
332 <<
"; Delta: " << density->delta_;
335 if (delta_c_mod != deltac_ && merged_densities[density->cluster_id_] &&
337 event_centroid_.
centroidY()) < centroid_radius) {
342 density->total_energy_ > rhoc_ && density->delta_ > delta_c_mod;
344 is_seed = density->total_energy_ > rhoc_ && density->delta_ > deltac_;
346 ldmx_log(trace) <<
" Distance to event centroid: "
347 <<
dist(density->x_, density->y_,
353 (density->total_energy_ < rhoc_) && (density->delta_ > deltao_);
354 density->cluster_id_ = -1;
356 ldmx_log(trace) <<
" This is a Seed";
357 ldmx_log(trace) <<
" Distance to centroid: "
358 <<
dist(density->x_, density->y_,
361 <<
"; with delta " << density->delta_;
362 ldmx_log(trace) <<
" Setting cluster ID to " << k;
363 density->cluster_id_ = k;
366 cluster_stack.push(density->index_);
367 clusters.push_back(density->hits_);
368 cluster_energies.push_back(density->total_energy_);
369 layer_seeds.push_back(density);
370 }
else if (!is_outlier) {
371 ldmx_log(trace) <<
" This is a Follower";
372 int& parent_index = density->follower_of_;
373 if (parent_index != -1)
374 followers[parent_index].push_back(density->index_);
377 <<
" Somehow found a follower with parent index -1: id = "
380 ldmx_log(trace) <<
" This is an Outlier";
384 merged_densities.clear();
385 merged_densities.resize(densities.size());
388 while (cluster_stack.size() > 0) {
389 auto& d = densities[cluster_stack.top()];
391 auto& cid = d->cluster_id_;
393 for (
const auto follower_index : followers[d->index_]) {
394 auto& follower = densities[follower_index];
396 follower->cluster_id_ = cid;
397 cluster_energies[cid] += follower->total_energy_;
399 if (reclustering_ && cluster_energies[cid] > max_energy &&
400 delta_c_mod > 0.5 && clustering_loops_ < 100) {
403 merged_densities[cid] =
true;
404 if (!energy_overload && clustering_loops_ == 99) {
405 ldmx_log(warn) <<
"Merging clusters, max cluster loops hit";
407 energy_overload =
true;
408 if (clustering_loops_ != 1) {
414 clusters[cid].insert(std::end(clusters[cid]),
415 std::begin(follower->hits_),
416 std::end(follower->hits_));
419 cluster_stack.push(follower_index);
424 if (clustering_loops_ == 1 && energy_overload)
425 initial_cluster_nbr_ = clusters.size();
427 }
while (energy_overload);
429 if (!connecting_layers && nbr_of_layers_ > 1) {
432 for (
auto& seed : layer_seeds) {
433 seed->delta_ = std::numeric_limits<float>::max();
434 seed->hits_ = clusters[seed->cluster_id_];
435 seed->total_energy_ = cluster_energies[seed->cluster_id_];
436 seed->index_ = seed_index_;
440 std::sort(layer_seeds.begin(), layer_seeds.end(),
441 [](
const std::shared_ptr<Density>& a,
442 const std::shared_ptr<Density>& b) {
443 return a->total_energy_ > b->total_energy_;
451std::vector<std::shared_ptr<CLUE::Density>> CLUE::setupForClue3D() {
452 ldmx_log(trace) <<
"--- LAYER SETUP ---";
453 std::vector<std::shared_ptr<CLUE::Density>> densities;
454 layer_rho_c_.clear();
455 for (
int layer = 0; layer < nbr_of_layers_; layer++) {
456 ldmx_log(trace) <<
" LAYER " << layer <<
" with " << seeds_[layer].size()
458 auto& seeds_in_current_layer = seeds_[layer];
459 double highest_energy = 0.;
460 for (
const auto& current_seed : seeds_in_current_layer) {
462 current_seed->layer_ = layer;
463 if (current_seed->total_energy_ > highest_energy)
464 highest_energy = current_seed->total_energy_;
465 ldmx_log(trace) <<
" Density with index " << current_seed->index_
466 <<
", energy: " << current_seed->total_energy_
467 <<
" position (x,y)= {" << current_seed->x_ <<
","
468 << current_seed->y_ <<
")";
473 if ((layer - depth >= 0) && (layer - depth < seeds_.size())) {
474 ldmx_log(trace) <<
" Looking at pre-layer: " << layer - depth;
476 ldmx_log(trace) <<
" In previous layer... ";
477 auto& previous_layer = seeds_[layer - depth];
478 ldmx_log(trace) <<
" Got " << previous_layer.size() <<
" seeds";
479 for (
const auto& prev_seed : previous_layer) {
481 auto distance_2d_prev =
dist(current_seed->x_, current_seed->y_,
482 prev_seed->x_, prev_seed->y_);
483 auto dz_prev = std::abs(current_seed->z_ - prev_seed->z_);
484 ldmx_log(trace) <<
" DeltaXY to index " << prev_seed->index_
485 <<
": " << std::setprecision(4) << distance_2d_prev;
486 ldmx_log(trace) <<
" DeltaZ to index " << prev_seed->index_
487 <<
": " << std::setprecision(4) << dz_prev;
488 if (prev_seed->total_energy_ > current_seed->total_energy_ &&
489 distance_2d_prev < current_seed->delta_ &&
490 dz_prev < current_seed->z_delta_) {
491 ldmx_log(trace) <<
" New parent: index " << prev_seed->index_
492 <<
" on layer " << layer - depth <<
"; energy "
493 << prev_seed->total_energy_;
494 ldmx_log(trace) <<
" New 2D distance to prev-layer: "
495 << std::setprecision(4) << distance_2d_prev;
497 <<
" New delta Z: " << std::setprecision(4) << dz_prev;
498 current_seed->delta_ = distance_2d_prev;
499 current_seed->z_delta_ = dz_prev;
500 current_seed->follower_of_ = prev_seed->index_;
501 }
else if (prev_seed->total_energy_ < current_seed->total_energy_) {
502 ldmx_log(trace) <<
" Breaking on index " << prev_seed->index_
503 <<
" with energy " << prev_seed->total_energy_;
509 if (layer + depth < nbr_of_layers_ && layer + depth < seeds_.size()) {
510 ldmx_log(trace) <<
" Looking at post-layer: " << layer + depth;
511 auto& next_layer = seeds_[layer + depth];
512 ldmx_log(trace) <<
" Got " << next_layer.size() <<
" seeds";
513 for (
const auto& next_seed : next_layer) {
514 auto distance_2d_next =
dist(current_seed->x_, current_seed->y_,
515 next_seed->x_, next_seed->y_);
516 auto dz_next = std::abs(current_seed->z_ - next_seed->z_);
517 ldmx_log(trace) <<
" DeltaXY to index " << next_seed->index_
518 <<
": " << std::setprecision(4) << distance_2d_next;
519 ldmx_log(trace) <<
" DeltaZ to index_" << next_seed->index_
520 <<
": " << std::setprecision(4) << dz_next;
521 if (next_seed->total_energy_ > current_seed->total_energy_ &&
522 distance_2d_next < current_seed->delta_ &&
523 dz_next < current_seed->z_delta_) {
524 ldmx_log(trace) <<
" New parent: index_" << next_seed->index_
525 <<
" on layer " << layer + depth <<
"; energy "
526 << next_seed->total_energy_;
527 ldmx_log(trace) <<
" New 2D distance to next-layer: "
528 << std::setprecision(4) << distance_2d_next;
530 <<
" New delta_Z: " << std::setprecision(4) << dz_next;
531 current_seed->delta_ = distance_2d_next;
532 current_seed->z_delta_ = dz_next;
533 current_seed->follower_of_ = next_seed->index_;
534 }
else if (next_seed->total_energy_ < current_seed->total_energy_) {
535 ldmx_log(trace) <<
" Breaking on index_" << next_seed->index_
536 <<
" with energy " << next_seed->total_energy_;
543 ldmx_log(trace) <<
" Done setting parents.";
544 densities.push_back(current_seed);
547 layer_rho_c_.push_back(highest_energy / 2);
552void CLUE::convertToIntermediateClusters(
553 std::vector<std::vector<const ldmx::EcalHit*>>& clusters) {
556 for (
const auto& cluster : clusters) {
558 intermediate_cluster_first_layer{};
560 for (
const auto& hit : cluster) {
561 intermediate_cluster.add(hit);
564 auto layer = ecal_id.layer();
565 intermediate_cluster.setLayer(layer);
567 intermediate_cluster_first_layer.add(hit);
568 intermediate_cluster_first_layer.setLayer(layer);
571 final_clusters_.push_back(intermediate_cluster);
572 first_layer_centroids_.push_back(intermediate_cluster_first_layer);
573 auto cent_x = intermediate_cluster.centroidX();
574 auto cent_y = intermediate_cluster.centroidY();
575 auto event_cent_x = event_centroid_.
centroidX();
576 auto event_cent_y = event_centroid_.
centroidY();
577 const auto& distance =
dist(cent_x, cent_y, event_cent_x, event_cent_y);
578 centroid_distances_.push_back(distance);
582void CLUE::cluster(
const std::vector<ldmx::EcalHit>& unsorted_hits,
double dc,
583 double rc,
double delta_c,
double delta_o,
int nbr_of_layers,
585 ldmx_log(info) <<
"Starting CLUE clustering with parameters:" <<
"dc " << dc
586 <<
", rc " << rc <<
", delta_c " << delta_c <<
", delta_o "
587 << delta_o <<
", nbr_of_layers " << nbr_of_layers
588 <<
", reclustering " << reclustering;
598 dm_ = std::max(delta_c, delta_o);
601 reclustering_ = reclustering;
602 nbr_of_layers_ = nbr_of_layers;
604 if (nbr_of_layers_ < 1) {
606 nbr_of_layers_ = max_layers_;
607 }
else if (nbr_of_layers_ > max_layers_) {
608 ldmx_log(warn) <<
"nbr_of_layers_ " << nbr_of_layers_
609 <<
" exceeds max layers " << max_layers_
610 <<
", setting to max layers";
611 nbr_of_layers_ = max_layers_;
615 std::vector<const ldmx::EcalHit*> hits;
616 hits.reserve(unsorted_hits.size());
617 ldmx_log(debug) <<
"Clustering " << unsorted_hits.size() <<
" hits";
618 for (
const auto& unsorted_hit : unsorted_hits) {
619 hits.push_back(&unsorted_hit);
622 ldmx_log(debug) <<
"Sorting hits by Z position";
623 std::sort(hits.begin(), hits.end(),
625 return a->getZPos() < b->getZPos();
628 seeds_.resize(nbr_of_layers_);
630 if (nbr_of_layers_ > 1) {
631 ldmx_log(debug) <<
"Creating layers";
633 const auto layers = createLayers(hits);
634 ldmx_log(debug) <<
"Doing layer-wise clustering on " << layers.size()
636 for (
int i = 0; i < layers.size(); i++) {
637 ldmx_log(trace) <<
"--- LAYER " << i + 1 <<
" ---";
638 auto densities = setup(layers[i]);
639 auto clusters = clustering(densities,
false, i);
640 convertToIntermediateClusters(clusters);
649 ldmx_log(debug) <<
"Only one layer, doing 2D clustering";
650 auto densities = setup(hits);
651 auto clusters = clustering(densities,
false);
652 convertToIntermediateClusters(clusters);
A version of CLUE (CMS) for clustering in ECal.
T dist(T x1, T y1, T x2, T y2)
Euclidean distance between two points.
Stores reconstructed hit information from the ECAL.
Extension of DetectorID providing access to ECal layers and cell numbers in a hex grid.
double centroidY() const
Get the centroid Y position (energy-weighted).
double centroidX() const
Get the centroid X position (energy-weighted).
void add(const HitType *hit)
Add a hit to the cluster using its stored position.