Back to home page

Project CMSSW displayed by LXR

 
 

    


File indexing completed on 2024-10-17 22:59:06

0001 #include "MkFinder.h"
0002 
0003 #include "RecoTracker/MkFitCore/interface/cms_common_macros.h"
0004 #include "RecoTracker/MkFitCore/interface/IterationConfig.h"
0005 #include "CandCloner.h"
0006 #include "FindingFoos.h"
0007 #include "KalmanUtilsMPlex.h"
0008 #include "MatriplexPackers.h"
0009 #include "MiniPropagators.h"
0010 
0011 //#define DEBUG
0012 #include "Debug.h"
0013 
0014 #if defined(MKFIT_STANDALONE)
0015 #include "RecoTracker/MkFitCore/standalone/Event.h"
0016 #endif
0017 
0018 #ifdef RNT_DUMP_MkF_SelHitIdcs
0019 // declares struct RntIfc_selectHitIndices rnt_shi in unnamed namespace;
0020 #include "RecoTracker/MkFitCore/standalone/RntDumper/MkFinder_selectHitIndices.icc"
0021 #endif
0022 
0023 #include "vdt/atan2.h"
0024 
0025 #include <algorithm>
0026 #include <queue>
0027 
0028 namespace mkfit {
0029 
0030   void MkFinder::setup(const PropagationConfig &pc,
0031                        const IterationConfig &ic,
0032                        const IterationParams &ip,
0033                        const IterationLayerConfig &ilc,
0034                        const SteeringParams &sp,
0035                        const std::vector<bool> *ihm,
0036                        const Event *ev,
0037                        int region,
0038                        bool infwd) {
0039     m_prop_config = &pc;
0040     m_iteration_config = &ic;
0041     m_iteration_params = &ip;
0042     m_iteration_layer_config = &ilc;
0043     m_steering_params = &sp;
0044     m_iteration_hit_mask = ihm;
0045     m_event = ev;
0046     m_current_region = region;
0047     m_in_fwd = infwd;
0048   }
0049 
0050   void MkFinder::setup_bkfit(const PropagationConfig &pc, const SteeringParams &sp, const Event *ev) {
0051     m_prop_config = &pc;
0052     m_steering_params = &sp;
0053     m_event = ev;
0054   }
0055 
0056   void MkFinder::release() {
0057     m_prop_config = nullptr;
0058     m_iteration_config = nullptr;
0059     m_iteration_params = nullptr;
0060     m_iteration_layer_config = nullptr;
0061     m_steering_params = nullptr;
0062     m_iteration_hit_mask = nullptr;
0063     m_event = nullptr;
0064     m_current_region = -1;
0065     m_in_fwd = true;
0066   }
0067 
0068   void MkFinder::begin_layer(const LayerOfHits &layer_of_hits) {
0069 #ifdef RNT_DUMP_MkF_SelHitIdcs
0070     const LayerOfHits &L = layer_of_hits;
0071     const LayerInfo &LI = L.layer_info();
0072     rnt_shi.ResetH();
0073     rnt_shi.ResetF();
0074     *rnt_shi.h = {m_event->evtID(),
0075                   m_iteration_config->m_iteration_index,
0076                   m_iteration_config->m_track_algorithm,
0077                   m_current_region,
0078                   L.layer_id(),
0079                   L.is_barrel() ? LI.rin() : LI.zmin(),
0080                   LI.is_barrel() ? LI.rout() : LI.zmax(),
0081                   L.is_barrel(),
0082                   L.is_pixel(),
0083                   L.is_stereo()};
0084     *rnt_shi.f = *rnt_shi.h;
0085 #endif
0086   }
0087 
0088   void MkFinder::end_layer() {
0089 #ifdef RNT_DUMP_MkF_SelHitIdcs
0090     rnt_shi.FillH();
0091     rnt_shi.FillF();
0092 #endif
0093   }
0094 
0095   //==============================================================================
0096   // Input / Output TracksAndHitIdx
0097   //==============================================================================
0098 
0099   void MkFinder::inputTracksAndHitIdx(const std::vector<Track> &tracks, int beg, int end, bool inputProp) {
0100     // Assign track parameters to initial state and copy hit values in.
0101 
0102     // This might not be true for the last chunk!
0103     // assert(end - beg == NN);
0104 
0105     const int iI = inputProp ? iP : iC;
0106 
0107     for (int i = beg, imp = 0; i < end; ++i, ++imp) {
0108       copy_in(tracks[i], imp, iI);
0109     }
0110   }
0111 
0112   void MkFinder::inputTracksAndHitIdx(
0113       const std::vector<Track> &tracks, const std::vector<int> &idxs, int beg, int end, bool inputProp, int mp_offset) {
0114     // Assign track parameters to initial state and copy hit values in.
0115 
0116     // This might not be true for the last chunk!
0117     // assert(end - beg == NN);
0118 
0119     const int iI = inputProp ? iP : iC;
0120 
0121     for (int i = beg, imp = mp_offset; i < end; ++i, ++imp) {
0122       copy_in(tracks[idxs[i]], imp, iI);
0123     }
0124   }
0125 
0126   void MkFinder::inputTracksAndHitIdx(const std::vector<CombCandidate> &tracks,
0127                                       const std::vector<std::pair<int, int>> &idxs,
0128                                       int beg,
0129                                       int end,
0130                                       bool inputProp) {
0131     // Assign track parameters to initial state and copy hit values in.
0132 
0133     // This might not be true for the last chunk!
0134     // assert(end - beg == NN);
0135 
0136     const int iI = inputProp ? iP : iC;
0137 
0138     for (int i = beg, imp = 0; i < end; ++i, ++imp) {
0139       const TrackCand &trk = tracks[idxs[i].first][idxs[i].second];
0140 
0141       copy_in(trk, imp, iI);
0142 
0143       m_SeedIdx(imp, 0, 0) = idxs[i].first;
0144       m_CandIdx(imp, 0, 0) = idxs[i].second;
0145       m_SeedOriginIdx[imp] = tracks[idxs[i].first].seed_origin_index();
0146     }
0147   }
0148 
0149   void MkFinder::inputTracksAndHits(const std::vector<CombCandidate> &tracks,
0150                                     const LayerOfHits &layer_of_hits,
0151                                     const std::vector<UpdateIndices> &idxs,
0152                                     int beg,
0153                                     int end,
0154                                     bool inputProp) {
0155     // Assign track parameters to initial state and copy hit values in.
0156 
0157     // This might not be true for the last chunk!
0158     // assert(end - beg == NN);
0159 
0160     const int iI = inputProp ? iP : iC;
0161 
0162     for (int i = beg, imp = 0; i < end; ++i, ++imp) {
0163       const TrackCand &trk = tracks[idxs[i].seed_idx][idxs[i].cand_idx];
0164 
0165       copy_in(trk, imp, iI);
0166 
0167       m_SeedIdx(imp, 0, 0) = idxs[i].seed_idx;
0168       m_CandIdx(imp, 0, 0) = idxs[i].cand_idx;
0169       m_SeedOriginIdx[imp] = tracks[idxs[i].seed_idx].seed_origin_index();
0170 
0171       // Reuse selectHitIndices() arrays -- used also in packModuleNormDir()
0172       m_XHitArr(imp, 0, 0) = idxs[i].hit_idx;
0173       m_XHitSize(imp, 0, 0) = 1;
0174 
0175       const Hit &hit = layer_of_hits.refHit(idxs[i].hit_idx);
0176       m_msErr.copyIn(imp, hit.errArray());
0177       m_msPar.copyIn(imp, hit.posArray());
0178     }
0179   }
0180 
0181   void MkFinder::inputOverlapHits(const LayerOfHits &layer_of_hits,
0182                                   const std::vector<UpdateIndices> &idxs,
0183                                   int beg,
0184                                   int end) {
0185     // Copy overlap hit values in.
0186 
0187     for (int i = beg, imp = 0; i < end; ++i, ++imp) {
0188       const Hit &hit = layer_of_hits.refHit(idxs[i].ovlp_idx);
0189       m_msErr.copyIn(imp, hit.errArray());
0190       m_msPar.copyIn(imp, hit.posArray());
0191     }
0192   }
0193 
0194   void MkFinder::inputTracksAndHitIdx(const std::vector<CombCandidate> &tracks,
0195                                       const std::vector<std::pair<int, IdxChi2List>> &idxs,
0196                                       int beg,
0197                                       int end,
0198                                       bool inputProp) {
0199     // Assign track parameters to initial state and copy hit values in.
0200 
0201     // This might not be true for the last chunk!
0202     // assert(end - beg == NN);
0203 
0204     const int iI = inputProp ? iP : iC;
0205 
0206     for (int i = beg, imp = 0; i < end; ++i, ++imp) {
0207       const TrackCand &trk = tracks[idxs[i].first][idxs[i].second.trkIdx];
0208 
0209       copy_in(trk, imp, iI);
0210 
0211       m_SeedIdx(imp, 0, 0) = idxs[i].first;
0212       m_CandIdx(imp, 0, 0) = idxs[i].second.trkIdx;
0213       m_SeedOriginIdx[imp] = tracks[idxs[i].first].seed_origin_index();
0214     }
0215   }
0216 
0217   void MkFinder::outputTracksAndHitIdx(std::vector<Track> &tracks, int beg, int end, bool outputProp) const {
0218     // Copies requested track parameters into Track objects.
0219     // The tracks vector should be resized to allow direct copying.
0220 
0221     const int iO = outputProp ? iP : iC;
0222 
0223     for (int i = beg, imp = 0; i < end; ++i, ++imp) {
0224       copy_out(tracks[i], imp, iO);
0225     }
0226   }
0227 
0228   void MkFinder::outputTracksAndHitIdx(
0229       std::vector<Track> &tracks, const std::vector<int> &idxs, int beg, int end, bool outputProp) const {
0230     // Copies requested track parameters into Track objects.
0231     // The tracks vector should be resized to allow direct copying.
0232 
0233     const int iO = outputProp ? iP : iC;
0234 
0235     for (int i = beg, imp = 0; i < end; ++i, ++imp) {
0236       copy_out(tracks[idxs[i]], imp, iO);
0237     }
0238   }
0239 
0240   void MkFinder::packModuleNormDirPnt(
0241       const LayerOfHits &layer_of_hits, int hit_cnt, MPlexHV &norm, MPlexHV &dir, MPlexHV &pnt, int N_proc) const {
0242     for (int itrack = 0; itrack < NN; ++itrack) {
0243       if (itrack < N_proc && hit_cnt < m_XHitSize[itrack]) {
0244         const auto &hit = layer_of_hits.refHit(m_XHitArr.constAt(itrack, hit_cnt, 0));
0245         unsigned int mid = hit.detIDinLayer();
0246         const ModuleInfo &mi = layer_of_hits.layer_info().module_info(mid);
0247         norm.At(itrack, 0, 0) = mi.zdir[0];
0248         norm.At(itrack, 1, 0) = mi.zdir[1];
0249         norm.At(itrack, 2, 0) = mi.zdir[2];
0250         dir.At(itrack, 0, 0) = mi.xdir[0];
0251         dir.At(itrack, 1, 0) = mi.xdir[1];
0252         dir.At(itrack, 2, 0) = mi.xdir[2];
0253         pnt.At(itrack, 0, 0) = mi.pos[0];
0254         pnt.At(itrack, 1, 0) = mi.pos[1];
0255         pnt.At(itrack, 2, 0) = mi.pos[2];
0256         //std::cout << "packModuleNormDirPnt id=" << hit_cnt << " norm=(" << mi.zdir[0] << ", " << mi.zdir[1] << ", " << mi.zdir[2] << ") - dir=(" << mi.xdir[0] << ", " << mi.xdir[1] << ", " << mi.xdir[2] << ") -  pnt=(" << mi.pos[0] << ", " << mi.pos[1] << ", " << mi.pos[2] << ")" << std::endl;
0257       }
0258     }
0259   }
0260 
0261   //==============================================================================
0262   // getHitSelDynamicWindows
0263   //==============================================================================
0264   // From HitSelectionWindows.h: track-related config on hit selection windows
0265 
0266   void MkFinder::getHitSelDynamicWindows(
0267       const float invpt, const float theta, float &min_dq, float &max_dq, float &min_dphi, float &max_dphi) {
0268     float max_invpt = std::min(invpt, 10.0f);  // => pT>0.1 GeV
0269 
0270     enum SelWinParameters_e { dp_sf = 0, dp_0, dp_1, dp_2, dq_sf, dq_0, dq_1, dq_2 };
0271     auto &v = m_iteration_layer_config->get_window_params(m_in_fwd, true);
0272 
0273     if (!v.empty()) {
0274       // dq hit selection window
0275       const float this_dq = v[dq_sf] * (v[dq_0] * max_invpt + v[dq_1] * theta + v[dq_2]);
0276       // In case value is below 0 (bad window derivation or other reasons), leave original limits
0277       if (this_dq > 0.f) {
0278         min_dq = this_dq;
0279         max_dq = 2.0f * min_dq;
0280       }
0281 
0282       // dphi hit selection window
0283       const float this_dphi = v[dp_sf] * (v[dp_0] * max_invpt + v[dp_1] * theta + v[dp_2]);
0284       // In case value is too low (bad window derivation or other reasons), leave original limits
0285       if (this_dphi > min_dphi) {
0286         min_dphi = this_dphi;
0287         max_dphi = 2.0f * min_dphi;
0288       }
0289     }
0290   }
0291 
0292   //==============================================================================
0293   // getHitSelDynamicChi2Cut
0294   //==============================================================================
0295   // From HitSelectionWindows.h: track-related config on hit selection windows
0296 
0297   inline float MkFinder::getHitSelDynamicChi2Cut(const int itrk, const int ipar) {
0298     const float minChi2Cut = m_iteration_params->chi2Cut_min;
0299     const float invpt = m_Par[ipar].At(itrk, 3, 0);
0300     const float theta = std::abs(m_Par[ipar].At(itrk, 5, 0) - Const::PIOver2);
0301 
0302     float max_invpt = std::min(invpt, 10.0f);  // => pT>0.1 GeV
0303 
0304     enum SelWinParameters_e { c2_sf = 8, c2_0, c2_1, c2_2 };
0305     auto &v = m_iteration_layer_config->get_window_params(m_in_fwd, true);
0306 
0307     if (!v.empty()) {
0308       float this_c2 = v[c2_sf] * (v[c2_0] * max_invpt + v[c2_1] * theta + v[c2_2]);
0309       // In case value is too low (bad window derivation or other reasons), leave original limits
0310       if (this_c2 > minChi2Cut)
0311         return this_c2;
0312     }
0313     return minChi2Cut;
0314   }
0315 
0316   //==============================================================================
0317   // SelectHitIndices
0318   //==============================================================================
0319 
0320   void MkFinder::selectHitIndices(const LayerOfHits &layer_of_hits, const int N_proc, bool fill_binsearch_only) {
0321     // bool debug = true;
0322     using bidx_t = LayerOfHits::bin_index_t;
0323     using bcnt_t = LayerOfHits::bin_content_t;
0324     const LayerOfHits &L = layer_of_hits;
0325     const IterationLayerConfig &ILC = *m_iteration_layer_config;
0326 
0327     const int iI = iP;
0328     const float nSigmaPhi = 3;
0329     const float nSigmaZ = 3;
0330     const float nSigmaR = 3;
0331 
0332     dprintf("LayerOfHits::SelectHitIndices %s layer=%d N_proc=%d\n",
0333             L.is_barrel() ? "barrel" : "endcap",
0334             L.layer_id(),
0335             N_proc);
0336 
0337     float dqv[NN], dphiv[NN], qv[NN], phiv[NN];
0338     bidx_t qb1v[NN], qb2v[NN], qbv[NN], pb1v[NN], pb2v[NN];
0339 
0340     const auto assignbins = [&](int itrack,
0341                                 float q,
0342                                 float dq,
0343                                 float phi,
0344                                 float dphi,
0345                                 float min_dq,
0346                                 float max_dq,
0347                                 float min_dphi,
0348                                 float max_dphi) {
0349       dphi = std::clamp(std::abs(dphi), min_dphi, max_dphi);
0350       dq = std::clamp(dq, min_dq, max_dq);
0351       //
0352       qv[itrack] = q;
0353       phiv[itrack] = phi;
0354       dphiv[itrack] = dphi;
0355       dqv[itrack] = dq;
0356       //
0357       qbv[itrack] = L.qBinChecked(q);
0358       qb1v[itrack] = L.qBinChecked(q - dq);
0359       qb2v[itrack] = L.qBinChecked(q + dq) + 1;
0360       pb1v[itrack] = L.phiBinChecked(phi - dphi);
0361       pb2v[itrack] = L.phiMaskApply(L.phiBin(phi + dphi) + 1);
0362     };
0363 
0364     const auto calcdphi2 = [&](int itrack, float dphidx, float dphidy) {
0365       return dphidx * dphidx * m_Err[iI].constAt(itrack, 0, 0) + dphidy * dphidy * m_Err[iI].constAt(itrack, 1, 1) +
0366              2 * dphidx * dphidy * m_Err[iI].constAt(itrack, 0, 1);
0367     };
0368 
0369     const auto calcdphi = [&](float dphi2, float min_dphi) {
0370       return std::max(nSigmaPhi * std::sqrt(std::abs(dphi2)), min_dphi);
0371     };
0372 
0373     if (L.is_barrel()) {
0374       // Pull out the part of the loop that vectorizes with icc and gcc
0375       // In llvm16 clang issues a warning that it can't vectorize
0376       // the loop.  Unfortunately, there doesn't seem to be a
0377       // pragma to suppress the warning, so we ifdef it out.  This
0378       // should be rechecked if llvm vectorization improves.
0379 #if !defined(__clang__)
0380 #pragma omp simd
0381 #endif
0382       for (int itrack = 0; itrack < NN; ++itrack) {
0383         if (itrack >= N_proc)
0384           continue;
0385         m_XHitSize[itrack] = 0;
0386 
0387         float min_dq = ILC.min_dq();
0388         float max_dq = ILC.max_dq();
0389         float min_dphi = ILC.min_dphi();
0390         float max_dphi = ILC.max_dphi();
0391 
0392         const float invpt = m_Par[iI].At(itrack, 3, 0);
0393         const float theta = std::fabs(m_Par[iI].At(itrack, 5, 0) - Const::PIOver2);
0394         getHitSelDynamicWindows(invpt, theta, min_dq, max_dq, min_dphi, max_dphi);
0395 
0396         const float x = m_Par[iI].constAt(itrack, 0, 0);
0397         const float y = m_Par[iI].constAt(itrack, 1, 0);
0398         const float r2 = x * x + y * y;
0399         const float dphidx = -y / r2, dphidy = x / r2;
0400         const float dphi2 = calcdphi2(itrack, dphidx, dphidy);
0401 #ifdef HARD_CHECK
0402         assert(dphi2 >= 0);
0403 #endif
0404 
0405         const float phi = getPhi(x, y);
0406         float dphi = calcdphi(dphi2, min_dphi);
0407 
0408         const float z = m_Par[iI].constAt(itrack, 2, 0);
0409         const float dz = std::abs(nSigmaZ * std::sqrt(m_Err[iI].constAt(itrack, 2, 2)));
0410         const float edgeCorr =
0411             std::abs(0.5f * (L.layer_info().rout() - L.layer_info().rin()) / std::tan(m_Par[iI].constAt(itrack, 5, 0)));
0412         // XXX-NUM-ERR above, m_Err(2,2) gets negative!
0413 
0414         m_XWsrResult[itrack] = L.is_within_z_sensitive_region(z, std::sqrt(dz * dz + edgeCorr * edgeCorr));
0415         assignbins(itrack, z, dz, phi, dphi, min_dq, max_dq, min_dphi, max_dphi);
0416 
0417         // Relax propagation-fail detection to be in line with pre-43145.
0418         if (m_FailFlag[itrack] && std::sqrt(r2) >= L.layer_info().rin()) {
0419           m_FailFlag[itrack] = 0;
0420         }
0421       }
0422     } else  // endcap
0423     {
0424       //layer half-thikness for dphi spread calculation; only for very restrictive iters
0425       const float layerD = std::abs(L.layer_info().zmax() - L.layer_info().zmin()) * 0.5f *
0426                            (m_iteration_params->maxConsecHoles == 0 || m_iteration_params->maxHolesPerCand == 0);
0427       // Pull out the part of the loop that vectorizes with icc and gcc
0428 #if !defined(__clang__)
0429 #pragma omp simd
0430 #endif
0431       for (int itrack = 0; itrack < NN; ++itrack) {
0432         m_XHitSize[itrack] = 0;
0433 
0434         float min_dq = ILC.min_dq();
0435         float max_dq = ILC.max_dq();
0436         float min_dphi = ILC.min_dphi();
0437         float max_dphi = ILC.max_dphi();
0438 
0439         const float invpt = m_Par[iI].At(itrack, 3, 0);
0440         const float theta = std::fabs(m_Par[iI].At(itrack, 5, 0) - Const::PIOver2);
0441         getHitSelDynamicWindows(invpt, theta, min_dq, max_dq, min_dphi, max_dphi);
0442 
0443         const float x = m_Par[iI].constAt(itrack, 0, 0);
0444         const float y = m_Par[iI].constAt(itrack, 1, 0);
0445         const float r2 = x * x + y * y;
0446         const float r2Inv = 1.f / r2;
0447         const float dphidx = -y * r2Inv, dphidy = x * r2Inv;
0448         const float phi = getPhi(x, y);
0449         const float dphi2 =
0450             calcdphi2(itrack, dphidx, dphidy)
0451             //range from finite layer thickness
0452             + std::pow(layerD * std::tan(m_Par[iI].At(itrack, 5, 0)) * std::sin(m_Par[iI].At(itrack, 4, 0) - phi), 2) *
0453                   r2Inv;
0454 #ifdef HARD_CHECK
0455         assert(dphi2 >= 0);
0456 #endif
0457 
0458         float dphi = calcdphi(dphi2, min_dphi);
0459 
0460         const float r = std::sqrt(r2);
0461         const float dr = nSigmaR * std::sqrt(std::abs(x * x * m_Err[iI].constAt(itrack, 0, 0) +
0462                                                       y * y * m_Err[iI].constAt(itrack, 1, 1) +
0463                                                       2 * x * y * m_Err[iI].constAt(itrack, 0, 1)) /
0464                                              r2);
0465         const float edgeCorr = std::abs(0.5f * (L.layer_info().zmax() - L.layer_info().zmin()) *
0466                                         std::tan(m_Par[iI].constAt(itrack, 5, 0)));
0467 
0468         m_XWsrResult[itrack] = L.is_within_r_sensitive_region(r, std::sqrt(dr * dr + edgeCorr * edgeCorr));
0469         assignbins(itrack, r, dr, phi, dphi, min_dq, max_dq, min_dphi, max_dphi);
0470       }
0471     }
0472 
0473 #ifdef RNT_DUMP_MkF_SelHitIdcs
0474     if (fill_binsearch_only) {
0475       // XXX loop over good indices (prepared in V2) and put in V1 BinSearch results
0476       for (auto i : rnt_shi.f_h_idcs) {
0477         CandInfo &ci = (*rnt_shi.ci)[rnt_shi.f_h_remap[i]];
0478         ci.bso = BinSearch({phiv[i],
0479                             dphiv[i],
0480                             qv[i],
0481                             dqv[i],
0482                             pb1v[i],
0483                             pb2v[i],
0484                             qb1v[i],
0485                             qb2v[i],
0486                             m_XWsrResult[i].m_wsr,
0487                             m_XWsrResult[i].m_in_gap,
0488                             false});
0489       }
0490       return;
0491     }
0492 #endif
0493 
0494     // Vectorizing this makes it run slower!
0495     //#pragma omp simd
0496     for (int itrack = 0; itrack < NN; ++itrack) {
0497       if (itrack >= N_proc) {
0498         continue;
0499       }
0500       // PROP-FAIL-ENABLE The following to be enabled when propagation failure
0501       // detection is properly implemented in propagate-to-R/Z.
0502       if (m_FailFlag[itrack]) {
0503         m_XWsrResult[itrack].m_wsr = WSR_Failed;
0504         continue;
0505       }
0506 
0507       if (m_XWsrResult[itrack].m_wsr == WSR_Outside) {
0508         continue;
0509       }
0510 
0511       const bidx_t qb = qbv[itrack];
0512       const bidx_t qb1 = qb1v[itrack];
0513       const bidx_t qb2 = qb2v[itrack];
0514       const bidx_t pb1 = pb1v[itrack];
0515       const bidx_t pb2 = pb2v[itrack];
0516 
0517       const float q = qv[itrack];
0518       const float phi = phiv[itrack];
0519       const float dphi = dphiv[itrack];
0520       const float dq = dqv[itrack];
0521 
0522       // clang-format off
0523       dprintf("  %2d/%2d: %6.3f %6.3f %6.6f %7.5f %3u %3u %4u %4u\n",
0524               L.layer_id(), itrack, q, phi, dq, dphi,
0525               qb1, qb2, pb1, pb2);
0526       // clang-format on
0527 
0528 #if defined(DUMPHITWINDOW) && defined(MKFIT_STANDALONE)
0529       const auto ngr = [](float f) { return isFinite(f) ? f : -999.0f; };
0530 
0531       const int seed_lbl = m_event->currentSeed(m_SeedOriginIdx[itrack]).label();
0532       Event::SimLabelFromHits slfh = m_event->simLabelForCurrentSeed(m_SeedOriginIdx[itrack]);
0533       const int seed_mcid = (slfh.is_set() && slfh.good_frac() > 0.7f) ? slfh.label : -999999;
0534 #endif
0535 
0536       for (bidx_t qi = qb1; qi != qb2; ++qi) {
0537         for (bidx_t pi = pb1; pi != pb2; pi = L.phiMaskApply(pi + 1)) {
0538           // Limit to central Q-bin
0539           if (qi == qb && L.isBinDead(pi, qi) == true) {
0540             dprint("dead module for track in layer=" << L.layer_id() << " qb=" << qi << " pi=" << pi << " q=" << q
0541                                                      << " phi=" << phi);
0542             m_XWsrResult[itrack].m_in_gap = true;
0543           }
0544 
0545           // MT: The following line is the biggest hog (4% total run time).
0546           // This comes from cache misses, I presume.
0547           // It might make sense to make first loop to extract bin indices
0548           // and issue prefetches at the same time.
0549           // Then enter vectorized loop to actually collect the hits in proper order.
0550 
0551           //SK: ~20x1024 bin sizes give mostly 1 hit per bin. Commented out for 128 bins or less
0552           // #pragma nounroll
0553           auto pbi = L.phiQBinContent(pi, qi);
0554           for (bcnt_t hi = pbi.begin(); hi < pbi.end(); ++hi) {
0555             // MT: Access into m_hit_zs and m_hit_phis is 1% run-time each.
0556 
0557             const unsigned int hi_orig = L.getOriginalHitIndex(hi);
0558 
0559             if (m_iteration_hit_mask && (*m_iteration_hit_mask)[hi_orig]) {
0560               dprintf(
0561                   "Yay, denying masked hit on layer %u, hi %u, orig idx %u\n", L.layer_info().layer_id(), hi, hi_orig);
0562               continue;
0563             }
0564 
0565             if (Config::usePhiQArrays) {
0566               if (m_XHitSize[itrack] >= MPlexHitIdxMax)
0567                 break;
0568 
0569               const float ddq = std::abs(q - L.hit_q(hi));
0570               const float ddphi = cdist(std::abs(phi - L.hit_phi(hi)));
0571 
0572               // clang-format off
0573               dprintf("     SHI %3u %4u %5u  %6.3f %6.3f %6.4f %7.5f   %s\n",
0574                       qi, pi, hi, L.hit_q(hi), L.hit_phi(hi),
0575                       ddq, ddphi, (ddq < dq && ddphi < dphi) ? "PASS" : "FAIL");
0576               // clang-format on
0577 
0578 #if defined(DUMPHITWINDOW) && defined(MKFIT_STANDALONE)
0579               // clang-format off
0580               MPlexQF thisOutChi2;
0581               {
0582                 const MCHitInfo &mchinfo = m_event->simHitsInfo_[L.refHit(hi).mcHitID()];
0583                 int mchid = mchinfo.mcTrackID();
0584                 int st_isfindable = 0;
0585                 int st_label = -999999;
0586                 int st_prodtype = 0;
0587                 int st_nhits = -1;
0588                 int st_charge = 0;
0589                 float st_r = -999.;
0590                 float st_z = -999.;
0591                 float st_pt = -999.;
0592                 float st_eta = -999.;
0593                 float st_phi = -999.;
0594                 if (mchid >= 0) {
0595                   Track simtrack = m_event->simTracks_[mchid];
0596                   st_isfindable = (int)simtrack.isFindable();
0597                   st_label = simtrack.label();
0598                   st_prodtype = (int)simtrack.prodType();
0599                   st_pt = simtrack.pT();
0600                   st_eta = simtrack.momEta();
0601                   st_phi = simtrack.momPhi();
0602                   st_nhits = simtrack.nTotalHits();
0603                   st_charge = simtrack.charge();
0604                   st_r = simtrack.posR();
0605                   st_z = simtrack.z();
0606                 }
0607 
0608                 const Hit &thishit = L.refHit(hi_orig);
0609                 m_msErr.copyIn(itrack, thishit.errArray());
0610                 m_msPar.copyIn(itrack, thishit.posArray());
0611 
0612                 MPlexQI propFail;
0613                 MPlexLV tmpPropPar;
0614                 const FindingFoos &fnd_foos = FindingFoos::get_finding_foos(L.is_barrel());
0615                 (*fnd_foos.m_compute_chi2_foo)(m_Err[iI],
0616                                                m_Par[iI],
0617                                                m_Chg,
0618                                                m_msErr,
0619                                                m_msPar,
0620                                                thisOutChi2,
0621                                                tmpPropPar,
0622                                                propFail,
0623                                                N_proc,
0624                                                m_prop_config->finding_intra_layer_pflags,
0625                                                m_prop_config->finding_requires_propagation_to_hit_pos);
0626 
0627                 float hx = thishit.x();
0628                 float hy = thishit.y();
0629                 float hz = thishit.z();
0630                 float hr = std::hypot(hx, hy);
0631                 float hphi = std::atan2(hy, hx);
0632                 float hex = ngr( std::sqrt(thishit.exx()) );
0633                 float hey = ngr( std::sqrt(thishit.eyy()) );
0634                 float hez = ngr( std::sqrt(thishit.ezz()) );
0635                 float her = ngr( std::sqrt(
0636                     (hx * hx * thishit.exx() + hy * hy * thishit.eyy() + 2.0f * hx * hy * m_msErr.At(itrack, 0, 1)) /
0637                     (hr * hr)) );
0638                 float hephi = ngr( std::sqrt(thishit.ephi()) );
0639                 float hchi2 = ngr( thisOutChi2[itrack] );
0640                 float tx = m_Par[iI].At(itrack, 0, 0);
0641                 float ty = m_Par[iI].At(itrack, 1, 0);
0642                 float tz = m_Par[iI].At(itrack, 2, 0);
0643                 float tr = std::hypot(tx, ty);
0644                 float tphi = std::atan2(ty, tx);
0645                 // float tchi2 = ngr( m_Chi2(itrack, 0, 0) ); // unused
0646                 float tex = ngr( std::sqrt(m_Err[iI].At(itrack, 0, 0)) );
0647                 float tey = ngr( std::sqrt(m_Err[iI].At(itrack, 1, 1)) );
0648                 float tez = ngr( std::sqrt(m_Err[iI].At(itrack, 2, 2)) );
0649                 float ter = ngr( std::sqrt(
0650                     (tx * tx * tex * tex + ty * ty * tey * tey + 2.0f * tx * ty * m_Err[iI].At(itrack, 0, 1)) /
0651                     (tr * tr)) );
0652                 float tephi = ngr( std::sqrt(
0653                     (ty * ty * tex * tex + tx * tx * tey * tey - 2.0f * tx * ty * m_Err[iI].At(itrack, 0, 1)) /
0654                     (tr * tr * tr * tr)) );
0655                 float ht_dxy = std::hypot(hx - tx, hy - ty);
0656                 float ht_dz = hz - tz;
0657                 float ht_dphi = cdist(std::abs(hphi - tphi));
0658 
0659                 static bool first = true;
0660                 if (first) {
0661                   printf(
0662                       "HITWINDOWSEL "
0663                       "evt_id/I:track_algo/I:"
0664                       "lyr_id/I:lyr_isbrl/I:hit_idx/I:"
0665                       "trk_cnt/I:trk_idx/I:trk_label/I:"
0666                       "trk_pt/F:trk_eta/F:trk_mphi/F:trk_chi2/F:"
0667                       "nhits/I:"
0668                       "seed_idx/I:seed_label/I:seed_mcid/I:"
0669                       "hit_mcid/I:"
0670                       "st_isfindable/I:st_prodtype/I:st_label/I:"
0671                       "st_pt/F:st_eta/F:st_phi/F:"
0672                       "st_nhits/I:st_charge/I:st_r/F:st_z/F:"
0673                       "trk_q/F:hit_q/F:dq_trkhit/F:dq_cut/F:trk_phi/F:hit_phi/F:dphi_trkhit/F:dphi_cut/F:"
0674                       "t_x/F:t_y/F:t_r/F:t_phi/F:t_z/F:"
0675                       "t_ex/F:t_ey/F:t_er/F:t_ephi/F:t_ez/F:"
0676                       "h_x/F:h_y/F:h_r/F:h_phi/F:h_z/F:"
0677                       "h_ex/F:h_ey/F:h_er/F:h_ephi/F:h_ez/F:"
0678                       "ht_dxy/F:ht_dz/F:ht_dphi/F:"
0679                       "h_chi2/F"
0680                       "\n");
0681                   first = false;
0682                 }
0683 
0684                 if (!(std::isnan(phi)) && !(std::isnan(getEta(m_Par[iI].At(itrack, 5, 0))))) {
0685                   //|| std::isnan(ter) || std::isnan(her) || std::isnan(m_Chi2(itrack, 0, 0)) || std::isnan(hchi2)))
0686                   printf("HITWINDOWSEL "
0687                          "%d %d"
0688                          "%d %d %d "
0689                          "%d %d %d "
0690                          "%6.3f %6.3f %6.3f %6.3f "
0691                          "%d "
0692                          "%d %d %d "
0693                          "%d "
0694                          "%d %d %d "
0695                          "%6.3f %6.3f %6.3f "
0696                          "%d %d %6.3f %6.3f "
0697                          "%6.3f %6.3f %6.3f %6.3f %6.3f %6.3f %6.3f %6.3f "
0698                          "%6.3f %6.3f %6.3f %6.3f %6.3f "
0699                          "%6.6f %6.6f %6.6f %6.6f %6.6f "
0700                          "%6.3f %6.3f %6.3f %6.3f %6.3f "
0701                          "%6.6f %6.6f %6.6f %6.6f %6.6f "
0702                          "%6.3f %6.3f %6.3f "
0703                          "%6.3f"
0704                          "\n",
0705                          m_event->evtID(), m_iteration_config->m_track_algorithm,
0706                          L.layer_id(), L.is_barrel(), hi_orig,
0707                          itrack, m_CandIdx(itrack, 0, 0), m_Label(itrack, 0, 0),
0708                          1.0f / m_Par[iI].At(itrack, 3, 0), getEta(m_Par[iI].At(itrack, 5, 0)), m_Par[iI].At(itrack, 4, 0), m_Chi2(itrack, 0, 0),
0709                          m_NFoundHits(itrack, 0, 0),
0710                          m_SeedOriginIdx(itrack, 0, 0), seed_lbl, seed_mcid,
0711                          mchid,
0712                          st_isfindable, st_prodtype, st_label,
0713                          st_pt, st_eta, st_phi,
0714                          st_nhits, st_charge, st_r, st_z,
0715                          q, L.hit_q(hi), ddq, dq, phi, L.hit_phi(hi), ddphi, dphi,
0716                          tx, ty, tr, tphi, tz,
0717                          tex, tey, ter, tephi, tez,
0718                          hx, hy, hr, hphi, hz,
0719                          hex, hey, her, hephi, hez,
0720                          ht_dxy, ht_dz, ht_dphi,
0721                          hchi2);
0722                 }
0723               }
0724               // clang-format on
0725 #endif
0726 
0727               if (ddq >= dq)
0728                 continue;
0729               if (ddphi >= dphi)
0730                 continue;
0731 
0732               // MT: Removing extra check gives full efficiency ...
0733               //     and means our error estimations are wrong!
0734               // Avi says we should have *minimal* search windows per layer.
0735               // Also ... if bins are sufficiently small, we do not need the extra
0736               // checks, see above.
0737               m_XHitArr.At(itrack, m_XHitSize[itrack]++, 0) = hi_orig;
0738             } else {
0739               // MT: The following check alone makes more sense with spiral traversal,
0740               // we'd be taking in closest hits first.
0741 
0742               // Hmmh -- there used to be some more checks here.
0743               // Or, at least, the phi binning was much smaller and no further checks were done.
0744               assert(false && "this code has not been used in a while -- see comments in code");
0745 
0746               if (m_XHitSize[itrack] < MPlexHitIdxMax) {
0747                 m_XHitArr.At(itrack, m_XHitSize[itrack]++, 0) = hi_orig;
0748               }
0749             }
0750           }  //hi
0751         }  //pi
0752       }  //qi
0753     }  //itrack
0754   }
0755 
0756   //==============================================================================
0757   // SelectHitIndicesV2
0758   //==============================================================================
0759 
0760   void MkFinder::selectHitIndicesV2(const LayerOfHits &layer_of_hits, const int N_proc) {
0761     // bool debug = true;
0762     using bidx_t = LayerOfHits::bin_index_t;
0763     using bcnt_t = LayerOfHits::bin_content_t;
0764     const LayerOfHits &L = layer_of_hits;
0765     const LayerInfo &LI = L.layer_info();
0766 
0767     const int iI = iP;
0768 
0769     dprintf("LayerOfHits::SelectHitIndicesV2 %s layer=%d N_proc=%d\n",
0770             L.is_barrel() ? "barrel" : "endcap",
0771             L.layer_id(),
0772             N_proc);
0773 
0774 #ifdef RNT_DUMP_MkF_SelHitIdcs
0775     rnt_shi.InnerIdcsReset(N_proc);
0776     Event::SimLabelFromHits sim_lbls[NN];
0777     for (int i = 0; i < N_proc; ++i) {
0778       sim_lbls[i] = m_event->simLabelForCurrentSeed(m_SeedOriginIdx[i]);
0779       if (m_FailFlag[i]) {
0780         rnt_shi.RegisterFailedProp(i, m_Par[1 - iI], m_Par[iI], m_event, m_SeedOriginIdx[i]);
0781       } else if (sim_lbls[i].is_set()) {
0782         /* CandInfo &ci = */ rnt_shi.RegisterGoodProp(i, m_Par[iI], m_event, m_SeedOriginIdx[i]);
0783       }  // else ... could do something about the bad seeds ... probably better to collect elsewhere.
0784     }
0785     // Get BinSearch result from V1. Note -- it can clear m_FailFlag for some cands!
0786     auto ff_stash = m_FailFlag;
0787     selectHitIndices(layer_of_hits, N_proc, true);
0788     m_FailFlag = ff_stash;
0789 #endif
0790 
0791     constexpr int NEW_MAX_HIT = 6;  // 4 - 6 give about the same # of tracks in quality-val
0792     constexpr float DDPHI_PRESEL_FAC = 2.0f;
0793     constexpr float DDQ_PRESEL_FAC = 1.2f;
0794     constexpr float PHI_BIN_EXTRA_FAC = 2.75f;
0795     constexpr float Q_BIN_EXTRA_FAC = 1.6f;
0796 
0797     namespace mp = mini_propagators;
0798     struct Bins {
0799       MPlexQUH q0, q1, q2, p1, p2;
0800       mp::InitialStatePlex isp;
0801       mp::StatePlex sp1, sp2;
0802       int n_proc;
0803 
0804       MPlexQF dphi_track, dq_track;  // 3 sigma track errors at initial state
0805 
0806       // debug & ntuple dump -- to be local in functions
0807       MPlexQF phi_c, dphi;
0808       MPlexQF q_c, qmin, qmax;
0809 
0810       Bins(const MPlexLV &par, const MPlexQI &chg, int np = NN) : isp(par, chg), n_proc(np) {}
0811 
0812       void prop_to_limits(const LayerInfo &li) {
0813         // Positions 1 and 2 should really be by "propagation order", 1 is the closest/
0814         // This should also work for backward propagation so not exactly trivial.
0815         // Also, do not really need propagation to center.
0816         if (li.is_barrel()) {
0817           isp.propagate_to_r(mp::PA_Exact, li.rin(), sp1, true, n_proc);
0818           isp.propagate_to_r(mp::PA_Exact, li.rout(), sp2, true, n_proc);
0819         } else {
0820           isp.propagate_to_z(mp::PA_Exact, li.zmin(), sp1, true, n_proc);
0821           isp.propagate_to_z(mp::PA_Exact, li.zmax(), sp2, true, n_proc);
0822         }
0823       }
0824 
0825       void find_bin_ranges(const LayerInfo &li, const LayerOfHits &loh, const MPlexLS &err) {
0826         // Below made members for debugging
0827         // MPlexQF phi_c, dphi_min, dphi_max;
0828         // phi_c = mp::fast_atan2(isp.y, isp.x);  // calculated below as difference
0829 
0830         // Matriplex::min_max(sp1.dphi, sp2.dphi, dphi_min, dphi_max);
0831         // the above is wrong: dalpha is not dphi --> renamed variable in State
0832         MPlexQF xp1, xp2, pmin, pmax;
0833         xp1 = mp::fast_atan2(sp1.y, sp1.x);
0834         xp2 = mp::fast_atan2(sp2.y, sp2.x);
0835         Matriplex::min_max(xp1, xp2, pmin, pmax);
0836         // Matriplex::min_max(mp::fast_atan2(sp1.y, sp1.x), smp::fast_atan2(sp2.y, sp2.x), pmin, pmax);
0837         MPlexQF dp = pmax - pmin;
0838         phi_c = 0.5f * (pmax + pmin);
0839         for (int ii = 0; ii < NN; ++ii) {
0840           if (ii < n_proc) {
0841             if (dp[ii] > Const::PI) {
0842               std::swap(pmax[ii], pmin[ii]);
0843               dp[ii] = Const::TwoPI - dp[ii];
0844               phi_c[ii] = Const::PI - phi_c[ii];
0845             }
0846             dphi[ii] = 0.5f * dp[ii];
0847             // printf("phic: %f  p1: %f  p2: %f   pmin: %f  pmax: %f   dphi: %f\n",
0848             //       phi_c[ii], xp1[ii], xp2[ii], pmin[ii], pmax[ii], dphi[ii]);
0849           }
0850         }
0851 
0852         const auto calc_err_xy = [&](const MPlexQF &x, const MPlexQF &y) {
0853           return x * x * err.ReduceFixedIJ(0, 0) + y * y * err.ReduceFixedIJ(1, 1) +
0854                  2.0f * x * y * err.ReduceFixedIJ(0, 1);
0855         };
0856 
0857         // Calculate dphi_track, dq_track differs for barrel/endcap
0858         MPlexQF r2_c = isp.x * isp.x + isp.y * isp.y;
0859         MPlexQF r2inv_c = 1.0f / r2_c;
0860         MPlexQF dphidx_c = -isp.y * r2inv_c;
0861         MPlexQF dphidy_c = isp.x * r2inv_c;
0862         dphi_track = 3.0f * calc_err_xy(dphidx_c, dphidy_c).abs().sqrt();
0863 
0864         // MPlexQF qmin, qmax;
0865         if (li.is_barrel()) {
0866           Matriplex::min_max(sp1.z, sp2.z, qmin, qmax);
0867           q_c = isp.z;
0868           dq_track = 3.0f * err.ReduceFixedIJ(2, 2).abs().sqrt();
0869         } else {
0870           Matriplex::min_max(Matriplex::hypot(sp1.x, sp1.y), Matriplex::hypot(sp2.x, sp2.y), qmin, qmax);
0871           q_c = Matriplex::sqrt(r2_c);
0872           dq_track = 3.0f * (r2inv_c * calc_err_xy(isp.x, isp.y).abs()).sqrt();
0873         }
0874 
0875         for (int i = 0; i < p1.kTotSize; ++i) {
0876           // Clamp crazy sizes. This actually only happens when prop-fail flag is set.
0877           // const float dphi_clamp = 0.1;
0878           // if (dphi_min[i] > 0.0f || dphi_min[i] < -dphi_clamp) dphi_min[i] = -dphi_clamp;
0879           // if (dphi_max[i] < 0.0f || dphi_max[i] > dphi_clampf) dphi_max[i] = dphi_clamp;
0880           p1[i] = loh.phiBinChecked(pmin[i] - dphi_track[i] - PHI_BIN_EXTRA_FAC * 0.0123f);
0881           p2[i] = loh.phiBinChecked(pmax[i] + dphi_track[i] + PHI_BIN_EXTRA_FAC * 0.0123f);
0882 
0883           q0[i] = loh.qBinChecked(q_c[i]);
0884           q1[i] = loh.qBinChecked(qmin[i] - dq_track[i] - Q_BIN_EXTRA_FAC * 0.5f * li.q_bin());
0885           q2[i] = loh.qBinChecked(qmax[i] + dq_track[i] + Q_BIN_EXTRA_FAC * 0.5f * li.q_bin()) + 1;
0886         }
0887       }
0888     };
0889 
0890     Bins B(m_Par[iI], m_Chg, N_proc);
0891     B.prop_to_limits(LI);
0892     B.find_bin_ranges(LI, L, m_Err[iI]);
0893 
0894     for (int i = 0; i < NN; ++i) {
0895       if (i < N_proc) {
0896         m_XHitSize[i] = 0;
0897         // Notify failure. Ideally should be detected before selectHitIndices().
0898         if (m_FailFlag[i]) {
0899           m_XWsrResult[i].m_wsr = WSR_Failed;
0900         } else {
0901           if (LI.is_barrel()) {
0902             m_XWsrResult[i] = L.is_within_z_sensitive_region(B.q_c[i], 0.5f * (B.q2[i] - B.q1[i]));
0903           } else {
0904             m_XWsrResult[i] = L.is_within_r_sensitive_region(B.q_c[i], 0.5f * (B.q2[i] - B.q1[i]));
0905           }
0906         }
0907       }
0908     }
0909 
0910     // for (int i = 0; i < N_proc; ++i) {
0911     //   printf("BinCheck %c %+8.6f %+8.6f | %3d %3d - %3d %3d ||  | %2d %2d - %2d %2d\n", LI.is_barrel() ? 'B' : 'E',
0912     //          B.phi[i], B.dphi[i], B.p1[i], B.p2[i], pb1v[i], pb2v[i],
0913     //          B.q[i], B.dq[i], B.q1[i], B.q2[i], qb1v[i], qb2v[i]);
0914     // }
0915 
0916 #ifdef RNT_DUMP_MkF_SelHitIdcs
0917     for (auto i : rnt_shi.f_h_idcs) {
0918       CandInfo &ci = (*rnt_shi.ci)[rnt_shi.f_h_remap[i]];
0919       ci.bsn = BinSearch({B.phi_c[i],
0920                           B.dphi[i],
0921                           B.q_c[i],
0922                           0.5f * (B.q2[i] - B.q1[i]),
0923                           B.p1[i],
0924                           B.p2[i],
0925                           B.q1[i],
0926                           B.q2[i],
0927                           m_XWsrResult[i].m_wsr,
0928                           m_XWsrResult[i].m_in_gap,
0929                           false});
0930       ci.ps_min = statep2propstate(B.sp1, i);
0931       ci.ps_max = statep2propstate(B.sp2, i);
0932     }
0933 #endif
0934 
0935     struct PQE {
0936       float score;
0937       unsigned int hit_index;
0938     };
0939     auto pqe_cmp = [](const PQE &a, const PQE &b) { return a.score < b.score; };
0940     std::priority_queue<PQE, std::vector<PQE>, decltype(pqe_cmp)> pqueue(pqe_cmp);
0941     int pqueue_size = 0;
0942 
0943     // Vectorizing this makes it run slower!
0944     //#pragma omp simd
0945     for (int itrack = 0; itrack < NN; ++itrack) {
0946       if (itrack >= N_proc) {
0947         continue;
0948       }
0949 
0950       if (m_FailFlag[itrack]) {
0951         m_XWsrResult[itrack].m_wsr = WSR_Failed;
0952         continue;
0953       }
0954 
0955       if (m_XWsrResult[itrack].m_wsr == WSR_Outside) {
0956         continue;
0957       }
0958 
0959       // New binning -- known to be too restrictive, so scaled up. Probably esp. in stereo layers.
0960       // Also, could take track covariance dphi / dq extras + known tilt stuff.
0961       const bidx_t qb = B.q0[itrack];
0962       const bidx_t qb1 = B.q1[itrack];
0963       const bidx_t qb2 = B.q2[itrack];
0964       const bidx_t pb1 = B.p1[itrack];
0965       const bidx_t pb2 = B.p2[itrack];
0966 
0967       // clang-format off
0968       dprintf("  %2d/%2d: %6.3f %6.3f %6.6f %7.5f %3u %3u %4u %4u\n",
0969               L.layer_id(), itrack, B.q_c[itrack], B.phi_c[itrack],
0970               B.qmax[itrack] - B.qmin[itrack], B.dphi[itrack],
0971               qb1, qb2, pb1, pb2);
0972 #ifdef RNT_DUMP_MkF_SelHitIdcs
0973       int hit_out_idx = 0;
0974       // phi-sorted position of matched hits
0975       struct pos_match { float dphi, dq; int idx; bool matched; };
0976       std::vector<pos_match> pos_match_vec;
0977 #endif
0978       // clang-format on
0979 
0980       mp::InitialState mp_is(m_Par[iI], m_Chg, itrack);
0981       mp::State mp_s;
0982 
0983       for (bidx_t qi = qb1; qi != qb2; ++qi) {
0984         for (bidx_t pi = pb1; pi != pb2; pi = L.phiMaskApply(pi + 1)) {
0985           // Limit to central Q-bin
0986           if (qi == qb && L.isBinDead(pi, qi) == true) {
0987             dprint("dead module for track in layer=" << L.layer_id() << " qb=" << qi << " pi=" << pi
0988                                                      << " q=" << B.q_c[itrack] << " phi=" << B.phi_c[itrack]);
0989             m_XWsrResult[itrack].m_in_gap = true;
0990           }
0991 
0992           // It might make sense to make first loop to extract bin indices
0993           // and issue prefetches at the same time.
0994           // Then enter vectorized loop to actually collect the hits in proper order.
0995 
0996           //SK: ~20x1024 bin sizes give mostly 1 hit per bin. Commented out for 128 bins or less
0997           // #pragma nounroll
0998           auto pbi = L.phiQBinContent(pi, qi);
0999           for (bcnt_t hi = pbi.begin(); hi < pbi.end(); ++hi) {
1000             // MT: Access into m_hit_zs and m_hit_phis is 1% run-time each.
1001 
1002             const unsigned int hi_orig = L.getOriginalHitIndex(hi);
1003 
1004             if (m_iteration_hit_mask && (*m_iteration_hit_mask)[hi_orig]) {
1005               dprintf(
1006                   "Yay, denying masked hit on layer %u, hi %u, orig idx %u\n", L.layer_info().layer_id(), hi, hi_orig);
1007               continue;
1008             }
1009 
1010             float new_q, new_phi, new_ddphi, new_ddq;
1011             bool prop_fail;
1012 
1013             if (L.is_barrel()) {
1014               const Hit &hit = L.refHit(hi_orig);
1015               unsigned int mid = hit.detIDinLayer();
1016               const ModuleInfo &mi = LI.module_info(mid);
1017 
1018               // Original condition, for phase2
1019               // if (L.layer_id() >= 4 && L.layer_id() <= 9 && std::abs(mp_is.z) > 10.f) {
1020 
1021               // This could work well instead of prop-to-r, too. Limit to 0.05 rad, 2.85 deg.
1022               if (std::abs(mi.zdir(2)) > 0.05f) {
1023                 prop_fail = mp_is.propagate_to_plane(mp::PA_Line, mi, mp_s, true);
1024                 new_q = mp_s.z;
1025                 /*
1026                 // This for calculating ddq on the dector plane, along the "strip" direction.
1027                 // NOTE -- should take full covariance and project it onto ydir.
1028                 SVector3 ydir = mi.calc_ydir();
1029                 new_ddq = (mp_s.x - mi.pos(0)) * ydir(0) +
1030                           (mp_s.y - mi.pos(1)) * ydir(1) +
1031                           (mp_s.z - mi.pos(2)) * ydir(2);
1032                 new_ddq = std::abs(new_ddq);
1033                 */
1034                 new_ddq = std::abs(new_q - L.hit_q(hi));
1035                 // dq from z direction is actually projected, so just take plain dz.
1036 
1037               } else {
1038                 prop_fail = mp_is.propagate_to_r(mp::PA_Exact, L.hit_qbar(hi), mp_s, true);
1039                 new_q = mp_s.z;
1040                 new_ddq = std::abs(new_q - L.hit_q(hi));
1041               }
1042             } else {
1043               prop_fail = mp_is.propagate_to_z(mp::PA_Exact, L.hit_qbar(hi), mp_s, true);
1044               new_q = std::hypot(mp_s.x, mp_s.y);
1045               new_ddq = std::abs(new_q - L.hit_q(hi));
1046             }
1047 
1048             new_phi = vdt::fast_atan2f(mp_s.y, mp_s.x);
1049             new_ddphi = cdist(std::abs(new_phi - L.hit_phi(hi)));
1050             bool dqdphi_presel = new_ddq < B.dq_track[itrack] + DDQ_PRESEL_FAC * L.hit_q_half_length(hi) &&
1051                                  new_ddphi < B.dphi_track[itrack] + DDPHI_PRESEL_FAC * 0.0123f;
1052 
1053             // clang-format off
1054             dprintf("     SHI %3u %4u %5u  %6.3f %6.3f %6.4f %7.5f  PROP-%s  %s\n",
1055                     qi, pi, hi, L.hit_q(hi), L.hit_phi(hi),
1056                     new_ddq, new_ddphi, prop_fail ? "FAIL" : "OK", dqdphi_presel ? "PASS" : "REJECT");
1057 #ifdef RNT_DUMP_MkF_SelHitIdcs
1058             if (rnt_shi.f_h_remap[itrack] >= 0) {
1059               int sim_lbl = sim_lbls[itrack].label;
1060               const Hit &thishit = L.refHit(hi_orig);
1061               m_msErr.copyIn(itrack, thishit.errArray());
1062               m_msPar.copyIn(itrack, thishit.posArray());
1063 
1064               MPlexQF thisOutChi2;
1065               MPlexQI propFail(0);
1066               MPlexLV tmpPropPar;
1067               const FindingFoos &fnd_foos = FindingFoos::get_finding_foos(L.is_barrel());
1068               (*fnd_foos.m_compute_chi2_foo)(
1069                 m_Err[iI], m_Par[iI], m_Chg, m_msErr, m_msPar,
1070                 thisOutChi2, tmpPropPar, propFail, N_proc,
1071                 m_prop_config->finding_intra_layer_pflags,
1072                 m_prop_config->finding_requires_propagation_to_hit_pos);
1073               float hchi2 = thisOutChi2[itrack];
1074 
1075               CandInfo &ci = (*rnt_shi.ci)[rnt_shi.f_h_remap[itrack]];
1076 
1077               const MCHitInfo &mchinfo = m_event->simHitsInfo_[L.refHit(hi_orig).mcHitID()];
1078               int hit_lbl = mchinfo.mcTrackID();
1079               ci.hmi.emplace_back(HitMatchInfo{ HitInfo
1080                 { hit2pos(thishit),
1081                   new_q, L.hit_q_half_length(hi), L.hit_qbar(hi), new_phi,
1082                   hit_lbl },
1083                 state2pos(mp_s), state2mom(mp_s),
1084                 new_ddq, new_ddphi, hchi2, (int) hi_orig,
1085                 (sim_lbl == hit_lbl), dqdphi_presel, !prop_fail,
1086                 false, IdxChi2List()
1087               });
1088               ci.hmi.back().ic2list.reset(); // zero initialize
1089 
1090               bool new_dec = dqdphi_presel && !prop_fail;
1091               ++ci.n_all_hits;
1092               if (sim_lbl == hit_lbl) {
1093                 ++ci.n_hits_match;
1094                 if (new_dec) ++ci.n_hits_pass_match;
1095               }
1096               if (new_dec) ++ci.n_hits_pass;
1097               if (new_dec)
1098                 pos_match_vec.emplace_back(pos_match{ new_ddphi, new_ddq, hit_out_idx++,
1099                                              sim_lbl == hit_lbl });
1100             } // if cand is saved
1101 #endif
1102             // clang-format on
1103 
1104             if (prop_fail || !dqdphi_presel)
1105               continue;
1106             if (pqueue_size < NEW_MAX_HIT) {
1107               pqueue.push({new_ddphi, hi_orig});
1108               ++pqueue_size;
1109             } else if (new_ddphi < pqueue.top().score) {
1110               pqueue.pop();
1111               pqueue.push({new_ddphi, hi_orig});
1112             }
1113           }  //hi
1114         }  //pi
1115       }  //qi
1116 
1117       dprintf(" PQUEUE (%d)", pqueue_size);
1118 #ifdef RNT_DUMP_MkF_SelHitIdcs
1119       // clang-format off
1120       if (sim_lbls[itrack].is_set()) {
1121         // Find ord number of matched hits.
1122         std::sort(pos_match_vec.begin(), pos_match_vec.end(),
1123                   [](auto &a, auto &b){return a.dphi < b.dphi;});
1124         int pmvs = pos_match_vec.size();
1125 
1126         CandInfo &ci = (*rnt_shi.ci)[rnt_shi.f_h_remap[itrack]];
1127         for (int i = 0; i < pmvs; ++i) {
1128           if (pos_match_vec[i].matched) {
1129             ci.ord_first_match = i;
1130             ci.dphi_first_match = pos_match_vec[i].dphi;
1131             ci.dq_first_match = pos_match_vec[i].dq;
1132             break;
1133           }
1134         }
1135       }
1136       // clang-format off
1137 #endif
1138       // Reverse hits so best dphis/scores come first in the hit-index list.
1139       m_XHitSize[itrack] = pqueue_size;
1140       while (pqueue_size) {
1141         --pqueue_size;
1142         m_XHitArr.At(itrack, pqueue_size, 0) = pqueue.top().hit_index;
1143         dprintf("   %d: %f %d", pqueue_size, pqueue.top().score, pqueue.top().hit_index);
1144         pqueue.pop();
1145       }
1146       dprintf("\n");
1147 
1148     }  //itrack
1149   }
1150 
1151   //==============================================================================
1152   // AddBestHit - Best Hit Track Finding
1153   //==============================================================================
1154 
1155   void MkFinder::addBestHit(const LayerOfHits &layer_of_hits, const int N_proc, const FindingFoos &fnd_foos) {
1156     // debug = true;
1157 
1158     MatriplexHitPacker mhp(layer_of_hits.hitArray());
1159 
1160     float minChi2[NN];
1161     int bestHit[NN];
1162     int maxSize = 0;
1163 
1164     // Determine maximum number of hits for tracks in the collection.
1165     for (int it = 0; it < NN; ++it) {
1166       if (it < N_proc) {
1167         if (m_XHitSize[it] > 0) {
1168           maxSize = std::max(maxSize, m_XHitSize[it]);
1169         }
1170       }
1171 
1172       bestHit[it] = -1;
1173       minChi2[it] = getHitSelDynamicChi2Cut(it, iP);
1174     }
1175 
1176     for (int hit_cnt = 0; hit_cnt < maxSize; ++hit_cnt) {
1177       //fixme what if size is zero???
1178 
1179       mhp.reset();
1180 
1181       //#pragma omp simd doesn't vectorize with current compilers
1182       for (int itrack = 0; itrack < NN; ++itrack) {
1183         if (itrack < N_proc && hit_cnt < m_XHitSize[itrack]) {
1184           mhp.addInputAt(itrack, layer_of_hits.refHit(m_XHitArr.At(itrack, hit_cnt, 0)));
1185         }
1186       }
1187 
1188       mhp.pack(m_msErr, m_msPar);
1189 
1190       //now compute the chi2 of track state vs hit
1191       MPlexQF outChi2;
1192       MPlexLV tmpPropPar;
1193       clearFailFlag();
1194       (*fnd_foos.m_compute_chi2_foo)(m_Err[iP],
1195                                      m_Par[iP],
1196                                      m_Chg,
1197                                      m_msErr,
1198                                      m_msPar,
1199                                      outChi2,
1200                                      tmpPropPar,
1201                                      m_FailFlag,
1202                                      N_proc,
1203                                      m_prop_config->finding_intra_layer_pflags,
1204                                      m_prop_config->finding_requires_propagation_to_hit_pos);
1205 
1206       //update best hit in case chi2<minChi2
1207 #pragma omp simd
1208       for (int itrack = 0; itrack < NN; ++itrack) {
1209         if (itrack < N_proc && hit_cnt < m_XHitSize[itrack]) {
1210           const float chi2 = std::abs(outChi2[itrack]);  //fixme negative chi2 sometimes...
1211           dprint("chi2=" << chi2 << " minChi2[itrack]=" << minChi2[itrack]);
1212           if (chi2 < minChi2[itrack]) {
1213             minChi2[itrack] = chi2;
1214             bestHit[itrack] = m_XHitArr.At(itrack, hit_cnt, 0);
1215           }
1216         }
1217       }
1218     }  // end loop over hits
1219 
1220     //#pragma omp simd
1221     for (int itrack = 0; itrack < NN; ++itrack) {
1222       if (itrack >= N_proc) {
1223         continue;
1224       }
1225 
1226       if (m_XWsrResult[itrack].m_wsr == WSR_Outside) {
1227         // Why am I doing this?
1228         m_msErr.setDiagonal3x3(itrack, 666);
1229         m_msPar(itrack, 0, 0) = m_Par[iP](itrack, 0, 0);
1230         m_msPar(itrack, 1, 0) = m_Par[iP](itrack, 1, 0);
1231         m_msPar(itrack, 2, 0) = m_Par[iP](itrack, 2, 0);
1232 
1233         // XXXX If not in gap, should get back the old track params. But they are gone ...
1234         // Would actually have to do it right after SelectHitIndices where updated params are still ok.
1235         // Here they got screwed during hit matching.
1236         // So, I'd store them there (into propagated params) and retrieve them here.
1237         // Or we decide not to care ...
1238 
1239         continue;
1240       }
1241 
1242       //fixme decide what to do in case no hit found
1243       if (bestHit[itrack] >= 0) {
1244         const Hit &hit = layer_of_hits.refHit(bestHit[itrack]);
1245         const float chi2 = minChi2[itrack];
1246 
1247         dprint("ADD BEST HIT FOR TRACK #"
1248                << itrack << std::endl
1249                << "prop x=" << m_Par[iP].constAt(itrack, 0, 0) << " y=" << m_Par[iP].constAt(itrack, 1, 0) << std::endl
1250                << "copy in hit #" << bestHit[itrack] << " x=" << hit.position()[0] << " y=" << hit.position()[1]);
1251 
1252         m_msErr.copyIn(itrack, hit.errArray());
1253         m_msPar.copyIn(itrack, hit.posArray());
1254         m_Chi2(itrack, 0, 0) += chi2;
1255 
1256         add_hit(itrack, bestHit[itrack], layer_of_hits.layer_id());
1257       } else {
1258         int fake_hit_idx = Hit::kHitMissIdx;
1259 
1260         if (m_XWsrResult[itrack].m_wsr == WSR_Edge) {
1261           // YYYYYY Config::store_missed_layers
1262           fake_hit_idx = Hit::kHitEdgeIdx;
1263         } else if (num_all_minus_one_hits(itrack)) {
1264           fake_hit_idx = Hit::kHitStopIdx;
1265         }
1266 
1267         dprint("ADD FAKE HIT FOR TRACK #" << itrack << " withinBounds=" << (fake_hit_idx != Hit::kHitEdgeIdx)
1268                                           << " r=" << std::hypot(m_Par[iP](itrack, 0, 0), m_Par[iP](itrack, 1, 0)));
1269 
1270         m_msErr.setDiagonal3x3(itrack, 666);
1271         m_msPar(itrack, 0, 0) = m_Par[iP](itrack, 0, 0);
1272         m_msPar(itrack, 1, 0) = m_Par[iP](itrack, 1, 0);
1273         m_msPar(itrack, 2, 0) = m_Par[iP](itrack, 2, 0);
1274         // Don't update chi2
1275 
1276         add_hit(itrack, fake_hit_idx, layer_of_hits.layer_id());
1277       }
1278     }
1279 
1280     // Update the track parameters with this hit. (Note that some calculations
1281     // are already done when computing chi2. Not sure it's worth caching them?)
1282 
1283     dprint("update parameters");
1284     clearFailFlag();
1285     (*fnd_foos.m_update_param_foo)(m_Err[iP],
1286                                    m_Par[iP],
1287                                    m_Chg,
1288                                    m_msErr,
1289                                    m_msPar,
1290                                    m_Err[iC],
1291                                    m_Par[iC],
1292                                    m_FailFlag,
1293                                    N_proc,
1294                                    m_prop_config->finding_intra_layer_pflags,
1295                                    m_prop_config->finding_requires_propagation_to_hit_pos);
1296 
1297     dprint("m_Par[iP](0,0,0)=" << m_Par[iP](0, 0, 0) << " m_Par[iC](0,0,0)=" << m_Par[iC](0, 0, 0));
1298   }
1299 
1300   //=======================================================
1301   // isStripQCompatible : check if prop is consistent with the barrel/endcap strip length
1302   //=======================================================
1303   bool isStripQCompatible(
1304       int itrack, bool isBarrel, const MPlexLS &pErr, const MPlexLV &pPar, const MPlexHS &msErr, const MPlexHV &msPar) {
1305     //check module compatibility via long strip side = L/sqrt(12)
1306     if (isBarrel) {  //check z direction only
1307       const float res = std::abs(msPar.constAt(itrack, 2, 0) - pPar.constAt(itrack, 2, 0));
1308       const float hitHL = sqrt(msErr.constAt(itrack, 2, 2) * 3.f);  //half-length
1309       const float qErr = sqrt(pErr.constAt(itrack, 2, 2));
1310       dprint("qCompat " << hitHL << " + " << 3.f * qErr << " vs " << res);
1311       return hitHL + std::max(3.f * qErr, 0.5f) > res;
1312     } else {  //project on xy, assuming the strip Length >> Width
1313       const float res[2]{msPar.constAt(itrack, 0, 0) - pPar.constAt(itrack, 0, 0),
1314                          msPar.constAt(itrack, 1, 0) - pPar.constAt(itrack, 1, 0)};
1315       const float hitT2 = msErr.constAt(itrack, 0, 0) + msErr.constAt(itrack, 1, 1);
1316       const float hitT2inv = 1.f / hitT2;
1317       const float proj[3] = {msErr.constAt(itrack, 0, 0) * hitT2inv,
1318                              msErr.constAt(itrack, 0, 1) * hitT2inv,
1319                              msErr.constAt(itrack, 1, 1) * hitT2inv};
1320       const float qErr =
1321           sqrt(std::abs(pErr.constAt(itrack, 0, 0) * proj[0] + 2.f * pErr.constAt(itrack, 0, 1) * proj[1] +
1322                         pErr.constAt(itrack, 1, 1) * proj[2]));  //take abs to avoid non-pos-def cases
1323       const float resProj =
1324           sqrt(res[0] * proj[0] * res[0] + 2.f * res[1] * proj[1] * res[0] + res[1] * proj[2] * res[1]);
1325       dprint("qCompat " << sqrt(hitT2 * 3.f) << " + " << 3.f * qErr << " vs " << resProj);
1326       return sqrt(hitT2 * 3.f) + std::max(3.f * qErr, 0.5f) > resProj;
1327     }
1328   }
1329 
1330   //=======================================================
1331   // passStripChargePCMfromTrack : apply the slope correction to charge per cm and cut using hit err matrix
1332   //         the raw pcm = charge/L_normal
1333   //         the corrected qCorr = charge/L_path = charge/(L_normal*p/p_zLocal) = pcm*p_zLocal/p
1334   //=======================================================
1335   bool passStripChargePCMfromTrack(
1336       int itrack, bool isBarrel, unsigned int pcm, unsigned int pcmMin, const MPlexLV &pPar, const MPlexHS &msErr) {
1337     //skip the overflow case
1338     if (pcm >= Hit::maxChargePerCM())
1339       return true;
1340 
1341     float qSF;
1342     if (isBarrel) {  //project in x,y, assuming zero-error direction is in this plane
1343       const float hitT2 = msErr.constAt(itrack, 0, 0) + msErr.constAt(itrack, 1, 1);
1344       const float hitT2inv = 1.f / hitT2;
1345       const float proj[3] = {msErr.constAt(itrack, 0, 0) * hitT2inv,
1346                              msErr.constAt(itrack, 0, 1) * hitT2inv,
1347                              msErr.constAt(itrack, 1, 1) * hitT2inv};
1348       const bool detXY_OK =
1349           std::abs(proj[0] * proj[2] - proj[1] * proj[1]) < 0.1f;  //check that zero-direction is close
1350       const float cosP = cos(pPar.constAt(itrack, 4, 0));
1351       const float sinP = sin(pPar.constAt(itrack, 4, 0));
1352       const float sinT = std::abs(sin(pPar.constAt(itrack, 5, 0)));
1353       //qSF = sqrt[(px,py)*(1-proj)*(px,py)]/p = sinT*sqrt[(cosP,sinP)*(1-proj)*(cosP,sinP)].
1354       qSF = detXY_OK ? sinT * std::sqrt(std::abs(1.f + cosP * cosP * proj[0] + sinP * sinP * proj[2] -
1355                                                  2.f * cosP * sinP * proj[1]))
1356                      : 1.f;
1357     } else {  //project on z
1358       // p_zLocal/p = p_z/p = cosT
1359       qSF = std::abs(cos(pPar.constAt(itrack, 5, 0)));
1360     }
1361 
1362     const float qCorr = pcm * qSF;
1363     dprint("pcm " << pcm << " * " << qSF << " = " << qCorr << " vs " << pcmMin);
1364     return qCorr > pcmMin;
1365   }
1366 
1367   //==============================================================================
1368   // FindCandidates - Standard Track Finding
1369   //==============================================================================
1370 
1371   void MkFinder::findCandidates(const LayerOfHits &layer_of_hits,
1372                                 std::vector<std::vector<TrackCand>> &tmp_candidates,
1373                                 const int offset,
1374                                 const int N_proc,
1375                                 const FindingFoos &fnd_foos) {
1376     // bool debug = true;
1377 
1378     MatriplexHitPacker mhp(layer_of_hits.hitArray());
1379 
1380     int maxSize = 0;
1381 
1382     // Determine maximum number of hits for tracks in the collection.
1383     for (int it = 0; it < NN; ++it) {
1384       if (it < N_proc) {
1385         if (m_XHitSize[it] > 0) {
1386           maxSize = std::max(maxSize, m_XHitSize[it]);
1387         }
1388       }
1389     }
1390 
1391     dprintf("FindCandidates max hits to process=%d\n", maxSize);
1392 
1393     int nHitsAdded[NN]{};
1394     bool isTooLargeCluster[NN]{false};
1395 
1396     for (int hit_cnt = 0; hit_cnt < maxSize; ++hit_cnt) {
1397       mhp.reset();
1398 
1399       int charge_pcm[NN];
1400 
1401       //#pragma omp simd doesn't vectorize with current compilers
1402       for (int itrack = 0; itrack < NN; ++itrack) {
1403         if (itrack < N_proc && hit_cnt < m_XHitSize[itrack]) {
1404           const auto &hit = layer_of_hits.refHit(m_XHitArr.At(itrack, hit_cnt, 0));
1405           mhp.addInputAt(itrack, hit);
1406           charge_pcm[itrack] = hit.chargePerCM();
1407         }
1408       }
1409 
1410       mhp.pack(m_msErr, m_msPar);
1411 
1412       //now compute the chi2 of track state vs hit
1413       MPlexQF outChi2;
1414       MPlexLV propPar;
1415       clearFailFlag();
1416 
1417       if /*constexpr*/ (Config::usePropToPlane) {
1418         // Maybe could use 2 matriplex packers ... ModuleInfo has 3 * SVector3 and uint
1419     MPlexHV norm, dir, pnt;
1420     packModuleNormDirPnt(layer_of_hits, hit_cnt, norm, dir, pnt, N_proc);
1421         kalmanPropagateAndComputeChi2Plane(m_Err[iP],
1422                                            m_Par[iP],
1423                                            m_Chg,
1424                                            m_msErr,
1425                                            m_msPar,
1426                                                  norm,
1427                                            dir,
1428                                            pnt,
1429                                            outChi2,
1430                                            propPar,
1431                                            m_FailFlag,
1432                                            N_proc,
1433                                            m_prop_config->finding_intra_layer_pflags,
1434                          m_prop_config->finding_requires_propagation_to_hit_pos);
1435       } else {
1436         (*fnd_foos.m_compute_chi2_foo)(m_Err[iP],
1437                                        m_Par[iP],
1438                                        m_Chg,
1439                                        m_msErr,
1440                                        m_msPar,
1441                                        outChi2,
1442                                        propPar,
1443                                        m_FailFlag,
1444                                        N_proc,
1445                                        m_prop_config->finding_intra_layer_pflags,
1446                                        m_prop_config->finding_requires_propagation_to_hit_pos);
1447       }
1448 
1449       // Now update the track parameters with this hit (note that some
1450       // calculations are already done when computing chi2, to be optimized).
1451       // 1. This is not needed for candidates the hit is not added to, but it's
1452       // vectorized so doing it serially below should take the same time.
1453       // 2. Still it's a waste of time in case the hit is not added to any of the
1454       // candidates, so check beforehand that at least one cand needs update.
1455       bool oneCandPassCut = false;
1456       for (int itrack = 0; itrack < NN; ++itrack) {
1457         if (itrack >= N_proc) {
1458           continue;
1459         }
1460         float max_c2 = getHitSelDynamicChi2Cut(itrack, iP);
1461 
1462         if (hit_cnt < m_XHitSize[itrack]) {
1463           const float chi2 = std::abs(outChi2[itrack]);  //fixme negative chi2 sometimes...
1464           dprint("chi2=" << chi2);
1465           if (chi2 < max_c2) {
1466             bool isCompatible = true;
1467             if (!layer_of_hits.is_pixel()) {
1468               //check module compatibility via long strip side = L/sqrt(12)
1469               isCompatible =
1470                   isStripQCompatible(itrack, layer_of_hits.is_barrel(), m_Err[iP], propPar, m_msErr, m_msPar);
1471 
1472               //rescale strip charge to track parameters and reapply the cut
1473           if (isCompatible && layer_of_hits.layer_info().has_charge()) {
1474                 isCompatible = passStripChargePCMfromTrack(
1475                   itrack, layer_of_hits.is_barrel(), charge_pcm[itrack], Hit::minChargePerCM(), propPar, m_msErr);
1476           }
1477         }
1478             // Select only SiStrip hits with cluster size < maxClusterSize
1479             if (!layer_of_hits.is_pixel()) {
1480               if (layer_of_hits.refHit(m_XHitArr.At(itrack, hit_cnt, 0)).spanRows() >=
1481                   m_iteration_params->maxClusterSize) {
1482                 isTooLargeCluster[itrack] = true;
1483                 isCompatible = false;
1484               }
1485             }
1486 
1487             if (isCompatible) {
1488               oneCandPassCut = true;
1489               break;
1490             }
1491           }
1492         }
1493       }
1494 
1495       if (oneCandPassCut) {
1496         MPlexQI tmpChg = m_Chg;
1497         clearFailFlag();
1498         (*fnd_foos.m_update_param_foo)(m_Err[iP],
1499                                        m_Par[iP],
1500                                        tmpChg,
1501                                        m_msErr,
1502                                        m_msPar,
1503                                        m_Err[iC],
1504                                        m_Par[iC],
1505                                        m_FailFlag,
1506                                        N_proc,
1507                                        m_prop_config->finding_intra_layer_pflags,
1508                                        m_prop_config->finding_requires_propagation_to_hit_pos);
1509 
1510         dprint("update parameters" << std::endl
1511                                    << "propagated track parameters x=" << m_Par[iP].constAt(0, 0, 0)
1512                                    << " y=" << m_Par[iP].constAt(0, 1, 0) << std::endl
1513                                    << "               hit position x=" << m_msPar.constAt(0, 0, 0)
1514                                    << " y=" << m_msPar.constAt(0, 1, 0) << std::endl
1515                                    << "   updated track parameters x=" << m_Par[iC].constAt(0, 0, 0)
1516                                    << " y=" << m_Par[iC].constAt(0, 1, 0));
1517 
1518         //create candidate with hit in case chi2 < max_c2
1519         //fixme: please vectorize me... (not sure it's possible in this case)
1520         for (int itrack = 0; itrack < NN; ++itrack) {
1521           if (itrack < N_proc && hit_cnt < m_XHitSize[itrack]) {
1522             const float max_c2 = getHitSelDynamicChi2Cut(itrack, iP);
1523             const float chi2 = std::abs(outChi2[itrack]);  //fixme negative chi2 sometimes...
1524             dprint("chi2=" << chi2);
1525             if (chi2 < max_c2) {
1526               bool isCompatible = true;
1527               if (!layer_of_hits.is_pixel()) {
1528                 // select only SiStrip hits with cluster size < maxClusterSize
1529                 if (layer_of_hits.refHit(m_XHitArr.At(itrack, hit_cnt, 0)).spanRows() >=
1530                     m_iteration_params->maxClusterSize) {
1531                   // isTooLargeCluster[itrack] = true; -- only in CloneEngine
1532                   isCompatible = false;
1533                 }
1534                 // check module compatibility via long strip side = L/sqrt(12)
1535                 if (isCompatible)
1536                   isCompatible =
1537                     isStripQCompatible(itrack, layer_of_hits.is_barrel(), m_Err[iP], propPar, m_msErr, m_msPar);
1538                 // rescale strip charge to track parameters and reapply the cut
1539                 if (isCompatible && layer_of_hits.layer_info().has_charge()) {
1540                   isCompatible = passStripChargePCMfromTrack(
1541                     itrack, layer_of_hits.is_barrel(), charge_pcm[itrack], Hit::minChargePerCM(), propPar, m_msErr);
1542                 }
1543               }
1544 
1545               if (isCompatible) {
1546                 bool hitExists = false;
1547                 int maxHits = m_NFoundHits(itrack, 0, 0);
1548                 if (layer_of_hits.is_pixel()) {
1549                   for (int i = 0; i <= maxHits; ++i) {
1550                     if (i > 2)
1551                       break;
1552                     if (m_HoTArrs[itrack][i].layer == layer_of_hits.layer_id()) {
1553                       hitExists = true;
1554                       break;
1555                     }
1556                   }
1557                 }
1558                 if (hitExists)
1559                   continue;
1560 
1561                 nHitsAdded[itrack]++;
1562                 dprint("chi2 cut passed, creating new candidate");
1563                 // Create a new candidate and fill the tmp_candidates output vector.
1564                 // QQQ only instantiate if it will pass, be better than N_best
1565 
1566                 const int hit_idx = m_XHitArr.At(itrack, hit_cnt, 0);
1567 
1568                 TrackCand newcand;
1569                 copy_out(newcand, itrack, iC);
1570                 newcand.setCharge(tmpChg(itrack, 0, 0));
1571                 newcand.addHitIdx(hit_idx, layer_of_hits.layer_id(), chi2);
1572                 newcand.setScore(getScoreCand(m_steering_params->m_track_scorer,
1573                                               newcand,
1574                                               true /*penalizeTailMissHits*/,
1575                                               true /*inFindCandidates*/));
1576                 newcand.setOriginIndex(m_CandIdx(itrack, 0, 0));
1577 
1578                 // To apply a fixed cut instead of dynamic cut for overlap: m_iteration_params->chi2CutOverlap
1579                 if (chi2 < max_c2) {
1580                   CombCandidate &ccand = *newcand.combCandidate();
1581                   ccand[m_CandIdx(itrack, 0, 0)].considerHitForOverlap(
1582                       hit_idx, layer_of_hits.refHit(hit_idx).detIDinLayer(), chi2);
1583                 }
1584 
1585                 dprint("updated track parameters x=" << newcand.parameters()[0] << " y=" << newcand.parameters()[1]
1586                                                      << " z=" << newcand.parameters()[2]
1587                                                      << " pt=" << 1. / newcand.parameters()[3]);
1588 
1589                 tmp_candidates[m_SeedIdx(itrack, 0, 0) - offset].emplace_back(newcand);
1590               }
1591             }
1592           }
1593         }
1594       }  //end if (oneCandPassCut)
1595 
1596     }  //end loop over hits
1597 
1598     //now add invalid hit
1599     //fixme: please vectorize me...
1600     for (int itrack = 0; itrack < NN; ++itrack) {
1601       // Cands that miss the layer are stashed away in MkBuilder(), before propagation,
1602       // and then merged back afterwards.
1603       if (itrack >= N_proc || m_XWsrResult[itrack].m_wsr == WSR_Outside) {
1604         continue;
1605       }
1606 
1607       int fake_hit_idx = ((num_all_minus_one_hits(itrack) < m_iteration_params->maxHolesPerCand) &&
1608                           (m_NTailMinusOneHits(itrack, 0, 0) < m_iteration_params->maxConsecHoles))
1609                              ? Hit::kHitMissIdx
1610                              : Hit::kHitStopIdx;
1611 
1612       if (m_XWsrResult[itrack].m_wsr == WSR_Edge) {
1613         // YYYYYY m_iteration_params->store_missed_layers
1614         fake_hit_idx = Hit::kHitEdgeIdx;
1615       }
1616       //now add fake hit for tracks that passsed through inactive modules
1617       else if (m_XWsrResult[itrack].m_in_gap == true && nHitsAdded[itrack] == 0) {
1618         fake_hit_idx = Hit::kHitInGapIdx;
1619       }
1620       //now add fake hit for cases where hit cluster size is larger than maxClusterSize
1621       else if (isTooLargeCluster[itrack] == true && nHitsAdded[itrack] == 0) {
1622         fake_hit_idx = Hit::kHitMaxClusterIdx;
1623       }
1624 
1625       dprint("ADD FAKE HIT FOR TRACK #" << itrack << " withinBounds=" << (fake_hit_idx != Hit::kHitEdgeIdx)
1626                                         << " r=" << std::hypot(m_Par[iP](itrack, 0, 0), m_Par[iP](itrack, 1, 0)));
1627 
1628       // QQQ as above, only create and add if score better
1629       TrackCand newcand;
1630       copy_out(newcand, itrack, iP);
1631       newcand.addHitIdx(fake_hit_idx, layer_of_hits.layer_id(), 0.);
1632       newcand.setScore(getScoreCand(
1633           m_steering_params->m_track_scorer, newcand, true /*penalizeTailMissHits*/, true /*inFindCandidates*/));
1634       // Only relevant when we actually add a hit
1635       // newcand.setOriginIndex(m_CandIdx(itrack, 0, 0));
1636       tmp_candidates[m_SeedIdx(itrack, 0, 0) - offset].emplace_back(newcand);
1637     }
1638   }
1639 
1640   //==============================================================================
1641   // FindCandidatesCloneEngine - Clone Engine Track Finding
1642   //==============================================================================
1643 
1644   void MkFinder::findCandidatesCloneEngine(const LayerOfHits &layer_of_hits,
1645                                            CandCloner &cloner,
1646                                            const int offset,
1647                                            const int N_proc,
1648                                            const FindingFoos &fnd_foos) {
1649     // bool debug = true;
1650 
1651     MatriplexHitPacker mhp(layer_of_hits.hitArray());
1652 
1653     int maxSize = 0;
1654 
1655     // Determine maximum number of hits for tracks in the collection.
1656 #pragma omp simd
1657     for (int it = 0; it < NN; ++it) {
1658       if (it < N_proc) {
1659         if (m_XHitSize[it] > 0) {
1660           maxSize = std::max(maxSize, m_XHitSize[it]);
1661         }
1662       }
1663     }
1664 
1665     dprintf("FindCandidatesCloneEngine max hits to process=%d\n", maxSize);
1666 
1667     int nHitsAdded[NN]{};
1668     bool isTooLargeCluster[NN]{false};
1669 
1670     for (int hit_cnt = 0; hit_cnt < maxSize; ++hit_cnt) {
1671       mhp.reset();
1672 
1673       int charge_pcm[NN];
1674 
1675       //#pragma omp simd doesn't vectorize with current compilers
1676       for (int itrack = 0; itrack < NN; ++itrack) {
1677         if (itrack < N_proc && hit_cnt < m_XHitSize[itrack]) {
1678           const auto &hit = layer_of_hits.refHit(m_XHitArr.At(itrack, hit_cnt, 0));
1679           mhp.addInputAt(itrack, hit);
1680           charge_pcm[itrack] = hit.chargePerCM();
1681         }
1682       }
1683 
1684       mhp.pack(m_msErr, m_msPar);
1685 
1686       //now compute the chi2 of track state vs hit
1687       MPlexQF outChi2;
1688       MPlexLV propPar;
1689       clearFailFlag();
1690 
1691       if /*constexpr*/ (Config::usePropToPlane) {
1692         // Maybe could use 2 matriplex packers ... ModuleInfo has 3 * SVector3 and uint
1693         MPlexHV norm, dir, pnt;
1694         packModuleNormDirPnt(layer_of_hits, hit_cnt, norm, dir, pnt, N_proc);
1695         kalmanPropagateAndComputeChi2Plane(m_Err[iC],
1696                                      m_Par[iC],
1697                                      m_Chg,
1698                                      m_msErr,
1699                                      m_msPar,
1700                                      norm, dir, pnt,
1701                                      outChi2,
1702                                      propPar,
1703                                      m_FailFlag,
1704                                      N_proc,
1705                                      m_prop_config->finding_intra_layer_pflags,
1706                                      m_prop_config->finding_requires_propagation_to_hit_pos);
1707       } else {
1708         (*fnd_foos.m_compute_chi2_foo)(m_Err[iP],
1709                                        m_Par[iP],
1710                                        m_Chg,
1711                                        m_msErr,
1712                                        m_msPar,
1713                                        outChi2,
1714                                        propPar,
1715                                        m_FailFlag,
1716                                        N_proc,
1717                                        m_prop_config->finding_intra_layer_pflags,
1718                                        m_prop_config->finding_requires_propagation_to_hit_pos);
1719       }
1720 
1721       //#pragma omp simd  // DOES NOT VECTORIZE AS IT IS NOW
1722       for (int itrack = 0; itrack < NN; ++itrack) {
1723         // We can be in failed state from the initial propagation before selectHitIndices
1724         // and there hit_count for track is set to -1 and WSR state to Failed, handled below.
1725         // Or we might have hit it here in propagate-to-hit.
1726         // PROP-FAIL-ENABLE FailFlag check to be enabled when propagation failure
1727         // detection is properly implemented in propagate-to-R/Z.
1728         if (/*!m_FailFlag[itrack] &&*/ itrack < N_proc && hit_cnt < m_XHitSize[itrack]) {
1729           // make sure the hit was in the compatiblity window for the candidate
1730           const float max_c2 = getHitSelDynamicChi2Cut(itrack, iP);
1731           const float chi2 = std::abs(outChi2[itrack]);  //fixme negative chi2 sometimes...
1732           // XXX-NUM-ERR assert(chi2 >= 0);
1733 
1734           dprintf("  chi2=%.3f (%.3f)  trkIdx=%d hitIdx=%d\n", chi2, max_c2, itrack,  m_XHitArr.At(itrack, hit_cnt, 0));
1735           if (chi2 < max_c2) {
1736             bool isCompatible = true;
1737             if (!layer_of_hits.is_pixel()) {
1738               // select only SiStrip hits with cluster size < maxClusterSize
1739               if (layer_of_hits.refHit(m_XHitArr.At(itrack, hit_cnt, 0)).spanRows() >=
1740                   m_iteration_params->maxClusterSize) {
1741                 isTooLargeCluster[itrack] = true;
1742                 isCompatible = false;
1743               }
1744               // check module compatibility via long strip side = L/sqrt(12)
1745               if (isCompatible)
1746                 isCompatible =
1747                   isStripQCompatible(itrack, layer_of_hits.is_barrel(), m_Err[iP], propPar, m_msErr, m_msPar);
1748               // rescale strip charge to track parameters and reapply the cut
1749               if (isCompatible && layer_of_hits.layer_info().has_charge()) {
1750                 isCompatible = passStripChargePCMfromTrack(
1751                   itrack, layer_of_hits.is_barrel(), charge_pcm[itrack], Hit::minChargePerCM(), propPar, m_msErr);
1752               }
1753             }
1754 
1755             if (isCompatible) {
1756               CombCandidate &ccand = cloner.combCandWithOriginalIndex(m_SeedIdx(itrack, 0, 0));
1757               bool hitExists = false;
1758               int maxHits = m_NFoundHits(itrack, 0, 0);
1759               if (layer_of_hits.is_pixel()) {
1760                 for (int i = 0; i <= maxHits; ++i) {
1761                   if (i > 2)
1762                     break;
1763                   if (ccand.hot(i).layer == layer_of_hits.layer_id()) {
1764                     hitExists = true;
1765                     break;
1766                   }
1767                 }
1768               }
1769               if (hitExists)
1770                 continue;
1771 
1772               nHitsAdded[itrack]++;
1773               const int hit_idx = m_XHitArr.At(itrack, hit_cnt, 0);
1774 
1775               // Register hit for overlap consideration, if chi2 cut is passed
1776               // To apply a fixed cut instead of dynamic cut for overlap: m_iteration_params->chi2CutOverlap
1777               if (chi2 < max_c2) {
1778                 ccand[m_CandIdx(itrack, 0, 0)].considerHitForOverlap(
1779                     hit_idx, layer_of_hits.refHit(hit_idx).detIDinLayer(), chi2);
1780               }
1781 
1782               IdxChi2List tmpList;
1783               tmpList.trkIdx = m_CandIdx(itrack, 0, 0);
1784               tmpList.hitIdx = hit_idx;
1785               tmpList.module = layer_of_hits.refHit(hit_idx).detIDinLayer();
1786               tmpList.nhits = m_NFoundHits(itrack, 0, 0) + 1;
1787               tmpList.ntailholes = 0;
1788               tmpList.noverlaps = m_NOverlapHits(itrack, 0, 0);
1789               tmpList.nholes = num_all_minus_one_hits(itrack);
1790               tmpList.pt = std::abs(1.0f / m_Par[iP].At(itrack, 3, 0));
1791               tmpList.chi2 = m_Chi2(itrack, 0, 0) + chi2;
1792               tmpList.chi2_hit = chi2;
1793               tmpList.score = getScoreStruct(m_steering_params->m_track_scorer, tmpList);
1794               cloner.add_cand(m_SeedIdx(itrack, 0, 0) - offset, tmpList);
1795 
1796               dprint("  adding hit with hit_cnt=" << hit_cnt << " for trkIdx=" << tmpList.trkIdx
1797                                                   << " orig Seed=" << m_Label(itrack, 0, 0));
1798 
1799 #ifdef RNT_DUMP_MkF_SelHitIdcs
1800               if (rnt_shi.f_h_remap[itrack] >= 0) {
1801                 CandInfo &ci = (*rnt_shi.ci)[rnt_shi.f_h_remap[itrack]];
1802                 ci.assignIdxChi2List(tmpList);
1803               }
1804 #endif
1805             }
1806           }
1807         }
1808       }
1809 
1810     }  //end loop over hits
1811 
1812     //now add invalid hit
1813     for (int itrack = 0; itrack < NN; ++itrack) {
1814       dprint("num_all_minus_one_hits(" << itrack << ")=" << num_all_minus_one_hits(itrack));
1815 
1816       // Cands that miss the layer are stashed away in MkBuilder(), before propagation,
1817       // and then merged back afterwards.
1818       if (itrack >= N_proc || m_XWsrResult[itrack].m_wsr == WSR_Outside) {
1819         continue;
1820       }
1821 
1822       // int fake_hit_idx = num_all_minus_one_hits(itrack) < m_iteration_params->maxHolesPerCand ? -1 : -2;
1823       int fake_hit_idx = ((num_all_minus_one_hits(itrack) < m_iteration_params->maxHolesPerCand) &&
1824                           (m_NTailMinusOneHits(itrack, 0, 0) < m_iteration_params->maxConsecHoles))
1825                              ? Hit::kHitMissIdx
1826                              : Hit::kHitStopIdx;
1827 
1828       if (m_XWsrResult[itrack].m_wsr == WSR_Edge) {
1829         fake_hit_idx = Hit::kHitEdgeIdx;
1830       }
1831       //now add fake hit for tracks that passsed through inactive modules
1832       else if (m_XWsrResult[itrack].m_in_gap == true && nHitsAdded[itrack] == 0) {
1833         fake_hit_idx = Hit::kHitInGapIdx;
1834       }
1835       //now add fake hit for cases where hit cluster size is larger than maxClusterSize
1836       else if (isTooLargeCluster[itrack] == true && nHitsAdded[itrack] == 0) {
1837         fake_hit_idx = Hit::kHitMaxClusterIdx;
1838       }
1839 
1840       // PROP-FAIL-ENABLE The following to be enabled when propagation failure
1841       // detection is properly implemented in propagate-to-R/Z.
1842       // // Override for failed propagation, this trumps all other cases.
1843       // if (m_XWsrResult[itrack].m_wsr == WSR_Failed) {
1844       //   fake_hit_idx = Hit::kHitStopIdx;
1845       // }
1846 
1847       IdxChi2List tmpList;
1848       tmpList.trkIdx = m_CandIdx(itrack, 0, 0);
1849       tmpList.hitIdx = fake_hit_idx;
1850       tmpList.module = -1;
1851       tmpList.nhits = m_NFoundHits(itrack, 0, 0);
1852       tmpList.ntailholes = (fake_hit_idx == Hit::kHitMissIdx ? m_NTailMinusOneHits(itrack, 0, 0) + 1
1853                                                              : m_NTailMinusOneHits(itrack, 0, 0));
1854       tmpList.noverlaps = m_NOverlapHits(itrack, 0, 0);
1855       tmpList.nholes = num_inside_minus_one_hits(itrack);
1856       tmpList.pt = std::abs(1.0f / m_Par[iP].At(itrack, 3, 0));
1857       tmpList.chi2 = m_Chi2(itrack, 0, 0);
1858       tmpList.chi2_hit = 0;
1859       tmpList.score = getScoreStruct(m_steering_params->m_track_scorer, tmpList);
1860       cloner.add_cand(m_SeedIdx(itrack, 0, 0) - offset, tmpList);
1861       dprint("adding invalid hit " << fake_hit_idx);
1862     }
1863   }
1864 
1865   //==============================================================================
1866   // UpdateWithLoadedHit
1867   //==============================================================================
1868 
1869   void MkFinder::updateWithLoadedHit(int N_proc, const LayerOfHits &layer_of_hits, const FindingFoos &fnd_foos) {
1870     // See comment in MkBuilder::find_tracks_in_layer() about intra / inter flags used here
1871     // for propagation to the hit.
1872     clearFailFlag();
1873     if /*constexpr*/ (Config::usePropToPlane) {
1874       MPlexHV norm, dir, pnt;
1875       packModuleNormDirPnt(layer_of_hits, 0, norm, dir, pnt, N_proc);
1876       kalmanPropagateAndUpdatePlane(m_Err[iP],
1877                                    m_Par[iP],
1878                                    m_Chg,
1879                                    m_msErr,
1880                                    m_msPar,
1881                                    norm, dir, pnt,
1882                                    m_Err[iC],
1883                                    m_Par[iC],
1884                                    m_FailFlag,
1885                                    N_proc,
1886                                    m_prop_config->finding_inter_layer_pflags,
1887                                    m_prop_config->finding_requires_propagation_to_hit_pos);
1888     } else {
1889       (*fnd_foos.m_update_param_foo)(m_Err[iP],
1890                                      m_Par[iP],
1891                                      m_Chg,
1892                                      m_msErr,
1893                                      m_msPar,
1894                                      m_Err[iC],
1895                                      m_Par[iC],
1896                                      m_FailFlag,
1897                                      N_proc,
1898                                      m_prop_config->finding_inter_layer_pflags,
1899                                      m_prop_config->finding_requires_propagation_to_hit_pos);
1900     }
1901 
1902     // PROP-FAIL-ENABLE The following to be enabled when propagation failure
1903     // detection is properly implemented in propagate-to-R/Z.
1904     // for (int i = 0; i < N_proc; ++i) {
1905     //   if (m_FailFlag[i]) {
1906     //     dprintf("MkFinder::updateWithLoadedHit fail in update, recovering.\n");
1907     //     m_Err[iC].copySlot(i, m_Err[iP]);
1908     //     m_Par[iC].copySlot(i, m_Par[iP]);
1909     //   }
1910     // }
1911   }
1912 
1913   void MkFinder::chi2OfLoadedHit(int N_proc, const FindingFoos &fnd_foos) {
1914     // We expect input in iC slots from above function.
1915     // See comment in MkBuilder::find_tracks_in_layer() about intra / inter flags used here
1916     // for propagation to the hit.
1917     clearFailFlag();
1918     (*fnd_foos.m_compute_chi2_foo)(m_Err[iC],
1919                                    m_Par[iC],
1920                                    m_Chg,
1921                                    m_msErr,
1922                                    m_msPar,
1923                                    m_Chi2,
1924                                    m_Par[iP],
1925                                    m_FailFlag,
1926                                    N_proc,
1927                                    m_prop_config->finding_inter_layer_pflags,
1928                                    m_prop_config->finding_requires_propagation_to_hit_pos);
1929 
1930     // PROP-FAIL-ENABLE .... removed here
1931   }
1932 
1933   //==============================================================================
1934   // CopyOutParErr
1935   //==============================================================================
1936 
1937   void MkFinder::copyOutParErr(std::vector<CombCandidate> &seed_cand_vec, int N_proc, bool outputProp) const {
1938     const int iO = outputProp ? iP : iC;
1939 
1940     for (int i = 0; i < NN; ++i) {
1941       if (i < N_proc) {
1942         TrackCand &cand = seed_cand_vec[m_SeedIdx(i, 0, 0)][m_CandIdx(i, 0, 0)];
1943 
1944         // Set the track state to the updated parameters
1945         m_Err[iO].copyOut(i, cand.errors_nc().Array());
1946         m_Par[iO].copyOut(i, cand.parameters_nc().Array());
1947         cand.setCharge(m_Chg(i, 0, 0));
1948 
1949         dprint((outputProp ? "propagated" : "updated")
1950                << " track parameters x=" << cand.parameters()[0] << " y=" << cand.parameters()[1]
1951                << " z=" << cand.parameters()[2] << " pt=" << 1. / cand.parameters()[3] << " posEta=" << cand.posEta());
1952       }
1953     }
1954   }
1955 
1956   //==============================================================================
1957   // Backward Fit hack
1958   //==============================================================================
1959 
1960   void MkFinder::bkFitInputTracks(TrackVec &cands, int beg, int end) {
1961     // Uses HitOnTrack vector from Track directly + a local cursor array to current hit.
1962 
1963     MatriplexTrackPacker mtp(&cands[beg]);
1964 
1965     int itrack = 0;
1966 
1967     for (int i = beg; i < end; ++i, ++itrack) {
1968       const Track &trk = cands[i];
1969 
1970       m_Chg(itrack, 0, 0) = trk.charge();
1971       m_CurHit[itrack] = trk.nTotalHits() - 1;
1972       m_HoTArr[itrack] = trk.getHitsOnTrackArray();
1973 
1974       mtp.addInput(trk);
1975     }
1976 
1977     m_Chi2.setVal(0);
1978 
1979     mtp.pack(m_Err[iC], m_Par[iC]);
1980 
1981     m_Err[iC].scale(100.0f);
1982   }
1983 
1984   void MkFinder::bkFitInputTracks(EventOfCombCandidates &eocss, int beg, int end) {
1985     // Could as well use HotArrays from tracks directly + a local cursor array to last hit.
1986 
1987     // XXXX - shall we assume only TrackCand-zero is needed and that we can freely
1988     // bork the HoTNode array?
1989 
1990     MatriplexTrackPacker mtp(&eocss[beg][0]);
1991 
1992     int itrack = 0;
1993 
1994     for (int i = beg; i < end; ++i, ++itrack) {
1995       const TrackCand &trk = eocss[i][0];
1996 
1997       m_Chg(itrack, 0, 0) = trk.charge();
1998       m_CurNode[itrack] = trk.lastCcIndex();
1999       m_HoTNodeArr[itrack] = trk.combCandidate()->hotsData();
2000 
2001       // XXXX Need TrackCand* to update num-hits. Unless I collect info elsewhere
2002       // and fix it in BkFitOutputTracks.
2003       m_TrkCand[itrack] = &eocss[i][0];
2004 
2005       mtp.addInput(trk);
2006     }
2007 
2008     m_Chi2.setVal(0);
2009 
2010     mtp.pack(m_Err[iC], m_Par[iC]);
2011 
2012     m_Err[iC].scale(100.0f);
2013   }
2014 
2015   //------------------------------------------------------------------------------
2016 
2017   void MkFinder::bkFitOutputTracks(TrackVec &cands, int beg, int end, bool outputProp) {
2018     // Only copy out track params / errors / chi2, all the rest is ok.
2019 
2020     const int iO = outputProp ? iP : iC;
2021 
2022     int itrack = 0;
2023     for (int i = beg; i < end; ++i, ++itrack) {
2024       Track &trk = cands[i];
2025 
2026       m_Err[iO].copyOut(itrack, trk.errors_nc().Array());
2027       m_Par[iO].copyOut(itrack, trk.parameters_nc().Array());
2028 
2029       trk.setChi2(m_Chi2(itrack, 0, 0));
2030       if (isFinite(trk.chi2())) {
2031         trk.setScore(getScoreCand(m_steering_params->m_track_scorer, trk));
2032       }
2033     }
2034   }
2035 
2036   void MkFinder::bkFitOutputTracks(EventOfCombCandidates &eocss, int beg, int end, bool outputProp) {
2037     // Only copy out track params / errors / chi2, all the rest is ok.
2038 
2039     // XXXX - where will rejected hits get removed?
2040 
2041     const int iO = outputProp ? iP : iC;
2042 
2043     int itrack = 0;
2044     for (int i = beg; i < end; ++i, ++itrack) {
2045       TrackCand &trk = eocss[i][0];
2046 
2047       m_Err[iO].copyOut(itrack, trk.errors_nc().Array());
2048       m_Par[iO].copyOut(itrack, trk.parameters_nc().Array());
2049 
2050       trk.setChi2(m_Chi2(itrack, 0, 0));
2051       if (isFinite(trk.chi2())) {
2052         trk.setScore(getScoreCand(m_steering_params->m_track_scorer, trk));
2053       }
2054     }
2055   }
2056 
2057   //------------------------------------------------------------------------------
2058 
2059 #if defined(DEBUG_BACKWARD_FIT) || defined(DEBUG_BACKWARD_FIT_BH)
2060   namespace {
2061     float e2s(float x) { return 1e4 * std::sqrt(x); }
2062   }  // namespace
2063 #endif
2064 
2065   void MkFinder::bkFitFitTracksBH(const EventOfHits &eventofhits,
2066                                   const SteeringParams &st_par,
2067                                   const int N_proc,
2068                                   bool chiDebug) {
2069     // Prototyping final backward fit.
2070     // This works with track-finding indices, before remapping.
2071     //
2072     // Layers should be collected during track finding and list all layers that have actual hits.
2073     // Then we could avoid checking which layers actually do have hits.
2074 
2075     MPlexQF tmp_chi2;
2076     float tmp_err[6] = {666, 0, 666, 0, 0, 666};
2077     float tmp_pos[3];
2078 
2079     for (auto lp_iter = st_par.m_layer_plan.rbegin(); lp_iter != st_par.m_layer_plan.rend(); ++lp_iter) {
2080       const int layer = lp_iter->m_layer;
2081 
2082       const LayerOfHits &L = eventofhits[layer];
2083       const LayerInfo &LI = L.layer_info();
2084 
2085       int count = 0;
2086       for (int i = 0; i < N_proc; ++i) {
2087         while (m_CurHit[i] >= 0 && m_HoTArr[i][m_CurHit[i]].index < 0)
2088           --m_CurHit[i];
2089 
2090         if (m_CurHit[i] >= 0 && m_HoTArr[i][m_CurHit[i]].layer == layer) {
2091           // Skip the overlap hits -- if they exist.
2092           // 1. Overlap hit gets placed *after* the original hit in TrackCand::exportTrack()
2093           // which is *before* in the reverse iteration that we are doing here.
2094           // 2. Seed-hit merging can result in more than two hits per layer.
2095           while (m_CurHit[i] > 0 && m_HoTArr[i][m_CurHit[i] - 1].layer == layer)
2096             --m_CurHit[i];
2097 
2098           const Hit &hit = L.refHit(m_HoTArr[i][m_CurHit[i]].index);
2099           m_msErr.copyIn(i, hit.errArray());
2100           m_msPar.copyIn(i, hit.posArray());
2101           ++count;
2102           --m_CurHit[i];
2103         } else {
2104           tmp_pos[0] = m_Par[iC](i, 0, 0);
2105           tmp_pos[1] = m_Par[iC](i, 1, 0);
2106           tmp_pos[2] = m_Par[iC](i, 2, 0);
2107           m_msErr.copyIn(i, tmp_err);
2108           m_msPar.copyIn(i, tmp_pos);
2109         }
2110       }
2111 
2112       if (count == 0)
2113         continue;
2114 
2115       // ZZZ Could add missing hits here, only if there are any actual matches.
2116 
2117       if (LI.is_barrel()) {
2118         propagateTracksToHitR(m_msPar, N_proc, m_prop_config->backward_fit_pflags);
2119 
2120         kalmanOperation(KFO_Calculate_Chi2 | KFO_Update_Params | KFO_Local_Cov,
2121                         m_Err[iP],
2122                         m_Par[iP],
2123                         m_msErr,
2124                         m_msPar,
2125                         m_Err[iC],
2126                         m_Par[iC],
2127                         tmp_chi2,
2128                         N_proc);
2129       } else {
2130         propagateTracksToHitZ(m_msPar, N_proc, m_prop_config->backward_fit_pflags);
2131 
2132         kalmanOperationEndcap(KFO_Calculate_Chi2 | KFO_Update_Params,
2133                               m_Err[iP],
2134                               m_Par[iP],
2135                               m_msErr,
2136                               m_msPar,
2137                               m_Err[iC],
2138                               m_Par[iC],
2139                               tmp_chi2,
2140                               N_proc);
2141       }
2142 
2143       //fixup invpt sign and charge
2144       for (int n = 0; n < NN; ++n) {
2145         if (n < N_proc && m_Par[iC].At(n, 3, 0) < 0) {
2146           m_Chg.At(n, 0, 0) = -m_Chg.At(n, 0, 0);
2147           m_Par[iC].At(n, 3, 0) = -m_Par[iC].At(n, 3, 0);
2148         }
2149       }
2150 
2151 #ifdef DEBUG_BACKWARD_FIT_BH
2152       // Dump per hit chi2
2153       for (int i = 0; i < N_proc; ++i) {
2154         float r_h = std::hypot(m_msPar.At(i, 0, 0), m_msPar.At(i, 1, 0));
2155         float r_t = std::hypot(m_Par[iC].At(i, 0, 0), m_Par[iC].At(i, 1, 0));
2156 
2157         // if ((std::isnan(tmp_chi2[i]) || std::isnan(r_t)))
2158         // if ( ! std::isnan(tmp_chi2[i]) && tmp_chi2[i] > 0) // && tmp_chi2[i] > 30)
2159         if (chiDebug) {
2160           int ti = iP;
2161           printf(
2162               "CHIHIT %3d %10g %10g %10g %10g %10g %11.5g %11.5g %11.5g %10g %10g %10g %10g %11.5g %11.5g %11.5g %10g "
2163               "%10g %10g %10g %10g %11.5g %11.5g\n",
2164               layer,
2165               tmp_chi2[i],
2166               m_msPar.At(i, 0, 0),
2167               m_msPar.At(i, 1, 0),
2168               m_msPar.At(i, 2, 0),
2169               r_h,  // x_h y_h z_h r_h -- hit pos
2170               e2s(m_msErr.At(i, 0, 0)),
2171               e2s(m_msErr.At(i, 1, 1)),
2172               e2s(m_msErr.At(i, 2, 2)),  // ex_h ey_h ez_h -- hit errors
2173               m_Par[ti].At(i, 0, 0),
2174               m_Par[ti].At(i, 1, 0),
2175               m_Par[ti].At(i, 2, 0),
2176               r_t,  // x_t y_t z_t r_t -- track pos
2177               e2s(m_Err[ti].At(i, 0, 0)),
2178               e2s(m_Err[ti].At(i, 1, 1)),
2179               e2s(m_Err[ti].At(i, 2, 2)),  // ex_t ey_t ez_t -- track errors
2180               1.0f / m_Par[ti].At(i, 3, 0),
2181               m_Par[ti].At(i, 4, 0),
2182               m_Par[ti].At(i, 5, 0),                                     // pt, phi, theta
2183               std::atan2(m_msPar.At(i, 1, 0), m_msPar.At(i, 0, 0)),      // phi_h
2184               std::atan2(m_Par[ti].At(i, 1, 0), m_Par[ti].At(i, 0, 0)),  // phi_t
2185               1e4f * std::hypot(m_msPar.At(i, 0, 0) - m_Par[ti].At(i, 0, 0),
2186                                 m_msPar.At(i, 1, 0) - m_Par[ti].At(i, 1, 0)),  // d_xy
2187               1e4f * (m_msPar.At(i, 2, 0) - m_Par[ti].At(i, 2, 0))             // d_z
2188               // e2s((m_msErr.At(i,0,0) + m_msErr.At(i,1,1)) / (r_h * r_h)),     // ephi_h
2189               // e2s((m_Err[ti].At(i,0,0) + m_Err[ti].At(i,1,1)) / (r_t * r_t))  // ephi_t
2190           );
2191         }
2192       }
2193 #endif
2194 
2195       // update chi2
2196       m_Chi2.add(tmp_chi2);
2197     }
2198   }
2199 
2200   //------------------------------------------------------------------------------
2201 
2202   void MkFinder::print_par_err(int corp, int mslot) const {
2203 #ifdef DEBUG
2204     printf("Parameters:\n");
2205     for (int i = 0; i < 6; ++i) {
2206       printf("  %12.4g", m_Par[corp].constAt(mslot, i, 0));
2207     }
2208     printf("\nError matrix\n");
2209     for (int i = 0; i < 6; ++i) {
2210       for (int j = 0; j < 6; ++j) {
2211         printf("  %12.4g", m_Err[corp].constAt(mslot, i, j));
2212       }
2213       printf("\n");
2214     }
2215 #endif
2216   }
2217 
2218   void MkFinder::bkFitFitTracks(const EventOfHits &eventofhits,
2219                                 const SteeringParams &st_par,
2220                                 const int N_proc,
2221                                 bool chiDebug) {
2222     // Prototyping final backward fit.
2223     // This works with track-finding indices, before remapping.
2224     //
2225     // Layers should be collected during track finding and list all layers that have actual hits.
2226     // Then we could avoid checking which layers actually do have hits.
2227 
2228     // bool debug = true;
2229 
2230     MPlexQF tmp_chi2;
2231     MPlexQI no_mat_effs;
2232     float tmp_err[6] = {666, 0, 666, 0, 0, 666};
2233     float tmp_pos[3];
2234 
2235 #if defined(DEBUG_PROP_UPDATE)
2236     const int DSLOT = 0;
2237     printf("bkfit entry, track in slot %d\n", DSLOT);
2238     print_par_err(iC, DSLOT);
2239 #endif
2240 
2241     for (auto lp_iter = st_par.make_iterator(SteeringParams::IT_BkwFit); lp_iter.is_valid(); ++lp_iter) {
2242       const int layer = lp_iter.layer();
2243 
2244       const LayerOfHits &L = eventofhits[layer];
2245       const LayerInfo &LI = L.layer_info();
2246 
2247 #if defined(DEBUG_BACKWARD_FIT)
2248       const Hit *last_hit_ptr[NN];
2249 #endif
2250 
2251       no_mat_effs.setVal(0);
2252       int done_count = 0;
2253       int here_count = 0;
2254       for (int i = 0; i < N_proc; ++i) {
2255         while (m_CurNode[i] >= 0 && m_HoTNodeArr[i][m_CurNode[i]].m_hot.index < 0) {
2256           m_CurNode[i] = m_HoTNodeArr[i][m_CurNode[i]].m_prev_idx;
2257         }
2258 
2259         if (m_CurNode[i] < 0)
2260           ++done_count;
2261 
2262         if (m_CurNode[i] >= 0 && m_HoTNodeArr[i][m_CurNode[i]].m_hot.layer == layer) {
2263           // Skip the overlap hits -- if they exist.
2264           // 1. Overlap hit gets placed *after* the original hit in TrackCand::exportTrack()
2265           // which is *before* in the reverse iteration that we are doing here.
2266           // 2. Seed-hit merging can result in more than two hits per layer.
2267           // while (m_CurHit[i] > 0 && m_HoTArr[ i ][ m_CurHit[i] - 1 ].layer == layer) --m_CurHit[i];
2268           while (m_HoTNodeArr[i][m_CurNode[i]].m_prev_idx >= 0 &&
2269                  m_HoTNodeArr[i][m_HoTNodeArr[i][m_CurNode[i]].m_prev_idx].m_hot.layer == layer)
2270             m_CurNode[i] = m_HoTNodeArr[i][m_CurNode[i]].m_prev_idx;
2271 
2272           const Hit &hit = L.refHit(m_HoTNodeArr[i][m_CurNode[i]].m_hot.index);
2273 
2274 #ifdef DEBUG_BACKWARD_FIT
2275           last_hit_ptr[i] = &hit;
2276 #endif
2277           m_msErr.copyIn(i, hit.errArray());
2278           m_msPar.copyIn(i, hit.posArray());
2279           ++here_count;
2280 
2281           m_CurNode[i] = m_HoTNodeArr[i][m_CurNode[i]].m_prev_idx;
2282         } else {
2283 #ifdef DEBUG_BACKWARD_FIT
2284           last_hit_ptr[i] = nullptr;
2285 #endif
2286           no_mat_effs[i] = 1;
2287           tmp_pos[0] = m_Par[iC](i, 0, 0);
2288           tmp_pos[1] = m_Par[iC](i, 1, 0);
2289           tmp_pos[2] = m_Par[iC](i, 2, 0);
2290           m_msErr.copyIn(i, tmp_err);
2291           m_msPar.copyIn(i, tmp_pos);
2292         }
2293       }
2294 
2295       if (done_count == N_proc)
2296         break;
2297       if (here_count == 0)
2298         continue;
2299 
2300       // ZZZ Could add missing hits here, only if there are any actual matches.
2301 
2302       clearFailFlag();
2303 
2304       // PROP-FAIL-ENABLE Once always "copy input to output on fail" is removed from
2305       // propagateToR one might want to enable this for barrel or endcap or both.
2306       if (LI.is_barrel()) {
2307         propagateTracksToHitR(m_msPar, N_proc, m_prop_config->backward_fit_pflags, &no_mat_effs);
2308 
2309         kalmanOperation(KFO_Calculate_Chi2 | KFO_Update_Params | KFO_Local_Cov,
2310                         m_Err[iP],
2311                         m_Par[iP],
2312                         m_msErr,
2313                         m_msPar,
2314                         m_Err[iC],
2315                         m_Par[iC],
2316                         tmp_chi2,
2317                         N_proc);
2318       } else {
2319         propagateTracksToHitZ(m_msPar, N_proc, m_prop_config->backward_fit_pflags, &no_mat_effs);
2320 
2321         kalmanOperationEndcap(KFO_Calculate_Chi2 | KFO_Update_Params,
2322                               m_Err[iP],
2323                               m_Par[iP],
2324                               m_msErr,
2325                               m_msPar,
2326                               m_Err[iC],
2327                               m_Par[iC],
2328                               tmp_chi2,
2329                               N_proc);
2330       }
2331 
2332 #if defined(DEBUG_PROP_UPDATE)
2333       printf("\nbkfit at layer %d, track in slot %d -- fail=%d, had hit=%d (%g, %g, %g)\n",
2334              LI.layer_id(),
2335              DSLOT,
2336              m_FailFlag[DSLOT],
2337              1 - no_mat_effs[DSLOT],
2338              m_msPar(DSLOT, 0, 0),
2339              m_msPar(DSLOT, 1, 0),
2340              m_msPar(DSLOT, 2, 0));
2341       printf("Propagated:\n");
2342       print_par_err(iP, DSLOT);
2343       printf("Updated:\n");
2344       print_par_err(iC, DSLOT);
2345 #endif
2346 
2347       // Fixup for failed propagation or invpt sign and charge.
2348       for (int i = 0; i < NN; ++i) {
2349         // PROP-FAIL-ENABLE The following to be enabled when propagation failure
2350         // detection is properly implemented in propagate-to-R/Z.
2351         // 1. The following code was only expecting barrel state to be restored.
2352         //      auto barrel_pf(m_prop_config->backward_fit_pflags);
2353         //      barrel_pf.copy_input_state_on_fail = true;
2354         // 2. There is also check on chi2, commented out to keep physics changes minimal.
2355         /*
2356         if (m_FailFlag[i] && LI.is_barrel()) {
2357           // Barrel pflags are set to include PF_copy_input_state_on_fail.
2358           // Endcap errors are immaterial here (relevant for fwd search), with prop error codes
2359           // one could do other things.
2360           // Are there also fail conditions in KalmanUpdate?
2361 #ifdef DEBUG
2362           if (debug && g_debug) {
2363             dprintf("MkFinder::bkFitFitTracks prop fail: chi2=%f, layer=%d, label=%d. Recovering.\n",
2364                     tmp_chi2[i], LI.layer_id(), m_Label[i]);
2365             print_par_err(iC, i);
2366           }
2367 #endif
2368           m_Err[iC].copySlot(i, m_Err[iP]);
2369           m_Par[iC].copySlot(i, m_Par[iP]);
2370         } else if (tmp_chi2[i] > 200 || tmp_chi2[i] < 0) {
2371 #ifdef DEBUG
2372           if (debug && g_debug) {
2373             dprintf("MkFinder::bkFitFitTracks chi2 fail: chi2=%f, layer=%d, label=%d. Recovering.\n",
2374                     tmp_chi2[i], LI.layer_id(), m_Label[i]);
2375             print_par_err(iC, i);
2376           }
2377 #endif
2378           // Go back to propagated state (at the current hit, the previous one is lost).
2379           m_Err[iC].copySlot(i, m_Err[iP]);
2380           m_Par[iC].copySlot(i, m_Par[iP]);
2381         }
2382         */
2383         // Fixup invpt sign and charge.
2384         if (i < N_proc && m_Par[iC].At(i, 3, 0) < 0) {
2385           m_Chg.At(i, 0, 0) = -m_Chg.At(i, 0, 0);
2386           m_Par[iC].At(i, 3, 0) = -m_Par[iC].At(i, 3, 0);
2387         }
2388       }
2389 
2390 #if defined(DEBUG_BACKWARD_FIT)
2391       // clang-format off
2392       bool debug = true;
2393       const char beg_cur_sep = '/'; // set to ' ' root parsable printouts
2394       for (int i = 0; i < N_proc; ++i) {
2395         if (chiDebug && last_hit_ptr[i]) {
2396           TrackCand &bb = *m_TrkCand[i];
2397           int ti = iP;
2398           float chi = tmp_chi2.At(i, 0, 0);
2399           float chi_prnt = std::isfinite(chi) ? chi : -9;
2400 
2401 #if defined(MKFIT_STANDALONE)
2402           const MCHitInfo &mchi = m_event->simHitsInfo_[last_hit_ptr[i]->mcHitID()];
2403 
2404           dprintf("BKF_OVERLAP %d %d %d %d %d %d %d "
2405                   "%f%c%f %f %f%c%f %f %f %f %d %d %d %d "
2406                   "%f %f %f %f %f\n",
2407               m_event->evtID(),
2408 #else
2409           dprintf("BKF_OVERLAP %d %d %d %d %d %d "
2410                   "%f%c%f %f %f%c%f %f %f %f %d %d %d "
2411                   "%f %f %f %f %f\n",
2412 #endif
2413               bb.label(), (int)bb.prodType(), bb.isFindable(),
2414               layer, L.is_stereo(), L.is_barrel(),
2415               bb.pT(), beg_cur_sep, 1.0f / m_Par[ti].At(i, 3, 0),
2416               bb.posEta(),
2417               bb.posPhi(), beg_cur_sep, std::atan2(m_Par[ti].At(i, 1, 0), m_Par[ti].At(i, 0, 0)),
2418               std::hypot(m_Par[ti].At(i, 0, 0), m_Par[ti].At(i, 1, 0)),
2419               m_Par[ti].At(i, 2, 0),
2420               chi_prnt,
2421               std::isnan(chi), std::isfinite(chi), chi > 0,
2422 #if defined(MKFIT_STANDALONE)
2423               mchi.mcTrackID(),
2424 #endif
2425               // The following three can get negative / prouce nans in e2s.
2426               // std::abs the args for FPE hunt.
2427               e2s(std::abs(m_Err[ti].At(i, 0, 0))),
2428               e2s(std::abs(m_Err[ti].At(i, 1, 1))),
2429               e2s(std::abs(m_Err[ti].At(i, 2, 2))),  // sx_t sy_t sz_t -- track errors
2430               1e4f * std::hypot(m_msPar.At(i, 0, 0) - m_Par[ti].At(i, 0, 0),
2431                                 m_msPar.At(i, 1, 0) - m_Par[ti].At(i, 1, 0)),  // d_xy
2432               1e4f * (m_msPar.At(i, 2, 0) - m_Par[ti].At(i, 2, 0))             // d_z
2433           );
2434         }
2435       }
2436       // clang-format on
2437 #endif
2438 
2439       // update chi2
2440       m_Chi2.add(tmp_chi2);
2441     }
2442   }
2443 
2444   //------------------------------------------------------------------------------
2445 
2446   void MkFinder::bkFitPropTracksToPCA(const int N_proc) {
2447     propagateTracksToPCAZ(N_proc, m_prop_config->pca_prop_pflags);
2448   }
2449 
2450 }  // end namespace mkfit