From effaa5d075c5916bee2a5139ab46fc50767734b9 Mon Sep 17 00:00:00 2001
From: Xuanrui Zhu <634210954@qq.com>
Date: Wed, 3 Dec 2025 15:26:59 +0000
Subject: [PATCH 01/10] init commit

---
 modules/slam/include/opencv2/slam.hpp | 1 +
 1 file changed, 1 insertion(+)
 create mode 100644 modules/slam/include/opencv2/slam.hpp

diff --git a/modules/slam/include/opencv2/slam.hpp b/modules/slam/include/opencv2/slam.hpp
new file mode 100644
index 0000000000..6f70f09bee
--- /dev/null
+++ b/modules/slam/include/opencv2/slam.hpp
@@ -0,0 +1 @@
+#pragma once

From c4cb4d9c230ec644104a09c035cf40d3533f8630 Mon Sep 17 00:00:00 2001
From: Xuanrui Zhu <634210954@qq.com>
Date: Wed, 3 Dec 2025 20:10:04 +0000
Subject: [PATCH 02/10] SLAM VO: a framework

---
 modules/slam/include/opencv2/slam.hpp         |  28 +-
 .../slam/include/opencv2/slam/data_loader.hpp |  44 ++
 modules/slam/include/opencv2/slam/feature.hpp |  38 ++
 .../slam/include/opencv2/slam/initializer.hpp |  87 ++++
 .../slam/include/opencv2/slam/keyframe.hpp    |  21 +
 .../slam/include/opencv2/slam/localizer.hpp   |  32 ++
 modules/slam/include/opencv2/slam/map.hpp     |  91 ++++
 modules/slam/include/opencv2/slam/matcher.hpp |  34 ++
 .../slam/include/opencv2/slam/optimizer.hpp   |  69 +++
 modules/slam/include/opencv2/slam/pose.hpp    |  19 +
 .../slam/include/opencv2/slam/visualizer.hpp  |  47 ++
 modules/slam/include/opencv2/slam/vo.hpp      | 114 +++++
 modules/slam/src/data_loader.cpp              | 103 +++++
 modules/slam/src/feature.cpp                  | 167 +++++++
 modules/slam/src/initializer.cpp              | 406 ++++++++++++++++++
 modules/slam/src/keyframe.cpp                 |   0
 modules/slam/src/localizer.cpp                | 157 +++++++
 modules/slam/src/map.cpp                      | 319 ++++++++++++++
 modules/slam/src/matcher.cpp                  | 132 ++++++
 modules/slam/src/optimizer.cpp                | 255 +++++++++++
 modules/slam/src/pose.cpp                     |  43 ++
 modules/slam/src/visualizer.cpp               | 131 ++++++
 modules/slam/src/vo.cpp                       | 389 +++++++++++++++++
 23 files changed, 2725 insertions(+), 1 deletion(-)
 create mode 100644 modules/slam/include/opencv2/slam/data_loader.hpp
 create mode 100644 modules/slam/include/opencv2/slam/feature.hpp
 create mode 100644 modules/slam/include/opencv2/slam/initializer.hpp
 create mode 100644 modules/slam/include/opencv2/slam/keyframe.hpp
 create mode 100644 modules/slam/include/opencv2/slam/localizer.hpp
 create mode 100644 modules/slam/include/opencv2/slam/map.hpp
 create mode 100644 modules/slam/include/opencv2/slam/matcher.hpp
 create mode 100644 modules/slam/include/opencv2/slam/optimizer.hpp
 create mode 100644 modules/slam/include/opencv2/slam/pose.hpp
 create mode 100644 modules/slam/include/opencv2/slam/visualizer.hpp
 create mode 100644 modules/slam/include/opencv2/slam/vo.hpp
 create mode 100644 modules/slam/src/data_loader.cpp
 create mode 100644 modules/slam/src/feature.cpp
 create mode 100644 modules/slam/src/initializer.cpp
 create mode 100644 modules/slam/src/keyframe.cpp
 create mode 100644 modules/slam/src/localizer.cpp
 create mode 100644 modules/slam/src/map.cpp
 create mode 100644 modules/slam/src/matcher.cpp
 create mode 100644 modules/slam/src/optimizer.cpp
 create mode 100644 modules/slam/src/pose.cpp
 create mode 100644 modules/slam/src/visualizer.cpp
 create mode 100644 modules/slam/src/vo.cpp

diff --git a/modules/slam/include/opencv2/slam.hpp b/modules/slam/include/opencv2/slam.hpp
index 6f70f09bee..334925ec9b 100644
--- a/modules/slam/include/opencv2/slam.hpp
+++ b/modules/slam/include/opencv2/slam.hpp
@@ -1 +1,27 @@
-#pragma once
+// This file is part of OpenCV project.
+// It is subject to the license terms in the LICENSE file found in the top-level directory
+// of this distribution and at http://opencv.org/license.html
+
+#ifndef __OPENCV_SLAM_HPP__
+#define __OPENCV_SLAM_HPP__
+
+#include "opencv2/slam/data_loader.hpp"
+#include "opencv2/slam/feature.hpp"
+#include "opencv2/slam/initializer.hpp"
+#include "opencv2/slam/keyframe.hpp"
+#include "opencv2/slam/localizer.hpp"
+#include "opencv2/slam/map.hpp"
+#include "opencv2/slam/matcher.hpp"
+#include "opencv2/slam/optimizer.hpp"
+#include "opencv2/slam/pose.hpp"
+#include "opencv2/slam/visualizer.hpp"
+#include "opencv2/slam/vo.hpp"
+
+
+/** @defgroup slam Simultaneous Localization and Mapping
+  @brief Simultaneous Localization and Mapping (SLAM) module
+*/
+
+#endif
+
+/* End of file. */
\ No newline at end of file
diff --git a/modules/slam/include/opencv2/slam/data_loader.hpp b/modules/slam/include/opencv2/slam/data_loader.hpp
new file mode 100644
index 0000000000..acc7795a1f
--- /dev/null
+++ b/modules/slam/include/opencv2/slam/data_loader.hpp
@@ -0,0 +1,44 @@
+#pragma once
+#include <opencv2/core.hpp>
+#include <string>
+#include <vector>
+
+namespace cv{
+namespace vo{
+
+class DataLoader {
+public:
+    // 构造：传入图像目录（可以是相对或绝对路径）
+    DataLoader(const std::string &imageDir);
+
+    // 获取下一张图像，成功返回 true 并填充 image 与 imagePath；到末尾返回 false
+    bool getNextImage(Mat &image, std::string &imagePath);
+
+    // 重置到序列开始
+    void reset();
+
+    // 是否还有图像
+    bool hasNext() const;
+
+    // 图像总数
+    size_t size() const;
+
+    // 尝试加载并返回相机内参（fx, fy, cx, cy），返回是否成功
+    bool loadIntrinsics(const std::string &yamlPath);
+
+    // 内参访问
+    double fx() const { return fx_; }
+    double fy() const { return fy_; }
+    double cx() const { return cx_; }
+    double cy() const { return cy_; }
+
+private:
+    std::vector<std::string> imageFiles;
+    size_t currentIndex;
+
+    // 相机内参（若未加载则为回退值）
+    double fx_, fy_, cx_, cy_;
+};
+    
+} // namespace vo
+} // namespace cv
diff --git a/modules/slam/include/opencv2/slam/feature.hpp b/modules/slam/include/opencv2/slam/feature.hpp
new file mode 100644
index 0000000000..0ec86302a0
--- /dev/null
+++ b/modules/slam/include/opencv2/slam/feature.hpp
@@ -0,0 +1,38 @@
+#pragma once
+#include <opencv2/core.hpp>
+#include <opencv2/features2d.hpp>
+#include <vector>
+
+namespace cv {
+namespace vo {
+
+class FeatureExtractor {
+public:
+    explicit FeatureExtractor(int nfeatures = 2000);
+    // detectAndCompute: detect keypoints and compute descriptors.
+    // If previous-frame data (prevGray, prevKp) is provided, a flow-aware grid allocation
+    // will be used (score = response * (1 + flow_lambda * normalized_flow)). Otherwise a
+    // simpler ANMS selection is used. The prev arguments have defaults so this function
+    // replaces the two previous overloads.
+    void detectAndCompute(const Mat &image, std::vector<KeyPoint> &kps, Mat &desc,
+                          const Mat &prevGray = Mat(), const std::vector<KeyPoint> &prevKp = std::vector<KeyPoint>(),
+                          double flow_lambda = 5.0);
+private:
+    Ptr<ORB> orb_;
+    int nfeatures_;
+};
+
+// Function to detect and compute features in an image
+inline void detectAndComputeFeatures(const Mat &image,
+                                     std::vector<KeyPoint> &keypoints,
+                                     Mat &descriptors) {
+    // Create ORB detector and descriptor
+    auto orb = ORB::create();
+    // Detect keypoints
+    orb->detect(image, keypoints);
+    // Compute descriptors
+    orb->compute(image, keypoints, descriptors);
+}
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/include/opencv2/slam/initializer.hpp b/modules/slam/include/opencv2/slam/initializer.hpp
new file mode 100644
index 0000000000..b0e8676a0f
--- /dev/null
+++ b/modules/slam/include/opencv2/slam/initializer.hpp
@@ -0,0 +1,87 @@
+#pragma once
+#include <opencv2/core.hpp>
+#include <opencv2/features2d.hpp>
+#include <vector>
+#include "opencv2/slam/keyframe.hpp"
+#include "opencv2/slam/map.hpp"
+
+namespace cv {
+namespace vo {
+
+class Initializer {
+public:
+    Initializer();
+    
+    // Attempt initialization with two frames
+    // Returns true if initialization successful
+    bool initialize(const std::vector<KeyPoint> &kps1,
+                   const std::vector<KeyPoint> &kps2,
+                   const std::vector<DMatch> &matches,
+                   double fx, double fy, double cx, double cy,
+                   Mat &R, Mat &t,
+                   std::vector<Point3d> &points3D,
+                   std::vector<bool> &isTriangulated);
+    
+    // Check if frames have sufficient parallax for initialization
+    static bool checkParallax(const std::vector<KeyPoint> &kps1,
+                             const std::vector<KeyPoint> &kps2,
+                             const std::vector<DMatch> &matches,
+                             double minMedianParallax = 15.0);
+    
+private:
+    // Reconstruct from Homography
+    bool reconstructH(const std::vector<Point2f> &pts1,
+                     const std::vector<Point2f> &pts2,
+                     const Mat &H,
+                     double fx, double fy, double cx, double cy,
+                     Mat &R, Mat &t,
+                     std::vector<Point3d> &points3D,
+                     std::vector<bool> &isTriangulated,
+                     float &parallax);
+    
+    // Reconstruct from Fundamental/Essential
+    bool reconstructF(const std::vector<Point2f> &pts1,
+                     const std::vector<Point2f> &pts2,
+                     const Mat &F,
+                     double fx, double fy, double cx, double cy,
+                     Mat &R, Mat &t,
+                     std::vector<Point3d> &points3D,
+                     std::vector<bool> &isTriangulated,
+                     float &parallax);
+    
+    // Check reconstructed points quality
+    int checkRT(const Mat &R, const Mat &t,
+               const std::vector<Point2f> &pts1,
+               const std::vector<Point2f> &pts2,
+               const std::vector<Point3d> &points3D,
+               std::vector<bool> &isGood,
+               double fx, double fy, double cx, double cy,
+               float &parallax);
+    
+    // Triangulate points
+    void triangulate(const Mat &P1, const Mat &P2,
+                    const std::vector<Point2f> &pts1,
+                    const std::vector<Point2f> &pts2,
+                    std::vector<Point3d> &points3D);
+    
+    // Decompose Homography
+    void decomposeH(const Mat &H, std::vector<Mat> &Rs,
+                   std::vector<Mat> &ts, std::vector<Mat> &normals);
+    
+    // Compute homography score
+    float computeScore(const Mat &H21, const Mat &H12,
+                      const std::vector<Point2f> &pts1,
+                      const std::vector<Point2f> &pts2,
+                      std::vector<bool> &inliersH,
+                      float sigma = 1.0);
+    
+    // Compute fundamental score
+    float computeScoreF(const Mat &F21,
+                       const std::vector<Point2f> &pts1,
+                       const std::vector<Point2f> &pts2,
+                       std::vector<bool> &inliersF,
+                       float sigma = 1.0);
+};
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/include/opencv2/slam/keyframe.hpp b/modules/slam/include/opencv2/slam/keyframe.hpp
new file mode 100644
index 0000000000..ce5d3a6b06
--- /dev/null
+++ b/modules/slam/include/opencv2/slam/keyframe.hpp
@@ -0,0 +1,21 @@
+#pragma once
+#include <opencv2/core.hpp>
+#include <opencv2/features2d.hpp>
+#include <vector>
+
+namespace cv {
+namespace vo {
+
+struct KeyFrame {
+    int id = -1;
+    Mat image; // optional
+    std::vector<KeyPoint> kps;
+    Mat desc;
+    // pose: rotation and translation to map coordinates
+    // X_world = R * X_cam + t
+    Mat R_w = Mat::eye(3,3,CV_64F);
+    Mat t_w = Mat::zeros(3,1,CV_64F);
+};
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/include/opencv2/slam/localizer.hpp b/modules/slam/include/opencv2/slam/localizer.hpp
new file mode 100644
index 0000000000..c441737b93
--- /dev/null
+++ b/modules/slam/include/opencv2/slam/localizer.hpp
@@ -0,0 +1,32 @@
+#pragma once
+#include <opencv2/core.hpp>
+#include <vector>
+#include "opencv2/slam/data_loader.hpp"
+#include "opencv2/slam/map.hpp"
+
+namespace cv {
+namespace vo {
+
+class Localizer {
+public:
+    Localizer(float ratio = 0.7f);
+
+    // Try to solve PnP against map points. Returns true if solved and fills R_out/t_out and inliers.
+    // Provide camera intrinsics and image dimensions explicitly (DataLoader doesn't expose width/height).
+    // Enhanced tryPnP with optional diagnostics output (frame id, image and output directory)
+    // out_preMatches and out_postMatches can be nullptr. If outDir provided, diagnostics images/logs will be saved there.
+
+    bool tryPnP(const MapManager &map, const Mat &desc, const std::vector<KeyPoint> &kps,
+                double fx, double fy, double cx, double cy, int imgW, int imgH,
+                int min_inliers,
+                Mat &R_out, Mat &t_out, int &inliers_out,
+                int frame_id = -1, const Mat *image = nullptr, const std::string &outDir = "",
+                int *out_preMatches = nullptr, int *out_postMatches = nullptr, double *out_meanReproj = nullptr) const;
+
+    float ratio() const { return ratio_; }
+private:
+    float ratio_ = 0.7f;
+};
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/include/opencv2/slam/map.hpp b/modules/slam/include/opencv2/slam/map.hpp
new file mode 100644
index 0000000000..38d8d7097b
--- /dev/null
+++ b/modules/slam/include/opencv2/slam/map.hpp
@@ -0,0 +1,91 @@
+#pragma once
+#include <opencv2/core.hpp>
+#include <vector>
+#include <unordered_map>
+#include "opencv2/slam/keyframe.hpp"
+
+namespace cv {
+namespace vo {
+
+struct MapPoint {
+    int id = -1; // unique id for id-based lookups
+    Point3d p; // 3D position in world frame
+    std::vector<std::pair<int,int>> observations; // pairs of (keyframe id, keypoint idx)
+    
+    // Quality management fields
+    Mat descriptor;           // Representative descriptor for matching
+    int nObs = 0;                 // Number of observations
+    bool isBad = false;           // Flag for bad points to be culled
+    double minDistance = 0.0;     // Min viewing distance
+    double maxDistance = 0.0;     // Max viewing distance
+    
+    // Statistics
+    int nFound = 0;               // Number of times found in tracking
+    int nVisible = 0;             // Number of times visible
+    
+    // Constructor
+    MapPoint() = default;
+    MapPoint(const Point3d& pos) : p(pos) {}
+    
+    // Helper: compute found ratio
+    float getFoundRatio() const {
+        return nVisible > 0 ? static_cast<float>(nFound) / nVisible : 0.0f;
+    }
+};
+
+class MapManager {
+public:
+    MapManager();
+
+    void addKeyFrame(const KeyFrame &kf);
+    void addMapPoints(const std::vector<MapPoint> &pts);
+
+    const std::vector<KeyFrame>& keyframes() const { return keyframes_; }
+    const std::vector<MapPoint>& mappoints() const { return mappoints_; }
+
+    // Find candidate mappoint indices visible from pose (lastR, lastT) and inside image
+    std::vector<int> findVisibleCandidates(const Mat &lastR, const Mat &lastT,
+                                           double fx, double fy, double cx, double cy,
+                                           int imgW, int imgH) const;
+
+    // Triangulate given normalized coordinates between last keyframe and current
+    // Returns newly created map points (appended to internal list).
+    std::vector<MapPoint> triangulateBetweenLastTwo(const std::vector<Point2f> &pts1n,
+                                                    const std::vector<Point2f> &pts2n,
+                                                    const std::vector<int> &pts1_kp_idx,
+                                                    const std::vector<int> &pts2_kp_idx,
+                                                    const KeyFrame &lastKf, const KeyFrame &curKf,
+                                                    double fx, double fy, double cx, double cy);
+
+    // Lookup keyframe index by id (-1 if not found)
+    int keyframeIndex(int id) const;
+    // Lookup mappoint index by id (-1 if not found)
+    int mapPointIndex(int id) const;
+    // Mutable access if caller legitimately needs to modify keyframes/mappoints.
+    // Prefer using the applyOptimized... APIs for controlled updates.
+    std::vector<KeyFrame>& keyframesMutable() { return keyframes_; }
+    std::vector<MapPoint>& mappointsMutable() { return mappoints_; }
+
+    // Apply optimized pose/point by id (safe writeback APIs for backend)
+    void applyOptimizedKeyframePose(int keyframeId, const Mat &R, const Mat &t);
+    void applyOptimizedMapPoint(int mappointId, const Point3d &p);
+
+    // Quality management
+    void cullBadMapPoints();
+    double computeReprojError(const MapPoint &mp, const KeyFrame &kf, 
+                             double fx, double fy, double cx, double cy) const;
+    void updateMapPointDescriptor(MapPoint &mp);
+    
+    // Statistics
+    int countGoodMapPoints() const;
+
+private:
+    std::vector<KeyFrame> keyframes_;
+    std::vector<MapPoint> mappoints_;
+    std::unordered_map<int,int> id2idx_;
+    std::unordered_map<int,int> mpid2idx_;
+    int next_mappoint_id_ = 1;
+};
+
+} // namespace vo
+} // namespace cv
diff --git a/modules/slam/include/opencv2/slam/matcher.hpp b/modules/slam/include/opencv2/slam/matcher.hpp
new file mode 100644
index 0000000000..215b8ea0b1
--- /dev/null
+++ b/modules/slam/include/opencv2/slam/matcher.hpp
@@ -0,0 +1,34 @@
+#pragma once
+#include <opencv2/core.hpp>
+#include <opencv2/features2d.hpp>
+#include <vector>
+
+namespace cv {
+namespace vo {
+
+class Matcher {
+public:
+    explicit Matcher(float ratio = 0.75f);
+    // Match descriptors from prev -> curr, return good matches (queryIdx refers to prev, trainIdx to curr)
+    // Basic knn ratio test (backwards-compatible)
+    void knnMatch(const Mat &desc1, const Mat &desc2, std::vector<DMatch> &goodMatches);
+
+    // Stronger match: knn + ratio test + optional mutual cross-check + optional spatial bucketing.
+    // desc1/desc2 are descriptors for prev/curr frames.
+    // kps1/kps2 are the corresponding keypoints (needed for spatial bucketing).
+    // imgCols/imgRows are used to size the bucketing grid. Defaults provide conservative values.
+    // maxTotal: if >0, final matches will be truncated to this count (keep smallest distances).
+    // enableMutual: enable/disable mutual cross-check. enableBucketing: enable/disable grid bucketing.
+    void match(const Mat &desc1, const Mat &desc2,
+               const std::vector<KeyPoint> &kps1, const std::vector<KeyPoint> &kps2,
+               std::vector<DMatch> &goodMatches,
+               int imgCols = 640, int imgRows = 480,
+               int bucketRows = 8, int bucketCols = 8, int topKPerBucket = 4,
+               int maxTotal = 0, bool enableMutual = true, bool enableBucketing = true);
+private:
+    float ratio_;
+    BFMatcher bf_;
+};
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/include/opencv2/slam/optimizer.hpp b/modules/slam/include/opencv2/slam/optimizer.hpp
new file mode 100644
index 0000000000..a46263d7b1
--- /dev/null
+++ b/modules/slam/include/opencv2/slam/optimizer.hpp
@@ -0,0 +1,69 @@
+#pragma once
+#include <opencv2/core.hpp>
+#include <vector>
+#include "opencv2/slam/keyframe.hpp"
+#include "opencv2/slam/map.hpp"
+
+namespace cv {
+namespace vo {
+
+// Bundle Adjustment Optimizer using OpenCV-based Levenberg-Marquardt
+// Note: For production, should use g2o or Ceres for better performance
+class Optimizer {
+public:
+    Optimizer();
+    
+    // Local Bundle Adjustment
+    // Optimizes a window of recent keyframes and all observed map points
+    // fixedKFs: indices of keyframes to keep fixed during optimization
+#ifdef USE_G2O
+    static void localBundleAdjustmentG2O(
+        std::vector<KeyFrame> &keyframes,
+        std::vector<MapPoint> &mappoints,
+        const std::vector<int> &localKfIndices,
+        const std::vector<int> &fixedKfIndices,
+        double fx, double fy, double cx, double cy,
+        int iterations = 10);
+#endif
+    static void localBundleAdjustmentSFM(
+        std::vector<KeyFrame> &keyframes,
+        std::vector<MapPoint> &mappoints,
+        const std::vector<int> &localKfIndices,
+        const std::vector<int> &fixedKfIndices,
+        double fx, double fy, double cx, double cy,
+        int iterations = 10);
+    // Pose-only optimization (optimize camera pose given fixed 3D points)
+    static bool optimizePose(
+        KeyFrame &kf,
+        const std::vector<MapPoint> &mappoints,
+        const std::vector<int> &matchedMpIndices,
+        double fx, double fy, double cx, double cy,
+        std::vector<bool> &inliers,
+        int iterations = 10);
+    
+    // Global Bundle Adjustment (expensive, use after loop closure)
+    static void globalBundleAdjustmentSFM(
+        std::vector<KeyFrame> &keyframes,
+        std::vector<MapPoint> &mappoints,
+        double fx, double fy, double cx, double cy,
+        int iterations = 20);
+    
+private:
+    // Compute reprojection error and Jacobian
+    static double computeReprojectionError(
+        const Point3d &point3D,
+        const Mat &R, const Mat &t,
+        const Point2f &observed,
+        double fx, double fy, double cx, double cy,
+        Mat &jacobianPose,
+        Mat &jacobianPoint);
+    
+    // Project 3D point to image
+    static Point2f project(
+        const Point3d &point3D,
+        const Mat &R, const Mat &t,
+        double fx, double fy, double cx, double cy);
+};
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/include/opencv2/slam/pose.hpp b/modules/slam/include/opencv2/slam/pose.hpp
new file mode 100644
index 0000000000..acf3615950
--- /dev/null
+++ b/modules/slam/include/opencv2/slam/pose.hpp
@@ -0,0 +1,19 @@
+#pragma once
+#include <opencv2/core.hpp>
+#include <vector>
+
+namespace cv {
+namespace vo {
+
+class PoseEstimator {
+public:
+    PoseEstimator() = default;
+    // Estimate relative pose from matched normalized image points. Returns true if pose recovered.
+    bool estimate(const std::vector<Point2f> &pts1,
+                  const std::vector<Point2f> &pts2,
+                  double fx, double fy, double cx, double cy,
+                  Mat &R, Mat &t, Mat &mask, int &inliers);
+};
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/include/opencv2/slam/visualizer.hpp b/modules/slam/include/opencv2/slam/visualizer.hpp
new file mode 100644
index 0000000000..22ffe94fd3
--- /dev/null
+++ b/modules/slam/include/opencv2/slam/visualizer.hpp
@@ -0,0 +1,47 @@
+#pragma once
+#include <opencv2/core.hpp>
+#include <string>
+#include "opencv2/slam/pose.hpp"
+#include "opencv2/slam/feature.hpp"
+#include "opencv2/slam/matcher.hpp"
+
+namespace cv {
+namespace vo {
+
+class Tracker {
+public:
+    Tracker();
+    // Process a gray image, returns true if a pose was estimated. imgOut contains visualization (matches or keypoints)
+    bool processFrame(const Mat &gray, const std::string &imagePath, Mat &imgOut, Mat &R_out, Mat &t_out, std::string &info);
+private:
+    FeatureExtractor feat_;
+    Matcher matcher_;
+    PoseEstimator poseEst_;
+
+    Mat prevGray_, prevDesc_;
+    std::vector<KeyPoint> prevKp_;
+    int frame_id_;
+};
+
+class Visualizer {
+public:
+    Visualizer(int W=1000, int H=800, double meters_per_pixel=0.02);
+    // 更新轨迹（传入 x,z 坐标）
+    void addPose(double x, double z);
+    // 返回帧绘制（matches 或 keypoints）到窗口
+    void showFrame(const Mat &frame);
+    // 返回并显示俯视图
+    void showTopdown();
+    // 保存最终轨迹图像到文件
+    bool saveTrajectory(const std::string &path);
+private:
+    int W_, H_;
+    double meters_per_pixel_;
+    Size mapSize_;
+    Mat map_;
+    std::vector<Point2d> traj_; // 存储 (x,z)
+    Point worldToPixel(const Point2d &p) const;
+};
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/include/opencv2/slam/vo.hpp b/modules/slam/include/opencv2/slam/vo.hpp
new file mode 100644
index 0000000000..9f08e203e3
--- /dev/null
+++ b/modules/slam/include/opencv2/slam/vo.hpp
@@ -0,0 +1,114 @@
+#pragma once
+
+#include <opencv2/core.hpp>
+#include <opencv2/features2d.hpp>
+#include <opencv2/calib3d.hpp>
+#include <vector>
+
+namespace cv {
+namespace vo {
+
+struct CameraIntrinsics {
+    Mat K;      // 3x3 camera matrix
+    Mat dist;   // distortion coefficients (optional)
+};
+
+struct VOParams {
+    int minInitInliers = 80;
+    double ransacProb = 0.999;
+    double ransacThresh = 1.5; // pixels
+    double minParallaxDeg = 1.0;
+    double reprojErrThresh = 3.0;
+    int pnpMinInliers = 30;
+    double pnpReprojErr = 3.0;
+    int keyframeInterval = 10; // frames
+    double keyframeMinBaseline = 0.05; // relative scale
+    double keyframeMinRotationDeg = 5.0;
+    int localWindowSize = 7; // for BA
+    // Backend parameters
+    bool enableBackend = false;
+    int baMaxIters = 50;
+    // Backend type: 0=g2o (default), 1=opencv_sfm
+    int backendType = 0;
+};
+
+class VisualOdometry {
+public:
+    VisualOdometry(const Ptr<Feature2D>& feature,
+                   const Ptr<DescriptorMatcher>& matcher,
+                   const CameraIntrinsics& intrinsics,
+                   const VOParams& params = VOParams());
+
+    // Process a single frame. Returns true if tracking succeeded.
+    bool processFrame(const Mat& img, double timestamp);
+
+    // Current camera pose (R|t) as 4x4 SE3 matrix.
+    Mat getCurrentPose() const;
+
+    // Full trajectory as vector of 4x4 matrices.
+    std::vector<Mat> getTrajectory() const;
+
+    // Backend controls
+    void setEnableBackend(bool on);
+    void setWindowSize(int N);
+    void setBAParams(double reprojThresh, int maxIters);
+    void setBackendType(int type);
+
+    // Loop closure & localization stubs (Milestone 4)
+    enum Mode { MODE_SLAM, MODE_LOCALIZATION };
+    void setMode(Mode m);
+    bool saveMap(const std::string& path) const;
+    bool loadMap(const std::string& path);
+    void enableLoopClosure(bool on);
+    void setPlaceRecognizer(const Ptr<Feature2D>& vocabFeature);
+
+private:
+    // internal helpers
+    bool initializeTwoView(const Mat& img0, const Mat& img1);
+    bool trackWithPnP(const Mat& img);
+    bool shouldInsertKeyframe() const;
+    void triangulateWithLastKeyframe();
+    void runLocalBAIfEnabled();
+
+    // state
+    Ptr<Feature2D> feature_;
+    Ptr<DescriptorMatcher> matcher_;
+    CameraIntrinsics K_;
+    VOParams params_;
+
+    bool initialized_ = false;
+    bool backendEnabled_ = false;
+    int frameCount_ = 0;
+    Mode mode_ = MODE_SLAM;
+    bool loopClosureEnabled_ = false;
+
+    // cached
+    Mat lastImg_;
+    Mat currentPoseSE3_; // 4x4
+    std::vector<Mat> trajectory_;
+
+    // minimal containers (placeholder, to be integrated with MapManager/KeyFrame)
+    std::vector<Point3d> mapPoints_; // simple storage for demo
+
+    // keyframe state (latest KF only)
+    std::vector<KeyPoint> kf_keypoints_;
+    Mat kf_descriptors_;
+    std::vector<int> kf_kp_to_map_; // size == kf_keypoints_.size(), -1 if not mapped
+    Mat kfPoseSE3_; // KF pose 4x4
+
+    // current frame cached features
+    std::vector<KeyPoint> cur_keypoints_;
+    Mat cur_descriptors_;
+    int lastPnPInliers_ = 0;
+    std::vector<std::pair<int,int>> curFeat_to_map_inliers_; // (cur_kp_idx, map_idx)
+    double unmatchedRatio_ = 0.0; // fraction of matched keyframe features without map points (for KF decision)
+
+    // simple history for sliding window
+    std::vector<Mat> keyframePoses_; // poses of historical KFs
+    std::vector<std::vector<KeyPoint>> keyframeKeypoints_;
+    std::vector<Mat> keyframeDescriptors_;
+    std::vector<std::vector<int>> keyframeKpToMap_; // per-KF mapping from kp idx to map point idx
+};
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/src/data_loader.cpp b/modules/slam/src/data_loader.cpp
new file mode 100644
index 0000000000..1488e9a02a
--- /dev/null
+++ b/modules/slam/src/data_loader.cpp
@@ -0,0 +1,103 @@
+#include "opencv2/slam/data_loader.hpp"
+#include <opencv2/imgcodecs.hpp>
+#include <filesystem>
+#include <iostream>
+#include <fstream>
+#include <sstream>
+
+namespace cv {
+namespace vo {
+
+DataLoader::DataLoader(const std::string &imageDir)
+    : currentIndex(0), fx_(700.0), fy_(700.0), cx_(0.5), cy_(0.5)
+{
+    // 使用 std::filesystem 先检查目录是否存在
+    try {
+        std::filesystem::path p(imageDir);
+        if(!std::filesystem::exists(p) || !std::filesystem::is_directory(p)){
+            std::cerr << "DataLoader: imageDir does not exist or is not a directory: " << imageDir << std::endl;
+            return;
+        }
+    } catch(const std::exception &e){
+        std::cerr << "DataLoader: filesystem error checking imageDir: " << e.what() << std::endl;
+        // fallthrough to try glob
+    }
+
+    // 使用 glob 列出文件，捕获可能的 OpenCV 异常
+    try {
+        glob(imageDir + "/*", imageFiles, false);
+    } catch(const Exception &e){
+        std::cerr << "DataLoader: glob failed for '" << imageDir << "': " << e.what() << std::endl;
+        imageFiles.clear();
+        return;
+    }
+
+    if(imageFiles.empty()){
+        std::cerr << "DataLoader: no image files found in " << imageDir << std::endl;
+        return;
+    }
+
+    // 尝试在 imageDir 或其上一级目录寻找 sensor.yaml
+    std::filesystem::path p(imageDir);
+    std::string yaml1 = (p / "sensor.yaml").string();
+    std::string yaml2 = (p.parent_path() / "sensor.yaml").string();
+    if(!loadIntrinsics(yaml1)){
+        loadIntrinsics(yaml2); // best-effort
+    }
+}
+
+bool DataLoader::loadIntrinsics(const std::string &yamlPath){
+    std::ifstream ifs(yamlPath);
+    if(!ifs.is_open()) return false;
+    std::string line;
+    while(std::getline(ifs, line)){
+        auto pos = line.find("intrinsics:");
+        if(pos != std::string::npos){
+            size_t lb = line.find('[', pos);
+            size_t rb = line.find(']', pos);
+            std::string nums;
+            if(lb != std::string::npos && rb != std::string::npos && rb > lb){
+                nums = line.substr(lb+1, rb-lb-1);
+            } else {
+                std::string rest;
+                while(std::getline(ifs, rest)){
+                    nums += rest + " ";
+                    if(rest.find(']') != std::string::npos) break;
+                }
+            }
+            for(char &c: nums) if(c == ',' || c == '[' || c == ']') c = ' ';
+            std::stringstream ss(nums);
+            std::vector<double> vals;
+            double v;
+            while(ss >> v) vals.push_back(v);
+            if(vals.size() >= 4){
+                fx_ = vals[0]; fy_ = vals[1]; cx_ = vals[2]; cy_ = vals[3];
+                std::cerr << "DataLoader: loaded intrinsics from " << yamlPath << std::endl;
+                return true;
+            }
+        }
+    }
+    return false;
+}
+
+bool DataLoader::hasNext() const { return currentIndex < imageFiles.size(); }
+
+size_t DataLoader::size() const { return imageFiles.size(); }
+
+void DataLoader::reset(){ currentIndex = 0; }
+
+bool DataLoader::getNextImage(Mat &image, std::string &imagePath){
+    if(currentIndex >= imageFiles.size()) return false;
+    imagePath = imageFiles[currentIndex];
+    image = imread(imagePath, IMREAD_UNCHANGED);
+    if(image.empty()){
+        std::cerr << "DataLoader: couldn't read " << imagePath << ", skipping" << std::endl;
+        currentIndex++;
+        return getNextImage(image, imagePath); // try next
+    }
+    currentIndex++;
+    return true;
+}
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/src/feature.cpp b/modules/slam/src/feature.cpp
new file mode 100644
index 0000000000..e2eb7dde50
--- /dev/null
+++ b/modules/slam/src/feature.cpp
@@ -0,0 +1,167 @@
+#include "opencv2/slam/feature.hpp"
+#include <limits>
+#include <cmath>
+#include <opencv2/video/tracking.hpp>
+#include <map>
+
+namespace cv {
+namespace vo {
+
+FeatureExtractor::FeatureExtractor(int nfeatures)
+    : nfeatures_(nfeatures)
+{
+    orb_ = ORB::create(nfeatures_);
+}
+
+// Adaptive Non-Maximal Suppression (ANMS)
+static void anms(const std::vector<KeyPoint> &in, std::vector<KeyPoint> &out, int maxFeatures)
+{
+    out.clear();
+    if(in.empty()) return;
+    int N = (int)in.size();
+    if(maxFeatures <= 0 || N <= maxFeatures){ out = in; return; }
+
+    // For each keypoint, find distance to the nearest keypoint with strictly higher response
+    std::vector<float> radius(N, std::numeric_limits<float>::infinity());
+    for(int i=0;i<N;++i){
+        for(int j=0;j<N;++j){
+            if(in[j].response > in[i].response){
+                float dx = in[i].pt.x - in[j].pt.x;
+                float dy = in[i].pt.y - in[j].pt.y;
+                float d2 = dx*dx + dy*dy;
+                if(d2 < radius[i]) radius[i] = d2;
+            }
+        }
+        // if no stronger keypoint exists, radius[i] stays INF
+    }
+
+    // Now pick top maxFeatures by radius (larger radius preferred). If radius==INF, treat as large.
+    std::vector<int> idx(N);
+    for(int i=0;i<N;++i) idx[i] = i;
+    std::sort(idx.begin(), idx.end(), [&](int a, int b){
+        float ra = radius[a]; float rb = radius[b];
+        if(std::isinf(ra) && std::isinf(rb)) return in[a].response > in[b].response; // tie-break by response
+        if(std::isinf(ra)) return true;
+        if(std::isinf(rb)) return false;
+        if(ra == rb) return in[a].response > in[b].response;
+        return ra > rb;
+    });
+
+    int take = std::min(maxFeatures, N);
+    out.reserve(take);
+    for(int i=0;i<take;++i) out.push_back(in[idx[i]]);
+}
+
+// Unified detectAndCompute: uses flow-aware allocation when prevGray/prevKp provided,
+// otherwise falls back to ANMS selection.
+void FeatureExtractor::detectAndCompute(const Mat &image, std::vector<KeyPoint> &kps, Mat &desc,
+                                       const Mat &prevGray, const std::vector<KeyPoint> &prevKp,
+                                       double flow_lambda)
+{
+    kps.clear(); desc.release();
+    if(image.empty()) return;
+
+    // detect candidates with ORB
+    std::vector<KeyPoint> candidates;
+    orb_->detect(image, candidates);
+    if(candidates.empty()) return;
+
+    // If no previous-frame info is provided, use simple ANMS + descriptor computation
+    if(prevGray.empty() || prevKp.empty()){
+        std::vector<KeyPoint> selected;
+        anms(candidates, selected, nfeatures_);
+        if(selected.empty()) return;
+        orb_->compute(image, selected, desc);
+        kps = std::move(selected);
+        return;
+    }
+
+    // Flow-aware scoring path -------------------------------------------------
+    // 1) track previous keypoints into current frame to estimate flows
+    std::vector<Point2f> trackedPts;
+    std::vector<unsigned char> status;
+    std::vector<float> err;
+    std::vector<double> trackedFlows; // aligned with prevKp
+    std::vector<Point2f> prevPts; prevPts.reserve(prevKp.size());
+    for(const auto &kp: prevKp) prevPts.push_back(kp.pt);
+    trackedPts.resize(prevPts.size()); status.resize(prevPts.size()); err.resize(prevPts.size());
+    try{
+        calcOpticalFlowPyrLK(prevGray, image, prevPts, trackedPts, status, err, Size(21,21), 3,
+                                 TermCriteria(TermCriteria::COUNT+TermCriteria::EPS, 30, 0.01), 0, 1e-4);
+    } catch(...) { status.clear(); }
+    trackedFlows.resize(prevPts.size());
+    for(size_t i=0;i<prevPts.size();++i){
+        if(status.size() == prevPts.size() && status[i]){
+            double dx = trackedPts[i].x - prevPts[i].x;
+            double dy = trackedPts[i].y - prevPts[i].y;
+            trackedFlows[i] = std::sqrt(dx*dx + dy*dy);
+        } else trackedFlows[i] = 0.0;
+    }
+
+    // 2) assign a flow value to each candidate: find nearest tracked point within radius
+    const double FLOW_NEIGHBOR_RADIUS = 8.0; // px
+    double diag = std::sqrt(double(image.cols)*double(image.cols) + double(image.rows)*double(image.rows));
+    struct CandScore { double score; double flow; int idx; };
+    std::vector<CandScore> scored; scored.reserve(candidates.size());
+    for(size_t i=0;i<candidates.size();++i){
+        double flow = 0.0;
+        if(!trackedFlows.empty()){
+            double bestd = FLOW_NEIGHBOR_RADIUS*FLOW_NEIGHBOR_RADIUS; int besti = -1;
+            for(size_t j=0;j<trackedFlows.size();++j){
+                if(trackedFlows[j] <= 0.0) continue;
+                double dx = candidates[i].pt.x - trackedPts[j].x;
+                double dy = candidates[i].pt.y - trackedPts[j].y;
+                double d2 = dx*dx + dy*dy;
+                if(d2 < bestd){ bestd = d2; besti = (int)j; }
+            }
+            if(besti >= 0) flow = trackedFlows[besti];
+        }
+        double resp = candidates[i].response;
+        double norm_flow = diag > 0.0 ? (flow / diag) : flow;
+        double score = resp * (1.0 + flow_lambda * norm_flow);
+        scored.push_back({score, flow, (int)i});
+    }
+
+    // 3) grid allocation (ORB-style): split into grid and take top per-cell
+    const int GRID_ROWS = 8;
+    const int GRID_COLS = 8;
+    int cellW = std::max(1, image.cols / GRID_COLS);
+    int cellH = std::max(1, image.rows / GRID_ROWS);
+    int cellCap = (nfeatures_ + GRID_ROWS*GRID_COLS - 1) / (GRID_ROWS*GRID_COLS);
+    std::vector<std::vector<CandScore>> buckets(GRID_ROWS * GRID_COLS);
+    for(const auto &c: scored){
+        const KeyPoint &kp = candidates[c.idx];
+        int cx = std::min(GRID_COLS-1, std::max(0, int(kp.pt.x) / cellW));
+        int cy = std::min(GRID_ROWS-1, std::max(0, int(kp.pt.y) / cellH));
+        buckets[cy*GRID_COLS + cx].push_back(c);
+    }
+
+    std::vector<KeyPoint> selected; selected.reserve(nfeatures_);
+    for(auto &b: buckets){
+        if(b.empty()) continue;
+        std::sort(b.begin(), b.end(), [](const CandScore &a, const CandScore &b){ return a.score > b.score; });
+        int take = std::min((int)b.size(), cellCap);
+        for(int i=0;i<take && (int)selected.size() < nfeatures_; ++i){
+            selected.push_back(candidates[b[i].idx]);
+        }
+    }
+
+    // if we still have space, fill from all candidates by global score
+    if((int)selected.size() < nfeatures_){
+        std::vector<CandScore> all = scored;
+        std::sort(all.begin(), all.end(), [](const CandScore &a, const CandScore &b){ return a.score > b.score; });
+        for(const auto &c: all){
+            if((int)selected.size() >= nfeatures_) break;
+            bool dup = false;
+            for(const auto &s: selected){ if(norm(s.pt - candidates[c.idx].pt) < 1.0){ dup = true; break; } }
+            if(!dup) selected.push_back(candidates[c.idx]);
+        }
+    }
+
+    if(selected.empty()) return;
+    orb_->compute(image, selected, desc);
+    kps = std::move(selected);
+}
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/src/initializer.cpp b/modules/slam/src/initializer.cpp
new file mode 100644
index 0000000000..2bdd5a9924
--- /dev/null
+++ b/modules/slam/src/initializer.cpp
@@ -0,0 +1,406 @@
+#include "opencv2/slam/initializer.hpp"
+#include <opencv2/calib3d.hpp>
+#include <iostream>
+#include <algorithm>
+
+namespace cv {
+namespace vo {
+
+Initializer::Initializer() {}
+
+bool Initializer::initialize(const std::vector<KeyPoint> &kps1,
+                             const std::vector<KeyPoint> &kps2,
+                             const std::vector<DMatch> &matches,
+                             double fx, double fy, double cx, double cy,
+                             Mat &R, Mat &t,
+                             std::vector<Point3d> &points3D,
+                             std::vector<bool> &isTriangulated) {
+    
+    if(matches.size() < 50) {
+        std::cout << "Initializer: too few matches (" << matches.size() << ")" << std::endl;
+        return false;
+    }
+    
+    // Extract matched points
+    std::vector<Point2f> pts1, pts2;
+    pts1.reserve(matches.size());
+    pts2.reserve(matches.size());
+    
+    for(const auto &m : matches) {
+        pts1.push_back(kps1[m.queryIdx].pt);
+        pts2.push_back(kps2[m.trainIdx].pt);
+    }
+    
+    // Estimate both Homography and Fundamental
+    std::vector<uchar> inliersH, inliersF;
+    Mat H = findHomography(pts1, pts2, RANSAC, 3.0, inliersH, 2000, 0.999);
+    Mat F = findFundamentalMat(pts1, pts2, FM_RANSAC, 3.0, 0.999, inliersF);
+    
+    if(H.empty() || F.empty()) {
+        std::cout << "Initializer: failed to compute H or F" << std::endl;
+        return false;
+    }
+    
+    // Compute scores
+    std::vector<bool> inlH, inlF;
+    float scoreH = computeScore(H, H.inv(), pts1, pts2, inlH, 1.0);
+    float scoreF = computeScoreF(F, pts1, pts2, inlF, 1.0);
+    
+    float ratio = scoreH / (scoreH + scoreF);
+    
+    std::cout << "Initializer: H score=" << scoreH << " F score=" << scoreF 
+              << " ratio=" << ratio << std::endl;
+    
+    // Decide between H and F
+    // If ratio > 0.45, scene is likely planar, use H
+    // Otherwise use F for general scenes
+    bool useH = (ratio > 0.45);
+    
+    Mat R_out, t_out;
+    std::vector<Point3d> pts3D;
+    std::vector<bool> isTri;
+    float parallax = 0.0f;
+    
+    bool success = false;
+    if(useH) {
+        std::cout << "Initializer: using Homography" << std::endl;
+        success = reconstructH(pts1, pts2, H, fx, fy, cx, cy, R_out, t_out, pts3D, isTri, parallax);
+    } else {
+        std::cout << "Initializer: using Fundamental" << std::endl;
+        success = reconstructF(pts1, pts2, F, fx, fy, cx, cy, R_out, t_out, pts3D, isTri, parallax);
+    }
+    
+    if(!success) {
+        std::cout << "Initializer: reconstruction failed" << std::endl;
+        return false;
+    }
+    
+    // Count good triangulated points
+    int goodCount = 0;
+    for(bool b : isTri) if(b) goodCount++;
+    
+    std::cout << "Initializer: triangulated " << goodCount << "/" << pts3D.size() 
+              << " points, parallax=" << parallax << std::endl;
+    
+    // Check quality: need enough good points
+    if(goodCount < 50) {
+        std::cout << "Initializer: too few good points (" << goodCount << ")" << std::endl;
+        return false;
+    }
+    
+    // Check parallax
+    if(parallax < 1.0f) {
+        std::cout << "Initializer: insufficient parallax (" << parallax << ")" << std::endl;
+        return false;
+    }
+    
+    // Success
+    R = R_out;
+    t = t_out;
+    points3D = pts3D;
+    isTriangulated = isTri;
+    
+    std::cout << "Initializer: SUCCESS!" << std::endl;
+    return true;
+}
+
+bool Initializer::checkParallax(const std::vector<KeyPoint> &kps1,
+                                const std::vector<KeyPoint> &kps2,
+                                const std::vector<DMatch> &matches,
+                                double minMedianParallax) {
+    if(matches.empty()) return false;
+    
+    std::vector<double> parallaxes;
+    parallaxes.reserve(matches.size());
+    
+    for(const auto &m : matches) {
+        Point2f p1 = kps1[m.queryIdx].pt;
+        Point2f p2 = kps2[m.trainIdx].pt;
+        double dx = p2.x - p1.x;
+        double dy = p2.y - p1.y;
+        parallaxes.push_back(std::sqrt(dx*dx + dy*dy));
+    }
+    
+    std::sort(parallaxes.begin(), parallaxes.end());
+    double median = parallaxes[parallaxes.size()/2];
+    
+    return median >= minMedianParallax;
+}
+
+bool Initializer::reconstructF(const std::vector<Point2f> &pts1,
+                               const std::vector<Point2f> &pts2,
+                               const Mat &F,
+                               double fx, double fy, double cx, double cy,
+                               Mat &R, Mat &t,
+                               std::vector<Point3d> &points3D,
+                               std::vector<bool> &isTriangulated,
+                               float &parallax) {
+    
+    // Compute Essential matrix from F
+    Mat K = (Mat_<double>(3,3) << fx, 0, cx, 0, fy, cy, 0, 0, 1);
+    Mat E = K.t() * F * K;
+    
+    // Recover pose from E
+    Mat mask;
+    int inliers = recoverPose(E, pts1, pts2, K, R, t, mask);
+    
+    if(inliers < 30) return false;
+    
+    // Triangulate
+    points3D.resize(pts1.size());
+    isTriangulated.resize(pts1.size(), false);
+    
+    Mat P1 = Mat::eye(3, 4, CV_64F);
+    Mat P2(3, 4, CV_64F);
+    for(int i = 0; i < 3; ++i) {
+        for(int j = 0; j < 3; ++j) P2.at<double>(i,j) = R.at<double>(i,j);
+        P2.at<double>(i, 3) = t.at<double>(i, 0);
+    }
+    
+    triangulate(P1, P2, pts1, pts2, points3D);
+    
+    // Check quality
+    std::vector<bool> isGood;
+    int nGood = checkRT(R, t, pts1, pts2, points3D, isGood, fx, fy, cx, cy, parallax);
+    
+    isTriangulated = isGood;
+    return nGood >= 30;
+}
+
+bool Initializer::reconstructH(const std::vector<Point2f> &pts1,
+                               const std::vector<Point2f> &pts2,
+                               const Mat &H,
+                               double fx, double fy, double cx, double cy,
+                               Mat &R, Mat &t,
+                               std::vector<Point3d> &points3D,
+                               std::vector<bool> &isTriangulated,
+                               float &parallax) {
+    
+    // Decompose H to get multiple solutions
+    std::vector<Mat> Rs, ts, normals;
+    decomposeH(H, Rs, ts, normals);
+    
+    // Try all solutions and pick best
+    int bestGood = 0;
+    int bestIdx = -1;
+    std::vector<std::vector<Point3d>> allPoints(Rs.size());
+    std::vector<std::vector<bool>> allGood(Rs.size());
+    std::vector<float> allParallax(Rs.size());
+    
+    for(size_t i = 0; i < Rs.size(); ++i) {
+        std::vector<Point3d> pts3D;
+        std::vector<bool> isGood;
+        float par = 0.0f;
+        
+        Mat P1 = Mat::eye(3, 4, CV_64F);
+        Mat P2(3, 4, CV_64F);
+        for(int r = 0; r < 3; ++r) {
+            for(int c = 0; c < 3; ++c) P2.at<double>(r,c) = Rs[i].at<double>(r,c);
+            P2.at<double>(r, 3) = ts[i].at<double>(r, 0);
+        }
+        
+        triangulate(P1, P2, pts1, pts2, pts3D);
+        int nGood = checkRT(Rs[i], ts[i], pts1, pts2, pts3D, isGood, fx, fy, cx, cy, par);
+        
+        allPoints[i] = pts3D;
+        allGood[i] = isGood;
+        allParallax[i] = par;
+        
+        if(nGood > bestGood) {
+            bestGood = nGood;
+            bestIdx = i;
+        }
+    }
+    
+    if(bestIdx < 0 || bestGood < 30) return false;
+    
+    R = Rs[bestIdx];
+    t = ts[bestIdx];
+    points3D = allPoints[bestIdx];
+    isTriangulated = allGood[bestIdx];
+    parallax = allParallax[bestIdx];
+    
+    return true;
+}
+
+int Initializer::checkRT(const Mat &R, const Mat &t,
+                         const std::vector<Point2f> &pts1,
+                         const std::vector<Point2f> &pts2,
+                         const std::vector<Point3d> &points3D,
+                         std::vector<bool> &isGood,
+                         double fx, double fy, double cx, double cy,
+                         float &parallax) {
+    
+    isGood.resize(points3D.size(), false);
+    
+    Mat R1 = Mat::eye(3, 3, CV_64F);
+    Mat t1 = Mat::zeros(3, 1, CV_64F);
+    Mat R2 = R;
+    Mat t2 = t;
+    
+    int nGood = 0;
+    std::vector<float> cosParallaxes;
+    cosParallaxes.reserve(points3D.size());
+    
+    for(size_t i = 0; i < points3D.size(); ++i) {
+        const Point3d &p3d = points3D[i];
+        
+        // Check depth in first camera
+        Mat p3dMat = (Mat_<double>(3,1) << p3d.x, p3d.y, p3d.z);
+        Mat p1 = R1 * p3dMat + t1;
+        double z1 = p1.at<double>(2, 0);
+        
+        if(z1 <= 0) continue;
+        
+        // Check depth in second camera
+        Mat p2 = R2 * p3dMat + t2;
+        double z2 = p2.at<double>(2, 0);
+        
+        if(z2 <= 0) continue;
+        
+        // Check reprojection error in first camera
+        double u1 = fx * p1.at<double>(0,0)/z1 + cx;
+        double v1 = fy * p1.at<double>(1,0)/z1 + cy;
+        double err1 = std::sqrt(std::pow(u1 - pts1[i].x, 2) + std::pow(v1 - pts1[i].y, 2));
+        
+        if(err1 > 4.0) continue;
+        
+        // Check reprojection error in second camera
+        double u2 = fx * p2.at<double>(0,0)/z2 + cx;
+        double v2 = fy * p2.at<double>(1,0)/z2 + cy;
+        double err2 = std::sqrt(std::pow(u2 - pts2[i].x, 2) + std::pow(v2 - pts2[i].y, 2));
+        
+        if(err2 > 4.0) continue;
+        
+        // Check parallax
+        Mat normal1 = p3dMat / norm(p3dMat);
+        Mat normal2 = (p3dMat - t2) / norm(p3dMat - t2);
+        double cosParallax = normal1.dot(normal2);
+        
+        cosParallaxes.push_back(cosParallax);
+        
+        isGood[i] = true;
+        nGood++;
+    }
+    
+    if(!cosParallaxes.empty()) {
+        std::sort(cosParallaxes.begin(), cosParallaxes.end());
+        float medianCos = cosParallaxes[cosParallaxes.size()/2];
+        parallax = std::acos(medianCos) * 180.0 / CV_PI;
+    }
+    
+    return nGood;
+}
+
+void Initializer::triangulate(const Mat &P1, const Mat &P2,
+                              const std::vector<Point2f> &pts1,
+                              const std::vector<Point2f> &pts2,
+                              std::vector<Point3d> &points3D) {
+    
+    points3D.resize(pts1.size());
+    
+    Mat pts4D;
+    triangulatePoints(P1, P2, pts1, pts2, pts4D);
+    
+    for(int i = 0; i < pts4D.cols; ++i) {
+        Mat x = pts4D.col(i);
+        x /= x.at<float>(3, 0);
+        points3D[i] = Point3d(x.at<float>(0,0), x.at<float>(1,0), x.at<float>(2,0));
+    }
+}
+
+void Initializer::decomposeH(const Mat &H, std::vector<Mat> &Rs,
+                             std::vector<Mat> &ts, std::vector<Mat> &normals) {
+    
+    Mat H_normalized = H / H.at<double>(2,2);
+    
+    std::vector<Mat> rotations, translations, normalsOut;
+    int solutions = decomposeHomographyMat(H_normalized, Mat::eye(3,3,CV_64F),
+                                               rotations, translations, normalsOut);
+    
+    Rs = rotations;
+    ts = translations;
+    normals = normalsOut;
+}
+
+float Initializer::computeScore(const Mat &H21, const Mat &H12,
+                               const std::vector<Point2f> &pts1,
+                               const std::vector<Point2f> &pts2,
+                               std::vector<bool> &inliersH,
+                               float sigma) {
+    
+    const float th = 5.991 * sigma;
+    inliersH.resize(pts1.size(), false);
+    
+    float score = 0.0f;
+    const float thSq = th * th;
+    
+    for(size_t i = 0; i < pts1.size(); ++i) {
+        // Forward error
+        Mat p1 = (Mat_<double>(3,1) << pts1[i].x, pts1[i].y, 1.0);
+        Mat p2pred = H21 * p1;
+        p2pred /= p2pred.at<double>(2,0);
+        
+        float dx = pts2[i].x - p2pred.at<double>(0,0);
+        float dy = pts2[i].y - p2pred.at<double>(1,0);
+        float errSq = dx*dx + dy*dy;
+        
+        if(errSq < thSq) {
+            score += thSq - errSq;
+        }
+        
+        // Backward error
+        Mat p2 = (Mat_<double>(3,1) << pts2[i].x, pts2[i].y, 1.0);
+        Mat p1pred = H12 * p2;
+        p1pred /= p1pred.at<double>(2,0);
+        
+        dx = pts1[i].x - p1pred.at<double>(0,0);
+        dy = pts1[i].y - p1pred.at<double>(1,0);
+        errSq = dx*dx + dy*dy;
+        
+        if(errSq < thSq) {
+            score += thSq - errSq;
+            inliersH[i] = true;
+        }
+    }
+    
+    return score;
+}
+
+float Initializer::computeScoreF(const Mat &F21,
+                                 const std::vector<Point2f> &pts1,
+                                 const std::vector<Point2f> &pts2,
+                                 std::vector<bool> &inliersF,
+                                 float sigma) {
+    
+    const float th = 3.841 * sigma;
+    const float thSq = th * th;
+    
+    inliersF.resize(pts1.size(), false);
+    float score = 0.0f;
+    
+    for(size_t i = 0; i < pts1.size(); ++i) {
+        Mat p1 = (Mat_<double>(3,1) << pts1[i].x, pts1[i].y, 1.0);
+        Mat p2 = (Mat_<double>(3,1) << pts2[i].x, pts2[i].y, 1.0);
+        
+        // Epipolar line in second image
+        Mat l2 = F21 * p1;
+        float a2 = l2.at<double>(0,0);
+        float b2 = l2.at<double>(1,0);
+        float c2 = l2.at<double>(2,0);
+        
+        float num2 = a2*pts2[i].x + b2*pts2[i].y + c2;
+        float den2 = a2*a2 + b2*b2;
+        float distSq2 = (num2*num2) / den2;
+        
+        if(distSq2 < thSq) {
+            score += thSq - distSq2;
+            inliersF[i] = true;
+        }
+    }
+    
+    return score;
+}
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/src/keyframe.cpp b/modules/slam/src/keyframe.cpp
new file mode 100644
index 0000000000..e69de29bb2
diff --git a/modules/slam/src/localizer.cpp b/modules/slam/src/localizer.cpp
new file mode 100644
index 0000000000..40647f1751
--- /dev/null
+++ b/modules/slam/src/localizer.cpp
@@ -0,0 +1,157 @@
+#include "opencv2/slam/localizer.hpp"
+#include "opencv2/slam/matcher.hpp"
+#include <opencv2/calib3d.hpp>
+#include <filesystem>
+#include <fstream>
+#include <opencv2/imgproc.hpp>
+#include <opencv2/imgcodecs.hpp>
+
+namespace cv {
+namespace vo {
+
+Localizer::Localizer(float ratio) : ratio_(ratio) {}
+
+bool Localizer::tryPnP(const MapManager &map, const Mat &desc, const std::vector<KeyPoint> &kps,
+                       double fx, double fy, double cx, double cy, int imgW, int imgH,
+                       int min_inliers,
+                       Mat &R_out, Mat &t_out, int &inliers_out,
+                       int frame_id, const Mat *image, const std::string &outDir,
+                       int *out_preMatches, int *out_postMatches, double *out_meanReproj) const {
+    inliers_out = 0; R_out.release(); t_out.release();
+    const auto &mappoints = map.mappoints();
+    const auto &keyframes = map.keyframes();
+    if(mappoints.empty() || keyframes.empty() || desc.empty()) return false;
+
+    // Use last keyframe as prior
+    const KeyFrame &last = keyframes.back();
+    Mat lastR = last.R_w, lastT = last.t_w;
+
+    // select visible candidates
+    std::vector<int> candidates = map.findVisibleCandidates(lastR, lastT, fx, fy, cx, cy, imgW, imgH);
+    if(candidates.empty()) return false;
+
+    // gather descriptors from map (prefer mp.descriptor if available)
+    Mat trainDesc;
+    std::vector<Point3f> objPts; objPts.reserve(candidates.size());
+    std::vector<int> trainMpIds; trainMpIds.reserve(candidates.size());
+    for(int idx: candidates){
+        const auto &mp = mappoints[idx];
+        if(mp.observations.empty()) continue;
+        // prefer representative descriptor on MapPoint
+        if(!mp.descriptor.empty()){
+            trainDesc.push_back(mp.descriptor.row(0));
+        } else {
+            auto ob = mp.observations.front();
+            int kfid = ob.first; int kpidx = ob.second;
+            int kfIdx = map.keyframeIndex(kfid);
+            if(kfIdx < 0) continue;
+            const KeyFrame &kf = keyframes[kfIdx];
+            if(kf.desc.empty() || kpidx < 0 || kpidx >= kf.desc.rows) continue;
+            trainDesc.push_back(kf.desc.row(kpidx));
+        }
+        objPts.emplace_back((float)mp.p.x, (float)mp.p.y, (float)mp.p.z);
+        trainMpIds.push_back(mp.id);
+    }
+    if(trainDesc.empty()) return false;
+
+    // Forward and backward knn to enable mutual cross-check
+    BFMatcher bf(NORM_HAMMING);
+    std::vector<std::vector<DMatch>> knnF, knnB;
+    bf.knnMatch(desc, trainDesc, knnF, 2);
+    bf.knnMatch(trainDesc, desc, knnB, 1);
+
+    int preMatches = static_cast<int>(knnF.size());
+    if(out_preMatches) *out_preMatches = preMatches;
+
+    // Ratio + mutual
+    const float RATIO = ratio_;
+    std::vector<DMatch> goodMatches;
+    goodMatches.reserve(knnF.size());
+    for(size_t q=0;q<knnF.size();++q){
+        if(knnF[q].empty()) continue;
+        const DMatch &m0 = knnF[q][0];
+        if(knnF[q].size() >= 2){
+            const DMatch &m1 = knnF[q][1];
+            if(m0.distance > RATIO * m1.distance) continue;
+        }
+        int trainIdx = m0.trainIdx;
+        // mutual check: ensure best match of trainIdx points back to this query
+        if(trainIdx < 0 || trainIdx >= static_cast<int>(knnB.size())) continue;
+        if(knnB[trainIdx].empty()) continue;
+        int backIdx = knnB[trainIdx][0].trainIdx; // index in desc
+        if(backIdx != static_cast<int>(q)) continue;
+        // passed ratio and mutual
+        goodMatches.push_back(DMatch(static_cast<int>(q), trainIdx, m0.distance));
+    }
+
+    if(out_postMatches) *out_postMatches = static_cast<int>(goodMatches.size());
+
+    if(goodMatches.size() < static_cast<size_t>(std::max(6, min_inliers))) return false;
+
+    // build PnP inputs
+    std::vector<Point3f> obj; std::vector<Point2f> imgpts; obj.reserve(goodMatches.size()); imgpts.reserve(goodMatches.size());
+    std::vector<int> matchedMpIds; matchedMpIds.reserve(goodMatches.size());
+    for(const auto &m: goodMatches){
+        int q = m.queryIdx; int t = m.trainIdx;
+        if(t < 0 || t >= static_cast<int>(objPts.size()) || q < 0 || q >= static_cast<int>(kps.size())) continue;
+        obj.push_back(objPts[t]);
+        imgpts.push_back(kps[q].pt);
+        matchedMpIds.push_back(trainMpIds[t]);
+    }
+
+    if(obj.size() < static_cast<size_t>(std::max(6, min_inliers))) return false;
+
+    Mat camera = (Mat_<double>(3,3) << fx,0,cx, 0,fy,cy, 0,0,1);
+    Mat dist = Mat::zeros(4,1,CV_64F);
+    std::vector<int> inliersIdx;
+    bool ok = solvePnPRansac(obj, imgpts, camera, dist, R_out, t_out, false,
+                                 100, 8.0, 0.99, inliersIdx, SOLVEPNP_ITERATIVE);
+    if(!ok) return false;
+    inliers_out = static_cast<int>(inliersIdx.size());
+
+    // compute mean reprojection error on inliers
+    double meanReproj = 0.0;
+    if(!inliersIdx.empty()){
+        std::vector<Point2f> proj;
+        projectPoints(obj, R_out, t_out, camera, dist, proj);
+        double sum = 0.0;
+        for(int idx: inliersIdx){
+            double e = std::hypot(proj[idx].x - imgpts[idx].x, proj[idx].y - imgpts[idx].y);
+            sum += e;
+        }
+        meanReproj = sum / inliersIdx.size();
+    }
+    if(out_meanReproj) *out_meanReproj = meanReproj;
+
+    // Diagnostics: draw matches and inliers if requested
+    if(!outDir.empty() && image){
+        try{
+            std::filesystem::create_directories(outDir);
+            Mat vis;
+            if(image->channels() == 1) cvtColor(*image, vis, COLOR_GRAY2BGR);
+            else vis = image->clone();
+            // draw all good matches as small circles; inliers green
+            for(size_t i=0;i<goodMatches.size();++i){
+                Point2f p = imgpts[i];
+                bool isInlier = std::find(inliersIdx.begin(), inliersIdx.end(), static_cast<int>(i)) != inliersIdx.end();
+                Scalar col = isInlier ? Scalar(0,255,0) : Scalar(0,0,255);
+                circle(vis, p, 3, col, 2, LINE_AA);
+            }
+            std::ostringstream name; name << outDir << "/pnp_frame_" << frame_id << ".png";
+            putText(vis, "pre=" + std::to_string(preMatches) + " post=" + std::to_string(goodMatches.size()) + " inliers=" + std::to_string(inliers_out) + " mean_px=" + std::to_string(meanReproj),
+                        Point(10,20), FONT_HERSHEY_SIMPLEX, 0.6, Scalar(255,255,255), 2);
+            imwrite(name.str(), vis);
+            // append a small CSV-like log
+            std::ofstream logf((outDir + "/pnp_stats.csv"), std::ios::app);
+            if(logf){
+                logf << frame_id << "," << preMatches << "," << goodMatches.size() << "," << inliers_out << "," << meanReproj << "\n";
+                logf.close();
+            }
+        } catch(...) { /* don't crash on diagnostics */ }
+    }
+
+    return inliers_out >= min_inliers;
+}
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/src/map.cpp b/modules/slam/src/map.cpp
new file mode 100644
index 0000000000..670eaff63c
--- /dev/null
+++ b/modules/slam/src/map.cpp
@@ -0,0 +1,319 @@
+#include "opencv2/slam/map.hpp"
+#include <opencv2/calib3d.hpp>
+#include <iostream>
+#include <algorithm>
+#include <limits>
+
+namespace cv {
+namespace vo {
+
+MapManager::MapManager() {}
+
+void MapManager::addKeyFrame(const KeyFrame &kf){
+    keyframes_.push_back(kf);
+    id2idx_[kf.id] = static_cast<int>(keyframes_.size()) - 1;
+}
+
+void MapManager::addMapPoints(const std::vector<MapPoint> &pts){
+    for(auto p: pts) {
+        if(p.id <= 0) p.id = next_mappoint_id_++;
+        mpid2idx_[p.id] = static_cast<int>(mappoints_.size());
+        mappoints_.push_back(p);
+    }
+}
+
+std::vector<int> MapManager::findVisibleCandidates(const Mat &lastR, const Mat &lastT,
+                                                   double fx, double fy, double cx, double cy,
+                                                   int imgW, int imgH) const {
+    std::vector<int> candidates; candidates.reserve(mappoints_.size());
+    for(size_t mi=0; mi<mappoints_.size(); ++mi){
+        const auto &mp = mappoints_[mi];
+        Mat Xw = (Mat_<double>(3,1) << mp.p.x, mp.p.y, mp.p.z);
+        Mat Xc = lastR.t() * (Xw - lastT);
+        double z = Xc.at<double>(2,0);
+        if(z <= 0) continue;
+        double u = fx * (Xc.at<double>(0,0)/z) + cx;
+        double v = fy * (Xc.at<double>(1,0)/z) + cy;
+        if(u >= 0 && u < imgW && v >= 0 && v < imgH) candidates.push_back((int)mi);
+    }
+    return candidates;
+}
+
+std::vector<MapPoint> MapManager::triangulateBetweenLastTwo(const std::vector<Point2f> &pts1n,
+                                                            const std::vector<Point2f> &pts2n,
+                                                            const std::vector<int> &pts1_kp_idx,
+                                                            const std::vector<int> &pts2_kp_idx,
+                                                            const KeyFrame &lastKf, const KeyFrame &curKf,
+                                                            double fx, double fy, double cx, double cy){
+    std::vector<MapPoint> newPoints;
+    if(pts1n.empty() || pts2n.empty()) return newPoints;
+    // Relative pose from last -> current (we expect lastKf and curKf poses to be in world)
+    // compute relative transformation
+    // P1 = [I|0], P2 = [R_rel|t_rel] where R_rel = R_last^{-1} * R_cur, t_rel = R_last^{-1}*(t_cur - t_last)
+    Mat R_last = lastKf.R_w, t_last = lastKf.t_w;
+    Mat R_cur = curKf.R_w, t_cur = curKf.t_w;
+    Mat R_rel = R_last.t() * R_cur;
+    Mat t_rel = R_last.t() * (t_cur - t_last);
+    Mat P1 = Mat::eye(3,4,CV_64F);
+    Mat P2(3,4,CV_64F);
+    for(int r=0;r<3;++r){
+        for(int c=0;c<3;++c) P2.at<double>(r,c) = R_rel.at<double>(r,c);
+        P2.at<double>(r,3) = t_rel.at<double>(r,0);
+    }
+    Mat points4D;
+    try{ triangulatePoints(P1, P2, pts1n, pts2n, points4D); }
+    catch(...) { points4D.release(); }
+    if(points4D.empty()) return newPoints;
+    Mat p4d64;
+    if(points4D.type() != CV_64F) points4D.convertTo(p4d64, CV_64F); else p4d64 = points4D;
+    for(int c=0;c<p4d64.cols; ++c){
+        double w = p4d64.at<double>(3,c);
+        if(std::abs(w) < 1e-8) continue;
+        double Xx = p4d64.at<double>(0,c)/w;
+        double Xy = p4d64.at<double>(1,c)/w;
+        double Xz = p4d64.at<double>(2,c)/w;
+        if(Xz <= 0) continue;
+        Mat Xc = (Mat_<double>(3,1) << Xx, Xy, Xz);
+        Mat Xw = lastKf.R_w * Xc + lastKf.t_w;
+        MapPoint mp; mp.p = Point3d(Xw.at<double>(0,0), Xw.at<double>(1,0), Xw.at<double>(2,0));
+        // compute reprojection error in both views (pixel coords)
+        // project into last
+        Mat Xc_last = Xc;
+        double u1 = fx * (Xc_last.at<double>(0,0)/Xc_last.at<double>(2,0)) + cx;
+        double v1 = fy * (Xc_last.at<double>(1,0)/Xc_last.at<double>(2,0)) + cy;
+        // project into current: Xc_cur = R_rel * Xc + t_rel (we computed P2 earlier)
+        Mat Xc_cur = R_rel * Xc + t_rel;
+        double u2 = fx * (Xc_cur.at<double>(0,0)/Xc_cur.at<double>(2,0)) + cx;
+        double v2 = fy * (Xc_cur.at<double>(1,0)/Xc_cur.at<double>(2,0)) + cy;
+        // obtain observed pixel locations
+        double obs_u1 = -1, obs_v1 = -1, obs_u2 = -1, obs_v2 = -1;
+        if(c < static_cast<int>(pts1_kp_idx.size())){
+            // pts1n/pts2n are normalized coords; but we were given kp indices - use them if valid
+            int kp1 = pts1_kp_idx[c];
+            if(kp1 >= 0 && kp1 < static_cast<int>(lastKf.kps.size())){
+                obs_u1 = lastKf.kps[kp1].pt.x; obs_v1 = lastKf.kps[kp1].pt.y;
+            }
+        }
+        if(c < static_cast<int>(pts2_kp_idx.size())){
+            int kp2 = pts2_kp_idx[c];
+            if(kp2 >= 0 && kp2 < static_cast<int>(curKf.kps.size())){
+                obs_u2 = curKf.kps[kp2].pt.x; obs_v2 = curKf.kps[kp2].pt.y;
+            }
+        }
+        // if we have observed pixel locations, check reprojection error
+        bool pass = true;
+        const double MAX_REPROJ_PX = 2.0;
+        if(obs_u1 >= 0 && obs_v1 >= 0){
+            double e1 = std::hypot(u1 - obs_u1, v1 - obs_v1);
+            if(e1 > MAX_REPROJ_PX) pass = false;
+        }
+        if(obs_u2 >= 0 && obs_v2 >= 0){
+            double e2 = std::hypot(u2 - obs_u2, v2 - obs_v2);
+            if(e2 > MAX_REPROJ_PX) pass = false;
+        }
+        // parallax check: angle between viewing rays (in last frame)
+        Mat ray1 = Xc_last / norm(Xc_last);
+        Mat ray2 = Xc_cur / norm(Xc_cur);
+        double cos_par = ray1.dot(ray2);
+        double parallax = std::acos(std::min(1.0, std::max(-1.0, cos_par)));
+        const double MIN_PARALLAX_RAD = 1.0 * CV_PI / 180.0; // 1 degree
+        if(parallax < MIN_PARALLAX_RAD) pass = false;
+        if(!pass) continue;
+        // attach observations using provided keypoint indices when available
+        int kp1idx = (c < static_cast<int>(pts1_kp_idx.size())) ? pts1_kp_idx[c] : -1;
+        int kp2idx = (c < static_cast<int>(pts2_kp_idx.size())) ? pts2_kp_idx[c] : -1;
+        if(kp1idx >= 0) mp.observations.emplace_back(lastKf.id, kp1idx);
+        if(kp2idx >= 0) mp.observations.emplace_back(curKf.id, kp2idx);
+        // assign id
+        mp.id = next_mappoint_id_++;
+        mpid2idx_[mp.id] = static_cast<int>(mappoints_.size()) + static_cast<int>(newPoints.size());
+        newPoints.push_back(mp);
+    }
+    // append to internal map
+    for(const auto &p: newPoints) mappoints_.push_back(p);
+    return newPoints;
+}
+
+int MapManager::keyframeIndex(int id) const{
+    auto it = id2idx_.find(id);
+    if(it == id2idx_.end()) return -1;
+    return it->second;
+}
+
+int MapManager::mapPointIndex(int id) const{
+    auto it = mpid2idx_.find(id);
+    if(it == mpid2idx_.end()) return -1;
+    return it->second;
+}
+
+void MapManager::applyOptimizedKeyframePose(int keyframeId, const Mat &R, const Mat &t){
+    int idx = keyframeIndex(keyframeId);
+    if(idx < 0 || idx >= static_cast<int>(keyframes_.size())) return;
+    keyframes_[idx].R_w = R.clone();
+    keyframes_[idx].t_w = t.clone();
+}
+
+void MapManager::applyOptimizedMapPoint(int mappointId, const Point3d &p){
+    int idx = mapPointIndex(mappointId);
+    if(idx < 0 || idx >= static_cast<int>(mappoints_.size())) return;
+    mappoints_[idx].p = p;
+}
+
+void MapManager::cullBadMapPoints() {
+    const double MAX_REPROJ_ERROR = 3.0;  // pixels
+    const int MIN_OBSERVATIONS = 2;
+    const float MIN_FOUND_RATIO = 0.25f;
+    
+    for(auto &mp : mappoints_) {
+        if(mp.isBad) continue;
+        
+        // 1. Check observation count
+        mp.nObs = static_cast<int>(mp.observations.size());
+        if(mp.nObs < MIN_OBSERVATIONS) {
+            mp.isBad = true;
+            continue;
+        }
+        
+        // 2. Check found ratio (avoid points rarely tracked)
+        if(mp.nVisible > 10 && mp.getFoundRatio() < MIN_FOUND_RATIO) {
+            mp.isBad = true;
+            continue;
+        }
+        
+        // 3. Check reprojection error across observations
+        // Sample a few keyframes to check reprojection
+        int errorCount = 0;
+        int checkCount = 0;
+        for(const auto &obs : mp.observations) {
+            int kfId = obs.first;
+            int kfIdx = keyframeIndex(kfId);
+            if(kfIdx < 0 || kfIdx >= static_cast<int>(keyframes_.size())) continue;
+            
+            const KeyFrame &kf = keyframes_[kfIdx];
+            // Use default camera params (should be passed in production code)
+            double fx = 500.0, fy = 500.0, cx = 320.0, cy = 240.0;
+            double error = computeReprojError(mp, kf, fx, fy, cx, cy);
+            
+            checkCount++;
+            if(error > MAX_REPROJ_ERROR) {
+                errorCount++;
+            }
+            
+            // Sample up to 3 observations for efficiency
+            if(checkCount >= 3) break;
+        }
+        
+        // If majority of samples have high error, mark as bad
+        if(checkCount > 0 && errorCount > checkCount / 2) {
+            mp.isBad = true;
+        }
+    }
+    
+    // Remove bad points
+    size_t before = mappoints_.size();
+    mappoints_.erase(
+        std::remove_if(mappoints_.begin(), mappoints_.end(),
+            [](const MapPoint &p) { return p.isBad; }),
+        mappoints_.end()
+    );
+    size_t after = mappoints_.size();
+    
+    if(before - after > 0) {
+        std::cout << "MapManager: culled " << (before - after) << " bad map points ("
+                  << after << " remain)" << std::endl;
+    }
+}
+
+double MapManager::computeReprojError(const MapPoint &mp, const KeyFrame &kf,
+                                      double fx, double fy, double cx, double cy) const {
+    // Transform world point to camera frame
+    Mat Xw = (Mat_<double>(3,1) << mp.p.x, mp.p.y, mp.p.z);
+    Mat Xc = kf.R_w.t() * (Xw - kf.t_w);
+    
+    double z = Xc.at<double>(2, 0);
+    if(z <= 0) return std::numeric_limits<double>::max();
+    
+    // Project to image
+    double u = fx * (Xc.at<double>(0, 0) / z) + cx;
+    double v = fy * (Xc.at<double>(1, 0) / z) + cy;
+    
+    // Find corresponding observation in this keyframe
+    Point2f observed(-1, -1);
+    for(const auto &obs : mp.observations) {
+        if(obs.first == kf.id) {
+            int kpIdx = obs.second;
+            if(kpIdx >= 0 && kpIdx < static_cast<int>(kf.kps.size())) {
+                observed = kf.kps[kpIdx].pt;
+                break;
+            }
+        }
+    }
+    
+    if(observed.x < 0) return std::numeric_limits<double>::max();
+    
+    // Compute reprojection error
+    double dx = u - observed.x;
+    double dy = v - observed.y;
+    return std::sqrt(dx * dx + dy * dy);
+}
+
+void MapManager::updateMapPointDescriptor(MapPoint &mp) {
+    if(mp.observations.empty()) return;
+    
+    // Collect all descriptors from observations
+    std::vector<Mat> descriptors;
+    for(const auto &obs : mp.observations) {
+        int kfIdx = keyframeIndex(obs.first);
+        if(kfIdx < 0) continue;
+        
+        const KeyFrame &kf = keyframes_[kfIdx];
+        int kpIdx = obs.second;
+        if(kpIdx >= 0 && kpIdx < kf.desc.rows) {
+            descriptors.push_back(kf.desc.row(kpIdx));
+        }
+    }
+    
+    if(descriptors.empty()) return;
+    
+    // Compute median descriptor (for binary descriptors, use majority voting per bit)
+    if(descriptors[0].type() == CV_8U) {
+        // Binary descriptor (ORB)
+        int bytes = descriptors[0].cols;
+        Mat median = Mat::zeros(1, bytes, CV_8U);
+        
+        for(int b = 0; b < bytes; ++b) {
+            int bitCount[8] = {0};
+            for(const auto &desc : descriptors) {
+                uchar byte = desc.at<uchar>(0, b);
+                for(int bit = 0; bit < 8; ++bit) {
+                    if(byte & (1 << bit)) bitCount[bit]++;
+                }
+            }
+            
+            uchar medianByte = 0;
+            int threshold = descriptors.size() / 2;
+            for(int bit = 0; bit < 8; ++bit) {
+                if(bitCount[bit] > threshold) {
+                    medianByte |= (1 << bit);
+                }
+            }
+            median.at<uchar>(0, b) = medianByte;
+        }
+        
+        mp.descriptor = median;
+    } else {
+        // Fallback: use first descriptor
+        mp.descriptor = descriptors[0].clone();
+    }
+}
+
+int MapManager::countGoodMapPoints() const {
+    int count = 0;
+    for(const auto &mp : mappoints_) {
+        if(!mp.isBad) count++;
+    }
+    return count;
+}
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/src/matcher.cpp b/modules/slam/src/matcher.cpp
new file mode 100644
index 0000000000..e0579793d3
--- /dev/null
+++ b/modules/slam/src/matcher.cpp
@@ -0,0 +1,132 @@
+#include "opencv2/slam/matcher.hpp"
+
+namespace cv {
+namespace vo {
+
+Matcher::Matcher(float ratio)
+    : ratio_(ratio), bf_(NORM_HAMMING)
+{
+}
+
+void Matcher::knnMatch(const Mat &desc1, const Mat &desc2, std::vector<DMatch> &goodMatches)
+{
+    goodMatches.clear();
+    if(desc1.empty() || desc2.empty()) return;
+    std::vector<std::vector<DMatch>> knn;
+    bf_.knnMatch(desc1, desc2, knn, 2);
+    for(size_t i=0;i<knn.size();++i){
+        if(knn[i].size() < 2) continue;
+        const DMatch &m1 = knn[i][0];
+        const DMatch &m2 = knn[i][1];
+        if(m1.distance < ratio_ * m2.distance) goodMatches.push_back(m1);
+    }
+}
+
+void Matcher::match(const Mat &desc1, const Mat &desc2,
+                    const std::vector<KeyPoint> &kps1, const std::vector<KeyPoint> &kps2,
+                    std::vector<DMatch> &goodMatches,
+                    int imgCols, int imgRows,
+                    int bucketRows, int bucketCols, int topKPerBucket,
+                    int maxTotal, bool enableMutual, bool enableBucketing)
+{
+    goodMatches.clear();
+    if(desc1.empty() || desc2.empty()) return;
+    // 1) knn match desc1 -> desc2 and apply ratio test
+    std::vector<std::vector<DMatch>> knn12;
+    bf_.knnMatch(desc1, desc2, knn12, 2);
+    const int n1 = static_cast<int>(knn12.size());
+
+    std::vector<int> best12(n1, -1); // best trainIdx for each query if ratio test passed
+    for(int i=0;i<n1;++i){
+        if(knn12[i].size() < 2) continue;
+        const DMatch &m1 = knn12[i][0];
+        const DMatch &m2 = knn12[i][1];
+        if(m1.distance < ratio_ * m2.distance) best12[i] = m1.trainIdx;
+    }
+
+    // 2) optionally perform reverse matching for mutual check
+    std::vector<int> best21; // only filled if enableMutual
+    int n2 = 0;
+    if(enableMutual){
+        std::vector<std::vector<DMatch>> knn21;
+        bf_.knnMatch(desc2, desc1, knn21, 1);
+        n2 = static_cast<int>(knn21.size());
+        best21.assign(n2, -1);
+        for(int j=0;j<n2;++j){
+            if(knn21[j].size() < 1) continue;
+            best21[j] = knn21[j][0].trainIdx;
+        }
+    } else {
+        // if no mutual check, set n2 conservatively by descriptor count of desc2
+        n2 = desc2.rows > 0 ? desc2.rows : 0;
+    }
+
+    // 3) Collect candidate matches according to whether mutual check is enabled
+    struct Cand { DMatch m; float x; float y; };
+    std::vector<Cand> candidates;
+    candidates.reserve(n1);
+    for(int i=0;i<n1;++i){
+        int j = best12[i];
+        if(j < 0) continue;
+        if(enableMutual){
+            if(j >= n2) continue;
+            if(best21[j] != i) continue; // mutual check
+        }
+        // safe distance value from knn12
+        float dist = (knn12[i].size() ? knn12[i][0].distance : 0.0f);
+        DMatch dm(i, j, dist);
+        // keypoint location on current frame (kps2)
+        float x = 0, y = 0;
+        if(j >= 0 && j < (int)kps2.size()){ x = kps2[j].pt.x; y = kps2[j].pt.y; }
+        candidates.push_back({dm, x, y});
+    }
+
+    if(candidates.empty()) return;
+
+    // 4) Spatial bucketing on current-frame locations to promote spatially-distributed matches
+    std::vector<DMatch> interimMatches;
+    interimMatches.reserve(candidates.size());
+    if(enableBucketing){
+        int cols = std::max(1, bucketCols);
+        int rows = std::max(1, bucketRows);
+        float cellW = (imgCols > 0) ? (float)imgCols / cols : 1.0f;
+        float cellH = (imgRows > 0) ? (float)imgRows / rows : 1.0f;
+
+        // buckets: for each cell keep topKPerBucket smallest-distance matches
+        std::vector<std::vector<Cand>> buckets(cols * rows);
+        for(const auto &c: candidates){
+            int bx = 0, by = 0;
+            if(cellW > 0) bx = std::min(cols - 1, std::max(0, (int)std::floor(c.x / cellW)));
+            if(cellH > 0) by = std::min(rows - 1, std::max(0, (int)std::floor(c.y / cellH)));
+            int idx = by * cols + bx;
+            buckets[idx].push_back(c);
+        }
+
+        // sort each bucket and take top K
+        for(auto &vec: buckets){
+            if(vec.empty()) continue;
+            std::sort(vec.begin(), vec.end(), [](const Cand &a, const Cand &b){ return a.m.distance < b.m.distance; });
+            int take = std::min((int)vec.size(), topKPerBucket);
+            for(int i=0;i<take;++i) interimMatches.push_back(vec[i].m);
+        }
+    } else {
+        // no bucketing: keep all candidates
+        for(const auto &c: candidates) interimMatches.push_back(c.m);
+    }
+
+    if(interimMatches.empty()) return;
+
+    // 5) apply global cap if requested (keep lowest-distance matches)
+    if(maxTotal > 0 && (int)interimMatches.size() > maxTotal){
+        std::nth_element(interimMatches.begin(), interimMatches.begin() + maxTotal, interimMatches.end(),
+                         [](const DMatch &a, const DMatch &b){ return a.distance < b.distance; });
+        interimMatches.resize(maxTotal);
+    }
+
+    // final sort by distance
+    std::sort(interimMatches.begin(), interimMatches.end(), [](const DMatch &a, const DMatch &b){ return a.distance < b.distance; });
+    goodMatches = std::move(interimMatches);
+}
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/src/optimizer.cpp b/modules/slam/src/optimizer.cpp
new file mode 100644
index 0000000000..fe138c718c
--- /dev/null
+++ b/modules/slam/src/optimizer.cpp
@@ -0,0 +1,255 @@
+#include "opencv2/slam/optimizer.hpp"
+#include <iostream>
+#include <set>
+#include <opencv2/calib3d.hpp>
+
+// If g2o is enabled (CMake defines USE_G2O), compile and use the g2o-based
+// implementation. Otherwise fall back to a simplified OpenCV-based implementation.
+
+#ifdef USE_G2O
+#include <g2o/core/sparse_optimizer.h>
+#include <g2o/core/block_solver.h>
+#include <g2o/core/optimization_algorithm_levenberg.h>
+#include <g2o/solvers/dense/linear_solver_dense.h>
+#include <g2o/types/sba/types_six_dof_expmap.h>
+#include <g2o/core/robust_kernel_impl.h>
+#include <opencv2/core/eigen.hpp>
+#include <Eigen/Core>
+#include <map>
+#include <memory>
+#else
+#include "opencv2/sfm.hpp"
+#endif
+
+#include <opencv2/core.hpp>
+
+namespace cv {
+namespace vo {
+
+Optimizer::Optimizer() {}
+
+#ifdef USE_G2O
+void Optimizer::localBundleAdjustment(
+    std::vector<KeyFrame> &keyframes,
+    std::vector<MapPoint> &mappoints,
+    const std::vector<int> &localKfIndices,
+    const std::vector<int> &fixedKfIndices,
+    double fx, double fy, double cx, double cy,
+    int iterations) {
+
+    if(localKfIndices.empty()) return;
+
+    typedef g2o::BlockSolver< g2o::BlockSolverTraits<6,3> > Block;
+    auto linearSolver = std::make_unique<g2o::LinearSolverDense<Block::PoseMatrixType>>();
+    auto blockSolver = std::make_unique<Block>(std::move(linearSolver));
+    auto solver = new g2o::OptimizationAlgorithmLevenberg(std::move(blockSolver));
+
+    g2o::SparseOptimizer optimizer;
+    optimizer.setAlgorithm(solver);
+    optimizer.setVerbose(false);
+
+    // Camera parameter (id = 0)
+    g2o::CameraParameters* cam = new g2o::CameraParameters(fx, Eigen::Vector2d(cx, cy), 0);
+    cam->setId(0);
+    optimizer.addParameter(cam);
+
+    // Poses
+    std::map<int, g2o::VertexSE3Expmap*> poseVertices;
+    for (int idx : localKfIndices) {
+        if (idx < 0 || idx >= static_cast<int>(keyframes.size())) continue;
+        KeyFrame &kf = keyframes[idx];
+        Eigen::Matrix3d R;
+        cv2eigen(kf.R_w, R);
+        Eigen::Vector3d t;
+        cv2eigen(kf.t_w, t);
+        g2o::SE3Quat pose(R, t);
+        auto *vSE3 = new g2o::VertexSE3Expmap();
+        vSE3->setId(idx);
+        vSE3->setEstimate(pose);
+        if (std::find(fixedKfIndices.begin(), fixedKfIndices.end(), idx) != fixedKfIndices.end()) vSE3->setFixed(true);
+        optimizer.addVertex(vSE3);
+        poseVertices[idx] = vSE3;
+    }
+
+    // Points
+    const int POINT_ID_OFFSET = 10000;
+    std::vector<int> mpVertexIds(mappoints.size(), -1);
+    for (size_t i = 0; i < mappoints.size(); ++i) {
+        const MapPoint &mp = mappoints[i];
+        auto *vPoint = new g2o::VertexPointXYZ();
+        vPoint->setEstimate(Eigen::Vector3d(mp.p.x, mp.p.y, mp.p.z));
+        int vid = POINT_ID_OFFSET + static_cast<int>(i);
+        vPoint->setId(vid);
+        vPoint->setMarginalized(true);
+        optimizer.addVertex(vPoint);
+        mpVertexIds[i] = vid;
+    }
+
+    // Observations / edges
+    for (size_t i = 0; i < mappoints.size(); ++i) {
+        const MapPoint &mp = mappoints[i];
+        int pid = mpVertexIds[i];
+        if (pid < 0) continue;
+        for (const auto &obs : mp.observations) {
+            int kfIdx = obs.first;
+            int kpIdx = obs.second;
+            if (poseVertices.find(kfIdx) == poseVertices.end()) continue;
+            if (kfIdx < 0 || kfIdx >= static_cast<int>(keyframes.size())) continue;
+            KeyFrame &kf = keyframes[kfIdx];
+            if (kpIdx < 0 || kpIdx >= static_cast<int>(kf.kps.size())) continue;
+
+            const KeyPoint &kp = kf.kps[kpIdx];
+            Eigen::Vector2d meas(kp.pt.x, kp.pt.y);
+
+            auto *edge = new g2o::EdgeProjectXYZ2UV();
+            edge->setVertex(0, optimizer.vertex(pid));
+            edge->setVertex(1, optimizer.vertex(kfIdx));
+            edge->setMeasurement(meas);
+            edge->information() = Eigen::Matrix2d::Identity();
+            edge->setParameterId(0, cam->id());
+            auto *rk = new g2o::RobustKernelHuber();
+            rk->setDelta(1.0);
+            edge->setRobustKernel(rk);
+            optimizer.addEdge(edge);
+        }
+    }
+
+    optimizer.initializeOptimization();
+    optimizer.optimize(iterations);
+
+    // Write back poses
+    for (auto &kv : poseVertices) {
+        int idx = kv.first;
+        g2o::VertexSE3Expmap* v = kv.second;
+        g2o::SE3Quat est = v->estimate();
+        Eigen::Matrix3d R = est.rotation().toRotationMatrix();
+        Eigen::Vector3d t = est.translation();
+        Mat Rcv, tcv;
+        eigen2cv(R, Rcv);
+        eigen2cv(t, tcv);
+        keyframes[idx].R_w = Rcv.clone();
+        keyframes[idx].t_w = tcv.clone();
+    }
+
+    // Write back points
+    for (size_t i = 0; i < mappoints.size(); ++i) {
+        int pid = mpVertexIds[i];
+        if (pid < 0) continue;
+        auto *v = dynamic_cast<g2o::VertexPointXYZ*>(optimizer.vertex(pid));
+        if (!v) continue;
+        Eigen::Vector3d p = v->estimate();
+        mappoints[i].p.x = p[0];
+        mappoints[i].p.y = p[1];
+        mappoints[i].p.z = p[2];
+    }
+}
+#endif
+void Optimizer::localBundleAdjustmentSFM(
+    std::vector<KeyFrame> &keyframes,
+    std::vector<MapPoint> &mappoints,
+    const std::vector<int> &localKfIndices,
+    const std::vector<int> &fixedKfIndices,
+    double fx, double fy, double cx, double cy,
+    int iterations) {
+    //TODO: Implement SFM-based local BA
+}
+
+
+bool Optimizer::optimizePose(
+    KeyFrame &kf,
+    const std::vector<MapPoint> &mappoints,
+    const std::vector<int> &matchedMpIndices,
+    double fx, double fy, double cx, double cy,
+    std::vector<bool> &inliers,
+    int iterations) {
+
+    if(matchedMpIndices.empty()) return false;
+    inliers.assign(matchedMpIndices.size(), false);
+
+    std::vector<Point3f> objectPoints;
+    std::vector<Point2f> imagePoints;
+    for(size_t i = 0; i < matchedMpIndices.size(); ++i) {
+        int mpIdx = matchedMpIndices[i];
+        if(mpIdx < 0 || mpIdx >= static_cast<int>(mappoints.size())) continue;
+        const MapPoint &mp = mappoints[mpIdx];
+        if(mp.isBad) continue;
+        if(i < kf.kps.size()) {
+            objectPoints.emplace_back(mp.p.x, mp.p.y, mp.p.z);
+            imagePoints.push_back(kf.kps[i].pt);
+        }
+    }
+    if(objectPoints.size() < 4) return false;
+
+    Mat K = (Mat_<double>(3,3) << fx, 0, cx, 0, fy, cy, 0, 0, 1);
+    Mat rvec, tvec, inliersMask;
+    bool success = solvePnPRansac(objectPoints, imagePoints, K, Mat(), rvec, tvec,
+                                      false, iterations, 2.0, 0.99, inliersMask);
+    if(!success) return false;
+    Mat R;
+    Rodrigues(rvec, R);
+    kf.R_w = R;
+    kf.t_w = tvec;
+    for(int i = 0; i < inliersMask.rows && i < static_cast<int>(inliers.size()); ++i)
+        inliers[i] = (inliersMask.at<uchar>(i,0) != 0);
+
+    return true;
+}
+
+void Optimizer::globalBundleAdjustmentSFM(
+    std::vector<KeyFrame> &keyframes,
+    std::vector<MapPoint> &mappoints,
+    double fx, double fy, double cx, double cy,
+    int iterations) {
+
+    std::cout << "Optimizer: Global BA with " << keyframes.size()
+              << " KFs and " << mappoints.size() << " map points" << std::endl;
+    std::vector<int> localKfIndices;
+    for(size_t i = 1; i < keyframes.size(); ++i) localKfIndices.push_back(static_cast<int>(i));
+    std::vector<int> fixedKfIndices = {0};
+    localBundleAdjustmentSFM(keyframes, mappoints, localKfIndices, fixedKfIndices, fx, fy, cx, cy, iterations);
+    std::cout << "Optimizer: Global BA completed" << std::endl;
+}
+
+double Optimizer::computeReprojectionError(
+    const Point3d &point3D,
+    const Mat &R, const Mat &t,
+    const Point2f &observed,
+    double fx, double fy, double cx, double cy,
+    Mat &jacobianPose,
+    Mat &jacobianPoint) {
+
+    Mat Xw = (Mat_<double>(3,1) << point3D.x, point3D.y, point3D.z);
+    Mat Xc = R.t() * (Xw - t);
+    double x = Xc.at<double>(0,0), y = Xc.at<double>(1,0), z = Xc.at<double>(2,0);
+    if(z <= 0) return std::numeric_limits<double>::max();
+    double u = fx * (x / z) + cx;
+    double v = fy * (y / z) + cy;
+    double du = u - observed.x, dv = v - observed.y;
+    jacobianPose = Mat::zeros(2,6,CV_64F);
+    jacobianPoint = Mat::zeros(2,3,CV_64F);
+    double invZ = 1.0 / z; double invZ2 = invZ * invZ;
+    jacobianPoint.at<double>(0,0) = fx * invZ;
+    jacobianPoint.at<double>(0,1) = 0;
+    jacobianPoint.at<double>(0,2) = -fx * x * invZ2;
+    jacobianPoint.at<double>(1,0) = 0;
+    jacobianPoint.at<double>(1,1) = fy * invZ;
+    jacobianPoint.at<double>(1,2) = -fy * y * invZ2;
+    return std::sqrt(du*du + dv*dv);
+}
+
+Point2f Optimizer::project(
+    const Point3d &point3D,
+    const Mat &R, const Mat &t,
+    double fx, double fy, double cx, double cy) {
+
+    Mat Xw = (Mat_<double>(3,1) << point3D.x, point3D.y, point3D.z);
+    Mat Xc = R.t() * (Xw - t);
+    double z = Xc.at<double>(2,0);
+    if(z <= 0) return Point2f(-1,-1);
+    float u = static_cast<float>(fx * (Xc.at<double>(0,0) / z) + cx);
+    float v = static_cast<float>(fy * (Xc.at<double>(1,0) / z) + cy);
+    return Point2f(u,v);
+}
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/src/pose.cpp b/modules/slam/src/pose.cpp
new file mode 100644
index 0000000000..728e27f313
--- /dev/null
+++ b/modules/slam/src/pose.cpp
@@ -0,0 +1,43 @@
+#include "opencv2/slam/pose.hpp"
+#include <opencv2/calib3d.hpp>
+
+namespace cv {
+namespace vo {
+
+    bool PoseEstimator::estimate(const std::vector<Point2f> &pts1,
+                             const std::vector<Point2f> &pts2,
+                             double fx, double fy, double cx, double cy,
+                             Mat &R, Mat &t, Mat &mask, int &inliers)
+{
+    if(pts1.size() < 8 || pts2.size() < 8) { inliers = 0; return false; }
+    double focal = (fx + fy) * 0.5;
+    Point2d pp(cx, cy);
+    // If provided principal point looks invalid (e.g. zeros or tiny values),
+    // fall back to the approximate center of the matched points' bounding box.
+    // This is better than leaving (0,0) which can break essential-matrix estimation.
+    if((pp.x <= 2.0 || pp.y <= 2.0) && !pts1.empty()){
+        float minx = std::numeric_limits<float>::max();
+        float miny = std::numeric_limits<float>::max();
+        float maxx = std::numeric_limits<float>::lowest();
+        float maxy = std::numeric_limits<float>::lowest();
+        for(size_t i=0;i<pts1.size();++i){
+            const Point2f &p1 = pts1[i];
+            const Point2f &p2 = pts2[i];
+            minx = std::min(minx, std::min(p1.x, p2.x));
+            miny = std::min(miny, std::min(p1.y, p2.y));
+            maxx = std::max(maxx, std::max(p1.x, p2.x));
+            maxy = std::max(maxy, std::max(p1.y, p2.y));
+        }
+        // center of bounding box of matched points
+        pp.x = (minx + maxx) * 0.5;
+        pp.y = (miny + maxy) * 0.5;
+    }
+    mask.release();
+    Mat E = findEssentialMat(pts1, pts2, focal, pp, RANSAC, 0.999, 1.0, mask);
+    if(E.empty()) { inliers = 0; return false; }
+    inliers = recoverPose(E, pts1, pts2, R, t, focal, pp, mask);
+    return true;
+}
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/src/visualizer.cpp b/modules/slam/src/visualizer.cpp
new file mode 100644
index 0000000000..59ee2a4186
--- /dev/null
+++ b/modules/slam/src/visualizer.cpp
@@ -0,0 +1,131 @@
+#include "opencv2/slam/visualizer.hpp"
+#include <opencv2/imgproc.hpp>
+#include <opencv2/features2d.hpp>
+#include <opencv2/highgui.hpp>
+
+namespace cv {
+namespace vo {
+
+Tracker::Tracker()
+    : feat_(), matcher_(), poseEst_(), frame_id_(0)
+{
+}
+
+bool Tracker::processFrame(const Mat &gray, const std::string &imagePath, Mat &imgOut, Mat &R_out, Mat &t_out, std::string &info)
+{
+    if(gray.empty()) return false;
+    // detect
+    std::vector<KeyPoint> kps;
+    Mat desc;
+    feat_.detectAndCompute(gray, kps, desc);
+
+    if(!prevGray_.empty() && !prevDesc_.empty() && !desc.empty()){
+        // match
+        std::vector<DMatch> goodMatches;
+        matcher_.knnMatch(prevDesc_, desc, goodMatches);
+
+        // draw matches for visualization
+        drawMatches(prevGray_, prevKp_, gray, kps, goodMatches, imgOut,
+                        Scalar::all(-1), Scalar::all(-1), std::vector<char>(), DrawMatchesFlags::NOT_DRAW_SINGLE_POINTS);
+
+        // prepare points
+        std::vector<Point2f> pts1, pts2;
+        for(const auto &m: goodMatches){
+            pts1.push_back(prevKp_[m.queryIdx].pt);
+            pts2.push_back(kps[m.trainIdx].pt);
+        }
+
+        if(pts1.size() >= 8){
+            Mat R, t, mask;
+            int inliers = 0;
+            // Note: we don't have intrinsics here; caller should provide via global or arguments. For now, caller will use PoseEstimator directly if needed.
+            // We'll estimate using default focal/pp later (caller will adapt). Return false for now so caller can invoke PoseEstimator separately.
+            // But to keep compatibility, leave R_out/t_out empty and set info.
+            info = "matches=" + std::to_string(goodMatches.size()) + ", inliers=" + std::to_string(inliers);
+            // update prev buffers below
+        } else {
+            info = "matches=" + std::to_string(goodMatches.size()) + ", inliers=0";
+        }
+    } else {
+        // first frame: draw keypoints
+        drawKeypoints(gray, kps, imgOut, Scalar::all(-1), DrawMatchesFlags::DRAW_RICH_KEYPOINTS);
+        info = "first_frame";
+    }
+
+    // update prev
+    prevGray_ = gray.clone();
+    prevKp_ = kps;
+    prevDesc_ = desc.clone();
+    frame_id_++;
+    return true;
+}
+
+Visualizer::Visualizer(int W, int H, double meters_per_pixel)
+    : W_(W), H_(H), meters_per_pixel_(meters_per_pixel), mapSize_(W,H)
+{
+    map_ = Mat::zeros(mapSize_, CV_8UC3);
+}
+
+Point Visualizer::worldToPixel(const Point2d &p) const {
+    Point2d origin(mapSize_.width/2.0, mapSize_.height/2.0);
+    int x = int(origin.x + p.x / meters_per_pixel_);
+    int y = int(origin.y - p.y / meters_per_pixel_);
+    return Point(x,y);
+}
+
+void Visualizer::addPose(double x, double z){
+    traj_.emplace_back(x,z);
+}
+
+void Visualizer::showFrame(const Mat &frame){
+    if(frame.empty()) return;
+    // Do not draw heading overlay on video frames; only show raw frame.
+    imshow("frame", frame);
+}
+
+void Visualizer::showTopdown(){
+    map_ = Mat::zeros(mapSize_, CV_8UC3);
+    for (int gx = 0; gx < mapSize_.width; gx += 50) line(map_, Point(gx,0), Point(gx,mapSize_.height), Scalar(30,30,30), 1);
+    for (int gy = 0; gy < mapSize_.height; gy += 50) line(map_, Point(0,gy), Point(mapSize_.width,gy), Scalar(30,30,30), 1);
+    for(size_t i=1;i<traj_.size();++i){
+        Point p1 = worldToPixel(traj_[i-1]);
+        Point p2 = worldToPixel(traj_[i]);
+        line(map_, p1, p2, Scalar(0,255,0), 2);
+    }
+    if(!traj_.empty()){
+        Point p = worldToPixel(traj_.back());
+        // draw heading arrow on topdown map based on recent trajectory
+        if(traj_.size() >= 2){
+            int K = std::min<size_t>(5, traj_.size()-1);
+            double dx = 0.0, dz = 0.0;
+            for(int i=0;i<K;i++){
+                auto a = traj_[traj_.size()-1 - i];
+                auto b = traj_[traj_.size()-2 - i];
+                dx += (a.x - b.x);
+                dz += (a.y - b.y);
+            }
+            dx /= K; dz /= K;
+            double norm = std::hypot(dx, dz);
+            if(norm > 1e-6){
+                dx /= norm; dz /= norm;
+                // arrow length in world meters
+                double arrow_m = 0.5; // 0.5 meters
+                // tail is behind the current position by arrow_m, head (tip) at current position
+                Point2d tail_world(traj_.back().x - dx * arrow_m, traj_.back().y - dz * arrow_m);
+                Point tail_px = worldToPixel(tail_world);
+                arrowedLine(map_, tail_px, p, Scalar(0,0,255), 2, LINE_AA, 0, 0.3);
+            }
+        }
+        // label near current position
+        putText(map_, "Robot", p + Point(10,-10), FONT_HERSHEY_SIMPLEX, 0.5, Scalar(255,255,255), 1);
+    }
+    imshow("topdown", map_);
+}
+
+bool Visualizer::saveTrajectory(const std::string &path){
+    if(map_.empty()) showTopdown();
+    return imwrite(path, map_);
+}
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file
diff --git a/modules/slam/src/vo.cpp b/modules/slam/src/vo.cpp
new file mode 100644
index 0000000000..439b8bba14
--- /dev/null
+++ b/modules/slam/src/vo.cpp
@@ -0,0 +1,389 @@
+#include "opencv2/slam/vo.hpp"
+#include "opencv2/slam/optimizer.hpp"
+#include <opencv2/imgproc.hpp>
+#include <opencv2/highgui.hpp>
+#include <opencv2/calib3d.hpp>
+#include <numeric>
+
+namespace cv {
+namespace vo {
+
+static Mat makeSE3(const Mat& R, const Mat& t) {
+    Mat T = Mat::eye(4, 4, CV_64F);
+    R.copyTo(T(Rect(0,0,3,3)));
+    t.copyTo(T(Rect(3,0,1,3)));
+    return T;
+}
+
+VisualOdometry::VisualOdometry(const Ptr<Feature2D>& feature,
+                               const Ptr<DescriptorMatcher>& matcher,
+                               const CameraIntrinsics& intrinsics,
+                               const VOParams& params)
+    : feature_(feature), matcher_(matcher), K_(intrinsics), params_(params) {
+    currentPoseSE3_ = Mat::eye(4,4,CV_64F);
+}
+
+bool VisualOdometry::processFrame(const Mat& img, double /*timestamp*/) {
+    frameCount_++;
+    if (!initialized_) {
+        if (lastImg_.empty()) {
+            lastImg_ = img.clone();
+            return false;
+        }
+        initialized_ = initializeTwoView(lastImg_, img);
+        lastImg_ = img.clone();
+        if (initialized_) trajectory_.push_back(currentPoseSE3_.clone());
+        return initialized_;
+    }
+
+    bool ok = trackWithPnP(img);
+    lastImg_ = img.clone();
+    if (ok) {
+        trajectory_.push_back(currentPoseSE3_.clone());
+        if (shouldInsertKeyframe()) {
+            // promote current frame to new keyframe using current features and PnP inliers
+            kfPoseSE3_ = currentPoseSE3_.clone();
+            kf_keypoints_ = cur_keypoints_;
+            kf_descriptors_ = cur_descriptors_.clone();
+            kf_kp_to_map_.assign((int)kf_keypoints_.size(), -1);
+                keyframePoses_.push_back(kfPoseSE3_.clone());
+                keyframeKeypoints_.push_back(kf_keypoints_);
+                keyframeDescriptors_.push_back(kf_descriptors_.clone());
+            // seed mapping for tracked correspondences
+            for (auto &pr : curFeat_to_map_inliers_) {
+                int curIdx = pr.first; int mpIdx = pr.second;
+                if (curIdx >=0 && curIdx < (int)kf_kp_to_map_.size()) kf_kp_to_map_[curIdx] = mpIdx;
+            }
+                // push kp->map history for BA
+                keyframeKpToMap_.push_back(kf_kp_to_map_);
+            triangulateWithLastKeyframe();
+            runLocalBAIfEnabled();
+        }
+    }
+    return ok;
+}
+
+Mat VisualOdometry::getCurrentPose() const { return currentPoseSE3_.clone(); }
+std::vector<Mat> VisualOdometry::getTrajectory() const { return trajectory_; }
+
+void VisualOdometry::setEnableBackend(bool on) { backendEnabled_ = on; }
+void VisualOdometry::setWindowSize(int N) { params_.localWindowSize = N; }
+void VisualOdometry::setBAParams(double reprojThresh, int maxIters) {
+    params_.reprojErrThresh = reprojThresh;
+    params_.baMaxIters = std::max(1, maxIters);
+}
+void VisualOdometry::setBackendType(int type) { params_.backendType = type; }
+void VisualOdometry::setMode(Mode m) { mode_ = m; }
+bool VisualOdometry::saveMap(const std::string& /*path*/) const { return false; }
+bool VisualOdometry::loadMap(const std::string& /*path*/) { return false; }
+void VisualOdometry::enableLoopClosure(bool on) { loopClosureEnabled_ = on; }
+void VisualOdometry::setPlaceRecognizer(const Ptr<Feature2D>& /*vocabFeature*/) {}
+
+bool VisualOdometry::initializeTwoView(const Mat& img0, const Mat& img1) {
+    std::vector<KeyPoint> k0, k1; Mat d0, d1;
+    feature_->detectAndCompute(img0, noArray(), k0, d0);
+    feature_->detectAndCompute(img1, noArray(), k1, d1);
+    if (k0.size() < 50 || k1.size() < 50) return false;
+
+    std::vector<std::vector<DMatch>> knn01; matcher_->knnMatch(d0, d1, knn01, 2);
+    std::vector<DMatch> good;
+    for (auto& v : knn01) if (v.size()>=2 && v[0].distance < 0.75 * v[1].distance) good.push_back(v[0]);
+    if (good.size() < 80) return false;
+
+    std::vector<Point2f> p0, p1;
+    p0.reserve(good.size()); p1.reserve(good.size());
+    for (auto& m : good) { p0.push_back(k0[m.queryIdx].pt); p1.push_back(k1[m.trainIdx].pt); }
+
+    Mat mask;
+    Mat E = findEssentialMat(p0, p1, K_.K, RANSAC, params_.ransacProb, params_.ransacThresh, mask);
+    if (E.empty()) return false;
+
+    Mat R, t;
+    int inliers = recoverPose(E, p0, p1, K_.K, R, t, mask);
+    if (inliers < params_.minInitInliers) return false;
+
+    // Set first pose = Identity, second = (R,t)
+    currentPoseSE3_ = makeSE3(R, t);
+
+    // Minimal triangulation demo (no storage of per-point observations yet)
+    Mat P0 = K_.K * Mat::eye(3,4,CV_64F);
+    Mat P1(3,4,CV_64F); R.copyTo(P1(Rect(0,0,3,3))); t.copyTo(P1(Rect(3,0,1,3))); P1 = K_.K * P1;
+
+    std::vector<Point2f> tp0, tp1; tp0.reserve(inliers); tp1.reserve(inliers);
+    std::vector<int> inlier_trainIdx; inlier_trainIdx.reserve(inliers);
+    for (size_t i=0;i<good.size();++i) if (mask.at<uchar>(int(i))) {
+        tp0.push_back(p0[i]); tp1.push_back(p1[i]);
+        inlier_trainIdx.push_back(good[i].trainIdx);
+    }
+    if (tp0.size() >= 20) {
+        Mat X4;
+        triangulatePoints(P0, P1, tp0, tp1, X4);
+        // initialize KF as second frame
+        kf_keypoints_ = k1;
+        kf_descriptors_ = d1.clone();
+        kf_kp_to_map_.assign((int)kf_keypoints_.size(), -1);
+        kfPoseSE3_ = currentPoseSE3_.clone();
+        for (int i=0;i<X4.cols;i++) {
+            Vec4d h = X4.col(i);
+            if (std::abs(h[3]) < 1e-8) continue;
+            Point3d X(h[0]/h[3], h[1]/h[3], h[2]/h[3]);
+            if (X.z > 0) {
+                int mpIndex = (int)mapPoints_.size();
+                mapPoints_.push_back(X);
+                int trainIdx = inlier_trainIdx[i];
+                if (trainIdx >=0 && trainIdx < (int)kf_kp_to_map_.size())
+                    kf_kp_to_map_[trainIdx] = mpIndex;
+            }
+        }
+    }
+    return true;
+}
+
+bool VisualOdometry::trackWithPnP(const Mat& img) {
+    cur_keypoints_.clear();
+    feature_->detectAndCompute(img, noArray(), cur_keypoints_, cur_descriptors_);
+    if (kf_descriptors_.empty() || cur_descriptors_.empty()) return false;
+
+    // Match KF -> current
+    std::vector<std::vector<DMatch>> knn;
+    matcher_->knnMatch(kf_descriptors_, cur_descriptors_, knn, 2);
+    std::vector<DMatch> good;
+    good.reserve(knn.size());
+    for (auto &v : knn) if (v.size()>=2 && v[0].distance < 0.75*v[1].distance) good.push_back(v[0]);
+
+    std::vector<Point3f> objPts; objPts.reserve(good.size());
+    std::vector<Point2f> imgPts; imgPts.reserve(good.size());
+    std::vector<int> curIdxOfCorr; curIdxOfCorr.reserve(good.size());
+    std::vector<int> mapIdxOfCorr; mapIdxOfCorr.reserve(good.size());
+
+    int unmatchedCount = 0;
+    for (auto &m : good) {
+        int kf_idx = m.queryIdx;
+        int mp_idx = (kf_idx >=0 && kf_idx < (int)kf_kp_to_map_.size()) ? kf_kp_to_map_[kf_idx] : -1;
+        if (mp_idx >= 0 && mp_idx < (int)mapPoints_.size()) {
+            const Point3d &Xd = mapPoints_[mp_idx];
+            objPts.emplace_back((float)Xd.x,(float)Xd.y,(float)Xd.z);
+            imgPts.push_back(cur_keypoints_[m.trainIdx].pt);
+            curIdxOfCorr.push_back(m.trainIdx);
+            mapIdxOfCorr.push_back(mp_idx);
+        } else {
+            unmatchedCount++;
+        }
+    }
+    unmatchedRatio_ = good.empty() ? 0.0 : (double)unmatchedCount / (double)good.size();
+    if (objPts.size() < 4) return false;
+
+    Mat rvec, tvec, R;
+    std::vector<int> inliers;
+    bool ok = solvePnPRansac(objPts, imgPts, K_.K, K_.dist, rvec, tvec, false,
+                                 100, params_.pnpReprojErr, 0.99, inliers, SOLVEPNP_ITERATIVE);
+    if (!ok || (int)inliers.size() < std::max(4, params_.pnpMinInliers)) return false;
+
+    Rodrigues(rvec, R);
+    currentPoseSE3_ = makeSE3(R, tvec);
+    lastPnPInliers_ = (int)inliers.size();
+
+    // keep inlier correspondences for KF mapping when inserting a new KF
+    curFeat_to_map_inliers_.clear();
+    curFeat_to_map_inliers_.reserve(inliers.size());
+    for (int idx : inliers) {
+        int curIdx = curIdxOfCorr[idx];
+        int mpIdx = mapIdxOfCorr[idx];
+        curFeat_to_map_inliers_.emplace_back(curIdx, mpIdx);
+    }
+    return true;
+}
+
+bool VisualOdometry::shouldInsertKeyframe() const {
+    // simple: periodic or tracking weakening
+    bool periodic = (frameCount_ % params_.keyframeInterval) == 0;
+    bool weakTracking = (lastPnPInliers_ > 0 && lastPnPInliers_ < params_.pnpMinInliers + 10);
+
+    // baseline & rotation criteria
+    auto extractRt = [](const Mat& T, Mat& R, Mat& t){ R = T(Rect(0,0,3,3)).clone(); t = T(Rect(3,0,1,3)).clone(); };
+    Mat R_prev, t_prev, R_cur, t_cur; extractRt(kfPoseSE3_, R_prev, t_prev); extractRt(currentPoseSE3_, R_cur, t_cur);
+    double baseline = norm(t_cur - t_prev);
+    Mat R_delta = R_prev.t() * R_cur;
+    double traceVal = R_delta.at<double>(0,0) + R_delta.at<double>(1,1) + R_delta.at<double>(2,2);
+    double rotAngle = std::acos(std::min(1.0, std::max(-1.0, (traceVal - 1.0) / 2.0))) * 180.0 / CV_PI;
+    bool baselineEnough = baseline > params_.keyframeMinBaseline;
+    bool rotationEnough = rotAngle > params_.keyframeMinRotationDeg;
+
+    // mapping expansion need: many unmatched candidate features
+    bool needExpansion = unmatchedRatio_ > 0.5; // heuristic
+
+    return periodic || weakTracking || baselineEnough || rotationEnough || needExpansion;
+}
+
+void VisualOdometry::triangulateWithLastKeyframe() {
+    if (kf_descriptors_.empty() || cur_descriptors_.empty()) return;
+
+    // Match KF -> current again to find candidates without map points
+    std::vector<std::vector<DMatch>> knn;
+    matcher_->knnMatch(kf_descriptors_, cur_descriptors_, knn, 2);
+    std::vector<Point2f> kfPts, curPts;
+    std::vector<int> kfIdxs;
+    for (auto &v : knn) {
+        if (v.size()>=2 && v[0].distance < 0.75*v[1].distance) {
+            int qi = v[0].queryIdx; int ti = v[0].trainIdx;
+            if (qi >=0 && qi < (int)kf_kp_to_map_.size() && kf_kp_to_map_[qi] == -1) {
+                kfPts.push_back(kf_keypoints_[qi].pt);
+                curPts.push_back(cur_keypoints_[ti].pt);
+                kfIdxs.push_back(qi);
+            }
+        }
+    }
+    if (kfPts.size() < 15) return;
+
+    auto extractRt = [](const Mat& T, Mat& R, Mat& t){
+        R = T(Rect(0,0,3,3)).clone();
+        t = T(Rect(3,0,1,3)).clone();
+    };
+    Mat R1,t1,R2,t2; extractRt(kfPoseSE3_, R1,t1); extractRt(currentPoseSE3_, R2,t2);
+
+    Mat P1(3,4,CV_64F), P2(3,4,CV_64F);
+    R1.copyTo(P1(Rect(0,0,3,3))); t1.copyTo(P1(Rect(3,0,1,3)));
+    R2.copyTo(P2(Rect(0,0,3,3))); t2.copyTo(P2(Rect(3,0,1,3)));
+    P1 = K_.K * P1; P2 = K_.K * P2;
+
+    Mat X4; triangulatePoints(P1, P2, kfPts, curPts, X4);
+
+    auto reprojErr = [&](const Point3d& X, const Mat& R, const Mat& t, const Point2f& uv){
+        Mat Xv = (Mat_<double>(3,1) << X.x,X.y,X.z);
+        Mat x = K_.K * (R*Xv + t);
+        double u = x.at<double>(0)/x.at<double>(2);
+        double v = x.at<double>(1)/x.at<double>(2);
+        double du = u - uv.x; double dv = v - uv.y; return std::sqrt(du*du+dv*dv);
+    };
+
+    for (int i=0;i<X4.cols;i++) {
+        double hx = X4.at<double>(0,i);
+        double hy = X4.at<double>(1,i);
+        double hz = X4.at<double>(2,i);
+        double hw = X4.at<double>(3,i);
+        if (std::abs(hw) < 1e-8) continue;
+        Point3d X(hx/hw, hy/hw, hz/hw);
+        // positive depth check (in both views)
+        Mat R1_,t1_,R2_,t2_;
+        R1_ = R1; t1_ = t1; R2_ = R2; t2_ = t2;
+        Mat Xv = (Mat_<double>(3,1) << X.x,X.y,X.z);
+        Mat Y1 = R1_*Xv + t1_;
+        Mat Y2 = R2_*Xv + t2_;
+        double z1 = Y1.ptr<double>(2)[0];
+        double z2 = Y2.ptr<double>(2)[0];
+        if (z1 <= 0 || z2 <= 0) continue;
+        double e1 = reprojErr(X, R1, t1, kfPts[i]);
+        double e2 = reprojErr(X, R2, t2, curPts[i]);
+        if (e1 > params_.reprojErrThresh || e2 > params_.reprojErrThresh) continue;
+        int mpIndex = (int)mapPoints_.size();
+        mapPoints_.push_back(X);
+        int kf_kp = kfIdxs[i];
+        if (kf_kp >=0 && kf_kp < (int)kf_kp_to_map_.size()) kf_kp_to_map_[kf_kp] = mpIndex;
+    }
+}
+
+void VisualOdometry::runLocalBAIfEnabled() {
+    if (!backendEnabled_) return;
+    // Collect recent keyframes and build observations for map points
+    int N = std::max(2, params_.localWindowSize);
+    int totalKFs = (int)keyframePoses_.size();
+    if (totalKFs < 2) return;
+    int startIdx = std::max(0, totalKFs - N);
+
+    // Build KeyFrame vector for optimizer
+    std::vector<KeyFrame> kfs;
+    kfs.reserve(totalKFs - startIdx);
+    for (int i = startIdx; i < totalKFs; ++i) {
+        KeyFrame kf;
+        kf.id = i; // use history index as id
+        kf.kps = keyframeKeypoints_[i];
+        kf.desc = keyframeDescriptors_[i];
+        // extract R,t from SE3 4x4
+        const Mat &T = keyframePoses_[i];
+        Mat R = T(Rect(0,0,3,3)).clone();
+        Mat t = T(Rect(3,0,1,3)).clone();
+        kf.R_w = R; kf.t_w = t;
+        kfs.push_back(kf);
+    }
+
+    // Build MapPoint vector with observations from selected window
+    std::vector<MapPoint> mps;
+    mps.reserve(mapPoints_.size());
+    // Track which points are observed within the window
+    std::vector<char> pointObserved(mapPoints_.size(), 0);
+    for (int i = startIdx; i < totalKFs; ++i) {
+        const auto &kp2mp = keyframeKpToMap_[i];
+        for (int kpIdx = 0; kpIdx < (int)kp2mp.size(); ++kpIdx) {
+            int mpIdx = kp2mp[kpIdx];
+            if (mpIdx >= 0 && mpIdx < (int)mapPoints_.size()) {
+                pointObserved[mpIdx] = 1;
+            }
+        }
+    }
+    // Create mps with observations
+    for (size_t mpIdx = 0; mpIdx < mapPoints_.size(); ++mpIdx) {
+        if (!pointObserved[mpIdx]) continue; // only optimize observed points
+        MapPoint mp;
+        mp.id = (int)mpIdx;
+        mp.p = mapPoints_[mpIdx];
+        for (int i = startIdx; i < totalKFs; ++i) {
+            const auto &kp2mp = keyframeKpToMap_[i];
+            if ((int)kp2mp.size() == 0) continue;
+            for (int kpIdx = 0; kpIdx < (int)kp2mp.size(); ++kpIdx) {
+                if (kp2mp[kpIdx] == (int)mpIdx) {
+                    mp.observations.emplace_back(i, kpIdx);
+                }
+            }
+        }
+        if (!mp.observations.empty()) mps.push_back(mp);
+    }
+
+    if (kfs.size() < 2 || mps.empty()) return;
+
+    // Local/fixed KF indices relative to full history ids
+    std::vector<int> localKfIndices;
+    localKfIndices.reserve(kfs.size());
+    for (const auto &kf : kfs) localKfIndices.push_back(kf.id);
+    // Fix the oldest KF in the window to anchor optimization
+    std::vector<int> fixedKfIndices = { startIdx };
+
+    // Select backend
+
+    if (params_.backendType == 0) {
+    #ifndef USE_G2O
+        CV_Error(Error::StsBadArg, "G2O backend is not available (not built with SLAM module)");
+    #else
+        Optimizer::localBundleAdjustment(
+            kfs, mps, localKfIndices, fixedKfIndices,
+            K_.K.at<double>(0,0), K_.K.at<double>(1,1), K_.K.at<double>(0,2), K_.K.at<double>(1,2),
+            params_.baMaxIters);
+    #endif
+    } else
+    {
+        Optimizer::localBundleAdjustmentSFM(
+            kfs, mps, localKfIndices, fixedKfIndices,
+            K_.K.at<double>(0,0), K_.K.at<double>(1,1), K_.K.at<double>(0,2), K_.K.at<double>(1,2),
+            params_.baMaxIters);
+    }
+
+    // Write back optimized poses and points
+    for (const auto &kf : kfs) {
+        int i = kf.id;
+        Mat T = Mat::eye(4,4,CV_64F);
+        kf.R_w.copyTo(T(Rect(0,0,3,3)));
+        kf.t_w.copyTo(T(Rect(3,0,1,3)));
+        if (i >= 0 && i < totalKFs) keyframePoses_[i] = T.clone();
+        if (i == totalKFs - 1) { // also update current KF pose cache
+            kfPoseSE3_ = T.clone();
+            currentPoseSE3_ = T.clone();
+        }
+    }
+    for (const auto &mp : mps) {
+        if (mp.id >= 0 && mp.id < (int)mapPoints_.size()) {
+            mapPoints_[mp.id] = mp.p;
+        }
+    }
+}
+
+} // namespace vo
+} // namespace cv
\ No newline at end of file

From f4a0958ff411507ba8215ed11b1d2135c6d237b9 Mon Sep 17 00:00:00 2001
From: Xuanrui Zhu <634210954@qq.com>
Date: Thu, 4 Dec 2025 03:50:54 +0000
Subject: [PATCH 03/10] basic VO

---
 modules/slam/include/opencv2/slam/vo.hpp | 116 +---
 modules/slam/src/optimizer.cpp           | 114 +++-
 modules/slam/src/vo.cpp                  | 831 +++++++++++++----------
 3 files changed, 606 insertions(+), 455 deletions(-)

diff --git a/modules/slam/include/opencv2/slam/vo.hpp b/modules/slam/include/opencv2/slam/vo.hpp
index 9f08e203e3..31681ed1a6 100644
--- a/modules/slam/include/opencv2/slam/vo.hpp
+++ b/modules/slam/include/opencv2/slam/vo.hpp
@@ -1,114 +1,32 @@
 #pragma once
-
 #include <opencv2/core.hpp>
 #include <opencv2/features2d.hpp>
-#include <opencv2/calib3d.hpp>
+#include <string>
 #include <vector>
 
 namespace cv {
 namespace vo {
 
-struct CameraIntrinsics {
-    Mat K;      // 3x3 camera matrix
-    Mat dist;   // distortion coefficients (optional)
-};
-
-struct VOParams {
-    int minInitInliers = 80;
-    double ransacProb = 0.999;
-    double ransacThresh = 1.5; // pixels
-    double minParallaxDeg = 1.0;
-    double reprojErrThresh = 3.0;
-    int pnpMinInliers = 30;
-    double pnpReprojErr = 3.0;
-    int keyframeInterval = 10; // frames
-    double keyframeMinBaseline = 0.05; // relative scale
-    double keyframeMinRotationDeg = 5.0;
-    int localWindowSize = 7; // for BA
-    // Backend parameters
-    bool enableBackend = false;
-    int baMaxIters = 50;
-    // Backend type: 0=g2o (default), 1=opencv_sfm
-    int backendType = 0;
+struct VisualOdometryOptions {
+    int min_matches = 15;
+    int min_inliers = 4;
+    double min_inlier_ratio = 0.1;
+    double diff_zero_thresh = 2.0;
+    double flow_zero_thresh = 0.3;
+    double min_translation_norm = 1e-4;
+    double min_rotation_rad = 0.5 * CV_PI / 180.0;
+    int max_matches_keep = 500;
+    double flow_weight_lambda = 5.0;
 };
 
 class VisualOdometry {
 public:
-    VisualOdometry(const Ptr<Feature2D>& feature,
-                   const Ptr<DescriptorMatcher>& matcher,
-                   const CameraIntrinsics& intrinsics,
-                   const VOParams& params = VOParams());
-
-    // Process a single frame. Returns true if tracking succeeded.
-    bool processFrame(const Mat& img, double timestamp);
-
-    // Current camera pose (R|t) as 4x4 SE3 matrix.
-    Mat getCurrentPose() const;
-
-    // Full trajectory as vector of 4x4 matrices.
-    std::vector<Mat> getTrajectory() const;
-
-    // Backend controls
-    void setEnableBackend(bool on);
-    void setWindowSize(int N);
-    void setBAParams(double reprojThresh, int maxIters);
-    void setBackendType(int type);
-
-    // Loop closure & localization stubs (Milestone 4)
-    enum Mode { MODE_SLAM, MODE_LOCALIZATION };
-    void setMode(Mode m);
-    bool saveMap(const std::string& path) const;
-    bool loadMap(const std::string& path);
-    void enableLoopClosure(bool on);
-    void setPlaceRecognizer(const Ptr<Feature2D>& vocabFeature);
-
+    VisualOdometry(cv::Ptr<cv::Feature2D> feature, cv::Ptr<cv::DescriptorMatcher> matcher);
+    int run(const std::string &imageDir, double scale_m = 1.0, const VisualOdometryOptions &options = VisualOdometryOptions());
 private:
-    // internal helpers
-    bool initializeTwoView(const Mat& img0, const Mat& img1);
-    bool trackWithPnP(const Mat& img);
-    bool shouldInsertKeyframe() const;
-    void triangulateWithLastKeyframe();
-    void runLocalBAIfEnabled();
-
-    // state
-    Ptr<Feature2D> feature_;
-    Ptr<DescriptorMatcher> matcher_;
-    CameraIntrinsics K_;
-    VOParams params_;
-
-    bool initialized_ = false;
-    bool backendEnabled_ = false;
-    int frameCount_ = 0;
-    Mode mode_ = MODE_SLAM;
-    bool loopClosureEnabled_ = false;
-
-    // cached
-    Mat lastImg_;
-    Mat currentPoseSE3_; // 4x4
-    std::vector<Mat> trajectory_;
-
-    // minimal containers (placeholder, to be integrated with MapManager/KeyFrame)
-    std::vector<Point3d> mapPoints_; // simple storage for demo
-
-    // keyframe state (latest KF only)
-    std::vector<KeyPoint> kf_keypoints_;
-    Mat kf_descriptors_;
-    std::vector<int> kf_kp_to_map_; // size == kf_keypoints_.size(), -1 if not mapped
-    Mat kfPoseSE3_; // KF pose 4x4
-
-    // current frame cached features
-    std::vector<KeyPoint> cur_keypoints_;
-    Mat cur_descriptors_;
-    int lastPnPInliers_ = 0;
-    std::vector<std::pair<int,int>> curFeat_to_map_inliers_; // (cur_kp_idx, map_idx)
-    double unmatchedRatio_ = 0.0; // fraction of matched keyframe features without map points (for KF decision)
-
-    // simple history for sliding window
-    std::vector<Mat> keyframePoses_; // poses of historical KFs
-    std::vector<std::vector<KeyPoint>> keyframeKeypoints_;
-    std::vector<Mat> keyframeDescriptors_;
-    std::vector<std::vector<int>> keyframeKpToMap_; // per-KF mapping from kp idx to map point idx
+    cv::Ptr<cv::Feature2D> feature_;
+    cv::Ptr<cv::DescriptorMatcher> matcher_;
 };
 
-} // namespace vo
-} // namespace cv
\ No newline at end of file
+}
+} // namespace cv::vo
\ No newline at end of file
diff --git a/modules/slam/src/optimizer.cpp b/modules/slam/src/optimizer.cpp
index fe138c718c..51b438357d 100644
--- a/modules/slam/src/optimizer.cpp
+++ b/modules/slam/src/optimizer.cpp
@@ -1,6 +1,8 @@
 #include "opencv2/slam/optimizer.hpp"
 #include <iostream>
 #include <set>
+#include <unordered_set>
+#include <algorithm>
 #include <opencv2/calib3d.hpp>
 
 // If g2o is enabled (CMake defines USE_G2O), compile and use the g2o-based
@@ -151,7 +153,117 @@ void Optimizer::localBundleAdjustmentSFM(
     const std::vector<int> &fixedKfIndices,
     double fx, double fy, double cx, double cy,
     int iterations) {
-    //TODO: Implement SFM-based local BA
+    // Simple SFM-based local bundle adjustment using OpenCV routines.
+    // This implementation alternates:
+    //  - point-only Gauss-Newton updates (poses kept fixed)
+    //  - pose-only optimization using PnP (points kept fixed)
+    // It uses available jacobians w.r.t. point coordinates from
+    // computeReprojectionError and the existing optimizePose() helper
+    // to avoid depending on g2o / ceres. This provides an effective
+    // local refinement for SLAM windows when full BA backends are
+    // not available.
+
+    if (localKfIndices.empty() || mappoints.empty()) return;
+
+    // Fast lookup for whether a keyframe id is in the local window
+    std::unordered_set<int> localSet(localKfIndices.begin(), localKfIndices.end());
+    std::unordered_set<int> fixedSet(fixedKfIndices.begin(), fixedKfIndices.end());
+
+    const double HUBER_DELTA = 3.0; // pixels
+    const double MAX_POINT_STEP = 1.0; // meters (safeguard per-iter)
+
+    // Outer iterations: alternate point updates and pose updates
+    for (int iter = 0; iter < iterations; ++iter) {
+        // --- Point-only Gauss-Newton update (poses fixed) ---
+        for (size_t pid = 0; pid < mappoints.size(); ++pid) {
+            MapPoint &mp = mappoints[pid];
+            if (mp.isBad) continue;
+
+            Mat JtJ = Mat::zeros(3, 3, CV_64F);
+            Mat Jtr = Mat::zeros(3, 1, CV_64F);
+            int obsCount = 0;
+
+            for (const auto &obs : mp.observations) {
+                int kfIdx = obs.first;
+                int kpIdx = obs.second;
+                if (localSet.find(kfIdx) == localSet.end()) continue;
+                if (kfIdx < 0 || kfIdx >= static_cast<int>(keyframes.size())) continue;
+                KeyFrame &kf = keyframes[kfIdx];
+                if (kpIdx < 0 || kpIdx >= static_cast<int>(kf.kps.size())) continue;
+
+                Point2f observed = kf.kps[kpIdx].pt;
+                // Project current point into this keyframe
+                Point2f proj = project(mp.p, kf.R_w, kf.t_w, fx, fy, cx, cy);
+                if (proj.x < 0 || proj.y < 0) continue;
+                // Compute jacobians (fills jacobianPoint)
+                Mat jacPose, jacPoint;
+                computeReprojectionError(mp.p, kf.R_w, kf.t_w, observed, fx, fy, cx, cy, jacPose, jacPoint);
+                // jacPoint is 2x3, residual r = [u - u_obs; v - v_obs]
+                Mat r = (Mat_<double>(2,1) << proj.x - observed.x, proj.y - observed.y);
+
+                // robust weight (Huber)
+                double err = std::sqrt(r.at<double>(0,0)*r.at<double>(0,0) + r.at<double>(1,0)*r.at<double>(1,0));
+                double w = 1.0;
+                if (err > HUBER_DELTA) w = HUBER_DELTA / err;
+
+                // accumulate JtJ and Jtr
+                Mat Jt = jacPoint.t(); // 3x2
+                Mat W = Mat::eye(2,2,CV_64F) * w;
+                Mat JtW = Jt * W; // 3x2
+                JtJ += JtW * jacPoint; // 3x3
+                Jtr += JtW * r; // 3x1
+                obsCount++;
+            }
+
+            if (obsCount < 2) continue; // not enough constraints
+
+            // Solve for delta using SVD for stability
+            Mat delta; // 3x1
+            bool solved = false;
+            if (cv::determinant(JtJ) != 0) {
+                solved = cv::solve(JtJ, -Jtr, delta, cv::DECOMP_SVD);
+            } else {
+                solved = cv::solve(JtJ, -Jtr, delta, cv::DECOMP_SVD);
+            }
+            if (!solved) continue;
+
+            double step = std::sqrt(delta.at<double>(0,0)*delta.at<double>(0,0) +
+                                    delta.at<double>(1,0)*delta.at<double>(1,0) +
+                                    delta.at<double>(2,0)*delta.at<double>(2,0));
+            if (step > MAX_POINT_STEP) {
+                double scale = MAX_POINT_STEP / step;
+                delta *= scale;
+            }
+
+            mp.p.x += delta.at<double>(0,0);
+            mp.p.y += delta.at<double>(1,0);
+            mp.p.z += delta.at<double>(2,0);
+        }
+
+        // --- Pose-only optimization (points fixed) ---
+        // For each local keyframe that is not fixed, call optimizePose
+        for (int kfId : localKfIndices) {
+            if (fixedSet.find(kfId) != fixedSet.end()) continue;
+            if (kfId < 0 || kfId >= static_cast<int>(keyframes.size())) continue;
+            KeyFrame &kf = keyframes[kfId];
+            // Build matchedMpIndices: for each keypoint in this KF, which mappoint index it corresponds to
+            std::vector<int> matchedMpIndices(kf.kps.size(), -1);
+            for (size_t mpIdx = 0; mpIdx < mappoints.size(); ++mpIdx) {
+                const MapPoint &mp = mappoints[mpIdx];
+                if (mp.isBad) continue;
+                for (const auto &obs : mp.observations) {
+                    if (obs.first == kfId) {
+                        int kpIdx = obs.second;
+                        if (kpIdx >= 0 && kpIdx < static_cast<int>(matchedMpIndices.size()))
+                            matchedMpIndices[kpIdx] = static_cast<int>(mpIdx);
+                    }
+                }
+            }
+            std::vector<bool> inliers;
+            // Use the same number of iterations as outer loop for RANSAC attempts
+            optimizePose(kf, mappoints, matchedMpIndices, fx, fy, cx, cy, inliers, std::max(20, iterations));
+        }
+    }
 }
 
 
diff --git a/modules/slam/src/vo.cpp b/modules/slam/src/vo.cpp
index 439b8bba14..0bd730ac51 100644
--- a/modules/slam/src/vo.cpp
+++ b/modules/slam/src/vo.cpp
@@ -1,388 +1,509 @@
-#include "opencv2/slam/vo.hpp"
+#include "opencv2/slam/data_loader.hpp"
+#include "opencv2/slam/feature.hpp"
+#include "opencv2/slam/initializer.hpp"
+#include "opencv2/slam/keyframe.hpp"
+#include "opencv2/slam/localizer.hpp"
+#include "opencv2/slam/map.hpp"
+#include "opencv2/slam/matcher.hpp"
 #include "opencv2/slam/optimizer.hpp"
+#include "opencv2/slam/pose.hpp"
+#include "opencv2/slam/visualizer.hpp"
+#include "opencv2/slam/vo.hpp"
+#include <thread>
+#include <mutex>
+#include <condition_variable>
+#include <atomic>
+#include <opencv2/calib3d.hpp>
+#include <iostream>
 #include <opencv2/imgproc.hpp>
 #include <opencv2/highgui.hpp>
-#include <opencv2/calib3d.hpp>
-#include <numeric>
+#include <opencv2/video/tracking.hpp>
+#include <filesystem>
+#include <chrono>
+#include <iomanip>
+#include <sstream>
+#include <cmath>
+#include <fstream>
+#include <algorithm>
 
 namespace cv {
 namespace vo {
 
-static Mat makeSE3(const Mat& R, const Mat& t) {
-    Mat T = Mat::eye(4, 4, CV_64F);
-    R.copyTo(T(Rect(0,0,3,3)));
-    t.copyTo(T(Rect(3,0,1,3)));
-    return T;
+VisualOdometry::VisualOdometry(Ptr<Feature2D> feature, Ptr<DescriptorMatcher> matcher)
+    : feature_(std::move(feature)), matcher_(std::move(matcher)) {
 }
 
-VisualOdometry::VisualOdometry(const Ptr<Feature2D>& feature,
-                               const Ptr<DescriptorMatcher>& matcher,
-                               const CameraIntrinsics& intrinsics,
-                               const VOParams& params)
-    : feature_(feature), matcher_(matcher), K_(intrinsics), params_(params) {
-    currentPoseSE3_ = Mat::eye(4,4,CV_64F);
-}
-
-bool VisualOdometry::processFrame(const Mat& img, double /*timestamp*/) {
-    frameCount_++;
-    if (!initialized_) {
-        if (lastImg_.empty()) {
-            lastImg_ = img.clone();
-            return false;
-        }
-        initialized_ = initializeTwoView(lastImg_, img);
-        lastImg_ = img.clone();
-        if (initialized_) trajectory_.push_back(currentPoseSE3_.clone());
-        return initialized_;
+int VisualOdometry::run(const std::string &imageDir, double scale_m, const VisualOdometryOptions &options){
+    DataLoader loader(imageDir);
+    std::cout << "VisualOdometry: loaded " << loader.size() << " images from " << imageDir << std::endl;
+    if(loader.size() == 0){
+        std::cerr << "VisualOdometry: no images found in " << imageDir << std::endl;
+        return -1;
     }
 
-    bool ok = trackWithPnP(img);
-    lastImg_ = img.clone();
-    if (ok) {
-        trajectory_.push_back(currentPoseSE3_.clone());
-        if (shouldInsertKeyframe()) {
-            // promote current frame to new keyframe using current features and PnP inliers
-            kfPoseSE3_ = currentPoseSE3_.clone();
-            kf_keypoints_ = cur_keypoints_;
-            kf_descriptors_ = cur_descriptors_.clone();
-            kf_kp_to_map_.assign((int)kf_keypoints_.size(), -1);
-                keyframePoses_.push_back(kfPoseSE3_.clone());
-                keyframeKeypoints_.push_back(kf_keypoints_);
-                keyframeDescriptors_.push_back(kf_descriptors_.clone());
-            // seed mapping for tracked correspondences
-            for (auto &pr : curFeat_to_map_inliers_) {
-                int curIdx = pr.first; int mpIdx = pr.second;
-                if (curIdx >=0 && curIdx < (int)kf_kp_to_map_.size()) kf_kp_to_map_[curIdx] = mpIdx;
-            }
-                // push kp->map history for BA
-                keyframeKpToMap_.push_back(kf_kp_to_map_);
-            triangulateWithLastKeyframe();
-            runLocalBAIfEnabled();
-        }
+    if(!feature_){
+        feature_ = ORB::create(2000);
     }
-    return ok;
-}
-
-Mat VisualOdometry::getCurrentPose() const { return currentPoseSE3_.clone(); }
-std::vector<Mat> VisualOdometry::getTrajectory() const { return trajectory_; }
-
-void VisualOdometry::setEnableBackend(bool on) { backendEnabled_ = on; }
-void VisualOdometry::setWindowSize(int N) { params_.localWindowSize = N; }
-void VisualOdometry::setBAParams(double reprojThresh, int maxIters) {
-    params_.reprojErrThresh = reprojThresh;
-    params_.baMaxIters = std::max(1, maxIters);
-}
-void VisualOdometry::setBackendType(int type) { params_.backendType = type; }
-void VisualOdometry::setMode(Mode m) { mode_ = m; }
-bool VisualOdometry::saveMap(const std::string& /*path*/) const { return false; }
-bool VisualOdometry::loadMap(const std::string& /*path*/) { return false; }
-void VisualOdometry::enableLoopClosure(bool on) { loopClosureEnabled_ = on; }
-void VisualOdometry::setPlaceRecognizer(const Ptr<Feature2D>& /*vocabFeature*/) {}
-
-bool VisualOdometry::initializeTwoView(const Mat& img0, const Mat& img1) {
-    std::vector<KeyPoint> k0, k1; Mat d0, d1;
-    feature_->detectAndCompute(img0, noArray(), k0, d0);
-    feature_->detectAndCompute(img1, noArray(), k1, d1);
-    if (k0.size() < 50 || k1.size() < 50) return false;
-
-    std::vector<std::vector<DMatch>> knn01; matcher_->knnMatch(d0, d1, knn01, 2);
-    std::vector<DMatch> good;
-    for (auto& v : knn01) if (v.size()>=2 && v[0].distance < 0.75 * v[1].distance) good.push_back(v[0]);
-    if (good.size() < 80) return false;
-
-    std::vector<Point2f> p0, p1;
-    p0.reserve(good.size()); p1.reserve(good.size());
-    for (auto& m : good) { p0.push_back(k0[m.queryIdx].pt); p1.push_back(k1[m.trainIdx].pt); }
-
-    Mat mask;
-    Mat E = findEssentialMat(p0, p1, K_.K, RANSAC, params_.ransacProb, params_.ransacThresh, mask);
-    if (E.empty()) return false;
-
-    Mat R, t;
-    int inliers = recoverPose(E, p0, p1, K_.K, R, t, mask);
-    if (inliers < params_.minInitInliers) return false;
-
-    // Set first pose = Identity, second = (R,t)
-    currentPoseSE3_ = makeSE3(R, t);
-
-    // Minimal triangulation demo (no storage of per-point observations yet)
-    Mat P0 = K_.K * Mat::eye(3,4,CV_64F);
-    Mat P1(3,4,CV_64F); R.copyTo(P1(Rect(0,0,3,3))); t.copyTo(P1(Rect(3,0,1,3))); P1 = K_.K * P1;
-
-    std::vector<Point2f> tp0, tp1; tp0.reserve(inliers); tp1.reserve(inliers);
-    std::vector<int> inlier_trainIdx; inlier_trainIdx.reserve(inliers);
-    for (size_t i=0;i<good.size();++i) if (mask.at<uchar>(int(i))) {
-        tp0.push_back(p0[i]); tp1.push_back(p1[i]);
-        inlier_trainIdx.push_back(good[i].trainIdx);
+    if(!matcher_){
+        matcher_ = DescriptorMatcher::create(DescriptorMatcher::BRUTEFORCE_HAMMING);
     }
-    if (tp0.size() >= 20) {
-        Mat X4;
-        triangulatePoints(P0, P1, tp0, tp1, X4);
-        // initialize KF as second frame
-        kf_keypoints_ = k1;
-        kf_descriptors_ = d1.clone();
-        kf_kp_to_map_.assign((int)kf_keypoints_.size(), -1);
-        kfPoseSE3_ = currentPoseSE3_.clone();
-        for (int i=0;i<X4.cols;i++) {
-            Vec4d h = X4.col(i);
-            if (std::abs(h[3]) < 1e-8) continue;
-            Point3d X(h[0]/h[3], h[1]/h[3], h[2]/h[3]);
-            if (X.z > 0) {
-                int mpIndex = (int)mapPoints_.size();
-                mapPoints_.push_back(X);
-                int trainIdx = inlier_trainIdx[i];
-                if (trainIdx >=0 && trainIdx < (int)kf_kp_to_map_.size())
-                    kf_kp_to_map_[trainIdx] = mpIndex;
-            }
-        }
+    // Remove internal FeatureExtractor/Matcher in favor of injected OpenCV components
+    PoseEstimator poseEst;
+    Visualizer vis;
+    MapManager map;
+    // two-view initializer
+    Initializer initializer;
+    // configure Localizer with a slightly stricter Lowe ratio (0.7)
+    Localizer localizer(0.7f);
+
+    // prepare per-run CSV diagnostics
+    std::string runTimestamp;
+    {
+        auto now = std::chrono::system_clock::now();
+        std::time_t t = std::chrono::system_clock::to_time_t(now);
+        std::tm tm = *std::localtime(&t);
+        std::ostringstream ss; ss << std::put_time(&tm, "%Y%m%d_%H%M%S");
+        runTimestamp = ss.str();
+    }
+    std::filesystem::path resultDir("../../result");
+    if(!std::filesystem::exists(resultDir)) std::filesystem::create_directories(resultDir);
+    // create a per-run folder under result/ named by timestamp
+    std::filesystem::path runDir = resultDir / runTimestamp;
+    if(!std::filesystem::exists(runDir)) std::filesystem::create_directories(runDir);
+    std::filesystem::path csvPath = runDir / std::string("run.csv");
+    std::ofstream csv(csvPath);
+    if(csv){
+        csv << "frame_id,mean_diff,median_flow,pre_matches,post_matches,inliers,inlier_ratio,integrated\n";
+        csv.flush();
+        std::cout << "Writing diagnostics to " << csvPath.string() << std::endl;
+    } else {
+        std::cerr << "Failed to open diagnostics CSV " << csvPath.string() << std::endl;
     }
-    return true;
-}
 
-bool VisualOdometry::trackWithPnP(const Mat& img) {
-    cur_keypoints_.clear();
-    feature_->detectAndCompute(img, noArray(), cur_keypoints_, cur_descriptors_);
-    if (kf_descriptors_.empty() || cur_descriptors_.empty()) return false;
-
-    // Match KF -> current
-    std::vector<std::vector<DMatch>> knn;
-    matcher_->knnMatch(kf_descriptors_, cur_descriptors_, knn, 2);
-    std::vector<DMatch> good;
-    good.reserve(knn.size());
-    for (auto &v : knn) if (v.size()>=2 && v[0].distance < 0.75*v[1].distance) good.push_back(v[0]);
-
-    std::vector<Point3f> objPts; objPts.reserve(good.size());
-    std::vector<Point2f> imgPts; imgPts.reserve(good.size());
-    std::vector<int> curIdxOfCorr; curIdxOfCorr.reserve(good.size());
-    std::vector<int> mapIdxOfCorr; mapIdxOfCorr.reserve(good.size());
-
-    int unmatchedCount = 0;
-    for (auto &m : good) {
-        int kf_idx = m.queryIdx;
-        int mp_idx = (kf_idx >=0 && kf_idx < (int)kf_kp_to_map_.size()) ? kf_kp_to_map_[kf_idx] : -1;
-        if (mp_idx >= 0 && mp_idx < (int)mapPoints_.size()) {
-            const Point3d &Xd = mapPoints_[mp_idx];
-            objPts.emplace_back((float)Xd.x,(float)Xd.y,(float)Xd.z);
-            imgPts.push_back(cur_keypoints_[m.trainIdx].pt);
-            curIdxOfCorr.push_back(m.trainIdx);
-            mapIdxOfCorr.push_back(mp_idx);
-        } else {
-            unmatchedCount++;
+    Mat R_g = Mat::eye(3,3,CV_64F);
+    Mat t_g = Mat::zeros(3,1,CV_64F);
+
+    // simple map structures
+    std::vector<KeyFrame> keyframes;
+    std::vector<MapPoint> mappoints;
+    std::unordered_map<int,int> keyframeIdToIndex;
+
+    // Backend (BA) thread primitives
+    std::mutex mapMutex; // protects map and keyframe modifications and writeback
+    std::condition_variable backendCv;
+    std::atomic<bool> backendStop(false);
+    std::atomic<int> backendRequests(0);
+    const int LOCAL_BA_WINDOW = 5; // window size for local BA (adjustable)
+
+    // Start backend thread: waits for notifications and runs BA on a snapshot
+    std::thread backendThread([&]() {
+        while(!backendStop.load()){
+            std::unique_lock<std::mutex> lk(mapMutex);
+            backendCv.wait(lk, [&]{ return backendStop.load() || backendRequests.load() > 0; });
+            if(backendStop.load()) break;
+            // snapshot map and keyframes
+            auto kfs_snapshot = map.keyframes();
+            auto mps_snapshot = map.mappoints();
+            // reset requests
+            backendRequests.store(0);
+            lk.unlock();
+
+            // determine local window
+            int K = static_cast<int>(kfs_snapshot.size());
+            if(K <= 0) continue;
+            int start = std::max(0, K - LOCAL_BA_WINDOW);
+            std::vector<int> localKfIndices;
+            for(int ii = start; ii < K; ++ii) localKfIndices.push_back(ii);
+            std::vector<int> fixedKfIndices;
+            if(start > 0) fixedKfIndices.push_back(0);
+
+            // Run BA on snapshot (may take time) - uses Optimizer which will use g2o if enabled
+            Optimizer::localBundleAdjustmentSFM(kfs_snapshot, mps_snapshot, localKfIndices, fixedKfIndices,
+                                            loader.fx(), loader.fy(), loader.cx(), loader.cy(), 10);
+
+            // write back optimized poses/points into main map under lock using id-based lookup
+            std::lock_guard<std::mutex> lk2(mapMutex);
+            auto &kfs_ref = const_cast<std::vector<KeyFrame>&>(map.keyframes());
+            auto &mps_ref = const_cast<std::vector<MapPoint>&>(map.mappoints());
+            // copy back poses by id to ensure we update the authoritative containers
+            for(const auto &kf_opt : kfs_snapshot){
+                int idx = map.keyframeIndex(kf_opt.id);
+                if(idx >= 0 && idx < static_cast<int>(kfs_ref.size())){
+                    kfs_ref[idx].R_w = kf_opt.R_w.clone();
+                    kfs_ref[idx].t_w = kf_opt.t_w.clone();
+                }
+            }
+            // copy back mappoint positions by id
+            for(const auto &mp_opt : mps_snapshot){
+                if(mp_opt.id <= 0) continue;
+                int idx = map.mapPointIndex(mp_opt.id);
+                if(idx >= 0 && idx < static_cast<int>(mps_ref.size())){
+                    mps_ref[idx].p = mp_opt.p;
+                }
+            }
         }
-    }
-    unmatchedRatio_ = good.empty() ? 0.0 : (double)unmatchedCount / (double)good.size();
-    if (objPts.size() < 4) return false;
-
-    Mat rvec, tvec, R;
-    std::vector<int> inliers;
-    bool ok = solvePnPRansac(objPts, imgPts, K_.K, K_.dist, rvec, tvec, false,
-                                 100, params_.pnpReprojErr, 0.99, inliers, SOLVEPNP_ITERATIVE);
-    if (!ok || (int)inliers.size() < std::max(4, params_.pnpMinInliers)) return false;
-
-    Rodrigues(rvec, R);
-    currentPoseSE3_ = makeSE3(R, tvec);
-    lastPnPInliers_ = (int)inliers.size();
-
-    // keep inlier correspondences for KF mapping when inserting a new KF
-    curFeat_to_map_inliers_.clear();
-    curFeat_to_map_inliers_.reserve(inliers.size());
-    for (int idx : inliers) {
-        int curIdx = curIdxOfCorr[idx];
-        int mpIdx = mapIdxOfCorr[idx];
-        curFeat_to_map_inliers_.emplace_back(curIdx, mpIdx);
-    }
-    return true;
-}
+    });
+
+    Mat frame;
+    std::string imgPath;
+    int frame_id = 0;
+
+    // persistent previous-frame storage (declare outside loop so detectAndCompute can use them)
+    static std::vector<KeyPoint> prevKp;
+    static Mat prevGray, prevDesc;
+    while(loader.getNextImage(frame, imgPath)){
+        Mat gray = frame;
+        if(gray.channels() > 1) cvtColor(gray, gray, COLOR_BGR2GRAY);
+
+        std::vector<KeyPoint> kps;
+        Mat desc;
+        // Detect and compute descriptors using injected feature_ (e.g., ORB)
+        feature_->detect(gray, kps);
+        feature_->compute(gray, kps, desc);
+
+    // (previous-frame storage declared outside loop)
+
+        if(!prevGray.empty() && !prevDesc.empty() && !desc.empty()){
+            // KNN match with ratio test and mutual cross-check
+            std::vector<std::vector<DMatch>> knn12, knn21;
+            matcher_->knnMatch(prevDesc, desc, knn12, 2);
+            matcher_->knnMatch(desc, prevDesc, knn21, 2);
+            auto ratioKeep = [&](const std::vector<std::vector<DMatch>>& knn, bool forward) {
+                std::vector<DMatch> filtered;
+                for(size_t qi=0; qi<knn.size(); ++qi){
+                    if(knn[qi].empty()) continue;
+                    DMatch best = knn[qi][0];
+                    float ratio = 0.75f;
+                    if(knn[qi].size() >= 2){
+                        if(knn[qi][1].distance > 0) {
+                            if(best.distance / knn[qi][1].distance > ratio) continue;
+                        }
+                    }
+                    // mutual check
+                    int q = forward ? (int)qi : best.trainIdx;
+                    int t = forward ? best.trainIdx : (int)qi;
+                    // find reverse match for t
+                    const auto &rev = forward ? knn21 : knn12;
+                    if(t < 0 || t >= (int)rev.size() || rev[t].empty()) continue;
+                    DMatch rbest = rev[t][0];
+                    if((forward && rbest.trainIdx == (int)qi) || (!forward && rbest.trainIdx == best.queryIdx)){
+                        filtered.push_back(best);
+                    }
+                }
+                return filtered;
+            };
+            std::vector<DMatch> goodMatches = ratioKeep(knn12, true);
+
+            Mat imgMatches;
+            drawMatches(prevGray, prevKp, gray, kps, goodMatches, imgMatches,
+                            Scalar::all(-1), Scalar::all(-1), std::vector<char>(), DrawMatchesFlags::NOT_DRAW_SINGLE_POINTS);
+
+            std::vector<Point2f> pts1, pts2;
+            pts1.reserve(goodMatches.size()); pts2.reserve(goodMatches.size());
+            for(const auto &m: goodMatches){
+                pts1.push_back(prevKp[m.queryIdx].pt);
+                pts2.push_back(kps[m.trainIdx].pt);
+            }
 
-bool VisualOdometry::shouldInsertKeyframe() const {
-    // simple: periodic or tracking weakening
-    bool periodic = (frameCount_ % params_.keyframeInterval) == 0;
-    bool weakTracking = (lastPnPInliers_ > 0 && lastPnPInliers_ < params_.pnpMinInliers + 10);
-
-    // baseline & rotation criteria
-    auto extractRt = [](const Mat& T, Mat& R, Mat& t){ R = T(Rect(0,0,3,3)).clone(); t = T(Rect(3,0,1,3)).clone(); };
-    Mat R_prev, t_prev, R_cur, t_cur; extractRt(kfPoseSE3_, R_prev, t_prev); extractRt(currentPoseSE3_, R_cur, t_cur);
-    double baseline = norm(t_cur - t_prev);
-    Mat R_delta = R_prev.t() * R_cur;
-    double traceVal = R_delta.at<double>(0,0) + R_delta.at<double>(1,1) + R_delta.at<double>(2,2);
-    double rotAngle = std::acos(std::min(1.0, std::max(-1.0, (traceVal - 1.0) / 2.0))) * 180.0 / CV_PI;
-    bool baselineEnough = baseline > params_.keyframeMinBaseline;
-    bool rotationEnough = rotAngle > params_.keyframeMinRotationDeg;
-
-    // mapping expansion need: many unmatched candidate features
-    bool needExpansion = unmatchedRatio_ > 0.5; // heuristic
-
-    return periodic || weakTracking || baselineEnough || rotationEnough || needExpansion;
-}
+            // quick frame-diff to detect near-static frames
+            double meanDiff = 0.0;
+            if(!prevGray.empty()){
+                Mat diff; absdiff(gray, prevGray, diff);
+                meanDiff = mean(diff)[0];
+            }
 
-void VisualOdometry::triangulateWithLastKeyframe() {
-    if (kf_descriptors_.empty() || cur_descriptors_.empty()) return;
-
-    // Match KF -> current again to find candidates without map points
-    std::vector<std::vector<DMatch>> knn;
-    matcher_->knnMatch(kf_descriptors_, cur_descriptors_, knn, 2);
-    std::vector<Point2f> kfPts, curPts;
-    std::vector<int> kfIdxs;
-    for (auto &v : knn) {
-        if (v.size()>=2 && v[0].distance < 0.75*v[1].distance) {
-            int qi = v[0].queryIdx; int ti = v[0].trainIdx;
-            if (qi >=0 && qi < (int)kf_kp_to_map_.size() && kf_kp_to_map_[qi] == -1) {
-                kfPts.push_back(kf_keypoints_[qi].pt);
-                curPts.push_back(cur_keypoints_[ti].pt);
-                kfIdxs.push_back(qi);
+            // compute per-match flow magnitudes and median flow
+            std::vector<double> flows; flows.reserve(pts1.size());
+            double median_flow = 0.0;
+            for(size_t i=0;i<pts1.size();++i){
+                double dx = pts2[i].x - pts1[i].x;
+                double dy = pts2[i].y - pts1[i].y;
+                flows.push_back(std::sqrt(dx*dx + dy*dy));
+            }
+            if(!flows.empty()){
+                std::vector<double> tmp = flows;
+                size_t mid = tmp.size()/2;
+                std::nth_element(tmp.begin(), tmp.begin()+mid, tmp.end());
+                median_flow = tmp[mid];
             }
-        }
-    }
-    if (kfPts.size() < 15) return;
-
-    auto extractRt = [](const Mat& T, Mat& R, Mat& t){
-        R = T(Rect(0,0,3,3)).clone();
-        t = T(Rect(3,0,1,3)).clone();
-    };
-    Mat R1,t1,R2,t2; extractRt(kfPoseSE3_, R1,t1); extractRt(currentPoseSE3_, R2,t2);
-
-    Mat P1(3,4,CV_64F), P2(3,4,CV_64F);
-    R1.copyTo(P1(Rect(0,0,3,3))); t1.copyTo(P1(Rect(3,0,1,3)));
-    R2.copyTo(P2(Rect(0,0,3,3))); t2.copyTo(P2(Rect(3,0,1,3)));
-    P1 = K_.K * P1; P2 = K_.K * P2;
-
-    Mat X4; triangulatePoints(P1, P2, kfPts, curPts, X4);
-
-    auto reprojErr = [&](const Point3d& X, const Mat& R, const Mat& t, const Point2f& uv){
-        Mat Xv = (Mat_<double>(3,1) << X.x,X.y,X.z);
-        Mat x = K_.K * (R*Xv + t);
-        double u = x.at<double>(0)/x.at<double>(2);
-        double v = x.at<double>(1)/x.at<double>(2);
-        double du = u - uv.x; double dv = v - uv.y; return std::sqrt(du*du+dv*dv);
-    };
-
-    for (int i=0;i<X4.cols;i++) {
-        double hx = X4.at<double>(0,i);
-        double hy = X4.at<double>(1,i);
-        double hz = X4.at<double>(2,i);
-        double hw = X4.at<double>(3,i);
-        if (std::abs(hw) < 1e-8) continue;
-        Point3d X(hx/hw, hy/hw, hz/hw);
-        // positive depth check (in both views)
-        Mat R1_,t1_,R2_,t2_;
-        R1_ = R1; t1_ = t1; R2_ = R2; t2_ = t2;
-        Mat Xv = (Mat_<double>(3,1) << X.x,X.y,X.z);
-        Mat Y1 = R1_*Xv + t1_;
-        Mat Y2 = R2_*Xv + t2_;
-        double z1 = Y1.ptr<double>(2)[0];
-        double z2 = Y2.ptr<double>(2)[0];
-        if (z1 <= 0 || z2 <= 0) continue;
-        double e1 = reprojErr(X, R1, t1, kfPts[i]);
-        double e2 = reprojErr(X, R2, t2, curPts[i]);
-        if (e1 > params_.reprojErrThresh || e2 > params_.reprojErrThresh) continue;
-        int mpIndex = (int)mapPoints_.size();
-        mapPoints_.push_back(X);
-        int kf_kp = kfIdxs[i];
-        if (kf_kp >=0 && kf_kp < (int)kf_kp_to_map_.size()) kf_kp_to_map_[kf_kp] = mpIndex;
-    }
-}
 
-void VisualOdometry::runLocalBAIfEnabled() {
-    if (!backendEnabled_) return;
-    // Collect recent keyframes and build observations for map points
-    int N = std::max(2, params_.localWindowSize);
-    int totalKFs = (int)keyframePoses_.size();
-    if (totalKFs < 2) return;
-    int startIdx = std::max(0, totalKFs - N);
-
-    // Build KeyFrame vector for optimizer
-    std::vector<KeyFrame> kfs;
-    kfs.reserve(totalKFs - startIdx);
-    for (int i = startIdx; i < totalKFs; ++i) {
-        KeyFrame kf;
-        kf.id = i; // use history index as id
-        kf.kps = keyframeKeypoints_[i];
-        kf.desc = keyframeDescriptors_[i];
-        // extract R,t from SE3 4x4
-        const Mat &T = keyframePoses_[i];
-        Mat R = T(Rect(0,0,3,3)).clone();
-        Mat t = T(Rect(3,0,1,3)).clone();
-        kf.R_w = R; kf.t_w = t;
-        kfs.push_back(kf);
-    }
+            int pre_matches = static_cast<int>(goodMatches.size());
+            int post_matches = pre_matches;
+
+            // Two-view initialization: if map is empty and this is the second frame, try to bootstrap
+            if(map.keyframes().empty() && frame_id == 1){
+                std::cout << "Attempting two-view initialization (frame 0 + 1), matches=" << goodMatches.size() << std::endl;
+                Mat R_init, t_init;
+                std::vector<Point3d> pts3D;
+                std::vector<bool> isTri;
+                // call initializer using the matched keypoints between prev and current
+                if(initializer.initialize(prevKp, kps, goodMatches, loader.fx(), loader.fy(), loader.cx(), loader.cy(), R_init, t_init, pts3D, isTri)){
+                    std::cout << "Initializer: success, creating initial keyframes and mappoints (" << pts3D.size() << ")" << std::endl;
+                    // build two keyframes: previous (id = frame_id-1) and current (id = frame_id)
+                    KeyFrame kf0, kf1;
+                    kf0.id = frame_id - 1;
+                    // prevGray/prevKp/prevDesc refer to previous frame
+                    if(!prevGray.empty()){
+                        if(prevGray.channels() == 1){ cvtColor(prevGray, kf0.image, COLOR_GRAY2BGR); }
+                        else kf0.image = prevGray.clone();
+                    }
+                    kf0.kps = prevKp;
+                    kf0.desc = prevDesc.clone();
+                    kf0.R_w = Mat::eye(3,3,CV_64F);
+                    kf0.t_w = Mat::zeros(3,1,CV_64F);
+
+                    kf1.id = frame_id;
+                    kf1.image = frame.clone();
+                    kf1.kps = kps;
+                    kf1.desc = desc.clone();
+                    // initializer returns pose of second camera relative to first (world = first)
+                    kf1.R_w = R_init.clone();
+                    kf1.t_w = t_init.clone();
+
+                    // convert initializer 3D points (in first camera frame) to MapPoints in world coords (world==first)
+                    std::vector<MapPoint> newMps;
+                    newMps.reserve(pts3D.size());
+                    for(size_t i=0;i<pts3D.size();++i){
+                        if(!isTri[i]) continue;
+                        MapPoint mp;
+                        mp.p = pts3D[i];
+                        // observation indices come from goodMatches order
+                        if(i < goodMatches.size()){
+                            const DMatch &m = goodMatches[i];
+                            mp.observations.emplace_back(kf0.id, m.queryIdx);
+                            mp.observations.emplace_back(kf1.id, m.trainIdx);
+                        }
+                        newMps.push_back(mp);
+                    }
+
+                    {
+                        std::lock_guard<std::mutex> lk(mapMutex);
+                        keyframes.push_back(std::move(kf0));
+                        map.addKeyFrame(keyframes.back());
+                        keyframes.push_back(std::move(kf1));
+                        map.addKeyFrame(keyframes.back());
+                        if(!newMps.empty()) map.addMapPoints(newMps);
+                    }
+
+                    // set global pose to second keyframe (apply scale)
+                    Mat t_d; kf1.t_w.convertTo(t_d, CV_64F);
+                    t_g = t_d * scale_m;
+                    R_g = kf1.R_w.clone();
+                    double x = t_g.at<double>(0);
+                    double z = t_g.at<double>(2);
+                    vis.addPose(x,-z);
+
+                    // write CSV entry for initialization frame
+                    if(csv){
+                        csv << frame_id << ",init,0,0,0,0,0,1\n";
+                        csv.flush();
+                    }
+
+                    // notify backend to run BA on initial map
+                    backendRequests.fetch_add(1);
+                    backendCv.notify_one();
+                    // skip the usual PnP / poseEst path for this frame since we've initialized
+                    prevGray = gray.clone(); prevKp = kps; prevDesc = desc.clone();
+                    frame_id++;
+                    continue;
+                } else {
+                    std::cout << "Initializer: failed to initialize from first two frames" << std::endl;
+                }
+            }
 
-    // Build MapPoint vector with observations from selected window
-    std::vector<MapPoint> mps;
-    mps.reserve(mapPoints_.size());
-    // Track which points are observed within the window
-    std::vector<char> pointObserved(mapPoints_.size(), 0);
-    for (int i = startIdx; i < totalKFs; ++i) {
-        const auto &kp2mp = keyframeKpToMap_[i];
-        for (int kpIdx = 0; kpIdx < (int)kp2mp.size(); ++kpIdx) {
-            int mpIdx = kp2mp[kpIdx];
-            if (mpIdx >= 0 && mpIdx < (int)mapPoints_.size()) {
-                pointObserved[mpIdx] = 1;
+            // Try PnP against map points first (via Localizer)
+            bool solvedByPnP = false;
+            Mat R_pnp, t_pnp; int inliers_pnp = 0;
+            int preMatches_pnp = 0, postMatches_pnp = 0; double meanReproj_pnp = 0.0;
+            if(localizer.tryPnP(map, desc, kps, loader.fx(), loader.fy(), loader.cx(), loader.cy(), gray.cols, gray.rows,
+                                options.min_inliers, R_pnp, t_pnp, inliers_pnp, frame_id, &frame, runDir.string(),
+                                &preMatches_pnp, &postMatches_pnp, &meanReproj_pnp)){
+                solvedByPnP = true;
+                std::cout << "PnP solved: preMatches="<<preMatches_pnp<<" post="<<postMatches_pnp<<" inliers="<<inliers_pnp<<" meanReproj="<<meanReproj_pnp<<std::endl;
             }
-        }
-    }
-    // Create mps with observations
-    for (size_t mpIdx = 0; mpIdx < mapPoints_.size(); ++mpIdx) {
-        if (!pointObserved[mpIdx]) continue; // only optimize observed points
-        MapPoint mp;
-        mp.id = (int)mpIdx;
-        mp.p = mapPoints_[mpIdx];
-        for (int i = startIdx; i < totalKFs; ++i) {
-            const auto &kp2mp = keyframeKpToMap_[i];
-            if ((int)kp2mp.size() == 0) continue;
-            for (int kpIdx = 0; kpIdx < (int)kp2mp.size(); ++kpIdx) {
-                if (kp2mp[kpIdx] == (int)mpIdx) {
-                    mp.observations.emplace_back(i, kpIdx);
+
+            if(pts1.size() >= 8 && !solvedByPnP){
+                Mat R, t, mask; int inliers = 0;
+                bool ok = poseEst.estimate(pts1, pts2, loader.fx(), loader.fy(), loader.cx(), loader.cy(), R, t, mask, inliers);
+
+                int matchCount = post_matches;
+                double inlierRatio = matchCount > 0 ? double(inliers) / double(matchCount) : 0.0;
+
+                // thresholds (tunable) -- relaxed and add absolute inlier guard
+                const int MIN_MATCHES = 15;           // require at least this many matches (relative)
+                const int MIN_INLIERS = 4;             // OR accept if at least this many absolute inliers
+                double t_norm = 0.0, rot_angle = 0.0;
+                if(ok){
+                    Mat t_d; t.convertTo(t_d, CV_64F);
+                    t_norm = norm(t_d);
+                    Mat R_d; R.convertTo(R_d, CV_64F);
+                    double trace = R_d.at<double>(0,0) + R_d.at<double>(1,1) + R_d.at<double>(2,2);
+                    double cos_angle = std::min(1.0, std::max(-1.0, (trace - 1.0) * 0.5));
+                    rot_angle = std::acos(cos_angle);
+                }
+
+                // Print per-frame diagnostics
+                // std::cout << "F" << frame_id << " diff=" << meanDiff << " median_flow=" << median_flow
+                //           << " pre_matches=" << pre_matches << " post_matches=" << matchCount << " inliers=" << inliers << " inlierRatio=" << inlierRatio
+                //           << " t_norm=" << t_norm << " rot_rad=" << rot_angle << std::endl;
+
+                // decide whether to integrate
+                // Prefer geometry-based decision (absolute inliers OR matchCount + ratio). Use image-diff/flow
+                // only to skip when geometry is weak or motion truly negligible.
+                bool integrate = true;
+                if(!ok){
+                    integrate = false;
+                    // std::cout << "  -> pose estimation failed, skipping integration." << std::endl;
+                } else if(inliers < MIN_INLIERS || matchCount < MIN_MATCHES){
+                    // Not enough geometric support -> skip (unless absolute inliers pass)
+                    integrate = false;
+                    // std::cout << "  -> insufficient matches/inliers (by both absolute and relative metrics), skipping integration." << std::endl;
+                } else {
+                    // We have sufficient geometric support. Only skip if motion is truly negligible
+                    // (both translation and rotation tiny) AND the image/flow indicate near-identical frames.
+                    const double MIN_TRANSLATION_NORM = 1e-4;
+                    const double MIN_ROTATION_RAD = (0.5 * CV_PI / 180.0); // 0.5 degree
+                    const double DIFF_ZERO_THRESH = 2.0;   // nearly identical image
+                    const double FLOW_ZERO_THRESH = 0.3;   // nearly zero flow in pixels
+
+                    if(t_norm < MIN_TRANSLATION_NORM && std::abs(rot_angle) < MIN_ROTATION_RAD
+                       && meanDiff < DIFF_ZERO_THRESH && median_flow < FLOW_ZERO_THRESH){
+                        integrate = false; // truly static
+                        // std::cout << "  -> negligible motion and near-identical frames, skipping integration." << std::endl;
+                    }
+                }
+                if (inliers >= options.min_inliers || (inliers >= 2 && matchCount > 50 && median_flow > 2.0)) {
+                    integrate = true;
+                }
+
+                // integrate transform if allowed
+                if(integrate){
+                    Mat t_d; t.convertTo(t_d, CV_64F);
+                    Mat t_scaled = t_d * scale_m;
+                    Mat R_d; R.convertTo(R_d, CV_64F);
+                    t_g = t_g + R_g * t_scaled;
+                    R_g = R_g * R_d;
+                    double x = t_g.at<double>(0);
+                    double z = t_g.at<double>(2);
+                    vis.addPose(x,-z);
                 }
+
+                    // if we integrated, create a keyframe and optionally triangulate new map points
+                if(integrate){
+                    KeyFrame kf;
+                    kf.id = frame_id;
+                    kf.image = frame.clone();
+                    kf.kps = kps;
+                    kf.desc = desc.clone();
+                    kf.R_w = R_g.clone(); kf.t_w = t_g.clone();
+
+                    bool didTriangulate = false;
+                    if(!map.keyframes().empty() && map.keyframes().back().id == frame_id - 1){
+                        // triangulate between last keyframe and this frame using normalized coordinates
+                        const KeyFrame &last = map.keyframes().back();
+                        std::vector<Point2f> pts1n, pts2n; pts1n.reserve(pts1.size()); pts2n.reserve(pts2.size());
+                        double fx = loader.fx(), fy = loader.fy(), cx = loader.cx(), cy = loader.cy();
+                        for(size_t i=0;i<pts1.size();++i){
+                            pts1n.emplace_back(float((pts1[i].x - cx)/fx), float((pts1[i].y - cy)/fy));
+                            pts2n.emplace_back(float((pts2[i].x - cx)/fx), float((pts2[i].y - cy)/fy));
+                        }
+                        // build kp index lists (matching goodMatches order)
+                        std::vector<int> pts1_kp_idx; pts1_kp_idx.reserve(goodMatches.size());
+                        std::vector<int> pts2_kp_idx; pts2_kp_idx.reserve(goodMatches.size());
+                        for(const auto &m: goodMatches){ pts1_kp_idx.push_back(m.queryIdx); pts2_kp_idx.push_back(m.trainIdx); }
+                        auto newPts = map.triangulateBetweenLastTwo(pts1n, pts2n, pts1_kp_idx, pts2_kp_idx, last, keyframes.empty() ? kf : keyframes.back(), fx, fy, cx, cy);
+                        if(!newPts.empty()){
+                            didTriangulate = true;
+                            // already appended inside MapManager
+                        }
+                    }
+
+                    {
+                        // insert keyframe and map points under lock to keep consistent state
+                        std::lock_guard<std::mutex> lk(mapMutex);
+                        keyframes.push_back(std::move(kf));
+                        map.addKeyFrame(keyframes.back());
+                    }
+                    if(didTriangulate){
+                        std::cout << "Created keyframe " << frame_id << " and triangulated new map points (total=" << map.mappoints().size() << ")" << std::endl;
+                    } else {
+                        std::cout << "Created keyframe " << frame_id << " (no triangulation)" << std::endl;
+                    }
+                    // Notify backend thread to run local BA asynchronously
+                    backendRequests.fetch_add(1);
+                    backendCv.notify_one();
+                }
+
+                // write CSV line
+                if(csv){
+                    csv << frame_id << "," << meanDiff << "," << median_flow << "," << pre_matches << "," << post_matches << "," << inliers << "," << inlierRatio << "," << (integrate?1:0) << "\n";
+                    csv.flush();
+                }
+
+                // Always show a single image; if we have matches, draw small boxes around matched keypoints
+                Mat visImg;
+                if(frame.channels() > 1) visImg = frame.clone();
+                else cvtColor(gray, visImg, COLOR_GRAY2BGR);
+                std::string info = std::string("Frame ") + std::to_string(frame_id) + " matches=" + std::to_string(matchCount) + " inliers=" + std::to_string(inliers);
+                if(!goodMatches.empty()){
+                    for(size_t mi=0; mi<goodMatches.size(); ++mi){
+                        Point2f p2 = (mi < pts2.size()) ? pts2[mi] : kps[goodMatches[mi].trainIdx].pt;
+
+                        // determine inlier status from mask (robust to mask shape)
+                        bool isInlier = false;
+                        if(!mask.empty()){
+                            if(mask.rows == static_cast<int>(goodMatches.size())){
+                                isInlier = mask.at<uchar>(static_cast<int>(mi), 0) != 0;
+                            } else if(mask.cols == static_cast<int>(goodMatches.size())){
+                                isInlier = mask.at<uchar>(0, static_cast<int>(mi)) != 0;
+                            }
+                        }
+                        Scalar col = isInlier ? Scalar(0,255,0) : Scalar(0,0,255);
+                        Point ip(cvRound(p2.x), cvRound(p2.y));
+                        Rect r(ip - Point(4,4), Size(8,8));
+                        rectangle(visImg, r, col, 2, LINE_AA);
+                    }
+                }
+                putText(visImg, info, Point(10,20), FONT_HERSHEY_SIMPLEX, 0.6, Scalar(0,255,0), 2);
+                vis.showFrame(visImg);
+
+            } else {
+                vis.showFrame(gray);
             }
+        } else {
+            Mat visFrame; drawKeypoints(gray, kps, visFrame, Scalar::all(-1), DrawMatchesFlags::DRAW_RICH_KEYPOINTS);
+            vis.showFrame(visFrame);
         }
-        if (!mp.observations.empty()) mps.push_back(mp);
-    }
 
-    if (kfs.size() < 2 || mps.empty()) return;
-
-    // Local/fixed KF indices relative to full history ids
-    std::vector<int> localKfIndices;
-    localKfIndices.reserve(kfs.size());
-    for (const auto &kf : kfs) localKfIndices.push_back(kf.id);
-    // Fix the oldest KF in the window to anchor optimization
-    std::vector<int> fixedKfIndices = { startIdx };
-
-    // Select backend
-
-    if (params_.backendType == 0) {
-    #ifndef USE_G2O
-        CV_Error(Error::StsBadArg, "G2O backend is not available (not built with SLAM module)");
-    #else
-        Optimizer::localBundleAdjustment(
-            kfs, mps, localKfIndices, fixedKfIndices,
-            K_.K.at<double>(0,0), K_.K.at<double>(1,1), K_.K.at<double>(0,2), K_.K.at<double>(1,2),
-            params_.baMaxIters);
-    #endif
-    } else
-    {
-        Optimizer::localBundleAdjustmentSFM(
-            kfs, mps, localKfIndices, fixedKfIndices,
-            K_.K.at<double>(0,0), K_.K.at<double>(1,1), K_.K.at<double>(0,2), K_.K.at<double>(1,2),
-            params_.baMaxIters);
+        vis.showTopdown();
+        // update prev
+        prevGray = gray.clone(); prevKp = kps; prevDesc = desc.clone();
+        frame_id++;
+        char key = (char)waitKey(1);
+        if(key == 27) break;
     }
 
-    // Write back optimized poses and points
-    for (const auto &kf : kfs) {
-        int i = kf.id;
-        Mat T = Mat::eye(4,4,CV_64F);
-        kf.R_w.copyTo(T(Rect(0,0,3,3)));
-        kf.t_w.copyTo(T(Rect(3,0,1,3)));
-        if (i >= 0 && i < totalKFs) keyframePoses_[i] = T.clone();
-        if (i == totalKFs - 1) { // also update current KF pose cache
-            kfPoseSE3_ = T.clone();
-            currentPoseSE3_ = T.clone();
-        }
-    }
-    for (const auto &mp : mps) {
-        if (mp.id >= 0 && mp.id < (int)mapPoints_.size()) {
-            mapPoints_[mp.id] = mp.p;
+    // save trajectory with timestamp into result/ folder
+    try{
+        // save trajectory into the per-run folder using a simple filename (no timestamp)
+        std::filesystem::path outDir = resultDir / runTimestamp;
+        if(!std::filesystem::exists(outDir)) std::filesystem::create_directories(outDir);
+        std::filesystem::path outPath = outDir / std::string("trajectory.png");
+        if(vis.saveTrajectory(outPath.string())){
+            std::cout << "Saved trajectory to " << outPath.string() << std::endl;
+        } else {
+            std::cerr << "Failed to save trajectory to " << outPath.string() << std::endl;
         }
+    } catch(const std::exception &e){
+        std::cerr << "Error saving trajectory: " << e.what() << std::endl;
     }
+
+    // Shutdown backend thread gracefully
+    backendStop.store(true);
+    backendCv.notify_one();
+    if(backendThread.joinable()) backendThread.join();
+
+    return 0;
 }
 
 } // namespace vo

From 654366d34a2c5d3ba371d7fc71177ca574b9123d Mon Sep 17 00:00:00 2001
From: Xuanrui Zhu <634210954@qq.com>
Date: Thu, 4 Dec 2025 07:08:25 +0000
Subject: [PATCH 04/10] Add CMakeLists.txt

---
 modules/slam/CMakeLists.txt      | 30 ++++++++++++++++++++++++++++++
 modules/slam/src/data_loader.cpp |  6 +++---
 modules/slam/src/keyframe.cpp    |  0
 3 files changed, 33 insertions(+), 3 deletions(-)
 create mode 100644 modules/slam/CMakeLists.txt
 delete mode 100644 modules/slam/src/keyframe.cpp

diff --git a/modules/slam/CMakeLists.txt b/modules/slam/CMakeLists.txt
new file mode 100644
index 0000000000..747dcb37cf
--- /dev/null
+++ b/modules/slam/CMakeLists.txt
@@ -0,0 +1,30 @@
+set(the_description "SLAM module: visual odometry / mapping / localization utilities")
+
+# Core dependencies used by the sources (see includes in src/ and include/)
+ocv_define_module(slam
+	opencv_core
+	opencv_imgproc
+	opencv_calib3d
+	opencv_features2d
+	OPTIONAL opencv_sfm
+	opencv_imgcodecs
+	opencv_highgui
+	opencv_video
+	WRAP python
+)
+
+# Ensure C++17 is enabled for this module (required for <filesystem>)
+if(TARGET ${the_module})
+	set_target_properties(${the_module} PROPERTIES CXX_STANDARD 17 CXX_STANDARD_REQUIRED ON)
+	# For older GCC/libstdc++ (<9) we may need to link stdc++fs
+	if(CMAKE_CXX_COMPILER_ID STREQUAL "GNU" AND CMAKE_CXX_COMPILER_VERSION VERSION_LESS "9.0")
+		target_link_libraries(${the_module} PRIVATE stdc++fs)
+	endif()
+endif()
+
+# If you need to add special include directories, libraries or compile flags,
+# add them below using the OpenCV contrib module helper macros, for example:
+#
+# ocv_include_directories(${CMAKE_CURRENT_LIST_DIR}/include)
+# ocv_module_compile_options(-Wall)
+#
diff --git a/modules/slam/src/data_loader.cpp b/modules/slam/src/data_loader.cpp
index 1488e9a02a..8deb8e9c26 100644
--- a/modules/slam/src/data_loader.cpp
+++ b/modules/slam/src/data_loader.cpp
@@ -11,7 +11,7 @@ namespace vo {
 DataLoader::DataLoader(const std::string &imageDir)
     : currentIndex(0), fx_(700.0), fy_(700.0), cx_(0.5), cy_(0.5)
 {
-    // 使用 std::filesystem 先检查目录是否存在
+    // Use std::filesystem to check whether the directory exists first
     try {
         std::filesystem::path p(imageDir);
         if(!std::filesystem::exists(p) || !std::filesystem::is_directory(p)){
@@ -23,7 +23,7 @@ DataLoader::DataLoader(const std::string &imageDir)
         // fallthrough to try glob
     }
 
-    // 使用 glob 列出文件，捕获可能的 OpenCV 异常
+    // Use glob to list files, catching any possible OpenCV exceptions
     try {
         glob(imageDir + "/*", imageFiles, false);
     } catch(const Exception &e){
@@ -37,7 +37,7 @@ DataLoader::DataLoader(const std::string &imageDir)
         return;
     }
 
-    // 尝试在 imageDir 或其上一级目录寻找 sensor.yaml
+    // Try to find sensor.yaml in imageDir or its parent directory
     std::filesystem::path p(imageDir);
     std::string yaml1 = (p / "sensor.yaml").string();
     std::string yaml2 = (p.parent_path() / "sensor.yaml").string();
diff --git a/modules/slam/src/keyframe.cpp b/modules/slam/src/keyframe.cpp
deleted file mode 100644
index e69de29bb2..0000000000

From 9b7309ab5a1fa358dae818fcb8311d2e4268887e Mon Sep 17 00:00:00 2001
From: Xuanrui Zhu <634210954@qq.com>
Date: Thu, 4 Dec 2025 18:35:57 +0000
Subject: [PATCH 05/10] Address link issue

---
 modules/slam/include/opencv2/slam/vo.hpp | 26 ++++++++++++------------
 modules/slam/src/vo.cpp                  |  3 ++-
 2 files changed, 15 insertions(+), 14 deletions(-)

diff --git a/modules/slam/include/opencv2/slam/vo.hpp b/modules/slam/include/opencv2/slam/vo.hpp
index 31681ed1a6..5172edb74d 100644
--- a/modules/slam/include/opencv2/slam/vo.hpp
+++ b/modules/slam/include/opencv2/slam/vo.hpp
@@ -7,22 +7,22 @@
 namespace cv {
 namespace vo {
 
-struct VisualOdometryOptions {
-    int min_matches = 15;
-    int min_inliers = 4;
-    double min_inlier_ratio = 0.1;
-    double diff_zero_thresh = 2.0;
-    double flow_zero_thresh = 0.3;
-    double min_translation_norm = 1e-4;
-    double min_rotation_rad = 0.5 * CV_PI / 180.0;
-    int max_matches_keep = 500;
-    double flow_weight_lambda = 5.0;
+struct CV_EXPORTS_W_SIMPLE VisualOdometryOptions {
+    CV_PROP_RW int min_matches = 15;
+    CV_PROP_RW int min_inliers = 4;
+    CV_PROP_RW double min_inlier_ratio = 0.1;
+    CV_PROP_RW double diff_zero_thresh = 2.0;
+    CV_PROP_RW double flow_zero_thresh = 0.3;
+    CV_PROP_RW double min_translation_norm = 1e-4;
+    CV_PROP_RW double min_rotation_rad = 0.5 * CV_PI / 180.0;
+    CV_PROP_RW int max_matches_keep = 500;
+    CV_PROP_RW double flow_weight_lambda = 5.0;
 };
 
-class VisualOdometry {
+class CV_EXPORTS_W VisualOdometry {
 public:
-    VisualOdometry(cv::Ptr<cv::Feature2D> feature, cv::Ptr<cv::DescriptorMatcher> matcher);
-    int run(const std::string &imageDir, double scale_m = 1.0, const VisualOdometryOptions &options = VisualOdometryOptions());
+    CV_WRAP VisualOdometry(cv::Ptr<cv::Feature2D> feature, cv::Ptr<cv::DescriptorMatcher> matcher);
+    CV_WRAP int run(const std::string &imageDir, double scale_m = 1.0, const VisualOdometryOptions &options = VisualOdometryOptions());
 private:
     cv::Ptr<cv::Feature2D> feature_;
     cv::Ptr<cv::DescriptorMatcher> matcher_;
diff --git a/modules/slam/src/vo.cpp b/modules/slam/src/vo.cpp
index 0bd730ac51..7532ece628 100644
--- a/modules/slam/src/vo.cpp
+++ b/modules/slam/src/vo.cpp
@@ -65,7 +65,8 @@ int VisualOdometry::run(const std::string &imageDir, double scale_m, const Visua
         std::ostringstream ss; ss << std::put_time(&tm, "%Y%m%d_%H%M%S");
         runTimestamp = ss.str();
     }
-    std::filesystem::path resultDir("../../result");
+    // create a 'result' folder inside the provided imageDir (use filesystem join to be robust)
+    std::filesystem::path resultDir = std::filesystem::path(imageDir) / "result";
     if(!std::filesystem::exists(resultDir)) std::filesystem::create_directories(resultDir);
     // create a per-run folder under result/ named by timestamp
     std::filesystem::path runDir = resultDir / runTimestamp;

From d53fa3cbe7739b22683ca62b61ee0eb675701c52 Mon Sep 17 00:00:00 2001
From: Xuanrui Zhu <634210954@qq.com>
Date: Fri, 5 Dec 2025 06:12:43 +0000
Subject: [PATCH 06/10] Fix cxx standard build error

---
 modules/slam/src/data_loader.cpp | 52 ++++++++++++++++++++++++++++----
 1 file changed, 46 insertions(+), 6 deletions(-)

diff --git a/modules/slam/src/data_loader.cpp b/modules/slam/src/data_loader.cpp
index 8deb8e9c26..aedfc79e90 100644
--- a/modules/slam/src/data_loader.cpp
+++ b/modules/slam/src/data_loader.cpp
@@ -1,6 +1,21 @@
 #include "opencv2/slam/data_loader.hpp"
 #include <opencv2/imgcodecs.hpp>
-#include <filesystem>
+#if defined(__has_include)
+#  if __has_include(<filesystem>)
+#    include <filesystem>
+#    define HAVE_STD_FILESYSTEM 1
+#    namespace fs = std::filesystem;
+#  elif __has_include(<experimental/filesystem>)
+#    include <experimental/filesystem>
+#    define HAVE_STD_FILESYSTEM 1
+#    namespace fs = std::experimental::filesystem;
+#  else
+#    define HAVE_STD_FILESYSTEM 0
+#  endif
+#else
+#  define HAVE_STD_FILESYSTEM 0
+#endif
+#include <sys/stat.h>
 #include <iostream>
 #include <fstream>
 #include <sstream>
@@ -11,10 +26,12 @@ namespace vo {
 DataLoader::DataLoader(const std::string &imageDir)
     : currentIndex(0), fx_(700.0), fy_(700.0), cx_(0.5), cy_(0.5)
 {
-    // Use std::filesystem to check whether the directory exists first
+    // Check whether the directory exists. Prefer std::filesystem when available,
+    // otherwise fall back to POSIX stat.
+#if HAVE_STD_FILESYSTEM
     try {
-        std::filesystem::path p(imageDir);
-        if(!std::filesystem::exists(p) || !std::filesystem::is_directory(p)){
+        fs::path p(imageDir);
+        if(!fs::exists(p) || !fs::is_directory(p)){
             std::cerr << "DataLoader: imageDir does not exist or is not a directory: " << imageDir << std::endl;
             return;
         }
@@ -22,6 +39,13 @@ DataLoader::DataLoader(const std::string &imageDir)
         std::cerr << "DataLoader: filesystem error checking imageDir: " << e.what() << std::endl;
         // fallthrough to try glob
     }
+#else
+    struct stat sb;
+    if(stat(imageDir.c_str(), &sb) != 0 || !S_ISDIR(sb.st_mode)){
+        std::cerr << "DataLoader: imageDir does not exist or is not a directory: " << imageDir << std::endl;
+        return;
+    }
+#endif
 
     // Use glob to list files, catching any possible OpenCV exceptions
     try {
@@ -37,13 +61,29 @@ DataLoader::DataLoader(const std::string &imageDir)
         return;
     }
 
-    // Try to find sensor.yaml in imageDir or its parent directory
-    std::filesystem::path p(imageDir);
+    // Try to find sensor.yaml in imageDir or its parent directory.
+    // Use filesystem paths when available; otherwise build paths with simple string ops.
+#if HAVE_STD_FILESYSTEM
+    fs::path p(imageDir);
     std::string yaml1 = (p / "sensor.yaml").string();
     std::string yaml2 = (p.parent_path() / "sensor.yaml").string();
     if(!loadIntrinsics(yaml1)){
         loadIntrinsics(yaml2); // best-effort
     }
+#else
+    auto make_parent_yaml = [](const std::string &dir)->std::string{
+        std::string tmp = dir;
+        if(!tmp.empty() && tmp.back() == '/') tmp.pop_back();
+        auto pos = tmp.find_last_of('/');
+        if(pos == std::string::npos) return std::string("sensor.yaml");
+        return tmp.substr(0, pos) + "/sensor.yaml";
+    };
+    std::string yaml1 = imageDir + "/sensor.yaml";
+    std::string yaml2 = make_parent_yaml(imageDir);
+    if(!loadIntrinsics(yaml1)){
+        loadIntrinsics(yaml2); // best-effort
+    }
+#endif
 }
 
 bool DataLoader::loadIntrinsics(const std::string &yamlPath){

From b96a45bc9901088424dd9cb184ae0b9e1139a40b Mon Sep 17 00:00:00 2001
From: Xuanrui Zhu <634210954@qq.com>
Date: Fri, 5 Dec 2025 07:20:21 +0000
Subject: [PATCH 07/10] Fix filesystem:: namespace issue

---
 modules/slam/src/data_loader.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/modules/slam/src/data_loader.cpp b/modules/slam/src/data_loader.cpp
index aedfc79e90..446c1485e5 100644
--- a/modules/slam/src/data_loader.cpp
+++ b/modules/slam/src/data_loader.cpp
@@ -4,11 +4,11 @@
 #  if __has_include(<filesystem>)
 #    include <filesystem>
 #    define HAVE_STD_FILESYSTEM 1
-#    namespace fs = std::filesystem;
+    namespace fs = std::filesystem;
 #  elif __has_include(<experimental/filesystem>)
 #    include <experimental/filesystem>
 #    define HAVE_STD_FILESYSTEM 1
-#    namespace fs = std::experimental::filesystem;
+    namespace fs = std::experimental::filesystem;
 #  else
 #    define HAVE_STD_FILESYSTEM 0
 #  endif

From 61470086d567fe2d69546257f00e175d5e2e9a08 Mon Sep 17 00:00:00 2001
From: Xuanrui Zhu <634210954@qq.com>
Date: Fri, 5 Dec 2025 08:16:29 +0000
Subject: [PATCH 08/10] Add function ensureDirectoryExists()

---
 .../slam/include/opencv2/slam/data_loader.hpp |  2 +
 modules/slam/src/data_loader.cpp              | 41 +++++++++++++++++++
 modules/slam/src/localizer.cpp                |  4 +-
 modules/slam/src/vo.cpp                       | 34 +++++++--------
 4 files changed, 63 insertions(+), 18 deletions(-)

diff --git a/modules/slam/include/opencv2/slam/data_loader.hpp b/modules/slam/include/opencv2/slam/data_loader.hpp
index acc7795a1f..109a83639f 100644
--- a/modules/slam/include/opencv2/slam/data_loader.hpp
+++ b/modules/slam/include/opencv2/slam/data_loader.hpp
@@ -6,6 +6,8 @@
 namespace cv{
 namespace vo{
 
+bool ensureDirectoryExists(const std::string &dir);
+
 class DataLoader {
 public:
     // 构造：传入图像目录（可以是相对或绝对路径）
diff --git a/modules/slam/src/data_loader.cpp b/modules/slam/src/data_loader.cpp
index 446c1485e5..4ad81c1750 100644
--- a/modules/slam/src/data_loader.cpp
+++ b/modules/slam/src/data_loader.cpp
@@ -16,13 +16,54 @@
 #  define HAVE_STD_FILESYSTEM 0
 #endif
 #include <sys/stat.h>
+#include <sys/types.h>
+#include <errno.h>
+#include <sys/stat.h>
 #include <iostream>
 #include <fstream>
 #include <sstream>
 
+
 namespace cv {
 namespace vo {
 
+bool ensureDirectoryExists(const std::string &dir){
+    if(dir.empty()) return false;
+#if HAVE_STD_FILESYSTEM
+    try{
+        fs::path p(dir);
+        return fs::create_directories(p) || fs::exists(p);
+    }catch(...){ return false; }
+#else
+    std::string tmp = dir;
+    if(tmp.empty()) return false;
+    while(tmp.size() > 1 && tmp.back() == '/') tmp.pop_back();
+    std::string cur;
+    if(!tmp.empty() && tmp[0] == '/') cur = "/";
+    size_t pos = 0;
+    while(pos < tmp.size()){
+        size_t next = tmp.find('/', pos);
+        std::string part = (next == std::string::npos) ? tmp.substr(pos) : tmp.substr(pos, next-pos);
+        if(!part.empty()){
+            if(cur.size() > 1 && cur.back() != '/') cur += '/';
+            cur += part;
+            if(mkdir(cur.c_str(), 0755) != 0){
+                if(errno == EEXIST){ /* ok */ }
+                else {
+                    struct stat st;
+                    if(stat(cur.c_str(), &st) == 0 && S_ISDIR(st.st_mode)){
+                        // ok
+                    } else return false;
+                }
+            }
+        }
+        if(next == std::string::npos) break;
+        pos = next + 1;
+    }
+    return true;
+#endif
+}
+
 DataLoader::DataLoader(const std::string &imageDir)
     : currentIndex(0), fx_(700.0), fy_(700.0), cx_(0.5), cy_(0.5)
 {
diff --git a/modules/slam/src/localizer.cpp b/modules/slam/src/localizer.cpp
index 40647f1751..8e7c384988 100644
--- a/modules/slam/src/localizer.cpp
+++ b/modules/slam/src/localizer.cpp
@@ -1,7 +1,7 @@
 #include "opencv2/slam/localizer.hpp"
 #include "opencv2/slam/matcher.hpp"
+#include "opencv2/slam/data_loader.hpp"
 #include <opencv2/calib3d.hpp>
-#include <filesystem>
 #include <fstream>
 #include <opencv2/imgproc.hpp>
 #include <opencv2/imgcodecs.hpp>
@@ -126,7 +126,7 @@ bool Localizer::tryPnP(const MapManager &map, const Mat &desc, const std::vector
     // Diagnostics: draw matches and inliers if requested
     if(!outDir.empty() && image){
         try{
-            std::filesystem::create_directories(outDir);
+            ensureDirectoryExists(outDir);
             Mat vis;
             if(image->channels() == 1) cvtColor(*image, vis, COLOR_GRAY2BGR);
             else vis = image->clone();
diff --git a/modules/slam/src/vo.cpp b/modules/slam/src/vo.cpp
index 7532ece628..24876f4a33 100644
--- a/modules/slam/src/vo.cpp
+++ b/modules/slam/src/vo.cpp
@@ -18,7 +18,6 @@
 #include <opencv2/imgproc.hpp>
 #include <opencv2/highgui.hpp>
 #include <opencv2/video/tracking.hpp>
-#include <filesystem>
 #include <chrono>
 #include <iomanip>
 #include <sstream>
@@ -65,20 +64,23 @@ int VisualOdometry::run(const std::string &imageDir, double scale_m, const Visua
         std::ostringstream ss; ss << std::put_time(&tm, "%Y%m%d_%H%M%S");
         runTimestamp = ss.str();
     }
-    // create a 'result' folder inside the provided imageDir (use filesystem join to be robust)
-    std::filesystem::path resultDir = std::filesystem::path(imageDir) / "result";
-    if(!std::filesystem::exists(resultDir)) std::filesystem::create_directories(resultDir);
+    // create a 'result' folder inside the provided imageDir (portable, avoids requiring <filesystem>)
+    std::string resultDirStr = imageDir;
+    if(resultDirStr.empty()) resultDirStr = std::string(".");
+    if(resultDirStr.back() == '/') resultDirStr.pop_back();
+    resultDirStr += "/result";
+    ensureDirectoryExists(resultDirStr);
     // create a per-run folder under result/ named by timestamp
-    std::filesystem::path runDir = resultDir / runTimestamp;
-    if(!std::filesystem::exists(runDir)) std::filesystem::create_directories(runDir);
-    std::filesystem::path csvPath = runDir / std::string("run.csv");
+    std::string runDirStr = resultDirStr + "/" + runTimestamp;
+    ensureDirectoryExists(runDirStr);
+    std::string csvPath = runDirStr + "/run.csv";
     std::ofstream csv(csvPath);
     if(csv){
         csv << "frame_id,mean_diff,median_flow,pre_matches,post_matches,inliers,inlier_ratio,integrated\n";
         csv.flush();
-        std::cout << "Writing diagnostics to " << csvPath.string() << std::endl;
+        std::cout << "Writing diagnostics to " << csvPath << std::endl;
     } else {
-        std::cerr << "Failed to open diagnostics CSV " << csvPath.string() << std::endl;
+        std::cerr << "Failed to open diagnostics CSV " << csvPath << std::endl;
     }
 
     Mat R_g = Mat::eye(3,3,CV_64F);
@@ -317,7 +319,7 @@ int VisualOdometry::run(const std::string &imageDir, double scale_m, const Visua
             Mat R_pnp, t_pnp; int inliers_pnp = 0;
             int preMatches_pnp = 0, postMatches_pnp = 0; double meanReproj_pnp = 0.0;
             if(localizer.tryPnP(map, desc, kps, loader.fx(), loader.fy(), loader.cx(), loader.cy(), gray.cols, gray.rows,
-                                options.min_inliers, R_pnp, t_pnp, inliers_pnp, frame_id, &frame, runDir.string(),
+                                options.min_inliers, R_pnp, t_pnp, inliers_pnp, frame_id, &frame, runDirStr,
                                 &preMatches_pnp, &postMatches_pnp, &meanReproj_pnp)){
                 solvedByPnP = true;
                 std::cout << "PnP solved: preMatches="<<preMatches_pnp<<" post="<<postMatches_pnp<<" inliers="<<inliers_pnp<<" meanReproj="<<meanReproj_pnp<<std::endl;
@@ -487,13 +489,13 @@ int VisualOdometry::run(const std::string &imageDir, double scale_m, const Visua
     // save trajectory with timestamp into result/ folder
     try{
         // save trajectory into the per-run folder using a simple filename (no timestamp)
-        std::filesystem::path outDir = resultDir / runTimestamp;
-        if(!std::filesystem::exists(outDir)) std::filesystem::create_directories(outDir);
-        std::filesystem::path outPath = outDir / std::string("trajectory.png");
-        if(vis.saveTrajectory(outPath.string())){
-            std::cout << "Saved trajectory to " << outPath.string() << std::endl;
+        std::string outDir = resultDirStr + "/" + runTimestamp;
+        ensureDirectoryExists(outDir);
+        std::string outPath = outDir + "/trajectory.png";
+        if(vis.saveTrajectory(outPath)){
+            std::cout << "Saved trajectory to " << outPath << std::endl;
         } else {
-            std::cerr << "Failed to save trajectory to " << outPath.string() << std::endl;
+            std::cerr << "Failed to save trajectory to " << outPath << std::endl;
         }
     } catch(const std::exception &e){
         std::cerr << "Error saving trajectory: " << e.what() << std::endl;

From 1760865414a7486bf53b50a5ce26061c6f3dd38d Mon Sep 17 00:00:00 2001
From: Xuanrui Zhu <634210954@qq.com>
Date: Fri, 5 Dec 2025 08:41:15 +0000
Subject: [PATCH 09/10] define cross-platform macro

---
 modules/slam/src/data_loader.cpp | 9 +++++++++
 1 file changed, 9 insertions(+)

diff --git a/modules/slam/src/data_loader.cpp b/modules/slam/src/data_loader.cpp
index 4ad81c1750..3210ebc9cf 100644
--- a/modules/slam/src/data_loader.cpp
+++ b/modules/slam/src/data_loader.cpp
@@ -19,6 +19,15 @@
 #include <sys/types.h>
 #include <errno.h>
 #include <sys/stat.h>
+#ifdef _WIN32
+#  include <direct.h>
+#  ifndef S_ISDIR
+#    define S_ISDIR(mode) (((mode) & S_IFDIR) != 0)
+#  endif
+#  ifndef mkdir
+#    define mkdir(path, mode) _mkdir(path)
+#  endif
+#endif
 #include <iostream>
 #include <fstream>
 #include <sstream>

From 1d94a0b011255c5a67de26616043599369030fc5 Mon Sep 17 00:00:00 2001
From: Xuanrui Zhu <634210954@qq.com>
Date: Fri, 5 Dec 2025 12:28:53 +0000
Subject: [PATCH 10/10] Add sfm/g2o dependency check

---
 modules/slam/CMakeLists.txt                   | 32 +++++++++++++++++++
 .../slam/include/opencv2/slam/optimizer.hpp   | 11 +++++--
 modules/slam/src/optimizer.cpp                | 15 +++++----
 modules/slam/src/vo.cpp                       |  4 +--
 4 files changed, 51 insertions(+), 11 deletions(-)

diff --git a/modules/slam/CMakeLists.txt b/modules/slam/CMakeLists.txt
index 747dcb37cf..3b86f31986 100644
--- a/modules/slam/CMakeLists.txt
+++ b/modules/slam/CMakeLists.txt
@@ -13,6 +13,38 @@ ocv_define_module(slam
 	WRAP python
 )
 
+# Detect optional dependencies and expose preprocessor macros so sources
+# can use #if defined(HAVE_SFM) / #if defined(HAVE_G2O)
+if(TARGET ${the_module})
+	# opencv_sfm is declared OPTIONAL above; if its target exists enable HAVE_SFM
+	if(TARGET opencv_sfm)
+		message(STATUS "slam: opencv_sfm target found — enabling HAVE_SFM")
+		target_compile_definitions(${the_module} PRIVATE HAVE_SFM=1)
+			# also add a global definition so header-parsers (python generator)
+			# running during build/config time can evaluate #if HAVE_SFM
+			add_definitions(-DHAVE_SFM=1)
+		target_link_libraries(${the_module} PRIVATE opencv_sfm)
+	else()
+		message(STATUS "slam: opencv_sfm not found — HAVE_SFM disabled")
+	endif()
+
+	# Try to detect g2o (header + library). This is a best-effort detection: we
+	# look for a common g2o header and try to find a library name. Users on
+	# Windows should install/build g2o and make it discoverable to CMake.
+	find_path(G2O_INCLUDE_DIR NAMES g2o/core/sparse_optimizer.h)
+	find_library(G2O_LIBRARY NAMES g2o_core g2o)
+	if(G2O_INCLUDE_DIR AND G2O_LIBRARY)
+		message(STATUS "slam: g2o found (headers and library) — enabling HAVE_G2O")
+		target_include_directories(${the_module} PRIVATE ${G2O_INCLUDE_DIR})
+		target_link_libraries(${the_module} PRIVATE ${G2O_LIBRARY})
+		target_compile_definitions(${the_module} PRIVATE HAVE_G2O=1)
+			# also expose globally so external header parsers can evaluate #if HAVE_G2O
+			add_definitions(-DHAVE_G2O=1)
+	else()
+		message(STATUS "slam: g2o not found — HAVE_G2O disabled")
+	endif()
+endif()
+
 # Ensure C++17 is enabled for this module (required for <filesystem>)
 if(TARGET ${the_module})
 	set_target_properties(${the_module} PROPERTIES CXX_STANDARD 17 CXX_STANDARD_REQUIRED ON)
diff --git a/modules/slam/include/opencv2/slam/optimizer.hpp b/modules/slam/include/opencv2/slam/optimizer.hpp
index a46263d7b1..b99b980815 100644
--- a/modules/slam/include/opencv2/slam/optimizer.hpp
+++ b/modules/slam/include/opencv2/slam/optimizer.hpp
@@ -16,7 +16,7 @@ class Optimizer {
     // Local Bundle Adjustment
     // Optimizes a window of recent keyframes and all observed map points
     // fixedKFs: indices of keyframes to keep fixed during optimization
-#ifdef USE_G2O
+#if defined(HAVE_G2O)
     static void localBundleAdjustmentG2O(
         std::vector<KeyFrame> &keyframes,
         std::vector<MapPoint> &mappoints,
@@ -25,6 +25,8 @@ class Optimizer {
         double fx, double fy, double cx, double cy,
         int iterations = 10);
 #endif
+
+#if defined(HAVE_SFM)
     static void localBundleAdjustmentSFM(
         std::vector<KeyFrame> &keyframes,
         std::vector<MapPoint> &mappoints,
@@ -32,6 +34,7 @@ class Optimizer {
         const std::vector<int> &fixedKfIndices,
         double fx, double fy, double cx, double cy,
         int iterations = 10);
+#endif
     // Pose-only optimization (optimize camera pose given fixed 3D points)
     static bool optimizePose(
         KeyFrame &kf,
@@ -40,14 +43,16 @@ class Optimizer {
         double fx, double fy, double cx, double cy,
         std::vector<bool> &inliers,
         int iterations = 10);
-    
+
+#if defined(HAVE_SFM)
     // Global Bundle Adjustment (expensive, use after loop closure)
     static void globalBundleAdjustmentSFM(
         std::vector<KeyFrame> &keyframes,
         std::vector<MapPoint> &mappoints,
         double fx, double fy, double cx, double cy,
         int iterations = 20);
-    
+#endif    
+
 private:
     // Compute reprojection error and Jacobian
     static double computeReprojectionError(
diff --git a/modules/slam/src/optimizer.cpp b/modules/slam/src/optimizer.cpp
index 51b438357d..b1e037e142 100644
--- a/modules/slam/src/optimizer.cpp
+++ b/modules/slam/src/optimizer.cpp
@@ -5,10 +5,10 @@
 #include <algorithm>
 #include <opencv2/calib3d.hpp>
 
-// If g2o is enabled (CMake defines USE_G2O), compile and use the g2o-based
+// If g2o is enabled (CMake defines HAVE_G2O), compile and use the g2o-based
 // implementation. Otherwise fall back to a simplified OpenCV-based implementation.
 
-#ifdef USE_G2O
+#if defined(HAVE_G2O)
 #include <g2o/core/sparse_optimizer.h>
 #include <g2o/core/block_solver.h>
 #include <g2o/core/optimization_algorithm_levenberg.h>
@@ -19,7 +19,7 @@
 #include <Eigen/Core>
 #include <map>
 #include <memory>
-#else
+#elif defined(HAVE_SFM)
 #include "opencv2/sfm.hpp"
 #endif
 
@@ -30,8 +30,8 @@ namespace vo {
 
 Optimizer::Optimizer() {}
 
-#ifdef USE_G2O
-void Optimizer::localBundleAdjustment(
+#if defined(HAVE_G2O)
+void Optimizer::localBundleAdjustmentG2O(
     std::vector<KeyFrame> &keyframes,
     std::vector<MapPoint> &mappoints,
     const std::vector<int> &localKfIndices,
@@ -146,6 +146,7 @@ void Optimizer::localBundleAdjustment(
     }
 }
 #endif
+#if defined(HAVE_SFM)
 void Optimizer::localBundleAdjustmentSFM(
     std::vector<KeyFrame> &keyframes,
     std::vector<MapPoint> &mappoints,
@@ -265,7 +266,7 @@ void Optimizer::localBundleAdjustmentSFM(
         }
     }
 }
-
+#endif
 
 bool Optimizer::optimizePose(
     KeyFrame &kf,
@@ -307,6 +308,7 @@ bool Optimizer::optimizePose(
     return true;
 }
 
+#if defined(HAVE_SFM)
 void Optimizer::globalBundleAdjustmentSFM(
     std::vector<KeyFrame> &keyframes,
     std::vector<MapPoint> &mappoints,
@@ -321,6 +323,7 @@ void Optimizer::globalBundleAdjustmentSFM(
     localBundleAdjustmentSFM(keyframes, mappoints, localKfIndices, fixedKfIndices, fx, fy, cx, cy, iterations);
     std::cout << "Optimizer: Global BA completed" << std::endl;
 }
+#endif
 
 double Optimizer::computeReprojectionError(
     const Point3d &point3D,
diff --git a/modules/slam/src/vo.cpp b/modules/slam/src/vo.cpp
index 24876f4a33..c1ac1e09a9 100644
--- a/modules/slam/src/vo.cpp
+++ b/modules/slam/src/vo.cpp
@@ -119,11 +119,11 @@ int VisualOdometry::run(const std::string &imageDir, double scale_m, const Visua
             for(int ii = start; ii < K; ++ii) localKfIndices.push_back(ii);
             std::vector<int> fixedKfIndices;
             if(start > 0) fixedKfIndices.push_back(0);
-
+        #if defined(HAVE_SFM)
             // Run BA on snapshot (may take time) - uses Optimizer which will use g2o if enabled
             Optimizer::localBundleAdjustmentSFM(kfs_snapshot, mps_snapshot, localKfIndices, fixedKfIndices,
                                             loader.fx(), loader.fy(), loader.cx(), loader.cy(), 10);
-
+        #endif
             // write back optimized poses/points into main map under lock using id-based lookup
             std::lock_guard<std::mutex> lk2(mapMutex);
             auto &kfs_ref = const_cast<std::vector<KeyFrame>&>(map.keyframes());