/* Copyright 2016 Fixstars Corporation Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at http ://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ #include #include #include #include #include #include #include "sample_common.h" // Camera Parameters struct CameraParameters { float fu; //!< focal length x (pixel) float fv; //!< focal length y (pixel) float u0; //!< principal point x (pixel) float v0; //!< principal point y (pixel) float baseline; //!< baseline (meter) float height; //!< height position (meter), ignored when ROAD_ESTIMATION_AUTO float tilt; //!< tilt angle (radian), ignored when ROAD_ESTIMATION_AUTO }; // Transformation between pixel coordinate and world coordinate struct CoordinateTransform { CoordinateTransform(const CameraParameters& camera) : camera(camera) { sinTilt = sinf(camera.tilt); cosTilt = cosf(camera.tilt); bf = camera.baseline * camera.fu; invfu = 1.f / camera.fu; invfv = 1.f / camera.fv; } inline cv::Point3f imageToWorld(const cv::Point2f& pt, float d) const { const float u = pt.x; const float v = pt.y; const float Zc = bf / d; const float Xc = invfu * (u - camera.u0) * Zc; const float Yc = invfv * (v - camera.v0) * Zc; const float Xw = Xc; const float Yw = Yc * cosTilt + Zc * sinTilt; const float Zw = Zc * cosTilt - Yc * sinTilt; return cv::Point3f(Xw, Yw, Zw); } CameraParameters camera; float sinTilt, cosTilt, bf, invfu, invfv; }; void reprojectPointsTo3D(const cv::Mat& disparity, const CameraParameters& camera, std::vector& points, bool subpixeled) { CV_Assert(disparity.type() == CV_32F); CoordinateTransform tf(camera); points.clear(); points.reserve(disparity.rows * disparity.cols); for (int y = 0; y < disparity.rows; y++) { for (int x = 0; x < disparity.cols; x++) { const float d = disparity.at(y, x); if (d > 0) points.push_back(tf.imageToWorld(cv::Point(x, y), d)); } } } static cv::Vec3b computeColor(float val) { const float hscale = 6.f; float h = 0.6f * (1.f - val), s = 1.f, v = 1.f; static const int sector_data[][3] = { { 1,3,0 },{ 1,0,2 },{ 3,0,1 },{ 0,2,1 },{ 0,1,3 },{ 2,1,0 } }; float tab[4]; int sector; h *= hscale; if (h < 0) do h += 6; while (h < 0); else if (h >= 6) do h -= 6; while (h >= 6); sector = cvFloor(h); h -= sector; if ((unsigned)sector >= 6u) { sector = 0; h = 0.f; } tab[0] = v; tab[1] = v * (1.f - s); tab[2] = v * (1.f - s * h); tab[3] = v * (1.f - s * (1.f - h)); const uchar b = (uchar)(255 * tab[sector_data[sector][0]]); const uchar g = (uchar)(255 * tab[sector_data[sector][1]]); const uchar r = (uchar)(255 * tab[sector_data[sector][2]]); return cv::Vec3b(b, g, r); } void drawPoints3D(const std::vector& points, cv::Mat& draw) { const int SIZE_X = 512; const int SIZE_Z = 1024; const int maxz = 20; // [meter] const double pixelsPerMeter = 1. * SIZE_Z / maxz; draw = cv::Mat::zeros(SIZE_Z, SIZE_X, CV_8UC3); const int tableSize = 256; const float scaleZ = 1.f * (tableSize - 1) / maxz; static std::vector colorTable; if (colorTable.empty()) { colorTable.resize(tableSize); for (int i = 0; i < tableSize; i++) colorTable[i] = computeColor(1.f * i / tableSize); } for (const cv::Point3f& pt : points) { const float X = pt.x; const float Z = pt.z; const int u = cvRound(pixelsPerMeter * X) + SIZE_X / 2; const int v = SIZE_Z - cvRound(pixelsPerMeter * Z); const auto& color = colorTable[cvRound(scaleZ * std::min(Z, 1.f * maxz))]; cv::circle(draw, cv::Point(u, v), 1, color); } } int main(int argc, char* argv[]) { if (argc < 4) { std::cout << "usage: " << argv[0] << " left-image-format right-image-format camera.xml [disp_size] [subpixel_enable(0: false, 1:true)]" << std::endl; std::exit(EXIT_FAILURE); } const int start_number = 1; cv::Mat I1 = cv::imread(cv::format(argv[1], start_number), cv::IMREAD_UNCHANGED); cv::Mat I2 = cv::imread(cv::format(argv[2], start_number), cv::IMREAD_UNCHANGED); const cv::FileStorage fs(argv[3], cv::FileStorage::READ); const int disp_size = argc >= 5 ? std::stoi(argv[4]) : 128; const bool subpixel = argc >= 6 ? std::stoi(argv[5]) != 0 : true; ASSERT_MSG(!I1.empty() && !I2.empty(), "imread failed."); ASSERT_MSG(fs.isOpened(), "camera.xml read failed."); ASSERT_MSG(I1.size() == I2.size() && I1.type() == I2.type(), "input images must be same size and type."); ASSERT_MSG(I1.type() == CV_8U || I1.type() == CV_16U, "input image format must be CV_8U or CV_16U."); ASSERT_MSG(disp_size == 64 || disp_size == 128 || disp_size == 256, "disparity size must be 64, 128 or 256."); // read camera parameters CameraParameters camera; camera.fu = fs["FocalLengthX"]; camera.fv = fs["FocalLengthY"]; camera.u0 = fs["CenterX"]; camera.v0 = fs["CenterY"]; camera.baseline = fs["BaseLine"]; camera.tilt = fs["Tilt"]; const int width = I1.cols; const int height = I1.rows; const int src_depth = I1.type() == CV_8U ? 8 : 16; const int dst_depth = 16; const int src_bytes = src_depth * width * height / 8; const int dst_bytes = dst_depth * width * height / 8; const sgm::StereoSGM::Parameters param(10, 120, 0.95f, subpixel); sgm::StereoSGM sgm(width, height, disp_size, src_depth, dst_depth, sgm::EXECUTE_INOUT_CUDA2CUDA, param); device_buffer d_I1(src_bytes), d_I2(src_bytes), d_disparity(dst_bytes); cv::Mat disparity(height, width, dst_depth == 8 ? CV_8S : CV_16S), disparity_color, disparity_32f, draw; std::vector points; const int invalid_disp = sgm.get_invalid_disparity(); const int disp_scale = subpixel ? sgm::StereoSGM::SUBPIXEL_SCALE : 1; for (int frame_no = start_number;; frame_no++) { I1 = cv::imread(cv::format(argv[1], frame_no), cv::IMREAD_UNCHANGED); I2 = cv::imread(cv::format(argv[2], frame_no), cv::IMREAD_UNCHANGED); if (I1.empty() || I2.empty()) { frame_no = start_number - 1; continue; } d_I1.upload(I1.data); d_I2.upload(I2.data); const auto t1 = std::chrono::system_clock::now(); sgm.execute(d_I1.data, d_I2.data, d_disparity.data); cudaDeviceSynchronize(); const auto t2 = std::chrono::system_clock::now(); const auto duration = std::chrono::duration_cast(t2 - t1).count(); const double fps = 1e6 / duration; d_disparity.download(disparity.data); // reproject points disparity.convertTo(disparity_32f, CV_32F, 1. / disp_scale); reprojectPointsTo3D(disparity_32f, camera, points, subpixel); // draw results if (I1.type() != CV_8U) cv::normalize(I1, I1, 0, 255, cv::NORM_MINMAX, CV_8U); colorize_disparity(disparity, disparity_color, disp_scale * disp_size, disparity == invalid_disp); cv::putText(disparity_color, cv::format("sgm execution time: %4.1f[msec] %4.1f[FPS]", 1e-3 * duration, fps), cv::Point(50, 50), 2, 0.75, cv::Scalar(255, 255, 255)); drawPoints3D(points, draw); cv::imshow("left image", I1); cv::imshow("disparity", disparity_color); cv::imshow("points", draw); const char c = cv::waitKey(1); if (c == 27) // ESC break; } return 0; }