mirror of https://github.com/opencv/opencv.git
Open Source Computer Vision Library
https://opencv.org/
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
568 lines
18 KiB
568 lines
18 KiB
#include <opencv2/core/core.hpp> |
|
#include <opencv2/imgproc/imgproc.hpp> |
|
#include <opencv2/calib3d/calib3d.hpp> |
|
#include <opencv2/highgui/highgui.hpp> |
|
|
|
#include <ctype.h> |
|
#include <stdio.h> |
|
#include <stdlib.h> |
|
|
|
using namespace cv; |
|
|
|
struct MouseEvent |
|
{ |
|
MouseEvent() { event = -1; buttonState = 0; } |
|
Point pt; |
|
int event; |
|
int buttonState; |
|
}; |
|
|
|
static void onMouse(int event, int x, int y, int flags, void* userdata) |
|
{ |
|
MouseEvent* data = (MouseEvent*)userdata; |
|
data->event = event; |
|
data->pt = Point(x,y); |
|
data->buttonState = flags; |
|
} |
|
|
|
static bool readCameraMatrix(const string& filename, |
|
Mat& cameraMatrix, Mat& distCoeffs, |
|
Size& calibratedImageSize ) |
|
{ |
|
FileStorage fs(filename, FileStorage::READ); |
|
fs["image_width"] >> calibratedImageSize.width; |
|
fs["image_height"] >> calibratedImageSize.height; |
|
fs["distortion_coefficients"] >> distCoeffs; |
|
fs["camera_matrix"] >> cameraMatrix; |
|
|
|
if( distCoeffs.type() != CV_64F ) |
|
distCoeffs = Mat_<double>(distCoeffs); |
|
if( cameraMatrix.type() != CV_64F ) |
|
cameraMatrix = Mat_<double>(cameraMatrix); |
|
|
|
return true; |
|
} |
|
|
|
static void calcChessboardCorners(Size boardSize, float squareSize, vector<Point3f>& corners) |
|
{ |
|
corners.resize(0); |
|
|
|
for( int i = 0; i < boardSize.height; i++ ) |
|
for( int j = 0; j < boardSize.width; j++ ) |
|
corners.push_back(Point3f(float(j*squareSize), |
|
float(i*squareSize), 0)); |
|
} |
|
|
|
|
|
static Point3f image2plane(Point2f imgpt, const Mat& R, const Mat& tvec, |
|
const Mat& cameraMatrix, double Z) |
|
{ |
|
Mat R1 = R.clone(); |
|
R1.col(2) = R1.col(2)*Z + tvec; |
|
Mat_<double> v = (cameraMatrix*R1).inv()*(Mat_<double>(3,1) << imgpt.x, imgpt.y, 1); |
|
double iw = fabs(v(2,0)) > DBL_EPSILON ? 1./v(2,0) : 0; |
|
return Point3f(v(0,0)*iw, v(1,0)*iw, Z); |
|
} |
|
|
|
|
|
static Rect extract3DBox(const Mat& frame, Mat& shownFrame, Mat& selectedObjFrame, |
|
const Mat& cameraMatrix, const Mat& rvec, const Mat& tvec, |
|
const vector<Point3f>& box, int nobjpt, bool runExtraSegmentation) |
|
{ |
|
selectedObjFrame = Mat::zeros(frame.size(), frame.type()); |
|
if( nobjpt == 0 ) |
|
return Rect(); |
|
vector<Point3f> objpt; |
|
vector<Point2f> imgpt; |
|
|
|
objpt.push_back(box[0]); |
|
if( nobjpt > 1 ) |
|
objpt.push_back(box[1]); |
|
if( nobjpt > 2 ) |
|
{ |
|
objpt.push_back(box[2]); |
|
objpt.push_back(objpt[2] - objpt[1] + objpt[0]); |
|
} |
|
if( nobjpt > 3 ) |
|
for( int i = 0; i < 4; i++ ) |
|
objpt.push_back(Point3f(objpt[i].x, objpt[i].y, box[3].z)); |
|
|
|
projectPoints(Mat(objpt), rvec, tvec, cameraMatrix, Mat(), imgpt); |
|
|
|
if( shownFrame.data ) |
|
{ |
|
if( nobjpt == 1 ) |
|
circle(shownFrame, imgpt[0], 3, Scalar(0,255,0), -1, CV_AA); |
|
else if( nobjpt == 2 ) |
|
{ |
|
circle(shownFrame, imgpt[0], 3, Scalar(0,255,0), -1, CV_AA); |
|
circle(shownFrame, imgpt[1], 3, Scalar(0,255,0), -1, CV_AA); |
|
line(shownFrame, imgpt[0], imgpt[1], Scalar(0,255,0), 3, CV_AA); |
|
} |
|
else if( nobjpt == 3 ) |
|
for( int i = 0; i < 4; i++ ) |
|
{ |
|
circle(shownFrame, imgpt[i], 3, Scalar(0,255,0), -1, CV_AA); |
|
line(shownFrame, imgpt[i], imgpt[(i+1)%4], Scalar(0,255,0), 3, CV_AA); |
|
} |
|
else |
|
for( int i = 0; i < 8; i++ ) |
|
{ |
|
circle(shownFrame, imgpt[i], 3, Scalar(0,255,0), -1, CV_AA); |
|
line(shownFrame, imgpt[i], imgpt[(i+1)%4 + (i/4)*4], Scalar(0,255,0), 3, CV_AA); |
|
line(shownFrame, imgpt[i], imgpt[i%4], Scalar(0,255,0), 3, CV_AA); |
|
} |
|
} |
|
|
|
if( nobjpt <= 2 ) |
|
return Rect(); |
|
vector<Point> hull; |
|
convexHull(Mat_<Point>(Mat(imgpt)), hull); |
|
Mat selectedObjMask = Mat::zeros(frame.size(), CV_8U); |
|
fillConvexPoly(selectedObjMask, &hull[0], hull.size(), Scalar::all(255), 8, 0); |
|
Rect roi = boundingRect(Mat(hull)) & Rect(Point(), frame.size()); |
|
|
|
if( runExtraSegmentation ) |
|
{ |
|
selectedObjMask = Scalar::all(GC_BGD); |
|
fillConvexPoly(selectedObjMask, &hull[0], hull.size(), Scalar::all(GC_PR_FGD), 8, 0); |
|
Mat bgdModel, fgdModel; |
|
grabCut(frame, selectedObjMask, roi, bgdModel, fgdModel, |
|
3, GC_INIT_WITH_RECT + GC_INIT_WITH_MASK); |
|
bitwise_and(selectedObjMask, Scalar::all(1), selectedObjMask); |
|
} |
|
|
|
frame.copyTo(selectedObjFrame, selectedObjMask); |
|
return roi; |
|
} |
|
|
|
|
|
static int select3DBox(const string& windowname, const string& selWinName, const Mat& frame, |
|
const Mat& cameraMatrix, const Mat& rvec, const Mat& tvec, |
|
vector<Point3f>& box) |
|
{ |
|
const float eps = 1e-3f; |
|
MouseEvent mouse; |
|
|
|
setMouseCallback(windowname, onMouse, &mouse); |
|
vector<Point3f> tempobj(8); |
|
vector<Point2f> imgpt(4), tempimg(8); |
|
vector<Point> temphull; |
|
int nobjpt = 0; |
|
Mat R, selectedObjMask, selectedObjFrame, shownFrame; |
|
Rodrigues(rvec, R); |
|
box.resize(4); |
|
|
|
for(;;) |
|
{ |
|
float Z = 0.f; |
|
bool dragging = (mouse.buttonState & CV_EVENT_FLAG_LBUTTON) != 0; |
|
int npt = nobjpt; |
|
|
|
if( (mouse.event == CV_EVENT_LBUTTONDOWN || |
|
mouse.event == CV_EVENT_LBUTTONUP || |
|
dragging) && nobjpt < 4 ) |
|
{ |
|
Point2f m = mouse.pt; |
|
|
|
if( nobjpt < 2 ) |
|
imgpt[npt] = m; |
|
else |
|
{ |
|
tempobj.resize(1); |
|
int nearestIdx = npt-1; |
|
if( nobjpt == 3 ) |
|
{ |
|
nearestIdx = 0; |
|
for( int i = 1; i < npt; i++ ) |
|
if( norm(m - imgpt[i]) < norm(m - imgpt[nearestIdx]) ) |
|
nearestIdx = i; |
|
} |
|
|
|
if( npt == 2 ) |
|
{ |
|
float dx = box[1].x - box[0].x, dy = box[1].y - box[0].y; |
|
float len = 1.f/std::sqrt(dx*dx+dy*dy); |
|
tempobj[0] = Point3f(dy*len + box[nearestIdx].x, |
|
-dx*len + box[nearestIdx].y, 0.f); |
|
} |
|
else |
|
tempobj[0] = Point3f(box[nearestIdx].x, box[nearestIdx].y, 1.f); |
|
|
|
projectPoints(Mat(tempobj), rvec, tvec, cameraMatrix, Mat(), tempimg); |
|
|
|
Point2f a = imgpt[nearestIdx], b = tempimg[0], d1 = b - a, d2 = m - a; |
|
float n1 = norm(d1), n2 = norm(d2); |
|
if( n1*n2 < eps ) |
|
imgpt[npt] = a; |
|
else |
|
{ |
|
Z = d1.dot(d2)/(n1*n1); |
|
imgpt[npt] = d1*Z + a; |
|
} |
|
} |
|
box[npt] = image2plane(imgpt[npt], R, tvec, cameraMatrix, npt<3 ? 0 : Z); |
|
|
|
if( (npt == 0 && mouse.event == CV_EVENT_LBUTTONDOWN) || |
|
(npt > 0 && norm(box[npt] - box[npt-1]) > eps && |
|
mouse.event == CV_EVENT_LBUTTONUP) ) |
|
{ |
|
nobjpt++; |
|
if( nobjpt < 4 ) |
|
{ |
|
imgpt[nobjpt] = imgpt[nobjpt-1]; |
|
box[nobjpt] = box[nobjpt-1]; |
|
} |
|
} |
|
|
|
// reset the event |
|
mouse.event = -1; |
|
//mouse.buttonState = 0; |
|
npt++; |
|
} |
|
|
|
frame.copyTo(shownFrame); |
|
extract3DBox(frame, shownFrame, selectedObjFrame, |
|
cameraMatrix, rvec, tvec, box, npt, false); |
|
imshow(windowname, shownFrame); |
|
imshow(selWinName, selectedObjFrame); |
|
|
|
int c = waitKey(30); |
|
if( (c & 255) == 27 ) |
|
{ |
|
nobjpt = 0; |
|
} |
|
if( c == 'q' || c == 'Q' || c == ' ' ) |
|
{ |
|
box.clear(); |
|
return c == ' ' ? -1 : -100; |
|
} |
|
if( (c == '\r' || c == '\n') && nobjpt == 4 && box[3].z != 0 ) |
|
return 1; |
|
} |
|
} |
|
|
|
|
|
static bool readModelViews( const string& filename, vector<Point3f>& box, |
|
vector<string>& imagelist, |
|
vector<Rect>& roiList, vector<Vec6f>& poseList ) |
|
{ |
|
imagelist.resize(0); |
|
roiList.resize(0); |
|
poseList.resize(0); |
|
box.resize(0); |
|
|
|
FileStorage fs(filename, FileStorage::READ); |
|
if( !fs.isOpened() ) |
|
return false; |
|
fs["box"] >> box; |
|
|
|
FileNode all = fs["views"]; |
|
if( all.type() != FileNode::SEQ ) |
|
return false; |
|
FileNodeIterator it = all.begin(), it_end = all.end(); |
|
|
|
for(; it != it_end; ++it) |
|
{ |
|
FileNode n = *it; |
|
imagelist.push_back((string)n["image"]); |
|
FileNode nr = n["rect"]; |
|
roiList.push_back(Rect((int)nr[0], (int)nr[1], (int)nr[2], (int)nr[3])); |
|
FileNode np = n["pose"]; |
|
poseList.push_back(Vec6f((float)np[0], (float)np[1], (float)np[2], |
|
(float)np[3], (float)np[4], (float)np[5])); |
|
} |
|
|
|
return true; |
|
} |
|
|
|
|
|
static bool writeModelViews(const string& filename, const vector<Point3f>& box, |
|
const vector<string>& imagelist, |
|
const vector<Rect>& roiList, |
|
const vector<Vec6f>& poseList) |
|
{ |
|
FileStorage fs(filename, FileStorage::WRITE); |
|
if( !fs.isOpened() ) |
|
return false; |
|
|
|
fs << "box" << "[:"; |
|
fs << box << "]" << "views" << "["; |
|
|
|
size_t i, nviews = imagelist.size(); |
|
|
|
CV_Assert( nviews == roiList.size() && nviews == poseList.size() ); |
|
|
|
for( i = 0; i < nviews; i++ ) |
|
{ |
|
Rect r = roiList[i]; |
|
Vec6f p = poseList[i]; |
|
|
|
fs << "{" << "image" << imagelist[i] << |
|
"roi" << "[:" << r.x << r.y << r.width << r.height << "]" << |
|
"pose" << "[:" << p[0] << p[1] << p[2] << p[3] << p[4] << p[5] << "]" << "}"; |
|
} |
|
fs << "]"; |
|
|
|
return true; |
|
} |
|
|
|
|
|
static bool readStringList( const string& filename, vector<string>& l ) |
|
{ |
|
l.resize(0); |
|
FileStorage fs(filename, FileStorage::READ); |
|
if( !fs.isOpened() ) |
|
return false; |
|
FileNode n = fs.getFirstTopLevelNode(); |
|
if( n.type() != FileNode::SEQ ) |
|
return false; |
|
FileNodeIterator it = n.begin(), it_end = n.end(); |
|
for( ; it != it_end; ++it ) |
|
l.push_back((string)*it); |
|
return true; |
|
} |
|
|
|
|
|
int main(int argc, char** argv) |
|
{ |
|
const char* help = "Usage: select3dobj -w <board_width -h <board_height> [-s <square_size>]\n" |
|
"\t-i <intrinsics_filename> -o <output_prefix> [video_filename/cameraId]\n"; |
|
const char* screen_help = |
|
"Actions: \n" |
|
"\tSelect object as 3D box with the mouse. That's it\n" |
|
"\tESC - Reset the selection\n" |
|
"\tSPACE - Skip the frame; move to the next frame (not in video mode)\n" |
|
"\tENTER - Confirm the selection. Grab next object in video mode.\n" |
|
"\tq - Exit the program\n"; |
|
|
|
if(argc < 5) |
|
{ |
|
puts(help); |
|
return 0; |
|
} |
|
const char* intrinsicsFilename = 0; |
|
const char* outprefix = 0; |
|
const char* inputName = 0; |
|
int cameraId = 0; |
|
Size boardSize; |
|
double squareSize = 1; |
|
vector<string> imageList; |
|
|
|
for( int i = 1; i < argc; i++ ) |
|
{ |
|
if( strcmp(argv[i], "-i") == 0 ) |
|
intrinsicsFilename = argv[++i]; |
|
else if( strcmp(argv[i], "-o") == 0 ) |
|
outprefix = argv[++i]; |
|
else if( strcmp(argv[i], "-w") == 0 ) |
|
{ |
|
if(sscanf(argv[++i], "%d", &boardSize.width) != 1 || boardSize.width <= 0) |
|
{ |
|
printf("Incorrect -w parameter (must be a positive integer)\n"); |
|
puts(help); |
|
return 0; |
|
} |
|
} |
|
else if( strcmp(argv[i], "-h") == 0 ) |
|
{ |
|
if(sscanf(argv[++i], "%d", &boardSize.height) != 1 || boardSize.height <= 0) |
|
{ |
|
printf("Incorrect -h parameter (must be a positive integer)\n"); |
|
puts(help); |
|
return 0; |
|
} |
|
} |
|
else if( strcmp(argv[i], "-s") == 0 ) |
|
{ |
|
if(sscanf(argv[++i], "%lf", &squareSize) != 1 || squareSize <= 0) |
|
{ |
|
printf("Incorrect -w parameter (must be a positive real number)\n"); |
|
puts(help); |
|
return 0; |
|
} |
|
} |
|
else if( argv[i][0] != '-' ) |
|
{ |
|
if( isdigit(argv[i][0])) |
|
sscanf(argv[i], "%d", &cameraId); |
|
else |
|
inputName = argv[i]; |
|
} |
|
else |
|
{ |
|
printf("Incorrect option\n"); |
|
puts(help); |
|
return 0; |
|
} |
|
} |
|
|
|
if( !intrinsicsFilename || !outprefix || |
|
boardSize.width <= 0 || boardSize.height <= 0 ) |
|
{ |
|
printf("Some of the required parameters are missing\n"); |
|
puts(help); |
|
return 0; |
|
} |
|
|
|
Mat cameraMatrix, distCoeffs; |
|
Size calibratedImageSize; |
|
readCameraMatrix(intrinsicsFilename, cameraMatrix, distCoeffs, calibratedImageSize ); |
|
|
|
VideoCapture capture; |
|
if( inputName ) |
|
{ |
|
if( !readStringList(inputName, imageList) && |
|
!capture.open(inputName)) |
|
{ |
|
fprintf( stderr, "The input file could not be opened\n" ); |
|
return -1; |
|
} |
|
} |
|
else |
|
capture.open(cameraId); |
|
|
|
if( !capture.isOpened() && imageList.empty() ) |
|
return fprintf( stderr, "Could not initialize video capture\n" ), -2; |
|
|
|
const char* outbarename = 0; |
|
{ |
|
outbarename = strrchr(outprefix, '/'); |
|
const char* tmp = strrchr(outprefix, '\\'); |
|
char cmd[1000]; |
|
sprintf(cmd, "mkdir %s", outprefix); |
|
if( tmp && tmp > outbarename ) |
|
outbarename = tmp; |
|
if( outbarename ) |
|
{ |
|
cmd[6 + outbarename - outprefix] = '\0'; |
|
system(cmd); |
|
outbarename++; |
|
} |
|
else |
|
outbarename = outprefix; |
|
} |
|
|
|
Mat frame, shownFrame, selectedObjFrame, mapxy; |
|
|
|
namedWindow("View", 1); |
|
namedWindow("Selected Object", 1); |
|
setMouseCallback("View", onMouse, 0); |
|
bool boardFound = false; |
|
|
|
string indexFilename = format("%s_index.yml", outprefix); |
|
|
|
vector<string> capturedImgList; |
|
vector<Rect> roiList; |
|
vector<Vec6f> poseList; |
|
vector<Point3f> box, boardPoints; |
|
|
|
readModelViews(indexFilename, box, capturedImgList, roiList, poseList); |
|
calcChessboardCorners(boardSize, squareSize, boardPoints); |
|
int frameIdx = 0; |
|
bool grabNext = !imageList.empty(); |
|
|
|
puts(screen_help); |
|
|
|
for(int i = 0;;i++) |
|
{ |
|
Mat frame0; |
|
if( !imageList.empty() ) |
|
{ |
|
if( i < (int)imageList.size() ) |
|
frame0 = imread(string(imageList[i]), 1); |
|
} |
|
else |
|
capture >> frame0; |
|
if( !frame0.data ) |
|
break; |
|
if( !frame.data ) |
|
{ |
|
if( frame0.size() != calibratedImageSize ) |
|
{ |
|
double sx = (double)frame0.cols/calibratedImageSize.width; |
|
double sy = (double)frame0.rows/calibratedImageSize.height; |
|
|
|
// adjust the camera matrix for the new resolution |
|
cameraMatrix.at<double>(0,0) *= sx; |
|
cameraMatrix.at<double>(0,2) *= sx; |
|
cameraMatrix.at<double>(1,1) *= sy; |
|
cameraMatrix.at<double>(1,2) *= sy; |
|
} |
|
Mat dummy; |
|
initUndistortRectifyMap(cameraMatrix, distCoeffs, Mat(), |
|
cameraMatrix, frame0.size(), |
|
CV_32FC2, mapxy, dummy ); |
|
distCoeffs = Mat::zeros(5, 1, CV_64F); |
|
} |
|
remap(frame0, frame, mapxy, Mat(), INTER_LINEAR); |
|
vector<Point2f> foundBoardCorners; |
|
boardFound = findChessboardCorners(frame, boardSize, foundBoardCorners); |
|
|
|
Mat rvec, tvec; |
|
if( boardFound ) |
|
solvePnP(Mat(boardPoints), Mat(foundBoardCorners), cameraMatrix, |
|
distCoeffs, rvec, tvec, false); |
|
|
|
frame.copyTo(shownFrame); |
|
drawChessboardCorners(shownFrame, boardSize, Mat(foundBoardCorners), boardFound); |
|
selectedObjFrame = Mat::zeros(frame.size(), frame.type()); |
|
|
|
if( boardFound && grabNext ) |
|
{ |
|
if( box.empty() ) |
|
{ |
|
int code = select3DBox("View", "Selected Object", frame, |
|
cameraMatrix, rvec, tvec, box); |
|
if( code == -100 ) |
|
break; |
|
} |
|
|
|
if( !box.empty() ) |
|
{ |
|
Rect r = extract3DBox(frame, shownFrame, selectedObjFrame, |
|
cameraMatrix, rvec, tvec, box, 4, true); |
|
if( r.area() ) |
|
{ |
|
const int maxFrameIdx = 10000; |
|
char path[1000]; |
|
for(;frameIdx < maxFrameIdx;frameIdx++) |
|
{ |
|
sprintf(path, "%s%04d.jpg", outprefix, frameIdx); |
|
FILE* f = fopen(path, "rb"); |
|
if( !f ) |
|
break; |
|
fclose(f); |
|
} |
|
if( frameIdx == maxFrameIdx ) |
|
{ |
|
printf("Can not save the image as %s<...>.jpg", outprefix); |
|
break; |
|
} |
|
imwrite(path, selectedObjFrame(r)); |
|
|
|
capturedImgList.push_back(string(path)); |
|
roiList.push_back(r); |
|
|
|
float p[6]; |
|
Mat RV(3, 1, CV_32F, p), TV(3, 1, CV_32F, p+3); |
|
rvec.convertTo(RV, RV.type()); |
|
tvec.convertTo(TV, TV.type()); |
|
poseList.push_back(Vec6f(p[0], p[1], p[2], p[3], p[4], p[5])); |
|
} |
|
} |
|
grabNext = !imageList.empty(); |
|
} |
|
|
|
imshow("View", shownFrame); |
|
imshow("Selected Object", selectedObjFrame); |
|
int c = waitKey(imageList.empty() && !box.empty() ? 30 : 300); |
|
if( c == 'q' || c == 'Q' ) |
|
break; |
|
if( c == '\r' || c == '\n' ) |
|
grabNext = true; |
|
} |
|
|
|
writeModelViews(indexFilename, box, capturedImgList, roiList, poseList); |
|
return 0; |
|
}
|
|
|