OpenXR VR rendering cameras into eyes - lensing effect

Starcommander* and I have been trying to get OpenXR-based virtual reality to work in JMonkey (credit where credit’s due: Starcommander did most of the initial work getting it running; I’ve been tinkering around the edges and adding hand-related stuff like actions and hand skeletons). It mostly works, but with some odd lensing effects: objects in the corner of your eye move so they no longer seem to be where they are supposed to be. My suspicion is that it’s down to the way the eyes are being rendered, but I don’t really know.

The render loop looks like this:

private boolean renderLayerOpenXR(MemoryStack stack, long predictedDisplayTime, XrCompositionLayerProjection layer) {
    XrViewState viewState = XrViewState.calloc(stack)
        .type$Default();

    IntBuffer pi = stack.mallocInt(1);
    check(xrLocateViews(
        xrSession,
        XrViewLocateInfo.malloc(stack)
            .type$Default()
            .next(NULL)
            .viewConfigurationType(viewConfigType)
            .displayTime(predictedDisplayTime)
            .space(xrAppSpace),
        viewState,
        pi,
        views
    ));

    if ((viewState.viewStateFlags() & XR_VIEW_STATE_POSITION_VALID_BIT) == 0 ||
        (viewState.viewStateFlags() & XR_VIEW_STATE_ORIENTATION_VALID_BIT) == 0) {
        return false;  // There are no valid tracking poses for the views.
    }

    int viewCountOutput = pi.get(0);
    assert (viewCountOutput == views.capacity());
    assert (viewCountOutput == viewConfigs.capacity());
    assert (viewCountOutput == swapchains.length);

    XrCompositionLayerProjectionView.Buffer projectionLayerViews = XRHelper.fill(
        XrCompositionLayerProjectionView.calloc(viewCountOutput, stack),
        XrCompositionLayerProjectionView.TYPE,
        XR_TYPE_COMPOSITION_LAYER_PROJECTION_VIEW
    );

    // Render view to the appropriate part of the swapchain image.
    for (int viewIndex = 0; viewIndex < viewCountOutput; viewIndex++) {
        // Each view has a separate swapchain which is acquired, rendered to, and released.
        Swapchain viewSwapchain = swapchains[viewIndex];

        check(xrAcquireSwapchainImage(
            viewSwapchain.handle,
            XrSwapchainImageAcquireInfo.calloc(stack)
                .type$Default(),
            pi
        ));
        int swapchainImageIndex = pi.get(0);

        check(xrWaitSwapchainImage(
            viewSwapchain.handle,
            XrSwapchainImageWaitInfo.malloc(stack)
                .type$Default()
                .next(NULL)
                .timeout(XR_INFINITE_DURATION)
        ));

        XrCompositionLayerProjectionView projectionLayerView = projectionLayerViews.get(viewIndex)
            .pose(views.get(viewIndex).pose())
            .fov(views.get(viewIndex).fov())
            .subImage(si -> si
                .swapchain(viewSwapchain.handle)
                .imageRect(rect -> rect
                    .offset(offset -> offset
                        .x(0)
                        .y(0))
                    .extent(extent -> extent
                        .width(viewSwapchain.width)
                        .height(viewSwapchain.height)
                    )));

        openGLRenderView(projectionLayerView, viewSwapchain.images.get(swapchainImageIndex), viewIndex);

        check(xrReleaseSwapchainImage(
            viewSwapchain.handle,
            XrSwapchainImageReleaseInfo.calloc(stack)
                .type$Default()
        ));
    }

    layer.space(xrAppSpace);
    layer.views(projectionLayerViews);
    checkForGLErrors();
    return true;
}
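
For context, this method is driven by the standard OpenXR frame loop. A minimal sketch of the calling code, paraphrased from LWJGL’s HelloOpenXR sample rather than copied from our branch, so details may differ:

// Sketch of the surrounding frame loop (paraphrased from LWJGL's HelloOpenXR
// sample, not from our branch): wait for the frame, begin it, render the
// projection layer, then submit it with xrEndFrame.
try (MemoryStack stack = stackPush()) {
    XrFrameState frameState = XrFrameState.calloc(stack).type$Default();
    check(xrWaitFrame(xrSession, XrFrameWaitInfo.calloc(stack).type$Default(), frameState));
    check(xrBeginFrame(xrSession, XrFrameBeginInfo.calloc(stack).type$Default()));

    XrCompositionLayerProjection layer = XrCompositionLayerProjection.calloc(stack).type$Default();
    PointerBuffer layers = stack.callocPointer(1);
    if (frameState.shouldRender() && renderLayerOpenXR(stack, frameState.predictedDisplayTime(), layer)) {
        layers.put(layer);
    }
    layers.flip();

    check(xrEndFrame(xrSession, XrFrameEndInfo.calloc(stack)
        .type$Default()
        .displayTime(frameState.predictedDisplayTime())
        .environmentBlendMode(XR_ENVIRONMENT_BLEND_MODE_OPAQUE)
        .layerCount(layers.remaining())
        .layers(layers)));
}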

private static Vector3f viewPos = new Vector3f();
private static Quaternion viewRot = new Quaternion();

private void openGLRenderView(XrCompositionLayerProjectionView layerView, XrSwapchainImageOpenGLKHR swapchainImage, int viewIndex) {
    glBindFramebuffer(GL_FRAMEBUFFER, swapchainFramebuffer);

    glFramebufferTexture2D(GL_FRAMEBUFFER, GL_COLOR_ATTACHMENT0, GL_TEXTURE_2D, swapchainImage.image(), 0);
    glFramebufferTexture2D(GL_FRAMEBUFFER, GL_DEPTH_ATTACHMENT, GL_TEXTURE_2D, depthTextures.get(swapchainImage), 0);

    XrRect2Di imageRect = layerView.subImage().imageRect();
    glViewport(
        imageRect.offset().x(),
        imageRect.offset().y(),
        imageRect.extent().width(),
        imageRect.extent().height()
    );
    glClear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT | GL_STENCIL_BUFFER_BIT);

    glFrontFace(GL_CW);
    glCullFace(GL_BACK);
    glEnable(GL_DEPTH_TEST);

    XrPosef       pose        = layerView.pose();
    XrVector3f    pos         = pose.position$();
    XrQuaternionf orientation = pose.orientation();

    // I don't like these coordinate transformations; they were necessary, but why?
    viewPos.set(pos.x(), pos.y(), -pos.z());
    viewRot.set(orientation.x(), orientation.y(), -orientation.z(), orientation.w());
    viewRot.inverseLocal();

    Eye eye = viewIndex == 0 ? xrHmd.getLeftEye() : xrHmd.getRightEye();

    eye.setRotation(viewRot);
    eye.setPosition(viewPos);

    float fovY = -layerView.fov().angleLeft() + layerView.fov().angleRight();
    float fovX = -layerView.fov().angleDown() + layerView.fov().angleUp();

    eye.setFieldOfView(fovX, fovY);
    eye.render();

    glBindFramebuffer(GL_FRAMEBUFFER, 0);

    if (viewIndex == swapchains.length - 1) {
        glFlush();
    }
    checkForGLErrors();
}
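
As a sanity check on those coordinate transformations (my own reasoning, so treat it as an assumption rather than something from the spec): negating z and then inverting a unit quaternion, i.e. (x, y, -z, w) conjugated to (-x, -y, z, w), is exactly the original rotation mirrored across the XY plane, which matches the pos.z negation. So the two lines are at least internally consistent, even if it’s unclear why the mirror is needed:

import com.jme3.math.Quaternion;
import com.jme3.math.Vector3f;

// Demonstrates that new Quaternion(x, y, -z, w).inverseLocal() equals the
// XY-plane mirror (-x, -y, z, w) for any unit quaternion.
public class MirrorCheck {
    public static void main(String[] args) {
        Quaternion q = new Quaternion().fromAngleAxis(0.7f, new Vector3f(1, 2, 3).normalizeLocal());

        Quaternion asInOurCode = new Quaternion(q.getX(), q.getY(), -q.getZ(), q.getW()).inverseLocal();
        Quaternion mirrored = new Quaternion(-q.getX(), -q.getY(), q.getZ(), q.getW());

        System.out.println(asInOurCode); // both print the same values
        System.out.println(mirrored);
    }
}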

With the supporting Eye class like this:

public class Eye {
    static int index = 0;
    private final SimpleApplication app;
    private Texture2D offTex;
    private final Geometry offGeo;

    private Camera offCamera;

    float fovX = -1;
    float fovY = -1;

    public Eye(SimpleApplication app){
        this.app = app;
        setupOffscreenView(app);
        Material mat = new Material(app.getAssetManager(), "Common/MatDefs/Misc/Unshaded.j3md");
        mat.setTexture("ColorMap", offTex);

        offGeo = new Geometry("box", new Box(1, 1, 1));
        offGeo.setMaterial(mat);
    }

    public void setPosition(Vector3f newPosition){
        offCamera.setLocation(newPosition);
    }

    public void setRotation(Quaternion newRotation){
        offCamera.setRotation(newRotation);
    }

    /**
     * Sets the field of view for the eye. Angles in radians.
     */
    public void setFieldOfView(float fovX, float fovY){
        if (this.fovX != fovX || this.fovY != fovY){
            this.fovX = fovX;
            this.fovY = fovY;
            offCamera.setFrustumPerspective(FastMath.RAD_TO_DEG * fovY, fovX / fovY, 0.1f, 1000f);
        }
    }

    private void setupOffscreenView(SimpleApplication app){
        int w = app.getContext().getSettings().getWidth();
        int h = app.getContext().getSettings().getHeight();
        offCamera = new Camera(w, h);

        ViewPort offView = app.getRenderManager().createPreView("OffscreenViewX" + (index++), offCamera);
        offView.setClearFlags(true, true, true);
        offView.setBackgroundColor(ColorRGBA.DarkGray);
        FrameBuffer offBuffer = new FrameBuffer(w, h, 1);

        //setup framebuffer's texture
        offTex = new Texture2D(w, h, Format.RGBA8);
        offTex.setMinFilter(Texture.MinFilter.Trilinear);
        offTex.setMagFilter(Texture.MagFilter.Bilinear);

        //setup framebuffer to use texture
        offBuffer.setDepthTarget(FrameBufferTarget.newTarget(Format.Depth));
        offBuffer.addColorTarget(FrameBufferTarget.newTarget(offTex));

        //set viewport to render to offscreen framebuffer
        offView.setOutputFrameBuffer(offBuffer);
        offView.attachScene(app.getRootNode());
    }
    
    public void render(){
        app.getRenderManager().renderGeometry(offGeo);
    }
}

Rendering by drawing a cube whose texture is set to the camera’s output feels wrong, but I tried doing things like

app.getRenderManager().renderViewPort(eye.getViewPort(), tpf)

and that didn’t work (left eye completely black, right eye the background colour of the camera).
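
Another route I’ve thought about but not tried (so very much an untested sketch): skip the textured cube entirely and blit jME’s offscreen framebuffer straight into the swapchain framebuffer with glBlitFramebuffer. Here offBuffer is assumed to be the Eye’s jME FrameBuffer (the class above doesn’t currently keep it as a field), and viewSwapchain/swapchainFramebuffer are the objects from openGLRenderView:

// Untested sketch: copy the eye's offscreen framebuffer directly into the
// swapchain framebuffer instead of drawing a cube textured with its output.
glBindFramebuffer(GL_READ_FRAMEBUFFER, offBuffer.getId());
glBindFramebuffer(GL_DRAW_FRAMEBUFFER, swapchainFramebuffer);
glBlitFramebuffer(
        0, 0, offBuffer.getWidth(), offBuffer.getHeight(),
        0, 0, viewSwapchain.width, viewSwapchain.height,
        GL_COLOR_BUFFER_BIT, GL_NEAREST);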

Does anyone have any guidance on whether this is the right way to render the eye cameras? Or on what might be causing the lensing? (I would provide a video, but I don’t think a video would necessarily show the wrongness; it’s a subtle misalignment between where you know things should be and where they are actually rendered. Setting the FOV to 130° rather than what OpenXR suggests (110° ish) reduces the effect, but that feels like two wrongs making a right rather than the real solution.)

The full code is at jmonkeyengine/jme3-xr at openxr-withmove · richardTingle/jmonkeyengine · GitHub

*Not sure what Starcommander’s handle is on the JME forum?

This is an application that boots the whole thing up:

public class XRTestMain3 extends SimpleApplication{

    public static void main(String[] args){

        XRTestMain3 app = new XRTestMain3();
        AppSettings settings = new AppSettings(true);
        XrHmd.setRendererForSettings(settings);
        app.setSettings(settings);
        app.start();
    }

    @Override
    public void simpleInitApp() {
        XrHmd.initHmd(this);

        for(int i = 0; i < 5; i++){
            Box b = new Box(0.1f, 0.1f, 0.1f);
            Geometry geom = new Geometry("Box", b);
            Material mat = new Material(assetManager,
                    "Common/MatDefs/Light/Lighting.j3md");
            geom.setMaterial(mat);
            geom.setLocalTranslation(i,0,0);
            rootNode.attachChild(geom);
        }
        for(int i = 1; i < 5; i++){
            Box b = new Box(0.05f, 0.1f, 0.1f);
            Geometry geom = new Geometry("Box", b);
            Material mat = new Material(assetManager,
                    "Common/MatDefs/Light/Lighting.j3md");
            geom.setMaterial(mat);
            geom.setLocalTranslation(0,i,0);
            rootNode.attachChild(geom);
        }
        for(int i = 1; i < 5; i++){
            Box b = new Box(0.1f, 0.1f, 0.1f);
            Geometry geom = new Geometry("Box", b);
            Material mat = new Material(assetManager,
                    "Common/MatDefs/Light/Lighting.j3md");
            geom.setMaterial(mat);
            geom.setLocalTranslation(0,0,i);
            rootNode.attachChild(geom);
        }

        rootNode.attachChild(checkerboardFloor(assetManager));

        DirectionalLight directionalLight = new DirectionalLight(new Vector3f(0.4f,-0.3f,0.6f).normalizeLocal());
        AmbientLight al = new AmbientLight();
        al.setColor(ColorRGBA.White.mult(0.3f));
        rootNode.addLight(al);
        rootNode.addLight(directionalLight);
    }

    public static Geometry checkerboardFloor(AssetManager assetManager){
        Quad floorQuad = new Quad(10,10);
        Geometry floor = new Geometry("floor", floorQuad);

        Texture floorTexture = assetManager.loadTexture("Textures/checkerBoard.png");
        floorTexture.setMagFilter(Texture.MagFilter.Nearest);
        Material mat = new Material(assetManager,"Common/MatDefs/Misc/Unshaded.j3md");
        mat.setTexture("ColorMap", floorTexture);
        mat.getAdditionalRenderState().setFaceCullMode(RenderState.FaceCullMode.Off);

        floor.setMaterial(mat);
        Quaternion floorRotate = new Quaternion();
        floorRotate.fromAngleAxis(-FastMath.HALF_PI, Vector3f.UNIT_X);
        floor.setLocalRotation(floorRotate);
        floor.setLocalTranslation(-5,-1,5);

        return floor;
    }
}

Without looking, is this a case of one referring to horizontal FOV and the other referring to vertical FOV?

They are more or less the same. The FOV is set here:

public void setFieldOfView(float fovX, float fovY){
    if (this.fovX != fovX || this.fovY != fovY){
        this.fovX = fovX;
        this.fovY = fovY;
        offCamera.setFrustumPerspective(FastMath.RAD_TO_DEG * fovY, fovX / fovY, 0.1f, 1000f);
    }
}

And fovX comes out as 99.695 degrees and fovY as 97 degrees, which is actually a bit weird, as Oculus’s documentation says 106 degrees horizontal by 96 degrees vertical (hard-coding it to those values does not help).

These come out of the layer view that OpenXR produces:

    float fovY = -layerView.fov().angleLeft() + layerView.fov().angleRight();
    float fovX = -layerView.fov().angleDown() + layerView.fov().angleUp();

In the OpenVR days it was just hard-coded to 108 degrees for everyone. Part of me wondered if there was some “excess” FOV that the runtime keeps hidden, so that turns of the head could get something before the app responded, but I couldn’t find anything like that in the documentation.
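
One more thought, which is a guess on my part rather than something I’ve verified: OpenXR’s per-eye fov angles are generally asymmetric (angleLeft is not just -angleRight), and setFrustumPerspective can only build a symmetric frustum from a single vertical fov plus aspect ratio. Throwing away the off-centre part of the projection would misplace things progressively towards the edges of the view, which sounds a lot like the lensing described above. jME’s Camera.setFrustum takes the near-plane bounds explicitly, so the asymmetric frustum could be built from the tangents of the four angles instead, something like:

// Guess/sketch only: build an asymmetric (off-centre) frustum from OpenXR's
// four per-eye fov angles, instead of collapsing them into a symmetric one.
XrFovf fov = layerView.fov();
float near = 0.1f;
float far = 1000f;
offCamera.setFrustum(near, far,
        near * FastMath.tan(fov.angleLeft()),   // left (angleLeft is negative)
        near * FastMath.tan(fov.angleRight()),  // right
        near * FastMath.tan(fov.angleUp()),     // top
        near * FastMath.tan(fov.angleDown()));  // bottom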

If anyone has hardware: we need testers for OpenXR using different configurations and hardware.
Pull request:

@richtea Maybe you can also provide the hardware and settings that you use
(Linux/Windows, OpenXR via Monado or via Steam, …).
My configuration is listed directly in the pull request.
We should also check whether the coordinate system is correct, as explained here:
Viewing and Transformations - OpenGL Wiki → Can_I_make_OpenGL_use_a_left-handed_coordinate_space
Maybe this is the issue you explained in the PR?
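
For reference, the trick that wiki page describes is folding the handedness flip into the projection matrix. In jME terms something like this (sketch only; rightHandedProjection is a hypothetical stand-in for whatever projection is in use):

// Sketch of the wiki's left-handed trick: scaling z by -1 mirrors the space
// and reverses triangle winding, which may be why openGLRenderView calls
// glFrontFace(GL_CW).
Matrix4f flipZ = new Matrix4f(
        1, 0, 0, 0,
        0, 1, 0, 0,
        0, 0, -1, 0,
        0, 0, 0, 1);
Matrix4f leftHandedProjection = rightHandedProjection.mult(flipZ);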