2019-10-01 13:17:20 +00:00
|
|
|
/*
|
|
|
|
KVMGFX Client - A KVM Client for VGA Passthrough
|
|
|
|
Copyright (C) 2017-2019 Geoffrey McRae <geoff@hostfission.com>
|
|
|
|
https://looking-glass.hostfission.com
|
|
|
|
|
|
|
|
This program is free software; you can redistribute it and/or modify it under
|
|
|
|
the terms of the GNU General Public License as published by the Free Software
|
|
|
|
Foundation; either version 2 of the License, or (at your option) any later
|
|
|
|
version.
|
|
|
|
|
|
|
|
This program is distributed in the hope that it will be useful, but WITHOUT ANY
|
|
|
|
WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A
|
|
|
|
PARTICULAR PURPOSE. See the GNU General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License along with
|
|
|
|
this program; if not, write to the Free Software Foundation, Inc., 59 Temple
|
|
|
|
Place, Suite 330, Boston, MA 02111-1307 USA
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "common/framebuffer.h"
|
|
|
|
#include "common/debug.h"
|
|
|
|
|
|
|
|
#include <string.h>
|
2020-04-12 03:14:53 +00:00
|
|
|
#include <stdatomic.h>
|
2020-08-03 01:16:30 +00:00
|
|
|
#include <emmintrin.h>
|
2020-08-03 01:58:38 +00:00
|
|
|
#include <smmintrin.h>
|
2020-08-10 06:18:08 +00:00
|
|
|
#include <unistd.h>
|
2020-04-12 03:14:53 +00:00
|
|
|
|
2020-08-10 06:18:08 +00:00
|
|
|
#define FB_CHUNK_SIZE 1048576 // 1MB
|
|
|
|
#define FB_SPIN_LIMIT 10000 // 10ms
|
2019-10-01 13:17:20 +00:00
|
|
|
|
2020-04-12 03:14:53 +00:00
|
|
|
struct stFrameBuffer
|
|
|
|
{
|
|
|
|
atomic_uint_least32_t wp;
|
|
|
|
uint8_t data[0];
|
|
|
|
};
|
|
|
|
|
|
|
|
const size_t FrameBufferStructSize = sizeof(FrameBuffer);
|
|
|
|
|
|
|
|
void framebuffer_wait(const FrameBuffer * frame, size_t size)
|
|
|
|
{
|
2020-10-29 15:32:25 +00:00
|
|
|
while(atomic_load_explicit(&frame->wp, memory_order_acquire) < size) {
|
|
|
|
while(frame->wp < size)
|
|
|
|
{
|
|
|
|
}
|
|
|
|
}
|
2020-04-12 03:14:53 +00:00
|
|
|
}
|
|
|
|
|
2020-08-03 04:41:57 +00:00
|
|
|
bool framebuffer_read(const FrameBuffer * frame, void * restrict dst,
|
|
|
|
size_t dstpitch, size_t height, size_t width, size_t bpp, size_t pitch)
|
2019-10-01 13:17:20 +00:00
|
|
|
{
|
2020-08-03 04:41:57 +00:00
|
|
|
uint8_t * restrict d = (uint8_t*)dst;
|
2020-04-14 03:27:07 +00:00
|
|
|
uint_least32_t rp = 0;
|
|
|
|
size_t y = 0;
|
|
|
|
const size_t linewidth = width * bpp;
|
2020-08-03 04:41:57 +00:00
|
|
|
const size_t blocks = linewidth / 64;
|
|
|
|
const size_t left = linewidth % 64;
|
2020-04-14 03:27:07 +00:00
|
|
|
|
|
|
|
while(y < height)
|
2019-10-01 13:17:20 +00:00
|
|
|
{
|
2020-04-12 03:14:53 +00:00
|
|
|
uint_least32_t wp;
|
2020-08-10 06:18:08 +00:00
|
|
|
int spinCount = 0;
|
2020-04-12 03:14:53 +00:00
|
|
|
|
2019-10-01 13:17:20 +00:00
|
|
|
/* spinlock */
|
2020-08-10 06:18:08 +00:00
|
|
|
wp = atomic_load_explicit(&frame->wp, memory_order_acquire);
|
|
|
|
while(wp - rp < linewidth)
|
|
|
|
{
|
|
|
|
if (++spinCount == FB_SPIN_LIMIT)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
usleep(1);
|
2020-08-03 01:16:30 +00:00
|
|
|
wp = atomic_load_explicit(&frame->wp, memory_order_acquire);
|
2020-08-10 06:18:08 +00:00
|
|
|
}
|
2019-10-14 07:08:06 +00:00
|
|
|
|
2020-08-03 04:41:57 +00:00
|
|
|
_mm_mfence();
|
|
|
|
__m128i * restrict s = (__m128i *)(frame->data + rp);
|
|
|
|
for(int i = 0; i < blocks; ++i)
|
|
|
|
{
|
|
|
|
__m128i *_d = (__m128i *)d;
|
|
|
|
__m128i *_s = (__m128i *)s;
|
|
|
|
__m128i v1 = _mm_stream_load_si128(_s + 0);
|
|
|
|
__m128i v2 = _mm_stream_load_si128(_s + 1);
|
|
|
|
__m128i v3 = _mm_stream_load_si128(_s + 2);
|
|
|
|
__m128i v4 = _mm_stream_load_si128(_s + 3);
|
|
|
|
|
|
|
|
_mm_storeu_si128(_d + 0, v1);
|
|
|
|
_mm_storeu_si128(_d + 1, v2);
|
|
|
|
_mm_storeu_si128(_d + 2, v3);
|
|
|
|
_mm_storeu_si128(_d + 3, v4);
|
|
|
|
|
|
|
|
d += 64;
|
|
|
|
s += 4;
|
|
|
|
}
|
2020-08-03 01:16:30 +00:00
|
|
|
|
|
|
|
if (left)
|
2020-08-03 04:41:57 +00:00
|
|
|
{
|
|
|
|
memcpy(d, s, left);
|
|
|
|
d += left;
|
|
|
|
}
|
2019-10-14 07:08:06 +00:00
|
|
|
|
2020-04-14 03:27:07 +00:00
|
|
|
rp += pitch;
|
2020-08-03 04:41:57 +00:00
|
|
|
d += dstpitch - linewidth;
|
2020-04-14 03:27:07 +00:00
|
|
|
++y;
|
2019-10-01 13:17:20 +00:00
|
|
|
}
|
2020-04-14 03:27:07 +00:00
|
|
|
|
2019-10-01 13:17:20 +00:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2020-04-14 03:27:07 +00:00
|
|
|
bool framebuffer_read_fn(const FrameBuffer * frame, size_t height, size_t width,
|
|
|
|
size_t bpp, size_t pitch, FrameBufferReadFn fn, void * opaque)
|
2019-10-01 13:17:20 +00:00
|
|
|
{
|
2020-04-14 03:27:07 +00:00
|
|
|
uint_least32_t rp = 0;
|
|
|
|
size_t y = 0;
|
|
|
|
const size_t linewidth = width * bpp;
|
|
|
|
|
|
|
|
while(y < height)
|
2019-10-01 13:17:20 +00:00
|
|
|
{
|
2020-04-12 03:14:53 +00:00
|
|
|
uint_least32_t wp;
|
2020-08-10 06:18:08 +00:00
|
|
|
int spinCount = 0;
|
2020-04-12 03:14:53 +00:00
|
|
|
|
2019-10-01 13:17:20 +00:00
|
|
|
/* spinlock */
|
2020-08-10 06:18:08 +00:00
|
|
|
wp = atomic_load_explicit(&frame->wp, memory_order_acquire);
|
|
|
|
while(wp - rp < linewidth)
|
|
|
|
{
|
|
|
|
if (++spinCount == FB_SPIN_LIMIT)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
usleep(1);
|
2020-08-03 01:16:30 +00:00
|
|
|
wp = atomic_load_explicit(&frame->wp, memory_order_acquire);
|
2020-08-10 06:18:08 +00:00
|
|
|
}
|
2019-10-14 07:08:06 +00:00
|
|
|
|
2020-04-14 03:27:07 +00:00
|
|
|
if (!fn(opaque, frame->data + rp, linewidth))
|
2019-10-01 13:17:20 +00:00
|
|
|
return false;
|
2019-10-14 07:08:06 +00:00
|
|
|
|
2020-04-14 03:27:07 +00:00
|
|
|
rp += pitch;
|
|
|
|
++y;
|
2019-10-01 13:17:20 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Prepare the framebuffer for writing
|
|
|
|
*/
|
2020-01-13 08:30:49 +00:00
|
|
|
void framebuffer_prepare(FrameBuffer * frame)
|
2019-10-01 13:17:20 +00:00
|
|
|
{
|
2020-08-03 01:16:30 +00:00
|
|
|
atomic_store_explicit(&frame->wp, 0, memory_order_release);
|
2019-10-01 13:17:20 +00:00
|
|
|
}
|
|
|
|
|
2020-08-03 04:41:57 +00:00
|
|
|
bool framebuffer_write(FrameBuffer * frame, const void * restrict src, size_t size)
|
2019-10-01 13:17:20 +00:00
|
|
|
{
|
2020-08-03 04:41:57 +00:00
|
|
|
__m128i * restrict s = (__m128i *)src;
|
|
|
|
__m128i * restrict d = (__m128i *)frame->data;
|
|
|
|
size_t wp = 0;
|
|
|
|
|
|
|
|
_mm_mfence();
|
2020-08-03 01:16:30 +00:00
|
|
|
|
2019-10-01 13:17:20 +00:00
|
|
|
/* copy in chunks */
|
2020-08-03 02:24:11 +00:00
|
|
|
while(size > 63)
|
2020-08-03 01:16:30 +00:00
|
|
|
{
|
2020-08-03 04:41:57 +00:00
|
|
|
__m128i *_d = (__m128i *)d;
|
|
|
|
__m128i *_s = (__m128i *)s;
|
|
|
|
__m128i v1 = _mm_stream_load_si128(_s + 0);
|
|
|
|
__m128i v2 = _mm_stream_load_si128(_s + 1);
|
|
|
|
__m128i v3 = _mm_stream_load_si128(_s + 2);
|
|
|
|
__m128i v4 = _mm_stream_load_si128(_s + 3);
|
|
|
|
|
|
|
|
_mm_store_si128(_d + 0, v1);
|
|
|
|
_mm_store_si128(_d + 1, v2);
|
|
|
|
_mm_store_si128(_d + 2, v3);
|
|
|
|
_mm_store_si128(_d + 3, v4);
|
|
|
|
|
|
|
|
s += 4;
|
|
|
|
d += 4;
|
2020-08-03 02:24:11 +00:00
|
|
|
size -= 64;
|
|
|
|
wp += 64;
|
2020-08-03 01:44:24 +00:00
|
|
|
|
|
|
|
if (wp % FB_CHUNK_SIZE == 0)
|
|
|
|
atomic_store_explicit(&frame->wp, wp, memory_order_release);
|
2020-08-03 01:16:30 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if(size)
|
2019-10-01 13:17:20 +00:00
|
|
|
{
|
2020-08-03 02:24:11 +00:00
|
|
|
memcpy(frame->data + wp, s, size);
|
2020-08-03 01:44:24 +00:00
|
|
|
wp += size;
|
2019-10-01 13:17:20 +00:00
|
|
|
}
|
2020-08-03 01:16:30 +00:00
|
|
|
|
2020-08-03 01:44:24 +00:00
|
|
|
atomic_store_explicit(&frame->wp, wp, memory_order_release);
|
2019-10-01 13:17:20 +00:00
|
|
|
return true;
|
2020-04-12 03:14:53 +00:00
|
|
|
}
|