mirror of
https://github.com/ZDoom/raze-gles.git
synced 2025-01-12 03:00:38 +00:00
Lunatic: add 'randgen' module, implementing an encapsulated JKISS PRNG.
Also fix error handling path in our_require(), i.e. when loadstring fails. git-svn-id: https://svn.eduke32.com/eduke32@2857 1a8010ca-5511-0410-912e-c29ae57300e0
This commit is contained in:
parent
e7d3dcba78
commit
fdfcca557b
6 changed files with 168 additions and 9 deletions
|
@ -166,7 +166,8 @@ ifneq (0,$(LUNATIC))
|
||||||
GAMEOBJS+= $(OBJ)/../lpeg.$o # TEMP
|
GAMEOBJS+= $(OBJ)/../lpeg.$o # TEMP
|
||||||
GAMEOBJS+= $(OBJ)/luaJIT_BC_con_lang.$o \
|
GAMEOBJS+= $(OBJ)/luaJIT_BC_con_lang.$o \
|
||||||
$(OBJ)/luaJIT_BC_lunacon.$o \
|
$(OBJ)/luaJIT_BC_lunacon.$o \
|
||||||
$(OBJ)/luaJIT_BC_geom.$o
|
$(OBJ)/luaJIT_BC_geom.$o \
|
||||||
|
$(OBJ)/luaJIT_BC_randgen.$o
|
||||||
|
|
||||||
# now, take care of having the necessary symbols (sector, wall, etc.) in the
|
# now, take care of having the necessary symbols (sector, wall, etc.) in the
|
||||||
# executable no matter what the debugging level
|
# executable no matter what the debugging level
|
||||||
|
|
|
@ -482,6 +482,19 @@ void kclose(int32_t handle);
|
||||||
int32_t kread(int32_t handle, void *buffer, int32_t leng);
|
int32_t kread(int32_t handle, void *buffer, int32_t leng);
|
||||||
]]
|
]]
|
||||||
|
|
||||||
|
-- JKISS PRNG state struct and functions, see randgen module
|
||||||
|
ffi.cdef[[
|
||||||
|
typedef struct {
|
||||||
|
uint32_t x, y, z, c;
|
||||||
|
} rng_jkiss_t;
|
||||||
|
]]
|
||||||
|
decl[[
|
||||||
|
uint32_t rand_jkiss_u32(rng_jkiss_t *s);
|
||||||
|
double rand_jkiss_dbl(rng_jkiss_t *s);
|
||||||
|
|
||||||
|
void md4once(const unsigned char *block, unsigned int len, unsigned char digest[16]);
|
||||||
|
]]
|
||||||
|
|
||||||
ffi.cdef[[
|
ffi.cdef[[
|
||||||
int32_t ksqrt(uint32_t num);
|
int32_t ksqrt(uint32_t num);
|
||||||
]]
|
]]
|
||||||
|
@ -523,6 +536,8 @@ local string_dump = string.dump
|
||||||
string.dump = nil
|
string.dump = nil
|
||||||
|
|
||||||
|
|
||||||
|
gv_tmp = gv_ -- required by randgen
|
||||||
|
|
||||||
local allowed_modules = {
|
local allowed_modules = {
|
||||||
coroutine=coroutine, bit=bit, table=table, math=math, string=string,
|
coroutine=coroutine, bit=bit, table=table, math=math, string=string,
|
||||||
|
|
||||||
|
@ -530,6 +545,7 @@ local allowed_modules = {
|
||||||
clock = function() return gv_.gethitickms()/1000 end,
|
clock = function() return gv_.gethitickms()/1000 end,
|
||||||
},
|
},
|
||||||
|
|
||||||
|
randgen = require("randgen"),
|
||||||
geom = require("geom"),
|
geom = require("geom"),
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -620,7 +636,7 @@ local function our_require(modname)
|
||||||
|
|
||||||
local modfunc, errmsg = loadstring(str)
|
local modfunc, errmsg = loadstring(str)
|
||||||
if (modfunc == nil) then
|
if (modfunc == nil) then
|
||||||
errorf(ERRLEV-1, "Couldn't load \"%s\": %s", fn, errmsg)
|
errorf(ERRLEV-1, "Couldn't load \"%s\": %s", modname, errmsg)
|
||||||
end
|
end
|
||||||
|
|
||||||
local modtab = modfunc(modname)
|
local modtab = modfunc(modname)
|
||||||
|
|
|
@ -41,6 +41,11 @@ g_player;
|
||||||
luaJIT_BC_lunacon;
|
luaJIT_BC_lunacon;
|
||||||
luaJIT_BC_con_lang;
|
luaJIT_BC_con_lang;
|
||||||
luaJIT_BC_geom;
|
luaJIT_BC_geom;
|
||||||
|
luaJIT_BC_randgen;
|
||||||
|
|
||||||
|
rand_jkiss_u32;
|
||||||
|
rand_jkiss_dbl;
|
||||||
|
md4once;
|
||||||
|
|
||||||
gethitickms;
|
gethitickms;
|
||||||
};
|
};
|
||||||
|
|
|
@ -35,6 +35,35 @@ static int32_t SetActor_luacf(lua_State *L);
|
||||||
// in lpeg.o
|
// in lpeg.o
|
||||||
extern int luaopen_lpeg(lua_State *L);
|
extern int luaopen_lpeg(lua_State *L);
|
||||||
|
|
||||||
|
|
||||||
|
typedef struct {
|
||||||
|
uint32_t x, y, z, c;
|
||||||
|
} rng_jkiss_t;
|
||||||
|
|
||||||
|
// See: Good Practice in (Pseudo) Random Number Generation for
|
||||||
|
// Bioinformatics Applications, by David Jones
|
||||||
|
ATTRIBUTE((optimize("O2")))
|
||||||
|
uint32_t rand_jkiss_u32(rng_jkiss_t *s)
|
||||||
|
{
|
||||||
|
uint64_t t;
|
||||||
|
s->x = 314527869 * s->x + 1234567;
|
||||||
|
s->y ^= s->y << 5; s->y ^= s->y >> 7; s->y ^= s->y << 22;
|
||||||
|
t = 4294584393ULL * s->z + s->c; s->c = t >> 32; s->z = t;
|
||||||
|
return s->x + s->y + s->z;
|
||||||
|
}
|
||||||
|
|
||||||
|
ATTRIBUTE((optimize("O2")))
|
||||||
|
double rand_jkiss_dbl(rng_jkiss_t *s)
|
||||||
|
{
|
||||||
|
double x;
|
||||||
|
unsigned int a, b;
|
||||||
|
a = rand_jkiss_u32(s) >> 6; /* Upper 26 bits */
|
||||||
|
b = rand_jkiss_u32(s) >> 5; /* Upper 27 bits */
|
||||||
|
x = (a * 134217728.0 + b) / 9007199254740992.0;
|
||||||
|
return x;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
void El_PrintTimes(void)
|
void El_PrintTimes(void)
|
||||||
{
|
{
|
||||||
int32_t i;
|
int32_t i;
|
||||||
|
|
78
polymer/eduke32/source/lunatic/randgen.lua
Normal file
78
polymer/eduke32/source/lunatic/randgen.lua
Normal file
|
@ -0,0 +1,78 @@
|
||||||
|
-- Pseudo random number generation module for Lunatic
|
||||||
|
|
||||||
|
local ffi = require("ffi")
|
||||||
|
local ffiC = ffi.C
|
||||||
|
|
||||||
|
local rawset = rawset
|
||||||
|
|
||||||
|
local type = type
|
||||||
|
local gv = gv_tmp -- temporarily set in defs.c
|
||||||
|
|
||||||
|
local print = print -- for commented out debug block in new() below
|
||||||
|
|
||||||
|
module(...)
|
||||||
|
|
||||||
|
|
||||||
|
-- NOTE: PRNG state struct and functions are declared in defs.ilua
|
||||||
|
|
||||||
|
ffi.cdef[[
|
||||||
|
typedef union { unsigned char u[16]; double d[2]; } uchar_double_u_t;
|
||||||
|
typedef union { unsigned char u[16]; uint32_t i[4]; } uchar_uint_u_t;
|
||||||
|
]]
|
||||||
|
|
||||||
|
local mt = {
|
||||||
|
__tostring = function(s)
|
||||||
|
return "rand.new("..s.x..","..s.y..","..s.z..","..s.c..")"
|
||||||
|
end,
|
||||||
|
|
||||||
|
__index = {
|
||||||
|
getu32 = ffiC.rand_jkiss_u32,
|
||||||
|
getdbl = ffiC.rand_jkiss_dbl,
|
||||||
|
|
||||||
|
-- Initialize the JKISS PRNG using the MD4 of the lower bits of the
|
||||||
|
-- profiling timer
|
||||||
|
init_time_md4 = function(s)
|
||||||
|
local tin = ffi.new("uchar_double_u_t")
|
||||||
|
local tout = ffi.new("uchar_uint_u_t")
|
||||||
|
|
||||||
|
repeat
|
||||||
|
tin.d[0] = gv.gethitickms() % 1
|
||||||
|
tin.d[1] = gv.gethitickms() % 1
|
||||||
|
|
||||||
|
ffiC.md4once(tin.u, 16, tout.u)
|
||||||
|
|
||||||
|
s.y = tout.u[1]
|
||||||
|
until (s.y ~= 0) -- y must not be zero!
|
||||||
|
|
||||||
|
s.x = tout.u[0]
|
||||||
|
s.z = tout.u[2]
|
||||||
|
s.c = tout.u[3] % 698769068 + 1 -- Should be less than 698769069
|
||||||
|
end,
|
||||||
|
},
|
||||||
|
}
|
||||||
|
local jkiss = ffi.metatype("rng_jkiss_t", mt)
|
||||||
|
|
||||||
|
function new(x,y,z,c)
|
||||||
|
local s
|
||||||
|
if (x == nil or type(x)=="boolean") then
|
||||||
|
s = jkiss(0,0,0,0) -- invalid state, must be initialized first
|
||||||
|
if (x) then
|
||||||
|
s:init_time_md4()
|
||||||
|
end
|
||||||
|
else
|
||||||
|
s = jkiss(x,y,z,c)
|
||||||
|
end
|
||||||
|
--[[
|
||||||
|
print("TEST")
|
||||||
|
local r=ffi.new("rng_jkiss_t")
|
||||||
|
r.x = 123456789; r.y = 987654321; r.z = 43219876; r.c = 6543217;
|
||||||
|
|
||||||
|
t=gv.gethitickms()
|
||||||
|
for i=1,4*2*1e6 do
|
||||||
|
ffiC.rand_jkiss_dbl(r)
|
||||||
|
end
|
||||||
|
print("TIME: "..gv.gethitickms()-t) -- x86_64: approx. 100 ms
|
||||||
|
--]]
|
||||||
|
|
||||||
|
return s
|
||||||
|
end
|
|
@ -1,22 +1,49 @@
|
||||||
#!/usr/bin/env luajit
|
#!/usr/bin/env luajit
|
||||||
|
|
||||||
local math = require("math")
|
|
||||||
local os = require("os")
|
local os = require("os")
|
||||||
|
|
||||||
local geom = require("geom")
|
local geom = require("geom")
|
||||||
|
|
||||||
|
|
||||||
local N = os.exit and tostring(arg[1]) or 1e6
|
local N = os.exit and (arg[1] and tostring(arg[1])) or 1e6
|
||||||
|
|
||||||
local A,B = {}, {}
|
local A,B = {}, {}
|
||||||
local V,W = {}, {}
|
local V,W = {}, {}
|
||||||
|
|
||||||
local function randvec()
|
local randvec
|
||||||
|
|
||||||
|
if (os.exit) then
|
||||||
|
local math = require("math")
|
||||||
|
|
||||||
|
randvec = function()
|
||||||
return geom.vec2(math.random(), math.random())
|
return geom.vec2(math.random(), math.random())
|
||||||
|
end
|
||||||
|
else
|
||||||
|
local randgen = require("randgen")
|
||||||
|
local s = randgen.new(true)
|
||||||
|
|
||||||
|
-- NOTE: factoring out the inner s:getdbl() into a separate function
|
||||||
|
-- reduces performance seriously (about an order of magnitude!)
|
||||||
|
randvec = function()
|
||||||
|
return geom.vec2(s:getdbl(), s:getdbl())
|
||||||
|
end
|
||||||
end
|
end
|
||||||
|
|
||||||
local t1 = os.clock()
|
local t1 = os.clock()
|
||||||
|
|
||||||
|
if (os.exit == nil) then
|
||||||
|
local randgen = require("randgen")
|
||||||
|
local r = randgen.new(true)
|
||||||
|
|
||||||
|
for i=1,4*2*N do
|
||||||
|
-- This is to test the performance compared to a direct
|
||||||
|
-- ffiC.rand_jkiss_dbl() call in randgen.lua
|
||||||
|
r:getdbl()
|
||||||
|
end
|
||||||
|
end
|
||||||
|
|
||||||
|
local t2 = os.clock()
|
||||||
|
|
||||||
-- init random points and vectors
|
-- init random points and vectors
|
||||||
for i=1,N do
|
for i=1,N do
|
||||||
A[i] = randvec()
|
A[i] = randvec()
|
||||||
|
@ -25,17 +52,20 @@ for i=1,N do
|
||||||
W[i] = randvec()
|
W[i] = randvec()
|
||||||
end
|
end
|
||||||
|
|
||||||
local t2 = os.clock()
|
local t3 = os.clock()
|
||||||
|
|
||||||
local v = geom.vec2(0, 0)
|
local v = geom.vec2(0, 0)
|
||||||
for i=1,N do
|
for i=1,N do
|
||||||
v = v + geom.intersect(A[i],V[i], B[i],W[i], true)
|
v = v + geom.intersect(A[i],V[i], B[i],W[i], true)
|
||||||
end
|
end
|
||||||
|
|
||||||
local t3 = os.clock()
|
local t4 = os.clock()
|
||||||
|
|
||||||
|
-- x86_64 (embedded): approx. 200 ms (vs. the 100 ms of direct
|
||||||
|
-- ffiC.rand_jkiss_dbl()):
|
||||||
print(1000*(t2-t1))
|
print(1000*(t2-t1))
|
||||||
print(1000*(t3-t2))
|
print(1000*(t3-t2)) -- x86_64: approx. 500 ms
|
||||||
|
print(1000*(t4-t3)) -- x86_64: approx. 35 ms
|
||||||
print(v)
|
print(v)
|
||||||
|
|
||||||
return {} -- appease Lunatic's require
|
return {} -- appease Lunatic's require
|
||||||
|
|
Loading…
Reference in a new issue