X-Git-Url: http://git.osdn.net/view?p=csp-qt%2Fcommon_source_project-fm7.git;a=blobdiff_plain;f=source%2Fsrc%2Fcommon.h;h=ec899592a5fa527952236e143a8ce584ac723d03;hp=46f441f65323693173de66e18dc3ce262b357dc3;hb=d4eda6c3bca1f8ff98534197e0704e9558a5fae5;hpb=22e767792b7fdb2411c7e11ddbc9a2f3ffcc1170

diff --git a/source/src/common.h b/source/src/common.h
index 46f441f65..ec899592a 100644
--- a/source/src/common.h
+++ b/source/src/common.h
@@ -15,6 +15,10 @@
 //	#define USE_SHARED_DLL
 //#endif
 
+#ifdef _USE_QT
+#include <SDL.h>
+#endif
+
 // use zlib to decompress gzip file???
 #ifdef _WIN32
 	#if defined(_MSC_VER) && (_MSC_VER >= 1500)
@@ -108,6 +112,7 @@
 #include <stdlib.h>
 #include <string.h>
 #ifdef _MSC_VER
+#include <io.h>
 #include <typeinfo.h>
 #else
 #include <typeinfo>
@@ -279,8 +284,10 @@ typedef union {
 		int8_t l, h;
 #endif
 	} sb;
-	uint16_t u16;
-	int16_t s16;
+	uint16_t u16; // ToDo: Remove
+	int16_t s16; // ToDo: Remove
+	uint16_t w;
+	int16_t sw;
 
 	inline void read_2bytes_le_from(uint8_t *t)
 	{
@@ -384,7 +391,8 @@ typedef union {
 	} p16;
 	uint32_t d;
 	int32_t sd;
-	float f;
+	float f; // single float
+  
 	inline void read_2bytes_le_from(uint8_t *t)
 	{
 		b.l = t[0]; b.h = t[1]; b.h2 = b.h3 = 0;
@@ -509,7 +517,7 @@ typedef union {
 		littlev.b.l = b.l; littlev.b.h = b.h; littlev.b.h2 = b.h2; littlev.b.h3 = b.h3;
 		return littlev.dw;
 	}
-} pair_t;
+} pair32_t;
 
 
 typedef union {
@@ -564,14 +572,21 @@ typedef union {
 	} sd;
 	struct {
 #ifdef __BIG_ENDIAN__
-		pair_t h, l;
+		pair32_t h, l;
 #else
-		pair_t l, h;
+		pair32_t l, h;
 #endif
 	} p32;
-	uint64_t u64;
-	int64_t s64;
-	double d64;
+	struct {
+#ifdef __BIG_ENDIAN__
+		float h, l;
+#else
+		float l, h;
+#endif
+	} f32;
+	uint64_t q;
+	int64_t sq;
+	double df; // double float
 	inline void read_2bytes_le_from(uint8_t *t)
 	{
 		b.l = t[0]; b.h = t[1]; b.h2 = b.h3 = 0;
@@ -927,7 +942,7 @@ uint16_t DLL_PREFIX EndianFromBig_WORD(uint16_t x);
 
 // hint for SIMD
 #if defined(__clang__)
-	#define __DECL_VECTORIZED_LOOP   _Pragma("clang loop vectorize(enable) interleave(enable)")
+	#define __DECL_VECTORIZED_LOOP   _Pragma("clang loop vectorize(enable) distribute(enable)")
 #elif defined(__GNUC__)
 	#define __DECL_VECTORIZED_LOOP	_Pragma("GCC ivdep")
 #else
@@ -936,7 +951,7 @@ uint16_t DLL_PREFIX EndianFromBig_WORD(uint16_t x);
 
 // C99 math functions
 #ifdef _MSC_VER
-	#define my_isfinite _finite
+	#define my_isfinite  _finite
 	#define my_log2(v) (log((double)(v)) / log(2.0))
 #else
 	#include <cmath>
@@ -990,10 +1005,284 @@ uint16_t DLL_PREFIX EndianFromBig_WORD(uint16_t x);
 #endif
 #endif
 
+// 20181104 K.O:
+// The routines below are common helpers shared by the rendering code.
+
+#ifdef _MSC_VER // MSVC branch: alignment is requested with __declspec(align(...))
+	#define __DECL_ALIGNED(foo) __declspec(align(foo))
+	#ifndef __builtin_assume_aligned
+		#define __builtin_assume_aligned(foo, a) foo
+	#endif
+#elif defined(__GNUC__) // GNU-style attribute; no fallback for __builtin_assume_aligned is defined in this branch
+	#define __DECL_ALIGNED(foo) __attribute__((aligned(foo)))
+#else
+	// ToDo: other compilers -- the alignment hint just passes the pointer through and __DECL_ALIGNED expands to nothing.
+	#define __builtin_assume_aligned(foo, a) foo
+	#define __DECL_ALIGNED(foo)
+#endif
+
+// ToDo: for MSVC. NOTE(review): __v8hi / __v16hi are not declared in the visible part of this header -- confirm where they come from.
+#if defined(_RGB555) || defined(_RGBA565)
+typedef	__DECL_ALIGNED(16) union { // 8 pixels, also viewable as one __v8hi value
+	scrntype_t w[8];
+	__v8hi v;
+} scrntype_vec8_t;
+typedef	__DECL_ALIGNED(16) union { // 16 pixels, also viewable as two __v8hi values
+	scrntype_t w[16];
+	__v8hi v[2];
+} scrntype_vec16_t;
+#else
+typedef	__DECL_ALIGNED(32) union { // 8 pixels, also viewable as one __v16hi value
+	scrntype_t w[8];
+	__v16hi v;
+} scrntype_vec8_t;
+typedef	__DECL_ALIGNED(32) union { // 16 pixels, also viewable as two __v16hi values
+	scrntype_t w[16];
+	__v16hi v[2];
+} scrntype_vec16_t;
+#endif
+
+typedef __DECL_ALIGNED(16) union { // eight uint8_t lanes overlaid on one __v4hi value
+	__v4hi v;
+	uint8_t w[8];
+} uint8_vec8_t;
+
+typedef __DECL_ALIGNED(16) union { // eight uint16_t lanes overlaid on one __v8hi value
+	__v8hi v;
+	uint16_t w[8];
+} uint16_vec8_t;
+
+typedef __DECL_ALIGNED(16) union { // NOTE(review): aligned to 16 here, while the __v16hi-based scrntype_vec8_t uses 32 -- confirm this is intended
+	__v16hi v;
+	uint32_t w[8]; // eight uint32_t lanes sharing storage with v
+} uint32_vec8_t;
+
+typedef __DECL_ALIGNED(16) struct { // 256 rows of eight uint16_t lanes
+	uint16_vec8_t plane_table[256]; // the inline helpers in this header index this with a uint8_t source byte
+} _bit_trans_table_t;
+
+typedef __DECL_ALIGNED(sizeof(scrntype_vec8_t)) struct { // 256 rows of eight scrntype_t pixels, aligned to one row
+	scrntype_vec8_t plane_table[256]; // the *_PixelTbl helpers in this header index this with a uint8_t source byte
+} _bit_trans_table_scrn_t;
+
+typedef struct { // Parameter block passed as `src` to the *_Line routines declared in this header.
+	scrntype_t* palette; // Must have 2^planes entries. If NULL, RGB is assumed.
+	_bit_trans_table_t* bit_trans_table[16]; // At least `planes` entries must exist. Each must be aligned to sizeof(uint16_vec8_t).
+	int xzoom; // 1 - 4?
+	bool is_render[16];
+	int shift;
+	uint8_t* data[16];
+	uint32_t baseaddress[16];
+	uint32_t voffset[16];
+	uint32_t addrmask;  // For global increment.
+	uint32_t addrmask2; // For local increment.
+	uint32_t begin_pos;
+	uint32_t render_width;
+} _render_command_data_t;
+
+
+// Expands one source byte into eight pixels: a table lane equal to 0 yields off_val, any other lane yields on_val.
+inline scrntype_vec8_t ConvertByteToMonochromePackedPixel(uint8_t src, _bit_trans_table_t *tbl,scrntype_t on_val, scrntype_t off_val)
+{
+	_bit_trans_table_t *table = (_bit_trans_table_t*)__builtin_assume_aligned(tbl, sizeof(uint16_vec8_t));
+	__DECL_ALIGNED(16) uint16_vec8_t   lanes;
+	__DECL_ALIGNED(32) scrntype_vec8_t pixels;
+	lanes.v = table->plane_table[src].v; // row selected by the byte value
+__DECL_VECTORIZED_LOOP
+	for(int lane = 0; lane < 8; lane++) {
+		pixels.w[lane] = (lanes.w[lane] != 0) ? on_val : off_val;
+	}
+	return pixels;
+}
+
+// Note: Please read the note(s) in common.cpp -- 20181105 K.Ohta.
+// Tables for the functions below must be aligned to 16 bytes (_bit_trans_table_t) or 32 bytes (_bit_trans_table_scrn_t).
+void DLL_PREFIX ConvertByteToPackedPixelByColorTable(uint8_t *src, scrntype_t* dst, int bytes, _bit_trans_table_t *tbl, scrntype_t *on_color_table, scrntype_t* off_color_table);
+void DLL_PREFIX ConvertByteToPackedPixelByColorTable2(uint8_t *src, scrntype_t* dst, int bytes, _bit_trans_table_scrn_t *tbl, scrntype_t *on_color_table, scrntype_t* off_color_table);
+void DLL_PREFIX ConvertByteToSparceUint16(uint8_t *src, uint16_t* dst, int bytes, _bit_trans_table_t *tbl, uint16_t mask);
+void DLL_PREFIX ConvertByteToSparceUint8(uint8_t *src, uint16_t* dst, int bytes, _bit_trans_table_t *tbl, uint16_t mask); // NOTE(review): dst is uint16_t* despite the Uint8 name -- confirm against the definition
+
+// tbl: 256 rows of (ON_VAL_COLOR : OFF_VAL_COLOR) pixels, aligned to sizeof(scrntype_vec8_t). Returns the row selected by src.
+inline scrntype_vec8_t ConvertByteToPackedPixel_PixelTbl(uint8_t src, _bit_trans_table_scrn_t *tbl)
+{
+	// The alignment hint uses the table's own row type (scrntype_vec8_t), matching the typedef, not uint16_vec8_t.
+	_bit_trans_table_scrn_t *table = (_bit_trans_table_scrn_t*)__builtin_assume_aligned(tbl, sizeof(scrntype_vec8_t));
+	__DECL_ALIGNED(32) scrntype_vec8_t pixels;
+	pixels.v = table->plane_table[src].v;
+	return pixels;
+}
+
+// tbl: 256 rows of (ON_VAL_COLOR : OFF_VAL_COLOR) pixels, aligned to sizeof(scrntype_vec8_t).
+// Returns the row selected by src with every pixel stored twice in a row (16 pixels in total).
+inline scrntype_vec16_t ConvertByteToDoublePackedPixel_PixelTbl(uint8_t src, _bit_trans_table_scrn_t *tbl)
+{
+	// The alignment hint uses the table's own row type (scrntype_vec8_t), matching the typedef, not uint16_vec8_t.
+	_bit_trans_table_scrn_t *table = (_bit_trans_table_scrn_t*)__builtin_assume_aligned(tbl, sizeof(scrntype_vec8_t));
+	__DECL_ALIGNED(32) scrntype_vec8_t  row;
+	__DECL_ALIGNED(32) scrntype_vec16_t doubled;
+	row.v = table->plane_table[src].v;
+__DECL_VECTORIZED_LOOP
+	for(int px = 0; px < 8; px++) { // direct indexing: no counter carried across iterations
+		doubled.w[px * 2]     = row.w[px];
+		doubled.w[px * 2 + 1] = row.w[px];
+	}
+	return doubled;
+}
+
+// Writes 16 bytes to dst: each of the eight table lanes selected by src, truncated to uint8_t, stored twice in a row.
+// The table must have been initialized with ON_COLOR : OFF_COLOR values.
+inline void ConvertByteToDoubleMonochromeUint8(uint8_t src, uint8_t* dst, _bit_trans_table_t* tbl)
+{
+	uint16_vec8_t *rows = (uint16_vec8_t*)__builtin_assume_aligned(&(tbl->plane_table[0]), sizeof(uint16_vec8_t));
+	__DECL_ALIGNED(16) uint16_vec8_t lanes;
+	__DECL_ALIGNED(16) uint8_t staged[16]; // aligned scratch, completely filled before dst is touched
+	lanes = rows[src];
+__DECL_VECTORIZED_LOOP
+	for(int lane = 0; lane < 8; lane++) {
+		const uint8_t value = (uint8_t)(lanes.w[lane]);
+		staged[lane * 2]     = value;
+		staged[lane * 2 + 1] = value;
+	}
+	// Copy the finished block out to the caller's buffer.
+__DECL_VECTORIZED_LOOP
+	for(int n = 0; n < 16; n++) {
+		dst[n] = staged[n];
+	}
+}
+
+// Writes 8 bytes to dst: the eight table lanes selected by src, each truncated to uint8_t.
+inline void ConvertByteToMonochromeUint8(uint8_t src, uint8_t* dst, _bit_trans_table_t* tbl)
+{
+	uint16_vec8_t *rows = (uint16_vec8_t*)__builtin_assume_aligned(&(tbl->plane_table[0]), sizeof(uint16_vec8_t));
+	__DECL_ALIGNED(16) uint16_vec8_t lanes;
+	lanes = rows[src]; // local copy taken before dst is written
+__DECL_VECTORIZED_LOOP
+	for(int lane = 0; lane < 8; lane++) {
+		dst[lane] = (uint8_t)(lanes.w[lane]);
+	}
+}
+
+// Writes 8 bytes to dst: the table rows selected by r, g and b are OR-ed together, every lane is
+// shifted right by `shift`, and the result is truncated to uint8_t.
+inline void ConvertRGBTo8ColorsUint8(uint8_t r, uint8_t g, uint8_t b, uint8_t* dst, _bit_trans_table_t* rtbl, _bit_trans_table_t* gtbl, _bit_trans_table_t* btbl, int shift)
+{
+	uint16_vec8_t *red   = (uint16_vec8_t*)__builtin_assume_aligned(&(rtbl->plane_table[0]), sizeof(uint16_vec8_t));
+	uint16_vec8_t *green = (uint16_vec8_t*)__builtin_assume_aligned(&(gtbl->plane_table[0]), sizeof(uint16_vec8_t));
+	uint16_vec8_t *blue  = (uint16_vec8_t*)__builtin_assume_aligned(&(btbl->plane_table[0]), sizeof(uint16_vec8_t));
+	__DECL_ALIGNED(16) uint16_vec8_t mixed;
+	// Merge the three planes first, then apply one common shift.
+	mixed.v = red[r].v | green[g].v | blue[b].v;
+	mixed.v = mixed.v >> shift;
+__DECL_VECTORIZED_LOOP
+	for(int lane = 0; lane < 8; lane++) {
+		dst[lane] = (uint8_t)(mixed.w[lane]);
+	}
+}
+
+// Writes 8 bytes to dst: lanes 0-3 of ((rtbl[r] | gtbl[g] | btbl[b]) >> shift), each truncated
+// to uint8_t and stored twice in a row.
+inline void ConvertRGBTo8ColorsUint8_Zoom2Left(uint8_t r, uint8_t g, uint8_t b, uint8_t* dst, _bit_trans_table_t* rtbl, _bit_trans_table_t* gtbl, _bit_trans_table_t* btbl, int shift)
+{
+	uint16_vec8_t *red   = (uint16_vec8_t*)__builtin_assume_aligned(&(rtbl->plane_table[0]), sizeof(uint16_vec8_t));
+	uint16_vec8_t *green = (uint16_vec8_t*)__builtin_assume_aligned(&(gtbl->plane_table[0]), sizeof(uint16_vec8_t));
+	uint16_vec8_t *blue  = (uint16_vec8_t*)__builtin_assume_aligned(&(btbl->plane_table[0]), sizeof(uint16_vec8_t));
+	__DECL_ALIGNED(16) uint16_vec8_t mixed;
+	mixed.v = red[r].v | green[g].v | blue[b].v;
+	mixed.v = mixed.v >> shift;
+__DECL_VECTORIZED_LOOP
+	for(int px = 0; px < 4; px++) {
+		const uint8_t value = (uint8_t)(mixed.w[px]);
+		dst[px * 2]     = value;
+		dst[px * 2 + 1] = value;
+	}
+}
+
+// Writes 8 bytes to dst: lanes 4-7 of ((rtbl[r] | gtbl[g] | btbl[b]) >> shift), each truncated
+// to uint8_t and stored twice in a row.
+inline void ConvertRGBTo8ColorsUint8_Zoom2Right(uint8_t r, uint8_t g, uint8_t b, uint8_t* dst, _bit_trans_table_t* rtbl, _bit_trans_table_t* gtbl, _bit_trans_table_t* btbl, int shift)
+{
+	uint16_vec8_t *red   = (uint16_vec8_t*)__builtin_assume_aligned(&(rtbl->plane_table[0]), sizeof(uint16_vec8_t));
+	uint16_vec8_t *green = (uint16_vec8_t*)__builtin_assume_aligned(&(gtbl->plane_table[0]), sizeof(uint16_vec8_t));
+	uint16_vec8_t *blue  = (uint16_vec8_t*)__builtin_assume_aligned(&(btbl->plane_table[0]), sizeof(uint16_vec8_t));
+	__DECL_ALIGNED(16) uint16_vec8_t mixed;
+	mixed.v = red[r].v | green[g].v | blue[b].v;
+	mixed.v = mixed.v >> shift;
+__DECL_VECTORIZED_LOOP
+	for(int px = 0; px < 4; px++) {
+		const uint8_t value = (uint8_t)(mixed.w[px + 4]);
+		dst[px * 2]     = value;
+		dst[px * 2 + 1] = value;
+	}
+}
+
+// Writes 16 bytes to dst: all eight lanes of ((rtbl[r] | gtbl[g] | btbl[b]) >> shift), each
+// truncated to uint8_t and stored twice in a row.
+inline void ConvertRGBTo8ColorsUint8_Zoom2Double(uint8_t r, uint8_t g, uint8_t b, uint8_t* dst, _bit_trans_table_t* rtbl, _bit_trans_table_t* gtbl, _bit_trans_table_t* btbl, int shift)
+{
+	uint16_vec8_t *red   = (uint16_vec8_t*)__builtin_assume_aligned(&(rtbl->plane_table[0]), sizeof(uint16_vec8_t));
+	uint16_vec8_t *green = (uint16_vec8_t*)__builtin_assume_aligned(&(gtbl->plane_table[0]), sizeof(uint16_vec8_t));
+	uint16_vec8_t *blue  = (uint16_vec8_t*)__builtin_assume_aligned(&(btbl->plane_table[0]), sizeof(uint16_vec8_t));
+	__DECL_ALIGNED(16) uint16_vec8_t mixed;
+	mixed.v = red[r].v | green[g].v | blue[b].v;
+	mixed.v = mixed.v >> shift;
+__DECL_VECTORIZED_LOOP
+	for(int px = 0; px < 8; px++) {
+		const uint8_t value = (uint8_t)(mixed.w[px]);
+		dst[px * 2]     = value;
+		dst[px * 2 + 1] = value;
+	}
+}
+
+// Writes 16 bytes to dst: for each of the eight table lanes selected by src, off_color when the
+// lane is 0 and on_color otherwise, stored twice in a row.
+inline void ConvertByteToMonochromeUint8Cond_Zoom2(uint8_t src, uint8_t* dst, _bit_trans_table_t* tbl, uint8_t on_color, uint8_t off_color)
+{
+	uint16_vec8_t *rows = (uint16_vec8_t*)__builtin_assume_aligned(&(tbl->plane_table[0]), sizeof(uint16_vec8_t));
+	__DECL_ALIGNED(16) uint16_vec8_t lanes;
+	__DECL_ALIGNED(16) uint8_t staged[16]; // aligned scratch, completely filled before dst is touched
+	lanes = rows[src];
+__DECL_VECTORIZED_LOOP
+	for(int lane = 0; lane < 8; lane++) {
+		const uint8_t value = (lanes.w[lane] == 0) ? off_color : on_color;
+		staged[lane * 2]     = value;
+		staged[lane * 2 + 1] = value;
+	}
+__DECL_VECTORIZED_LOOP
+	for(int n = 0; n < 16; n++) {
+		dst[n] = staged[n];
+	}
+}
+
+// Writes 8 bytes to dst: off_color where the table lane selected by src is 0, on_color otherwise.
+inline void ConvertByteToMonochromeUint8Cond(uint8_t src, uint8_t* dst, _bit_trans_table_t* tbl, uint8_t on_color, uint8_t off_color)
+{
+	uint16_vec8_t *rows = (uint16_vec8_t*)__builtin_assume_aligned(&(tbl->plane_table[0]), sizeof(uint16_vec8_t));
+	__DECL_ALIGNED(16) uint16_vec8_t lanes;
+	lanes = rows[src]; // local copy taken before dst is written
+__DECL_VECTORIZED_LOOP
+	for(int lane = 0; lane < 8; lane++) {
+		dst[lane] = (lanes.w[lane] != 0) ? on_color : off_color;
+	}
+}
+
+void DLL_PREFIX PrepareBitTransTableUint16(_bit_trans_table_t *tbl, uint16_t on_val, uint16_t off_val);
+void DLL_PREFIX PrepareBitTransTableScrnType(_bit_trans_table_scrn_t *tbl, scrntype_t on_val, scrntype_t off_val);
+void DLL_PREFIX PrepareReverseBitTransTableUint16(_bit_trans_table_t *tbl, uint16_t on_val, uint16_t off_val);
+void DLL_PREFIX PrepareReverseBitTransTableScrnType(_bit_trans_table_scrn_t *tbl, scrntype_t on_val, scrntype_t off_val);
+// Line-oriented routines that take a _render_command_data_t as `src`; they are only declared in this header.
+void DLL_PREFIX Render8Colors_Line(_render_command_data_t *src, scrntype_t *dst, scrntype_t *dst2, bool scan_line);
+
+void DLL_PREFIX Render16Colors_Line(_render_command_data_t *src, scrntype_t *dst, scrntype_t *dst2, bool scan_line);
+void DLL_PREFIX Render2NColors_Line(_render_command_data_t *src, scrntype_t *dst, scrntype_t* dst2, bool scan_line, int planes);
+// Variants taking a uint8_t destination instead of scrntype_t pixels.
+void DLL_PREFIX Convert8ColorsToByte_Line(_render_command_data_t *src, uint8_t *dst);
+void DLL_PREFIX Convert2NColorsToByte_Line(_render_command_data_t *src, uint8_t *dst, int planes);
+void DLL_PREFIX Convert2NColorsToByte_LineZoom2(_render_command_data_t *src, uint8_t *dst, int planes);
+
 inline uint64_t ExchangeEndianU64(uint64_t __in)
 {
 	pair64_t __i, __o;
-	__i.u64 = __in;
+	__i.q = __in;
 	__o.b.h7  = __i.b.l;
 	__o.b.h6  = __i.b.h;
 	__o.b.h5  = __i.b.h2;
@@ -1002,13 +1291,13 @@ inline uint64_t ExchangeEndianU64(uint64_t __in)
 	__o.b.h2  = __i.b.h5;
 	__o.b.h   = __i.b.h6;
 	__o.b.l   = __i.b.h7;
-	return __o.u64;
+	return __o.q;
 }
 
 inline int64_t ExchangeEndianS64(uint64_t __in)
 {
 	pair64_t __i, __o;
-	__i.u64 = __in;
+	__i.q = __in;
 	__o.b.h7  = __i.b.l;
 	__o.b.h6  = __i.b.h;
 	__o.b.h5  = __i.b.h2;
@@ -1017,11 +1306,11 @@ inline int64_t ExchangeEndianS64(uint64_t __in)
 	__o.b.h2  = __i.b.h5;
 	__o.b.h   = __i.b.h6;
 	__o.b.l   = __i.b.h7;
-	return __o.s64;
+	return __o.sq;
 }
 inline uint32_t ExchangeEndianU32(uint32_t __in)
 {
-	pair_t __i, __o;
+	pair32_t __i, __o;
 	__i.d = __in;
 	__o.b.h3 = __i.b.l;
 	__o.b.h2 = __i.b.h;
@@ -1032,7 +1321,7 @@ inline uint32_t ExchangeEndianU32(uint32_t __in)
 
 inline int32_t ExchangeEndianS32(uint32_t __in)
 {
-	pair_t __i, __o;
+	pair32_t __i, __o;
 	__i.d = __in;
 	__o.b.h3 = __i.b.l;
 	__o.b.h2 = __i.b.h;
@@ -1114,6 +1403,8 @@ void DLL_PREFIX create_local_path(_TCHAR *file_path, int length, const _TCHAR *f
 const _TCHAR *DLL_PREFIX create_date_file_path(const _TCHAR *extension);
 bool DLL_PREFIX is_absolute_path(const _TCHAR *file_path);
 void DLL_PREFIX create_date_file_path(_TCHAR *file_path, int length, const _TCHAR *extension);
+const _TCHAR *DLL_PREFIX create_date_file_name(const _TCHAR *extension);
+void DLL_PREFIX create_date_file_name(_TCHAR *file_path, int length, const _TCHAR *extension);
 bool DLL_PREFIX check_file_extension(const _TCHAR *file_path, const _TCHAR *ext);
 const _TCHAR *DLL_PREFIX get_file_path_without_extensiton(const _TCHAR *file_path);
 void DLL_PREFIX get_long_full_path_name(const _TCHAR* src, _TCHAR* dst, size_t dst_len);
@@ -1142,6 +1433,11 @@ uint16_t DLL_PREFIX jis_to_sjis(uint16_t jis);
 int DLL_PREFIX decibel_to_volume(int decibel);
 int32_t DLL_PREFIX apply_volume(int32_t sample, int volume);
 
+// High pass filter and Low pass filter.
+void DLL_PREFIX calc_high_pass_filter(int32_t* dst, int32_t* src, int sample_freq, int hpf_freq, int samples, double quality = 1.0, bool is_add = true);
+void DLL_PREFIX calc_low_pass_filter(int32_t* dst, int32_t* src, int sample_freq, int lpf_freq, int samples, double quality = 1.0, bool is_add = true);
+
+
 #define array_length(array) (sizeof(array) / sizeof(array[0]))
 
 #define FROM_BCD(v)	(((v) & 0x0f) + (((v) >> 4) & 0x0f) * 10)