diff foosdk/sdk/foobar2000/shared/utf8.cpp @ 1:20d02a178406 default tip

*: check in everything else yay
author Paper <paper@tflc.us>
date Mon, 05 Jan 2026 02:15:46 -0500
parents
children
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/foosdk/sdk/foobar2000/shared/utf8.cpp	Mon Jan 05 02:15:46 2026 -0500
@@ -0,0 +1,226 @@
+#include "shared.h"
+
+#include <locale.h>
+
+using namespace pfc;
+
+extern "C" {
+
+// ASCII-only lower-casing helper used by the fast paths of the comparison routines below.
+// Two interchangeable implementations are kept; the table-driven one is the active one.
+#if 0
+inline static unsigned q_tolower(unsigned c)
+{
+	if (c>='A' && c<='Z') c += 'a' - 'A';
+	return c;
+}
+#else
+// Identity mapping for 0x00..0x7F except that 'A'..'Z' (0x41..0x5A) map to 'a'..'z' (0x61..0x7A).
+// The table has exactly 128 entries: callers must only pass values in the range 0..127.
+static const t_uint8 ascii_tolower_table[128] = {0x00,0x01,0x02,0x03,0x04,0x05,0x06,0x07,0x08,0x09,0x0A,0x0B,0x0C,0x0D,0x0E,0x0F,0x10,0x11,0x12,0x13,0x14,0x15,0x16,0x17,0x18,0x19,0x1A,0x1B,0x1C,0x1D,0x1E,0x1F,0x20,0x21,0x22,0x23,0x24,0x25,0x26,0x27,0x28,0x29,0x2A,0x2B,0x2C,0x2D,0x2E,0x2F,0x30,0x31,0x32,0x33,0x34,0x35,0x36,0x37,0x38,0x39,0x3A,0x3B,0x3C,0x3D,0x3E,0x3F,0x40,0x61,0x62,0x63,0x64,0x65,0x66,0x67,0x68,0x69,0x6A,0x6B,0x6C,0x6D,0x6E,0x6F,0x70,0x71,0x72,0x73,0x74,0x75,0x76,0x77,0x78,0x79,0x7A,0x5B,0x5C,0x5D,0x5E,0x5F,0x60,0x61,0x62,0x63,0x64,0x65,0x66,0x67,0x68,0x69,0x6A,0x6B,0x6C,0x6D,0x6E,0x6F,0x70,0x71,0x72,0x73,0x74,0x75,0x76,0x77,0x78,0x79,0x7A,0x7B,0x7C,0x7D,0x7E,0x7F};
+// The argument and the whole expansion are parenthesized so that compound arguments
+// (e.g. q_tolower(a + b)) are cast and indexed as a unit.
+#define q_tolower(c) (ascii_tolower_table[(unsigned)(c)])
+#endif
+
+
+// Exported wrapper: returns the lower-case form of the character value `param`,
+// as computed by pfc::charLower().
+unsigned SHARED_EXPORT uCharLower(unsigned param)
+{
+	const unsigned lowered = pfc::charLower(param);
+	return lowered;
+}
+
+// Exported wrapper: returns the upper-case form of the character value `param`,
+// as computed by pfc::charUpper().
+unsigned SHARED_EXPORT uCharUpper(unsigned param)
+{
+	const unsigned raised = pfc::charUpper(param);
+	return raised;
+}
+
+// Case-insensitive three-way comparison of two character values.
+// Returns 0 when they are equal after pfc::charLower(), -1 when c1 orders first, 1 otherwise.
+static inline int compare_wchar(unsigned c1,unsigned c2) throw()
+{
+	// Identical inputs need no case folding at all.
+	if (c1 == c2) return 0;
+
+	const unsigned lhs = pfc::charLower(c1);
+	const unsigned rhs = pfc::charLower(c2);
+	if (lhs == rhs) return 0;
+	return (lhs < rhs) ? -1 : 1;
+}
+
+
+// Case-insensitive comparison of two nul-terminated UTF-8 strings.
+//
+// Returns 0 when the strings compare equal, -1 when p1 orders before p2 and 1 otherwise.
+// Pairs of ASCII bytes are folded through q_tolower(); anything else is decoded with
+// utf8_decode_char() and compared with compare_wchar(). A zero return from
+// utf8_decode_char() is treated as that string having ended at that position.
+int SHARED_EXPORT stricmp_utf8(const char * p1,const char * p2) throw()
+{
+	for(;;)
+	{
+		// Look at the current bytes as unsigned values: the ASCII test must not depend on
+		// whether plain char is signed, because q_tolower() only covers 0..127.
+		const unsigned char b1 = static_cast<unsigned char>(*p1);
+		const unsigned char b2 = static_cast<unsigned char>(*p2);
+		if (b1 < 0x80 && b2 < 0x80)
+		{
+			// Fast path: both bytes are ASCII (the nul terminator included).
+			const unsigned c1 = q_tolower(b1), c2 = q_tolower(b2);
+			if (c1<c2) return -1;
+			if (c1>c2) return 1;
+			if (c1 == 0) return 0; // equal and nul: both strings ended together
+			p1++;
+			p2++;
+		}
+		else
+		{
+			// Slow path: at least one side is at a non-ASCII byte.
+			unsigned w1,w2;
+			const t_size d1 = utf8_decode_char(p1,w1);
+			const t_size d2 = utf8_decode_char(p2,w2);
+			if (d1 == 0 && d2 == 0) return 0;
+			if (d1 == 0) return -1;
+			if (d2 == 0) return 1;
+			const int rv = compare_wchar(w1,w2);
+			if (rv) return rv;
+			p1 += d1;
+			p2 += d2;
+		}
+	}
+}
+
+// Case-insensitive comparison of the string p1 against the block p2 limited to p2_bytes bytes.
+// Thin forwarder to stricmp_utf8_ex(); same return convention.
+int SHARED_EXPORT stricmp_utf8_stringtoblock(const char * p1,const char * p2,t_size p2_bytes) throw()
+{
+	// -1 converted to t_size: no explicit limit for p1 (stricmp_utf8_ex clamps it with strlen_max).
+	const t_size p1_limit = static_cast<t_size>(-1);
+	return stricmp_utf8_ex(p1,p1_limit,p2,p2_bytes);
+}
+
+// Case-insensitive comparison of at most `num` decoded characters of p1 against p2.
+// Returns 0 as soon as p2 is exhausted (or stops decoding) or after `num` characters matched;
+// otherwise returns the first non-zero compare_wchar() result.
+int SHARED_EXPORT stricmp_utf8_partial(const char * p1,const char * p2,t_size num) throw()
+{
+	for (t_size remaining = num; remaining != 0; --remaining)
+	{
+		unsigned ch1, ch2;
+		const t_size step1 = utf8_decode_char(p1,ch1);
+		const t_size step2 = utf8_decode_char(p2,ch2);
+
+		// End of p2 counts as a match of everything compared so far.
+		if (ch2 == 0 || step2 == 0) return 0;
+
+		const int diff = compare_wchar(ch1,ch2);
+		if (diff != 0) return diff;
+
+		p1 += step1;
+		p2 += step2;
+	}
+	return 0;
+}
+
+// Case-insensitive comparison of the first p1_bytes bytes of p1 against the string p2.
+// Thin forwarder to stricmp_utf8_ex(); same return convention.
+int SHARED_EXPORT stricmp_utf8_max(const char * p1,const char * p2,t_size p1_bytes) throw()
+{
+	// -1 converted to t_size: no explicit limit for p2 (stricmp_utf8_ex clamps it with strlen_max).
+	const t_size p2_limit = static_cast<t_size>(-1);
+	return stricmp_utf8_ex(p1,p1_bytes,p2,p2_limit);
+}
+
+namespace {
+	// Matcher signature used by the replace routines: returns true when the `len` bytes
+	// at `src` match the `len` bytes at `test`.
+	typedef bool (*t_replace_test)(const char * src,const char * test,t_size len);
+
+	// Case-insensitive matcher.
+	// Both sides are bounded by `len`, so `test` does not need to be nul-terminated and is
+	// never read beyond the length the caller supplied.
+	static bool replace_test_i(const char * src,const char * test,t_size len)
+	{
+		return stricmp_utf8_ex(src,len,test,len)==0;
+	}
+
+	// Case-sensitive matcher: plain byte-wise equality over `len` bytes.
+	static bool replace_test(const char * src,const char * test,t_size len)
+	{
+		for(t_size ptr=0;ptr<len;ptr++)
+		{
+			if (src[ptr]!=test[ptr]) return false;
+		}
+		return true;
+	}
+}
+
+// Appends `src` to `out` with every occurrence of `s1` replaced by `s2`.
+//
+// out       - destination; text is appended, existing content is left alone.
+// src       - input text, limited to src_len bytes (clamped with strlen_max).
+// s1, len1  - pattern to search for (length clamped with strlen_max).
+// s2, len2  - replacement text (length clamped with strlen_max).
+// casesens  - true: byte-exact matching; false: case-insensitive matching.
+//
+// Returns the number of replacements made. An empty pattern matches nothing, so `src`
+// is appended unchanged and 0 is returned.
+t_size SHARED_EXPORT uReplaceStringAdd(string_base & out,const char * src,t_size src_len,const char * s1,t_size len1,const char * s2,t_size len2,bool casesens)
+{
+	const t_replace_test testfunc = casesens ? replace_test : replace_test_i;
+
+	len1 = strlen_max(s1,len1); len2 = strlen_max(s2,len2);
+
+	const t_size len = strlen_max(src,src_len);
+
+	if (len1 == 0)
+	{
+		// Nothing to search for: pass the input through instead of dropping it.
+		out.add_string(src,len);
+		return 0;
+	}
+
+	t_size count = 0;
+	t_size ptr = 0;
+	// Only positions where a full pattern still fits can match.
+	while(ptr+len1<=len)
+	{
+		if (testfunc(src+ptr,s1,len1))
+		{
+			count++;
+			out.add_string(s2,len2);
+			ptr += len1;
+		}
+		else out.add_byte(src[ptr++]);
+	}
+	// Copy the tail that is too short to contain the pattern.
+	if (ptr<len) out.add_string(src+ptr,len-ptr);
+	return count;
+}
+
+// Appends `src` to `out` with every occurrence of character c1 replaced by character c2.
+//
+// Both characters are encoded with utf8_encode_char() and the work is delegated to
+// uReplaceStringAdd(), so `out` is appended to like in that function.
+// Returns the replacement count reported by uReplaceStringAdd().
+//
+// NOTE(review): this previously forwarded to uReplaceString, which is not defined in this
+// file; if that helper clears `out` first, callers saw replace-instead-of-append. Confirm.
+t_size SHARED_EXPORT uReplaceCharAdd(string_base & out,const char * src,t_size src_len,unsigned c1,unsigned c2,bool casesens)
+{
+	assert(c1>0);
+	assert(c2>0);
+	// Zero-filled so the encoded bytes are always followed by a terminator and no
+	// uninitialised stack bytes can be read by a callee that scans for one.
+	// Assumes utf8_encode_char writes fewer than 8 bytes - TODO confirm.
+	char s1[8] = {}, s2[8] = {};
+	const t_size len1 = utf8_encode_char(c1,s1);
+	const t_size len2 = utf8_encode_char(c2,s2);
+	return uReplaceStringAdd(out,src,src_len,s1,len1,s2,len2,casesens);
+}
+
+
+// Appends the lower-cased form of `src` to `out`, one decoded character at a time.
+// Processing stops at the first nul byte, after `len` bytes, or when utf8_decode_char()
+// reports 0 or more bytes than remain.
+void SHARED_EXPORT uAddStringLower(string_base & out,const char * src,t_size len)
+{
+	for (t_size remaining = len; remaining != 0 && *src != 0; )
+	{
+		unsigned decoded;
+		const t_size consumed = utf8_decode_char(src,decoded,remaining);
+		if (consumed == 0 || consumed > remaining) return;
+
+		out.add_char(uCharLower(decoded));
+		src += consumed;
+		remaining -= consumed;
+	}
+}
+
+// Appends the upper-cased form of `src` to `out`, one decoded character at a time.
+// Processing stops at the first nul byte, after `len` bytes, or when utf8_decode_char()
+// reports 0 or more bytes than remain.
+void SHARED_EXPORT uAddStringUpper(string_base & out,const char * src,t_size len)
+{
+	for (t_size remaining = len; remaining != 0 && *src != 0; )
+	{
+		unsigned decoded;
+		const t_size consumed = utf8_decode_char(src,decoded,remaining);
+		if (consumed == 0 || consumed > remaining) return;
+
+		out.add_char(uCharUpper(decoded));
+		src += consumed;
+		remaining -= consumed;
+	}
+}
+
+// Case-insensitive comparison of two length-limited UTF-8 strings.
+//
+// p1, p1_bytes - first string and its byte limit (clamped with strlen_max).
+// p2, p2_bytes - second string and its byte limit (clamped with strlen_max).
+//
+// Returns 0 when equal, -1 when p1 orders before p2 (including when p1 is a proper prefix
+// of p2) and 1 otherwise. When only one side fails to decode, that side orders first.
+// When both sides fail to decode at the same position their raw bytes are compared, so a
+// string always compares equal to itself and swapping the arguments flips the sign.
+int SHARED_EXPORT stricmp_utf8_ex(const char * p1,t_size p1_bytes,const char * p2,t_size p2_bytes) throw()
+{
+	p1_bytes = strlen_max(p1,p1_bytes);
+	p2_bytes = strlen_max(p2,p2_bytes);
+	for(;;)
+	{
+		if (p1_bytes == 0 && p2_bytes == 0) return 0;
+		if (p1_bytes == 0) return -1;
+		if (p2_bytes == 0) return 1;
+
+		// Look at the current bytes as unsigned values: the ASCII test must not depend on
+		// whether plain char is signed, because q_tolower() only covers 0..127.
+		const unsigned char b1 = static_cast<unsigned char>(*p1);
+		const unsigned char b2 = static_cast<unsigned char>(*p2);
+		if (b1 > 0 && b1 < 0x80 && b2 > 0 && b2 < 0x80)
+		{
+			// Fast path: both bytes are non-nul ASCII.
+			const unsigned c1 = q_tolower(b1), c2 = q_tolower(b2);
+			if (c1<c2) return -1;
+			if (c1>c2) return 1;
+			p1++;
+			p2++;
+			p1_bytes--;
+			p2_bytes--;
+		}
+		else
+		{
+			unsigned w1,w2;
+			const auto d1 = utf8_decode_char(p1,w1,p1_bytes);
+			const auto d2 = utf8_decode_char(p2,w2,p2_bytes);
+			if (d1==0 && d2==0)
+			{
+				// Neither side decodes here: order by raw byte and step over it.
+				if (b1 != b2) return (b1 < b2) ? -1 : 1;
+				p1++;
+				p2++;
+				p1_bytes--;
+				p2_bytes--;
+				continue;
+			}
+			if (d1==0) return -1;
+			if (d2==0) return 1;
+			const int rv = compare_wchar(w1,w2);
+			if (rv) return rv;
+			p1 += d1;
+			p2 += d2;
+			p1_bytes -= d1;
+			p2_bytes -= d2;
+		}
+	}
+}
+
+}