mirror of
				https://github.com/OpenMW/openmw.git
				synced 2025-10-25 19:56:37 +00:00 
			
		
		
		
	This patch is in relation to commit 25fa8165f97 (Use char literals in UTF 8 conversion to fix 798 warnings), which changed the UTF 8 table to have char integer values instead of unsigned chars. Those values were converted using a custom Python script. This patch changes the original table generator so it can now output the same format.
		
			
				
	
	
		
			116 lines
		
	
	
	
		
			3 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			116 lines
		
	
	
	
		
			3 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| // This program generates the file tables_gen.hpp
 | |
| 
 | |
| #include <iostream>
 | |
| using namespace std;
 | |
| 
 | |
| #include <iconv.h>
 | |
| #include <cassert>
 | |
| 
 | |
| void tab() { cout << "   "; }
 | |
| 
 | |
| // write one number with a space in front of it and a comma after it
 | |
| void num(char i, bool last)
 | |
| {
 | |
|   // Convert i to its integer value, i.e. -128 to 127. Printing it directly
 | |
|   // would result in non-printable characters in the source code, which is bad.
 | |
|   cout << " " << static_cast<int>(i);
 | |
|   if(!last) cout << ",";
 | |
| }
 | |
| 
 | |
| // Write one table entry (UTF8 value), 1-5 bytes
 | |
| void writeChar(char *value, int length, bool last, const std::string &comment="")
 | |
| {
 | |
|   assert(length >= 1 && length <= 5);
 | |
|   tab();
 | |
|   num(length, false);
 | |
|   for(int i=0;i<5;i++)
 | |
|     num(value[i], last && i==4);
 | |
| 
 | |
|   if(comment != "")
 | |
|     cout << " // " << comment;
 | |
| 
 | |
|   cout << endl;
 | |
| }
 | |
| 
 | |
| // What to write on missing characters
 | |
| void writeMissing(bool last)
 | |
| {
 | |
|   // Just write a space character
 | |
|   char value[5];
 | |
|   value[0] = ' ';
 | |
|   for(int i=1; i<5; i++)
 | |
|     value[i] = 0;
 | |
|   writeChar(value, 1, last, "not part of this charset");
 | |
| }
 | |
| 
 | |
| int write_table(const std::string &charset, const std::string &tableName)
 | |
| {
 | |
|   // Write table header
 | |
|   cout << "static char " << tableName << "[] =\n{\n";
 | |
| 
 | |
|   // Open conversion system
 | |
|   iconv_t cd = iconv_open ("UTF-8", charset.c_str());
 | |
| 
 | |
|   // Convert each character from 0 to 255
 | |
|   for(int i=0; i<256; i++)
 | |
|     {
 | |
|       bool last = (i==255);
 | |
| 
 | |
|       char input = i;
 | |
|       char *iptr = &input;
 | |
|       size_t ileft = 1;
 | |
| 
 | |
|       char output[5];
 | |
|       for(int k=0; k<5; k++) output[k] = 0;
 | |
|       char *optr = output;
 | |
|       size_t oleft = 5;
 | |
| 
 | |
|       size_t res = iconv(cd, &iptr, &ileft, &optr, &oleft);
 | |
| 
 | |
|       if(res) writeMissing(last);
 | |
|       else writeChar(output, 5-oleft, last);
 | |
|     }
 | |
| 
 | |
|   iconv_close (cd);
 | |
| 
 | |
|   // Finish table
 | |
|   cout << "};\n";
 | |
| 
 | |
|   return 0;
 | |
| }
 | |
| 
 | |
| int main()
 | |
| {
 | |
|   // Write header guard
 | |
|   cout << "#ifndef COMPONENTS_TOUTF8_TABLE_GEN_H\n#define COMPONENTS_TOUTF8_TABLE_GEN_H\n\n";
 | |
| 
 | |
|   // Write namespace
 | |
|   cout << "namespace ToUTF8\n{\n\n";
 | |
| 
 | |
|   // Central European and Eastern European languages that use Latin script, such as
 | |
|   // Polish, Czech, Slovak, Hungarian, Slovene, Bosnian, Croatian, Serbian (Latin script), Romanian and Albanian.
 | |
|   cout << "\n/// Central European and Eastern European languages that use Latin script,"
 | |
|           "\n/// such as Polish, Czech, Slovak, Hungarian, Slovene, Bosnian, Croatian,"
 | |
|           "\n/// Serbian (Latin script), Romanian and Albanian."
 | |
|           "\n";
 | |
|   write_table("WINDOWS-1250", "windows_1250");
 | |
| 
 | |
|   // Cyrillic alphabet such as Russian, Bulgarian, Serbian Cyrillic and other languages
 | |
|   cout << "\n/// Cyrillic alphabet such as Russian, Bulgarian, Serbian Cyrillic"
 | |
|           "\n/// and other languages"
 | |
|           "\n";
 | |
|   write_table("WINDOWS-1251", "windows_1251");
 | |
| 
 | |
|   // English
 | |
|   cout << "\n/// Latin alphabet used by English and some other Western languages"
 | |
|           "\n";
 | |
|   write_table("WINDOWS-1252", "windows_1252");
 | |
| 
 | |
|   // Close namespace
 | |
|   cout << "\n}\n\n";
 | |
| 
 | |
|   // Close header guard
 | |
|   cout << "#endif\n\n";
 | |
| 
 | |
|   return 0;
 | |
| }
 |