mirror of
				https://github.com/Atmosphere-NX/Atmosphere.git
				synced 2025-10-25 01:35:51 +02:00 
			
		
		
		
	
		
			
				
	
	
		
			155 lines
		
	
	
		
			6.5 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			155 lines
		
	
	
		
			6.5 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /*
 | |
|  * Copyright (c) 2018-2020 Atmosphère-NX
 | |
|  *
 | |
|  * This program is free software; you can redistribute it and/or modify it
 | |
|  * under the terms and conditions of the GNU General Public License,
 | |
|  * version 2, as published by the Free Software Foundation.
 | |
|  *
 | |
|  * This program is distributed in the hope it will be useful, but WITHOUT
 | |
|  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 | |
|  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 | |
|  * more details.
 | |
|  *
 | |
|  * You should have received a copy of the GNU General Public License
 | |
|  * along with this program.  If not, see <http://www.gnu.org/licenses/>.
 | |
|  */
 | |
| #include <vapours.hpp>
 | |
| 
 | |
| namespace ams::util {
 | |
| 
 | |
|     namespace {
 | |
| 
 | |
|         constexpr inline int8_t Utf8NBytesInnerTable[0x100 + 1] = {
 | |
|             -1,
 | |
|             1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
 | |
|             1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
 | |
|             1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
 | |
|             1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
 | |
|             1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
 | |
|             1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
 | |
|             1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
 | |
|             1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
 | |
|             0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
 | |
|             0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
 | |
|             0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
 | |
|             0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
 | |
|             2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
 | |
|             2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
 | |
|             3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3,
 | |
|             4, 4, 4, 4, 4, 4, 4, 4, 5, 5, 5, 5, 6, 6, 7, 8,
 | |
|         };
 | |
| 
 | |
|         constexpr inline const char * const Utf8NBytesTable = static_cast<const char *>(static_cast<const void *>(Utf8NBytesInnerTable + 1));
 | |
| 
 | |
|     }
 | |
| 
 | |
|     CharacterEncodingResult ConvertCharacterUtf8ToUtf32(u32 *dst, const char *src) {
 | |
|         /* Check pre-conditions. */
 | |
|         AMS_ASSERT(dst != nullptr);
 | |
|         AMS_ASSERT(src != nullptr);
 | |
| 
 | |
|         /* Perform the conversion. */
 | |
|         const unsigned char *p = reinterpret_cast<const unsigned char *>(src);
 | |
|         switch (Utf8NBytesTable[p[0]]) {
 | |
|             case 1:
 | |
|                 *dst = static_cast<u32>(p[0]);
 | |
|                 return CharacterEncodingResult_Success;
 | |
|             case 2:
 | |
|                 if ((p[0] & 0x1E) != 0) {
 | |
|                     if (Utf8NBytesTable[p[1]] == 0) {
 | |
|                         *dst = (static_cast<uint32_t>(p[0] & 0x1F) << 6) | (static_cast<uint32_t>(p[1] & 0x3F) << 0);
 | |
|                         return CharacterEncodingResult_Success;
 | |
|                     }
 | |
|                 }
 | |
|                 break;
 | |
|             case 3:
 | |
|                 if (Utf8NBytesTable[p[1]] == 0 && Utf8NBytesTable[p[2]] == 0) {
 | |
|                     const u32 c = (static_cast<uint32_t>(p[0] & 0xF) << 12) | (static_cast<uint32_t>(p[1] & 0x3F) << 6) | (static_cast<uint32_t>(p[2] & 0x3F) << 0);
 | |
|                     if ((c & 0xF800) != 0 && (c & 0xF800) != 0xD800) {
 | |
|                         *dst = c;
 | |
|                         return CharacterEncodingResult_Success;
 | |
|                     }
 | |
|                 }
 | |
|                 return CharacterEncodingResult_InvalidFormat;
 | |
|             case 4:
 | |
|                 if (Utf8NBytesTable[p[1]] == 0 && Utf8NBytesTable[p[2]] == 0 && Utf8NBytesTable[p[3]] == 0) {
 | |
|                     const u32 c = (static_cast<uint32_t>(p[0] & 0x7) << 18) | (static_cast<uint32_t>(p[1] & 0x3F) << 12) | (static_cast<uint32_t>(p[2] & 0x3F) << 6) | (static_cast<uint32_t>(p[3] & 0x3F) << 0);
 | |
|                     if (c >= 0x10000 && c < 0x110000) {
 | |
|                         *dst = c;
 | |
|                         return CharacterEncodingResult_Success;
 | |
|                     }
 | |
|                 }
 | |
|                 return CharacterEncodingResult_InvalidFormat;
 | |
|             default:
 | |
|                 break;
 | |
|         }
 | |
| 
 | |
|         /* We failed to convert. */
 | |
|         return CharacterEncodingResult_InvalidFormat;
 | |
|     }
 | |
| 
 | |
|     CharacterEncodingResult PickOutCharacterFromUtf8String(char *dst, const char **str) {
 | |
|         /* Check pre-conditions. */
 | |
|         AMS_ASSERT(dst != nullptr);
 | |
|         AMS_ASSERT(str != nullptr);
 | |
|         AMS_ASSERT(*str != nullptr);
 | |
| 
 | |
|         /* Clear the output. */
 | |
|         dst[0] = 0;
 | |
|         dst[1] = 0;
 | |
|         dst[2] = 0;
 | |
|         dst[3] = 0;
 | |
| 
 | |
|         /* Perform the conversion. */
 | |
|         const unsigned char *p = reinterpret_cast<const unsigned char *>(*str);
 | |
|         u32 c = *p;
 | |
|         switch (Utf8NBytesTable[c]) {
 | |
|             case 1:
 | |
|                 dst[0] = (*str)[0];
 | |
|                 ++(*str);
 | |
|                 break;
 | |
|             case 2:
 | |
|                 if ((p[0] & 0x1E) != 0) {
 | |
|                     if (Utf8NBytesTable[p[1]] == 0) {
 | |
|                         c = (static_cast<uint32_t>(p[0] & 0x1F) << 6) | (static_cast<uint32_t>(p[1] & 0x3F) << 0);
 | |
|                         dst[0] = (*str)[0];
 | |
|                         dst[1] = (*str)[1];
 | |
|                         (*str) += 2;
 | |
|                         break;
 | |
|                     }
 | |
|                 }
 | |
|                 return CharacterEncodingResult_InvalidFormat;
 | |
|             case 3:
 | |
|                 if (Utf8NBytesTable[p[1]] == 0 && Utf8NBytesTable[p[2]] == 0) {
 | |
|                     c = (static_cast<uint32_t>(p[0] & 0xF) << 12) | (static_cast<uint32_t>(p[1] & 0x3F) << 6) | (static_cast<uint32_t>(p[2] & 0x3F) << 0);
 | |
|                     if ((c & 0xF800) != 0 && (c & 0xF800) != 0xD800) {
 | |
|                         dst[0] = (*str)[0];
 | |
|                         dst[1] = (*str)[1];
 | |
|                         dst[2] = (*str)[2];
 | |
|                         (*str) += 3;
 | |
|                         break;
 | |
|                     }
 | |
|                 }
 | |
|                 return CharacterEncodingResult_InvalidFormat;
 | |
|             case 4:
 | |
|                 if (Utf8NBytesTable[p[1]] == 0 && Utf8NBytesTable[p[2]] == 0 && Utf8NBytesTable[p[3]] == 0) {
 | |
|                     c = (static_cast<uint32_t>(p[0] & 0x7) << 18) | (static_cast<uint32_t>(p[1] & 0x3F) << 12) | (static_cast<uint32_t>(p[2] & 0x3F) << 6) | (static_cast<uint32_t>(p[3] & 0x3F) << 0);
 | |
|                     if (c >= 0x10000 && c < 0x110000) {
 | |
|                         dst[0] = (*str)[0];
 | |
|                         dst[1] = (*str)[1];
 | |
|                         dst[2] = (*str)[2];
 | |
|                         dst[3] = (*str)[3];
 | |
|                         (*str) += 4;
 | |
|                         break;
 | |
|                     }
 | |
|                 }
 | |
|                 return CharacterEncodingResult_InvalidFormat;
 | |
|             default:
 | |
|                 return CharacterEncodingResult_InvalidFormat;
 | |
|         }
 | |
| 
 | |
|         return CharacterEncodingResult_Success;
 | |
|     }
 | |
| 
 | |
| }
 |