BF-admins agree to remove header information that isn't useful, to reduce noise. - BEGIN/END license blocks Developers should add non license comments as separate comment blocks. No need for separator text. - Contributors This is often invalid, outdated or misleading especially when splitting files. It's more useful to git-blame to find out who has developed the code. See P901 for script to perform these edits.
		
			
				
	
	
		
			310 lines
		
	
	
		
			7.5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			310 lines
		
	
	
		
			7.5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
/*
 | 
						|
 * This program is free software; you can redistribute it and/or
 | 
						|
 * modify it under the terms of the GNU General Public License
 | 
						|
 * as published by the Free Software Foundation; either version 2
 | 
						|
 * of the License, or (at your option) any later version.
 | 
						|
 *
 | 
						|
 * This program is distributed in the hope that it will be useful,
 | 
						|
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
						|
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
						|
 * GNU General Public License for more details.
 | 
						|
 *
 | 
						|
 * You should have received a copy of the GNU General Public License
 | 
						|
 * along with this program; if not, write to the Free Software Foundation,
 | 
						|
 * Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
 | 
						|
 *
 | 
						|
 * The Original Code is Copyright (C) 2011 Blender Foundation.
 | 
						|
 * All rights reserved.
 | 
						|
 */
 | 
						|
 | 
						|
/** \file blender/blenlib/intern/string_cursor_utf8.c
 | 
						|
 *  \ingroup bli
 | 
						|
 */
 | 
						|
 | 
						|
#include <stdio.h>
 | 
						|
#include <stdlib.h>
 | 
						|
 | 
						|
#include "BLI_utildefines.h"
 | 
						|
#include "BLI_string_utf8.h"
 | 
						|
 | 
						|
#include "BLI_string_cursor_utf8.h" /* own include */
 | 
						|
 | 
						|
#ifdef __GNUC__
 | 
						|
#  pragma GCC diagnostic error "-Wsign-conversion"
 | 
						|
#endif
 | 
						|
 | 
						|
typedef enum eStrCursorDelimType {
 | 
						|
	STRCUR_DELIM_NONE,
 | 
						|
	STRCUR_DELIM_ALPHANUMERIC,
 | 
						|
	STRCUR_DELIM_PUNCT,
 | 
						|
	STRCUR_DELIM_BRACE,
 | 
						|
	STRCUR_DELIM_OPERATOR,
 | 
						|
	STRCUR_DELIM_QUOTE,
 | 
						|
	STRCUR_DELIM_WHITESPACE,
 | 
						|
	STRCUR_DELIM_OTHER
 | 
						|
} eStrCursorDelimType;
 | 
						|
 | 
						|
static eStrCursorDelimType cursor_delim_type_unicode(const uint uch)
 | 
						|
{
 | 
						|
	switch (uch) {
 | 
						|
		case ',':
 | 
						|
		case '.':
 | 
						|
			return STRCUR_DELIM_PUNCT;
 | 
						|
 | 
						|
		case '{':
 | 
						|
		case '}':
 | 
						|
		case '[':
 | 
						|
		case ']':
 | 
						|
		case '(':
 | 
						|
		case ')':
 | 
						|
			return STRCUR_DELIM_BRACE;
 | 
						|
 | 
						|
		case '+':
 | 
						|
		case '-':
 | 
						|
		case '=':
 | 
						|
		case '~':
 | 
						|
		case '%':
 | 
						|
		case '/':
 | 
						|
		case '<':
 | 
						|
		case '>':
 | 
						|
		case '^':
 | 
						|
		case '*':
 | 
						|
		case '&':
 | 
						|
		case '|':
 | 
						|
			return STRCUR_DELIM_OPERATOR;
 | 
						|
 | 
						|
		case '\'':
 | 
						|
		case '\"':
 | 
						|
			return STRCUR_DELIM_QUOTE;
 | 
						|
 | 
						|
		case ' ':
 | 
						|
		case '\t':
 | 
						|
		case '\n':
 | 
						|
			return STRCUR_DELIM_WHITESPACE;
 | 
						|
 | 
						|
		case '\\':
 | 
						|
		case '@':
 | 
						|
		case '#':
 | 
						|
		case '$':
 | 
						|
		case ':':
 | 
						|
		case ';':
 | 
						|
		case '?':
 | 
						|
		case '!':
 | 
						|
		case 0xA3:  /* pound */
 | 
						|
		case 0x80:  /* euro */
 | 
						|
			/* case '_': *//* special case, for python */
 | 
						|
			return STRCUR_DELIM_OTHER;
 | 
						|
 | 
						|
		default:
 | 
						|
			break;
 | 
						|
	}
 | 
						|
	return STRCUR_DELIM_ALPHANUMERIC; /* Not quite true, but ok for now */
 | 
						|
}
 | 
						|
 | 
						|
static eStrCursorDelimType cursor_delim_type_utf8(const char *ch_utf8)
 | 
						|
{
 | 
						|
	/* for full unicode support we really need to have large lookup tables to figure
 | 
						|
	 * out whats what in every possible char set - and python, glib both have these. */
 | 
						|
	uint uch = BLI_str_utf8_as_unicode(ch_utf8);
 | 
						|
	return cursor_delim_type_unicode(uch);
 | 
						|
}
 | 
						|
 | 
						|
bool BLI_str_cursor_step_next_utf8(const char *str, size_t maxlen, int *pos)
 | 
						|
{
 | 
						|
	const char *str_end = str + (maxlen + 1);
 | 
						|
	const char *str_pos = str + (*pos);
 | 
						|
	const char *str_next = BLI_str_find_next_char_utf8(str_pos, str_end);
 | 
						|
	if (str_next) {
 | 
						|
		(*pos) += (str_next - str_pos);
 | 
						|
		if ((*pos) > (int)maxlen) {
 | 
						|
			(*pos) = (int)maxlen;
 | 
						|
		}
 | 
						|
		return true;
 | 
						|
	}
 | 
						|
 | 
						|
	return false;
 | 
						|
}
 | 
						|
 | 
						|
bool BLI_str_cursor_step_prev_utf8(const char *str, size_t UNUSED(maxlen), int *pos)
 | 
						|
{
 | 
						|
	if ((*pos) > 0) {
 | 
						|
		const char *str_pos = str + (*pos);
 | 
						|
		const char *str_prev = BLI_str_find_prev_char_utf8(str, str_pos);
 | 
						|
		if (str_prev) {
 | 
						|
			(*pos) -= (str_pos - str_prev);
 | 
						|
			return true;
 | 
						|
		}
 | 
						|
	}
 | 
						|
 | 
						|
	return false;
 | 
						|
}
 | 
						|
 | 
						|
void BLI_str_cursor_step_utf8(
 | 
						|
        const char *str, size_t maxlen,
 | 
						|
        int *pos, eStrCursorJumpDirection direction,
 | 
						|
        eStrCursorJumpType jump, bool use_init_step)
 | 
						|
{
 | 
						|
	const int pos_orig = *pos;
 | 
						|
 | 
						|
	if (direction == STRCUR_DIR_NEXT) {
 | 
						|
		if (use_init_step) {
 | 
						|
			BLI_str_cursor_step_next_utf8(str, maxlen, pos);
 | 
						|
		}
 | 
						|
		else {
 | 
						|
			BLI_assert(jump == STRCUR_JUMP_DELIM);
 | 
						|
		}
 | 
						|
 | 
						|
		if (jump != STRCUR_JUMP_NONE) {
 | 
						|
			const eStrCursorDelimType delim_type =
 | 
						|
			        (*pos) < maxlen ? cursor_delim_type_utf8(&str[*pos]) : STRCUR_DELIM_NONE;
 | 
						|
			/* jump between special characters (/,\,_,-, etc.),
 | 
						|
			 * look at function cursor_delim_type() for complete
 | 
						|
			 * list of special character, ctr -> */
 | 
						|
			while ((*pos) < maxlen) {
 | 
						|
				if (BLI_str_cursor_step_next_utf8(str, maxlen, pos)) {
 | 
						|
					if ((jump != STRCUR_JUMP_ALL) &&
 | 
						|
					    (delim_type != cursor_delim_type_utf8(&str[*pos])))
 | 
						|
					{
 | 
						|
						break;
 | 
						|
					}
 | 
						|
				}
 | 
						|
				else {
 | 
						|
					break; /* unlikely but just in case */
 | 
						|
				}
 | 
						|
			}
 | 
						|
		}
 | 
						|
	}
 | 
						|
	else if (direction == STRCUR_DIR_PREV) {
 | 
						|
		if (use_init_step) {
 | 
						|
			BLI_str_cursor_step_prev_utf8(str, maxlen, pos);
 | 
						|
		}
 | 
						|
		else {
 | 
						|
			BLI_assert(jump == STRCUR_JUMP_DELIM);
 | 
						|
		}
 | 
						|
 | 
						|
		if (jump != STRCUR_JUMP_NONE) {
 | 
						|
			const eStrCursorDelimType delim_type =
 | 
						|
			        (*pos) > 0 ? cursor_delim_type_utf8(&str[(*pos) - 1]) : STRCUR_DELIM_NONE;
 | 
						|
			/* jump between special characters (/,\,_,-, etc.),
 | 
						|
			 * look at function cursor_delim_type() for complete
 | 
						|
			 * list of special character, ctr -> */
 | 
						|
			while ((*pos) > 0) {
 | 
						|
				const int pos_prev = *pos;
 | 
						|
				if (BLI_str_cursor_step_prev_utf8(str, maxlen, pos)) {
 | 
						|
					if ((jump != STRCUR_JUMP_ALL) &&
 | 
						|
					    (delim_type != cursor_delim_type_utf8(&str[*pos])))
 | 
						|
					{
 | 
						|
						/* left only: compensate for index/change in direction */
 | 
						|
						if ((pos_orig - (*pos)) >= 1) {
 | 
						|
							*pos = pos_prev;
 | 
						|
						}
 | 
						|
						break;
 | 
						|
					}
 | 
						|
				}
 | 
						|
				else {
 | 
						|
					break;
 | 
						|
				}
 | 
						|
			}
 | 
						|
		}
 | 
						|
	}
 | 
						|
	else {
 | 
						|
		BLI_assert(0);
 | 
						|
	}
 | 
						|
}
 | 
						|
 | 
						|
/* wchar_t version of BLI_str_cursor_step_utf8 (keep in sync!)
 | 
						|
 * less complex since it doesn't need to do multi-byte stepping.
 | 
						|
 */
 | 
						|
 | 
						|
/* helper funcs so we can match BLI_str_cursor_step_utf8 */
 | 
						|
static bool wchar_t_step_next(const wchar_t *UNUSED(str), size_t maxlen, int *pos)
 | 
						|
{
 | 
						|
	if ((*pos) >= (int)maxlen) {
 | 
						|
		return false;
 | 
						|
	}
 | 
						|
	(*pos)++;
 | 
						|
	return true;
 | 
						|
}
 | 
						|
 | 
						|
static bool wchar_t_step_prev(const wchar_t *UNUSED(str), size_t UNUSED(maxlen), int *pos)
 | 
						|
{
 | 
						|
	if ((*pos) <= 0) {
 | 
						|
		return false;
 | 
						|
	}
 | 
						|
	(*pos)--;
 | 
						|
	return true;
 | 
						|
}
 | 
						|
 | 
						|
void BLI_str_cursor_step_wchar(
 | 
						|
        const wchar_t *str, size_t maxlen,
 | 
						|
        int *pos, eStrCursorJumpDirection direction,
 | 
						|
        eStrCursorJumpType jump, bool use_init_step)
 | 
						|
{
 | 
						|
	const int pos_orig = *pos;
 | 
						|
 | 
						|
	if (direction == STRCUR_DIR_NEXT) {
 | 
						|
		if (use_init_step) {
 | 
						|
			wchar_t_step_next(str, maxlen, pos);
 | 
						|
		}
 | 
						|
		else {
 | 
						|
			BLI_assert(jump == STRCUR_JUMP_DELIM);
 | 
						|
		}
 | 
						|
 | 
						|
		if (jump != STRCUR_JUMP_NONE) {
 | 
						|
			const eStrCursorDelimType delim_type =
 | 
						|
			        (*pos) < maxlen ? cursor_delim_type_unicode((uint)str[*pos]) : STRCUR_DELIM_NONE;
 | 
						|
			/* jump between special characters (/,\,_,-, etc.),
 | 
						|
			 * look at function cursor_delim_type_unicode() for complete
 | 
						|
			 * list of special character, ctr -> */
 | 
						|
			while ((*pos) < maxlen) {
 | 
						|
				if (wchar_t_step_next(str, maxlen, pos)) {
 | 
						|
					if ((jump != STRCUR_JUMP_ALL) &&
 | 
						|
					    (delim_type != cursor_delim_type_unicode((uint)str[*pos])))
 | 
						|
					{
 | 
						|
						break;
 | 
						|
					}
 | 
						|
				}
 | 
						|
				else {
 | 
						|
					break; /* unlikely but just in case */
 | 
						|
				}
 | 
						|
			}
 | 
						|
		}
 | 
						|
	}
 | 
						|
	else if (direction == STRCUR_DIR_PREV) {
 | 
						|
		if (use_init_step) {
 | 
						|
			wchar_t_step_prev(str, maxlen, pos);
 | 
						|
		}
 | 
						|
		else {
 | 
						|
			BLI_assert(jump == STRCUR_JUMP_DELIM);
 | 
						|
		}
 | 
						|
 | 
						|
		if (jump != STRCUR_JUMP_NONE) {
 | 
						|
			const eStrCursorDelimType delim_type =
 | 
						|
			        (*pos) > 0 ? cursor_delim_type_unicode((uint)str[(*pos) - 1]) : STRCUR_DELIM_NONE;
 | 
						|
			/* jump between special characters (/,\,_,-, etc.),
 | 
						|
			 * look at function cursor_delim_type() for complete
 | 
						|
			 * list of special character, ctr -> */
 | 
						|
			while ((*pos) > 0) {
 | 
						|
				const int pos_prev = *pos;
 | 
						|
				if (wchar_t_step_prev(str, maxlen, pos)) {
 | 
						|
					if ((jump != STRCUR_JUMP_ALL) &&
 | 
						|
					    (delim_type != cursor_delim_type_unicode((uint)str[*pos])))
 | 
						|
					{
 | 
						|
						/* left only: compensate for index/change in direction */
 | 
						|
						if ((pos_orig - (*pos)) >= 1) {
 | 
						|
							*pos = pos_prev;
 | 
						|
						}
 | 
						|
						break;
 | 
						|
					}
 | 
						|
				}
 | 
						|
				else {
 | 
						|
					break;
 | 
						|
				}
 | 
						|
			}
 | 
						|
		}
 | 
						|
	}
 | 
						|
	else {
 | 
						|
		BLI_assert(0);
 | 
						|
	}
 | 
						|
}
 |