mirror of
https://github.com/fish-shell/fish-shell
synced 2024-12-28 22:03:12 +00:00
8f420b9272
This makes the wide char tests run by `./fish_tests` pass on systems where sizeof wchar_t is two (e.g., Cygwin). In doing so it corrects several problems with the underlying code in module *utf8.cpp* such as allowing five and six byte UTF-8 sequences. They were allowed by the original Unicode proposal but are not allowed by the adopted standard.
36 lines
1.5 KiB
C++
36 lines
1.5 KiB
C++
/*
|
|
* Copyright (c) 2007 Alexey Vatchenko <av@bsdua.org>
|
|
*
|
|
* Permission to use, copy, modify, and/or distribute this software for any
|
|
* purpose with or without fee is hereby granted, provided that the above
|
|
* copyright notice and this permission notice appear in all copies.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
|
|
* WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
|
|
* MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
|
|
* ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
|
|
* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
|
|
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
|
|
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
|
|
*/
|
|
|
|
// Implementation of UTF-8 charset encoding (RFC3629).
|
|
#ifndef _UTF8_H_
|
|
#define _UTF8_H_
|
|
|
|
#include <stddef.h>
|
|
#include <string>
|
|
|
|
#define UTF8_IGNORE_ERROR 0x01
|
|
#define UTF8_SKIP_BOM 0x02
|
|
|
|
/// Convert a string between UTF8 and UCS-2/4 (depending on size of wchar_t). Returns true if
|
|
/// successful, storing the result of the conversion in *result*.
|
|
bool wchar_to_utf8_string(const std::wstring &input, std::string *result);
|
|
|
|
/// Convert a string between UTF8 and UCS-2/4 (depending on size of wchar_t). Returns nonzero if
|
|
/// successful, storing the result of the conversion in *out*.
|
|
size_t utf8_to_wchar(const char *in, size_t insize, std::wstring *out, int flags);
|
|
size_t wchar_to_utf8(const wchar_t *in, size_t insize, char *out, size_t outsize, int flags);
|
|
|
|
#endif /* !_UTF8_H_ */
|