diff options
author | Sven Gothel <[email protected]> | 2020-10-16 16:08:23 +0200 |
---|---|---|
committer | Sven Gothel <[email protected]> | 2020-10-16 16:08:23 +0200 |
commit | d5c6787a8d7e9c123b6c30dd877af58057df4204 (patch) | |
tree | d719b90b1a374de02f354faa2fdeac19e762b7ce /include/jau/dfa_utf8_decode.hpp | |
parent | da13a199446d143732cc6d0d996501bac1c1d4f8 (diff) |
Move jaucpp files to root-folder
Diffstat (limited to 'include/jau/dfa_utf8_decode.hpp')
-rw-r--r-- | include/jau/dfa_utf8_decode.hpp | 55 |
1 files changed, 55 insertions, 0 deletions
diff --git a/include/jau/dfa_utf8_decode.hpp b/include/jau/dfa_utf8_decode.hpp new file mode 100644 index 0000000..308858e --- /dev/null +++ b/include/jau/dfa_utf8_decode.hpp @@ -0,0 +1,55 @@ +/* + * Author: Sven Gothel <[email protected]> + * Copyright (c) 2008-2010 Bjoern Hoehrmann <[email protected]> (see details below) + * Copyright (c) 2020 Gothel Software e.K. + * Copyright (c) 2020 ZAFENA AB + * + * Permission is hereby granted, free of charge, to any person obtaining + * a copy of this software and associated documentation files (the + * "Software"), to deal in the Software without restriction, including + * without limitation the rights to use, copy, modify, merge, publish, + * distribute, sublicense, and/or sell copies of the Software, and to + * permit persons to whom the Software is furnished to do so, subject to + * the following conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF + * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE + * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION + * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION + * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. + */ + +#ifndef JAU_DFA_UTF8_DECODE_HPP_ +#define JAU_DFA_UTF8_DECODE_HPP_ + +#define DFA_UTF8_ACCEPT 0 +#define DFA_UTF8_REJECT 12 + +#include <string> +#include <cstdint> +#include <cinttypes> + +namespace jau { + uint32_t dfa_utf8_decode(uint32_t & state, uint32_t & codep, const uint32_t byte_value); + + /** + * Returns all valid consecutive UTF-8 characters within buffer + * in the range up to buffer_size or until EOS. + * <p> + * In case a non UTF-8 character has been detected, + * the content will be cut off and the decoding loop ends. + * </p> + * <p> + * Method utilizes a finite state machine detecting variable length UTF-8 codes. + * See Bjoern Hoehrmann's site <http://bjoern.hoehrmann.de/utf-8/decoder/dfa/> for details. + * </p> + */ + std::string dfa_utf8_decode(const uint8_t *buffer, const size_t buffer_size); +} /* namespace jau */ + +#endif /* JAU_DFA_UTF8_DECODE_HPP_ */ |