Damien George | 04b9147 | 2014-05-03 23:27:38 +0100 | [diff] [blame] | 1 | /* |
Alexander Steffen | 55f3324 | 2017-06-30 09:22:17 +0200 | [diff] [blame] | 2 | * This file is part of the MicroPython project, http://micropython.org/ |
Damien George | 04b9147 | 2014-05-03 23:27:38 +0100 | [diff] [blame] | 3 | * |
| 4 | * The MIT License (MIT) |
| 5 | * |
| 6 | * Copyright (c) 2013, 2014 Damien P. George |
| 7 | * |
| 8 | * Permission is hereby granted, free of charge, to any person obtaining a copy |
| 9 | * of this software and associated documentation files (the "Software"), to deal |
| 10 | * in the Software without restriction, including without limitation the rights |
| 11 | * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell |
| 12 | * copies of the Software, and to permit persons to whom the Software is |
| 13 | * furnished to do so, subject to the following conditions: |
| 14 | * |
| 15 | * The above copyright notice and this permission notice shall be included in |
| 16 | * all copies or substantial portions of the Software. |
| 17 | * |
| 18 | * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
| 19 | * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
| 20 | * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE |
| 21 | * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER |
| 22 | * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, |
| 23 | * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN |
| 24 | * THE SOFTWARE. |
| 25 | */ |
Alexander Steffen | 299bc62 | 2017-06-29 23:14:58 +0200 | [diff] [blame] | 26 | #ifndef MICROPY_INCLUDED_PY_OBJSTR_H |
| 27 | #define MICROPY_INCLUDED_PY_OBJSTR_H |
Damien George | 51dfcb4 | 2015-01-01 20:27:54 +0000 | [diff] [blame] | 28 | |
| 29 | #include "py/obj.h" |
Andrew Leech | f7f56d4 | 2022-08-10 14:13:17 +1000 | [diff] [blame] | 30 | #include "py/objarray.h" |
Damien George | 04b9147 | 2014-05-03 23:27:38 +0100 | [diff] [blame] | 31 | |
Paul Sokolovsky | 58676fc | 2014-04-14 01:45:06 +0300 | [diff] [blame] | 32 | typedef struct _mp_obj_str_t { |
| 33 | mp_obj_base_t base; |
Damien George | 82b3500 | 2022-08-11 16:34:02 +1000 | [diff] [blame] | 34 | size_t hash; |
Paul Sokolovsky | 58676fc | 2014-04-14 01:45:06 +0300 | [diff] [blame] | 35 | // len == number of bytes used in data, alloc = len + 1 because (at the moment) we also append a null byte |
Damien George | c0d9500 | 2017-02-16 16:26:48 +1100 | [diff] [blame] | 36 | size_t len; |
Paul Sokolovsky | 58676fc | 2014-04-14 01:45:06 +0300 | [diff] [blame] | 37 | const byte *data; |
| 38 | } mp_obj_str_t; |
| 39 | |
// Compile-time check that mp_obj_str_t and mp_obj_array_t are layout-compatible
// where it matters: len lives at the same offset in both structs, and the data
// member of the str struct lives at the same offset as the items member of the
// array struct.  With that guaranteed, a single piece of code can operate on
// str/bytes as well as bytearray.
#define MP_STATIC_ASSERT_STR_ARRAY_COMPATIBLE \
    MP_STATIC_ASSERT(offsetof(mp_obj_array_t, len) == offsetof(mp_obj_str_t, len) \
    && offsetof(mp_obj_array_t, items) == offsetof(mp_obj_str_t, data))
| 46 | |
// Define an mp_obj_str_t variable called obj_name, of type str, whose data is `str`.
// The length is taken as sizeof(str) - 1, so `str` must be something for which
// sizeof yields the byte count including the terminating null (a string literal
// or a char array), not a plain pointer.
// The hash is set to 0, i.e. it is not precomputed.
// The argument is parenthesised inside the cast, matching MP_DEFINE_BYTES_OBJ, so
// that the cast always applies to the whole argument expression.
#define MP_DEFINE_STR_OBJ(obj_name, str) mp_obj_str_t obj_name = {{&mp_type_str}, 0, sizeof(str) - 1, (const byte *)(str)}
Damien George | 897fe0c | 2014-04-15 22:03:55 +0100 | [diff] [blame] | 48 | |
// Declare a size_t variable named str_hash and initialise it with the hash of
// str_obj_in: for a qstr the hash comes from qstr_hash(), otherwise it is read
// from the hash member of the mp_obj_str_t.
// Warning: the hash can be 0, meaning invalid, in which case it must be computed
// explicitly from the data.
// Note: str_obj_in appears more than once in the expansion, so pass an expression
// without side effects.
#define GET_STR_HASH(str_obj_in, str_hash) \
    size_t str_hash = mp_obj_is_qstr(str_obj_in) \
        ? qstr_hash(MP_OBJ_QSTR_VALUE(str_obj_in)) \
        : ((mp_obj_str_t *)MP_OBJ_TO_PTR(str_obj_in))->hash;
Paul Sokolovsky | 9731912 | 2014-06-13 22:01:26 +0300 | [diff] [blame] | 58 | |
// Declare a size_t variable named str_len and initialise it with the length of
// str_obj_in: for a qstr the length comes from qstr_len(), otherwise it is read
// from the len member of the mp_obj_str_t.
// Note: str_obj_in appears more than once in the expansion, so pass an expression
// without side effects.
#define GET_STR_LEN(str_obj_in, str_len) \
    size_t str_len = mp_obj_is_qstr(str_obj_in) \
        ? qstr_len(MP_OBJ_QSTR_VALUE(str_obj_in)) \
        : ((mp_obj_str_t *)MP_OBJ_TO_PTR(str_obj_in))->len;
Paul Sokolovsky | 9731912 | 2014-06-13 22:01:26 +0300 | [diff] [blame] | 67 | |
| 68 | // use this macro to extract the string data and length |
Damien George | 4c0176d | 2019-12-27 23:15:52 +1100 | [diff] [blame] | 69 | #if MICROPY_OBJ_REPR == MICROPY_OBJ_REPR_C || MICROPY_OBJ_REPR == MICROPY_OBJ_REPR_D |
Damien George | c3f64d9 | 2015-11-27 12:23:18 +0000 | [diff] [blame] | 70 | const byte *mp_obj_str_get_data_no_check(mp_obj_t self_in, size_t *len); |
Damien George | 04353cc | 2015-10-18 23:09:04 +0100 | [diff] [blame] | 71 | #define GET_STR_DATA_LEN(str_obj_in, str_data, str_len) \ |
Damien George | b598678 | 2022-08-10 14:09:22 +1000 | [diff] [blame] | 72 | size_t str_len; \ |
| 73 | const byte *str_data = mp_obj_str_get_data_no_check(str_obj_in, &str_len); |
Damien George | 04353cc | 2015-10-18 23:09:04 +0100 | [diff] [blame] | 74 | #else |
Paul Sokolovsky | 9731912 | 2014-06-13 22:01:26 +0300 | [diff] [blame] | 75 | #define GET_STR_DATA_LEN(str_obj_in, str_data, str_len) \ |
Damien George | b598678 | 2022-08-10 14:09:22 +1000 | [diff] [blame] | 76 | const byte *str_data; \ |
| 77 | size_t str_len; \ |
| 78 | if (mp_obj_is_qstr(str_obj_in)) { \ |
| 79 | str_data = qstr_data(MP_OBJ_QSTR_VALUE(str_obj_in), &str_len); \ |
| 80 | } else { \ |
Andrew Leech | f7f56d4 | 2022-08-10 14:13:17 +1000 | [diff] [blame] | 81 | MP_STATIC_ASSERT_STR_ARRAY_COMPATIBLE; \ |
Damien George | b598678 | 2022-08-10 14:09:22 +1000 | [diff] [blame] | 82 | str_len = ((mp_obj_str_t *)MP_OBJ_TO_PTR(str_obj_in))->len; \ |
| 83 | str_data = ((mp_obj_str_t *)MP_OBJ_TO_PTR(str_obj_in))->data; \ |
| 84 | } |
Damien George | 04353cc | 2015-10-18 23:09:04 +0100 | [diff] [blame] | 85 | #endif |
Paul Sokolovsky | 9731912 | 2014-06-13 22:01:26 +0300 | [diff] [blame] | 86 | |
Damien George | 5b3f0b7 | 2016-01-03 15:55:55 +0000 | [diff] [blame] | 87 | mp_obj_t mp_obj_str_make_new(const mp_obj_type_t *type_in, size_t n_args, size_t n_kw, const mp_obj_t *args); |
Damien George | 999cedb | 2015-11-27 17:01:44 +0000 | [diff] [blame] | 88 | void mp_str_print_json(const mp_print_t *print, const byte *str_data, size_t str_len); |
Damien George | 4b72b3a | 2016-01-03 14:21:40 +0000 | [diff] [blame] | 89 | mp_obj_t mp_obj_str_format(size_t n_args, const mp_obj_t *args, mp_map_t *kwargs); |
| 90 | mp_obj_t mp_obj_str_split(size_t n_args, const mp_obj_t *args); |
Jim Mussared | 6c3d8d3 | 2022-08-24 12:22:57 +1000 | [diff] [blame] | 91 | mp_obj_t mp_obj_new_str_copy(const mp_obj_type_t *type, const byte *data, size_t len); // for type=str, input data must be valid utf-8 |
| 92 | mp_obj_t mp_obj_new_str_of_type(const mp_obj_type_t *type, const byte *data, size_t len); // for type=str, will check utf-8 (raises UnicodeError) |
Paul Sokolovsky | 9731912 | 2014-06-13 22:01:26 +0300 | [diff] [blame] | 93 | |
Damien George | 58321dd | 2017-08-29 13:04:01 +1000 | [diff] [blame] | 94 | mp_obj_t mp_obj_str_binary_op(mp_binary_op_t op, mp_obj_t lhs_in, mp_obj_t rhs_in); |
Damien George | 4d91723 | 2014-08-30 14:28:06 +0100 | [diff] [blame] | 95 | mp_int_t mp_obj_str_get_buffer(mp_obj_t self_in, mp_buffer_info_t *bufinfo, mp_uint_t flags); |
Paul Sokolovsky | 9731912 | 2014-06-13 22:01:26 +0300 | [diff] [blame] | 96 | |
Jim Mussared | c44b392 | 2022-10-07 11:06:43 +1100 | [diff] [blame] | 97 | void mp_obj_str_set_data(mp_obj_str_t *str, const byte *data, size_t len); |
| 98 | |
Damien George | 999cedb | 2015-11-27 17:01:44 +0000 | [diff] [blame] | 99 | const byte *str_index_to_ptr(const mp_obj_type_t *type, const byte *self_data, size_t self_len, |
Damien George | 69661f3 | 2020-02-27 15:36:53 +1100 | [diff] [blame] | 100 | mp_obj_t index, bool is_slice); |
Damien George | c0d9500 | 2017-02-16 16:26:48 +1100 | [diff] [blame] | 101 | const byte *find_subbytes(const byte *haystack, size_t hlen, const byte *needle, size_t nlen, int direction); |
Paul Sokolovsky | ea2c936 | 2014-06-15 00:35:09 +0300 | [diff] [blame] | 102 | |
// Define an mp_obj_str_t variable called obj_name, of type bytes, that refers to
// the `len` bytes starting at `target`.  Unlike MP_DEFINE_STR_OBJ the length is
// given explicitly rather than derived with sizeof.  The hash is set to 0, i.e.
// it is not precomputed.
#define MP_DEFINE_BYTES_OBJ(obj_name, target, len) \
    mp_obj_str_t obj_name = { \
        {&mp_type_bytes}, \
        0, \
        (len), \
        (const byte *)(target) \
    }
| 104 | |
Jim Mussared | 28aaab9 | 2021-07-13 18:01:12 +1000 | [diff] [blame] | 105 | mp_obj_t mp_obj_bytes_hex(size_t n_args, const mp_obj_t *args, const mp_obj_type_t *type); |
| 106 | mp_obj_t mp_obj_bytes_fromhex(mp_obj_t type_in, mp_obj_t data); |
| 107 | |
Andrew Leech | f7f56d4 | 2022-08-10 14:13:17 +1000 | [diff] [blame] | 108 | extern const mp_obj_dict_t mp_obj_str_locals_dict; |
| 109 | |
Jim Mussared | 28aaab9 | 2021-07-13 18:01:12 +1000 | [diff] [blame] | 110 | #if MICROPY_PY_BUILTINS_MEMORYVIEW && MICROPY_PY_BUILTINS_BYTES_HEX |
| 111 | extern const mp_obj_dict_t mp_obj_memoryview_locals_dict; |
| 112 | #endif |
| 113 | |
Andrew Leech | f7f56d4 | 2022-08-10 14:13:17 +1000 | [diff] [blame] | 114 | #if MICROPY_PY_BUILTINS_BYTEARRAY |
| 115 | extern const mp_obj_dict_t mp_obj_bytearray_locals_dict; |
| 116 | #endif |
| 117 | |
| 118 | #if MICROPY_PY_ARRAY |
| 119 | extern const mp_obj_dict_t mp_obj_array_locals_dict; |
| 120 | #endif |
| 121 | |
Alexander Steffen | 299bc62 | 2017-06-29 23:14:58 +0200 | [diff] [blame] | 122 | #endif // MICROPY_INCLUDED_PY_OBJSTR_H |