/*
 * This file is part of the MicroPython project, http://micropython.org/
 *
 * The MIT License (MIT)
 *
 * Copyright (c) 2013, 2014 Damien P. George
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
#ifndef MICROPY_INCLUDED_PY_OBJSTR_H
#define MICROPY_INCLUDED_PY_OBJSTR_H

#include "py/obj.h"

Paul Sokolovsky58676fc2014-04-14 01:45:06 +030031typedef struct _mp_obj_str_t {
32 mp_obj_base_t base;
Damien George26a0d4f2014-08-22 18:34:28 +010033 mp_uint_t hash;
Paul Sokolovsky58676fc2014-04-14 01:45:06 +030034 // len == number of bytes used in data, alloc = len + 1 because (at the moment) we also append a null byte
Damien Georgec0d95002017-02-16 16:26:48 +110035 size_t len;
Paul Sokolovsky58676fc2014-04-14 01:45:06 +030036 const byte *data;
37} mp_obj_str_t;
38
// Define a string object called obj_name whose data is str.
// The hash field is initialised to 0 and the length to sizeof(str) - 1, so str must be
// a string literal or char array (not a pointer) for the length to be correct.
#define MP_DEFINE_STR_OBJ(obj_name, str) mp_obj_str_t obj_name = {{&mp_type_str}, 0, sizeof(str) - 1, (const byte *)(str)}

// use this macro to extract the string hash
// warning: the hash can be 0, meaning invalid, and must then be explicitly computed from the data
// note: this declares the variable str_hash in the enclosing scope, and str_obj_in is
// expanded more than once, so it should be an expression without side effects
#define GET_STR_HASH(str_obj_in, str_hash) \
    mp_uint_t str_hash; \
    if (mp_obj_is_qstr(str_obj_in)) { \
        str_hash = qstr_hash(MP_OBJ_QSTR_VALUE(str_obj_in)); \
    } else { \
        str_hash = ((mp_obj_str_t *)MP_OBJ_TO_PTR(str_obj_in))->hash; \
    }

// use this macro to extract the string length
// note: this declares the variable str_len in the enclosing scope, and str_obj_in is
// expanded more than once, so it should be an expression without side effects
#define GET_STR_LEN(str_obj_in, str_len) \
    size_t str_len; \
    if (mp_obj_is_qstr(str_obj_in)) { \
        str_len = qstr_len(MP_OBJ_QSTR_VALUE(str_obj_in)); \
    } else { \
        str_len = ((mp_obj_str_t *)MP_OBJ_TO_PTR(str_obj_in))->len; \
    }

60// use this macro to extract the string data and length
Damien George4c0176d2019-12-27 23:15:52 +110061#if MICROPY_OBJ_REPR == MICROPY_OBJ_REPR_C || MICROPY_OBJ_REPR == MICROPY_OBJ_REPR_D
Damien Georgec3f64d92015-11-27 12:23:18 +000062const byte *mp_obj_str_get_data_no_check(mp_obj_t self_in, size_t *len);
Damien George04353cc2015-10-18 23:09:04 +010063#define GET_STR_DATA_LEN(str_obj_in, str_data, str_len) \
Damien Georgeb5986782022-08-10 14:09:22 +100064 size_t str_len; \
65 const byte *str_data = mp_obj_str_get_data_no_check(str_obj_in, &str_len);
Damien George04353cc2015-10-18 23:09:04 +010066#else
Paul Sokolovsky97319122014-06-13 22:01:26 +030067#define GET_STR_DATA_LEN(str_obj_in, str_data, str_len) \
Damien Georgeb5986782022-08-10 14:09:22 +100068 const byte *str_data; \
69 size_t str_len; \
70 if (mp_obj_is_qstr(str_obj_in)) { \
71 str_data = qstr_data(MP_OBJ_QSTR_VALUE(str_obj_in), &str_len); \
72 } else { \
73 str_len = ((mp_obj_str_t *)MP_OBJ_TO_PTR(str_obj_in))->len; \
74 str_data = ((mp_obj_str_t *)MP_OBJ_TO_PTR(str_obj_in))->data; \
75 }
Damien George04353cc2015-10-18 23:09:04 +010076#endif
Paul Sokolovsky97319122014-06-13 22:01:26 +030077
Damien George5b3f0b72016-01-03 15:55:55 +000078mp_obj_t mp_obj_str_make_new(const mp_obj_type_t *type_in, size_t n_args, size_t n_kw, const mp_obj_t *args);
Damien George999cedb2015-11-27 17:01:44 +000079void mp_str_print_json(const mp_print_t *print, const byte *str_data, size_t str_len);
Damien George4b72b3a2016-01-03 14:21:40 +000080mp_obj_t mp_obj_str_format(size_t n_args, const mp_obj_t *args, mp_map_t *kwargs);
81mp_obj_t mp_obj_str_split(size_t n_args, const mp_obj_t *args);
Damien George69661f32020-02-27 15:36:53 +110082mp_obj_t mp_obj_new_str_copy(const mp_obj_type_t *type, const byte *data, size_t len);
83mp_obj_t mp_obj_new_str_of_type(const mp_obj_type_t *type, const byte *data, size_t len);
Paul Sokolovsky97319122014-06-13 22:01:26 +030084
Damien George58321dd2017-08-29 13:04:01 +100085mp_obj_t mp_obj_str_binary_op(mp_binary_op_t op, mp_obj_t lhs_in, mp_obj_t rhs_in);
Damien George4d917232014-08-30 14:28:06 +010086mp_int_t mp_obj_str_get_buffer(mp_obj_t self_in, mp_buffer_info_t *bufinfo, mp_uint_t flags);
Paul Sokolovsky97319122014-06-13 22:01:26 +030087
Damien George999cedb2015-11-27 17:01:44 +000088const byte *str_index_to_ptr(const mp_obj_type_t *type, const byte *self_data, size_t self_len,
Damien George69661f32020-02-27 15:36:53 +110089 mp_obj_t index, bool is_slice);
Damien Georgec0d95002017-02-16 16:26:48 +110090const byte *find_subbytes(const byte *haystack, size_t hlen, const byte *needle, size_t nlen, int direction);
Paul Sokolovskyea2c9362014-06-15 00:35:09 +030091
// function objects for the str/bytes methods, declared here so other files can reference them
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_encode_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_find_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_rfind_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_index_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_rindex_obj);
MP_DECLARE_CONST_FUN_OBJ_2(str_join_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_split_obj);
MP_DECLARE_CONST_FUN_OBJ_KW(str_splitlines_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_rsplit_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_startswith_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_endswith_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_strip_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_lstrip_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_rstrip_obj);
MP_DECLARE_CONST_FUN_OBJ_KW(str_format_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_replace_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_count_obj);
MP_DECLARE_CONST_FUN_OBJ_2(str_partition_obj);
MP_DECLARE_CONST_FUN_OBJ_2(str_rpartition_obj);
MP_DECLARE_CONST_FUN_OBJ_2(str_center_obj);
MP_DECLARE_CONST_FUN_OBJ_1(str_lower_obj);
MP_DECLARE_CONST_FUN_OBJ_1(str_upper_obj);
MP_DECLARE_CONST_FUN_OBJ_1(str_isspace_obj);
MP_DECLARE_CONST_FUN_OBJ_1(str_isalpha_obj);
MP_DECLARE_CONST_FUN_OBJ_1(str_isdigit_obj);
MP_DECLARE_CONST_FUN_OBJ_1(str_isupper_obj);
MP_DECLARE_CONST_FUN_OBJ_1(str_islower_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(bytes_decode_obj);

#endif // MICROPY_INCLUDED_PY_OBJSTR_H