/*
 * This file is part of the MicroPython project, http://micropython.org/
 *
 * The MIT License (MIT)
 *
 * Copyright (c) 2013, 2014 Damien P. George
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
#ifndef MICROPY_INCLUDED_PY_OBJSTR_H
#define MICROPY_INCLUDED_PY_OBJSTR_H

#include "py/obj.h"

Paul Sokolovsky58676fc2014-04-14 01:45:06 +030031typedef struct _mp_obj_str_t {
32 mp_obj_base_t base;
Damien George26a0d4f2014-08-22 18:34:28 +010033 mp_uint_t hash;
Paul Sokolovsky58676fc2014-04-14 01:45:06 +030034 // len == number of bytes used in data, alloc = len + 1 because (at the moment) we also append a null byte
Damien Georgec0d95002017-02-16 16:26:48 +110035 size_t len;
Paul Sokolovsky58676fc2014-04-14 01:45:06 +030036 const byte *data;
37} mp_obj_str_t;
38
// Define a str object named `obj_name` whose contents are `str`.
// - `str` must be a string literal (or a char array): the length is taken as
//   sizeof(str) - 1, which would be wrong for a plain `char *`.
// - The hash field is initialised to 0, i.e. left uncomputed.
// - The data pointer refers directly to `str`; nothing is copied.
#define MP_DEFINE_STR_OBJ(obj_name, str) \
    mp_obj_str_t obj_name = {{&mp_type_str}, 0, sizeof(str) - 1, (const byte *)(str)}

// Use this macro to extract the string hash.
// It declares `mp_uint_t str_hash` in the enclosing scope and fills it from
// the qstr pool when `str_obj_in` is a qstr, otherwise from the hash field of
// the mp_obj_str_t the object points to.
// Warning: the hash can be 0, meaning invalid, and must then be explicitly
// computed from the data.
// Note: the expansion is a declaration followed by an if/else, so it must be
// used where a declaration is allowed and cannot be the sole body of an
// unbraced `if`/`for`/`while`.
#define GET_STR_HASH(str_obj_in, str_hash) \
    mp_uint_t str_hash; \
    if (MP_OBJ_IS_QSTR(str_obj_in)) { \
        str_hash = qstr_hash(MP_OBJ_QSTR_VALUE(str_obj_in)); \
    } else { \
        str_hash = ((mp_obj_str_t *)MP_OBJ_TO_PTR(str_obj_in))->hash; \
    }

// Use this macro to extract the string length (in bytes).
// It declares `size_t str_len` in the enclosing scope and fills it from the
// qstr pool when `str_obj_in` is a qstr, otherwise from the len field of the
// mp_obj_str_t the object points to.
// Note: the expansion is a declaration followed by an if/else, so it must be
// used where a declaration is allowed and cannot be the sole body of an
// unbraced `if`/`for`/`while`.
#define GET_STR_LEN(str_obj_in, str_len) \
    size_t str_len; \
    if (MP_OBJ_IS_QSTR(str_obj_in)) { \
        str_len = qstr_len(MP_OBJ_QSTR_VALUE(str_obj_in)); \
    } else { \
        str_len = ((mp_obj_str_t *)MP_OBJ_TO_PTR(str_obj_in))->len; \
    }

52// use this macro to extract the string data and length
Damien George04353cc2015-10-18 23:09:04 +010053#if MICROPY_OBJ_REPR == MICROPY_OBJ_REPR_C
Damien Georgec3f64d92015-11-27 12:23:18 +000054const byte *mp_obj_str_get_data_no_check(mp_obj_t self_in, size_t *len);
Damien George04353cc2015-10-18 23:09:04 +010055#define GET_STR_DATA_LEN(str_obj_in, str_data, str_len) \
Damien Georgec3f64d92015-11-27 12:23:18 +000056 size_t str_len; const byte *str_data = mp_obj_str_get_data_no_check(str_obj_in, &str_len);
Damien George04353cc2015-10-18 23:09:04 +010057#else
Paul Sokolovsky97319122014-06-13 22:01:26 +030058#define GET_STR_DATA_LEN(str_obj_in, str_data, str_len) \
Damien Georgec3f64d92015-11-27 12:23:18 +000059 const byte *str_data; size_t str_len; if (MP_OBJ_IS_QSTR(str_obj_in)) \
Paul Sokolovsky97319122014-06-13 22:01:26 +030060 { str_data = qstr_data(MP_OBJ_QSTR_VALUE(str_obj_in), &str_len); } \
Damien George999cedb2015-11-27 17:01:44 +000061 else { str_len = ((mp_obj_str_t*)MP_OBJ_TO_PTR(str_obj_in))->len; str_data = ((mp_obj_str_t*)MP_OBJ_TO_PTR(str_obj_in))->data; }
Damien George04353cc2015-10-18 23:09:04 +010062#endif
Paul Sokolovsky97319122014-06-13 22:01:26 +030063
Damien George5b3f0b72016-01-03 15:55:55 +000064mp_obj_t mp_obj_str_make_new(const mp_obj_type_t *type_in, size_t n_args, size_t n_kw, const mp_obj_t *args);
Damien George999cedb2015-11-27 17:01:44 +000065void mp_str_print_json(const mp_print_t *print, const byte *str_data, size_t str_len);
Damien George4b72b3a2016-01-03 14:21:40 +000066mp_obj_t mp_obj_str_format(size_t n_args, const mp_obj_t *args, mp_map_t *kwargs);
67mp_obj_t mp_obj_str_split(size_t n_args, const mp_obj_t *args);
Damien George1f1d5192017-11-16 13:53:04 +110068mp_obj_t mp_obj_new_str_copy(const mp_obj_type_t *type, const byte* data, size_t len);
Damien George999cedb2015-11-27 17:01:44 +000069mp_obj_t mp_obj_new_str_of_type(const mp_obj_type_t *type, const byte* data, size_t len);
Paul Sokolovsky97319122014-06-13 22:01:26 +030070
Damien George58321dd2017-08-29 13:04:01 +100071mp_obj_t mp_obj_str_binary_op(mp_binary_op_t op, mp_obj_t lhs_in, mp_obj_t rhs_in);
Damien George4d917232014-08-30 14:28:06 +010072mp_int_t mp_obj_str_get_buffer(mp_obj_t self_in, mp_buffer_info_t *bufinfo, mp_uint_t flags);
Paul Sokolovsky97319122014-06-13 22:01:26 +030073
Damien George999cedb2015-11-27 17:01:44 +000074const byte *str_index_to_ptr(const mp_obj_type_t *type, const byte *self_data, size_t self_len,
Paul Sokolovskyea2c9362014-06-15 00:35:09 +030075 mp_obj_t index, bool is_slice);
Damien Georgec0d95002017-02-16 16:26:48 +110076const byte *find_subbytes(const byte *haystack, size_t hlen, const byte *needle, size_t nlen, int direction);
Paul Sokolovskyea2c9362014-06-15 00:35:09 +030077
// Declarations of the function objects for the string methods, so that other
// translation units can reference them. The macro suffix gives the calling
// convention of each: _1 / _2 for fixed one / two arguments, _VAR_BETWEEN for
// a bounded variable number of positional arguments, _KW for keyword support.
// NOTE(review): the objects are presumably defined in the matching .c file --
// confirm.
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_encode_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_find_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_rfind_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_index_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_rindex_obj);
MP_DECLARE_CONST_FUN_OBJ_2(str_join_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_split_obj);
MP_DECLARE_CONST_FUN_OBJ_KW(str_splitlines_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_rsplit_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_startswith_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_endswith_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_strip_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_lstrip_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_rstrip_obj);
MP_DECLARE_CONST_FUN_OBJ_KW(str_format_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_replace_obj);
MP_DECLARE_CONST_FUN_OBJ_VAR_BETWEEN(str_count_obj);
MP_DECLARE_CONST_FUN_OBJ_2(str_partition_obj);
MP_DECLARE_CONST_FUN_OBJ_2(str_rpartition_obj);
MP_DECLARE_CONST_FUN_OBJ_2(str_center_obj);
MP_DECLARE_CONST_FUN_OBJ_1(str_lower_obj);
MP_DECLARE_CONST_FUN_OBJ_1(str_upper_obj);
MP_DECLARE_CONST_FUN_OBJ_1(str_isspace_obj);
MP_DECLARE_CONST_FUN_OBJ_1(str_isalpha_obj);
MP_DECLARE_CONST_FUN_OBJ_1(str_isdigit_obj);
MP_DECLARE_CONST_FUN_OBJ_1(str_isupper_obj);
MP_DECLARE_CONST_FUN_OBJ_1(str_islower_obj);

#endif // MICROPY_INCLUDED_PY_OBJSTR_H