blob: 6a0721d45f01b226a3aaad243a4a2182250d99e3 [file] [log] [blame]
Damiend99b0522013-12-21 18:17:45 +00001#include <stdlib.h>
2#include <stdint.h>
3#include <stdarg.h>
4#include <string.h>
5#include <assert.h>
6
7#include "nlr.h"
8#include "misc.h"
9#include "mpconfig.h"
10#include "obj.h"
11#include "runtime0.h"
12#include "runtime.h"
13
14typedef struct _mp_obj_str_t {
15 mp_obj_base_t base;
16 qstr qstr;
17} mp_obj_str_t;
18
19void str_print(void (*print)(void *env, const char *fmt, ...), void *env, mp_obj_t self_in) {
20 mp_obj_str_t *self = self_in;
21 // TODO need to escape chars etc
22 print(env, "'%s'", qstr_str(self->qstr));
23}
24
25mp_obj_t str_binary_op(int op, mp_obj_t lhs_in, mp_obj_t rhs_in) {
26 mp_obj_str_t *lhs = lhs_in;
27 const char *lhs_str = qstr_str(lhs->qstr);
28 switch (op) {
29 case RT_BINARY_OP_SUBSCR:
Paul Sokolovsky31ba60f2014-01-03 02:51:16 +020030 // TODO: need predicate to check for int-like type (bools are such for example)
31 // ["no", "yes"][1 == 2] is common idiom
32 if (MP_OBJ_IS_SMALL_INT(rhs_in)) {
33 // TODO: This implements byte string access for single index so far
Paul Sokolovskyf8b9d3c2014-01-04 01:38:26 +020034 // TODO: Handle negative indexes.
Paul Sokolovsky31ba60f2014-01-03 02:51:16 +020035 return mp_obj_new_int(lhs_str[mp_obj_get_int(rhs_in)]);
Paul Sokolovskye606cb62014-01-04 01:34:23 +020036#if MICROPY_ENABLE_SLICE
Paul Sokolovsky31ba60f2014-01-03 02:51:16 +020037 } else if (MP_OBJ_IS_TYPE(rhs_in, &slice_type)) {
38 int start, stop, step;
39 mp_obj_slice_get(rhs_in, &start, &stop, &step);
40 assert(step == 1);
Paul Sokolovskydecad082014-01-03 23:36:56 +020041 int len = strlen(lhs_str);
42 if (start < 0) {
43 start = len + start;
44 }
45 if (stop <= 0) {
46 stop = len + stop;
47 }
Paul Sokolovsky31ba60f2014-01-03 02:51:16 +020048 return mp_obj_new_str(qstr_from_strn_copy(lhs_str + start, stop - start));
Paul Sokolovskye606cb62014-01-04 01:34:23 +020049#endif
Paul Sokolovsky31ba60f2014-01-03 02:51:16 +020050 } else {
Paul Sokolovskyf8b9d3c2014-01-04 01:38:26 +020051 // Message doesn't match CPython, but we don't have so much bytes as they
52 // to spend them on verbose wording
53 nlr_jump(mp_obj_new_exception_msg(rt_q_TypeError, "index must be int"));
Paul Sokolovsky31ba60f2014-01-03 02:51:16 +020054 }
Damiend99b0522013-12-21 18:17:45 +000055
56 case RT_BINARY_OP_ADD:
57 case RT_BINARY_OP_INPLACE_ADD:
58 if (MP_OBJ_IS_TYPE(rhs_in, &str_type)) {
59 // add 2 strings
60 const char *rhs_str = qstr_str(((mp_obj_str_t*)rhs_in)->qstr);
Damien Georgefe8fb912014-01-02 16:36:09 +000061 size_t lhs_len = strlen(lhs_str);
62 size_t rhs_len = strlen(rhs_str);
63 int alloc_len = lhs_len + rhs_len + 1;
Damien732407f2013-12-29 19:33:23 +000064 char *val = m_new(char, alloc_len);
Damien Georgefe8fb912014-01-02 16:36:09 +000065 memcpy(val, lhs_str, lhs_len);
66 memcpy(val + lhs_len, rhs_str, rhs_len);
67 val[lhs_len + rhs_len] = '\0';
Damien732407f2013-12-29 19:33:23 +000068 return mp_obj_new_str(qstr_from_str_take(val, alloc_len));
Damiend99b0522013-12-21 18:17:45 +000069 }
70 break;
71 }
72
73 return MP_OBJ_NULL; // op not supported
74}
75
76mp_obj_t str_join(mp_obj_t self_in, mp_obj_t arg) {
77 assert(MP_OBJ_IS_TYPE(self_in, &str_type));
78 mp_obj_str_t *self = self_in;
Damiend99b0522013-12-21 18:17:45 +000079
Damien Georgefe8fb912014-01-02 16:36:09 +000080 // get separation string
81 const char *sep_str = qstr_str(self->qstr);
82 size_t sep_len = strlen(sep_str);
83
84 // process args
Damiend99b0522013-12-21 18:17:45 +000085 uint seq_len;
86 mp_obj_t *seq_items;
87 if (MP_OBJ_IS_TYPE(arg, &tuple_type)) {
88 mp_obj_tuple_get(arg, &seq_len, &seq_items);
89 } else if (MP_OBJ_IS_TYPE(arg, &list_type)) {
90 mp_obj_list_get(arg, &seq_len, &seq_items);
91 } else {
92 goto bad_arg;
93 }
Damien Georgefe8fb912014-01-02 16:36:09 +000094
95 // count required length
96 int required_len = 0;
Damiend99b0522013-12-21 18:17:45 +000097 for (int i = 0; i < seq_len; i++) {
98 if (!MP_OBJ_IS_TYPE(seq_items[i], &str_type)) {
99 goto bad_arg;
100 }
Damien Georgefe8fb912014-01-02 16:36:09 +0000101 if (i > 0) {
102 required_len += sep_len;
103 }
Damiend99b0522013-12-21 18:17:45 +0000104 required_len += strlen(qstr_str(mp_obj_str_get(seq_items[i])));
105 }
106
107 // make joined string
108 char *joined_str = m_new(char, required_len + 1);
Damien Georgefe8fb912014-01-02 16:36:09 +0000109 char *s_dest = joined_str;
Damiend99b0522013-12-21 18:17:45 +0000110 for (int i = 0; i < seq_len; i++) {
Damiend99b0522013-12-21 18:17:45 +0000111 if (i > 0) {
Damien Georgefe8fb912014-01-02 16:36:09 +0000112 memcpy(s_dest, sep_str, sep_len);
113 s_dest += sep_len;
Damiend99b0522013-12-21 18:17:45 +0000114 }
Damien Georgefe8fb912014-01-02 16:36:09 +0000115 const char *s2 = qstr_str(mp_obj_str_get(seq_items[i]));
116 size_t s2_len = strlen(s2);
117 memcpy(s_dest, s2, s2_len);
118 s_dest += s2_len;
Damiend99b0522013-12-21 18:17:45 +0000119 }
Damien Georgefe8fb912014-01-02 16:36:09 +0000120 *s_dest = '\0';
121
122 // return joined string
Damien732407f2013-12-29 19:33:23 +0000123 return mp_obj_new_str(qstr_from_str_take(joined_str, required_len + 1));
Damiend99b0522013-12-21 18:17:45 +0000124
125bad_arg:
126 nlr_jump(mp_obj_new_exception_msg(rt_q_TypeError, "?str.join expecting a list of str's"));
127}
128
// printf-style adapter around vstr_vprintf.
//
// Packs the variadic arguments into a va_list and forwards them, together with
// `env` and `fmt`, to vstr_vprintf.  str_format passes this function as the
// print callback with its vstr as `env`.
void vstr_printf_wrapper(void *env, const char *fmt, ...) {
    va_list ap;

    va_start(ap, fmt);
    vstr_vprintf(env, fmt, ap);
    va_end(ap);
}
135
136mp_obj_t str_format(int n_args, const mp_obj_t *args) {
137 assert(MP_OBJ_IS_TYPE(args[0], &str_type));
138 mp_obj_str_t *self = args[0];
139
140 const char *str = qstr_str(self->qstr);
141 int arg_i = 1;
142 vstr_t *vstr = vstr_new();
143 for (; *str; str++) {
144 if (*str == '{') {
145 str++;
146 if (*str == '{') {
147 vstr_add_char(vstr, '{');
148 } else if (*str == '}') {
149 if (arg_i >= n_args) {
150 nlr_jump(mp_obj_new_exception_msg(rt_q_IndexError, "tuple index out of range"));
151 }
152 mp_obj_print_helper(vstr_printf_wrapper, vstr, args[arg_i]);
153 arg_i++;
154 }
155 } else {
156 vstr_add_char(vstr, *str);
157 }
158 }
159
Damien732407f2013-12-29 19:33:23 +0000160 return mp_obj_new_str(qstr_from_str_take(vstr->buf, vstr->alloc));
Damiend99b0522013-12-21 18:17:45 +0000161}
162
163static MP_DEFINE_CONST_FUN_OBJ_2(str_join_obj, str_join);
164static MP_DEFINE_CONST_FUN_OBJ_VAR(str_format_obj, 1, str_format);
165
166const mp_obj_type_t str_type = {
167 { &mp_const_type },
168 "str",
169 str_print, // print
170 NULL, // call_n
171 NULL, // unary_op
172 str_binary_op, // binary_op
173 NULL, // getiter
174 NULL, // iternext
175 { // method list
176 { "join", &str_join_obj },
177 { "format", &str_format_obj },
178 { NULL, NULL }, // end-of-list sentinel
179 },
180};
181
182mp_obj_t mp_obj_new_str(qstr qstr) {
183 mp_obj_str_t *o = m_new_obj(mp_obj_str_t);
184 o->base.type = &str_type;
185 o->qstr = qstr;
186 return o;
187}
188
189qstr mp_obj_str_get(mp_obj_t self_in) {
190 assert(MP_OBJ_IS_TYPE(self_in, &str_type));
191 mp_obj_str_t *self = self_in;
192 return self->qstr;
193}