Merge pull request #59 from pfalcon/slice
Implement basic slice object and string slicing
This commit is contained in:
commit
b95d90b2f3
@ -25,3 +25,9 @@
|
|||||||
#ifndef MICROPY_MEM_STATS
|
#ifndef MICROPY_MEM_STATS
|
||||||
#define MICROPY_MEM_STATS (1)
|
#define MICROPY_MEM_STATS (1)
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
// Whether to support slice object and correspondingly
|
||||||
|
// slice subscript operators
|
||||||
|
#ifndef MICROPY_ENABLE_SLICE
|
||||||
|
#define MICROPY_ENABLE_SLICE (1)
|
||||||
|
#endif
|
||||||
|
5
py/obj.h
5
py/obj.h
@ -144,6 +144,7 @@ mp_obj_t mp_obj_new_list(uint n, mp_obj_t *items);
|
|||||||
mp_obj_t mp_obj_new_list_reverse(uint n, mp_obj_t *items);
|
mp_obj_t mp_obj_new_list_reverse(uint n, mp_obj_t *items);
|
||||||
mp_obj_t mp_obj_new_dict(int n_args);
|
mp_obj_t mp_obj_new_dict(int n_args);
|
||||||
mp_obj_t mp_obj_new_set(int n_args, mp_obj_t *items);
|
mp_obj_t mp_obj_new_set(int n_args, mp_obj_t *items);
|
||||||
|
mp_obj_t mp_obj_new_slice(mp_obj_t start, mp_obj_t stop, mp_obj_t step);
|
||||||
mp_obj_t mp_obj_new_bound_meth(mp_obj_t self, mp_obj_t meth);
|
mp_obj_t mp_obj_new_bound_meth(mp_obj_t self, mp_obj_t meth);
|
||||||
mp_obj_t mp_obj_new_class(struct _mp_map_t *class_locals);
|
mp_obj_t mp_obj_new_class(struct _mp_map_t *class_locals);
|
||||||
mp_obj_t mp_obj_new_instance(mp_obj_t clas);
|
mp_obj_t mp_obj_new_instance(mp_obj_t clas);
|
||||||
@ -214,6 +215,10 @@ mp_obj_t mp_obj_dict_store(mp_obj_t self_in, mp_obj_t key, mp_obj_t value);
|
|||||||
// set
|
// set
|
||||||
void mp_obj_set_store(mp_obj_t self_in, mp_obj_t item);
|
void mp_obj_set_store(mp_obj_t self_in, mp_obj_t item);
|
||||||
|
|
||||||
|
// slice
|
||||||
|
extern const mp_obj_type_t slice_type;
|
||||||
|
void mp_obj_slice_get(mp_obj_t self_in, machine_int_t *start, machine_int_t *stop, machine_int_t *step);
|
||||||
|
|
||||||
// functions
|
// functions
|
||||||
typedef struct _mp_obj_fun_native_t { // need this so we can define const objects (to go in ROM)
|
typedef struct _mp_obj_fun_native_t { // need this so we can define const objects (to go in ROM)
|
||||||
mp_obj_base_t base;
|
mp_obj_base_t base;
|
||||||
|
74
py/objslice.c
Normal file
74
py/objslice.c
Normal file
@ -0,0 +1,74 @@
|
|||||||
|
#include <stdlib.h>
|
||||||
|
#include <stdint.h>
|
||||||
|
#include <string.h>
|
||||||
|
#include <assert.h>
|
||||||
|
|
||||||
|
#include "nlr.h"
|
||||||
|
#include "misc.h"
|
||||||
|
#include "mpconfig.h"
|
||||||
|
#include "obj.h"
|
||||||
|
#include "runtime0.h"
|
||||||
|
|
||||||
|
#if MICROPY_ENABLE_SLICE
|
||||||
|
|
||||||
|
// TODO: This implements only variant of slice with 2 integer args only.
|
||||||
|
// CPython supports 3rd arg (step), plus args can be arbitrary Python objects.
|
||||||
|
typedef struct _mp_obj_slice_t {
|
||||||
|
mp_obj_base_t base;
|
||||||
|
machine_int_t start;
|
||||||
|
machine_int_t stop;
|
||||||
|
} mp_obj_slice_t;
|
||||||
|
|
||||||
|
void slice_print(void (*print)(void *env, const char *fmt, ...), void *env, mp_obj_t o_in) {
|
||||||
|
mp_obj_slice_t *o = o_in;
|
||||||
|
print(env, "slice(" INT_FMT ", " INT_FMT ")", o->start, o->stop);
|
||||||
|
}
|
||||||
|
|
||||||
|
const mp_obj_type_t slice_type = {
|
||||||
|
{ &mp_const_type },
|
||||||
|
"slice",
|
||||||
|
slice_print,
|
||||||
|
NULL, // call_n
|
||||||
|
NULL, // unary_op
|
||||||
|
NULL, // binary_op
|
||||||
|
NULL, // getiter
|
||||||
|
NULL, // iternext
|
||||||
|
{ { NULL, NULL }, }, // method list
|
||||||
|
};
|
||||||
|
|
||||||
|
// TODO: Make sure to handle "empty" values, which are signified by None in CPython
|
||||||
|
mp_obj_t mp_obj_new_slice(mp_obj_t ostart, mp_obj_t ostop, mp_obj_t ostep) {
|
||||||
|
assert(ostep == NULL);
|
||||||
|
machine_int_t start = 0, stop = 0;
|
||||||
|
if (ostart != mp_const_none) {
|
||||||
|
start = mp_obj_get_int(ostart);
|
||||||
|
}
|
||||||
|
if (ostop != mp_const_none) {
|
||||||
|
stop = mp_obj_get_int(ostop);
|
||||||
|
if (stop == 0) {
|
||||||
|
// [x:0] is a special case - in our slice object, stop = 0 means
|
||||||
|
// "end of sequence". Fortunately, [x:0] is an empty seqence for
|
||||||
|
// any x (including negative). [x:x] is also always empty sequence.
|
||||||
|
// but x also can be 0. But note that b""[x:x] is b"" for any x (i.e.
|
||||||
|
// no IndexError, at least in Python 3.3.3). So, we just use -1's to
|
||||||
|
// signify that. -1 is catchy "special" number in case someone will
|
||||||
|
// try to print [x:0] slice ever.
|
||||||
|
start = stop = -1;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
mp_obj_slice_t *o = m_new(mp_obj_slice_t, 1);
|
||||||
|
o->base.type = &slice_type;
|
||||||
|
o->start = start;
|
||||||
|
o->stop = stop;
|
||||||
|
return (mp_obj_t)o;
|
||||||
|
}
|
||||||
|
|
||||||
|
void mp_obj_slice_get(mp_obj_t self_in, machine_int_t *start, machine_int_t *stop, machine_int_t *step) {
|
||||||
|
assert(MP_OBJ_IS_TYPE(self_in, &slice_type));
|
||||||
|
mp_obj_slice_t *self = self_in;
|
||||||
|
*start = self->start;
|
||||||
|
*stop = self->stop;
|
||||||
|
*step = 1;
|
||||||
|
}
|
||||||
|
|
||||||
|
#endif
|
28
py/objstr.c
28
py/objstr.c
@ -27,9 +27,31 @@ mp_obj_t str_binary_op(int op, mp_obj_t lhs_in, mp_obj_t rhs_in) {
|
|||||||
const char *lhs_str = qstr_str(lhs->qstr);
|
const char *lhs_str = qstr_str(lhs->qstr);
|
||||||
switch (op) {
|
switch (op) {
|
||||||
case RT_BINARY_OP_SUBSCR:
|
case RT_BINARY_OP_SUBSCR:
|
||||||
// string access
|
// TODO: need predicate to check for int-like type (bools are such for example)
|
||||||
// XXX a massive hack!
|
// ["no", "yes"][1 == 2] is common idiom
|
||||||
return mp_obj_new_int(lhs_str[mp_obj_get_int(rhs_in)]);
|
if (MP_OBJ_IS_SMALL_INT(rhs_in)) {
|
||||||
|
// TODO: This implements byte string access for single index so far
|
||||||
|
// TODO: Handle negative indexes.
|
||||||
|
return mp_obj_new_int(lhs_str[mp_obj_get_int(rhs_in)]);
|
||||||
|
#if MICROPY_ENABLE_SLICE
|
||||||
|
} else if (MP_OBJ_IS_TYPE(rhs_in, &slice_type)) {
|
||||||
|
int start, stop, step;
|
||||||
|
mp_obj_slice_get(rhs_in, &start, &stop, &step);
|
||||||
|
assert(step == 1);
|
||||||
|
int len = strlen(lhs_str);
|
||||||
|
if (start < 0) {
|
||||||
|
start = len + start;
|
||||||
|
}
|
||||||
|
if (stop <= 0) {
|
||||||
|
stop = len + stop;
|
||||||
|
}
|
||||||
|
return mp_obj_new_str(qstr_from_strn_copy(lhs_str + start, stop - start));
|
||||||
|
#endif
|
||||||
|
} else {
|
||||||
|
// Message doesn't match CPython, but we don't have so much bytes as they
|
||||||
|
// to spend them on verbose wording
|
||||||
|
nlr_jump(mp_obj_new_exception_msg(rt_q_TypeError, "index must be int"));
|
||||||
|
}
|
||||||
|
|
||||||
case RT_BINARY_OP_ADD:
|
case RT_BINARY_OP_ADD:
|
||||||
case RT_BINARY_OP_INPLACE_ADD:
|
case RT_BINARY_OP_INPLACE_ADD:
|
||||||
|
14
py/vm.c
14
py/vm.c
@ -410,6 +410,20 @@ bool mp_execute_byte_code_2(const byte **ip_in_out, mp_obj_t *fastn, mp_obj_t **
|
|||||||
sp++;
|
sp++;
|
||||||
break;
|
break;
|
||||||
|
|
||||||
|
#if MICROPY_ENABLE_SLICE
|
||||||
|
case MP_BC_BUILD_SLICE:
|
||||||
|
DECODE_UINT;
|
||||||
|
if (unum == 2) {
|
||||||
|
obj2 = POP();
|
||||||
|
obj1 = TOP();
|
||||||
|
SET_TOP(mp_obj_new_slice(obj1, obj2, NULL));
|
||||||
|
} else {
|
||||||
|
printf("3-argument slice is not supported\n");
|
||||||
|
assert(0);
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
#endif
|
||||||
|
|
||||||
case MP_BC_UNPACK_SEQUENCE:
|
case MP_BC_UNPACK_SEQUENCE:
|
||||||
DECODE_UINT;
|
DECODE_UINT;
|
||||||
rt_unpack_sequence(sp[0], unum, sp - unum + 1);
|
rt_unpack_sequence(sp[0], unum, sp - unum + 1);
|
||||||
|
@ -78,6 +78,7 @@ PY_O = \
|
|||||||
objnone.o \
|
objnone.o \
|
||||||
objrange.o \
|
objrange.o \
|
||||||
objset.o \
|
objset.o \
|
||||||
|
objslice.o \
|
||||||
objstr.o \
|
objstr.o \
|
||||||
objtuple.o \
|
objtuple.o \
|
||||||
objtype.o \
|
objtype.o \
|
||||||
|
27
tests/basics/tests/slice-bstr1.py
Normal file
27
tests/basics/tests/slice-bstr1.py
Normal file
@ -0,0 +1,27 @@
|
|||||||
|
b"123"[0:1]
|
||||||
|
|
||||||
|
b"123"[0:2]
|
||||||
|
|
||||||
|
b"123"[:1]
|
||||||
|
|
||||||
|
b"123"[1:]
|
||||||
|
|
||||||
|
# Idiom for copying sequence
|
||||||
|
b"123"[:]
|
||||||
|
|
||||||
|
b"123"[:-1]
|
||||||
|
|
||||||
|
# Weird cases
|
||||||
|
b"123"[0:0]
|
||||||
|
b"123"[1:0]
|
||||||
|
b"123"[1:1]
|
||||||
|
b"123"[-1:-1]
|
||||||
|
b"123"[-3:]
|
||||||
|
b"123"[-3:3]
|
||||||
|
b"123"[0:]
|
||||||
|
b"123"[:0]
|
||||||
|
b"123"[:-3]
|
||||||
|
b"123"[:-4]
|
||||||
|
# No IndexError!
|
||||||
|
b""[1:1]
|
||||||
|
b""[-1:-1]
|
@ -43,6 +43,7 @@ PY_O = \
|
|||||||
objnone.o \
|
objnone.o \
|
||||||
objrange.o \
|
objrange.o \
|
||||||
objset.o \
|
objset.o \
|
||||||
|
objslice.o \
|
||||||
objstr.o \
|
objstr.o \
|
||||||
objtuple.o \
|
objtuple.o \
|
||||||
objtype.o \
|
objtype.o \
|
||||||
|
@ -50,6 +50,7 @@ PY_O = \
|
|||||||
objnone.o \
|
objnone.o \
|
||||||
objrange.o \
|
objrange.o \
|
||||||
objset.o \
|
objset.o \
|
||||||
|
objslice.o \
|
||||||
objstr.o \
|
objstr.o \
|
||||||
objtuple.o \
|
objtuple.o \
|
||||||
objtype.o \
|
objtype.o \
|
||||||
|
Loading…
Reference in New Issue
Block a user