usse/funda-scraper/venv/lib/python3.10/site-packages/mypyc/primitives/str_ops.py

206 lines
5.5 KiB
Python

"""Primitive str ops."""
from typing import List, Tuple
from mypyc.ir.ops import ERR_MAGIC, ERR_NEVER
from mypyc.ir.rtypes import (
RType, object_rprimitive, str_rprimitive, int_rprimitive, list_rprimitive,
c_int_rprimitive, pointer_rprimitive, bool_rprimitive, bit_rprimitive,
c_pyssize_t_rprimitive, bytes_rprimitive
)
from mypyc.primitives.registry import (
method_op, binary_op, function_op,
load_address_op, custom_op, ERR_NEG_INT
)
# Address of the 'str' type object: references to 'builtins.str' are
# registered to load the C symbol PyUnicode_Type, typed as a generic object.
load_address_op(
    name='builtins.str',
    type=object_rprimitive,
    src='PyUnicode_Type',
)

# str(obj): takes any object and yields a str by calling PyObject_Str.
str_op = function_op(
    name='builtins.str',
    arg_types=[object_rprimitive],
    return_type=str_rprimitive,
    c_function_name='PyObject_Str',
    error_kind=ERR_MAGIC,
)
# str1 + str2: plain concatenation of two str operands via PyUnicode_Concat.
binary_op(
    name='+',
    arg_types=[str_rprimitive, str_rprimitive],
    return_type=str_rprimitive,
    c_function_name='PyUnicode_Concat',
    error_kind=ERR_MAGIC,
)

# str1 += str2: in-place concatenation via CPyStr_Append.
#
# PyUnicode_Append tries to reuse the left-hand operand when its refcount
# is 1. That is a dodgy trick, but the interpreter does the same thing.
# NOTE(review): CPyStr_Append is presumably a thin wrapper around
# PyUnicode_Append -- confirm in the C helpers.
# The left operand is registered as stolen, the right one is not.
binary_op(
    name='+=',
    arg_types=[str_rprimitive, str_rprimitive],
    return_type=str_rprimitive,
    c_function_name='CPyStr_Append',
    error_kind=ERR_MAGIC,
    steals=[True, False],
)
# Compare two str values with PyUnicode_Compare; the result is a raw C int.
# NOTE(review): registered with ERR_NEVER, so users of this op presumably
# have to detect a failed comparison themselves -- confirm at the call sites.
unicode_compare = custom_op(
    arg_types=[str_rprimitive, str_rprimitive],
    return_type=c_int_rprimitive,
    c_function_name='PyUnicode_Compare',
    error_kind=ERR_NEVER,
)
# str[index] with an int index: yields a str via CPyStr_GetItem.
method_op(
    name='__getitem__',
    arg_types=[str_rprimitive, int_rprimitive],
    return_type=str_rprimitive,
    c_function_name='CPyStr_GetItem',
    error_kind=ERR_MAGIC,
)

# str[begin:end] with int bounds, implemented by CPyStr_GetSlice.
# The result is declared as a generic object rather than as a str.
str_slice_op = custom_op(
    arg_types=[str_rprimitive, int_rprimitive, int_rprimitive],
    return_type=object_rprimitive,
    c_function_name='CPyStr_GetSlice',
    error_kind=ERR_MAGIC,
)
# str.join(obj): the separator is a str, the argument is any object;
# dispatches to PyUnicode_Join.
method_op(
    name='join',
    arg_types=[str_rprimitive, object_rprimitive],
    return_type=str_rprimitive,
    c_function_name='PyUnicode_Join',
    error_kind=ERR_MAGIC,
)

# Build a str with CPyStr_Build from one C ssize_t argument followed by a
# variable number of str arguments.
# NOTE(review): the leading ssize_t is presumably the number of pieces that
# follow -- confirm against the CPyStr_Build helper.
str_build_op = custom_op(
    arg_types=[c_pyssize_t_rprimitive],
    return_type=str_rprimitive,
    c_function_name='CPyStr_Build',
    error_kind=ERR_MAGIC,
    var_arg_type=str_rprimitive,
)
# str.startswith(str): bool result from CPyStr_Startswith, registered with
# the ERR_NEVER error kind.
method_op(
    name='startswith',
    arg_types=[str_rprimitive, str_rprimitive],
    return_type=bool_rprimitive,
    c_function_name='CPyStr_Startswith',
    error_kind=ERR_NEVER,
)

# str.endswith(str): bool result from CPyStr_Endswith, registered with
# the ERR_NEVER error kind.
method_op(
    name='endswith',
    arg_types=[str_rprimitive, str_rprimitive],
    return_type=bool_rprimitive,
    c_function_name='CPyStr_Endswith',
    error_kind=ERR_NEVER,
)
# str.split(...)
#
# Three overloads are registered from the parallel tables below. Row k uses
# the first k+1 entries of str_split_types as its argument types:
#   row 0: split()                -> PyUnicode_Split
#   row 1: split(sep)             -> PyUnicode_Split
#   row 2: split(sep, maxsplit)   -> CPyStr_Split
# str_split_constants holds the extra (value, type) integer constants for
# each row.
# NOTE(review): these are presumably passed as trailing C arguments filling
# in the parameters the Python call omitted (a 0 pointer for the separator,
# -1 for maxsplit) -- confirm against the registry implementation.
str_split_types: List[RType] = [str_rprimitive, str_rprimitive, int_rprimitive]
str_split_functions = ["PyUnicode_Split", "PyUnicode_Split", "CPyStr_Split"]
str_split_constants: List[List[Tuple[int, RType]]] = [
    [(0, pointer_rprimitive), (-1, c_int_rprimitive)],
    [(-1, c_int_rprimitive)],
    [],
]
# Walk the function/constant tables in lockstep; the row index still selects
# how many leading argument types the overload accepts.
for i, (split_c_function, split_constants) in enumerate(
        zip(str_split_functions, str_split_constants)):
    method_op(
        name='split',
        arg_types=str_split_types[:i + 1],
        return_type=list_rprimitive,
        c_function_name=split_c_function,
        extra_int_constants=split_constants,
        error_kind=ERR_MAGIC)
# str.replace(old, new): dispatches to PyUnicode_Replace with one extra
# C int constant of -1.
# NOTE(review): the -1 presumably fills the max-count parameter, meaning
# "replace every occurrence" -- confirm against the C API docs.
method_op(
    name='replace',
    arg_types=[str_rprimitive, str_rprimitive, str_rprimitive],
    return_type=str_rprimitive,
    c_function_name='PyUnicode_Replace',
    error_kind=ERR_MAGIC,
    extra_int_constants=[(-1, c_int_rprimitive)],
)

# str.replace(old, new, count): the explicit int count is handled by the
# CPyStr_Replace helper instead.
method_op(
    name='replace',
    arg_types=[str_rprimitive, str_rprimitive, str_rprimitive, int_rprimitive],
    return_type=str_rprimitive,
    c_function_name='CPyStr_Replace',
    error_kind=ERR_MAGIC,
)
# Truthiness test for a str (true when the string is not empty); yields a
# bit via CPyStr_IsTrue and is registered with ERR_NEVER.
str_check_if_true = custom_op(
    arg_types=[str_rprimitive],
    return_type=bit_rprimitive,
    c_function_name='CPyStr_IsTrue',
    error_kind=ERR_NEVER,
)

# Size of a str as a C ssize_t, computed by CPyStr_Size_size_t; registered
# with the ERR_NEG_INT error kind.
str_ssize_t_size_op = custom_op(
    arg_types=[str_rprimitive],
    return_type=c_pyssize_t_rprimitive,
    c_function_name='CPyStr_Size_size_t',
    error_kind=ERR_NEG_INT,
)
# bytes.decode(...): all three overloads call CPy_Decode and yield a str.
# NOTE(review): the 0 pointer constants presumably stand in for the omitted
# encoding/errors arguments -- confirm against the CPy_Decode helper.

# obj.decode(): two 0 pointer constants are supplied.
method_op(
    name='decode',
    arg_types=[bytes_rprimitive],
    return_type=str_rprimitive,
    c_function_name='CPy_Decode',
    error_kind=ERR_MAGIC,
    extra_int_constants=[(0, pointer_rprimitive), (0, pointer_rprimitive)],
)

# obj.decode(encoding): one 0 pointer constant is supplied.
method_op(
    name='decode',
    arg_types=[bytes_rprimitive, str_rprimitive],
    return_type=str_rprimitive,
    c_function_name='CPy_Decode',
    error_kind=ERR_MAGIC,
    extra_int_constants=[(0, pointer_rprimitive)],
)

# obj.decode(encoding, errors): no extra constants.
method_op(
    name='decode',
    arg_types=[bytes_rprimitive, str_rprimitive, str_rprimitive],
    return_type=str_rprimitive,
    c_function_name='CPy_Decode',
    error_kind=ERR_MAGIC,
)
# str.encode(...): all three overloads call CPy_Encode and yield bytes.
# NOTE(review): the 0 pointer constants presumably stand in for the omitted
# encoding/errors arguments -- confirm against the CPy_Encode helper.

# str.encode(): two 0 pointer constants are supplied.
method_op(
    name='encode',
    arg_types=[str_rprimitive],
    return_type=bytes_rprimitive,
    c_function_name='CPy_Encode',
    error_kind=ERR_MAGIC,
    extra_int_constants=[(0, pointer_rprimitive), (0, pointer_rprimitive)],
)

# str.encode(encoding): one 0 pointer constant is supplied.
method_op(
    name='encode',
    arg_types=[str_rprimitive, str_rprimitive],
    return_type=bytes_rprimitive,
    c_function_name='CPy_Encode',
    error_kind=ERR_MAGIC,
    extra_int_constants=[(0, pointer_rprimitive)],
)

# str.encode(encoding, errors): no extra constants.
method_op(
    name='encode',
    arg_types=[str_rprimitive, str_rprimitive, str_rprimitive],
    return_type=bytes_rprimitive,
    c_function_name='CPy_Encode',
    error_kind=ERR_MAGIC,
)