CPython에서 내장 합성곱 함수 사용하기

CPython의 decimal 모듈은 C로 작성된 NTT를 사용해 큰 수의 곱셈을 수행합니다. CPython의 버그를 이용하여 메모리에 직접 접근을 할 수 있다면 Decimal 객체를 조작하여 합성곱을 구할 수 있습니다.

import array
import _io
import _decimal
 
 
class Unsafe:
    __slots__ = ('p', 'nogc')
 
    def __init__(self):
        self.nogc = []
 
    def magic(self):
        self.p = [0]
        f = _io._RawIOBase()
        f.readable = lambda: True
        f.readinto = lambda x: not self.p.__setitem__(0, x)
        r = _io.BufferedReader(f)
        r.read(1)
        del r
        ptr = self.p[0].cast('P')
        obj = [0] * len(ptr)
        self.nogc.append(obj)
        return ptr, obj
 
    def view(self, addr, n):
        ptr, obj = self.magic()
        data = array.array(
            'Q', [9, id(bytearray), n, n, addr, addr, 0]).tobytes()
        self.nogc.append(data)
        ptr[0] = id(data) + 32
        return obj[0]
 
 
class FFT:
    __slots__ = ('unsafe', 'a_repr', 'b_repr', 'a', 'b')
    _decimal.getcontext().prec = 1 << 30
    _decimal.getcontext().Emax = 1 << 30
 
    def __init__(self):
        self.unsafe = Unsafe()
        self.a_repr = array.array(
            'Q', [9, id(_decimal.Decimal), 0, 0, 0, 0, 0, 0, 0])
        self.b_repr = array.array('Q', self.a_repr)
        self.unsafe.nogc.append(self.a_repr)
        self.unsafe.nogc.append(self.b_repr)
        a_addr = int.from_bytes(
            self.unsafe.view(id(self.a_repr) + 24, 8), 'little')
        b_addr = int.from_bytes(
            self.unsafe.view(id(self.b_repr) + 24, 8), 'little')
        ptr, a_obj = self.unsafe.magic()
        ptr[0] = a_addr
        ptr, b_obj = self.unsafe.magic()
        ptr[0] = b_addr
        self.a = a_obj[0]
        self.b = b_obj[0]
 
    def conv(self, a: array.array('Q'), b: array.array('Q')) -> memoryview:
        a_buf = int.from_bytes(self.unsafe.view(id(a) + 24, 8), 'little')
        self.a_repr[6] = len(a)
        self.a_repr[8] = a_buf
        b_buf = int.from_bytes(self.unsafe.view(id(b) + 24, 8), 'little')
        self.b_repr[6] = len(b)
        self.b_repr[8] = b_buf
        c = self.a * self.b
        c_repr = self.unsafe.view(id(c) + 48, 24)
        c_len = int.from_bytes(c_repr[:8], 'little')
        c_buf = int.from_bytes(c_repr[-8:], 'little')
        self.unsafe.nogc.append(c)
        return memoryview(self.unsafe.view(c_buf, c_len * 8)).cast('Q')

a, b를 복사하지 않으며 Decimal 객체를 매번 생성하지 않아 효율적입니다. 다만 CPython에 강하게 의존하여 PyPy에서는 사용하기 어렵습니다.

임의 메모리 조작 방법은 기회가 있으면 써 보겠습니다.