2022-08-08 22:31:55 +05:30

257 lines
9.2 KiB
C

/*
* rsync.c
* Copyright (C) 2021 Kovid Goyal <kovid at kovidgoyal.net>
*
* Distributed under terms of the GPL3 license.
*/
#include "data-types.h"
#include <librsync.h>
// Capsule name used for capsules that wrap an rs_signature_t pointer
#define SIGNATURE_CAPSULE "rs_signature_t"
// Capsule name used for capsules that wrap an rs_job_t pointer; the capsule
// context may additionally hold a Python callback object
#define JOB_WITH_CALLBACK_CAPSULE "rs_callback_job_t"
// See whole.c in the librsync source code for estimating IO_BUFFER_SIZE
// This value is exported to Python as the module attribute IO_BUFFER_SIZE
#define IO_BUFFER_SIZE (64u * 1024u)
// Exception type created when the module is executed. It is raised for
// librsync failures and also serves as the non-NULL placeholder pointer stored
// in a job capsule before the real job has been attached.
static PyObject *RsyncError = NULL;
// Capsule destructor for job capsules: frees the wrapped librsync job (if a
// real one was attached) and drops the reference held on the callback that is
// stored as the capsule context.
static void
free_job_with_callback_capsule(PyObject *capsule) {
    if (!PyCapsule_IsValid(capsule, JOB_WITH_CALLBACK_CAPSULE)) return;
    void *payload = PyCapsule_GetPointer(capsule, JOB_WITH_CALLBACK_CAPSULE);
    // RsyncError is only a placeholder pointer, it must never be handed to librsync
    if (payload != NULL && payload != RsyncError) rs_job_free(payload);
    PyObject *context = PyCapsule_GetContext(capsule);
    Py_XDECREF(context);
}
// Capsule destructor for signature capsules: releases the wrapped
// rs_signature_t, if the capsule yields one.
static void
free_sig_capsule(PyObject *capsule) {
    rs_signature_t *signature = PyCapsule_GetPointer(capsule, SIGNATURE_CAPSULE);
    if (signature == NULL) return;
    rs_free_sumset(signature);
}
/*
 * CREATE_JOB(func, cb, ...)
 *
 * Declares `PyObject *job_capsule` in the enclosing scope and tries to fill it
 * with a capsule that owns the librsync job returned by func(...).
 *
 * The capsule is created first, with RsyncError as a placeholder pointer, so
 * that no job has to be torn down if capsule creation itself fails. When `cb`
 * is non-NULL it is stored as the capsule context and a reference to it is
 * taken; the capsule destructor releases that reference.
 *
 * On any failure job_capsule is left NULL with a Python exception set: either
 * the one raised by the failing PyCapsule_* call, or RsyncError when func()
 * returned NULL (without this the caller would return NULL to the interpreter
 * with no exception set).
 *
 * Note: this expands to several statements plus a declaration, so it cannot be
 * used as the sole body of an unbraced if/else.
 */
#define CREATE_JOB(func, cb, ...) \
    PyObject *job_capsule = PyCapsule_New(RsyncError, JOB_WITH_CALLBACK_CAPSULE, free_job_with_callback_capsule); \
    if (job_capsule) { \
        rs_job_t *job = func(__VA_ARGS__); \
        if (job) { \
            if (PyCapsule_SetPointer(job_capsule, job) == 0) { \
                if (cb) { \
                    if (PyCapsule_SetContext(job_capsule, cb) == 0) { Py_INCREF(cb); } \
                    else { Py_CLEAR(job_capsule); } \
                } \
            } else { \
                /* the capsule never took ownership of the job, free it here */ \
                rs_job_free(job); Py_CLEAR(job_capsule); \
            } \
        } else { \
            Py_CLEAR(job_capsule); \
            PyErr_SetString(RsyncError, "Failed to create librsync job"); \
        } \
    }
// begin_create_signature(file_size=-1, strong_len=0)
// Start a librsync signature job. Returns the tuple
// (job capsule, block length, strong sum length).
// When built with KITTY_HAS_RS_SIG_ARGS the parameters are chosen by
// rs_sig_args() and a ValueError is raised if it rejects them; otherwise fixed
// defaults (RS_DEFAULT_BLOCK_LEN, 8 byte strong sums, MD4 magic) are used.
static PyObject*
begin_create_signature(PyObject *self UNUSED, PyObject *args) {
    long long file_size = -1;
    long requested_strong_len = 0;
    if (!PyArg_ParseTuple(args, "|Ll", &file_size, &requested_strong_len)) return NULL;
    rs_magic_number magic_number = 0;
    size_t block_len = 0;
    size_t strong_len = requested_strong_len;
#ifdef KITTY_HAS_RS_SIG_ARGS
    const rs_result status = rs_sig_args(file_size, &magic_number, &block_len, &strong_len);
    if (status != RS_DONE) {
        PyErr_SetString(PyExc_ValueError, rs_strerror(status));
        return NULL;
    }
#else
    magic_number = RS_MD4_SIG_MAGIC;
    block_len = RS_DEFAULT_BLOCK_LEN;
    strong_len = 8;
#endif
    CREATE_JOB(rs_sig_begin, NULL, block_len, strong_len, magic_number);
    // "N" hands ownership of job_capsule to the tuple; a NULL capsule makes
    // Py_BuildValue return NULL as well
    return Py_BuildValue("Nnn", job_capsule, (Py_ssize_t)block_len, (Py_ssize_t)strong_len);
}
/*
 * GET_JOB_FROM_CAPSULE
 *
 * Declares `rs_job_t *job` from the `job_capsule` variable of the enclosing
 * function. If the capsule does not yield a job pointer a TypeError is set and
 * the enclosing function returns NULL.
 *
 * The final line deliberately has no trailing backslash: a continuation there
 * would splice whatever line follows the macro into its definition.
 */
#define GET_JOB_FROM_CAPSULE \
    rs_job_t *job = PyCapsule_GetPointer(job_capsule, JOB_WITH_CALLBACK_CAPSULE); \
    if (!job) { PyErr_SetString(PyExc_TypeError, "Not a job capsule"); return NULL; }
// iter_job(job_capsule, input_bytes, output_bytearray)
// Run one rs_job_iter() step, reading from input_bytes and writing into
// output_bytearray. Empty input is passed to librsync as end-of-input.
// Returns (finished, unused_input_size, output_size); raises RsyncError for
// any result other than RS_DONE or RS_BLOCKED.
static PyObject*
iter_job(PyObject *self UNUSED, PyObject *args) {
    FREE_BUFFER_AFTER_FUNCTION Py_buffer input_buf = {0};
    FREE_BUFFER_AFTER_FUNCTION Py_buffer output_buf = {0};
    PyObject *job_capsule, *output_array;
    if (!PyArg_ParseTuple(args, "O!y*O!", &PyCapsule_Type, &job_capsule, &input_buf, &PyByteArray_Type, &output_array)) return NULL;
    GET_JOB_FROM_CAPSULE;
    if (PyObject_GetBuffer(output_array, &output_buf, PyBUF_WRITE) != 0) return NULL;

    rs_buffers_t io = {
        .next_in = input_buf.buf,
        .avail_in = input_buf.len,
        .eof_in = (input_buf.len > 0) ? 0 : 1,
        .next_out = output_buf.buf,
        .avail_out = output_buf.len,
    };
    const size_t out_capacity = io.avail_out;
    const rs_result status = rs_job_iter(job, &io);
    // librsync decrements avail_out as it writes, the difference is what was produced
    const Py_ssize_t output_size = out_capacity - io.avail_out;

    if (status != RS_DONE && status != RS_BLOCKED) {
        PyErr_SetString(RsyncError, rs_strerror(status));
        return NULL;
    }
    const Py_ssize_t unused_input = io.avail_in;
    PyObject *finished = (status == RS_DONE) ? Py_True : Py_False;
    return Py_BuildValue("Onn", finished, unused_input, output_size);
}
// begin_load_signature()
// Start a librsync job that loads a signature. Returns the tuple
// (job capsule, signature capsule); the signature capsule owns the
// rs_signature_t that rs_loadsig_begin() stored into `sig`.
// Returns NULL if either capsule cannot be created.
static PyObject*
begin_load_signature(PyObject *self UNUSED, PyObject *args UNUSED) {
    rs_signature_t *sig = NULL;
    CREATE_JOB(rs_loadsig_begin, NULL, &sig);
    if (!job_capsule) {
        // sig is still NULL when the failure happened before rs_loadsig_begin()
        // ran, so guard the free the same way free_sig_capsule() does
        if (sig) rs_free_sumset(sig);
        return NULL;
    }
    PyObject *sc = PyCapsule_New(sig, SIGNATURE_CAPSULE, free_sig_capsule);
    if (!sc) {
        Py_CLEAR(job_capsule);
        if (sig) rs_free_sumset(sig);
        return NULL;
    }
    // "N" transfers ownership of both capsules to the returned tuple
    return Py_BuildValue("NN", job_capsule, sc);
}
/*
 * GET_SIG_FROM_CAPSULE
 *
 * Declares `rs_signature_t *sig` from the `sig_capsule` variable of the
 * enclosing function. If the capsule does not yield a signature pointer a
 * TypeError is set and the enclosing function returns NULL.
 */
#define GET_SIG_FROM_CAPSULE \
    rs_signature_t *sig = PyCapsule_GetPointer(sig_capsule, SIGNATURE_CAPSULE); \
    if (sig == NULL) { \
        PyErr_SetString(PyExc_TypeError, "Not a sig capsule"); \
        return NULL; \
    }
// build_hash_table(sig_capsule)
// Call rs_build_hash_table() on the signature held by sig_capsule.
// Returns None; raises RsyncError if librsync reports anything but RS_DONE.
static PyObject*
build_hash_table(PyObject *self UNUSED, PyObject *args) {
    PyObject *sig_capsule;
    if (!PyArg_ParseTuple(args, "O!", &PyCapsule_Type, &sig_capsule)) return NULL;
    GET_SIG_FROM_CAPSULE;
    const rs_result status = rs_build_hash_table(sig);
    if (status == RS_DONE) { Py_RETURN_NONE; }
    PyErr_SetString(RsyncError, rs_strerror(status));
    return NULL;
}
// begin_create_delta(sig_capsule)
// Start a librsync delta job against the signature held by sig_capsule and
// return the job capsule (NULL if the job capsule could not be created).
static PyObject*
begin_create_delta(PyObject *self UNUSED, PyObject *args) {
    PyObject *sig_capsule;
    const int parsed = PyArg_ParseTuple(args, "O!", &PyCapsule_Type, &sig_capsule);
    if (!parsed) return NULL;
    GET_SIG_FROM_CAPSULE;
    CREATE_JOB(rs_delta_begin, NULL, sig);
    return job_capsule;
}
// librsync copy callback used by patch jobs. `opaque` is the Python callable
// given to begin_patch(). It is called as callback(memoryview, pos), where the
// writable memoryview covers the `*len` bytes at `*buf`, and must return the
// number of bytes it placed there as an int.
//
// Returns RS_DONE with *len updated on success, RS_MEM_ERROR if the memoryview
// cannot be created, RS_IO_ERROR if the callback raised, and
// RS_INTERNAL_ERROR if the callback returned something that is not a usable
// length (not an int, negative, too large for size_t, or larger than the
// buffer it was given).
static rs_result
copy_callback(void *opaque, rs_long_t pos, size_t *len, void **buf) {
    PyObject *callback = opaque;
    const size_t requested = *len;
    long long p = pos;
    PyObject *mem = PyMemoryView_FromMemory(*buf, requested, PyBUF_WRITE);
    if (!mem) { PyErr_Clear(); return RS_MEM_ERROR; }
    PyObject *res = PyObject_CallFunction(callback, "OL", mem, p);
    Py_DECREF(mem);
    if (res == NULL) { PyErr_Print(); return RS_IO_ERROR; }
    rs_result r = RS_INTERNAL_ERROR;
    if (PyLong_Check(res)) {
        const size_t provided = PyLong_AsSize_t(res);
        if (provided == (size_t)-1 && PyErr_Occurred()) {
            // negative or overflowing value: report it rather than leave the
            // exception pending and hand (size_t)-1 to librsync
            PyErr_Print();
        } else if (provided <= requested) {
            // the callback can never have written more than the buffer holds,
            // so only lengths up to the requested size are accepted
            *len = provided;
            r = RS_DONE;
        }
    }
    Py_DECREF(res);
    return r;
}
// begin_patch(callback)
// Start a librsync patch job whose copy callback forwards to the Python
// callable `callback`. Returns the job capsule (NULL if it could not be
// created); raises TypeError if callback is not callable.
static PyObject*
begin_patch(PyObject *self UNUSED, PyObject *callback) {
    if (PyCallable_Check(callback)) {
        // callback is both the capsule context (keeps it alive) and the opaque
        // argument librsync passes back to copy_callback
        CREATE_JOB(rs_patch_begin, callback, copy_callback, callback);
        return job_capsule;
    }
    PyErr_SetString(PyExc_TypeError, "callback must be a callable");
    return NULL;
}
// Invoke callback(key, value, has_semicolons) where key and value are
// read-only memoryviews over the given sub-ranges of src.
// Returns false if a memoryview could not be created or the call returned
// NULL, true otherwise.
// NOTE(review): the temporaries rely on DECREF_AFTER_FUNCTION (defined outside
// this file) to release them on return -- confirm against its definition.
static bool
call_ftc_callback(PyObject *callback, char *src, Py_ssize_t key_start, Py_ssize_t key_length, Py_ssize_t val_start, Py_ssize_t val_length, PyObject *has_semicolons) {
    DECREF_AFTER_FUNCTION PyObject *key_view = PyMemoryView_FromMemory(src + key_start, key_length, PyBUF_READ);
    if (key_view == NULL) return false;
    DECREF_AFTER_FUNCTION PyObject *value_view = PyMemoryView_FromMemory(src + val_start, val_length, PyBUF_READ);
    if (value_view == NULL) return false;
    DECREF_AFTER_FUNCTION PyObject *outcome = PyObject_CallFunctionObjArgs(callback, key_view, value_view, has_semicolons, NULL);
    const bool call_succeeded = (outcome != NULL);
    return call_succeeded;
}
// decode_utf8_buffer(data)
// Build a str from the bytes of the supplied buffer using
// PyUnicode_FromStringAndSize(); returns NULL with an exception set on failure.
static PyObject*
decode_utf8_buffer(PyObject *self UNUSED, PyObject *args) {
    FREE_BUFFER_AFTER_FUNCTION Py_buffer data = {0};
    if (PyArg_ParseTuple(args, "s*", &data)) {
        return PyUnicode_FromStringAndSize(data.buf, data.len);
    }
    return NULL;
}
// parse_ftc(data, callback)
// Scan data for `key=value` records separated by single ';' characters and
// call callback(key, value, has_semicolons) for each one. A doubled ";;"
// inside a value does not end the record; it is left in the value as is and
// has_semicolons is passed as True for that record. A final record without a
// terminating ';' is reported as well.
// Returns None, or NULL as soon as a callback invocation fails. Raises
// TypeError if callback is not callable.
static PyObject*
parse_ftc(PyObject *self UNUSED, PyObject *args) {
    FREE_BUFFER_AFTER_FUNCTION Py_buffer buf = {0};
    PyObject *callback;
    size_t key_start = 0, key_length = 0, val_start = 0, val_length = 0;
    if (!PyArg_ParseTuple(args, "s*O", &buf, &callback)) return NULL;
    char *src = buf.buf;
    const size_t total = buf.len;
    if (!PyCallable_Check(callback)) { PyErr_SetString(PyExc_TypeError, "callback must be callable"); return NULL; }
    PyObject *has_semicolons = Py_False;

    for (size_t pos = 0; pos < total; pos++) {
        const char current = src[pos];
        // key_length == 0 means the '=' ending the current key has not been seen yet
        if (key_length == 0) {
            if (current != '=') continue;
            key_length = pos - key_start;
            val_start = pos + 1;
            has_semicolons = Py_False;
            continue;
        }
        if (current != ';') continue;
        if (pos + 1 < total && src[pos + 1] == ';') {
            // doubled semicolon: part of the value, skip over the second one
            has_semicolons = Py_True;
            pos++;
            continue;
        }
        // single semicolon: the record is complete
        val_length = pos - val_start;
        if (!call_ftc_callback(callback, src, key_start, key_length, val_start, val_length, has_semicolons)) return NULL;
        key_length = 0;
        key_start = pos + 1;
        val_start = 0;
    }

    // trailing record that was not terminated by ';'
    if (key_length && val_start) {
        val_length = total - val_start;
        if (!call_ftc_callback(callback, src, key_start, key_length, val_start, val_length, has_semicolons)) return NULL;
    }
    Py_RETURN_NONE;
}
static PyMethodDef module_methods[] = {
{"begin_create_signature", begin_create_signature, METH_VARARGS, ""},
{"begin_load_signature", begin_load_signature, METH_NOARGS, ""},
{"build_hash_table", build_hash_table, METH_VARARGS, ""},
{"begin_patch", begin_patch, METH_O, ""},
{"begin_create_delta", begin_create_delta, METH_VARARGS, ""},
{"iter_job", iter_job, METH_VARARGS, ""},
{"parse_ftc", parse_ftc, METH_VARARGS, ""},
{"decode_utf8_buffer", decode_utf8_buffer, METH_VARARGS, ""},
{NULL, NULL, 0, NULL} /* Sentinel */
};
// Module exec slot: creates the RsyncError exception type and publishes it,
// together with the IO_BUFFER_SIZE constant, as attributes of module m.
// Returns 0 on success and -1 with a Python exception set on failure.
static int
exec_module(PyObject *m) {
    RsyncError = PyErr_NewException("rsync.RsyncError", NULL, NULL);
    if (RsyncError == NULL) return -1;
    // PyModule_AddObject only steals the reference when it succeeds, so on
    // failure the exception type has to be released here
    if (PyModule_AddObject(m, "RsyncError", RsyncError) != 0) {
        Py_CLEAR(RsyncError);
        return -1;
    }
    if (PyModule_AddIntMacro(m, IO_BUFFER_SIZE) != 0) return -1;
    return 0;
}
// Module slots: run exec_module() when the module is executed.
// The function pointer is stored through a void* cast, hence the surrounding
// warning-suppression macros.
IGNORE_PEDANTIC_WARNINGS
static PyModuleDef_Slot slots[] = {
    {Py_mod_exec, (void*)exec_module},
    {0, NULL},
};
END_IGNORE_PEDANTIC_WARNINGS
// Definition of the "rsync" module: its method table and its slots
static struct PyModuleDef module = {
    .m_base = PyModuleDef_HEAD_INIT,
    .m_name = "rsync", /* name of module */
    .m_doc = NULL,
    .m_methods = module_methods,
    .m_slots = slots,
};
// Import entry point: hands the module definition to PyModuleDef_Init() and
// returns its result.
EXPORTED PyMODINIT_FUNC
PyInit_rsync(void) {
    PyObject *definition = PyModuleDef_Init(&module);
    return definition;
}