Compare commits

..

58 Commits

Author SHA1 Message Date
wangjiyu 49c540a78e debug 2025-05-28 15:26:24 +08:00
wangjiyu 392ec2416b debug 2025-05-04 11:18:59 +08:00
wangjiyu a9d531c6fc debug 2025-05-04 11:14:22 +08:00
wangjiyu 00bd8c4c64 debug 2025-05-04 11:03:44 +08:00
wangjiyu e70e728b98 debug 2025-05-04 10:58:59 +08:00
wangjiyu 7ed30e6edc debug 2025-05-04 10:48:24 +08:00
wangjiyu 0843f56fa9 debug 2025-05-04 10:27:31 +08:00
wangjiyu 3944db37fd debug 2025-05-04 10:05:49 +08:00
wangjiyu 396f808877 debug 2025-05-04 10:01:24 +08:00
wangjiyu 98c7b8e7ad debug 2025-05-04 09:47:49 +08:00
wangjiyu 6e6e7f4337 debug 2025-05-03 23:32:21 +08:00
wangjiyu a4713448d7 debug 2025-05-03 23:20:21 +08:00
wangjiyu f5840b46d2 debug 2025-05-03 23:03:33 +08:00
wangjiyu b6a33bcfbd debug 2025-05-03 23:02:06 +08:00
wangjiyu 0228402b5b debug 2025-05-03 22:58:13 +08:00
wangjiyu 39c474fa22 debug 2025-05-03 22:55:10 +08:00
wangjiyu ceff0bd694 use pybind 2025-05-03 21:51:02 +08:00
wangjiyu f688c690aa add demo:play audio in python after migu rtc 2025-04-24 16:38:10 +08:00
wangjiyu 95969ffcc8 add demo:send audio to app 2025-04-24 10:31:26 +08:00
wangjiyu 756e782ef1 debug 2025-04-16 19:46:35 +08:00
wangjiyu dcb81f9915 debug 2025-04-16 19:43:18 +08:00
wangjiyu b34a1956ee debug 2025-04-16 19:40:25 +08:00
wangjiyu f00ed230a0 debug 2025-04-16 19:38:34 +08:00
wangjiyu af0a29f3dc debug 2025-04-16 19:30:53 +08:00
wangjiyu d910833a9c debug 2025-04-16 19:09:51 +08:00
wangjiyu 3157894c1a debug 2025-04-16 19:07:53 +08:00
wangjiyu ad48b2e55a debug 2025-04-16 17:53:08 +08:00
wangjiyu 0bee448294 debug 2025-04-16 17:46:00 +08:00
wangjiyu df30aa53c9 debug 2025-04-16 17:44:03 +08:00
wangjiyu 815956c01c debug 2025-04-16 17:29:00 +08:00
wangjiyu 3fbe05cf92 debug 2025-04-16 17:24:57 +08:00
wangjiyu 5c5228c3b2 debug 2025-04-16 17:04:32 +08:00
wangjiyu 6cb5d60eb5 debug 2025-04-16 16:55:10 +08:00
wangjiyu a6e6f7fdde debug 2025-04-16 16:29:16 +08:00
wangjiyu e7fc174bc7 debug 2025-04-16 16:19:22 +08:00
wangjiyu 9ef5758116 debug 2025-04-16 16:18:24 +08:00
wangjiyu 29f14acd5f debug 2025-04-16 16:04:25 +08:00
wangjiyu 7c11d681f9 debug 2025-04-16 15:59:45 +08:00
wangjiyu e089162220 debug 2025-04-16 15:44:43 +08:00
wangjiyu fe9c640c5b debug 2025-04-16 15:40:46 +08:00
wangjiyu b04c665ac6 debug 2025-04-16 15:31:43 +08:00
wangjiyu 0042f506c2 debug 2025-04-16 15:30:55 +08:00
wangjiyu 088f373770 debug 2025-04-16 11:34:51 +08:00
wangjiyu 6f24ab5105 debug 2025-04-16 11:26:13 +08:00
wangjiyu 847aad603e debug 2025-04-16 11:23:04 +08:00
wangjiyu f3fbcf94f7 debug 2025-04-16 11:18:33 +08:00
wangjiyu 80fe99160f debug 2025-04-16 11:15:19 +08:00
wangjiyu c668b06ef8 debug 2025-04-16 11:05:29 +08:00
wangjiyu a98aa02dce debug 2025-04-16 10:53:36 +08:00
wangjiyu c1130200b8 debug 2025-04-16 10:47:29 +08:00
wangjiyu c58d016357 debug 2025-04-16 10:45:48 +08:00
wangjiyu 8a2389bf68 debug 2025-04-16 10:39:45 +08:00
wangjiyu b9a981b57a debug 2025-04-15 23:43:13 +08:00
wangjiyu f53fc89531 debug 2025-04-15 23:36:59 +08:00
wangjiyu c8c3a25fe9 debug 2025-04-15 23:31:07 +08:00
wangjiyu 418654abf4 debug 2025-04-15 23:23:35 +08:00
wangjiyu 715687e85c debug 2025-04-15 23:21:48 +08:00
wangjiyu 6936dfd292 debug 2025-04-15 23:13:54 +08:00
10 changed files with 361 additions and 357 deletions

View File

@ -1,17 +1,3 @@
g++ -shared -fPIC \
-I/usr/include/python3.10 -I/usr/include/python3.10/numpy -I./include \
-L./lib -L/usr/lib/x86_64-linux-gnu \
-DRTC_NUMPY_IMPL \
rtc_plugins.cpp util/RTCContext.cpp \
-lMRTCEngine -lboost_python310 -lboost_numpy310 -lpython3.10 \
-Wl,-rpath='$ORIGIN/lib' \
-o rtc_plugins.so
#g++ -shared -fPIC \
# -I/usr/include/python3.10 -I/usr/include/python3.10/numpy -I./include \
# -I/usr/include/python3.10 -I/usr/include/numpy \
# -Wl,-rpath='$ORIGIN/lib' \
# -lboost_python310 -lpython3.10 \
# -lMRTCEngine -lboost_python310 -lpython3.10 \
# -L$(python3 -c "import numpy; print(numpy.get_include())") \
# rtc_plugins.cpp util/RTCContext.cpp \
# -o rtc_plugins.so
#g++ -shared -fPIC -std=c++17 $(python3 -m pybind11 --includes) -I./include -L./lib -L/usr/lib/x86_64-linux-gnu -lMRTCEngine -lpython3.10 -Wl,-rpath='$ORIGIN/lib' -o rtc_plugins$(python3-config --extension-suffix) rtc_plugins.cpp util/RTCContext.cpp
g++ -shared -fPIC -std=c++17 $(python3 -m pybind11 --includes) -I./include -L./lib -L/usr/lib/x86_64-linux-gnu -Wl,--no-as-needed -lMRTCEngine -Wl,--as-needed -lpython3.10 -Wl,-rpath='$ORIGIN/lib' -o rtc_plugins$(python3-config --extension-suffix) rtc_plugins.cpp util/RTCContext.cpp

View File

@ -1,20 +1,11 @@
// rtc_plugins.cpp
#include "util/RTCContext.h"
#include <pybind11/pybind11.h>
#include <pybind11/numpy.h> // pybind11 的 NumPy 支持
#define IMPLEMENT_NUMPY_API // 标记这是实现文件
#include "util/numpyStub.h"
namespace py = pybind11;
#include "util/RTCContext.h"
// 提供转换接口
void** get_numpy_api() {
return (void**)RTC_PLUGINS_ARRAY_API;
}
namespace py = boost::python;
int init(const char* selfUserId, const char* selfDisplayName, const char* selfRoomId, boost::python::object callback) {
RTCContext::instance().setPyCallback(callback);
int init(const char* selfUserId, const char* selfDisplayName, const char* selfRoomId) {
bool res = RTCContext::instance().init(selfUserId, selfDisplayName, selfRoomId);
if (res) {
return 0;
@ -23,7 +14,6 @@ int init(const char* selfUserId, const char* selfDisplayName, const char* selfRo
}
}
int initRecv(const char* destRoomId, const char* srcUserId, const int16_t destChannelIndex) {
bool res = RTCContext::instance().initRecv(destRoomId, srcUserId, destChannelIndex);
if (res) {
return 0;
@ -31,7 +21,7 @@ int initRecv(const char* destRoomId, const char* srcUserId, const int16_t destCh
return -1;
}
}
int initSend(const char* srcRoomId, const char* destRoomId, const int16_t destChannelIndex, const uint8_t channelNum) {
int initSend(const char* srcRoomId, const char* destRoomId, const int16_t destChannelIndex, const int16_t channelNum) {
bool res = RTCContext::instance().initSend(srcRoomId, destRoomId, destChannelIndex, channelNum);
if (res) {
return 0;
@ -39,92 +29,84 @@ int initSend(const char* srcRoomId, const char* destRoomId, const int16_t destCh
return -1;
}
}
py::object create_int16_array() {
// 1. 定义数组维度1维长度为 4
npy_intp dims[1] = {4};
// 2. 创建原生 C 数组int16_t 数据)
int16_t data[4] = {1, 2, -3, 4}; // 示例数据
// 3. 通过 NumPy C API 创建 PyObject*
PyObject* py_array = PyArray_SimpleNewFromData(
1, // 维度数
dims, // 各维度大小
NPY_INT16, // 数据类型np.int16
data // 数据指针
// NumPy 数据交互(关键修改)
py::array_t<int16_t> getNumpyData() {
return py::array_t<int16_t>(
RTCContext::instance().getNumpyData() // 假设返回的是已有 NumPy 数组
);
if (!py_array) {
throw std::runtime_error("Failed to create NumPy array");
}
// 4. 转换为 py::object自动管理引用计数
return py::object(py::handle<>(py_array));
}
int sendCustomAudioData(int16_t destChannelIndex, py::object pD,
int sendCustomAudioData(int16_t destChannelIndex, py::array_t<int16_t> inputArray,
int32_t sampleRate, uint64_t channelNum, uint64_t dataLen) {
try {
// 强制转换为 int16 连续数组
PyObject* py_array = PyArray_FROM_OTF(
pD.ptr(),
NPY_INT16,
NPY_ARRAY_IN_ARRAY | NPY_ARRAY_FORCECAST
);
if (!py_array) {
throw std::runtime_error("Failed to convert input to int16 array");
}
//py::gil_scoped_release release;
// 修复点:使用花括号初始化
py::object arr{py::handle<>(py_array)};
// 检查数据长度
PyArrayObject* npArray = reinterpret_cast<PyArrayObject*>(arr.ptr());
if (PyArray_SIZE(npArray) != static_cast<npy_intp>(dataLen)) {
Py_DECREF(py_array);
throw std::runtime_error("Array length does not match dataLen");
}
// 处理数据...
void* dataPtr = PyArray_DATA(npArray);
int ret = RTCContext::instance().sendCustomAudioData(
destChannelIndex, dataPtr, sampleRate, channelNum, dataLen
);
Py_DECREF(py_array); // 释放临时数组
return ret;
} catch (...) {
PyErr_SetString(PyExc_RuntimeError, "Invalid audio data");
return -1;
py::array_t<int16_t> contiguous = py::array::ensure(inputArray);
if (!contiguous) throw py::value_error("Array conversion failed");
auto buf = contiguous.request();
if (buf.size != dataLen) {
throw py::value_error("Array length does not match dataLen");
}
std::vector<int16_t> localCopy(static_cast<int16_t*>(buf.ptr),
static_cast<int16_t*>(buf.ptr) + buf.size);
return RTCContext::instance().sendCustomAudioData(
destChannelIndex, localCopy.data(), sampleRate, channelNum, dataLen
);
//return RTCContext::instance().sendCustomAudioData(
// destChannelIndex, buf.ptr, sampleRate, channelNum, dataLen
//);
}
// Python-facing wrapper: forwards to RTCContext::getListData() on the
// process-wide singleton and hands its py::list straight back to the caller.
py::list getListData() {
    auto& ctx = RTCContext::instance();
    return ctx.getListData();
}
// Python-facing wrapper: returns RTCContext::getSize() of the singleton,
// widened to int.
int getSize() {
    auto& ctx = RTCContext::instance();
    return ctx.getSize();
}
// Python-facing wrapper: returns the frame produced by RTCContext::getData()
// on the singleton.
// NOTE(review): RTCContext::getData() has its lock_guard commented out, so
// this entry point appears to touch the frame queue without holding
// dataMutex_ - confirm whether that is intended.
RetAudioFrame getData() {
    auto& ctx = RTCContext::instance();
    return ctx.getData();
}
// Python-facing wrapper: forwards to RTCContext::getDataCount() on the
// singleton and returns its int16_t result unchanged.
int16_t getDataCount() {
    auto& ctx = RTCContext::instance();
    return ctx.getDataCount();
}
void init_numpy() {
// 直接调用底层函数,绕过宏的问题
if (_import_array() < 0) {
PyErr_SetString(PyExc_ImportError, "numpy.core.multiarray failed to import");
throw std::runtime_error("NumPy initialization failed");
}
std::cout << "NumPy API addr: " << PyArray_API << std::endl;
}
BOOST_PYTHON_MODULE(rtc_plugins) {
try {
init_numpy();
void** numpyApi = (void**)PyArray_API;
if (!numpyApi || !numpyApi[93]) { // 93是PyArray_SimpleNew的偏移量
std::cout << "NumPy API corrupt! Key functions missing." << std::endl;
PyErr_Print();
throw std::runtime_error("Invalid NumPy API state");
} else {
RTCContext::instance().setNumpyApi(numpyApi);
std::cout << "set numpyApi succ:" << numpyApi[93] << std::endl;
}
PYBIND11_MODULE(rtc_plugins, m) {
// 可选:暴露 RetAudioFrame 类(需额外绑定)
py::class_<RetAudioFrame>(m, "RetAudioFrame")
// 定义 data 属性(包含 getter 和 setter
.def_property("data",
// Getter返回 NumPy 数组
[](RetAudioFrame& self) {
return py::array_t<short>(
{self.dataCount}, // 数组形状
{sizeof(short)}, // 步长
self.data.get() // 数据指针(原始内存)
);
},
// Setter从 NumPy 数组复制数据
[](RetAudioFrame& self, py::array_t<short> arr) {
auto buf = arr.request(); // 获取数组信息
self.data.reset(new short[buf.size]); // 重新分配内存
std::memcpy(
self.data.get(), // 目标指针
buf.ptr, // 源数据指针
buf.size * sizeof(short) // 数据大小
);
self.dataCount = buf.size; // 更新数据长度
}
)
.def_readwrite("dataCount", &RetAudioFrame::dataCount)
.def_readwrite("sampleRate", &RetAudioFrame::sampleRate)
.def_readwrite("numChannels", &RetAudioFrame::numChannels)
.def_readwrite("channelIndex", &RetAudioFrame::channelIndex);
m.def("init", &init);
m.def("initRecv", &initRecv);
m.def("initSend", &initSend);
m.def("sendCustomAudioData", &sendCustomAudioData);
m.def("getSize", &getSize);
m.def("getData", &getData);
m.def("getNumpyData", &getNumpyData);
m.def("getListData", &getListData);
m.def("getDataCount", &getDataCount);
py::def("init", &init);
py::def("initRecv", &initRecv);
py::def("initSend", &initSend);
py::def("sendCustomAudioData", &sendCustomAudioData);
} catch (...) {
PyErr_SetString(PyExc_RuntimeError, "Module initialization failed");
}
}

45
test_audio_r.py Normal file
View File

@ -0,0 +1,45 @@
import rtc_plugins
import time
import sounddevice as sd
import numpy as np
import mmap
import os
from ctypes import c_int16
import struct
# Demo receiver script: initialises rtc_plugins as the destination user,
# waits for the receive side to be ready, then polls getListData() in an
# endless loop and plays each returned frame through sounddevice.

# Identities and room used by the demo; sender and receiver share one room.
srcUserId = "srcUser12"
destUserId = "destUser12"
srcDisplayName = "srcDisplayName12"
destDisplayName = "destDisplayName12"
srcRoomId = "srcRoom12"
#destRoomId = "destRoomId12"
destRoomId = srcRoomId
srcChannelIndex = 46
destChannelIndex = 47
# Callback that only prints the values it is given.
def my_callback_r(shmName, dataSize, dataCount, sampleRate, numChannels, channelIndex):
print(f"my_callback_r, dataSize:{dataSize}, dataCount:{dataCount}, sampleRate:{sampleRate}, numChannels:{numChannels}, channelIndex:{channelIndex}")
print(f"data:{shmName}")
print("after my_callback_r")
# NOTE(review): the pybind11 init() in rtc_plugins.cpp takes three arguments
# (userId, displayName, roomId); the fourth argument here presumably makes
# the call fail with TypeError - confirm and drop my_callback_r if so.
ret = rtc_plugins.init(destUserId, destDisplayName, destRoomId, my_callback_r)
if ret != 0:
print(f"init fail, ret:{ret}")
exit(1)
# A non-zero return from initRecv is treated as fatal.
ret = rtc_plugins.initRecv(destRoomId, srcUserId, destChannelIndex)
if ret != 0:
print(f"initRecv fail, ret:{ret}")
exit(1)
#ret = rtc_plugins.initSend(destRoomId, srcRoomId, srcChannelIndex, 1)
#if ret != 0:
# print(f"initSend fail, ret:{ret}")
# exit(1)
# Playback rate handed to sounddevice.
# NOTE(review): presumably must match the sender's sample rate - confirm.
sampleRate = 16000
while True:
# getListData() returns a Python list of the next queued frame's samples
# (an empty list when the dequeued frame carries no data).
frame = rtc_plugins.getListData()
# NOTE(review): a plain list of ints (or an empty list) may not be accepted
# by sd.play(); presumably it needs np.asarray(frame, dtype=np.int16) and an
# empty-frame check - confirm against the sounddevice documentation.
sd.play(frame, sampleRate)
sd.wait()
print(f"get frame:{frame}")
time.sleep(0.005)

51
test_audio_s.py Normal file
View File

@ -0,0 +1,51 @@
import rtc_plugins
import time
import numpy as np
from scipy.io import wavfile
# Demo sender script: initialises rtc_plugins as the source user, opens a
# send channel, reads a WAV file and pushes its samples through
# sendCustomAudioData() - once up front and then repeatedly in a loop.

# Identities and room used by the demo; sender and receiver share one room.
srcUserId = "srcUser12"
destUserId = "destUser12"
srcDisplayName = "srcDisplayName12"
destDisplayName = "destDisplayName12"
srcRoomId = "srcRoom12"
#destRoomId = "destRoomId12"
destRoomId = srcRoomId
srcChannelIndex = 46
destChannelIndex = 47
# A non-zero return from init or initSend is treated as fatal.
ret = rtc_plugins.init(srcUserId, srcDisplayName, srcRoomId)
if ret != 0:
print(f"init fail, ret:{ret}")
exit(1)
# Last argument is the channel count (1).
ret = rtc_plugins.initSend(srcRoomId, destRoomId, destChannelIndex, 1)
if ret != 0:
print(f"initSend fail, ret:{ret}")
exit(1)
#audioData = np.array([0, 1, -1, 0], dtype=np.int16)
sampleRate, audioData = wavfile.read("xusample1.wav")
print(f"sampleRate:{sampleRate} HZ")
print(f"shape:{audioData.shape}")
print(f"type:{audioData.dtype}")
# Anything that is not already int16 is scaled by 32767 and cast to int16.
# NOTE(review): presumably assumes float samples in [-1, 1]; other integer
# widths would be mis-scaled - confirm the expected input format.
if audioData.dtype != np.int16:
audioData = (audioData * 32767).astype(np.int16)
# NOTE(review): len(audioData) is the first-axis length only; the binding
# rejects the call when the array's total size differs from dataLen, so
# multi-channel WAV data would presumably fail here - confirm input is mono.
ret = rtc_plugins.sendCustomAudioData(destChannelIndex, audioData, sampleRate, 1, len(audioData))
if ret != 0:
print(f"send fail, ret:{ret}")
print("send succ")
ret = rtc_plugins.initRecv(srcRoomId, srcUserId, srcChannelIndex)
if ret != 0:
print(f"initRecv fail, ret:{ret}")
exit(1)
# Re-send the same buffer 100 times; a failed send is reported, not fatal.
for i in range(100):
ret = rtc_plugins.sendCustomAudioData(destChannelIndex, audioData, sampleRate, 1, len(audioData))
if ret != 0:
print(f"send fail, ret:{ret}")
#size = rtc_plugins.getSize()
#print(f"data size:{size}")
#frame = rtc_plugins.getListData()
#print(f"get frame:{frame}")
#dataCount = rtc_plugins.getDataCount()
#print(f"data count:{dataCount}")
time.sleep(3)

View File

@ -17,7 +17,7 @@ ret = rtc_plugins.init(srcUserId, srcDisplayName, srcRoomId, my_callback)
if ret != 0:
print(f"init fail, ret:{ret}")
exit(1)
ret = rtc_plugins.initSend(srcRoomId, destRoomId, destChannelIndex, 1)
ret = rtc_plugins.initSend(srcRoomId, destRoomId, destChannelIndex)
if ret != 0:
print(f"initSend fail, ret:{ret}")
exit(1)

View File

@ -4,6 +4,7 @@ import numpy as np
import mmap
import os
from ctypes import c_int16
import struct
srcUserId = "srcUser12"
destUserId = "destUser12"
@ -15,11 +16,12 @@ srcRoomId = "srcRoom12"
destRoomId = srcRoomId
srcChannelIndex = 46
destChannelIndex = 47
def my_callback(shmName, dataSize, dataCount, sampleRate, numChannels, channelIndex):
print(f"dataSize:{dataSize}, dataCount:{dataCount}, sampleRate:{sampleRate}, numChannels:{numChannels}, channelIndex:{channelIndex}")
def my_callback_r(shmName, dataSize, dataCount, sampleRate, numChannels, channelIndex):
print(f"my_callback_r, dataSize:{dataSize}, dataCount:{dataCount}, sampleRate:{sampleRate}, numChannels:{numChannels}, channelIndex:{channelIndex}")
print(f"data:{shmName}")
print("after my_callback_r")
ret = rtc_plugins.init(destUserId, destDisplayName, destRoomId, my_callback)
ret = rtc_plugins.init(destUserId, destDisplayName, destRoomId, my_callback_r)
if ret != 0:
print(f"init fail, ret:{ret}")
exit(1)
@ -34,10 +36,17 @@ if ret != 0:
while True:
print("recv")
#audioData = np.array([0, 1, -1, 0], dtype=np.int16)
#ret = rtc_plugins.sendCustomAudioData(srcChannelIndex, audioData, 48000, 1, len(audioData))
#if ret != 0:
# print(f"resend fail, ret:{ret}")
#else:
# print("resend succ")
time.sleep(30)
audioData = np.array([0, 1, -1, 0], dtype=np.int16)
ret = rtc_plugins.sendCustomAudioData(srcChannelIndex, audioData, 48000, 1, len(audioData))
if ret != 0:
print(f"resend fail, ret:{ret}")
else:
print("resend succ")
size = rtc_plugins.getSize()
print(f"data size:{size}")
#frame = rtc_plugins.getNumpyData()
frame = rtc_plugins.getListData()
print(f"get frame:{frame}")
dataCount = rtc_plugins.getDataCount()
print(f"data count:{dataCount}")
time.sleep(0.005)

View File

@ -12,8 +12,10 @@ srcRoomId = "srcRoom12"
destRoomId = srcRoomId
srcChannelIndex = 46
destChannelIndex = 47
def my_callback(npData, dataCount, sampleRate, numChannels, channelIndex):
print(f"dataCount:{dataCount}, sampleRate:{sampleRate}, numChannels:{numChannels}, channelIndex:{channelIndex}")
def my_callback(shmName, dataSize, dataCount, sampleRate, numChannels, channelIndex):
print(f"my_callback, dataSize:{dataSize}, dataCount:{dataCount}, sampleRate:{sampleRate}, numChannels:{numChannels}, channelIndex:{channelIndex}")
print(f"data:{shmName}")
print("after my_callback_r")
ret = rtc_plugins.init(srcUserId, srcDisplayName, srcRoomId, my_callback)
if ret != 0:
print(f"init fail, ret:{ret}")
@ -34,4 +36,11 @@ for i in range(100):
ret = rtc_plugins.sendCustomAudioData(destChannelIndex, audioData, 48000, 1, len(audioData))
if ret != 0:
print(f"send fail, ret:{ret}")
time.sleep(30)
size = rtc_plugins.getSize()
print(f"data size:{size}")
frame = rtc_plugins.getListData()
print(f"get frame:{frame}")
dataCount = rtc_plugins.getDataCount()
print(f"data count:{dataCount}")
time.sleep(3)

View File

@ -1,5 +1,5 @@
#include "RTCContext.h"
#define GIL
#include <fstream>
void RTCContext::onRoom(uint32_t typeId, RTCENGINE_NAMESPACE::MRTCRoomInfo& roomInfo) {
//std::cout << "RTCContext::onRoom():" << roomInfo.roomId << "," << roomInfo.displayName << "," << roomInfo.userId << "," << roomInfo.message;
@ -7,14 +7,16 @@ void RTCContext::onRoom(uint32_t typeId, RTCENGINE_NAMESPACE::MRTCRoomInfo& room
std::lock_guard<std::mutex> lock(mutex_);
isOnRoom_ = true;
}
void RTCContext::onConsumer(uint32_t msgId, const char* roomId, const char* peerId,
RTCENGINE_NAMESPACE::MRTCConsumerInfo& consumerInfo) {
std::cout << "RTCContext::onConsumer():" << consumerInfo.roomId << "," << consumerInfo.displayName << ","
<< consumerInfo.channelIndex << std::endl;
if (isRecv_) {
std::lock_guard<std::mutex> lock(mutex_);
void RTCContext::onConsumer(uint32_t msgId, const char* roomId, const char* peerId, RTCENGINE_NAMESPACE::MRTCConsumerInfo& consumerInfo) {
std::cout << "RTCContext::onConsumer()" << std::endl;
std::cout << "RTCContext::onConsumer():msgId:" << msgId << ", roomId:" << consumerInfo.roomId << ", displayName:"
<< consumerInfo.displayName << ", type:" << consumerInfo.audioSourceType << ", channelIndex:" << (int)consumerInfo.channelIndex
<< std::endl;
if (msgId == RTCENGINE_NAMESPACE::MRTCConsumerStatusType::TYPE_STATUS_CONSUMER_START && std::string(consumerInfo.kind) == "audio") {
std::lock_guard <std::mutex> lock(mutex_);
isOnConsumer_ = true;
std::cout << "registerSoundLevelListener" << std::endl;
int16_t ret1 = rtcEngine_->registerSoundLevelListener(mrtc::TYPE_AUDIO_SOURCE_CUSTOM, consumerInfo.roomId,
int16_t ret1 = rtcEngine_->registerSoundLevelListener(consumerInfo.audioSourceType, roomId,
peerId, consumerInfo.channelIndex, this);
if (0 != ret1) {
std::cout << "RTCContext::instance().registerSoundLevelListener() inUser failed, ret:" << ret1;
@ -22,7 +24,7 @@ void RTCContext::onConsumer(uint32_t msgId, const char* roomId, const char* peer
}
std::cout << "muteAudio" << std::endl;
int16_t ret2 = rtcEngine_->muteAudio(consumerInfo.roomId, peerId, mrtc::TYPE_AUDIO_SOURCE_CUSTOM,
int16_t ret2 = rtcEngine_->muteAudio(roomId, peerId, consumerInfo.audioSourceType,
false, consumerInfo.channelIndex);
if (0 != ret2) {
std::cout << "RTCContext::instance().muteAudio() failed, ret:" << ret2;
@ -45,6 +47,7 @@ void RTCContext::onCallBackMessage(uint32_t msgId, const char* msg) {
}
std::cout << "RTCContext::onCallBackMessage(), msgId:" << msgId << ", msg:" << msg << std::endl;
//std::cout << "RTCContext::onCallBackMessage()" << std::endl;
}
void RTCContext::onCallBackCustomData(RTCENGINE_NAMESPACE::MRTCCustomDataObject object) {
//std::cout << "RTCContext::onCallBackCustomData(), obj:" << object.peerId << "," << object.data << "," << object.data_length;
@ -53,154 +56,43 @@ void RTCContext::onCallBackCustomData(RTCENGINE_NAMESPACE::MRTCCustomDataObject
void RTCContext::onSoundLevelUpdate(const char* roomId, const char* peerId, uint16_t audioSourceType,
uint8_t channelIndex, uint16_t volume, int32_t vad)
{
std::cout << "RTCContext::onSoundLevelUpdate()" << std::endl;
//std::cout << "RTCContext::onSoundLevelUpdate()" << std::endl;
}
/**
 * Prints the current system-clock time to stdout as
 * "Timestamp: <seconds>.<mmm>" followed by a flushed newline.
 *
 * <seconds> is the whole number of seconds since the clock's epoch and
 * <mmm> is the millisecond remainder, always written with three digits so
 * that e.g. 5 ms appears as ".005" instead of ".5".
 */
void printTimestamp() {
    // Take one reading so both fields describe the same instant.
    const auto sinceEpoch = std::chrono::system_clock::now().time_since_epoch();

    const auto seconds =
        std::chrono::duration_cast<std::chrono::seconds>(sinceEpoch).count();
    const auto millis =
        std::chrono::duration_cast<std::chrono::milliseconds>(sinceEpoch).count() % 1000;

    std::cout << "Timestamp: " << seconds << ".";
    // Zero-pad by hand: keeps the stream's formatting state untouched.
    if (millis < 100) {
        std::cout << '0';
    }
    if (millis < 10) {
        std::cout << '0';
    }
    std::cout << millis << std::endl;
}
void RTCContext::onAudioProcess(const char* roomId, const char* peerId,
mrtc::MRTCAudioFrame& audioFrame,
mrtc::MRTCAudioSourceType audioSourceType)
{
namespace np = boost::python::numpy;
namespace py = boost::python;
Py_Initialize(); // 初始化 Python
np::initialize();
std::cout << "=== 开始音频处理 ===" << std::endl;
std::cout << "audioFrame:" << audioFrame.dataCount << "," << audioFrame.sampleRate << "," <<
audioFrame.numChannels << "," << audioFrame.channelIndex << std::endl;
// 1. 获取GIL
std::cout << "[1] 获取GIL锁..." << std::endl;
#ifdef GIL
PyGILState_STATE gstate = PyGILState_Ensure();
#endif
try {
// 2. 输入参数校验
std::cout << "[2] 检查输入参数..." << std::endl;
std::cout << " dataCount: " << audioFrame.dataCount
<< " (max: " << std::numeric_limits<npy_intp>::max() << ")" << std::endl;
if (!audioFrame.data || audioFrame.dataCount <= 0) {
std::cout << "[ERROR] 无效音频数据指针或长度" << std::endl;
throw std::invalid_argument("Invalid audio frame data");
}
const size_t data_size = audioFrame.dataCount * sizeof(int16_t);
std::cout << "step1" << std::endl;
namespace py = boost::python;
namespace np = boost::python::numpy;
npy_intp shape[1] = { static_cast<npy_intp>(audioFrame.dataCount) };
std::cout << "step2" << std::endl;
// 7. 执行回调
if (!pyCallback_.is_none()) {
std::cout << "[7] 准备执行Python回调..." << std::endl;
// 增加引用计数防止提前释放
//Py_INCREF(pyCallback_.ptr());
try {
//PyGILState_STATE gstate = PyGILState_Ensure();
std::cout << "data:" << audioFrame.data << std::endl;
std::cout << "当前线程是否持有 GIL: " << PyGILState_Check() << std::endl;
np::dtype dtype = np::dtype::get_builtin<int16_t>();
std::cout << "init dtype" << std::endl;
if (!Py_IsInitialized()) {
std::cerr << "Python 解释器未初始化!" << std::endl;
return;
}
try {
py::object str_repr = py::str(dtype);
std::cout << "str_repr" << std::endl;
if(str_repr.ptr() != Py_None) {
std::cout << "str_repr is not null" << std::endl;
std::string dtype_str = py::extract<std::string>(str_repr);
std::cout << "数据类型: " << dtype_str << std::endl;
} else {
std::cout << "数据类型: None" << std::endl;
}
} catch (const py::error_already_set&) {
std::cout<< "数据类型转换错误" << std::endl;
PyErr_Clear();
}
std::cout << "数据形状: " << shape[0] << std::endl;
np::ndarray audioArray = np::from_data(
audioFrame.data, // 数据指针
dtype, // 数据类型 (int16)
py::make_tuple(shape[0]), // 形状 (1D)
py::make_tuple(sizeof(int16_t)), // 步长
py::object() // 所有者Python管理
);
std::cout << " 数据拷贝完成" << std::endl;
pyCallback_(
audioArray, // numpy 数组
data_size, // 数据大小
audioFrame.dataCount,
audioFrame.sampleRate,
audioFrame.numChannels,
audioFrame.channelIndex
);
std::cout << " after callback" << std::endl;
if (PyErr_Occurred()) {
PyObject *type, *value, *traceback;
PyErr_Fetch(&type, &value, &traceback);
if (value) {
PyObject* str = PyObject_Str(value);
if (str) {
std::cerr << "Python Error: " << PyUnicode_AsUTF8(str) << std::endl;
Py_DECREF(str);
}
}
Py_XDECREF(type);
Py_XDECREF(value);
Py_XDECREF(traceback);
//PyErr_Print();
throw std::runtime_error("Python callback error");
}
std::cout << " 回调执行成功" << std::endl;
} catch (const py::error_already_set& e) {
std::cerr << "[PYTHON ERROR] ";
PyErr_Print(); // 自动打印到stderr
// 可选:获取更详细的错误信息
if (PyErr_Occurred()) {
PyObject *type, *value, *traceback;
PyErr_Fetch(&type, &value, &traceback);
std::cerr << "Details: "
<< PyUnicode_AsUTF8(PyObject_Str(value)) << std::endl;
PyErr_Restore(type, value, traceback);
}
//Py_DECREF(pyCallback_.ptr());
} catch (...) {
std::cout << "[ERROR] 回调执行失败" << std::endl;
//Py_DECREF(pyCallback_.ptr());
throw;
}
//Py_DECREF(pyCallback_.ptr());
} else {
std::cout << "[7] 无回调函数设置" << std::endl;
}
// 8. 释放资源
std::cout << "[8] 释放共享内存资源..." << std::endl;
std::cout << "[9] 释放GIL..." << std::endl;
#ifdef GIL
PyGILState_Release(gstate);
#endif
std::cout << "=== 音频处理完成 ===" << std::endl;
} catch (const std::exception& e) {
std::cout << "[EXCEPTION] 异常捕获: " << e.what() << std::endl;
#ifdef GIL
PyGILState_Release(gstate);
#endif
std::cerr << "Audio process error: " << e.what() << std::endl;
//std::cout << "onAudioProcess, roomId:" << roomId << ", peerId:" << peerId << ", type:" << audioSourceType
// << ", datacount:" << audioFrame.dataCount << std::endl;
if (audioFrame.data == nullptr || audioFrame.dataCount <= 0) {
return;
}
#ifdef GIL
PyGILState_Release(gstate);
#endif
// 以二进制追加模式打开文件
//std::ofstream outFile("audio_data.pcm", std::ios::binary | std::ios::app);
//if (!outFile.is_open()) {
// std::cerr << "Failed to open file for writing!" << std::endl;
// return;
//}
//// 写入数据int16_t格式
//outFile.write(reinterpret_cast<const char*>(audioFrame.data),
// audioFrame.dataCount);
setData(audioFrame);
}
void RTCContext::onProducer(uint32_t msgId, mrtc::MRTCProducerInfo& info)
@ -210,12 +102,6 @@ void RTCContext::onProducer(uint32_t msgId, mrtc::MRTCProducerInfo& info)
}
bool RTCContext::init(const char* selfUserId, const char* selfDisplayName, const char* selfRoomId)
{
std::cout << "init, numpyApi_:" << numpyApi_[93] << std::endl;
if (!numpyApi_ || !numpyApi_[93]) { // 93是PyArray_SimpleNew的偏移量
std::cout << "numpyApi_ is null in init" << std::endl;
} else {
std::cout << "numpyApi_ is not null in init" << std::endl;
}
mrtc::IMRTCEngineFactory * rtcFactory = mrtc::getMRTCEngineFactory();
if (!rtcFactory)
{
@ -261,20 +147,21 @@ bool RTCContext::init(const char* selfUserId, const char* selfDisplayName, const
std::cout << "RTCContext::instance().registerListener() failed" << std::endl;
return false;
}
//namespace py = boost::python;
//namespace np = boost::python::numpy;
//Py_Initialize(); // 初始化 Python
//np::initialize();
return true;
}
bool RTCContext::initRecv(const char* destRoomId, const char* srcUserId, const int16_t destChannelIndex)
{
isRecv_ = true;
while (!isOnConsumer_)
{
std::cout << "wait for OnConsumer" << std::endl;
sleep(3);
}
return true;
}
bool RTCContext::initSend(const char* srcRoomId, const char* destRoomId, const int16_t destChannelIndex, uint8_t channelNum)
bool RTCContext::initSend(const char* srcRoomId, const char* destRoomId, const int16_t destChannelIndex,
const uint8_t channelNum)
{
while (!isOnRoom_)
{
@ -295,11 +182,11 @@ bool RTCContext::initSend(const char* srcRoomId, const char* destRoomId, const i
}
mrtc::MRTCAudioOption option;
option.channel = channelNum;
if (std::string(srcRoomId) != std::string(destRoomId)) {
strcpy(option.dstRoomId, destRoomId);
}
option.channelIndex = destChannelIndex;
option.channel = channelNum;
std::cout << "startCustomAudio" << std::endl;
int16_t ret2 = rtcEngine_->startCustomAudio(option);
if (ret2 != 0)
@ -310,16 +197,12 @@ bool RTCContext::initSend(const char* srcRoomId, const char* destRoomId, const i
std::cout << "init send succ" << std::endl;
return true;
}
bool RTCContext::initGIL() {
isGIL_ = true;
}
// Forwards selfChannelIndex to rtcEngine_->stopCustomAudio().
// NOTE(review): rtcEngine_ is dereferenced without a null check - presumably
// init() must have succeeded before this is called; confirm.
void RTCContext::destorySend(const int16_t selfChannelIndex)
{
rtcEngine_->stopCustomAudio(selfChannelIndex);
}
int16_t RTCContext::sendAudioData(uint8_t channelIndex, const void* pData, int32_t nSampleRate, uint64_t nNumberOfChannels,
uint64_t dataLength)
int16_t RTCContext::sendAudioData(uint8_t channelIndex, const void* pData, int32_t nSampleRate, uint64_t nNumberOfChannels, uint64_t dataLength)
{
std::lock_guard<std::mutex> lock(mutex_);
if (pData_)
@ -341,8 +224,7 @@ int16_t RTCContext::sendCustomAudioData(const int16_t channelIndex, void* custom
return -1;
}
std::cout << "customData addr is:" << customData << std::endl;
return rtcEngine_->sendCustomAudioData(channelIndex, customData, sampleRate,
channelNum, dataLen);
return rtcEngine_->sendCustomAudioData(channelIndex, customData, sampleRate, channelNum, dataLen);
}
mrtc::IMRTCEngine* RTCContext::getRtcEngine() const
{
@ -359,12 +241,75 @@ void RTCContext::setpData(void* pData)
std::lock_guard<std::mutex> lock(mutex_);
pData_ = pData;
}
void RTCContext::setPyCallback(boost::python::object callback) {
std::lock_guard<std::mutex> lock(mutex_);
pyCallback_ = callback;
/**
 * Stores a copy of an incoming audio frame in the ring buffer data_.
 *
 * Runs under dataMutex_. When the buffer already holds totalSize_ frames the
 * oldest entry is given up (bottom_ advances) so the slot at head_ can be
 * reused for the new frame.
 *
 * @param frame Frame whose metadata and sample memory are copied.
 */
void RTCContext::setData(const mrtc::MRTCAudioFrame& frame) {
    const std::lock_guard<std::mutex> guard(dataMutex_);

    // Buffer full: drop the oldest frame to make room.
    const bool bufferFull = (dataSize_ == totalSize_);
    if (bufferFull) {
        bottom_ = (bottom_ + 1) % totalSize_;
        --dataSize_;
    }

    // NOTE(review): the buffer has room for dataCount int16_t values but only
    // dataCount *bytes* are copied - confirm whether dataCount counts bytes
    // or samples (the alternative would be dataCount * sizeof(int16_t)).
    auto samples = std::make_unique<int16_t[]>(frame.dataCount);
    std::memcpy(samples.get(), frame.data, frame.dataCount);

    RetAudioFrame stored;
    stored.data = std::move(samples);
    stored.dataCount = frame.dataCount;
    stored.sampleRate = frame.sampleRate;
    stored.numChannels = frame.numChannels;
    stored.channelIndex = frame.channelIndex;

    // Publish the frame at the write position and advance it.
    data_[head_] = std::move(stored);
    head_ = (head_ + 1) % totalSize_;
    ++dataSize_;
}
void RTCContext::setNumpyApi(void **numpyApi) {
std::lock_guard<std::mutex> lock(mutex_);
numpyApi_ = numpyApi;
std::cout << "setNupyApi, numpyApi_:" << numpyApi_[93] << std::endl;
/**
 * Removes and returns the oldest frame from the ring buffer.
 *
 * Takes no lock itself: getNumpyData(), getListData() and getDataCount()
 * already hold dataMutex_ when they call this.
 *
 * @return The frame moved out of data_[bottom_], or a default-constructed
 *         RetAudioFrame when the buffer is empty.
 */
RetAudioFrame RTCContext::getData() {
    if (dataSize_ <= 0) {
        return {};
    }

    // Move the frame out of its slot, then advance the read position.
    RetAudioFrame oldest = std::move(data_[bottom_]);
    bottom_ = (bottom_ + 1) % totalSize_;
    --dataSize_;
    return oldest;
}
/**
 * Dequeues the oldest frame and returns its samples as a new NumPy array.
 *
 * Holds dataMutex_ for the whole call and prints "step1".."step4" progress
 * markers to stdout. The samples are copied element by element into a
 * freshly created py::array_t, so the result does not alias the frame.
 *
 * @return Array of frame.dataCount int16 values; when the dequeued frame has
 *         no buffer or a zero count, the array built from shape {0}
 *         (intended as an empty array).
 */
py::array_t<int16_t> RTCContext::getNumpyData() {
    std::cout << "step1" << std::endl;
    const std::lock_guard<std::mutex> guard(dataMutex_);
    RetAudioFrame popped = getData();
    std::cout << "step2" << std::endl;
    int16_t* const samples = popped.data.get();
    std::cout << "step3" << std::endl;
    const size_t sampleCount = popped.dataCount;
    std::cout << "step4" << std::endl;

    const bool hasSamples = (samples != nullptr) && (sampleCount != 0);
    if (!hasSamples) {
        return py::array_t<int16_t>({0});
    }

    // Allocate the output array and fill it through an unchecked view.
    py::array_t<int16_t> out({static_cast<py::ssize_t>(sampleCount)});
    auto view = out.mutable_unchecked();
    size_t idx = 0;
    while (idx < sampleCount) {
        view[idx] = samples[idx];
        ++idx;
    }
    return out;
}
/**
 * Dequeues the oldest frame and returns its samples as a Python list.
 *
 * Holds dataMutex_ for the whole call. The number of values appended is
 * frame.dataCount / sizeof(int16_t).
 * NOTE(review): getNumpyData() uses dataCount itself as the element count -
 * confirm which interpretation of dataCount (bytes vs. samples) is correct.
 *
 * @return List of sample values; empty when the dequeued frame has no buffer.
 */
py::list RTCContext::getListData() {
    const std::lock_guard<std::mutex> guard(dataMutex_);
    RetAudioFrame popped = getData();

    py::list samples;
    if (!popped.data) {
        return samples;
    }

    const size_t sampleCount = popped.dataCount / sizeof(int16_t);
    const int16_t* const raw = popped.data.get();
    for (size_t idx = 0; idx < sampleCount; ++idx) {
        samples.append(raw[idx]);
    }
    return samples;
}
int16_t RTCContext::getDataCount() {
std::lock_guard<std::mutex> lock(dataMutex_);
RetAudioFrame frame = getData();
return frame.dataCount;
}
/**
 * Returns how many frames are currently queued in the ring buffer.
 * Reads dataSize_ while holding dataMutex_.
 */
int16_t RTCContext::getSize() {
    const std::lock_guard<std::mutex> guard(dataMutex_);
    const int16_t queued = dataSize_;
    return queued;
}

View File

@ -1,9 +1,6 @@
// RTCContext.h
#pragma once
//#include "numpyConfig.h"
#include "numpyStub.h"
#include "IMRTCEngine.hpp"
#include "MRTCEngineDefine.hpp"
#include "IMRTCEngineFactory.hpp"
@ -18,23 +15,26 @@
#include <sys/stat.h>
#include <Python.h>
#include <boost/python.hpp>
#include <boost/python/detail/wrap_python.hpp>
#include <boost/python/numpy.hpp>
#include <boost/python/detail/prefix.hpp>
#include <boost/python/module.hpp>
#include <boost/python/def.hpp>
#include <numpy/ndarrayobject.h>
#include <numpy/arrayobject.h>
// pybind11 头文件
#include <pybind11/pybind11.h>
#include <pybind11/numpy.h>
#include <pybind11/stl.h>
namespace py = pybind11;
//#include <numpy/arrayobject.h>
// 必须声明外部变量(关键!)
//#define NPY_NO_DEPRECATED_API NPY_1_7_API_VERSION
namespace fs = std::filesystem;
#define ENV_PRODUCT
//#define SEND_MODE
// Audio data frame: one buffered block of int16 samples plus its metadata.
// Move-only because it owns its sample buffer through std::unique_ptr.
struct RetAudioFrame
{
// Owned sample buffer; null in a default-constructed frame.
std::unique_ptr<int16_t[]> data;
// Length of the frame as reported by the source frame's dataCount.
// NOTE(review): used as an element count in some places and divided by
// sizeof(int16_t) in others - confirm whether this is bytes or samples.
int dataCount = 0;
// Sample rate; defaults to 48000.
int sampleRate = 48000;
// Number of audio channels; defaults to 1.
int numChannels = 1;
// Channel index copied from the source frame; defaults to 0.
int channelIndex = 0;
};
class RTCContext :
public RTCENGINE_NAMESPACE::IMRTCRoomCallBack,
public RTCENGINE_NAMESPACE::IMRTCConsumerCallBack,
@ -60,37 +60,22 @@ public:
static RTCContext instance;
return instance;
}
static void** numpy_api() {
static void** api = [](){
// 强制初始化NumPy
if (_import_array() < 0) {
PyErr_Print();
throw std::runtime_error("NumPy initialization failed");
}
void** ptr = reinterpret_cast<void**>(RTC_PLUGINS_ARRAY_API);
std::cout << "ptr:" << ptr << std::endl;
if (!ptr || !ptr[93]) {
std::cerr << "NumPy API corrupt! Expected at 93: "
<< (ptr ? (void*)ptr[93] : nullptr) << std::endl;
abort();
}
return ptr;
}();
return api;
}
RTCContext(const RTCContext&) = delete;
RTCContext& operator=(const RTCContext&) = delete;
mrtc::IMRTCEngine* getRtcEngine() const;
bool init(const char* selfUserId, const char* selfDisplayName, const char* selfRoomId);
bool initRecv(const char* destRoomId, const char* srcUserId, const int16_t destChannelIndex);
bool initSend(const char* srcRoomId, const char* destRoomId, const int16_t destChannelIndex, uint8_t channelNum);
bool initGIL();
bool initSend(const char* srcRoomId, const char* destRoomId, const int16_t destChannelIndex, const uint8_t channelNum);
int16_t getSize();
void setData(const mrtc::MRTCAudioFrame& frame);
RetAudioFrame getData();
py::array_t<int16_t> getNumpyData();
py::list getListData();
int16_t getDataCount();
void* getpData() const;
void setpData(void* pData);
void setPyCallback(boost::python::object callback);
void setNumpyApi(void** numpyApi);
int16_t sendAudioData(uint8_t channelIndex = 0, const void* pData = nullptr, int32_t nSampleRate = 48000, uint64_t nNumberOfChannels = 2, uint64_t dataLength = 0);
int16_t sendCustomAudioData(const int16_t channelIndex, void* customData, int32_t sampleRate,
@ -100,17 +85,21 @@ public:
private:
RTCContext()
{
data_.resize(totalSize_);
}
mutable std::mutex mutex_;
mrtc::IMRTCEngine * rtcEngine_ = nullptr;
void* pData_ = nullptr;
bool isOnRoom_ = false;
bool isRecv_ = false;
bool isOnConsumer_ = false;
bool isJoinMultiRoom_ = false;
bool isMultiRoom_ = false;
bool isGIL_ = false;
boost::python::object pyCallback_;
void ** numpyApi_;
std::vector<RetAudioFrame> data_;
mutable std::mutex dataMutex_;
const int16_t totalSize_ = 100;
int16_t dataSize_ = 0;
int16_t bottom_ = 0;
int16_t head_= 0;
void onRoom(uint32_t typeId, RTCENGINE_NAMESPACE::MRTCRoomInfo& roomInfo);
void onConsumer(uint32_t msgId, const char* roomId, const char* peerId, RTCENGINE_NAMESPACE::MRTCConsumerInfo& consumerInfo);
void onRender(const char* roomId, const char* peerId,

View File

@ -1,12 +0,0 @@
// numpy_interface.h (新建)
#pragma once
#ifdef IMPLEMENT_NUMPY_API
// 主模块实现路径
#define PY_ARRAY_UNIQUE_SYMBOL RTC_PLUGINS_ARRAY_API
#define NPY_NO_DEPRECATED_API NPY_1_7_API_VERSION
#include <numpy/arrayobject.h>
#else
// 用户头文件路径
extern void* RTC_PLUGINS_ARRAY_API[]; // 严格匹配NumPy类型
#endif