WIP: стабилизация звонков и E2EE + инструменты сборки WebRTC

This commit is contained in:
2026-03-25 22:20:24 +05:00
parent 530047c5d0
commit eea650face
8 changed files with 1119 additions and 219 deletions

View File

@@ -25,6 +25,7 @@ val gitShortSha = safeGitOutput("rev-parse", "--short", "HEAD") ?: "unknown"
// ═══════════════════════════════════════════════════════════ // ═══════════════════════════════════════════════════════════
val rosettaVersionName = "1.3.0" val rosettaVersionName = "1.3.0"
val rosettaVersionCode = 32 // Increment on each release val rosettaVersionCode = 32 // Increment on each release
val customWebRtcAar = file("libs/libwebrtc-custom.aar")
android { android {
namespace = "com.rosetta.messenger" namespace = "com.rosetta.messenger"
@@ -182,8 +183,13 @@ dependencies {
implementation("androidx.camera:camera-lifecycle:1.3.1") implementation("androidx.camera:camera-lifecycle:1.3.1")
implementation("androidx.camera:camera-view:1.3.1") implementation("androidx.camera:camera-view:1.3.1")
// WebRTC for voice calls // WebRTC for voice calls.
implementation("io.github.webrtc-sdk:android:125.6422.07") // If app/libs/libwebrtc-custom.aar exists, prefer it (custom E2EE-enabled build).
if (customWebRtcAar.exists()) {
implementation(files(customWebRtcAar))
} else {
implementation("io.github.webrtc-sdk:android:125.6422.07")
}
// Baseline Profiles for startup performance // Baseline Profiles for startup performance
implementation("androidx.profileinstaller:profileinstaller:1.3.1") implementation("androidx.profileinstaller:profileinstaller:1.3.1")

View File

@@ -45,6 +45,280 @@ static void diag_write(const char *fmt, ...) {
if (n > 0) write(g_diag_fd, buf, n); if (n > 0) write(g_diag_fd, buf, n);
} }
/* ── RTP helpers (for cases when additional_data is empty) ───── */
struct ParsedRtpPacket {
size_t header_size = 0;
uint16_t sequence = 0;
uint32_t timestamp = 0;
uint32_t ssrc = 0;
};
struct RtpProbeState {
bool locked = false;
bool has_probe = false;
uint32_t probe_ssrc = 0;
uint16_t probe_sequence = 0;
uint32_t probe_timestamp = 0;
uint32_t ssrc = 0;
uint16_t last_sequence = 0;
uint32_t last_timestamp = 0;
};
struct GeneratedTsState {
bool initialized = false;
uint32_t next_timestamp = 0;
uint32_t next_step = 960; // 20 ms @ 48 kHz (default Opus packetization)
};
struct AdditionalTsState {
bool initialized64 = false;
bool initialized32 = false;
uint64_t base64 = 0;
uint32_t base32 = 0;
};
static inline uint16_t load16_be(const uint8_t* p) {
return (uint16_t)(((uint16_t)p[0] << 8) | (uint16_t)p[1]);
}
static inline uint32_t load32_be(const uint8_t* p) {
return ((uint32_t)p[0] << 24) |
((uint32_t)p[1] << 16) |
((uint32_t)p[2] << 8) |
((uint32_t)p[3]);
}
static inline uint64_t load64_be(const uint8_t* p) {
return ((uint64_t)p[0] << 56) |
((uint64_t)p[1] << 48) |
((uint64_t)p[2] << 40) |
((uint64_t)p[3] << 32) |
((uint64_t)p[4] << 24) |
((uint64_t)p[5] << 16) |
((uint64_t)p[6] << 8) |
((uint64_t)p[7]);
}
static inline void store64_be(uint8_t* p, uint64_t v) {
p[0] = (uint8_t)(v >> 56);
p[1] = (uint8_t)(v >> 48);
p[2] = (uint8_t)(v >> 40);
p[3] = (uint8_t)(v >> 32);
p[4] = (uint8_t)(v >> 24);
p[5] = (uint8_t)(v >> 16);
p[6] = (uint8_t)(v >> 8);
p[7] = (uint8_t)(v);
}
static bool parse_rtp_packet(const uint8_t* data, size_t len, ParsedRtpPacket* out) {
if (!data || !out || len < 12) return false;
// RTP version must be 2.
const uint8_t version = (data[0] >> 6) & 0x03;
if (version != 2) return false;
const size_t csrc_count = (size_t)(data[0] & 0x0F);
const bool has_extension = (data[0] & 0x10) != 0;
size_t header = 12 + csrc_count * 4;
if (header > len) return false;
if (has_extension) {
// Extension header: 16-bit profile + 16-bit length (in 32-bit words)
if (len < header + 4) return false;
const uint16_t ext_len_words =
(uint16_t)(((uint16_t)data[header + 2] << 8) | (uint16_t)data[header + 3]);
const size_t ext_bytes = (size_t)ext_len_words * 4;
header += 4 + ext_bytes;
if (header > len) return false;
}
const size_t payload_size = len - header;
if (payload_size == 0 || payload_size > 1200) return false;
out->header_size = header;
out->sequence = load16_be(data + 2);
out->timestamp = load32_be(data + 4);
out->ssrc = load32_be(data + 8);
return true;
}
static bool fill_nonce_from_rtp_frame(const uint8_t* data,
size_t len,
RtpProbeState* state,
uint8_t nonce[24],
size_t* header_size) {
if (!state) return false;
ParsedRtpPacket packet;
if (!parse_rtp_packet(data, len, &packet)) return false;
if (!state->locked) {
if (!state->has_probe) {
state->has_probe = true;
state->probe_ssrc = packet.ssrc;
state->probe_sequence = packet.sequence;
state->probe_timestamp = packet.timestamp;
return false;
}
const bool same_ssrc = packet.ssrc == state->probe_ssrc;
const uint16_t seq_delta = (uint16_t)(packet.sequence - state->probe_sequence);
const bool sequence_progressed = seq_delta > 0 && seq_delta <= 10;
if (!same_ssrc || !sequence_progressed) {
state->probe_ssrc = packet.ssrc;
state->probe_sequence = packet.sequence;
state->probe_timestamp = packet.timestamp;
return false;
}
state->locked = true;
state->has_probe = false;
state->ssrc = packet.ssrc;
state->last_sequence = packet.sequence;
state->last_timestamp = packet.timestamp;
} else {
if (packet.ssrc != state->ssrc) {
state->locked = false;
state->has_probe = true;
state->probe_ssrc = packet.ssrc;
state->probe_sequence = packet.sequence;
state->probe_timestamp = packet.timestamp;
return false;
}
const uint16_t seq_delta = (uint16_t)(packet.sequence - state->last_sequence);
// Accept in-order packets and small jumps (packet loss).
if (seq_delta != 0 && seq_delta <= 200) {
state->last_sequence = packet.sequence;
state->last_timestamp = packet.timestamp;
} else if (seq_delta != 0) {
// Not plausible for a continuous stream: re-probe.
state->locked = false;
state->has_probe = true;
state->probe_ssrc = packet.ssrc;
state->probe_sequence = packet.sequence;
state->probe_timestamp = packet.timestamp;
return false;
}
}
nonce[4] = (uint8_t)(packet.timestamp >> 24);
nonce[5] = (uint8_t)(packet.timestamp >> 16);
nonce[6] = (uint8_t)(packet.timestamp >> 8);
nonce[7] = (uint8_t)(packet.timestamp);
if (header_size) *header_size = packet.header_size;
return true;
}
static bool fill_nonce_from_additional_data(const uint8_t* data,
size_t len,
uint8_t nonce[24],
AdditionalTsState* ts_state,
bool normalize_timestamps,
bool* used_normalized,
bool* used_rtp_header) {
if (used_normalized) *used_normalized = false;
if (used_rtp_header) *used_rtp_header = false;
if (!data || len < 8) return false;
// Common native WebRTC layout: additional_data is RTP header bytes.
if (len >= 12) {
const uint8_t version = (data[0] >> 6) & 0x03;
if (version == 2) {
uint32_t ts = load32_be(data + 4);
if (normalize_timestamps && ts_state) {
if (!ts_state->initialized32) {
ts_state->initialized32 = true;
ts_state->base32 = ts;
}
ts = (uint32_t)(ts - ts_state->base32);
if (used_normalized) *used_normalized = true;
}
nonce[4] = (uint8_t)(ts >> 24);
nonce[5] = (uint8_t)(ts >> 16);
nonce[6] = (uint8_t)(ts >> 8);
nonce[7] = (uint8_t)(ts);
if (used_rtp_header) *used_rtp_header = true;
return true;
}
}
// Generic 8-byte timestamp layout (desktop's nonce[0..7] layout).
uint64_t ts = load64_be(data);
if (normalize_timestamps && ts_state) {
if (!ts_state->initialized64) {
ts_state->initialized64 = true;
ts_state->base64 = ts;
}
ts = (uint64_t)(ts - ts_state->base64);
if (used_normalized) *used_normalized = true;
}
store64_be(nonce, ts);
return true;
}
static inline void fill_nonce_from_ts32(uint32_t ts, uint8_t nonce[24]) {
nonce[4] = (uint8_t)(ts >> 24);
nonce[5] = (uint8_t)(ts >> 16);
nonce[6] = (uint8_t)(ts >> 8);
nonce[7] = (uint8_t)(ts);
}
static inline uint32_t opus_base_frame_samples(uint8_t config) {
// RFC 6716 TOC config mapping at 48 kHz.
if (config <= 11) {
// SILK: 10/20/40/60 ms
static const uint32_t kSilk[4] = {480, 960, 1920, 2880};
return kSilk[config & 0x03];
}
if (config <= 15) {
// Hybrid: 10/20 ms
return (config & 0x01) ? 960 : 480;
}
// CELT-only: 2.5/5/10/20 ms
static const uint32_t kCelt[4] = {120, 240, 480, 960};
return kCelt[config & 0x03];
}
static uint32_t infer_opus_packet_duration_samples(const uint8_t* packet, size_t len) {
if (!packet || len == 0) return 960;
const uint8_t toc = packet[0];
const uint8_t config = (uint8_t)(toc >> 3);
const uint8_t frame_code = (uint8_t)(toc & 0x03);
uint32_t frame_count = 1;
if (frame_code == 1 || frame_code == 2) {
frame_count = 2;
} else if (frame_code == 3) {
if (len < 2) return 960;
frame_count = (uint32_t)(packet[1] & 0x3F);
if (frame_count == 0 || frame_count > 48) return 960;
}
uint32_t base = opus_base_frame_samples(config);
uint32_t total = base * frame_count;
if (total < 120 || total > 5760) return 960;
return total;
}
static bool is_plausible_opus_packet(const uint8_t* packet, size_t len) {
if (!packet || len == 0 || len > 2000) return false;
const uint8_t toc = packet[0];
const uint8_t config = (uint8_t)(toc >> 3);
if (config > 31) return false;
const uint8_t frame_code = (uint8_t)(toc & 0x03);
if (frame_code != 3) return true;
if (len < 2) return false;
const uint8_t frame_count = (uint8_t)(packet[1] & 0x3F);
if (frame_count == 0 || frame_count > 48) return false;
const uint32_t total = opus_base_frame_samples(config) * (uint32_t)frame_count;
return total <= 5760;
}
/* ── Native crash handler — writes to file before dying ──────── */ /* ── Native crash handler — writes to file before dying ──────── */
static char g_crash_path[512] = {0}; static char g_crash_path[512] = {0};
@@ -98,57 +372,114 @@ public:
} }
/** /**
* Frame format: [4-byte counter BE] + [xchacha20_xor(frame)] * Desktop-compatible frame format: ciphertext only (no custom prefix).
* *
* Nonce (24 bytes): [0,0,0,0, counter_BE_4bytes, 0,...,0] * Nonce (24 bytes) is derived exactly like desktop:
* This matches Desktop's layout where nonce[4..7] = timestamp. * - nonce[0..3] = 0
* The counter is embedded so the receiver can reconstruct the nonce * - nonce[4..7] = RTP timestamp
* even if frames are dropped/reordered. * - nonce[8..23] = 0
*
* Primary source of timestamp: additional_data[4..7] (if provided by WebRTC).
* Fallback (Android path where additional_data can be empty):
* parse RTP header from frame and take timestamp from frame[4..7].
*
* If RTP header is found inside frame, we leave header bytes unencrypted
* and encrypt only payload (desktop-compatible).
*/ */
int Encrypt(cricket::MediaType /*media_type*/, int Encrypt(cricket::MediaType /*media_type*/,
uint32_t /*ssrc*/, uint32_t /*ssrc*/,
rtc::ArrayView<const uint8_t> /*additional_data*/, rtc::ArrayView<const uint8_t> additional_data,
rtc::ArrayView<const uint8_t> frame, rtc::ArrayView<const uint8_t> frame,
rtc::ArrayView<uint8_t> encrypted_frame, rtc::ArrayView<uint8_t> encrypted_frame,
size_t* bytes_written) override { size_t* bytes_written) override {
const size_t HEADER = 4; // counter prefix if (frame.size() == 0 || encrypted_frame.size() < frame.size()) {
if (frame.size() == 0 || encrypted_frame.size() < frame.size() + HEADER) {
*bytes_written = 0; *bytes_written = 0;
return -1; return -1;
} }
uint32_t ctr = counter_.fetch_add(1, std::memory_order_relaxed); size_t header_size = 0;
bool nonce_from_rtp_header = false;
bool nonce_from_generated_ts = false;
bool nonce_from_additional_data = false;
bool nonce_from_additional_normalized = false;
bool additional_was_rtp_header = false;
uint32_t generated_ts_used = 0;
// Write 4-byte counter as big-endian prefix // Build nonce from RTP timestamp in additional_data (preferred).
encrypted_frame.data()[0] = (uint8_t)(ctr >> 24);
encrypted_frame.data()[1] = (uint8_t)(ctr >> 16);
encrypted_frame.data()[2] = (uint8_t)(ctr >> 8);
encrypted_frame.data()[3] = (uint8_t)(ctr);
// Build nonce from counter (same positions as Desktop's timestamp)
uint8_t nonce[24] = {0}; uint8_t nonce[24] = {0};
nonce[4] = encrypted_frame.data()[0]; nonce_from_additional_data = fill_nonce_from_additional_data(
nonce[5] = encrypted_frame.data()[1]; additional_data.data(),
nonce[6] = encrypted_frame.data()[2]; additional_data.size(),
nonce[7] = encrypted_frame.data()[3]; nonce,
&additional_ts_,
true,
&nonce_from_additional_normalized,
&additional_was_rtp_header);
if (!nonce_from_additional_data) {
nonce_from_rtp_header =
fill_nonce_from_rtp_frame(frame.data(), frame.size(), &rtp_probe_, nonce, &header_size);
if (!nonce_from_rtp_header) {
if (!generated_ts_.initialized) {
generated_ts_.initialized = true;
generated_ts_.next_timestamp = 0;
generated_ts_.next_step = 960;
}
nonce_from_generated_ts = true;
generated_ts_used = generated_ts_.next_timestamp;
fill_nonce_from_ts32(generated_ts_used, nonce);
}
}
rosetta_xchacha20_xor(encrypted_frame.data() + HEADER, if (nonce_from_rtp_header && header_size <= frame.size()) {
frame.data(), frame.size(), nonce, key_); // Keep RTP header clear, encrypt payload only.
*bytes_written = frame.size() + HEADER; if (header_size > 0) {
memcpy(encrypted_frame.data(), frame.data(), header_size);
}
const size_t payload_size = frame.size() - header_size;
rosetta_xchacha20_xor(
encrypted_frame.data() + header_size,
frame.data() + header_size,
payload_size,
nonce,
key_);
} else {
// Legacy path: frame is payload-only.
rosetta_xchacha20_xor(encrypted_frame.data(),
frame.data(), frame.size(), nonce, key_);
}
*bytes_written = frame.size();
if (nonce_from_generated_ts) {
const uint32_t step = infer_opus_packet_duration_samples(frame.data(), frame.size());
generated_ts_.next_step = step;
generated_ts_.next_timestamp = generated_ts_used + step;
}
// Diag: log first 3 frames // Diag: log first 3 frames
int n = diag_count_.fetch_add(1, std::memory_order_relaxed); int n = diag_count_.fetch_add(1, std::memory_order_relaxed);
if (n < 3) { if (n < 3) {
LOGI("ENC frame#%d: sz=%zu ctr=%u out=%zu", const char* mode =
n, frame.size(), ctr, frame.size() + HEADER); nonce_from_rtp_header
diag_write("ENC frame#%d: sz=%zu ctr=%u nonce[4..7]=%02x%02x%02x%02x\n", ? "rtp"
n, frame.size(), ctr, nonce[4], nonce[5], nonce[6], nonce[7]); : (nonce_from_generated_ts
? "gen"
: (nonce_from_additional_data
? (additional_was_rtp_header
? (nonce_from_additional_normalized ? "ad-rtp-norm" : "ad-rtp")
: (nonce_from_additional_normalized ? "raw-norm" : "raw-abs"))
: "raw-abs"));
LOGI("ENC frame#%d: sz=%zu ad=%zu hdr=%zu mode=%s nonce=%02x%02x%02x%02x",
n, frame.size(), additional_data.size(), header_size, mode,
nonce[4], nonce[5], nonce[6], nonce[7]);
diag_write("ENC frame#%d: sz=%zu ad=%zu hdr=%zu mode=%s nonce[4..7]=%02x%02x%02x%02x\n",
n, frame.size(), additional_data.size(), header_size, mode,
nonce[4], nonce[5], nonce[6], nonce[7]);
} }
return 0; return 0;
} }
size_t GetMaxCiphertextByteSize(cricket::MediaType, size_t frame_size) override { size_t GetMaxCiphertextByteSize(cricket::MediaType, size_t frame_size) override {
return frame_size + 4; // +4 for counter prefix return frame_size;
} }
protected: protected:
@@ -156,8 +487,10 @@ protected:
private: private:
mutable std::atomic<int> ref_{0}; mutable std::atomic<int> ref_{0};
mutable std::atomic<uint32_t> counter_{0};
mutable std::atomic<int> diag_count_{0}; mutable std::atomic<int> diag_count_{0};
mutable RtpProbeState rtp_probe_;
mutable GeneratedTsState generated_ts_;
mutable AdditionalTsState additional_ts_;
uint8_t key_[32]; uint8_t key_[32];
}; };
@@ -185,57 +518,180 @@ public:
} }
/** /**
* Decrypt frame: read 4-byte counter prefix → derive nonce → decrypt. * Desktop-compatible decrypt:
* If frame has no prefix (< 5 bytes or from Desktop), fallback to * - nonce from RTP timestamp
* nonce derived from additional_data (RTP header) or zeros. * - if RTP header is present inside encrypted_frame (fallback path),
* keep header bytes untouched and decrypt payload only.
*/ */
Result Decrypt(cricket::MediaType /*media_type*/, Result Decrypt(cricket::MediaType /*media_type*/,
const std::vector<uint32_t>& /*csrcs*/, const std::vector<uint32_t>& /*csrcs*/,
rtc::ArrayView<const uint8_t> additional_data, rtc::ArrayView<const uint8_t> additional_data,
rtc::ArrayView<const uint8_t> encrypted_frame, rtc::ArrayView<const uint8_t> encrypted_frame,
rtc::ArrayView<uint8_t> frame) override { rtc::ArrayView<uint8_t> frame) override {
const size_t HEADER = 4;
uint8_t nonce[24] = {0}; uint8_t nonce[24] = {0};
const uint8_t *payload; size_t header_size = 0;
size_t payload_sz; bool nonce_from_rtp_header = false;
bool nonce_from_generated_ts = false;
if (encrypted_frame.size() > HEADER) { bool nonce_from_additional_data = false;
// Android format: [4-byte counter] + [encrypted data] bool nonce_from_additional_normalized = false;
nonce[4] = encrypted_frame.data()[0]; bool additional_was_rtp_header = false;
nonce[5] = encrypted_frame.data()[1]; bool used_absolute_additional_fallback = false;
nonce[6] = encrypted_frame.data()[2]; uint32_t generated_ts_used = 0;
nonce[7] = encrypted_frame.data()[3]; nonce_from_additional_data = fill_nonce_from_additional_data(
payload = encrypted_frame.data() + HEADER; additional_data.data(),
payload_sz = encrypted_frame.size() - HEADER; additional_data.size(),
} else { nonce,
// Fallback: no counter prefix &additional_ts_,
payload = encrypted_frame.data(); true,
payload_sz = encrypted_frame.size(); &nonce_from_additional_normalized,
&additional_was_rtp_header);
if (!nonce_from_additional_data) {
nonce_from_rtp_header =
fill_nonce_from_rtp_frame(encrypted_frame.data(), encrypted_frame.size(), &rtp_probe_, nonce, &header_size);
if (!nonce_from_rtp_header) {
if (!generated_ts_.initialized) {
generated_ts_.initialized = true;
generated_ts_.next_timestamp = 0;
generated_ts_.next_step = 960;
}
nonce_from_generated_ts = true;
generated_ts_used = generated_ts_.next_timestamp;
fill_nonce_from_ts32(generated_ts_used, nonce);
}
} }
if (payload_sz == 0 || frame.size() < payload_sz) { if (encrypted_frame.size() == 0 || frame.size() < encrypted_frame.size()) {
return {Result::Status::kFailedToDecrypt, 0}; return {Result::Status::kFailedToDecrypt, 0};
} }
rosetta_xchacha20_xor(frame.data(), payload, payload_sz, nonce, key_); bool used_generated_resync = false;
if (nonce_from_rtp_header && header_size <= encrypted_frame.size()) {
if (header_size > 0) {
memcpy(frame.data(), encrypted_frame.data(), header_size);
}
const size_t payload_size = encrypted_frame.size() - header_size;
rosetta_xchacha20_xor(
frame.data() + header_size,
encrypted_frame.data() + header_size,
payload_size,
nonce,
key_);
} else {
rosetta_xchacha20_xor(frame.data(), encrypted_frame.data(), encrypted_frame.size(), nonce, key_);
}
// additional_data on Android can be absolute RTP-ish timestamp, while
// desktop nonce source is normalized stream timestamp. If normalized
// nonce gives implausible Opus, retry with absolute additional_data.
if (!nonce_from_generated_ts &&
nonce_from_additional_data &&
encrypted_frame.size() > 0 &&
additional_data.size() >= 8) {
const uint8_t* payload_ptr = frame.data() + header_size;
const size_t payload_size = encrypted_frame.size() - header_size;
if (!is_plausible_opus_packet(payload_ptr, payload_size)) {
uint8_t nonce_abs[24] = {0};
bool abs_norm = false;
bool abs_rtp = false;
if (fill_nonce_from_additional_data(
additional_data.data(),
additional_data.size(),
nonce_abs,
nullptr,
false,
&abs_norm,
&abs_rtp) &&
memcmp(nonce_abs, nonce, 24) != 0) {
if (nonce_from_rtp_header && header_size <= encrypted_frame.size()) {
if (header_size > 0) {
memcpy(frame.data(), encrypted_frame.data(), header_size);
}
rosetta_xchacha20_xor(
frame.data() + header_size,
encrypted_frame.data() + header_size,
payload_size,
nonce_abs,
key_);
} else {
rosetta_xchacha20_xor(
frame.data(),
encrypted_frame.data(),
encrypted_frame.size(),
nonce_abs,
key_);
}
payload_ptr = frame.data() + header_size;
if (is_plausible_opus_packet(payload_ptr, payload_size)) {
memcpy(nonce, nonce_abs, 24);
used_absolute_additional_fallback = true;
}
}
}
}
if (nonce_from_generated_ts) {
bool plausible = is_plausible_opus_packet(frame.data(), encrypted_frame.size());
// Recover after lost packets by probing a few forward timestamp steps.
if (!plausible) {
std::vector<uint8_t> candidate(encrypted_frame.size());
for (uint32_t i = 1; i <= 8; ++i) {
const uint32_t ts_try = generated_ts_used + generated_ts_.next_step * i;
uint8_t nonce_try[24] = {0};
fill_nonce_from_ts32(ts_try, nonce_try);
rosetta_xchacha20_xor(
candidate.data(),
encrypted_frame.data(),
encrypted_frame.size(),
nonce_try,
key_);
if (is_plausible_opus_packet(candidate.data(), candidate.size())) {
memcpy(frame.data(), candidate.data(), candidate.size());
generated_ts_used = ts_try;
used_generated_resync = true;
plausible = true;
break;
}
}
}
const uint32_t step = infer_opus_packet_duration_samples(frame.data(), encrypted_frame.size());
generated_ts_.next_step = step;
generated_ts_.next_timestamp = generated_ts_used + step;
}
// Diag: log first 3 frames // Diag: log first 3 frames
int n = diag_count_.fetch_add(1, std::memory_order_relaxed); int n = diag_count_.fetch_add(1, std::memory_order_relaxed);
if (n < 3) { if (n < 3) {
LOGI("DEC frame#%d: enc_sz=%zu payload=%zu nonce=%02x%02x%02x%02x", const char* mode = nullptr;
n, encrypted_frame.size(), payload_sz, if (nonce_from_rtp_header) {
mode = "rtp";
} else if (nonce_from_generated_ts) {
mode = used_generated_resync ? "gen-resync" : "gen";
} else if (used_absolute_additional_fallback) {
mode = additional_was_rtp_header ? "ad-rtp-abs-fb" : "raw-abs-fb";
} else if (nonce_from_additional_data) {
mode =
additional_was_rtp_header
? (nonce_from_additional_normalized ? "ad-rtp-norm" : "ad-rtp")
: (nonce_from_additional_normalized ? "raw-norm" : "raw-abs");
} else {
mode = "raw-abs";
}
LOGI("DEC frame#%d: enc_sz=%zu ad=%zu hdr=%zu mode=%s nonce=%02x%02x%02x%02x",
n, encrypted_frame.size(), additional_data.size(), header_size, mode,
nonce[4], nonce[5], nonce[6], nonce[7]); nonce[4], nonce[5], nonce[6], nonce[7]);
diag_write("DEC frame#%d: enc_sz=%zu payload=%zu nonce[4..7]=%02x%02x%02x%02x\n", diag_write("DEC frame#%d: enc_sz=%zu ad=%zu hdr=%zu mode=%s nonce[4..7]=%02x%02x%02x%02x\n",
n, encrypted_frame.size(), payload_sz, n, encrypted_frame.size(), additional_data.size(), header_size, mode,
nonce[4], nonce[5], nonce[6], nonce[7]); nonce[4], nonce[5], nonce[6], nonce[7]);
} }
return {Result::Status::kOk, payload_sz}; return {Result::Status::kOk, encrypted_frame.size()};
} }
size_t GetMaxPlaintextByteSize(cricket::MediaType, size_t encrypted_frame_size) override { size_t GetMaxPlaintextByteSize(cricket::MediaType, size_t encrypted_frame_size) override {
return encrypted_frame_size; // >= actual (payload = enc - 4) return encrypted_frame_size;
} }
protected: protected:
@@ -244,6 +700,9 @@ protected:
private: private:
mutable std::atomic<int> ref_{0}; mutable std::atomic<int> ref_{0};
mutable std::atomic<int> diag_count_{0}; mutable std::atomic<int> diag_count_{0};
mutable RtpProbeState rtp_probe_;
mutable GeneratedTsState generated_ts_;
mutable AdditionalTsState additional_ts_;
uint8_t key_[32]; uint8_t key_[32];
}; };

View File

@@ -3,6 +3,7 @@ package com.rosetta.messenger.network
import android.content.Context import android.content.Context
import android.media.AudioManager import android.media.AudioManager
import android.util.Log import android.util.Log
import com.rosetta.messenger.data.MessageRepository
import java.security.SecureRandom import java.security.SecureRandom
import kotlinx.coroutines.CoroutineScope import kotlinx.coroutines.CoroutineScope
import kotlinx.coroutines.Dispatchers import kotlinx.coroutines.Dispatchers
@@ -14,6 +15,8 @@ import kotlinx.coroutines.flow.StateFlow
import kotlinx.coroutines.flow.asStateFlow import kotlinx.coroutines.flow.asStateFlow
import kotlinx.coroutines.flow.update import kotlinx.coroutines.flow.update
import kotlinx.coroutines.launch import kotlinx.coroutines.launch
import kotlinx.coroutines.sync.Mutex
import kotlinx.coroutines.sync.withLock
import kotlinx.coroutines.suspendCancellableCoroutine import kotlinx.coroutines.suspendCancellableCoroutine
import org.bouncycastle.math.ec.rfc7748.X25519 import org.bouncycastle.math.ec.rfc7748.X25519
import org.json.JSONObject import org.json.JSONObject
@@ -24,6 +27,7 @@ import org.webrtc.MediaConstraints
import org.webrtc.PeerConnection import org.webrtc.PeerConnection
import org.webrtc.PeerConnectionFactory import org.webrtc.PeerConnectionFactory
import org.webrtc.RtpReceiver import org.webrtc.RtpReceiver
import org.webrtc.RtpSender
import org.webrtc.RtpTransceiver import org.webrtc.RtpTransceiver
import org.webrtc.SdpObserver import org.webrtc.SdpObserver
import org.webrtc.SessionDescription import org.webrtc.SessionDescription
@@ -105,10 +109,12 @@ object CallManager {
private var durationJob: Job? = null private var durationJob: Job? = null
private var protocolStateJob: Job? = null private var protocolStateJob: Job? = null
private var disconnectResetJob: Job? = null
private var signalWaiter: ((Packet) -> Unit)? = null private var signalWaiter: ((Packet) -> Unit)? = null
private var webRtcWaiter: ((Packet) -> Unit)? = null private var webRtcWaiter: ((Packet) -> Unit)? = null
private var iceWaiter: ((Packet) -> Unit)? = null private var iceWaiter: ((Packet) -> Unit)? = null
private val webRtcSignalMutex = Mutex()
private var peerConnectionFactory: PeerConnectionFactory? = null private var peerConnectionFactory: PeerConnectionFactory? = null
private var peerConnection: PeerConnection? = null private var peerConnection: PeerConnection? = null
@@ -228,6 +234,7 @@ object CallManager {
} }
fun endCall() { fun endCall() {
breadcrumb("UI: endCall requested")
resetSession(reason = null, notifyPeer = true) resetSession(reason = null, notifyPeer = true)
} }
@@ -392,58 +399,85 @@ object CallManager {
} }
private suspend fun handleWebRtcPacket(packet: PacketWebRTC) { private suspend fun handleWebRtcPacket(packet: PacketWebRTC) {
val phase = _state.value.phase webRtcSignalMutex.withLock {
if (phase != CallPhase.CONNECTING && phase != CallPhase.ACTIVE) { val phase = _state.value.phase
breadcrumb("RTC: IGNORED ${packet.signalType} — phase=$phase") if (phase != CallPhase.CONNECTING && phase != CallPhase.ACTIVE) {
return breadcrumb("RTC: IGNORED ${packet.signalType} — phase=$phase")
} return@withLock
val pc = peerConnection }
if (pc == null) { val pc = peerConnection
breadcrumb("RTC: IGNORED ${packet.signalType} — peerConnection=null!") if (pc == null) {
return breadcrumb("RTC: IGNORED ${packet.signalType} — peerConnection=null!")
} return@withLock
}
when (packet.signalType) { when (packet.signalType) {
WebRTCSignalType.ANSWER -> { WebRTCSignalType.ANSWER -> {
breadcrumb("RTC: ANSWER received") val answer = parseSessionDescription(packet.sdpOrCandidate) ?: return@withLock
val answer = parseSessionDescription(packet.sdpOrCandidate) ?: return if (answer.type != SessionDescription.Type.ANSWER) {
try { breadcrumb("RTC: ANSWER packet with type=${answer.type} ignored")
pc.setRemoteDescriptionAwait(answer) return@withLock
remoteDescriptionSet = true }
flushBufferedRemoteCandidates()
breadcrumb("RTC: ANSWER applied OK, remoteDesc=true") val stateBefore = pc.signalingState()
} catch (e: Exception) { breadcrumb("RTC: ANSWER received state=$stateBefore")
breadcrumb("RTC: ANSWER FAILED — ${e.message}") if (stateBefore == PeerConnection.SignalingState.STABLE && remoteDescriptionSet) {
saveCrashReport("setRemoteDescription(answer) failed", e) breadcrumb("RTC: ANSWER duplicate ignored (already stable)")
return@withLock
}
try {
pc.setRemoteDescriptionAwait(answer)
remoteDescriptionSet = true
flushBufferedRemoteCandidates()
breadcrumb("RTC: ANSWER applied OK, state=${pc.signalingState()}")
} catch (e: Exception) {
breadcrumb("RTC: ANSWER FAILED — ${e.message}")
saveCrashReport("setRemoteDescription(answer) failed", e)
}
} }
} WebRTCSignalType.ICE_CANDIDATE -> {
WebRTCSignalType.ICE_CANDIDATE -> { val candidate = parseIceCandidate(packet.sdpOrCandidate) ?: return@withLock
val candidate = parseIceCandidate(packet.sdpOrCandidate) ?: return if (!remoteDescriptionSet) {
if (!remoteDescriptionSet) { breadcrumb("RTC: ICE buffered (remoteDesc not set yet)")
breadcrumb("RTC: ICE buffered (remoteDesc not set yet)") bufferedRemoteCandidates.add(candidate)
bufferedRemoteCandidates.add(candidate) return@withLock
return }
breadcrumb("RTC: ICE added: ${candidate.sdp.take(40)}")
runCatching { pc.addIceCandidate(candidate) }
} }
breadcrumb("RTC: ICE added: ${candidate.sdp.take(40)}") WebRTCSignalType.OFFER -> {
runCatching { pc.addIceCandidate(candidate) } val remoteOffer = parseSessionDescription(packet.sdpOrCandidate) ?: return@withLock
} if (remoteOffer.type != SessionDescription.Type.OFFER) {
WebRTCSignalType.OFFER -> { breadcrumb("RTC: OFFER packet with type=${remoteOffer.type} ignored")
breadcrumb("RTC: OFFER received (offerSent=$offerSent)") return@withLock
val remoteOffer = parseSessionDescription(packet.sdpOrCandidate) ?: return }
try {
pc.setRemoteDescriptionAwait(remoteOffer) breadcrumb("RTC: OFFER received (offerSent=$offerSent state=${pc.signalingState()})")
remoteDescriptionSet = true try {
flushBufferedRemoteCandidates() pc.setRemoteDescriptionAwait(remoteOffer)
val answer = pc.createAnswerAwait() remoteDescriptionSet = true
pc.setLocalDescriptionAwait(answer) flushBufferedRemoteCandidates()
ProtocolManager.sendWebRtcSignal(
signalType = WebRTCSignalType.ANSWER, val stateAfterRemote = pc.signalingState()
sdpOrCandidate = serializeSessionDescription(answer) if (stateAfterRemote != PeerConnection.SignalingState.HAVE_REMOTE_OFFER &&
) stateAfterRemote != PeerConnection.SignalingState.HAVE_LOCAL_PRANSWER
breadcrumb("RTC: OFFER handled → ANSWER sent") ) {
} catch (e: Exception) { breadcrumb("RTC: OFFER skip createAnswer, bad state=$stateAfterRemote")
breadcrumb("RTC: OFFER FAILED — ${e.message}") return@withLock
saveCrashReport("handleOffer failed", e) }
val answer = pc.createAnswerAwait()
pc.setLocalDescriptionAwait(answer)
ProtocolManager.sendWebRtcSignal(
signalType = WebRTCSignalType.ANSWER,
sdpOrCandidate = serializeSessionDescription(answer)
)
breadcrumb("RTC: OFFER handled → ANSWER sent")
} catch (e: Exception) {
breadcrumb("RTC: OFFER FAILED — ${e.message}")
saveCrashReport("handleOffer failed", e)
}
} }
} }
} }
@@ -493,9 +527,14 @@ object CallManager {
if (localAudioTrack == null) { if (localAudioTrack == null) {
localAudioTrack = factory.createAudioTrack(LOCAL_AUDIO_TRACK_ID, audioSource) localAudioTrack = factory.createAudioTrack(LOCAL_AUDIO_TRACK_ID, audioSource)
localAudioTrack?.setEnabled(!_state.value.isMuted) localAudioTrack?.setEnabled(!_state.value.isMuted)
pc.addTrack(localAudioTrack, listOf(LOCAL_MEDIA_STREAM_ID)) val txInit =
breadcrumb("PC: audio track added, attaching E2EE…") RtpTransceiver.RtpTransceiverInit(
attachSenderE2EE(pc) RtpTransceiver.RtpTransceiverDirection.SEND_RECV,
listOf(LOCAL_MEDIA_STREAM_ID)
)
val transceiver = pc.addTransceiver(localAudioTrack, txInit)
breadcrumb("PC: audio transceiver added, attaching E2EE…")
attachSenderE2EE(transceiver?.sender)
} }
try { try {
@@ -561,16 +600,37 @@ object CallManager {
breadcrumb("PC: connState=$newState") breadcrumb("PC: connState=$newState")
when (newState) { when (newState) {
PeerConnection.PeerConnectionState.CONNECTED -> { PeerConnection.PeerConnectionState.CONNECTED -> {
disconnectResetJob?.cancel()
disconnectResetJob = null
onCallConnected() onCallConnected()
} }
PeerConnection.PeerConnectionState.DISCONNECTED,
PeerConnection.PeerConnectionState.FAILED, PeerConnection.PeerConnectionState.FAILED,
PeerConnection.PeerConnectionState.CLOSED -> { PeerConnection.PeerConnectionState.CLOSED -> {
disconnectResetJob?.cancel()
disconnectResetJob = null
// Dispatch to our scope — this callback fires on WebRTC thread // Dispatch to our scope — this callback fires on WebRTC thread
scope.launch { scope.launch {
resetSession(reason = "Connection lost", notifyPeer = false) resetSession(reason = "Connection lost", notifyPeer = false)
} }
} }
PeerConnection.PeerConnectionState.DISCONNECTED -> {
// Desktop tolerates short network dips; do not kill call immediately.
disconnectResetJob?.cancel()
disconnectResetJob =
scope.launch {
delay(5_000L)
val pcState = peerConnection?.connectionState()
if (pcState == PeerConnection.PeerConnectionState.DISCONNECTED ||
pcState == PeerConnection.PeerConnectionState.FAILED ||
pcState == PeerConnection.PeerConnectionState.CLOSED
) {
breadcrumb("PC: DISCONNECTED timeout → reset")
resetSession(reason = "Connection lost", notifyPeer = false)
} else {
breadcrumb("PC: DISCONNECTED recovered (state=$pcState)")
}
}
}
else -> Unit else -> Unit
} }
} }
@@ -625,6 +685,34 @@ object CallManager {
peerConnectionFactory = PeerConnectionFactory.builder().createPeerConnectionFactory() peerConnectionFactory = PeerConnectionFactory.builder().createPeerConnectionFactory()
} }
private fun emitCallAttachmentIfNeeded(snapshot: CallUiState) {
if (role != CallRole.CALLER) return
val peerPublicKey = snapshot.peerPublicKey.trim()
val context = appContext ?: return
if (peerPublicKey.isBlank()) return
val durationSec = snapshot.durationSec.coerceAtLeast(0)
val callAttachment =
MessageAttachment(
id = java.util.UUID.randomUUID().toString().replace("-", "").take(16),
blob = "",
type = AttachmentType.CALL,
preview = durationSec.toString()
)
scope.launch {
runCatching {
MessageRepository.getInstance(context).sendMessage(
toPublicKey = peerPublicKey,
text = "",
attachments = listOf(callAttachment)
)
}.onFailure { error ->
Log.w(TAG, "Failed to send call attachment", error)
}
}
}
private fun resetSession(reason: String?, notifyPeer: Boolean) { private fun resetSession(reason: String?, notifyPeer: Boolean) {
breadcrumb("RESET: reason=$reason notifyPeer=$notifyPeer phase=${_state.value.phase}") breadcrumb("RESET: reason=$reason notifyPeer=$notifyPeer phase=${_state.value.phase}")
val snapshot = _state.value val snapshot = _state.value
@@ -646,6 +734,7 @@ object CallManager {
if (!reason.isNullOrBlank()) { if (!reason.isNullOrBlank()) {
Log.d(TAG, reason) Log.d(TAG, reason)
} }
emitCallAttachmentIfNeeded(snapshot)
resetRtcObjects() resetRtcObjects()
e2eeAvailable = true e2eeAvailable = true
role = null role = null
@@ -656,6 +745,8 @@ object CallManager {
localPublicKey = null localPublicKey = null
durationJob?.cancel() durationJob?.cancel()
durationJob = null durationJob = null
disconnectResetJob?.cancel()
disconnectResetJob = null
setSpeakerphone(false) setSpeakerphone(false)
_state.value = CallUiState() _state.value = CallUiState()
} }
@@ -732,10 +823,10 @@ object CallManager {
} catch (_: Throwable) {} } catch (_: Throwable) {}
} }
private fun attachSenderE2EE(pc: PeerConnection) { private fun attachSenderE2EE(sender: RtpSender?) {
if (!e2eeAvailable) return if (!e2eeAvailable) return
val key = sharedKeyBytes ?: return val key = sharedKeyBytes ?: return
val sender = pc.senders.firstOrNull() ?: return if (sender == null) return
try { try {
breadcrumb("1. encryptor: nativeLoaded=${XChaCha20E2EE.nativeLoaded}") breadcrumb("1. encryptor: nativeLoaded=${XChaCha20E2EE.nativeLoaded}")

View File

@@ -19,6 +19,7 @@ import androidx.compose.animation.core.tween
import androidx.compose.foundation.Canvas import androidx.compose.foundation.Canvas
import androidx.compose.foundation.Image import androidx.compose.foundation.Image
import androidx.compose.foundation.background import androidx.compose.foundation.background
import androidx.compose.foundation.border
import androidx.compose.foundation.ExperimentalFoundationApi import androidx.compose.foundation.ExperimentalFoundationApi
import androidx.compose.foundation.clickable import androidx.compose.foundation.clickable
import androidx.compose.foundation.combinedClickable import androidx.compose.foundation.combinedClickable
@@ -1555,27 +1556,48 @@ fun ImageAttachment(
} }
} }
private fun parseCallAttachmentPreview(preview: String): Pair<String, String?> { private data class DesktopCallUi(
if (preview.isBlank()) return "Call" to null val title: String,
val subtitle: String,
val isError: Boolean
)
val pieces = preview.split("::") private fun parseCallDurationSeconds(preview: String): Int {
val title = pieces.firstOrNull()?.trim().orEmpty().ifBlank { "Call" } if (preview.isBlank()) return 0
val subtitle = pieces.drop(1).joinToString(" ").trim().ifBlank { null }
val tail = preview.substringAfterLast("::").trim()
tail.toIntOrNull()?.let { return it.coerceAtLeast(0) }
val durationRegex = Regex("duration(?:Sec|Seconds)?\\s*[:=]\\s*(\\d+)", RegexOption.IGNORE_CASE) val durationRegex = Regex("duration(?:Sec|Seconds)?\\s*[:=]\\s*(\\d+)", RegexOption.IGNORE_CASE)
val fallbackDurationRegex = Regex("^(\\d{1,5})$") durationRegex.find(preview)?.groupValues?.getOrNull(1)?.toIntOrNull()?.let {
val durationSec = return it.coerceAtLeast(0)
durationRegex.find(preview)?.groupValues?.getOrNull(1)?.toIntOrNull() }
?: fallbackDurationRegex.find(title)?.groupValues?.getOrNull(1)?.toIntOrNull()
val normalizedSubtitle = return preview.trim().toIntOrNull()?.coerceAtLeast(0) ?: 0
durationSec?.let { sec -> }
val mins = sec / 60
val secs = sec % 60
"Duration ${"%d:%02d".format(mins, secs)}"
} ?: subtitle
return title to normalizedSubtitle private fun formatDesktopCallDuration(durationSec: Int): String {
val minutes = durationSec / 60
val seconds = durationSec % 60
return "$minutes:${seconds.toString().padStart(2, '0')}"
}
private fun resolveDesktopCallUi(preview: String, isOutgoing: Boolean): DesktopCallUi {
val durationSec = parseCallDurationSeconds(preview)
val isError = durationSec == 0
val title =
if (isError) {
if (isOutgoing) "Rejected call" else "Missed call"
} else {
if (isOutgoing) "Outgoing call" else "Incoming call"
}
val subtitle =
if (isError) {
"Call was not answered or was rejected"
} else {
formatDesktopCallDuration(durationSec)
}
return DesktopCallUi(title = title, subtitle = subtitle, isError = isError)
} }
/** Call attachment bubble */ /** Call attachment bubble */
@@ -1587,116 +1609,141 @@ fun CallAttachment(
timestamp: java.util.Date, timestamp: java.util.Date,
messageStatus: MessageStatus = MessageStatus.READ messageStatus: MessageStatus = MessageStatus.READ
) { ) {
val (title, subtitle) = remember(attachment.preview) { parseCallAttachmentPreview(attachment.preview) } val callUi = remember(attachment.preview, isOutgoing) {
resolveDesktopCallUi(attachment.preview, isOutgoing)
Row( }
modifier = Modifier.fillMaxWidth().padding(vertical = 4.dp), val containerShape = RoundedCornerShape(10.dp)
verticalAlignment = Alignment.CenterVertically val containerBackground =
) { if (isOutgoing) {
Box( Color.White.copy(alpha = 0.12f)
modifier = } else {
Modifier.size(40.dp) if (isDarkTheme) Color(0xFF1F2733) else Color(0xFFF3F8FF)
.clip(CircleShape) }
.background( val containerBorder =
if (isOutgoing) { if (isOutgoing) {
Color.White.copy(alpha = 0.18f) Color.White.copy(alpha = 0.2f)
} else { } else {
if (isDarkTheme) Color(0xFF2B3A4D) else Color(0xFFE7F2FF) if (isDarkTheme) Color(0xFF33435A) else Color(0xFFD8E5F4)
} }
), val iconBackground = if (callUi.isError) Color(0xFFE55A5A) else PrimaryBlue
contentAlignment = Alignment.Center val iconVector =
) { when {
Icon( callUi.isError -> Icons.Default.Close
imageVector = Icons.Default.Call, isOutgoing -> Icons.Default.CallMade
contentDescription = null, else -> Icons.Default.CallReceived
tint =
if (isOutgoing) Color.White
else if (isDarkTheme) Color(0xFF8EC9FF) else PrimaryBlue,
modifier = Modifier.size(20.dp)
)
} }
Spacer(modifier = Modifier.width(10.dp)) Box(
modifier =
Modifier
.padding(vertical = 4.dp)
.widthIn(min = 200.dp)
.heightIn(min = 60.dp)
.clip(containerShape)
.background(containerBackground)
.border(width = 1.dp, color = containerBorder, shape = containerShape)
.padding(horizontal = 10.dp, vertical = 8.dp)
) {
Row(
verticalAlignment = Alignment.CenterVertically
) {
Box(
modifier =
Modifier.size(40.dp)
.clip(CircleShape)
.background(iconBackground),
contentAlignment = Alignment.Center
) {
Icon(
imageVector = iconVector,
contentDescription = null,
tint = Color.White,
modifier = Modifier.size(20.dp)
)
}
Column(modifier = Modifier.weight(1f)) { Spacer(modifier = Modifier.width(10.dp))
Text(
text = title, Column(modifier = Modifier.weight(1f)) {
fontSize = 14.sp,
fontWeight = FontWeight.Medium,
color = if (isOutgoing) Color.White else if (isDarkTheme) Color.White else Color.Black,
maxLines = 1,
overflow = TextOverflow.Ellipsis
)
if (!subtitle.isNullOrBlank()) {
Spacer(modifier = Modifier.height(2.dp))
Text( Text(
text = subtitle, text = callUi.title,
fontSize = 12.sp, fontSize = 14.sp,
color = fontWeight = FontWeight.Medium,
if (isOutgoing) { color = if (isOutgoing) Color.White else if (isDarkTheme) Color.White else Color.Black,
Color.White.copy(alpha = 0.7f)
} else {
if (isDarkTheme) Color(0xFF8BA0B8) else Color(0xFF5E6E82)
},
maxLines = 1, maxLines = 1,
overflow = TextOverflow.Ellipsis overflow = TextOverflow.Ellipsis
) )
} Spacer(modifier = Modifier.height(2.dp))
}
if (isOutgoing) {
Spacer(modifier = Modifier.width(8.dp))
Row(verticalAlignment = Alignment.CenterVertically) {
Text( Text(
text = android.text.format.DateFormat.format("HH:mm", timestamp).toString(), text = callUi.subtitle,
fontSize = 11.sp, fontSize = 12.sp,
color = Color.White.copy(alpha = 0.7f) color =
if (callUi.isError) {
Color(0xFFE55A5A)
} else if (isOutgoing) {
Color.White.copy(alpha = 0.72f)
} else {
if (isDarkTheme) Color(0xFF8EC9FF) else PrimaryBlue
},
maxLines = 1,
overflow = TextOverflow.Ellipsis
) )
Spacer(modifier = Modifier.width(4.dp)) }
when (messageStatus) {
MessageStatus.SENDING -> { if (isOutgoing) {
Icon( Spacer(modifier = Modifier.width(8.dp))
painter = TelegramIcons.Clock, Row(verticalAlignment = Alignment.CenterVertically) {
contentDescription = null, Text(
tint = Color.White.copy(alpha = 0.7f), text = android.text.format.DateFormat.format("HH:mm", timestamp).toString(),
modifier = Modifier.size(14.dp) fontSize = 11.sp,
) color = Color.White.copy(alpha = 0.7f)
} )
MessageStatus.SENT, MessageStatus.DELIVERED -> { Spacer(modifier = Modifier.width(4.dp))
Icon( when (messageStatus) {
painter = TelegramIcons.Done, MessageStatus.SENDING -> {
contentDescription = null,
tint = Color.White.copy(alpha = 0.8f),
modifier = Modifier.size(14.dp)
)
}
MessageStatus.READ -> {
Box(modifier = Modifier.height(14.dp)) {
Icon( Icon(
painter = TelegramIcons.Done, painter = TelegramIcons.Clock,
contentDescription = null, contentDescription = null,
tint = Color.White, tint = Color.White.copy(alpha = 0.7f),
modifier = Modifier.size(14.dp) modifier = Modifier.size(14.dp)
) )
}
MessageStatus.SENT, MessageStatus.DELIVERED -> {
Icon( Icon(
painter = TelegramIcons.Done, painter = TelegramIcons.Done,
contentDescription = null, contentDescription = null,
tint = Color.White, tint = Color.White.copy(alpha = 0.8f),
modifier = Modifier.size(14.dp).offset(x = 4.dp) modifier = Modifier.size(14.dp)
)
}
MessageStatus.READ -> {
Box(modifier = Modifier.height(14.dp)) {
Icon(
painter = TelegramIcons.Done,
contentDescription = null,
tint = Color.White,
modifier = Modifier.size(14.dp)
)
Icon(
painter = TelegramIcons.Done,
contentDescription = null,
tint = Color.White,
modifier = Modifier.size(14.dp).offset(x = 4.dp)
)
}
}
MessageStatus.ERROR -> {
Icon(
imageVector = Icons.Default.Error,
contentDescription = null,
tint = Color(0xFFE53935),
modifier = Modifier.size(14.dp)
) )
} }
} }
MessageStatus.ERROR -> {
Icon(
imageVector = Icons.Default.Error,
contentDescription = null,
tint = Color(0xFFE53935),
modifier = Modifier.size(14.dp)
)
}
} }
} }
} }
} }
} }

View File

@@ -0,0 +1,76 @@
# Custom WebRTC for Rosetta Android (Audio E2EE Timestamp)
This setup builds a custom `libwebrtc.aar` for Android and patches audio E2EE so
`FrameEncryptor/FrameDecryptor` receive non-empty `additional_data` with RTP timestamp bytes.
## Why
Stock `io.github.webrtc-sdk:android:125.6422.07` can call audio frame encryptor with empty
`additional_data` (`ad=0`), so nonce derivation based on timestamp is unavailable.
Desktop uses frame timestamp for nonce. This patch aligns Android with that approach by passing
an 8-byte big-endian timestamp payload in `additional_data`:
- bytes `0..3` = `0`
- bytes `4..7` = RTP timestamp (big-endian)
## Files
- `build_custom_webrtc.sh` — reproducible build script
- `patches/0001-audio-e2ee-pass-rtp-timestamp-as-additional-data.patch` — WebRTC patch
## Build
Recommended on Linux (macOS can work but is less predictable for long WebRTC builds).
Bootstrap `depot_tools` first:
```bash
cd /path/to/rosetta-android/tools/webrtc-custom
./bootstrap_depot_tools.sh
```
Then run:
```bash
cd /path/to/rosetta-android/tools/webrtc-custom
./build_custom_webrtc.sh
```
Optional env vars:
- `WEBRTC_ROOT` — checkout root (default: `$HOME/webrtc_android`)
- `WEBRTC_SRC` — direct path to `src/`
- `WEBRTC_BRANCH` — default `branch-heads/6422`
- `WEBRTC_TAG` — use a specific tag/commit instead of branch
- `OUT_AAR` — output AAR path (default: `app/libs/libwebrtc-custom.aar`)
- `SYNC_JOBS``gclient sync` jobs (default: `1`, safer for googlesource limits)
- `SYNC_RETRIES` — sync retry attempts (default: `8`)
- `SYNC_RETRY_BASE_SEC` — base retry delay in seconds (default: `20`)
## Troubleshooting (HTTP 429 / RESOURCE_EXHAUSTED)
If build fails with:
- `The requested URL returned error: 429`
- `RESOURCE_EXHAUSTED`
- `Short term server-time rate limit exceeded`
run with conservative sync settings:
```bash
SYNC_JOBS=1 SYNC_RETRIES=12 SYNC_RETRY_BASE_SEC=30 ./build_custom_webrtc.sh
```
The script now retries `fetch`, `git fetch`, and `gclient sync` with backoff.
## Integration in app
`app/build.gradle.kts` already prefers local `app/libs/libwebrtc-custom.aar` if present.
If file exists, Maven WebRTC dependency is not used.
## Maintenance policy
- Keep patch small and isolated to `audio/channel_send.cc` + `audio/channel_receive.cc`.
- Pin WebRTC branch/tag for releases.
- Rebuild AAR on version bumps and verify `e2ee_diag.txt` shows `ad=8` (or non-zero).

View File

@@ -0,0 +1,13 @@
#!/usr/bin/env bash
set -euo pipefail
DEPOT_TOOLS_DIR="${DEPOT_TOOLS_DIR:-$HOME/depot_tools}"
if [[ ! -d "${DEPOT_TOOLS_DIR}/.git" ]]; then
git clone https://chromium.googlesource.com/chromium/tools/depot_tools.git "${DEPOT_TOOLS_DIR}"
fi
echo
echo "depot_tools ready: ${DEPOT_TOOLS_DIR}"
echo "Add to PATH in your shell profile:"
echo " export PATH=\"${DEPOT_TOOLS_DIR}:\$PATH\""

View File

@@ -0,0 +1,154 @@
#!/usr/bin/env bash
set -euo pipefail
# Reproducible custom WebRTC AAR build for Rosetta Android.
# Requirements:
# - Linux machine
# - depot_tools in PATH
# - python3, git
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
ROSETTA_ANDROID_DIR="$(cd "${SCRIPT_DIR}/../.." && pwd)"
PATCH_FILE="${SCRIPT_DIR}/patches/0001-audio-e2ee-pass-rtp-timestamp-as-additional-data.patch"
# Default target: WebRTC M125 family used by app dependency 125.6422.07.
WEBRTC_BRANCH="${WEBRTC_BRANCH:-branch-heads/6422}"
WEBRTC_TAG="${WEBRTC_TAG:-}"
# Source checkout root (contains src/)
WEBRTC_ROOT="${WEBRTC_ROOT:-$HOME/webrtc_android}"
WEBRTC_SRC="${WEBRTC_SRC:-${WEBRTC_ROOT}/src}"
# Output AAR consumed by app/build.gradle.kts.
OUT_AAR="${OUT_AAR:-${ROSETTA_ANDROID_DIR}/app/libs/libwebrtc-custom.aar}"
# Sync tuning to survive chromium.googlesource short-term 429 limits.
SYNC_JOBS="${SYNC_JOBS:-1}"
SYNC_RETRIES="${SYNC_RETRIES:-8}"
SYNC_RETRY_BASE_SEC="${SYNC_RETRY_BASE_SEC:-20}"
# Architectures used by the app.
ARCHS=("armeabi-v7a" "arm64-v8a" "x86_64")
echo "[webrtc-custom] root: ${WEBRTC_ROOT}"
echo "[webrtc-custom] src: ${WEBRTC_SRC}"
echo "[webrtc-custom] out: ${OUT_AAR}"
echo "[webrtc-custom] sync jobs: ${SYNC_JOBS}, retries: ${SYNC_RETRIES}"
# Keep depot_tools from auto-updating during long runs.
export DEPOT_TOOLS_UPDATE=0
retry_cmd() {
local max_attempts="$1"
shift
local attempt=1
local backoff="${SYNC_RETRY_BASE_SEC}"
while true; do
if "$@"; then
return 0
fi
if (( attempt >= max_attempts )); then
return 1
fi
echo "[webrtc-custom] attempt ${attempt}/${max_attempts} failed, retrying in ${backoff}s: $*"
sleep "${backoff}"
backoff=$(( backoff * 2 ))
if (( backoff > 300 )); then
backoff=300
fi
attempt=$(( attempt + 1 ))
done
}
sync_with_retry() {
local attempt=1
while true; do
# Heal known broken checkout state after interrupted/failed gclient runs.
if [[ -d "${WEBRTC_SRC}/third_party/libjpeg_turbo/.git" ]]; then
git -C "${WEBRTC_SRC}/third_party/libjpeg_turbo" reset --hard >/dev/null 2>&1 || true
git -C "${WEBRTC_SRC}/third_party/libjpeg_turbo" clean -fd >/dev/null 2>&1 || true
fi
if [[ -d "${WEBRTC_ROOT}/_bad_scm/src/third_party" ]]; then
find "${WEBRTC_ROOT}/_bad_scm/src/third_party" -maxdepth 1 -type d -name 'libjpeg_turbo*' -exec rm -rf {} + >/dev/null 2>&1 || true
fi
if gclient sync -D --jobs "${SYNC_JOBS}"; then
return 0
fi
if (( attempt >= SYNC_RETRIES )); then
echo "[webrtc-custom] ERROR: gclient sync failed after ${SYNC_RETRIES} attempts"
echo "[webrtc-custom] Tip: wait 10-15 min and rerun with lower burst:"
echo "[webrtc-custom] SYNC_JOBS=1 SYNC_RETRIES=12 ./build_custom_webrtc.sh"
return 1
fi
local wait_sec=$(( SYNC_RETRY_BASE_SEC * attempt ))
if (( wait_sec > 300 )); then
wait_sec=300
fi
echo "[webrtc-custom] gclient sync failed (attempt ${attempt}/${SYNC_RETRIES}), sleeping ${wait_sec}s..."
sleep "${wait_sec}"
attempt=$(( attempt + 1 ))
done
}
if ! command -v fetch >/dev/null 2>&1; then
echo "[webrtc-custom] ERROR: depot_tools 'fetch' not found in PATH"
exit 1
fi
if [[ ! -d "${WEBRTC_SRC}/.git" ]]; then
echo "[webrtc-custom] checkout not found, fetching webrtc_android..."
mkdir -p "${WEBRTC_ROOT}"
pushd "${WEBRTC_ROOT}" >/dev/null
retry_cmd "${SYNC_RETRIES}" fetch --nohooks --no-history webrtc_android
sync_with_retry
popd >/dev/null
fi
pushd "${WEBRTC_SRC}" >/dev/null
echo "[webrtc-custom] syncing source..."
retry_cmd "${SYNC_RETRIES}" git fetch --all --tags
if [[ -n "${WEBRTC_TAG}" ]]; then
retry_cmd "${SYNC_RETRIES}" git checkout "${WEBRTC_TAG}"
else
if git show-ref --verify --quiet "refs/remotes/origin/${WEBRTC_BRANCH}"; then
retry_cmd "${SYNC_RETRIES}" git checkout -B "${WEBRTC_BRANCH}" "origin/${WEBRTC_BRANCH}"
else
retry_cmd "${SYNC_RETRIES}" git checkout "${WEBRTC_BRANCH}"
fi
if git rev-parse --abbrev-ref --symbolic-full-name '@{u}' >/dev/null 2>&1; then
retry_cmd "${SYNC_RETRIES}" git pull --ff-only
else
echo "[webrtc-custom] no upstream for current branch, skipping git pull"
fi
fi
sync_with_retry
echo "[webrtc-custom] applying Rosetta patch..."
git reset --hard
git apply --check "${PATCH_FILE}"
git apply "${PATCH_FILE}"
mkdir -p "$(dirname "${OUT_AAR}")"
echo "[webrtc-custom] building AAR (this can take a while)..."
python3 tools_webrtc/android/build_aar.py \
--build-dir out_rosetta_aar \
--output "${OUT_AAR}" \
--arch "${ARCHS[@]}" \
--extra-gn-args \
is_debug=false \
is_component_build=false \
rtc_include_tests=false \
rtc_build_examples=false
echo "[webrtc-custom] done"
echo "[webrtc-custom] AAR: ${OUT_AAR}"
popd >/dev/null

View File

@@ -0,0 +1,54 @@
diff --git a/audio/channel_receive.cc b/audio/channel_receive.cc
index 17cf859ed8..b9d9ab14c8 100644
--- a/audio/channel_receive.cc
+++ b/audio/channel_receive.cc
@@ -693,10 +693,20 @@ void ChannelReceive::ReceivePacket(const uint8_t* packet,
const std::vector<uint32_t> csrcs(header.arrOfCSRCs,
header.arrOfCSRCs + header.numCSRCs);
+ const uint8_t additional_data_bytes[8] = {
+ 0,
+ 0,
+ 0,
+ 0,
+ static_cast<uint8_t>((header.timestamp >> 24) & 0xff),
+ static_cast<uint8_t>((header.timestamp >> 16) & 0xff),
+ static_cast<uint8_t>((header.timestamp >> 8) & 0xff),
+ static_cast<uint8_t>(header.timestamp & 0xff),
+ };
const FrameDecryptorInterface::Result decrypt_result =
frame_decryptor_->Decrypt(
cricket::MEDIA_TYPE_AUDIO, csrcs,
- /*additional_data=*/nullptr,
+ /*additional_data=*/additional_data_bytes,
rtc::ArrayView<const uint8_t>(payload, payload_data_length),
decrypted_audio_payload);
diff --git a/audio/channel_send.cc b/audio/channel_send.cc
index 4a2700177b..93283c2e78 100644
--- a/audio/channel_send.cc
+++ b/audio/channel_send.cc
@@ -320,10 +320,21 @@ int32_t ChannelSend::SendRtpAudio(AudioFrameType frameType,
// Encrypt the audio payload into the buffer.
size_t bytes_written = 0;
+ const uint8_t additional_data_bytes[8] = {
+ 0,
+ 0,
+ 0,
+ 0,
+ static_cast<uint8_t>((rtp_timestamp_without_offset >> 24) & 0xff),
+ static_cast<uint8_t>((rtp_timestamp_without_offset >> 16) & 0xff),
+ static_cast<uint8_t>((rtp_timestamp_without_offset >> 8) & 0xff),
+ static_cast<uint8_t>(rtp_timestamp_without_offset & 0xff),
+ };
+
int encrypt_status = frame_encryptor_->Encrypt(
cricket::MEDIA_TYPE_AUDIO, rtp_rtcp_->SSRC(),
- /*additional_data=*/nullptr, payload, encrypted_audio_payload,
- &bytes_written);
+ /*additional_data=*/additional_data_bytes, payload,
+ encrypted_audio_payload, &bytes_written);
if (encrypt_status != 0) {
RTC_DLOG(LS_ERROR)
<< "Channel::SendData() failed encrypt audio payload: "