Skip to content

Commit

Permalink
Merge pull request atomvm#1483 from pguyot/w04/fix-binary-split
Browse files Browse the repository at this point in the history
Fix memory corruption caused by `binary:split/2,3`

These changes are made under both the "Apache 2.0" and the "GNU Lesser General
Public License 2.1 or later" license terms (dual license).

SPDX-License-Identifier: Apache-2.0 OR LGPL-2.1-or-later
  • Loading branch information
bettio committed Jan 22, 2025
2 parents af48881 + a44111e commit 09783b4
Show file tree
Hide file tree
Showing 5 changed files with 71 additions and 30 deletions.
1 change: 1 addition & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -32,6 +32,7 @@ certain VM instructions are used.
- Fixed a double free when esp32 uart driver was closed, yielding an assert abort
- Fixed compilation with latest debian gcc-arm-none-eabi
- Fix `network:stop/0` on ESP32 so the network can be started again
- Fix a memory corruption caused by `binary:split/2,3`

## [0.6.5] - 2024-10-15

Expand Down
6 changes: 5 additions & 1 deletion src/libAtomVM/nifs.c
Original file line number Diff line number Diff line change
Expand Up @@ -3121,15 +3121,19 @@ static term nif_binary_split(Context *ctx, int argc, term argv[])
size_t num_segments = 1;
const char *temp_bin_data = bin_data;
int temp_bin_size = bin_size;
size_t heap_size = 0;
do {
const char *found = (const char *) memmem(temp_bin_data, temp_bin_size, pattern_data, pattern_size);
if (!found) break;
num_segments++;
heap_size += CONS_SIZE + term_sub_binary_heap_size(argv[0], found - temp_bin_data);
int next_search_offset = found - temp_bin_data + pattern_size;
temp_bin_data += next_search_offset;
temp_bin_size -= next_search_offset;
} while (global && temp_bin_size >= pattern_size);

heap_size += CONS_SIZE + term_sub_binary_heap_size(argv[0], temp_bin_size);

term result_list = term_nil();

if (num_segments == 1) {
Expand All @@ -3142,7 +3146,7 @@ static term nif_binary_split(Context *ctx, int argc, term argv[])
}

// binary:split/2,3 always return sub binaries, except when copied binaries are as small as sub-binaries.
if (UNLIKELY(memory_ensure_free_with_roots(ctx, LIST_SIZE(num_segments, TERM_BOXED_SUB_BINARY_SIZE), 2, argv, MEMORY_CAN_SHRINK) != MEMORY_GC_OK)) {
if (UNLIKELY(memory_ensure_free_with_roots(ctx, heap_size, 2, argv, MEMORY_CAN_SHRINK) != MEMORY_GC_OK)) {
RAISE_ERROR(OUT_OF_MEMORY_ATOM);
}

Expand Down
2 changes: 1 addition & 1 deletion src/libAtomVM/term.h
Original file line number Diff line number Diff line change
Expand Up @@ -1068,7 +1068,7 @@ static inline term term_from_literal_binary(const void *data, size_t size, Heap
*/
static inline size_t term_sub_binary_heap_size(term binary, size_t len)
{
if (term_is_refc_binary(binary) && len >= SUB_BINARY_MIN) {
if ((term_is_refc_binary(binary) || term_is_sub_binary(binary)) && len >= SUB_BINARY_MIN) {
return TERM_BOXED_SUB_BINARY_SIZE;
} else {
return term_binary_heap_size(len);
Expand Down
90 changes: 63 additions & 27 deletions tests/erlang_tests/test_binary_split.erl
Original file line number Diff line number Diff line change
Expand Up @@ -20,63 +20,99 @@

-module(test_binary_split).

-export([start/0, split_compare/3, split_compare/2, compare_bin/2, fail_split/1]).
-export([start/0, split_compare/3, split_compare/2, compare_bin/2, fail_split/1, id/1]).

start() ->
split_compare(<<"Hello:World">>, <<"Hello">>, <<"World">>) +
split_compare(<<"Hello:::World:">>, <<"Hello">>, <<"::World:">>) +
split_compare(<<"Test:">>, <<"Test">>, <<>>) +
split_compare(<<":">>, <<>>, <<>>) +
split_compare(<<>>, <<>>) +
split_compare(<<"Test">>, <<>>) +
split_compare2(<<"Test">>, <<>>) +
split_compare2(<<"helloSEPARATORworld">>, <<"hello">>, <<"world">>) +
fail_split(<<>>) +
fail_split({1, 2}) +
fail_split2({1, 2}).
ok = split_compare(<<"Hello:World">>, <<"Hello">>, <<"World">>),
ok = split_compare(<<"Hello:::World:">>, <<"Hello">>, <<"::World:">>),
ok = split_compare(<<"Test:">>, <<"Test">>, <<>>),
ok = split_compare(<<":">>, <<>>, <<>>),
ok = split_compare(<<>>, <<>>),
ok = split_compare(<<"Test">>, <<>>),
ok = split_compare2(<<"Test">>, <<>>),
ok = split_compare2(<<"helloSEPARATORworld">>, <<"hello">>, <<"world">>),
ok = fail_split(<<>>),
ok = fail_split({1, 2}),
ok = fail_split2({1, 2}),
case erlang:system_info(machine) of
"BEAM" -> ok;
"ATOM" -> ok = memory_allocation_split()
end,
0.

split_compare(Bin, Part1) ->
[A] = binary:split(Bin, <<":">>),
compare_bin(Part1, A).

split_compare(Bin, Part1, Part2) ->
[A, B] = binary:split(Bin, <<":">>),
compare_bin(Part1, A) + compare_bin(B, Part2).
ok = compare_bin(Part1, A),
ok = compare_bin(B, Part2).

split_compare2(Bin, Part1) ->
[A] = binary:split(Bin, <<"SEPARATOR">>),
compare_bin(Part1, A).

split_compare2(Bin, Part1, Part2) ->
[A, B] = binary:split(Bin, <<"SEPARATOR">>),
compare_bin(Part1, A) + compare_bin(B, Part2).
ok = compare_bin(Part1, A),
ok = compare_bin(B, Part2).

compare_bin(Bin1, Bin2) ->
compare_bin(Bin1, Bin2, byte_size(Bin1) - 1).

compare_bin(_Bin1, _Bin2, -1) ->
1;
ok;
compare_bin(Bin1, Bin2, Index) ->
B1 = binary:at(Bin1, Index),
case binary:at(Bin2, Index) of
B1 ->
compare_bin(Bin1, Bin2, Index - 1);
_Any ->
0
end.
B1 = binary:at(Bin2, Index),
compare_bin(Bin1, Bin2, Index - 1).

fail_split(Separator) ->
try binary:split(<<"TESTBIN">>, Separator) of
_Any -> 2000
_Any -> {unexpected, _Any}
catch
error:badarg -> 1;
_:_ -> 4000
error:badarg -> ok;
T:V -> {unexpected, {T, V}}
end.

fail_split2(Bin) ->
try binary:split(Bin, <<"TESTSEPARATOR">>) of
_Any -> 2000
_Any -> {unxpected, _Any}
catch
error:badarg -> 1;
_:_ -> 4000
error:badarg -> ok;
T:V -> {unxpected, {T, V}}
end.

memory_allocation_split() ->
Parent = self(),
Hostname = <<"atomvm">>,
{Pid, MonitorRef} = spawn_opt(
fun() ->
% Carefully designed lists to generate a crash on unix 64 bits
% This binary is 63 bytes long, so it's stored on heap on 64 bits
% binary:split should allocate sufficient bytes as subbinaries
% have to be on heap as well
HeapBin = list_to_binary([
id(Hostname), <<"@atomvms3.object.stream.atomvms3.object.stream.atomvms3.o">>
]),
List1 = binary:split(HeapBin, <<"@">>, [global]),
Parent ! {self(), List1}
end,
[link, monitor, {atomvm_heap_growth, minimum}]
),
ok =
receive
{Pid, List1} ->
2 = length(List1),
ok
after 5000 -> timeout
end,
normal =
receive
{'DOWN', MonitorRef, process, Pid, Reason} -> Reason
after 5000 -> timeout
end,
ok.

id(X) -> X.
2 changes: 1 addition & 1 deletion tests/test.c
Original file line number Diff line number Diff line change
Expand Up @@ -318,7 +318,7 @@ struct Test tests[] = {
TEST_CASE(test_unicode),

TEST_CASE_EXPECTED(test_binary_part, 12),
TEST_CASE_EXPECTED(test_binary_split, 16),
TEST_CASE(test_binary_split),

TEST_CASE_COND(plusone, 134217728, LONG_MAX != 9223372036854775807),

Expand Down

0 comments on commit 09783b4

Please sign in to comment.