Skip to content

Commit e45b605

Browse files
authored
Fix long encoding (#3303)
1 parent 3395f4b commit e45b605

File tree

3 files changed

+50
-11
lines changed

3 files changed

+50
-11
lines changed

lang/php/lib/Datum/AvroIOBinaryDecoder.php

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -124,7 +124,7 @@ public static function decodeLongFromArray($bytes)
124124
$n |= (($b & 0x7f) << $shift);
125125
$shift += 7;
126126
}
127-
return (($n >> 1) ^ -($n & 1));
127+
return ($n >> 1) ^ (($n >> 63) << 63) ^ -($n & 1);
128128
}
129129

130130
/**

lang/php/lib/Datum/AvroIOBinaryEncoder.php

Lines changed: 17 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -101,13 +101,24 @@ public static function encodeLong($n)
101101
{
102102
$n = (int) $n;
103103
$n = ($n << 1) ^ ($n >> 63);
104-
$str = '';
105-
while (0 != ($n & ~0x7F)) {
106-
$str .= chr(($n & 0x7F) | 0x80);
107-
$n >>= 7;
104+
105+
if ($n >= 0 && $n < 0x80) {
106+
return chr($n);
108107
}
109-
$str .= chr($n);
110-
return $str;
108+
109+
$buf = [];
110+
if (($n & ~0x7F) != 0) {
111+
$buf[] = ($n | 0x80) & 0xFF;
112+
$n = ($n >> 7) ^ (($n >> 63) << 57); // unsigned shift right ($n >>> 7)
113+
114+
while ($n > 0x7F) {
115+
$buf[] = ($n | 0x80) & 0xFF;
116+
$n >>= 7; // $n is always positive here
117+
}
118+
}
119+
120+
$buf[] = $n;
121+
return pack("C*", ...$buf);
111122
}
112123

113124
/**

lang/php/test/DatumIOTest.php

Lines changed: 32 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -28,6 +28,12 @@
2828
use Apache\Avro\Schema\AvroSchema;
2929
use PHPUnit\Framework\TestCase;
3030

31+
/**
32+
* @covers AvroIOBinaryDecoder
33+
* @covers AvroIOBinaryEncoder
34+
* @covers AvroIODatumReader
35+
* @covers AvroIODatumWriter
36+
*/
3137
class DatumIOTest extends TestCase
3238
{
3339
/**
@@ -68,11 +74,33 @@ function data_provider()
6874
array('"int"', 1, "\002"),
6975
array('"int"', 2147483647, "\xFE\xFF\xFF\xFF\x0F"),
7076

71-
// array('"long"', (int) -9223372036854775808, "\001"),
77+
array('"long"', (int) -9223372036854775808, "\xFF\xFF\xFF\xFF\xFF\xFF\xFF\xFF\xFF\x01"),
78+
array('"long"', -(1<<62), "\xFF\xFF\xFF\xFF\xFF\xFF\xFF\xFF\x7F"),
79+
array('"long"', -(1<<61), "\xFF\xFF\xFF\xFF\xFF\xFF\xFF\xFF\x3F"),
80+
array('"long"', -4294967295, "\xFD\xFF\xFF\xFF\x1F"),
81+
array('"long"', -1<<24, "\xFF\xFF\xFF\x0F"),
82+
array('"long"', -1<<16, "\xFF\xFF\x07"),
83+
array('"long"', -255, "\xFD\x03"),
84+
array('"long"', -128, "\xFF\x01"),
85+
array('"long"', -127, "\xFD\x01"),
86+
array('"long"', -10, "\x13"),
87+
array('"long"', -3, "\005"),
88+
array('"long"', -2, "\003"),
7289
array('"long"', -1, "\001"),
73-
array('"long"', 0, "\000"),
74-
array('"long"', 1, "\002"),
75-
// array('"long"', 9223372036854775807, "\002")
90+
array('"long"', 0, "\000"),
91+
array('"long"', 1, "\002"),
92+
array('"long"', 2, "\004"),
93+
array('"long"', 3, "\006"),
94+
array('"long"', 10, "\x14"),
95+
array('"long"', 127, "\xFE\x01"),
96+
array('"long"', 128, "\x80\x02"),
97+
array('"long"', 255, "\xFE\x03"),
98+
array('"long"', 1<<16, "\x80\x80\x08"),
99+
array('"long"', 1<<24, "\x80\x80\x80\x10"),
100+
array('"long"', 4294967295, "\xFE\xFF\xFF\xFF\x1F"),
101+
array('"long"', 1<<61, "\x80\x80\x80\x80\x80\x80\x80\x80\x40"),
102+
array('"long"', 1<<62, "\x80\x80\x80\x80\x80\x80\x80\x80\x80\x01"),
103+
array('"long"', 9223372036854775807, "\xFE\xFF\xFF\xFF\xFF\xFF\xFF\xFF\xFF\x01"),
76104

77105
array('"float"', (float) -10.0, "\000\000 \301"),
78106
array('"float"', (float) -1.0, "\000\000\200\277"),

0 commit comments

Comments
 (0)