Skip to content

Commit 0e41c7d

Browse files
committed
Cleanup type conversions in java_bytecode_parsert::read
We can safely read signed values and don't need to defer the type conversion to the call site.
1 parent 66004dc commit 0e41c7d

File tree

1 file changed

+21
-24
lines changed

1 file changed

+21
-24
lines changed

jbmc/src/java_bytecode/java_bytecode_parser.cpp

+21-24
Original file line numberDiff line numberDiff line change
@@ -132,20 +132,17 @@ class java_bytecode_parsert final : public parsert
132132
T read()
133133
{
134134
static_assert(
135-
std::is_unsigned<T>::value, "T should be an unsigned integer");
135+
std::is_unsigned<T>::value || std::is_signed<T>::value,
136+
"T should be a signed or unsigned integer");
136137
const constexpr size_t bytes = sizeof(T);
137-
u8 result = 0;
138-
for(size_t i = 0; i < bytes; i++)
138+
T result;
139+
in->read(reinterpret_cast<char *>(&result), bytes);
140+
if(!*in || static_cast<std::size_t>(in->gcount()) < bytes)
139141
{
140-
if(!*in)
141-
{
142-
log.error() << "unexpected end of bytecode file" << messaget::eom;
143-
throw 0;
144-
}
145-
result <<= 8u;
146-
result |= static_cast<u1>(in->get());
142+
log.error() << "unexpected end of bytecode file" << messaget::eom;
143+
throw 0;
147144
}
148-
return narrow_cast<T>(result);
145+
return result;
149146
}
150147

151148
void store_unknown_method_handle(size_t bootstrap_method_index);
@@ -942,15 +939,15 @@ void java_bytecode_parsert::rbytecode(std::vector<instructiont> &instructions)
942939

943940
case 'b': // a signed byte
944941
{
945-
const s1 c = read<u1>();
942+
const s1 c = read<s1>();
946943
instruction.args.push_back(from_integer(c, signedbv_typet(8)));
947944
}
948945
address+=1;
949946
break;
950947

951948
case 'o': // two byte branch offset, signed
952949
{
953-
const s2 offset = read<u2>();
950+
const s2 offset = read<s2>();
954951
// By converting the signed offset into an absolute address (by adding
955952
// the current address) the number represented becomes unsigned.
956953
instruction.args.push_back(
@@ -961,7 +958,7 @@ void java_bytecode_parsert::rbytecode(std::vector<instructiont> &instructions)
961958

962959
case 'O': // four byte branch offset, signed
963960
{
964-
const s4 offset = read<u4>();
961+
const s4 offset = read<s4>();
965962
// By converting the signed offset into an absolute address (by adding
966963
// the current address) the number represented becomes unsigned.
967964
instruction.args.push_back(
@@ -994,15 +991,15 @@ void java_bytecode_parsert::rbytecode(std::vector<instructiont> &instructions)
994991
{
995992
const u2 v = read<u2>();
996993
instruction.args.push_back(from_integer(v, unsignedbv_typet(16)));
997-
const s2 c = read<u2>();
994+
const s2 c = read<s2>();
998995
instruction.args.push_back(from_integer(c, signedbv_typet(16)));
999996
address+=4;
1000997
}
1001998
else // local variable index (one byte) plus one signed byte
1002999
{
10031000
const u1 v = read<u1>();
10041001
instruction.args.push_back(from_integer(v, unsignedbv_typet(8)));
1005-
const s1 c = read<u1>();
1002+
const s1 c = read<s1>();
10061003
instruction.args.push_back(from_integer(c, signedbv_typet(8)));
10071004
address+=2;
10081005
}
@@ -1032,7 +1029,7 @@ void java_bytecode_parsert::rbytecode(std::vector<instructiont> &instructions)
10321029
}
10331030

10341031
// now default value
1035-
const s4 default_value = read<u4>();
1032+
const s4 default_value = read<s4>();
10361033
// By converting the signed offset into an absolute address (by adding
10371034
// the current address) the number represented becomes unsigned.
10381035
instruction.args.push_back(
@@ -1045,8 +1042,8 @@ void java_bytecode_parsert::rbytecode(std::vector<instructiont> &instructions)
10451042

10461043
for(std::size_t i=0; i<npairs; i++)
10471044
{
1048-
const s4 match = read<u4>();
1049-
const s4 offset = read<u4>();
1045+
const s4 match = read<s4>();
1046+
const s4 offset = read<s4>();
10501047
instruction.args.push_back(
10511048
from_integer(match, signedbv_typet(32)));
10521049
// By converting the signed offset into an absolute address (by adding
@@ -1070,23 +1067,23 @@ void java_bytecode_parsert::rbytecode(std::vector<instructiont> &instructions)
10701067
}
10711068

10721069
// now default value
1073-
const s4 default_value = read<u4>();
1070+
const s4 default_value = read<s4>();
10741071
instruction.args.push_back(
10751072
from_integer(base_offset+default_value, signedbv_typet(32)));
10761073
address+=4;
10771074

10781075
// now low value
1079-
const s4 low_value = read<u4>();
1076+
const s4 low_value = read<s4>();
10801077
address+=4;
10811078

10821079
// now high value
1083-
const s4 high_value = read<u4>();
1080+
const s4 high_value = read<s4>();
10841081
address+=4;
10851082

10861083
// there are high-low+1 offsets, and they are signed
10871084
for(s4 i=low_value; i<=high_value; i++)
10881085
{
1089-
s4 offset = read<u4>();
1086+
s4 offset = read<s4>();
10901087
instruction.args.push_back(from_integer(i, signedbv_typet(32)));
10911088
// By converting the signed offset into an absolute address (by adding
10921089
// the current address) the number represented becomes unsigned.
@@ -1130,7 +1127,7 @@ void java_bytecode_parsert::rbytecode(std::vector<instructiont> &instructions)
11301127

11311128
case 's': // a signed short
11321129
{
1133-
const s2 s = read<u2>();
1130+
const s2 s = read<s2>();
11341131
instruction.args.push_back(from_integer(s, signedbv_typet(16)));
11351132
}
11361133
address+=2;

0 commit comments

Comments
 (0)