mirror of
https://github.com/NationalSecurityAgency/ghidra.git
synced 2026-05-29 05:29:43 +08:00
Merge remote-tracking branch 'origin/patch'
This commit is contained in:
+6
-3
@@ -277,15 +277,18 @@ public class RandomForestTrainingTask extends Task {
|
||||
monitor.setMessage(
|
||||
"Selecting " + numEntries * factor + " random addresses within function interiors");
|
||||
start = System.nanoTime();
|
||||
AddressSetView randomFuncInteriors =
|
||||
RandomSubsetUtils.randomSubset(selectableInteriors, numEntries * factor, monitor);
|
||||
long numInteriors = numEntries * factor;
|
||||
|
||||
AddressSetView randomFuncInteriors = numInteriors < selectableInteriors.getNumAddresses()
|
||||
? RandomSubsetUtils.randomSubset(selectableInteriors, numInteriors, monitor)
|
||||
: selectableInteriors;
|
||||
end = System.nanoTime();
|
||||
Msg.info(this, String.format("factor: %d elapsed selecting random interiors: %g seconds",
|
||||
factor, (end - start) / NANOSECONDS_PER_SECOND));
|
||||
trainingNegative = trainingNegative.union(randomFuncInteriors);
|
||||
if (trainingNegative.isEmpty()) {
|
||||
Msg.showError(this, null, "Data Gathering Error",
|
||||
"No function interiors in training set");
|
||||
"No non-starts in training set for sampling factor " + factor);
|
||||
return null;
|
||||
}
|
||||
if (trainingPositive.intersects(trainingNegative)) {
|
||||
|
||||
+29
@@ -358,4 +358,33 @@ public class RandomForestTrainingTaskTest extends AbstractProgramBasedTest {
|
||||
assertTrue(data.getTestNegative().contains(definedData));
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testExhaustingFunctionInteriors() throws CancelledException {
|
||||
params = new FunctionStartRFParams(program);
|
||||
params.setMaxStarts(5);
|
||||
int tooBig = 10;
|
||||
Address begin = program.getSymbolTable().getSymbols("entry").next().getAddress();
|
||||
AddressSet entries = new AddressSet();
|
||||
for (int i = 0; i < 10; ++i) {
|
||||
entries.add(begin.add(i));
|
||||
}
|
||||
AddressSet interiors = new AddressSet();
|
||||
for (int i = 10; i < 25; ++i) {
|
||||
interiors.add(begin.add(i));
|
||||
}
|
||||
AddressSet definedData = new AddressSet();
|
||||
for (int i = 25; i < 30; ++i) {
|
||||
definedData.add(begin.add(i));
|
||||
}
|
||||
RandomForestTrainingTask task = new RandomForestTrainingTask(program, params, null,
|
||||
RandomForestFunctionFinderPlugin.TEST_SET_MAX_SIZE_DEFAULT);
|
||||
TrainingAndTestData data =
|
||||
task.getTrainingAndTestData(entries, interiors, definedData, tooBig, TaskMonitor.DUMMY);
|
||||
assertTrue(data.getTrainingPositive().getNumAddresses() == 5);
|
||||
assertTrue(data.getTestPositive().getNumAddresses() == 5);
|
||||
assertTrue(data.getTestPositive().union(data.getTrainingPositive()).equals(entries));
|
||||
assertTrue(data.getTrainingNegative().equals(interiors));
|
||||
assertTrue(data.getTestNegative().equals(definedData));
|
||||
}
|
||||
|
||||
}
|
||||
|
||||
@@ -1,19 +1,19 @@
|
||||
##VERSION: 2.0
|
||||
Module.manifest||GHIDRA||||END|
|
||||
data/languages/80251.cspec||GHIDRA||||END|
|
||||
data/languages/80251.pspec||GHIDRA||reviewed||END|
|
||||
data/languages/80251.pspec||GHIDRA||||END|
|
||||
data/languages/80251.sinc||GHIDRA||||END|
|
||||
data/languages/80251.slaspec||GHIDRA||||END|
|
||||
data/languages/80390.cspec||GHIDRA||||END|
|
||||
data/languages/80390.slaspec||GHIDRA||||END|
|
||||
data/languages/8051.cspec||GHIDRA||||END|
|
||||
data/languages/8051.ldefs||GHIDRA||||END|
|
||||
data/languages/8051.pspec||GHIDRA||reviewed||END|
|
||||
data/languages/8051.pspec||GHIDRA||||END|
|
||||
data/languages/8051.slaspec||GHIDRA||||END|
|
||||
data/languages/8051_archimedes.cspec||GHIDRA||||END|
|
||||
data/languages/8051_main.sinc||GHIDRA||||END|
|
||||
data/languages/mx51.cspec||GHIDRA||||END|
|
||||
data/languages/mx51.pspec||GHIDRA||reviewed||END|
|
||||
data/languages/mx51.pspec||GHIDRA||||END|
|
||||
data/languages/mx51.sinc||GHIDRA||||END|
|
||||
data/languages/mx51.slaspec||GHIDRA||||END|
|
||||
data/languages/old/8051v1.lang||GHIDRA||reviewed||END|
|
||||
|
||||
@@ -6,6 +6,7 @@
|
||||
|
||||
<volatile outputop="write_volatile" inputop="read_volatile">
|
||||
<range space="SFR" first="0x0" last="0x1FF"/>
|
||||
<range space="BITS" first="0x400" last="0x800"/>
|
||||
</volatile>
|
||||
|
||||
<default_symbols>
|
||||
|
||||
@@ -6,6 +6,7 @@
|
||||
|
||||
<volatile outputop="write_volatile" inputop="read_volatile">
|
||||
<range space="SFR" first="0x0" last="0xFF"/>
|
||||
<range space="BITS" first="0x80" last="0xFF"/>
|
||||
</volatile>
|
||||
|
||||
<default_symbols>
|
||||
|
||||
@@ -6,6 +6,7 @@
|
||||
|
||||
<volatile outputop="write_volatile" inputop="read_volatile">
|
||||
<range space="SFR" first="0x0" last="0xFF"/>
|
||||
<range space="BITS" first="0x80" last="0xFF"/>
|
||||
</volatile>
|
||||
|
||||
<default_symbols>
|
||||
@@ -47,10 +48,10 @@
|
||||
<symbol name="BANK3_R7" address="RAM:7f001f"/>
|
||||
|
||||
<symbol name="P0" address="SFR:80"/>
|
||||
<symbol name="SP" address="SFR:81"/>
|
||||
<symbol name="DPL" address="SFR:82"/>
|
||||
<symbol name="DPH" address="SFR:83"/>
|
||||
<symbol name="DPXL" address="SFR:84"/>
|
||||
<symbol name="SP" address="SFR:81"/>
|
||||
<symbol name="DPL" address="SFR:82"/>
|
||||
<symbol name="DPH" address="SFR:83"/>
|
||||
<symbol name="DPXL" address="SFR:84"/>
|
||||
<symbol name="PCON" address="SFR:87"/>
|
||||
<symbol name="TCON" address="SFR:88"/>
|
||||
<symbol name="TMOD" address="SFR:89"/>
|
||||
@@ -274,10 +275,10 @@
|
||||
<symbol name="P0.1" address="BITS:81"/>
|
||||
<symbol name="P0.2" address="BITS:82"/>
|
||||
<symbol name="P0.3" address="BITS:83"/>
|
||||
<symbol name="P0.4" address="BITS:84"/>
|
||||
<symbol name="P0.5" address="BITS:85"/>
|
||||
<symbol name="P0.6" address="BITS:86"/>
|
||||
<symbol name="P0.7" address="BITS:87"/>
|
||||
<symbol name="P0.4" address="BITS:84/>
|
||||
<symbol name="P0.5" address="BITS:85/>
|
||||
<symbol name="P0.6" address="BITS:86/>
|
||||
<symbol name="P0.7" address="BITS:87/>
|
||||
<symbol name="IT0" address="BITS:88"/>
|
||||
<symbol name="IE0" address="BITS:89"/>
|
||||
<symbol name="IT1" address="BITS:8a"/>
|
||||
|
||||
@@ -709,7 +709,10 @@ define token instr (32)
|
||||
op2030=(20,30)
|
||||
op2031=(20,31)
|
||||
sop2031=(20,31) signed
|
||||
op2121=(21,21)
|
||||
op2130=(21,30)
|
||||
op2222=(22,22)
|
||||
op2323=(23,23)
|
||||
op2324=(23,24)
|
||||
op2424=(24,24)
|
||||
op2427=(24,27)
|
||||
@@ -753,8 +756,10 @@ define token cinstr (16)
|
||||
cr0206=(2,6)
|
||||
cfr0206=(2,6)
|
||||
cop0212=(2,12)
|
||||
cop0303=(3,3)
|
||||
cop0304=(3,4)
|
||||
cop0305=(3,5)
|
||||
cop0404=(4,4)
|
||||
cop0406=(4,6)
|
||||
cop0505=(5,5)
|
||||
cop0506=(5,6)
|
||||
@@ -773,6 +778,7 @@ define token cinstr (16)
|
||||
cfr0711=(7,11)
|
||||
cop0712=(7,12)
|
||||
cop0808=(8,8)
|
||||
cop0909=(9,9)
|
||||
cop0910=(9,10)
|
||||
cop0912=(9,12)
|
||||
cop1010=(10,10)
|
||||
|
||||
@@ -123,11 +123,18 @@
|
||||
}
|
||||
|
||||
# jal d,a 0000006f 0000007f JSR (0, 0)
|
||||
# call if RA set, destreg == RA
|
||||
:jal ra,immUJ is immUJ & ra & r0711=1 & op0001=0x3 & op0204=0x3 & op0506=0x3
|
||||
{
|
||||
ra = inst_next;
|
||||
call immUJ;
|
||||
}
|
||||
|
||||
# goto if RA not set, destreg != RA
|
||||
:jal rd,immUJ is immUJ & rd & op0001=0x3 & op0204=0x3 & op0506=0x3
|
||||
{
|
||||
#TODO RAS: push inst_next if rd=x1/x5
|
||||
rd = inst_next;
|
||||
call immUJ;
|
||||
goto immUJ;
|
||||
}
|
||||
|
||||
# j a 0000006f 00000fff BRANCH|ALIAS (0, 0)
|
||||
@@ -136,14 +143,21 @@
|
||||
goto immUJ;
|
||||
}
|
||||
|
||||
|
||||
# jalr d,s,j 00000067 0000707f JSR (0, 0)
|
||||
# call if RA set, destreg == RA
|
||||
:jalr ra,rs1,immI is rs1 & immI & ra & r0711=1 & op0001=0x3 & op0204=0x1 & op0506=0x3 & funct3=0x0
|
||||
{
|
||||
local ea:$(XLEN) = (rs1 + immI) & ~1;
|
||||
ra = inst_next;
|
||||
call [ea];
|
||||
}
|
||||
|
||||
# goto if RA not set, destreg != RA
|
||||
:jalr rd,rs1,immI is rs1 & immI & rd & op0001=0x3 & op0204=0x1 & op0506=0x3 & funct3=0x0
|
||||
{
|
||||
#TODO RAS: push inst_next/pop based on rd=x1/x5 or rs1=x1/x5
|
||||
local ea:$(XLEN) = (rs1 + immI) & ~1;
|
||||
rd = inst_next;
|
||||
call [ea];
|
||||
goto [ea];
|
||||
}
|
||||
|
||||
# jr o(s) 00000067 00007fff BRANCH|ALIAS (0, 0)
|
||||
|
||||
@@ -355,11 +355,13 @@
|
||||
*[ram]:4 ea = crs2:4;
|
||||
}
|
||||
|
||||
# c.unimp 00000000 0000ffff SIMPLE (0, 0)
|
||||
:c.unimp is cop0001=0x0 & cop1315=0x0 & cop0212=0x0
|
||||
{
|
||||
trap();
|
||||
}
|
||||
# c.unimp 00000000 0000ffff SIMPLE (0, 0)
|
||||
# would be better not to decode as it is used as padding
|
||||
#
|
||||
# :c.unimp is cop0001=0x0 & cop1315=0x0 & cop0212=0x0
|
||||
#{
|
||||
# trap();
|
||||
#}
|
||||
|
||||
# c.xor Cs,Ct 00008c21 0000fc63 SIMPLE (0, 0)
|
||||
:c.xor cr0709s,cr0204s is cr0204s & cr0709s & cop0001=0x1 & cop1315=0x4 & cop0506=0x1 & cop1012=0x3
|
||||
|
||||
@@ -203,21 +203,25 @@ cbimm: reloc is scop1212 & cop1011 & cop0506 & cop0304 & cop0202 [ reloc = inst_
|
||||
# used for goto
|
||||
cjimm: reloc is scop1212 & cop1111 & cop0910 & cop0808 & cop0707 & cop0606 & cop0305 & cop0202 [ reloc = inst_start + ((scop1212 << 11) | (cop1111 << 4) | (cop0910 << 8) | (cop0808 << 10) | (cop0707 << 6) | (cop0606 << 7) | (cop0305 << 1) | (cop0202 << 5)); ] { export *[ram]:$(XLEN) reloc; }
|
||||
|
||||
|
||||
nzuimm5: is cop0606=1 | cop0505=1 | cop0404=1 | cop0303 = 1 | cop0202=1 {}
|
||||
nzuimm6: is cop1212=1 | cop0606=1 | cop0505=1 | cop0404=1 | cop0303 = 1 | cop0202=1 {}
|
||||
|
||||
@if ADDRSIZE == "32"
|
||||
#TODO nonzero, would like to have cop0205>0
|
||||
c6imm: uimm is cop1212=0 & cop0206 [ uimm = (cop0206 + 0); ] { local tmp:$(XLEN) = uimm; export tmp; }
|
||||
c6imm: uimm is cop1212=0 & cop0206 & nzuimm5 [ uimm = (cop0206 + 0); ] { local tmp:$(XLEN) = uimm; export tmp; }
|
||||
@elif ADDRSIZE == "64"
|
||||
#TODO nonzero, would like to have cop0205>0 | cop0206>0
|
||||
c6imm: uimm is cop1212 & cop0206 [ uimm = (cop1212 << 5) | (cop0206); ] { local tmp:$(XLEN) = uimm; export tmp; }
|
||||
c6imm: uimm is cop1212 & cop0206 & nzuimm6 [ uimm = (cop1212 << 5) | (cop0206); ] { local tmp:$(XLEN) = uimm; export tmp; }
|
||||
@elif ADDRSIZE == "128"
|
||||
c6imm: uimm is cop1212 & cop0206 [ uimm = (cop1212 << 5) | (cop0206); ] { local tmp:$(XLEN) = uimm + (64 * (uimm == 0)); export tmp; }
|
||||
@endif
|
||||
|
||||
cbigimm: uimm is cop1212 & scop1212 & cop0206 [ uimm = (cop1212 << 5) | (cop0206); ] { local tmp:$(XLEN) = (scop1212 << 17) | (cop0206 << 12); export tmp; }
|
||||
cbigimm: uimm is cop1212 & scop1212 & cop0206 & nzuimm6 [ uimm = (cop1212 << 5) | (cop0206); ] { local tmp:$(XLEN) = (scop1212 << 17) | (cop0206 << 12); export tmp; }
|
||||
|
||||
caddi4spnimm: uimm is cop1112 & cop0710 & cop0606 & cop0505 [ uimm = (cop0710 << 6) | (cop1112 << 4) | (cop0505 << 3) | (cop0606 << 2); ] { local tmp:$(XLEN) = uimm; export tmp; }
|
||||
nzcaddi4: is cop1212=1 | cop1111=1 | cop1010=1 | cop0909=1 | cop0808=1 | cop0707=1 | cop0606=1 | cop0505=1 {}
|
||||
|
||||
caddi16spimm: imm is scop1212 & cop0606 & cop0505 & cop0304 & cop0202 [ imm = (scop1212 << 9) | (cop0304 << 7) | (cop0505 << 6) | (cop0202 << 5) | (cop0606 << 4); ] { local tmp:$(XLEN) = imm; export tmp; }
|
||||
caddi4spnimm: uimm is nzcaddi4 & cop1112 & cop0710 & cop0606 & cop0505 [ uimm = (cop0710 << 6) | (cop1112 << 4) | (cop0505 << 3) | (cop0606 << 2); ] { local tmp:$(XLEN) = uimm; export tmp; }
|
||||
|
||||
caddi16spimm: imm is scop1212 & cop0606 & cop0505 & cop0304 & cop0202 & nzuimm6 [ imm = (scop1212 << 9) | (cop0304 << 7) | (cop0505 << 6) | (cop0202 << 5) | (cop0606 << 4); ] { local tmp:$(XLEN) = imm; export tmp; }
|
||||
|
||||
|
||||
clwimm: uimm is cop1012 & cop0606 & cop0505 [ uimm = (cop1012 << 3) | (cop0606 << 2) | (cop0505 << 6); ] { local tmp:$(XLEN) = uimm; export tmp; }
|
||||
|
||||
@@ -69,20 +69,20 @@
|
||||
</output>
|
||||
<unaffected>
|
||||
<register name="sp"/>
|
||||
<register name="gp"/>
|
||||
<register name="tp"/>
|
||||
<register name="gp"/>
|
||||
<register name="tp"/>
|
||||
<register name="s0"/>
|
||||
<register name="s1"/>
|
||||
<register name="s2"/>
|
||||
<register name="s3"/>
|
||||
<register name="s4"/>
|
||||
<register name="s5"/>
|
||||
<register name="s6"/>
|
||||
<register name="s7"/>
|
||||
<register name="s8"/>
|
||||
<register name="s9"/>
|
||||
<register name="s10"/>
|
||||
<register name="s11"/>
|
||||
<register name="s1"/>
|
||||
<register name="s2"/>
|
||||
<register name="s3"/>
|
||||
<register name="s4"/>
|
||||
<register name="s5"/>
|
||||
<register name="s6"/>
|
||||
<register name="s7"/>
|
||||
<register name="s8"/>
|
||||
<register name="s9"/>
|
||||
<register name="s10"/>
|
||||
<register name="s11"/>
|
||||
</unaffected>
|
||||
</prototype>
|
||||
</default_proto>
|
||||
|
||||
@@ -69,20 +69,20 @@
|
||||
</output>
|
||||
<unaffected>
|
||||
<register name="sp"/>
|
||||
<register name="gp"/>
|
||||
<register name="tp"/>
|
||||
<register name="gp"/>
|
||||
<register name="tp"/>
|
||||
<register name="s0"/>
|
||||
<register name="s1"/>
|
||||
<register name="s2"/>
|
||||
<register name="s3"/>
|
||||
<register name="s4"/>
|
||||
<register name="s5"/>
|
||||
<register name="s6"/>
|
||||
<register name="s7"/>
|
||||
<register name="s8"/>
|
||||
<register name="s9"/>
|
||||
<register name="s10"/>
|
||||
<register name="s11"/>
|
||||
<register name="s1"/>
|
||||
<register name="s2"/>
|
||||
<register name="s3"/>
|
||||
<register name="s4"/>
|
||||
<register name="s5"/>
|
||||
<register name="s6"/>
|
||||
<register name="s7"/>
|
||||
<register name="s8"/>
|
||||
<register name="s9"/>
|
||||
<register name="s10"/>
|
||||
<register name="s11"/>
|
||||
</unaffected>
|
||||
</prototype>
|
||||
</default_proto>
|
||||
|
||||
@@ -1,52 +1,45 @@
|
||||
<patternlist>
|
||||
<patternpairs totalbits="32" postbits="0">
|
||||
|
||||
<patternpairs totalbits="27" postbits="11">
|
||||
<!-- Higher confidence patterns, after a return and more defined bits -->
|
||||
<prepatterns>
|
||||
<!-- 76543210 54321098 32109876 10987654 -->
|
||||
<data>10000010 10000000</data> <!-- ret -->
|
||||
<data>......01 101.....</data> <!-- c.j imm -->
|
||||
<data>10000010 10000000</data> <!-- ret -->
|
||||
<data>10000010 10000000 00000000 00000000 </data> <!-- ret; padding -->
|
||||
</prepatterns>
|
||||
<postpatterns>
|
||||
<!-- 76543210 54321098 32109876 10987654 -->
|
||||
<data>0.....01 01110001</data> <!-- c.addi16sp sp,-imm -->
|
||||
<data>0.....01 00010001</data> <!-- c.addi sp,-imm -->
|
||||
<funcstart/>
|
||||
</postpatterns>
|
||||
</patternpairs>
|
||||
<patternpairs totalbits="48" postbits="0">
|
||||
<prepatterns>
|
||||
<!-- 76543210 54321098 32109876 10987654 -->
|
||||
<data>10000010 10000000</data> <!-- ret -->
|
||||
<data>......01 101.....</data> <!-- c.j imm -->
|
||||
</prepatterns>
|
||||
<postpatterns>
|
||||
<!-- 76543210 54321098 32109876 10987654 -->
|
||||
<data>0.....01 01110001</data> <!-- c.addi16sp sp,-imm -->
|
||||
<data>0.....01 00010001</data> <!-- c.addi sp,-imm -->
|
||||
<data>00010011 00000001 ....0001 1.......</data> <!-- addi sp,sp,-imm -->
|
||||
<data>.0010111 ........ ........ ........</data> <!-- auipc rd,imm-->
|
||||
<funcstart/>
|
||||
</postpatterns>
|
||||
</patternpairs>
|
||||
<patternpairs totalbits="48" postbits="0">
|
||||
|
||||
<patternpairs totalbits="16" postbits="11">
|
||||
<!-- Medium confidence, more bits, but prepattern are jumps, not return -->
|
||||
<prepatterns>
|
||||
<!-- 76543210 54321098 32109876 10987654 -->
|
||||
<data>01101111 ....0000 ........ ........</data> <!-- j imm -->
|
||||
<data>01101111 ....0000 ........ ........</data> <!-- j imm -->
|
||||
<data>......01 101..... </data> <!-- c.j imm -->
|
||||
<data>......01 101..... 00000000 00000000 </data> <!-- c.j imm; padding -->
|
||||
</prepatterns>
|
||||
<postpatterns>
|
||||
<!-- 76543210 54321098 32109876 10987654 -->
|
||||
<data>0.....01 01110001</data> <!-- c.addi16sp sp,-imm -->
|
||||
<data>0.....01 00010001</data> <!-- c.addi sp,-imm -->
|
||||
<funcstart/>
|
||||
</postpatterns>
|
||||
</patternpairs>
|
||||
<patternpairs totalbits="64" postbits="0">
|
||||
<prepatterns>
|
||||
<!-- 76543210 54321098 32109876 10987654 -->
|
||||
<data>01101111 ....0000 ........ ........</data> <!-- j imm -->
|
||||
</prepatterns>
|
||||
<postpatterns>
|
||||
<!-- 76543210 54321098 32109876 10987654 -->
|
||||
<data>0.....01 01110001</data> <!-- c.addi16sp sp,-imm -->
|
||||
<data>0.....01 00010001</data> <!-- c.addi sp,-imm -->
|
||||
<data>00010011 00000001 ....0001 1.......</data> <!-- addi sp,sp,-imm -->
|
||||
<data>.0010111 ........ ........ ........</data> <!-- auipc rd,imm-->
|
||||
<funcstart/>
|
||||
<possiblefuncstart/>
|
||||
</postpatterns>
|
||||
</patternpairs>
|
||||
</patternlist>
|
||||
|
||||
<patternpairs totalbits="20" postbits="7">
|
||||
<!-- Lower confidence, too few bits on start pattern -->
|
||||
<prepatterns>
|
||||
<data>10000010 10000000</data> <!-- ret -->
|
||||
<data>10000010 10000000 00000000 00000000 </data> <!-- ret; padding -->
|
||||
<data>......01 101..... 00000000 00000000 </data> <!-- c.j imm; padding -->
|
||||
<data>01101111 ....0000 ........ ........</data> <!-- j imm -->
|
||||
</prepatterns>
|
||||
<postpatterns>
|
||||
<data>.0010111 ........ ........ ........</data> <!-- auipc rd,imm-->
|
||||
<possiblefuncstart/>
|
||||
</postpatterns>
|
||||
</patternpairs>
|
||||
</patternlist>
|
||||
Reference in New Issue
Block a user