mupen64plus-core/tools/r4300prof.c
2021-06-16 07:35:12 -06:00

521 lines
17 KiB
C

/* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * *
* Mupen64plus - r4300prof.c *
* Mupen64Plus homepage: https://mupen64plus.org/ *
* Copyright (C) 2008 Richard Goedeken *
* *
* This program is free software; you can redistribute it and/or modify *
* it under the terms of the GNU General Public License as published by *
* the Free Software Foundation; either version 2 of the License, or *
* (at your option) any later version. *
* *
* This program is distributed in the hope that it will be useful, *
* but WITHOUT ANY WARRANTY; without even the implied warranty of *
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the *
* GNU General Public License for more details. *
* *
* You should have received a copy of the GNU General Public License *
* along with this program; if not, write to the *
* Free Software Foundation, Inc., *
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. *
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
/* Global data */
unsigned int instr_samples[132];
char instr_name[][10] =
{
"reserved", "NI", "J", "JAL", "BEQ", "BNE", "BLEZ", "BGTZ",
"ADDI", "ADDIU", "SLTI", "SLTIU", "ANDI", "ORI", "XORI", "LUI",
"BEQL", "BNEL", "BLEZL", "BGTZL", "DADDI", "DADDIU", "LDL", "LDR",
"LB", "LH", "LW", "LWL", "LBU", "LHU", "LWU", "LWR",
"SB", "SH", "SW", "SWL", "SWR", "SDL", "SDR", "LWC1",
"LDC1", "LD", "LL", "SWC1", "SDC1", "SD", "SC", "BLTZ",
"BGEZ", "BLTZL", "BGEZL", "BLTZAL", "BGEZAL", "BLTZALL", "BGEZALL", "SLL",
"SRL", "SRA", "SLLV", "SRLV", "SRAV", "JR", "JALR", "SYSCALL",
"MFHI", "MTHI", "MFLO", "MTLO", "DSLLV", "DSRLV", "DSRAV", "MULT",
"MULTU", "DIV", "DIVU", "DMULT", "DMULTU", "DDIV", "DDIVU", "ADD",
"ADDU", "SUB", "SUBU", "AND", "OR", "XOR", "NOR", "SLT",
"SLTU", "DADD", "DADDU", "DSUB", "DSUBU", "DSLL", "DSRL", "DSRA",
"TEQ", "DSLL32", "DSRL32", "DSRA32", "BC1F", "BC1T", "BC1FL", "BC1TL",
"TLBWI", "TLBP", "TLBR", "TLBWR", "ERET", "MFC0", "MTC0", "MFC1",
"DMFC1", "CFC1", "MTC1", "DMTC1", "CTC1", "f.CVT", "f.CMP", "f.ADD",
"f.SUB", "f.MUL", "f.DIV", "f.SQRT", "f.ABS", "f.MOV", "f.NEG", "f.ROUND",
"f.TRUNC", "f.CEIL", "f.FLOOR"
};
unsigned int instr_type[131] = { 9, 10, 6, 6, 7, 7, 7, 7, 3, 3, 4, 4, 3, 4, 4, 0,
7, 7, 7, 7, 4, 4, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 7,
7, 7, 7, 7, 7, 7, 7, 3, 3, 3, 3, 3, 3, 6, 6, 10,
2, 2, 2, 2, 4, 4, 4, 3, 3, 3, 3, 4, 4, 4, 4, 3,
3, 3, 3, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
8, 4, 4, 4, 7, 7, 7, 7, 10, 10, 10, 10, 8, 2, 2, 2,
2, 2, 2, 2, 2, 2, 5, 5, 5, 5, 5, 5, 5, 2, 5, 5,
5, 5, 5 };
char instr_typename[][20] = { "Load", "Store", "Data move/convert", "32-bit math", "64-bit math", "Float Math",
"Jump", "Branch", "Exceptions", "Reserved", "Other" };
/* Global functions */
int GetInstrType(int opcode);
int AddrCompare(const void *, const void *);
int ParseProfLine(const char *pchIn, long *plAddress, int *piSamples, float *pfPercentage);
/* defined types */
typedef struct __attribute__ ((__packed__))
{
int mipsop;
long x86addr;
} r4300op;
typedef struct
{
long x86addr;
int samples;
} profilehit;
/* static functions */
static int isSpace(char ch)
{
return (ch == ' ' || ch == '\t' ? 1 : 0);
}
static int isNum(char ch)
{
return (ch >= '0' && ch <= '9' ? 1 : 0);
}
static int isFloat(char ch)
{
return ((ch >= '0' && ch <= '9') || ch == '.' || ch == '+' || ch == '-' || ch == 'e' ? 1 : 0);
}
static int isHex(char ch)
{
return ((ch >= '0' && ch <= '9') || ((ch & 0xdf) >= 'A' && (ch & 0xdf) <= 'F') ? 1 : 0);
}
/* main */
int main(int argc, void *argv[])
{
long lOpStart, lOpEnd;
int flength, oplistlength, totaltime, proflistlength;
int samp_unknown, samp_blockend, samp_notcompiled, samp_wrappers, samp_flush;
int i, j;
FILE *pfIn;
r4300op *pOpAddrTable;
profilehit *pProfTable;
char *pch, *pchSampleData;
/* check arguments */
if (argc < 3)
{
printf("Usage: r4300prof r4300addr.dat x86profile.txt\n\n");
printf("r4300addr.dat - binary table of r4300 opcodes and corresponding x86 starting addresses\n");
printf("x86profile.txt - text file containing a list of profile sample counts by x86 address on the heap\n\n");
return 1;
}
/* open r4300 opcode/x86 address table generated from emulator run */
printf("Loading %s...\n", argv[1]);
pfIn = osal_file_open(argv[1], "rb");
if (pfIn == NULL)
{
printf("Couldn't open input file: %s\n", argv[1]);
return 2;
}
/* get file length and calculate number of r4300op table entries */
fseek(pfIn, 0L, SEEK_END);
flength = (int) ftell(pfIn);
fseek(pfIn, 0L, SEEK_SET);
oplistlength = flength / sizeof(r4300op);
/* read the file */
pOpAddrTable = (r4300op *) malloc(flength);
if (pOpAddrTable == NULL)
{
printf("Failed to allocate %i bytes for OpAddrTable!\n", flength);
fclose(pfIn);
return 3;
}
fread(pOpAddrTable, 1, flength, pfIn);
fclose(pfIn);
printf("%i r4300 instruction locations read.\n", oplistlength);
/* sort the opcode/address table according to x86addr */
qsort(pOpAddrTable, oplistlength, sizeof(r4300op), AddrCompare);
/* remove any 0-length r4300 instructions */
i = 0;
j = 0;
while (i < oplistlength)
{
pOpAddrTable[j].mipsop = pOpAddrTable[i].mipsop;
pOpAddrTable[j].x86addr = pOpAddrTable[i].x86addr;
i++;
if (pOpAddrTable[j].x86addr != pOpAddrTable[i].x86addr)
j++;
}
oplistlength = j;
printf("%i non-empty MIPS instructions.\n", oplistlength);
/* convert each r4300 opcode to an instruction type index */
for (i = 0; i < oplistlength; i++)
if (pOpAddrTable[i].mipsop > 0 || pOpAddrTable[i].mipsop < -16)
pOpAddrTable[i].mipsop = GetInstrType(pOpAddrTable[i].mipsop);
/* open the profiling sample data file */
printf("Loading %s...\n", argv[2]);
pfIn = osal_file_open(argv[2], "rb");
if (pfIn == NULL)
{
printf("Couldn't open input file: %s\n", argv[2]);
free(pOpAddrTable);
return 4;
}
/* load it */
fseek(pfIn, 0L, SEEK_END);
flength = (int) ftell(pfIn);
fseek(pfIn, 0L, SEEK_SET);
pchSampleData = (char *) malloc(flength + 16);
if (pchSampleData == NULL)
{
printf("Failed to allocate %i bytes for pchSampleData!\n", flength + 16);
fclose(pfIn);
free(pOpAddrTable);
return 5;
}
fread(pchSampleData, 1, flength, pfIn);
pchSampleData[flength] = 0;
fclose(pfIn);
/* count the number of newlines in the ascii-formatted sample data file */
proflistlength = 1;
pch = pchSampleData;
while (pch = strchr(pch, '\n'))
{
proflistlength++;
pch++;
}
printf("%i lines in sample data file.\n", proflistlength);
/* extract text data into binary table */
pProfTable = (profilehit *) malloc(proflistlength * sizeof(profilehit));
if (pProfTable == NULL)
{
printf("Failed to allocate %i bytes for pProfTable!\n", proflistlength * sizeof(profilehit));
free(pOpAddrTable);
free(pchSampleData);
return 6;
}
pch = pchSampleData;
j = 0;
long long llOffset = 0;
while (j < proflistlength)
{
long lAddress;
int iSamples;
float fPercentage;
char *pchNext = strchr(pch, '\n');
if (pchNext != NULL) *pchNext++ = 0; // null-terminate this line
if (strstr(pch, "range:0x") != NULL) // search for offset change
{
pch = strstr(pch, "range:0x") + 8; // extract hex value and update our offset
char *pch2 = pch;
while (isHex(*pch2)) pch2++;
*pch2 = 0;
llOffset = strtoll(pch, NULL, 16);
}
else // parse line for sample point
{
int rval = ParseProfLine(pch, &lAddress, &iSamples, &fPercentage);
if (rval != 0)
{
pProfTable[j].x86addr = (unsigned long) (lAddress + llOffset);
pProfTable[j].samples = iSamples;
j++;
}
}
pch = pchNext;
if (pch == NULL) break;
}
free(pchSampleData);
proflistlength = j;
printf("Found %i profile hits.\n", proflistlength);
/* clear r4300 instruction sample data table */
for (i = 0; i < 132; i++)
instr_samples[i] = 0;
/* calculate r4300 instruction profiling data by merging the tables */
samp_unknown = 0;
samp_blockend = 0;
samp_notcompiled = 0;
samp_wrappers = 0;
samp_flush = 0;
i = 0; // i == OpAddrTable index
lOpStart = pOpAddrTable[0].x86addr;
lOpEnd = pOpAddrTable[1].x86addr;
for (j = 0; j < proflistlength; j++) // j == pProfTable index
{
long lOpx86addr = pProfTable[j].x86addr;
if (lOpx86addr >= lOpStart && lOpx86addr <= lOpEnd) /* these profile samples lie within current r4300 instruction */
{
int instr = pOpAddrTable[i].mipsop;
if (instr == -1) printf("%lx sample point lies between %i/%lx and %i/%lx\n", lOpx86addr, instr, lOpStart, pOpAddrTable[i+1].mipsop, lOpEnd);
if (instr == -1)
samp_unknown += pProfTable[j].samples;
else if (instr == -2)
samp_notcompiled += pProfTable[j].samples;
else if (instr == -3)
samp_blockend += pProfTable[j].samples;
else if (instr == -4)
samp_wrappers += pProfTable[j].samples;
else if (instr == -5)
samp_flush += pProfTable[j].samples;
else
instr_samples[instr] += pProfTable[j].samples;
continue;
}
if (lOpx86addr < pOpAddrTable[0].x86addr || lOpx86addr >= pOpAddrTable[oplistlength-1].x86addr)
{ /* outside the range of all recompiled instructions */
samp_unknown += pProfTable[j].samples;
continue;
}
if (lOpx86addr < lOpStart) /* discontinuity in profile list, go back to start */
{
i = 0;
lOpStart = pOpAddrTable[0].x86addr;
lOpEnd = pOpAddrTable[1].x86addr;
j--;
continue;
}
/* this profile point is ahead of current r4300 instruction */
do /* race ahead in r4300 opcode list until we hit this profile sample point */
{
i++;
} while (i+1 < oplistlength && lOpx86addr > pOpAddrTable[i+1].x86addr);
lOpStart = pOpAddrTable[i].x86addr;
lOpEnd = pOpAddrTable[i+1].x86addr;
if (lOpx86addr < lOpStart || lOpx86addr > lOpEnd)
{
printf("Error: lOpx86addr = %lx but lOpStart, lOpEnd = %lx, %lx\n", lOpx86addr, lOpStart, lOpEnd);
return 7;
}
/* we have found the correct r4300 instruction corresponding to this profile point */
j--;
}
/* print the results */
unsigned int iTypeCount[11] = {0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0};
printf("\nInstruction time (samples):\n");
totaltime = 0;
for (i = 0; i < 131; i++)
{
printf("%8s: %08i ", instr_name[i], instr_samples[i]);
if (i % 5 == 4) printf("\n");
iTypeCount[instr_type[i]] += instr_samples[i];
totaltime += instr_samples[i];
}
int special = samp_flush + samp_wrappers + samp_notcompiled + samp_blockend;
printf("\n\nSpecial code samples:\n");
printf(" Regcache flushing: %i\n", samp_flush);
printf(" Jump wrappers: %i\n", samp_wrappers);
printf(" NOTCOMPILED: %i\n", samp_notcompiled);
printf(" block postfix & link samples: %i\n", samp_blockend);
printf("\nUnaccounted samples: %i\n", samp_unknown);
printf("Total accounted instruction samples: %i\n", totaltime + special);
for (i = 0; i < 11; i++)
{
printf("%20s: %04.1f%% (%i)\n", instr_typename[i], (float) iTypeCount[i] * 100.0 / totaltime, iTypeCount[i]);
}
free(pOpAddrTable);
free(pProfTable);
return 0;
}
int AddrCompare(const void *p1, const void *p2)
{
const r4300op *pOp1 = (const r4300op *) p1;
const r4300op *pOp2 = (const r4300op *) p2;
if (pOp1->x86addr < pOp2->x86addr)
return -1;
else if (pOp1->x86addr == pOp2->x86addr)
return (int) (pOp1 - pOp2); /* this forces qsort to be stable */
else
return 1;
}
int ParseProfLine(const char *pchIn, long *plAddress, int *piSamples, float *pfPercentage)
{
char chVal[128], *pchOut;
/* skip any initial whitespace */
while (isSpace(*pchIn)) pchIn++;
if (!isHex(*pchIn)) return 0;
/* parse hexadecimal address value */
pchOut = chVal;
while (isHex(*pchIn)) *pchOut++ = *pchIn++;
*pchOut = 0;
if (!isSpace(*pchIn)) return 0;
*plAddress = strtol(chVal, NULL, 16);
/* skip more whitespace */
while (isSpace(*pchIn)) pchIn++;
if (!isNum(*pchIn)) return 0;
/* parse decimal sample count value */
pchOut = chVal;
while (isNum(*pchIn)) *pchOut++ = *pchIn++;
*pchOut = 0;
if (!isSpace(*pchIn)) return 0;
*piSamples = atoi(chVal);
/* skip more whitespace */
while (isSpace(*pchIn)) pchIn++;
if (!isFloat(*pchIn)) return 0;
/* parse floating-point percentage value */
pchOut = chVal;
while (isFloat(*pchIn)) *pchOut++ = *pchIn++;
*pchOut = 0;
if (!isSpace(*pchIn) && *pchIn != '\r' && *pchIn != '\n' && *pchIn != 0) return 0;
*pfPercentage = atof(chVal);
/* if this isn't the end of the line, it's not a valid sample point */
while (isSpace(*pchIn)) pchIn++;
if (*pchIn != '\r' && *pchIn != '\n' && *pchIn != 0) return 0;
return 1;
}
static int InstrTypeStd[64] =
{
-1, -1, 02, 03, 04, 05, 06, 07, 8, 9, 10, 11, 12, 13, 14, 15,
-1, -1, 00, 00, 16, 17, 18, 19, 20, 21, 22, 23, 00, 00, 00, 00,
24, 25, 27, 26, 28, 29, 31, 30, 32, 33, 35, 34, 37, 38, 36, 01,
42, 39, 00, 00, 01, 40, 00, 41, 46, 43, 00, 00, 01, 44, 00, 45
};
static int InstrTypeSpecial[64] =
{
55, 00, 56, 57, 58, 00, 59, 60,
61, 62, 00, 00, 63, 01, 00, 00,
64, 65, 66, 67, 68, 00, 69, 70,
71, 72, 73, 74, 75, 76, 77, 78,
79, 80, 81, 82, 83, 84, 85, 86,
00, 00, 87, 88, 89, 90, 91, 92,
01, 01, 01, 01, 96, 00, 01, 00,
93, 00, 94, 95, 97, 00, 98, 99
};
static int InstrTypeRegImm[32] =
{
47, 48, 49, 50, 00, 00, 00, 00, 01, 01, 01, 01, 01, 00, 01, 00,
51, 52, 53, 54, 00, 00, 00, 00, 00, 00, 00, 00, 00, 00, 00, 00
};
static int InstrTypeCop1[32] =
{
111, 112, 113, 00, 114, 115, 116, 00,
-1, 00, 00, 00, 00, 00, 00, 00,
-1, -1, 00, 00, -1, -1, 00, 00,
00, 00, 00, 00, 00, 00, 00, 00
};
static int InstrTypeCop1Math[64] =
{
119, 120, 121, 122, 123, 124, 125, 126,
127, 128, 129, 130, 127, 128, 129, 130,
00, 00, 00, 00, 00, 00, 00, 00,
00, 00, 00, 00, 00, 00, 00, 00,
117, 117, 00, 00, 117, 117, 00, 00,
00, 00, 00, 00, 00, 00, 00, 00,
118, 118, 118, 118, 118, 118, 118, 118,
118, 118, 118, 118, 118, 118, 118, 118
};
int GetInstrType(int opcode)
{
int iType = (opcode >> 26) & 63;
if (iType == 0)
{
/* SPECIAL instruction */
iType = opcode & 63;
return InstrTypeSpecial[iType];
}
else if (iType == 1)
{
/* REGIMM instruction */
iType = (opcode >> 16) & 31;
return InstrTypeRegImm[iType];
}
else if (iType == 16)
{
/* COP0 instruction */
int iType1 = opcode & 0x01FFFFFF;
int iType2 = (opcode >> 21) & 31;
if (iType1 == 1)
return 106; // TLBR
else if (iType1 == 2)
return 104; // TLBWI
else if (iType1 == 6)
return 107; // TLBWR
else if (iType1 == 8)
return 105; // TLBP
else if (iType1 == 24)
return 108; // ERET
else if ((opcode & 0x7FF) == 0 && iType2 == 0)
return 109; // MFC0
else if ((opcode & 0x7FF) == 0 && iType2 == 4)
return 110; // MTC0
else
return 0; // reserved
}
else if (iType == 17)
{
/* COP1 instruction */
int iType1 = (opcode >> 21) & 31;
if (iType1 == 8)
{
/* conditional branch */
int iType2 = (opcode >> 16) & 31;
if (iType2 == 0)
return 100; // BC1F
else if (iType2 == 1)
return 101; // BC1T
else if (iType2 == 2)
return 102; // BC1FL
else if (iType2 == 3)
return 103; // BC1TL
else
return 0; // reserved
}
else if (iType1 == 16 || iType1 == 17 || iType1 == 20 || iType1 == 21)
{
/* Single, Double, Word, Long instructions */
int iType2 = opcode & 63;
return InstrTypeCop1Math[iType2];
}
else
{
/* other Cop1 (move) */
return InstrTypeCop1[iType1];
}
}
/* standard MIPS instruction */
return InstrTypeStd[iType];
}