// Pyarmor-Static-Unpack-1shot/pycdas.cpp (C++, 357 lines, 14 KiB)

#include <cstdarg>
#include <cstdio>
#include <cstring>
#include <exception>
#include <fstream>
#include <iostream>
#include <string>

#include "pyc_module.h"
#include "pyc_numeric.h"
#include "bytecode.h"

// Directory separator of the host platform; main() uses it to strip the
// directory part of the input path before printing the display name.
// `_WIN32` is the macro Windows compilers predefine; `WIN32` is still honoured
// for build systems that define it explicitly.
#if defined(WIN32) || defined(_WIN32)
#  define PATHSEP '\\'
#else
#  define PATHSEP '/'
#endif
// Display names for the code-object flag bits, indexed by bit position
// (entry k names the bit with value 1 << k). Bits without a name in this
// table are shown as their hexadecimal value in angle brackets.
static const char* const flag_names[] = {
    "CO_OPTIMIZED", "CO_NEWLOCALS", "CO_VARARGS", "CO_VARKEYWORDS",
    "CO_NESTED", "CO_GENERATOR", "CO_NOFREE", "CO_COROUTINE",
    "CO_ITERABLE_COROUTINE", "<0x200>", "<0x400>", "<0x800>",
    "CO_GENERATOR_ALLOWED", "CO_FUTURE_DIVISION",
    "CO_FUTURE_ABSOLUTE_IMPORT", "CO_FUTURE_WITH_STATEMENT",
    "CO_FUTURE_PRINT_FUNCTION", "CO_FUTURE_UNICODE_LITERALS",
    "CO_FUTURE_BARRY_AS_BDFL", "CO_FUTURE_GENERATOR_STOP",
    "<0x100000>", "<0x200000>", "<0x400000>", "<0x800000>",
    "<0x1000000>", "<0x2000000>", "<0x4000000>", "<0x8000000>",
    "<0x10000000>", "<0x20000000>", "<0x40000000>", "<0x80000000>"
};

// print_coflags() indexes this table with every bit position 0..31.
static_assert(sizeof(flag_names) / sizeof(flag_names[0]) == 32,
              "flag_names must provide one entry per bit of a 32-bit flag word");

static void print_coflags(unsigned long flags, std::ostream& pyc_output)
{
if (flags == 0) {
2023-06-02 00:36:58 +02:00
pyc_output << "\n";
return;
}
2023-06-02 00:36:58 +02:00
pyc_output << " (";
unsigned long f = 1;
int k = 0;
while (k < 32) {
if ((flags & f) != 0) {
flags &= ~f;
if (flags == 0)
2023-06-02 00:36:58 +02:00
pyc_output << flag_names[k];
else
2023-06-02 00:36:58 +02:00
pyc_output << flag_names[k] << " | ";
}
++k;
f <<= 1;
}
2023-06-02 00:36:58 +02:00
pyc_output << ")\n";
}
2023-06-02 00:36:58 +02:00
/**
 * Write `text` to `pyc_output`, preceded by one indentation unit per level.
 *
 * @param pyc_output Stream that receives the text.
 * @param indent     Number of indentation units to emit first; values <= 0
 *                   emit none.
 * @param text       NUL-terminated string written verbatim (no newline added).
 */
static void iputs(std::ostream& pyc_output, int indent, const char* text)
{
    for (int level = 0; level < indent; ++level)
        pyc_output << " ";
    pyc_output << text;
}

static void ivprintf(std::ostream& pyc_output, int indent, const char* fmt, va_list varargs)
2009-07-24 08:35:21 +00:00
{
for (int i=0; i<indent; i++)
2023-06-02 00:36:58 +02:00
pyc_output << " ";
formatted_print(pyc_output, fmt, varargs);
2009-07-24 08:35:21 +00:00
}
2023-06-02 00:36:58 +02:00
static void iprintf(std::ostream& pyc_output, int indent, const char* fmt, ...)
2009-07-24 08:35:21 +00:00
{
va_list varargs;
va_start(varargs, fmt);
2023-06-02 00:36:58 +02:00
ivprintf(pyc_output, indent, fmt, varargs);
2009-07-24 08:35:21 +00:00
va_end(varargs);
}
void output_object(PycRef<PycObject> obj, PycModule* mod, int indent,
2023-06-02 00:36:58 +02:00
unsigned flags, std::ostream& pyc_output)
2009-07-24 08:35:21 +00:00
{
if (obj == NULL) {
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent, "<NULL>");
return;
}
2009-07-24 08:35:21 +00:00
switch (obj->type()) {
case PycObject::TYPE_CODE:
2009-07-25 00:43:46 +00:00
case PycObject::TYPE_CODE2:
2009-07-24 08:35:21 +00:00
{
PycRef<PycCode> codeObj = obj.cast<PycCode>();
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent, "[Code]\n");
iprintf(pyc_output, indent + 1, "File Name: %s\n", codeObj->fileName()->value());
iprintf(pyc_output, indent + 1, "Object Name: %s\n", codeObj->name()->value());
if (mod->verCompare(3, 11) >= 0)
2023-06-02 00:36:58 +02:00
iprintf(pyc_output, indent + 1, "Qualified Name: %s\n", codeObj->qualName()->value());
iprintf(pyc_output, indent + 1, "Arg Count: %d\n", codeObj->argCount());
if (mod->verCompare(3, 8) >= 0)
2023-06-02 00:36:58 +02:00
iprintf(pyc_output, indent + 1, "Pos Only Arg Count: %d\n", codeObj->posOnlyArgCount());
if (mod->majorVer() >= 3)
2023-06-02 00:36:58 +02:00
iprintf(pyc_output, indent + 1, "KW Only Arg Count: %d\n", codeObj->kwOnlyArgCount());
if (mod->verCompare(3, 11) < 0)
2023-06-02 00:36:58 +02:00
iprintf(pyc_output, indent + 1, "Locals: %d\n", codeObj->numLocals());
if (mod->verCompare(1, 5) >= 0)
2023-06-02 00:36:58 +02:00
iprintf(pyc_output, indent + 1, "Stack Size: %d\n", codeObj->stackSize());
if (mod->verCompare(1, 3) >= 0) {
2023-06-02 00:36:58 +02:00
iprintf(pyc_output, indent + 1, "Flags: 0x%08X", codeObj->flags());
print_coflags(codeObj->flags(), pyc_output);
2009-07-24 23:21:56 +00:00
}
2009-07-24 08:35:21 +00:00
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent + 1, "[Names]\n");
for (int i=0; i<codeObj->names()->size(); i++)
2023-06-02 00:36:58 +02:00
output_object(codeObj->names()->get(i), mod, indent + 2, flags, pyc_output);
if (mod->verCompare(1, 3) >= 0 && mod->verCompare(3, 11) < 0) {
if (mod->verCompare(3, 11) >= 0)
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent + 1, "[Locals+Names]\n");
else
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent + 1, "[Var Names]\n");
for (int i=0; i<codeObj->localNames()->size(); i++)
2023-06-02 00:36:58 +02:00
output_object(codeObj->localNames()->get(i), mod, indent + 2, flags, pyc_output);
}
if (mod->verCompare(3, 11) >= 0 && (flags & Pyc::DISASM_PYCODE_VERBOSE) != 0) {
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent + 1, "[Locals+Kinds]\n");
output_object(codeObj->localKinds().cast<PycObject>(), mod, indent + 2, flags, pyc_output);
2009-07-24 23:21:56 +00:00
}
2009-07-24 08:35:21 +00:00
if (mod->verCompare(2, 1) >= 0 && mod->verCompare(3, 11) < 0) {
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent + 1, "[Free Vars]\n");
2009-07-24 23:21:56 +00:00
for (int i=0; i<codeObj->freeVars()->size(); i++)
2023-06-02 00:36:58 +02:00
output_object(codeObj->freeVars()->get(i), mod, indent + 2, flags, pyc_output);
2009-07-24 08:35:21 +00:00
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent + 1, "[Cell Vars]\n");
2009-07-24 23:21:56 +00:00
for (int i=0; i<codeObj->cellVars()->size(); i++)
2023-06-02 00:36:58 +02:00
output_object(codeObj->cellVars()->get(i), mod, indent + 2, flags, pyc_output);
2009-07-24 23:21:56 +00:00
}
2009-07-24 08:35:21 +00:00
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent + 1, "[Constants]\n");
for (int i=0; i<codeObj->consts()->size(); i++)
2023-06-02 00:36:58 +02:00
output_object(codeObj->consts()->get(i), mod, indent + 2, flags, pyc_output);
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent + 1, "[Disassembly]\n");
bc_disasm(codeObj, mod, indent + 2, flags, pyc_output);
if (mod->verCompare(1, 5) >= 0 && (flags & Pyc::DISASM_PYCODE_VERBOSE) != 0) {
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent + 1, "[Line Number Table]\n");
output_object(codeObj->lnTable().cast<PycObject>(), mod, indent + 2, flags, pyc_output);
}
if (mod->verCompare(3, 11) >= 0 && (flags & Pyc::DISASM_PYCODE_VERBOSE) != 0) {
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent + 1, "[Exception Table]\n");
output_object(codeObj->exceptTable().cast<PycObject>(), mod, indent + 2, flags, pyc_output);
}
2009-07-24 08:35:21 +00:00
}
break;
case PycObject::TYPE_STRING:
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent, "");
OutputString(obj.cast<PycString>(), mod->strIsUnicode() ? 'b' : 0, false, pyc_output);
pyc_output << "\n";
2009-07-24 08:35:21 +00:00
break;
case PycObject::TYPE_UNICODE:
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent, "");
OutputString(obj.cast<PycString>(), mod->strIsUnicode() ? 0 : 'u', false, pyc_output);
pyc_output << "\n";
break;
case PycObject::TYPE_INTERNED:
case PycObject::TYPE_ASCII:
case PycObject::TYPE_ASCII_INTERNED:
case PycObject::TYPE_SHORT_ASCII:
case PycObject::TYPE_SHORT_ASCII_INTERNED:
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent, "");
if (mod->majorVer() >= 3)
2023-06-02 00:36:58 +02:00
OutputString(obj.cast<PycString>(), 0, false, pyc_output);
else
2023-06-02 00:36:58 +02:00
OutputString(obj.cast<PycString>(), mod->strIsUnicode() ? 'b' : 0, false, pyc_output);
pyc_output << "\n";
break;
2009-07-24 08:35:21 +00:00
case PycObject::TYPE_TUPLE:
case PycObject::TYPE_SMALL_TUPLE:
2009-07-24 08:35:21 +00:00
{
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent, "(\n");
for (const auto& val : obj.cast<PycTuple>()->values())
2023-06-02 00:36:58 +02:00
output_object(val, mod, indent + 1, flags, pyc_output);
iputs(pyc_output, indent, ")\n");
2009-07-24 08:35:21 +00:00
}
break;
case PycObject::TYPE_LIST:
{
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent, "[\n");
for (const auto& val : obj.cast<PycList>()->values())
2023-06-02 00:36:58 +02:00
output_object(val, mod, indent + 1, flags, pyc_output);
iputs(pyc_output, indent, "]\n");
2009-07-24 08:35:21 +00:00
}
break;
2009-07-24 21:39:51 +00:00
case PycObject::TYPE_DICT:
{
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent, "{\n");
2009-07-24 21:39:51 +00:00
PycDict::key_t keys = obj.cast<PycDict>()->keys();
PycDict::value_t values = obj.cast<PycDict>()->values();
PycDict::key_t::const_iterator ki = keys.begin();
PycDict::value_t::const_iterator vi = values.begin();
2009-07-24 21:39:51 +00:00
while (ki != keys.end()) {
2023-06-02 00:36:58 +02:00
output_object(*ki, mod, indent + 1, flags, pyc_output);
output_object(*vi, mod, indent + 2, flags, pyc_output);
++ki, ++vi;
2009-07-24 21:39:51 +00:00
}
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent, "}\n");
2009-07-24 21:39:51 +00:00
}
break;
case PycObject::TYPE_SET:
{
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent, "{\n");
for (const auto& val : obj.cast<PycSet>()->values())
2023-06-02 00:36:58 +02:00
output_object(val, mod, indent + 1, flags, pyc_output);
iputs(pyc_output, indent, "}\n");
}
break;
case PycObject::TYPE_FROZENSET:
{
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent, "frozenset({\n");
for (const auto& val : obj.cast<PycSet>()->values())
2023-06-02 00:36:58 +02:00
output_object(val, mod, indent + 1, flags, pyc_output);
iputs(pyc_output, indent, "})\n");
}
break;
2009-07-24 08:35:21 +00:00
case PycObject::TYPE_NONE:
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent, "None\n");
2009-07-24 08:35:21 +00:00
break;
case PycObject::TYPE_FALSE:
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent, "False\n");
break;
case PycObject::TYPE_TRUE:
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent, "True\n");
break;
2016-08-30 13:32:53 -07:00
case PycObject::TYPE_ELLIPSIS:
2023-06-02 00:36:58 +02:00
iputs(pyc_output, indent, "...\n");
2016-08-30 13:32:53 -07:00
break;
2009-07-24 08:35:21 +00:00
case PycObject::TYPE_INT:
2023-06-02 00:36:58 +02:00
iprintf(pyc_output, indent, "%d\n", obj.cast<PycInt>()->value());
2009-07-24 08:35:21 +00:00
break;
2011-09-23 21:46:05 -07:00
case PycObject::TYPE_LONG:
2023-06-02 00:36:58 +02:00
iprintf(pyc_output, indent, "%s\n", obj.cast<PycLong>()->repr().c_str());
2011-09-23 21:46:05 -07:00
break;
2009-07-24 08:35:21 +00:00
case PycObject::TYPE_FLOAT:
2023-06-02 00:36:58 +02:00
iprintf(pyc_output, indent, "%s\n", obj.cast<PycFloat>()->value());
2009-07-24 08:35:21 +00:00
break;
case PycObject::TYPE_COMPLEX:
2023-06-02 00:36:58 +02:00
iprintf(pyc_output, indent, "(%s+%sj)\n", obj.cast<PycComplex>()->value(),
obj.cast<PycComplex>()->imag());
break;
case PycObject::TYPE_BINARY_FLOAT:
2023-06-02 00:36:58 +02:00
iprintf(pyc_output, indent, "%g\n", obj.cast<PycCFloat>()->value());
break;
case PycObject::TYPE_BINARY_COMPLEX:
2023-06-02 00:36:58 +02:00
iprintf(pyc_output, indent, "(%g+%gj)\n", obj.cast<PycCComplex>()->value(),
obj.cast<PycCComplex>()->imag());
break;
2009-07-24 08:35:21 +00:00
default:
2023-06-02 00:36:58 +02:00
iprintf(pyc_output, indent, "<TYPE: %d>\n", obj->type());
2009-07-24 08:35:21 +00:00
}
}
int main(int argc, char* argv[])
{
const char* infile = nullptr;
bool marshalled = false;
const char* version = nullptr;
unsigned disasm_flags = 0;
2023-06-02 00:36:58 +02:00
std::ostream &pyc_output = std::cout;
for (int arg = 1; arg < argc; ++arg) {
if (strcmp(argv[arg], "-o") == 0) {
if (arg + 1 < argc) {
const char* filename = argv[++arg];
2023-06-02 00:36:58 +02:00
auto* outfile = new std::filebuf;
if(! outfile->open(filename, std::ios::out)) {
fprintf(stderr, "Error opening file '%s' for writing\n",
argv[arg]);
return 1;
}
2023-06-02 00:36:58 +02:00
pyc_output.rdbuf(outfile);
} else {
fputs("Option '-o' requires a filename\n", stderr);
return 1;
}
} else if (strcmp(argv[arg], "-c") == 0) {
marshalled = true;
} else if (strcmp(argv[arg], "-v") == 0) {
if (arg + 1 < argc) {
version = argv[++arg];
} else {
fputs("Option '-v' requires a version\n", stderr);
return 1;
}
} else if (strcmp(argv[arg], "--pycode-extra") == 0) {
disasm_flags |= Pyc::DISASM_PYCODE_VERBOSE;
} else if (strcmp(argv[arg], "--show-caches") == 0) {
disasm_flags |= Pyc::DISASM_SHOW_CACHES;
} else if (strcmp(argv[arg], "--help") == 0 || strcmp(argv[arg], "-h") == 0) {
fprintf(stderr, "Usage: %s [options] input.pyc\n\n", argv[0]);
fputs("Options:\n", stderr);
fputs(" -o <filename> Write output to <filename> (default: stdout)\n", stderr);
fputs(" -c Specify loading a compiled code object. Requires the version to be set\n", stderr);
2022-06-16 12:49:04 +01:00
fputs(" -v <x.y> Specify a Python version for loading a compiled code object\n", stderr);
fputs(" --pycode-extra Show extra fields in PyCode object dumps\n", stderr);
fputs(" --show-caches Don't suprress CACHE instructions in Python 3.11+ disassembly\n", stderr);
fputs(" --help Show this help text and then exit\n", stderr);
return 0;
} else if (argv[arg][0] == '-') {
fprintf(stderr, "Error: Unrecognized argument %s\n", argv[arg]);
return 1;
} else {
infile = argv[arg];
}
}
if (!infile) {
fputs("No input file specified\n", stderr);
2009-07-24 08:35:21 +00:00
return 1;
}
PycModule mod;
if (!marshalled) {
try {
mod.loadFromFile(infile);
} catch (std::exception &ex) {
fprintf(stderr, "Error disassembling %s: %s\n", infile, ex.what());
return 1;
}
} else {
if (!version) {
fputs("Opening raw code objects requires a version to be specified\n", stderr);
return 1;
}
std::string s(version);
auto dot = s.find('.');
if (dot == std::string::npos || dot == s.size()-1) {
2022-06-16 12:49:04 +01:00
fputs("Unable to parse version string (use the format x.y)\n", stderr);
return 1;
}
int major = std::stoi(s.substr(0, dot));
int minor = std::stoi(s.substr(dot+1, s.size()));
mod.loadFromMarshalledFile(infile, major, minor);
}
const char* dispname = strrchr(infile, PATHSEP);
dispname = (dispname == NULL) ? infile : dispname + 1;
2023-06-02 00:36:58 +02:00
formatted_print(pyc_output, "%s (Python %d.%d%s)\n", dispname, mod.majorVer(), mod.minorVer(),
(mod.majorVer() < 3 && mod.isUnicode()) ? " -U" : "");
try {
2023-06-02 00:36:58 +02:00
output_object(mod.code().try_cast<PycObject>(), &mod, 0, disasm_flags, pyc_output);
} catch (std::exception& ex) {
fprintf(stderr, "Error disassembling %s: %s\n", infile, ex.what());
return 1;
}
2009-07-24 08:35:21 +00:00
return 0;
}