Files
Pyarmor-Static-Unpack-1shot/pycdc/pyc_string.cpp

183 lines
5.4 KiB
C++
Raw Normal View History

2011-10-23 17:48:10 -07:00
#include "pyc_string.h"
#include "pyc_module.h"
2009-07-24 08:35:21 +00:00
#include "data.h"
#include <stdexcept>
2025-03-02 23:48:24 +08:00
#include "plusaes.hpp"
2009-07-24 08:35:21 +00:00
/**
 * Report whether every byte of `data` is 7-bit ASCII.
 *
 * The whole string is examined, including anything after an embedded NUL.
 * Walking the c_str() until the first '\0' would silently skip the tail of
 * a string that contains a NUL byte and let non-ASCII bytes through.
 *
 * @param data  Raw bytes to validate.
 * @return true when no byte has its high bit (0x80) set; true for "".
 */
static bool check_ascii(const std::string& data)
{
    for (const char ch : data) {
        if (static_cast<unsigned char>(ch) & 0x80)
            return false;
    }
    return true;
}
2009-07-24 08:35:21 +00:00
/* PycString */
/**
 * Populate this string from `stream`.
 *
 * - TYPE_STRINGREF: reads a 32-bit value, looks it up with
 *   mod->getIntern() and copies that string's type and value.
 * - Any other type: reads a length (getByte() for the SHORT_ASCII types,
 *   get32() otherwise), then that many bytes into m_value. ASCII-typed
 *   strings are validated with check_ascii(). Interned types are then
 *   registered through mod->intern().
 *
 * @throws std::bad_alloc      if the length read from the stream is negative.
 * @throws std::runtime_error  if an ASCII-typed string fails check_ascii().
 */
void PycString::load(PycData* stream, PycModule* mod)
{
    if (type() == TYPE_STRINGREF) {
        PycRef<PycString> interned = mod->getIntern(stream->get32());
        m_type = interned->m_type;
        m_value = interned->m_value;
        return;
    }

    // Classify the marshal type once; nothing below changes it.
    const auto kind = type();
    const bool isShort = (kind == TYPE_SHORT_ASCII
                          || kind == TYPE_SHORT_ASCII_INTERNED);
    const bool isAscii = (kind == TYPE_ASCII || kind == TYPE_ASCII_INTERNED
                          || isShort);
    const bool isInterned = (kind == TYPE_INTERNED
                             || kind == TYPE_ASCII_INTERNED
                             || kind == TYPE_SHORT_ASCII_INTERNED);

    int length;
    if (isShort)
        length = stream->getByte();
    else
        length = stream->get32();

    if (length < 0)
        throw std::bad_alloc();

    m_value.resize(length);
    if (length > 0) {
        stream->getBuffer(length, &m_value.front());
        if (isAscii && !check_ascii(m_value))
            throw std::runtime_error("Invalid bytes in ASCII string");
    }

    if (isInterned)
        mod->intern(this);
}
2009-07-24 19:52:47 +00:00
2009-07-24 21:15:51 +00:00
/**
 * Compare this string with another object.
 *
 * @param obj  Object to compare against.
 * @return false when `obj` reports a different type(); otherwise the
 *         result of comparing against the other string's value through
 *         the value-taking isEqual overload.
 */
bool PycString::isEqual(PycRef<PycObject> obj) const
{
    if (type() == obj.type()) {
        PycRef<PycString> other = obj.cast<PycString>();
        return isEqual(other->m_value);
    }
    return false;
}
void PycString::print(std::ostream &pyc_output, PycModule* mod, bool triple,
const char* parent_f_string_quote)
2009-07-24 19:52:47 +00:00
{
char prefix = 0;
switch (type()) {
case TYPE_STRING:
prefix = mod->strIsUnicode() ? 'b' : 0;
break;
case PycObject::TYPE_UNICODE:
prefix = mod->strIsUnicode() ? 0 : 'u';
break;
case PycObject::TYPE_INTERNED:
prefix = mod->internIsBytes() ? 'b' : 0;
break;
case PycObject::TYPE_ASCII:
case PycObject::TYPE_ASCII_INTERNED:
case PycObject::TYPE_SHORT_ASCII:
case PycObject::TYPE_SHORT_ASCII_INTERNED:
// These types don't exist until Python 3.4
prefix = 0;
break;
default:
throw std::runtime_error("Invalid string type");
}
if (prefix != 0)
2023-06-02 00:36:58 +02:00
pyc_output << prefix;
if (m_value.empty()) {
2023-06-02 00:36:58 +02:00
pyc_output << "''";
2009-07-24 19:52:47 +00:00
return;
}
// Determine preferred quote style (Emulate Python's method)
bool useQuotes = false;
2020-10-17 21:04:39 +11:00
if (!parent_f_string_quote) {
for (char ch : m_value) {
if (ch == '\'') {
useQuotes = true;
} else if (ch == '"') {
useQuotes = false;
break;
}
}
2020-10-20 21:08:02 -07:00
} else {
useQuotes = parent_f_string_quote[0] == '"';
}
// Output the string
if (!parent_f_string_quote) {
if (triple)
pyc_output << (useQuotes ? R"(""")" : "'''");
else
2023-06-02 00:36:58 +02:00
pyc_output << (useQuotes ? '"' : '\'');
}
for (char ch : m_value) {
if (static_cast<unsigned char>(ch) < 0x20 || ch == 0x7F) {
if (ch == '\r') {
2023-06-02 00:36:58 +02:00
pyc_output << "\\r";
} else if (ch == '\n') {
if (triple)
2023-06-02 00:36:58 +02:00
pyc_output << '\n';
2009-07-24 19:52:47 +00:00
else
2023-06-02 00:36:58 +02:00
pyc_output << "\\n";
} else if (ch == '\t') {
2023-06-02 00:36:58 +02:00
pyc_output << "\\t";
2009-07-24 19:52:47 +00:00
} else {
formatted_print(pyc_output, "\\x%02x", (ch & 0xFF));
2009-07-24 19:52:47 +00:00
}
} else if (static_cast<unsigned char>(ch) >= 0x80) {
if (type() == TYPE_UNICODE) {
// Unicode stored as UTF-8... Let the stream interpret it
pyc_output << ch;
} else {
formatted_print(pyc_output, "\\x%02x", (ch & 0xFF));
}
2009-07-24 19:52:47 +00:00
} else {
if (!useQuotes && ch == '\'')
pyc_output << R"(\')";
else if (useQuotes && ch == '"')
pyc_output << R"(\")";
else if (ch == '\\')
pyc_output << R"(\\)";
else if (parent_f_string_quote && ch == '{')
2023-06-02 00:36:58 +02:00
pyc_output << "{{";
else if (parent_f_string_quote && ch == '}')
2023-06-02 00:36:58 +02:00
pyc_output << "}}";
2009-07-24 19:52:47 +00:00
else
pyc_output << ch;
2009-07-24 19:52:47 +00:00
}
}
if (!parent_f_string_quote) {
2020-10-17 21:04:39 +11:00
if (triple)
pyc_output << (useQuotes ? R"(""")" : "'''");
2020-10-17 21:04:39 +11:00
else
2023-06-02 00:36:58 +02:00
pyc_output << (useQuotes ? '"' : '\'');
2020-10-17 21:04:39 +11:00
}
2009-07-24 19:52:47 +00:00
}
2025-03-02 23:48:24 +08:00
void PycString::dasPrintAndDecrypt(std::ostream &stream, PycModule *mod, bool triple, const char *parent_f_string_quote)
{
if (m_value.empty() || !(m_value[0] & 0x80)
|| (m_value[0] & 0x7F) == 0 || (m_value[0] & 0x7F) > 4)
return print(stream, mod, triple, parent_f_string_quote);
std::string result(m_value.substr(1));
unsigned char nonce[16] = {0};
memcpy(nonce, mod->pyarmor_mix_str_aes_nonce, 12);
nonce[15] = 2;
plusaes::crypt_ctr(
(unsigned char *)&result[0],
result.length(),
mod->pyarmor_aes_key,
16,
&nonce);
PycString decrypted(m_value[0] & 1 ? TYPE_UNICODE : TYPE_STRING);
2025-03-02 23:48:24 +08:00
decrypted.setValue(result);
decrypted.print(stream, mod, triple, parent_f_string_quote);
stream << " # ";
print(stream, mod, triple, parent_f_string_quote);
}