summaryrefslogtreecommitdiff
path: root/src/mangling/dex
diff options
context:
space:
mode:
authorCyrille Bagard <nocbos@gmail.com>2018-03-11 21:57:05 (GMT)
committerCyrille Bagard <nocbos@gmail.com>2018-03-11 21:57:05 (GMT)
commit8088f1cbb4304c686ff41520099707a333084a4e (patch)
tree147411c3f90097dc1ae950ec390df2dfccf07ad7 /src/mangling/dex
parenta33dd28e763e3a8b04145fb549aca9320e100a4b (diff)
Defined a new Dex demangler with MUTF-8 support as plugin.
Diffstat (limited to 'src/mangling/dex')
-rw-r--r--src/mangling/dex/Makefile.am46
-rw-r--r--src/mangling/dex/context.c154
-rw-r--r--src/mangling/dex/context.h52
-rw-r--r--src/mangling/dex/shorty_gram.y138
-rw-r--r--src/mangling/dex/shorty_tok.l28
-rw-r--r--src/mangling/dex/type_gram.y159
-rw-r--r--src/mangling/dex/type_tok.l150
7 files changed, 0 insertions, 727 deletions
diff --git a/src/mangling/dex/Makefile.am b/src/mangling/dex/Makefile.am
deleted file mode 100644
index 547d686..0000000
--- a/src/mangling/dex/Makefile.am
+++ /dev/null
@@ -1,46 +0,0 @@
-
-BUILT_SOURCES = libmanglingdexshorty_la-shorty_gram.h libmanglingdextype_la-type_gram.h
-
-AM_YFLAGS = -d
-
-noinst_LTLIBRARIES = libmanglingdex.la libmanglingdexshorty.la libmanglingdextype.la
-
-libmanglingdex_la_SOURCES = \
- context.h context.c
-
-libmanglingdex_la_LDFLAGS =
-
-libmanglingdex_la_LIBADD = \
- libmanglingdexshorty.la \
- libmanglingdextype.la
-
-
-libmanglingdexshorty_la_SOURCES = \
- shorty_gram.y \
- shorty_tok.l
-
-libmanglingdexshorty_la_YFLAGS = -d -p shorty_ -o y.tab.c
-
-libmanglingdexshorty_la_LFLAGS = -P shorty_ -o lex.yy.c
-
-
-libmanglingdextype_la_SOURCES = \
- type_gram.y \
- type_tok.l
-
-libmanglingdextype_la_YFLAGS = -d -p type_ -o y.tab.c
-
-libmanglingdextype_la_LFLAGS = -P type_ -o lex.yy.c
-
-
-AM_CPPFLAGS = $(LIBGTK_CFLAGS) $(LIBXML_CFLAGS)
-
-AM_CFLAGS = $(DEBUG_CFLAGS) $(WARNING_FLAGS) $(COMPLIANCE_FLAGS)
-
-
-# Automake fait les choses à moitié
-CLEANFILES = \
- libmanglingdexshorty_la-shorty_gram.h libmanglingdexshorty_la-shorty_gram.c \
- libmanglingdexshorty_la-shorty_tok.c \
- libmanglingdextype_la-type_gram.h libmanglingdextype_la-type_gram.c \
- libmanglingdextype_la-type_tok.c
diff --git a/src/mangling/dex/context.c b/src/mangling/dex/context.c
deleted file mode 100644
index 9dd9b9c..0000000
--- a/src/mangling/dex/context.c
+++ /dev/null
@@ -1,154 +0,0 @@
-
-/* Chrysalide - Outil d'analyse de fichiers binaires
- * context.c - contextes de décodage DEX
- *
- * Copyright (C) 2015-2017 Cyrille Bagard
- *
- * This file is part of Chrysalide.
- *
- * Chrysalide is free software; you can redistribute it and/or modify
- * it under the terms of the GNU General Public License as published by
- * the Free Software Foundation; either version 3 of the License, or
- * (at your option) any later version.
- *
- * Chrysalide is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU General Public License for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with Foobar. If not, see <http://www.gnu.org/licenses/>.
- */
-
-
-#include "context.h"
-
-
-#include "../context-int.h"
-
-
-
-/* Contexte de décodage DEX (instance) */
-struct _GDexDemangler
-{
- GDemanglingContext parent; /* A laisser en premier */
-
-};
-
-/* Contexte de décodage DEX (classe) */
-struct _GDexDemanglerClass
-{
- GDemanglingContextClass parent; /* A laisser en premier */
-
-};
-
-
-/* Initialise la classe des contextes de décodage DEX. */
-static void g_dex_demangler_class_init(GDexDemanglerClass *);
-
-/* Initialise une instance de contexte pour décodage DEX. */
-static void g_dex_demangler_init(GDexDemangler *);
-
-/* Supprime toutes les références externes. */
-static void g_dex_demangler_dispose(GDexDemangler *);
-
-/* Procède à la libération totale de la mémoire. */
-static void g_dex_demangler_finalize(GDexDemangler *);
-
-
-/* Procède au décodage d'une chaîne de caractères. */
-extern bool demangle_dex_routine(GDexDemangler *, const char *);
-
-/* Procède au décodage d'une chaîne de caractères. */
-extern bool demangle_dex_type(GDexDemangler *, const char *);
-
-
-
-/* Indique le type défini pour un contexte de décodage DEX. */
-G_DEFINE_TYPE(GDexDemangler, g_dex_demangler, G_TYPE_DEMANGLING_CONTEXT);
-
-
-/******************************************************************************
-* *
-* Paramètres : klass = classe à initialiser. *
-* *
-* Description : Initialise la classe des contextes de décodage DEX. *
-* *
-* Retour : - *
-* *
-* Remarques : - *
-* *
-******************************************************************************/
-
-static void g_dex_demangler_class_init(GDexDemanglerClass *klass)
-{
- GObjectClass *object; /* Autre version de la classe */
- GDemanglingContextClass *context; /* Version parente */
-
- object = G_OBJECT_CLASS(klass);
-
- object->dispose = (GObjectFinalizeFunc/* ! */)g_dex_demangler_dispose;
- object->finalize = (GObjectFinalizeFunc)g_dex_demangler_finalize;
-
- context = G_DEMANGLING_CONTEXT_CLASS(klass);
-
- context->demangle_type = (demangle_fc)demangle_dex_type;
- context->demangle_routine = (demangle_fc)demangle_dex_routine;
-
-}
-
-
-/******************************************************************************
-* *
-* Paramètres : demangler = instance à initialiser. *
-* *
-* Description : Initialise une instance de contexte pour décodage DEX. *
-* *
-* Retour : - *
-* *
-* Remarques : - *
-* *
-******************************************************************************/
-
-static void g_dex_demangler_init(GDexDemangler *demangler)
-{
-
-}
-
-
-/******************************************************************************
-* *
-* Paramètres : demangler = instance d'objet GLib à traiter. *
-* *
-* Description : Supprime toutes les références externes. *
-* *
-* Retour : - *
-* *
-* Remarques : - *
-* *
-******************************************************************************/
-
-static void g_dex_demangler_dispose(GDexDemangler *demangler)
-{
- G_OBJECT_CLASS(g_dex_demangler_parent_class)->dispose(G_OBJECT(demangler));
-
-}
-
-
-/******************************************************************************
-* *
-* Paramètres : demangler = instance d'objet GLib à traiter. *
-* *
-* Description : Procède à la libération totale de la mémoire. *
-* *
-* Retour : - *
-* *
-* Remarques : - *
-* *
-******************************************************************************/
-
-static void g_dex_demangler_finalize(GDexDemangler *demangler)
-{
- G_OBJECT_CLASS(g_dex_demangler_parent_class)->finalize(G_OBJECT(demangler));
-
-}
diff --git a/src/mangling/dex/context.h b/src/mangling/dex/context.h
deleted file mode 100644
index 1af7a9d..0000000
--- a/src/mangling/dex/context.h
+++ /dev/null
@@ -1,52 +0,0 @@
-
-/* Chrysalide - Outil d'analyse de fichiers binaires
- * context.h - prototypes internes liés aux contextes de décodage DEX
- *
- * Copyright (C) 2015-2017 Cyrille Bagard
- *
- * This file is part of Chrysalide.
- *
- * Chrysalide is free software; you can redistribute it and/or modify
- * it under the terms of the GNU General Public License as published by
- * the Free Software Foundation; either version 3 of the License, or
- * (at your option) any later version.
- *
- * Chrysalide is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU General Public License for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with Foobar. If not, see <http://www.gnu.org/licenses/>.
- */
-
-
-#ifndef _FORMAT_MANGLING_DEX_CONTEXT_H
-#define _FORMAT_MANGLING_DEX_CONTEXT_H
-
-
-#include <glib-object.h>
-
-
-
-#define G_TYPE_DEX_DEMANGLER g_dex_demangler_get_type()
-#define G_DEX_DEMANGLER(obj) (G_TYPE_CHECK_INSTANCE_CAST((obj), g_dex_demangler_get_type(), GDexDemangler))
-#define G_IS_DEX_DEMANGLER(obj) (G_TYPE_CHECK_INSTANCE_TYPE((obj), g_dex_demangler_get_type()))
-#define G_DEX_DEMANGLER_CLASS(klass) (G_TYPE_CHECK_CLASS_CAST((klass), G_TYPE_DEX_DEMANGLER, GDexDemanglerClass))
-#define G_IS_DEX_DEMANGLER_CLASS(klass) (G_TYPE_CHECK_CLASS_TYPE((klass), G_TYPE_DEX_DEMANGLER))
-#define G_DEX_DEMANGLER_GET_CLASS(obj) (G_TYPE_INSTANCE_GET_CLASS((obj), G_TYPE_DEX_DEMANGLER, GDexDemanglerClass))
-
-
-/* Contexte de décodage DEX (instance) */
-typedef struct _GDexDemangler GDexDemangler;
-
-/* Contexte de décodage DEX (classe) */
-typedef struct _GDexDemanglerClass GDexDemanglerClass;
-
-
-/* Indique le type défini pour un contexte de décodage DEX. */
-GType g_dex_demangler_get_type(void);
-
-
-
-#endif /* _FORMAT_MANGLING_DEX_CONTEXT_H */
diff --git a/src/mangling/dex/shorty_gram.y b/src/mangling/dex/shorty_gram.y
deleted file mode 100644
index b688896..0000000
--- a/src/mangling/dex/shorty_gram.y
+++ /dev/null
@@ -1,138 +0,0 @@
-
-%{
-
-#include <stdbool.h>
-
-
-#include "context.h"
-#include "../context-int.h"
-
-
-
-/* Affiche un message d'erreur concernant l'analyse. */
-static int shorty_error(GDexDemangler *, char *);
-
-/* Procède au décodage d'une chaîne de caractères. */
-bool demangle_dex_routine(GDexDemangler *, const char *);
-
-
-%}
-
-
-%code requires {
-
-#include "../../analysis/types/basic.h"
-#include "../../analysis/types/cse.h"
-
-}
-
-%union {
-
- GDataType *type; /* Type reconstruit */
-
-}
-
-
-%parse-param { GDexDemangler *demangler }
-
-%token V Z B S C I J F D L
-
-%type <type> shorty_return_type shorty_field_type
-
-
-%{
-
-/* Déclarations issues de l'analyseur syntaxique... */
-
-typedef struct yy_buffer_state *YY_BUFFER_STATE;
-
-extern YY_BUFFER_STATE shorty__scan_string(const char *);
-extern void shorty__delete_buffer(YY_BUFFER_STATE);
-extern int shorty_lex(void);
-
-%}
-
-
-%%
-
-
-shorty_descriptor:
- shorty_return_type shorty_field_type_list {
- GBinRoutine *routine;
- routine = G_DEMANGLING_CONTEXT(demangler)->routine;
- g_binary_routine_set_return_type(routine, $1);
- }
-
-shorty_field_type_list:
- /* empty */
- | shorty_field_type shorty_field_type_list {
- GBinRoutine *routine;
- GBinVariable *var;
- routine = G_DEMANGLING_CONTEXT(demangler)->routine;
- var = g_binary_variable_new($1);
- g_binary_routine_add_arg(routine, var);
- }
-
-shorty_return_type:
- V { $$ = g_basic_type_new(BTP_VOID); }
- | shorty_field_type { $$ = $1; }
-
-shorty_field_type:
- Z { $$ = g_basic_type_new(BTP_BOOL); }
- | B { $$ = g_basic_type_new(BTP_UCHAR); }
- | S { $$ = g_basic_type_new(BTP_SHORT); }
- | C { $$ = g_basic_type_new(BTP_CHAR); }
- | I { $$ = g_basic_type_new(BTP_INT); }
- | J { $$ = g_basic_type_new(BTP_LONG); }
- | F { $$ = g_basic_type_new(BTP_FLOAT); }
- | D { $$ = g_basic_type_new(BTP_DOUBLE); }
- | L { $$ = g_class_enum_type_new(CET_CLASS, ""); }
-
-
-%%
-
-
-/******************************************************************************
-* *
-* Paramètres : demangler = contexte associé à la procédure de décodage. *
-* msg = indications humaines sur l'événement. *
-* *
-* Description : Affiche un message d'erreur concernant l'analyse. *
-* *
-* Retour : Valeur historique, ignorée. *
-* *
-* Remarques : - *
-* *
-******************************************************************************/
-static int shorty_error(GDexDemangler *demangler, char *msg)
-{
- return -1;
-
-}
-
-
-/******************************************************************************
-* *
-* Paramètres : demangler = contexte de décodage à utiliser. *
-* desc = chaîne de caractères à décoder. *
-* *
-* Description : Procède au décodage d'une chaîne de caractères. *
-* *
-* Retour : Bilan de l'opération. *
-* *
-* Remarques : - *
-* *
-******************************************************************************/
-
-bool demangle_dex_routine(GDexDemangler *demangler, const char *desc)
-{
- YY_BUFFER_STATE buffer; /* Tampon pour bison */
- int ret; /* Bilan de l'appel */
-
- buffer = shorty__scan_string(desc);
- ret = yyparse(demangler);
- shorty__delete_buffer(buffer);
-
- return (ret == 0);
-
-}
diff --git a/src/mangling/dex/shorty_tok.l b/src/mangling/dex/shorty_tok.l
deleted file mode 100644
index a3545a2..0000000
--- a/src/mangling/dex/shorty_tok.l
+++ /dev/null
@@ -1,28 +0,0 @@
-
-%{
-
-#include "context.h"
-#include "libmanglingdexshorty_la-shorty_gram.h"
-
-%}
-
-
-%option noyywrap
-%option yylineno
-%option nounput
-%option noinput
-
-%%
-
-"V" { return V; }
-"Z" { return Z; }
-"B" { return B; }
-"S" { return S; }
-"C" { return C; }
-"I" { return I; }
-"J" { return J; }
-"F" { return F; }
-"D" { return D; }
-"L" { return L; }
-
-%%
diff --git a/src/mangling/dex/type_gram.y b/src/mangling/dex/type_gram.y
deleted file mode 100644
index 79c9320..0000000
--- a/src/mangling/dex/type_gram.y
+++ /dev/null
@@ -1,159 +0,0 @@
-
-%{
-
-#include <stdbool.h>
-
-
-#include "context.h"
-#include "../context-int.h"
-
-typedef void *yyscan_t;
-
-/* Affiche un message d'erreur concernant l'analyse. */
-static int type_error(GDexDemangler *, yyscan_t, char *);
-
-/* Procède au décodage d'une chaîne de caractères. */
-bool demangle_dex_type(GDexDemangler *, const char *);
-
-
-%}
-
-
-%code requires {
-
-#include "../../analysis/types/basic.h"
-#include "../../analysis/types/cse.h"
-#include "../../common/extstr.h"
-
-}
-
-%union {
-
- GDataType *type; /* Type reconstruit */
- size_t adeep; /* Dimension d'un tableau */
- char *text; /* Chaîne de caractères */
-
-}
-
-
-
-%define api.pure full
-%parse-param { GDexDemangler *demangler } { yyscan_t scanner }
-%lex-param { yyscan_t scanner }
-
-
-%token V Z B S C I J F D
-%token ARRAY
-%token L SEMICOLON
-%token SLASH DOLLAR
-%token TEXT
-
-%type <type> type_descriptor field_type_descriptor non_array_field_type_descriptor full_class_name
-
-%type <text> TEXT simple_name
-
-
-%{
-
-/* Déclarations issues de l'analyseur syntaxique... */
-
-typedef struct yy_buffer_state *YY_BUFFER_STATE;
-
-extern int type_lex_init(yyscan_t *scanner);
-extern YY_BUFFER_STATE type__scan_string(const char *, yyscan_t);
-extern void type__delete_buffer(YY_BUFFER_STATE, yyscan_t);
-extern int type_lex(YYSTYPE *, yyscan_t);
-extern int type_lex_destroy(yyscan_t);
-
-%}
-
-
-%%
-
-
-input:
- type_descriptor { G_DEMANGLING_CONTEXT(demangler)->type = $1; }
-
-type_descriptor:
- V { $$ = g_basic_type_new(BTP_VOID); }
- | field_type_descriptor { $$ = $1; }
-
-field_type_descriptor:
- non_array_field_type_descriptor { $$ = $1; }
- | ARRAY non_array_field_type_descriptor { $$ = $2; }
-
-non_array_field_type_descriptor:
- Z { $$ = g_basic_type_new(BTP_BOOL); }
- | B { $$ = g_basic_type_new(BTP_UCHAR); }
- | S { $$ = g_basic_type_new(BTP_SHORT); }
- | C { $$ = g_basic_type_new(BTP_CHAR); }
- | I { $$ = g_basic_type_new(BTP_INT); }
- | J { $$ = g_basic_type_new(BTP_LONG); }
- | F { $$ = g_basic_type_new(BTP_FLOAT); }
- | D { $$ = g_basic_type_new(BTP_DOUBLE); }
- | L full_class_name SEMICOLON { $$ = $2; }
-
-full_class_name:
- simple_name { $$ = g_class_enum_type_new(CET_CLASS, $1); }
- | full_class_name SLASH simple_name {
- $$ = g_class_enum_type_new(CET_CLASS, $3);
- g_data_type_set_namespace($$, $1);
- g_object_unref($1);
- }
-simple_name:
- TEXT { $$ = strdup($1); }
- | simple_name TEXT { $$ = stradd($1, $2); }
-
-%%
-
-
-/******************************************************************************
-* *
-* Paramètres : demangler = contexte associé à la procédure de décodage. *
-* scanner = données internes aux analyseurs. *
-* msg = indications humaines sur l'événement. *
-* *
-* Description : Affiche un message d'erreur concernant l'analyse. *
-* *
-* Retour : Valeur historique, ignorée. *
-* *
-* Remarques : - *
-* *
-******************************************************************************/
-static int type_error(GDexDemangler *demangler, yyscan_t scanner, char *msg)
-{
- return -1;
-
-}
-
-
-/******************************************************************************
-* *
-* Paramètres : demangler = contexte de décodage à utiliser. *
-* desc = chaîne de caractères à décoder. *
-* *
-* Description : Procède au décodage d'une chaîne de caractères. *
-* *
-* Retour : Bilan de l'opération. *
-* *
-* Remarques : - *
-* *
-******************************************************************************/
-
-bool demangle_dex_type(GDexDemangler *demangler, const char *desc)
-{
- yyscan_t scanner; /* Données internes */
- YY_BUFFER_STATE buffer; /* Tampon pour bison */
- int ret; /* Bilan de l'appel */
-
- type_lex_init(&scanner);
-
- buffer = type__scan_string(desc, scanner);
- ret = yyparse(demangler, scanner);
- type__delete_buffer(buffer, scanner);
-
- type_lex_destroy(scanner);
-
- return (ret == 0);
-
-}
diff --git a/src/mangling/dex/type_tok.l b/src/mangling/dex/type_tok.l
deleted file mode 100644
index 7e85d43..0000000
--- a/src/mangling/dex/type_tok.l
+++ /dev/null
@@ -1,150 +0,0 @@
-
-%{
-
-#include "context.h"
-#include "libmanglingdextype_la-type_gram.h"
-
-/* See lemoda.net/c/reentrant-parser */
-
-%}
-
-
-%option noyywrap
-%option yylineno
-%option nounput
-/*%option noinput*/
-%option reentrant
-%option bison-bridge
-
-%x string
-
-ASCII [A-Za-z0-9]
-SIMPLE {ASCII}|"$"|"-"|"_"
-
-%%
-
-"V" { return V; }
-"Z" { return Z; }
-"B" { return B; }
-"S" { return S; }
-"C" { return C; }
-"I" { return I; }
-"J" { return J; }
-"F" { return F; }
-"D" { return D; }
-"L" { BEGIN(string); return L; }
-"["* { yylval->adeep = strlen(yytext); return ARRAY; }
-<string>"/" { return SLASH; }
-<string>";" { BEGIN(INITIAL); return SEMICOLON; }
-
-<string>{SIMPLE}* { yylval->text = yytext; return TEXT; }
-
-<string>. {
- unsigned char next;
- char mutf8[4];
-
- switch ((unsigned char)yytext[0])
- {
- /* U+00a1 ... U+1fff */
- case 0x00 ... 0x1f:
-
- next = input(yyscanner);
-
- if (yytext[0] == 0x00 && next < 0xa1)
- {
- REJECT;
- }
-
- else
- {
- mutf8[0] = yytext[0];
- mutf8[1] = next;
- mutf8[2] = '\0';
-
- strcpy(yylval->text, mutf8); return TEXT;
-
- }
-
- break;
-
- /* U+2010 ... U+2027 / U+2030 ... U+d7ff */
- case 0x20:
-
- next = input(yyscanner);
-
- switch (next)
- {
- case 0x10 ... 0x27:
- case 0x30 ... 0xff:
-
- mutf8[0] = yytext[0];
- mutf8[1] = next;
- mutf8[2] = '\0';
-
- strcpy(yylval->text, mutf8); return TEXT;
- break;
-
- default:
- REJECT;
- break;
-
- }
-
- break;
-
- /* ~ U+2030 ... U+d7ff */
- case 0x21 ... 0xd7:
-
- next = input(yyscanner);
-
- mutf8[0] = yytext[0];
- mutf8[1] = next;
- mutf8[2] = '\0';
-
- strcpy(yylval->text, mutf8); return TEXT;
- break;
-
- /* U+e000 ... U+ffef */
- case 0xe0 ... 0xff:
-
- next = input(yyscanner);
-
- if (yytext[0] == 0xff && next > 0xef)
- {
- REJECT;
- }
-
- else
- {
- mutf8[0] = yytext[0];
- mutf8[1] = next;
- mutf8[2] = '\0';
-
- strcpy(yylval->text, mutf8); return TEXT;
-
- }
-
- break;
-
- /* U+10000 ... U+10ffff */
- /*
- case 0x10:
-
- mutf8[0] = yytext[0];
- mutf8[1] = input(yyscanner);
- mutf8[2] = input(yyscanner);
- mutf8[3] = '\0';
-
- strcpy(yylval->text, mutf8); return TEXT;
- break;
- */
-
- default:
- REJECT;
- break;
-
- }
-
- }
-
-%%