如何解析. apk 包中的 AndroidManifest.xml 文件

此文件似乎是二进制 XML 格式。这种格式是什么? 如何通过编程方式解析它(与在 SDK 中使用 apatdump 工具相反) ?

文档 给你中没有讨论这种二进制格式。

注意: 我想从 Android 环境之外访问这些信息,最好是从 Java。

197469 次浏览

您可以使用 一个 href = “ http://code.google.com/p/android 随机/source/浏览/躯干/axml2xml/axml2xml.pl”rel = “ noReferrer”> axml2xml.pl 工具开发了一段时间以前在 机器人,随机项目。它将从二进制文件生成文本清单文件(AndroidManifest.xml)。

我说的是“ 原文”而不是“ 原创的”,因为像许多逆向工程工具一样,这个工具并不完美,而且 结果 < 强 > 不会 完成也不完美。我假设它要么从来没有完成过功能,要么就是不能向前兼容(使用较新的二进制编码方案)。不管是什么原因,Xml2xml.pl工具将无法正确地提取所有属性值。这些属性包括 minSdkVersion、 targetSdkVersion 和基本上所有引用资源的属性(如字符串、图标等) ,也就是说,只有类名(活动、服务等)被正确提取。

但是,你仍然可以通过在原始的 Android 应用程序文件(。 apk)上运行 恰到好处工具来找到这些缺失的信息:

适应 l-a < em > < somapp.apk >

使用 android-apktool

有一个应用程序可以读取 apk 文件并将 XML 解码为几乎原始的形式。

用法:

apktool d Gmail.apk && cat Gmail/AndroidManifest.xml

有关更多信息,请查看 Android-apktool

这个运行在 Android 上的 Java 方法在。APK 软件包。第二个代码框显示如何调用解压缩 XML,以及如何从设备上的 app 包文件加载 byte []。(有些字段的用途我不明白,如果你知道它们的意思,告诉我,我会更新信息。)

// decompressXML -- Parse the 'compressed' binary form of Android XML docs
// such as for AndroidManifest.xml in .apk files
public static int endDocTag = 0x00100101;
public static int startTag =  0x00100102;
public static int endTag =    0x00100103;
public void decompressXML(byte[] xml) {
// Compressed XML file/bytes starts with 24x bytes of data,
// 9 32 bit words in little endian order (LSB first):
//   0th word is 03 00 08 00
//   3rd word SEEMS TO BE:  Offset at then of StringTable
//   4th word is: Number of strings in string table
// WARNING: Sometime I indiscriminently display or refer to word in
//   little endian storage format, or in integer format (ie MSB first).
int numbStrings = LEW(xml, 4*4);


// StringIndexTable starts at offset 24x, an array of 32 bit LE offsets
// of the length/string data in the StringTable.
int sitOff = 0x24;  // Offset of start of StringIndexTable


// StringTable, each string is represented with a 16 bit little endian
// character count, followed by that number of 16 bit (LE) (Unicode) chars.
int stOff = sitOff + numbStrings*4;  // StringTable follows StrIndexTable


// XMLTags, The XML tag tree starts after some unknown content after the
// StringTable.  There is some unknown data after the StringTable, scan
// forward from this point to the flag for the start of an XML start tag.
int xmlTagOff = LEW(xml, 3*4);  // Start from the offset in the 3rd word.
// Scan forward until we find the bytes: 0x02011000(x00100102 in normal int)
for (int ii=xmlTagOff; ii<xml.length-4; ii+=4) {
if (LEW(xml, ii) == startTag) {
xmlTagOff = ii;  break;
}
} // end of hack, scanning for start of first start tag


// XML tags and attributes:
// Every XML start and end tag consists of 6 32 bit words:
//   0th word: 02011000 for startTag and 03011000 for endTag
//   1st word: a flag?, like 38000000
//   2nd word: Line of where this tag appeared in the original source file
//   3rd word: FFFFFFFF ??
//   4th word: StringIndex of NameSpace name, or FFFFFFFF for default NS
//   5th word: StringIndex of Element Name
//   (Note: 01011000 in 0th word means end of XML document, endDocTag)


// Start tags (not end tags) contain 3 more words:
//   6th word: 14001400 meaning??
//   7th word: Number of Attributes that follow this tag(follow word 8th)
//   8th word: 00000000 meaning??


// Attributes consist of 5 words:
//   0th word: StringIndex of Attribute Name's Namespace, or FFFFFFFF
//   1st word: StringIndex of Attribute Name
//   2nd word: StringIndex of Attribute Value, or FFFFFFF if ResourceId used
//   3rd word: Flags?
//   4th word: str ind of attr value again, or ResourceId of value


// TMP, dump string table to tr for debugging
//tr.addSelect("strings", null);
//for (int ii=0; ii<numbStrings; ii++) {
//  // Length of string starts at StringTable plus offset in StrIndTable
//  String str = compXmlString(xml, sitOff, stOff, ii);
//  tr.add(String.valueOf(ii), str);
//}
//tr.parent();


// Step through the XML tree element tags and attributes
int off = xmlTagOff;
int indent = 0;
int startTagLineNo = -2;
while (off < xml.length) {
int tag0 = LEW(xml, off);
//int tag1 = LEW(xml, off+1*4);
int lineNo = LEW(xml, off+2*4);
//int tag3 = LEW(xml, off+3*4);
int nameNsSi = LEW(xml, off+4*4);
int nameSi = LEW(xml, off+5*4);


if (tag0 == startTag) { // XML START TAG
int tag6 = LEW(xml, off+6*4);  // Expected to be 14001400
int numbAttrs = LEW(xml, off+7*4);  // Number of Attributes to follow
//int tag8 = LEW(xml, off+8*4);  // Expected to be 00000000
off += 9*4;  // Skip over 6+3 words of startTag data
String name = compXmlString(xml, sitOff, stOff, nameSi);
//tr.addSelect(name, null);
startTagLineNo = lineNo;


// Look for the Attributes
StringBuffer sb = new StringBuffer();
for (int ii=0; ii<numbAttrs; ii++) {
int attrNameNsSi = LEW(xml, off);  // AttrName Namespace Str Ind, or FFFFFFFF
int attrNameSi = LEW(xml, off+1*4);  // AttrName String Index
int attrValueSi = LEW(xml, off+2*4); // AttrValue Str Ind, or FFFFFFFF
int attrFlags = LEW(xml, off+3*4);
int attrResId = LEW(xml, off+4*4);  // AttrValue ResourceId or dup AttrValue StrInd
off += 5*4;  // Skip over the 5 words of an attribute


String attrName = compXmlString(xml, sitOff, stOff, attrNameSi);
String attrValue = attrValueSi!=-1
? compXmlString(xml, sitOff, stOff, attrValueSi)
: "resourceID 0x"+Integer.toHexString(attrResId);
sb.append(" "+attrName+"=\""+attrValue+"\"");
//tr.add(attrName, attrValue);
}
prtIndent(indent, "<"+name+sb+">");
indent++;


} else if (tag0 == endTag) { // XML END TAG
indent--;
off += 6*4;  // Skip over 6 words of endTag data
String name = compXmlString(xml, sitOff, stOff, nameSi);
prtIndent(indent, "</"+name+">  (line "+startTagLineNo+"-"+lineNo+")");
//tr.parent();  // Step back up the NobTree


} else if (tag0 == endDocTag) {  // END OF XML DOC TAG
break;


} else {
prt("  Unrecognized tag code '"+Integer.toHexString(tag0)
+"' at offset "+off);
break;
}
} // end of while loop scanning tags and attributes of XML tree
prt("    end at offset "+off);
} // end of decompressXML




public String compXmlString(byte[] xml, int sitOff, int stOff, int strInd) {
if (strInd < 0) return null;
int strOff = stOff + LEW(xml, sitOff+strInd*4);
return compXmlStringAt(xml, strOff);
}




public static String spaces = "                                             ";
public void prtIndent(int indent, String str) {
prt(spaces.substring(0, Math.min(indent*2, spaces.length()))+str);
}




// compXmlStringAt -- Return the string stored in StringTable format at
// offset strOff.  This offset points to the 16 bit string length, which
// is followed by that number of 16 bit (Unicode) chars.
public String compXmlStringAt(byte[] arr, int strOff) {
int strLen = arr[strOff+1]<<8&0xff00 | arr[strOff]&0xff;
byte[] chars = new byte[strLen];
for (int ii=0; ii<strLen; ii++) {
chars[ii] = arr[strOff+2+ii*2];
}
return new String(chars);  // Hack, just use 8 byte chars
} // end of compXmlStringAt




// LEW -- Return value of a Little Endian 32 bit word from the byte array
//   at offset off.
public int LEW(byte[] arr, int off) {
return arr[off+3]<<24&0xff000000 | arr[off+2]<<16&0xff0000
| arr[off+1]<<8&0xff00 | arr[off]&0xFF;
} // end of LEW

此方法将 AndroidManifest 读入一个字节[]以进行处理:

public void getIntents(String path) {
try {
JarFile jf = new JarFile(path);
InputStream is = jf.getInputStream(jf.getEntry("AndroidManifest.xml"));
byte[] xml = new byte[is.available()];
int br = is.read(xml);
//Tree tr = TrunkFactory.newTree();
decompressXML(xml);
//prt("XML\n"+tr.list());
} catch (Exception ex) {
console.log("getIntents, ex: "+ex);  ex.printStackTrace();
}
} // end of getIntents

大多数应用程序都存储在/system/app 中,这个应用程序不需要 root 用户就可以阅读我的 Evo,其他应用程序存储在/data/app 中,我需要 root 用户来查看。上面的‘ path’参数类似于: “/system/app/Weather.apk”

如果有用的话,下面是 Ribo 发布的 Java 代码片段的 C + + 版本:

struct decompressXML
{
// decompressXML -- Parse the 'compressed' binary form of Android XML docs
// such as for AndroidManifest.xml in .apk files
enum
{
endDocTag = 0x00100101,
startTag =  0x00100102,
endTag =    0x00100103
};


decompressXML(const BYTE* xml, int cb) {
// Compressed XML file/bytes starts with 24x bytes of data,
// 9 32 bit words in little endian order (LSB first):
//   0th word is 03 00 08 00
//   3rd word SEEMS TO BE:  Offset at then of StringTable
//   4th word is: Number of strings in string table
// WARNING: Sometime I indiscriminently display or refer to word in
//   little endian storage format, or in integer format (ie MSB first).
int numbStrings = LEW(xml, cb, 4*4);


// StringIndexTable starts at offset 24x, an array of 32 bit LE offsets
// of the length/string data in the StringTable.
int sitOff = 0x24;  // Offset of start of StringIndexTable


// StringTable, each string is represented with a 16 bit little endian
// character count, followed by that number of 16 bit (LE) (Unicode) chars.
int stOff = sitOff + numbStrings*4;  // StringTable follows StrIndexTable


// XMLTags, The XML tag tree starts after some unknown content after the
// StringTable.  There is some unknown data after the StringTable, scan
// forward from this point to the flag for the start of an XML start tag.
int xmlTagOff = LEW(xml, cb, 3*4);  // Start from the offset in the 3rd word.
// Scan forward until we find the bytes: 0x02011000(x00100102 in normal int)
for (int ii=xmlTagOff; ii<cb-4; ii+=4) {
if (LEW(xml, cb, ii) == startTag) {
xmlTagOff = ii;  break;
}
} // end of hack, scanning for start of first start tag


// XML tags and attributes:
// Every XML start and end tag consists of 6 32 bit words:
//   0th word: 02011000 for startTag and 03011000 for endTag
//   1st word: a flag?, like 38000000
//   2nd word: Line of where this tag appeared in the original source file
//   3rd word: FFFFFFFF ??
//   4th word: StringIndex of NameSpace name, or FFFFFFFF for default NS
//   5th word: StringIndex of Element Name
//   (Note: 01011000 in 0th word means end of XML document, endDocTag)


// Start tags (not end tags) contain 3 more words:
//   6th word: 14001400 meaning??
//   7th word: Number of Attributes that follow this tag(follow word 8th)
//   8th word: 00000000 meaning??


// Attributes consist of 5 words:
//   0th word: StringIndex of Attribute Name's Namespace, or FFFFFFFF
//   1st word: StringIndex of Attribute Name
//   2nd word: StringIndex of Attribute Value, or FFFFFFF if ResourceId used
//   3rd word: Flags?
//   4th word: str ind of attr value again, or ResourceId of value


// TMP, dump string table to tr for debugging
//tr.addSelect("strings", null);
//for (int ii=0; ii<numbStrings; ii++) {
//  // Length of string starts at StringTable plus offset in StrIndTable
//  String str = compXmlString(xml, sitOff, stOff, ii);
//  tr.add(String.valueOf(ii), str);
//}
//tr.parent();


// Step through the XML tree element tags and attributes
int off = xmlTagOff;
int indent = 0;
int startTagLineNo = -2;
while (off < cb) {
int tag0 = LEW(xml, cb, off);
//int tag1 = LEW(xml, off+1*4);
int lineNo = LEW(xml, cb, off+2*4);
//int tag3 = LEW(xml, off+3*4);
int nameNsSi = LEW(xml, cb, off+4*4);
int nameSi = LEW(xml, cb, off+5*4);


if (tag0 == startTag) { // XML START TAG
int tag6 = LEW(xml, cb, off+6*4);  // Expected to be 14001400
int numbAttrs = LEW(xml, cb, off+7*4);  // Number of Attributes to follow
//int tag8 = LEW(xml, off+8*4);  // Expected to be 00000000
off += 9*4;  // Skip over 6+3 words of startTag data
std::string name = compXmlString(xml, cb, sitOff, stOff, nameSi);
//tr.addSelect(name, null);
startTagLineNo = lineNo;


// Look for the Attributes
std::string sb;
for (int ii=0; ii<numbAttrs; ii++) {
int attrNameNsSi = LEW(xml, cb, off);  // AttrName Namespace Str Ind, or FFFFFFFF
int attrNameSi = LEW(xml, cb, off+1*4);  // AttrName String Index
int attrValueSi = LEW(xml, cb, off+2*4); // AttrValue Str Ind, or FFFFFFFF
int attrFlags = LEW(xml, cb, off+3*4);
int attrResId = LEW(xml, cb, off+4*4);  // AttrValue ResourceId or dup AttrValue StrInd
off += 5*4;  // Skip over the 5 words of an attribute


std::string attrName = compXmlString(xml, cb, sitOff, stOff, attrNameSi);
std::string attrValue = attrValueSi!=-1
? compXmlString(xml, cb, sitOff, stOff, attrValueSi)
: "resourceID 0x"+toHexString(attrResId);
sb.append(" "+attrName+"=\""+attrValue+"\"");
//tr.add(attrName, attrValue);
}
prtIndent(indent, "<"+name+sb+">");
indent++;


} else if (tag0 == endTag) { // XML END TAG
indent--;
off += 6*4;  // Skip over 6 words of endTag data
std::string name = compXmlString(xml, cb, sitOff, stOff, nameSi);
prtIndent(indent, "</"+name+">  (line "+toIntString(startTagLineNo)+"-"+toIntString(lineNo)+")");
//tr.parent();  // Step back up the NobTree


} else if (tag0 == endDocTag) {  // END OF XML DOC TAG
break;


} else {
prt("  Unrecognized tag code '"+toHexString(tag0)
+"' at offset "+toIntString(off));
break;
}
} // end of while loop scanning tags and attributes of XML tree
prt("    end at offset "+off);
} // end of decompressXML




std::string compXmlString(const BYTE* xml, int cb, int sitOff, int stOff, int strInd) {
if (strInd < 0) return std::string("");
int strOff = stOff + LEW(xml, cb, sitOff+strInd*4);
return compXmlStringAt(xml, cb, strOff);
}


void prt(std::string str)
{
printf("%s", str.c_str());
}
void prtIndent(int indent, std::string str) {
char spaces[46];
memset(spaces, ' ', sizeof(spaces));
spaces[min(indent*2,  sizeof(spaces) - 1)] = 0;
prt(spaces);
prt(str);
prt("\n");
}




// compXmlStringAt -- Return the string stored in StringTable format at
// offset strOff.  This offset points to the 16 bit string length, which
// is followed by that number of 16 bit (Unicode) chars.
std::string compXmlStringAt(const BYTE* arr, int cb, int strOff) {
if (cb < strOff + 2) return std::string("");
int strLen = arr[strOff+1]<<8&0xff00 | arr[strOff]&0xff;
char* chars = new char[strLen + 1];
chars[strLen] = 0;
for (int ii=0; ii<strLen; ii++) {
if (cb < strOff + 2 + ii * 2)
{
chars[ii] = 0;
break;
}
chars[ii] = arr[strOff+2+ii*2];
}
std::string str(chars);
free(chars);
return str;
} // end of compXmlStringAt




// LEW -- Return value of a Little Endian 32 bit word from the byte array
//   at offset off.
int LEW(const BYTE* arr, int cb, int off) {
return (cb > off + 3) ? ( arr[off+3]<<24&0xff000000 | arr[off+2]<<16&0xff0000
| arr[off+1]<<8&0xff00 | arr[off]&0xFF ) : 0;
} // end of LEW


std::string toHexString(DWORD attrResId)
{
char ch[20];
sprintf_s(ch, 20, "%lx", attrResId);
return std::string(ch);
}
std::string toIntString(int i)
{
char ch[20];
sprintf_s(ch, 20, "%ld", i);
return std::string(ch);
}
};

检查下面的 WPF 计划,它正确地解码了属性。

以下是我对 Ribo 代码的解释。主要的区别在于解压缩 XML ()直接返回一个 String,在我看来,这是一种更合适的用法。

注意: 我使用 Ribo 的解决方案的唯一目的是获取一个。APK 文件从 Manifest XML 文件发布的版本,并且我确认为此目的它工作得非常好。

编辑[2013-03-16] : 它工作得很好 如果版本被设置为纯文本,但是如果它被设置为引用资源 XML,它将显示为“ Resource 0x1”,例如。在这种特殊情况下,您可能必须将这个解决方案与另一个解决方案耦合起来,这个解决方案将获取适当的字符串资源引用。

/**
* Binary XML doc ending Tag
*/
public static int endDocTag = 0x00100101;


/**
* Binary XML start Tag
*/
public static int startTag =  0x00100102;


/**
* Binary XML end Tag
*/
public static int endTag =    0x00100103;




/**
* Reference var for spacing
* Used in prtIndent()
*/
public static String spaces = "                                             ";




/**
* Parse the 'compressed' binary form of Android XML docs
* such as for AndroidManifest.xml in .apk files
* Source: http://stackoverflow.com/questions/2097813/how-to-parse-the-androidmanifest-xml-file-inside-an-apk-package/4761689#4761689
*
* @param xml Encoded XML content to decompress
*/
public static String decompressXML(byte[] xml) {


StringBuilder resultXml = new StringBuilder();


// Compressed XML file/bytes starts with 24x bytes of data,
// 9 32 bit words in little endian order (LSB first):
//   0th word is 03 00 08 00
//   3rd word SEEMS TO BE:  Offset at then of StringTable
//   4th word is: Number of strings in string table
// WARNING: Sometime I indiscriminently display or refer to word in
//   little endian storage format, or in integer format (ie MSB first).
int numbStrings = LEW(xml, 4*4);


// StringIndexTable starts at offset 24x, an array of 32 bit LE offsets
// of the length/string data in the StringTable.
int sitOff = 0x24;  // Offset of start of StringIndexTable


// StringTable, each string is represented with a 16 bit little endian
// character count, followed by that number of 16 bit (LE) (Unicode) chars.
int stOff = sitOff + numbStrings*4;  // StringTable follows StrIndexTable


// XMLTags, The XML tag tree starts after some unknown content after the
// StringTable.  There is some unknown data after the StringTable, scan
// forward from this point to the flag for the start of an XML start tag.
int xmlTagOff = LEW(xml, 3*4);  // Start from the offset in the 3rd word.
// Scan forward until we find the bytes: 0x02011000(x00100102 in normal int)
for (int ii=xmlTagOff; ii<xml.length-4; ii+=4) {
if (LEW(xml, ii) == startTag) {
xmlTagOff = ii;  break;
}
} // end of hack, scanning for start of first start tag


// XML tags and attributes:
// Every XML start and end tag consists of 6 32 bit words:
//   0th word: 02011000 for startTag and 03011000 for endTag
//   1st word: a flag?, like 38000000
//   2nd word: Line of where this tag appeared in the original source file
//   3rd word: FFFFFFFF ??
//   4th word: StringIndex of NameSpace name, or FFFFFFFF for default NS
//   5th word: StringIndex of Element Name
//   (Note: 01011000 in 0th word means end of XML document, endDocTag)


// Start tags (not end tags) contain 3 more words:
//   6th word: 14001400 meaning??
//   7th word: Number of Attributes that follow this tag(follow word 8th)
//   8th word: 00000000 meaning??


// Attributes consist of 5 words:
//   0th word: StringIndex of Attribute Name's Namespace, or FFFFFFFF
//   1st word: StringIndex of Attribute Name
//   2nd word: StringIndex of Attribute Value, or FFFFFFF if ResourceId used
//   3rd word: Flags?
//   4th word: str ind of attr value again, or ResourceId of value


// TMP, dump string table to tr for debugging
//tr.addSelect("strings", null);
//for (int ii=0; ii<numbStrings; ii++) {
//  // Length of string starts at StringTable plus offset in StrIndTable
//  String str = compXmlString(xml, sitOff, stOff, ii);
//  tr.add(String.valueOf(ii), str);
//}
//tr.parent();


// Step through the XML tree element tags and attributes
int off = xmlTagOff;
int indent = 0;
int startTagLineNo = -2;
while (off < xml.length) {
int tag0 = LEW(xml, off);
//int tag1 = LEW(xml, off+1*4);
int lineNo = LEW(xml, off+2*4);
//int tag3 = LEW(xml, off+3*4);
int nameNsSi = LEW(xml, off+4*4);
int nameSi = LEW(xml, off+5*4);


if (tag0 == startTag) { // XML START TAG
int tag6 = LEW(xml, off+6*4);  // Expected to be 14001400
int numbAttrs = LEW(xml, off+7*4);  // Number of Attributes to follow
//int tag8 = LEW(xml, off+8*4);  // Expected to be 00000000
off += 9*4;  // Skip over 6+3 words of startTag data
String name = compXmlString(xml, sitOff, stOff, nameSi);
//tr.addSelect(name, null);
startTagLineNo = lineNo;


// Look for the Attributes
StringBuffer sb = new StringBuffer();
for (int ii=0; ii<numbAttrs; ii++) {
int attrNameNsSi = LEW(xml, off);  // AttrName Namespace Str Ind, or FFFFFFFF
int attrNameSi = LEW(xml, off+1*4);  // AttrName String Index
int attrValueSi = LEW(xml, off+2*4); // AttrValue Str Ind, or FFFFFFFF
int attrFlags = LEW(xml, off+3*4);
int attrResId = LEW(xml, off+4*4);  // AttrValue ResourceId or dup AttrValue StrInd
off += 5*4;  // Skip over the 5 words of an attribute


String attrName = compXmlString(xml, sitOff, stOff, attrNameSi);
String attrValue = attrValueSi!=-1
? compXmlString(xml, sitOff, stOff, attrValueSi)
: "resourceID 0x"+Integer.toHexString(attrResId);
sb.append(" "+attrName+"=\""+attrValue+"\"");
//tr.add(attrName, attrValue);
}
resultXml.append(prtIndent(indent, "<"+name+sb+">"));
indent++;


} else if (tag0 == endTag) { // XML END TAG
indent--;
off += 6*4;  // Skip over 6 words of endTag data
String name = compXmlString(xml, sitOff, stOff, nameSi);
resultXml.append(prtIndent(indent, "</"+name+">  (line "+startTagLineNo+"-"+lineNo+")"));
//tr.parent();  // Step back up the NobTree


} else if (tag0 == endDocTag) {  // END OF XML DOC TAG
break;


} else {
Log.e(TAG, "  Unrecognized tag code '"+Integer.toHexString(tag0)
+"' at offset "+off);
break;
}
} // end of while loop scanning tags and attributes of XML tree
Log.i(TAG, "    end at offset "+off);


return resultXml.toString();
} // end of decompressXML




/**
* Tool Method for decompressXML();
* Compute binary XML to its string format
* Source: Source: http://stackoverflow.com/questions/2097813/how-to-parse-the-androidmanifest-xml-file-inside-an-apk-package/4761689#4761689
*
* @param xml Binary-formatted XML
* @param sitOff
* @param stOff
* @param strInd
* @return String-formatted XML
*/
public static String compXmlString(byte[] xml, int sitOff, int stOff, int strInd) {
if (strInd < 0) return null;
int strOff = stOff + LEW(xml, sitOff+strInd*4);
return compXmlStringAt(xml, strOff);
}




/**
* Tool Method for decompressXML();
* Apply indentation
*
* @param indent Indentation level
* @param str String to indent
* @return Indented string
*/
public static String prtIndent(int indent, String str) {


return (spaces.substring(0, Math.min(indent*2, spaces.length()))+str);
}




/**
* Tool method for decompressXML()
* Return the string stored in StringTable format at
* offset strOff.  This offset points to the 16 bit string length, which
* is followed by that number of 16 bit (Unicode) chars.
*
* @param arr StringTable array
* @param strOff Offset to get string from
* @return String from StringTable at offset strOff
*
*/
public static String compXmlStringAt(byte[] arr, int strOff) {
int strLen = arr[strOff+1]<<8&0xff00 | arr[strOff]&0xff;
byte[] chars = new byte[strLen];
for (int ii=0; ii<strLen; ii++) {
chars[ii] = arr[strOff+2+ii*2];
}
return new String(chars);  // Hack, just use 8 byte chars
} // end of compXmlStringAt




/**
* Return value of a Little Endian 32 bit word from the byte array
*   at offset off.
*
* @param arr Byte array with 32 bit word
* @param off Offset to get word from
* @return Value of Little Endian 32 bit word specified
*/
public static int LEW(byte[] arr, int off) {
return arr[off+3]<<24&0xff000000 | arr[off+2]<<16&0xff0000
| arr[off+1]<<8&0xff00 | arr[off]&0xFF;
} // end of LEW

希望它也能帮助其他人。

我找到了 AXMLPrinter2,这是 Android4Me 项目的一个 Java 应用程序,可以很好地处理我的 AndroidManifest.XML (并以一种很好的格式打印出 XML)。 http://code.google.com/p/android4me/downloads/detail?name=AXMLPrinter2.jar

一个音符。.它(以及 Ribo 提供的答案中的代码)似乎不能处理我遇到的所有编译过的 XML 文件。我发现其中一个字符串以每个字符一个字节的形式存储,而不是它假定的双字节格式。

如何将来自 Android SDK 的 Android 资产打包工具(aapt)用于 Python (或其他)脚本?

实际上,可以通过 aapt (http://elinux.org/Android_aapt)检索有关 。 apk包及其 AndroidManifest.xml文件的信息。特别是,您可以通过 “转储”子命令提取 。 apk包中各个元素的值。例如,您可以这样解压 。 apk包中的 AndroidManifest.xml文件中的 用户权限:

$ aapt dump permissions package.apk

其中 Package.apk是您的 。 apk包。

此外,您可以使用 Unix 管道命令来清除输出:

$ aapt dump permissions package.apk | sed 1d | awk '{ print $NF }'

这里有一个 Python 脚本,可以通过编程实现:

import os
import subprocess


#Current directory and file name:
curpath = os.path.dirname( os.path.realpath(__file__) )
filepath = os.path.join(curpath, "package.apk")


#Extract the AndroidManifest.xml permissions:
command = "aapt dump permissions " + filepath + " | sed 1d | awk '{ print $NF }'"
process = subprocess.Popen(command, stdout=subprocess.PIPE, stderr=None, shell=True)
permissions = process.communicate()[0]


print permissions

以类似的方式,您可以提取 AndroidManifest.xml的其他信息(例如 包裹应用程序名称等) :

#Extract the APK package info:
shellcommand = "aapt dump badging " + filepath
process = subprocess.Popen(shellcommand, stdout=subprocess.PIPE, stderr=None, shell=True)
apkInfo = process.communicate()[0].splitlines()


for info in apkInfo:
#Package info:
if string.find(info, "package:", 0) != -1:
print "App Package: " + findBetween(info, "name='", "'")
print "App Version: " + findBetween(info, "versionName='", "'")
continue


#App name:
if string.find(info, "application:", 0) != -1:
print "App Name: " + findBetween(info, "label='", "'")
continue




def findBetween(s, prefix, suffix):
try:
start = s.index(prefix) + len(prefix)
end = s.index(suffix, start)
return s[start:end]
except ValueError:
return ""

如果你想解析整个 AndroidManifest XML 树,你可以用类似的方法使用 Xmltree命令:

aapt dump xmltree package.apk AndroidManifest.xml

像以前一样使用 Python:

#Extract the AndroidManifest XML tree:
shellcommand = "aapt dump xmltree " + filepath + " AndroidManifest.xml"
process = subprocess.Popen(shellcommand, stdout=subprocess.PIPE, stderr=None, shell=True)
xmlTree = process.communicate()[0]


print "Number of Activities: " + str(xmlTree.count("activity"))
print "Number of Services: " + str(xmlTree.count("service"))
print "Number of BroadcastReceivers: " + str(xmlTree.count("receiver"))

如果您使用 Python 或 安德鲁卫士,AndroGuard Androaxml 特性将为您执行此转换。该功能在 这篇博文中有详细介绍,还有附加的 文件来源在这里

用法:

$ ./androaxml.py -h
Usage: androaxml.py [options]


Options:
-h, --help            show this help message and exit
-i INPUT, --input=INPUT
filename input (APK or android's binary xml)
-o OUTPUT, --output=OUTPUT
filename output of the xml
-v, --version         version of the API


$ ./androaxml.py -i yourfile.apk -o output.xml
$ ./androaxml.py -i AndroidManifest.xml -o output.xml

Apk-parser https://github.com/caoqianli/apk-parser是 Java 的轻量级实现,不依赖于 aapt 或其他二进制文件,适用于解析二进制 xml 文件和其他 apk 信息。

ApkParser apkParser = new ApkParser(new File(filePath));
// set a locale to translate resource tag into specific strings in language the locale specified, you set locale to Locale.ENGLISH then get apk title 'WeChat' instead of '@string/app_name' for example
apkParser.setPreferredLocale(locale);


String xml = apkParser.getManifestXml();
System.out.println(xml);


String xml2 = apkParser.transBinaryXml(xmlPathInApk);
System.out.println(xml2);


ApkMeta apkMeta = apkParser.getApkMeta();
System.out.println(apkMeta);


Set<Locale> locales = apkParser.getLocales();
for (Locale l : locales) {
System.out.println(l);
}
apkParser.close();

在 Android 工作室2.2中,你可以直接分析 apk。去建立-分析 APK。选择 apk,导航到 androidManif.xml。你可以看到机器人清单的细节。

会有帮助的

public static int vCodeApk(String path) {
PackageManager pm = G.context.getPackageManager();
PackageInfo info = pm.getPackageArchiveInfo(path, 0);
return info.versionCode;
//        Toast.makeText(this, "VersionCode : " + info.versionCode + ", VersionName : " + info.versionName, Toast.LENGTH_LONG).show();
}

G 是我的应用类:

public class G extends Application {

我已经使用上面贴出的 Ribo 代码运行了一年多,它对我们很有帮助。不过,随着最近的更新(Gradle 3.x) ,我不再能够解析 AndroidManifest.xml,我得到的索引出界错误,一般来说,它不再能够解析文件。

我现在认为我们的问题是升级到3级。本文描述了 AirWatch 是如何出现问题的,并且可以通过使用 Gradle 设置来使用 aapt 而不是 aapt2 AirWatch 似乎与 Gradle3.0.0-beta1的 Android 插件不兼容来解决

在四处搜索的过程中,我偶然发现了这个开源项目,它正在被维护,我能够直奔主题,阅读我以前能够解析的旧的 APK 和新的 APK,Ribo 的逻辑抛出了异常

https://github.com/xgouchet/AXML

从他的例子来看,这就是我正在做的

  zf = new ZipFile(apkFile);


//Getting the manifest
ZipEntry entry = zf.getEntry("AndroidManifest.xml");
InputStream is = zf.getInputStream(entry);


// Read our manifest Document
Document manifestDoc = new CompressedXmlParser().parseDOM(is);


// Make sure we got a doc, and that it has children
if (null != manifestDoc && manifestDoc.getChildNodes().getLength() > 0) {
//
Node firstNode = manifestDoc.getFirstChild();


// Now get the attributes out of the node
NamedNodeMap nodeMap = firstNode.getAttributes();


// Finally to a point where we can read out our values
versionName = nodeMap.getNamedItem("android:versionName").getNodeValue();
versionCode = nodeMap.getNamedItem("android:versionCode").getNodeValue();
}

使用最新的 SDK-Tools,您现在可以使用名为 apkanalyzer 的工具来打印 APK 的 AndroidManifest.xml (以及其他部分,如资源)。

[android sdk]/tools/bin/apkanalyzer manifest print [app.apk]

一个 href = “ https://developer.android.com/Studio/command-line/apkanalyzer.html”rel = “ norefrer”title = “ apkanalyzer”> apkanalyzer

Apkanalyzer 会有帮助的

@echo off


::##############################################################################
::##
::##  apkanalyzer start up script for Windows
::##
::##  converted by ewwink
::##
::##############################################################################


::Attempt to set APP_HOME


SET SAVED=%cd%
SET APP_HOME=C:\android\sdk\tools
SET APP_NAME="apkanalyzer"


::Add default JVM options here. You can also use JAVA_OPTS and APKANALYZER_OPTS to pass JVM options to this script.
SET DEFAULT_JVM_OPTS=-Dcom.android.sdklib.toolsdir=%APP_HOME%


SET CLASSPATH=%APP_HOME%\lib\dvlib-26.0.0-dev.jar;%APP_HOME%\lib\util-2.2.1.jar;%APP_HOME%\lib\jimfs-1.1.jar;%APP_HOME%\lib\annotations-13.0.jar;%APP_HOME%\lib\ddmlib-26.0.0-dev.jar;%APP_HOME%\lib\repository-26.0.0-dev.jar;%APP_HOME%\lib\sdk-common-26.0.0-dev.jar;%APP_HOME%\lib\kotlin-stdlib-1.1.3-2.jar;%APP_HOME%\lib\protobuf-java-3.0.0.jar;%APP_HOME%\lib\apkanalyzer-cli.jar;%APP_HOME%\lib\gson-2.3.jar;%APP_HOME%\lib\httpcore-4.2.5.jar;%APP_HOME%\lib\dexlib2-2.2.1.jar;%APP_HOME%\lib\commons-compress-1.12.jar;%APP_HOME%\lib\generator.jar;%APP_HOME%\lib\error_prone_annotations-2.0.18.jar;%APP_HOME%\lib\commons-codec-1.6.jar;%APP_HOME%\lib\kxml2-2.3.0.jar;%APP_HOME%\lib\httpmime-4.1.jar;%APP_HOME%\lib\annotations-12.0.jar;%APP_HOME%\lib\bcpkix-jdk15on-1.56.jar;%APP_HOME%\lib\jsr305-3.0.0.jar;%APP_HOME%\lib\explainer.jar;%APP_HOME%\lib\builder-model-3.0.0-dev.jar;%APP_HOME%\lib\baksmali-2.2.1.jar;%APP_HOME%\lib\j2objc-annotations-1.1.jar;%APP_HOME%\lib\layoutlib-api-26.0.0-dev.jar;%APP_HOME%\lib\jcommander-1.64.jar;%APP_HOME%\lib\commons-logging-1.1.1.jar;%APP_HOME%\lib\annotations-26.0.0-dev.jar;%APP_HOME%\lib\builder-test-api-3.0.0-dev.jar;%APP_HOME%\lib\animal-sniffer-annotations-1.14.jar;%APP_HOME%\lib\bcprov-jdk15on-1.56.jar;%APP_HOME%\lib\httpclient-4.2.6.jar;%APP_HOME%\lib\common-26.0.0-dev.jar;%APP_HOME%\lib\jopt-simple-4.9.jar;%APP_HOME%\lib\sdklib-26.0.0-dev.jar;%APP_HOME%\lib\apkanalyzer.jar;%APP_HOME%\lib\shared.jar;%APP_HOME%\lib\binary-resources.jar;%APP_HOME%\lib\guava-22.0.jar


SET APP_ARGS=%*
::Collect all arguments for the java command, following the shell quoting and substitution rules
SET APKANALYZER_OPTS=%DEFAULT_JVM_OPTS% -classpath %CLASSPATH% com.android.tools.apk.analyzer.ApkAnalyzerCli %APP_ARGS%


::Determine the Java command to use to start the JVM.
SET JAVACMD="java"
where %JAVACMD% >nul 2>nul
if %errorlevel%==1 (
echo ERROR: 'java' command could be found in your PATH.
echo Please set the 'java' variable in your environment to match the
echo location of your Java installation.
echo.
exit /b 0
)


:: execute apkanalyzer


%JAVACMD% %APKANALYZER_OPTS%

原始后 https://stackoverflow.com/a/51905063/1383521

@ Mathieu Kotlin 版本如下:

fun main(args : Array<String>) {
val fileName = "app.apk"
ZipFile(fileName).use { zip ->
zip.entries().asSequence().forEach { entry ->
if(entry.name == "AndroidManifest.xml") {
zip.getInputStream(entry).use { input ->
val xml = decompressXML(input.readBytes())
//TODO: parse the XML
println(xml)


}
}
}
}
}


/**
* Binary XML doc ending Tag
*/
var endDocTag = 0x00100101


/**
* Binary XML start Tag
*/
var startTag = 0x00100102


/**
* Binary XML end Tag
*/
var endTag = 0x00100103




/**
* Reference var for spacing
* Used in prtIndent()
*/
var spaces = "                                             "




/**
* Parse the 'compressed' binary form of Android XML docs
* such as for AndroidManifest.xml in .apk files
* Source: http://stackoverflow.com/questions/2097813/how-to-parse-the-androidmanifest-xml-file-inside-an-apk-package/4761689#4761689
*
* @param xml Encoded XML content to decompress
*/
fun decompressXML(xml: ByteArray): String {


val resultXml = StringBuilder()


// Compressed XML file/bytes starts with 24x bytes of data,
// 9 32 bit words in little endian order (LSB first):
//   0th word is 03 00 08 00
//   3rd word SEEMS TO BE:  Offset at then of StringTable
//   4th word is: Number of strings in string table
// WARNING: Sometime I indiscriminently display or refer to word in
//   little endian storage format, or in integer format (ie MSB first).
val numbStrings = LEW(xml, 4 * 4)


// StringIndexTable starts at offset 24x, an array of 32 bit LE offsets
// of the length/string data in the StringTable.
val sitOff = 0x24  // Offset of start of StringIndexTable


// StringTable, each string is represented with a 16 bit little endian
// character count, followed by that number of 16 bit (LE) (Unicode) chars.
val stOff = sitOff + numbStrings * 4  // StringTable follows StrIndexTable


// XMLTags, The XML tag tree starts after some unknown content after the
// StringTable.  There is some unknown data after the StringTable, scan
// forward from this point to the flag for the start of an XML start tag.
var xmlTagOff = LEW(xml, 3 * 4)  // Start from the offset in the 3rd word.
// Scan forward until we find the bytes: 0x02011000(x00100102 in normal int)
run {
var ii = xmlTagOff
while (ii < xml.size - 4) {
if (LEW(xml, ii) == startTag) {
xmlTagOff = ii
break
}
ii += 4
}
} // end of hack, scanning for start of first start tag


// XML tags and attributes:
// Every XML start and end tag consists of 6 32 bit words:
//   0th word: 02011000 for startTag and 03011000 for endTag
//   1st word: a flag?, like 38000000
//   2nd word: Line of where this tag appeared in the original source file
//   3rd word: FFFFFFFF ??
//   4th word: StringIndex of NameSpace name, or FFFFFFFF for default NS
//   5th word: StringIndex of Element Name
//   (Note: 01011000 in 0th word means end of XML document, endDocTag)


// Start tags (not end tags) contain 3 more words:
//   6th word: 14001400 meaning??
//   7th word: Number of Attributes that follow this tag(follow word 8th)
//   8th word: 00000000 meaning??


// Attributes consist of 5 words:
//   0th word: StringIndex of Attribute Name's Namespace, or FFFFFFFF
//   1st word: StringIndex of Attribute Name
//   2nd word: StringIndex of Attribute Value, or FFFFFFF if ResourceId used
//   3rd word: Flags?
//   4th word: str ind of attr value again, or ResourceId of value


// TMP, dump string table to tr for debugging
//tr.addSelect("strings", null);
//for (int ii=0; ii<numbStrings; ii++) {
//  // Length of string starts at StringTable plus offset in StrIndTable
//  String str = compXmlString(xml, sitOff, stOff, ii);
//  tr.add(String.valueOf(ii), str);
//}
//tr.parent();


// Step through the XML tree element tags and attributes
var off = xmlTagOff
var indent = 0
var startTagLineNo = -2
while (off < xml.size) {
val tag0 = LEW(xml, off)
//int tag1 = LEW(xml, off+1*4);
val lineNo = LEW(xml, off + 2 * 4)
//int tag3 = LEW(xml, off+3*4);
val nameNsSi = LEW(xml, off + 4 * 4)
val nameSi = LEW(xml, off + 5 * 4)


if (tag0 == startTag) { // XML START TAG
val tag6 = LEW(xml, off + 6 * 4)  // Expected to be 14001400
val numbAttrs = LEW(xml, off + 7 * 4)  // Number of Attributes to follow
//int tag8 = LEW(xml, off+8*4);  // Expected to be 00000000
off += 9 * 4  // Skip over 6+3 words of startTag data
val name = compXmlString(xml, sitOff, stOff, nameSi)
//tr.addSelect(name, null);
startTagLineNo = lineNo


// Look for the Attributes
val sb = StringBuffer()
for (ii in 0 until numbAttrs) {
val attrNameNsSi = LEW(xml, off)  // AttrName Namespace Str Ind, or FFFFFFFF
val attrNameSi = LEW(xml, off + 1 * 4)  // AttrName String Index
val attrValueSi = LEW(xml, off + 2 * 4) // AttrValue Str Ind, or FFFFFFFF
val attrFlags = LEW(xml, off + 3 * 4)
val attrResId = LEW(xml, off + 4 * 4)  // AttrValue ResourceId or dup AttrValue StrInd
off += 5 * 4  // Skip over the 5 words of an attribute


val attrName = compXmlString(xml, sitOff, stOff, attrNameSi)
val attrValue = if (attrValueSi != -1)
compXmlString(xml, sitOff, stOff, attrValueSi)
else
"resourceID 0x" + Integer.toHexString(attrResId)
sb.append(" $attrName=\"$attrValue\"")
//tr.add(attrName, attrValue);
}
resultXml.append(prtIndent(indent, "<$name$sb>"))
indent++


} else if (tag0 == endTag) { // XML END TAG
indent--
off += 6 * 4  // Skip over 6 words of endTag data
val name = compXmlString(xml, sitOff, stOff, nameSi)
resultXml.append(prtIndent(indent, "</$name>  (line $startTagLineNo-$lineNo)"))
//tr.parent();  // Step back up the NobTree


} else if (tag0 == endDocTag) {  // END OF XML DOC TAG
break


} else {
println("  Unrecognized tag code '" + Integer.toHexString(tag0)
+ "' at offset " + off
)
break
}
} // end of while loop scanning tags and attributes of XML tree
println("    end at offset $off")


return resultXml.toString()
} // end of decompressXML




/**
* Tool Method for decompressXML();
* Compute binary XML to its string format
* Source: Source: http://stackoverflow.com/questions/2097813/how-to-parse-the-androidmanifest-xml-file-inside-an-apk-package/4761689#4761689
*
* @param xml Binary-formatted XML
* @param sitOff
* @param stOff
* @param strInd
* @return String-formatted XML
*/
fun compXmlString(xml: ByteArray, sitOff: Int, stOff: Int, strInd: Int): String? {
if (strInd < 0) return null
val strOff = stOff + LEW(xml, sitOff + strInd * 4)
return compXmlStringAt(xml, strOff)
}




/**
* Tool Method for decompressXML();
* Apply indentation
*
* @param indent Indentation level
* @param str String to indent
* @return Indented string
*/
fun prtIndent(indent: Int, str: String): String {


return spaces.substring(0, Math.min(indent * 2, spaces.length)) + str
}




/**
* Tool method for decompressXML()
* Return the string stored in StringTable format at
* offset strOff.  This offset points to the 16 bit string length, which
* is followed by that number of 16 bit (Unicode) chars.
*
* @param arr StringTable array
* @param strOff Offset to get string from
* @return String from StringTable at offset strOff
*/
fun compXmlStringAt(arr: ByteArray, strOff: Int): String {
val strLen = (arr[strOff + 1] shl (8 and 0xff00)) or (arr[strOff].toInt() and 0xff)
val chars = ByteArray(strLen)
for (ii in 0 until strLen) {
chars[ii] = arr[strOff + 2 + ii * 2]
}
return String(chars)  // Hack, just use 8 byte chars
} // end of compXmlStringAt




/**
* Return value of a Little Endian 32 bit word from the byte array
* at offset off.
*
* @param arr Byte array with 32 bit word
* @param off Offset to get word from
* @return Value of Little Endian 32 bit word specified
*/
fun LEW(arr: ByteArray, off: Int): Int {
return (arr[off + 3] shl 24 and -0x1000000 or ((arr[off + 2] shl 16) and 0xff0000)
or (arr[off + 1] shl 8 and 0xff00) or (arr[off].toInt() and 0xFF))
} // end of LEW


private infix fun Byte.shl(i: Int): Int = (this.toInt() shl i)
private infix fun Int.shl(i: Int): Int = (this shl i)

这是上面答案的 Kotlin 版本。