Python 版本是我把下面的 Java 代码交给 GPT 改写得到的,具体逻辑我自己也不太清楚。
Java版本(批量处理版)
package main.java.com.example.demo;
import java.io.*;
import java.util.Arrays;
import java.util.HashMap;
import java.util.LinkedHashMap;
import java.util.Map;
import java.util.concurrent.atomic.AtomicInteger;
import java.util.concurrent.atomic.AtomicReference;
/**
 * Batch decoder for files that were obfuscated by XOR-ing every byte with a single key byte.
 *
 * <p>For each file the first three bytes are compared against a table of known file signatures.
 * If one single value XOR-ed with those three bytes reproduces a signature, that value is taken
 * as the key and the signature's extension as the real file type. The whole file is then XOR-ed
 * with the key and written to the target directory. Sub-directories are processed recursively
 * and mirrored under the target directory.
 */
public class WxChatImgRevert2 {

    /** Number of leading bytes compared against each known signature. */
    private static final int HEADER_LENGTH = 3;

    /** Size of the copy buffer in bytes. */
    private static final int BUFFER_SIZE = 1024 * 10;

    /**
     * Known signatures (hex of the leading file bytes) mapped to a file extension.
     *
     * <p>Insertion-ordered on purpose: several signatures share their first three bytes
     * (e.g. zip/jar/docx, wav/avi), so the lookup must be "first registered wins" to be
     * deterministic instead of depending on hash order.
     */
    private static final Map<String, String> FILE_TYPE_MAP = new LinkedHashMap<String, String>();

    static {
        getAllFileType();
    }

    /**
     * Entry point.
     *
     * @param args optional: {@code args[0]} source directory, {@code args[1]} target directory;
     *             the built-in example paths are used for whichever argument is missing
     */
    public static void main(String[] args) {
        String path = args.length > 0
                ? args[0]
                : "C:\\Users\\Administrator\\Documents\\WeChat Files\\xxx\\FileStorage";
        String targetPath = args.length > 1 ? args[1] : "D:\\weChat\\temp";
        convert(path, targetPath);
    }

    /**
     * Decodes every file below {@code path} into {@code targetPath}.
     *
     * @param path       directory containing the obfuscated files
     * @param targetPath directory receiving the decoded files (created when missing)
     */
    private static void convert(String path, String targetPath) {
        if (!convertDirectory(new File(path), new File(targetPath))) {
            return;
        }
        // Printed once for the whole run rather than once per recursed directory.
        System.out.println("解析完毕!");
    }

    /**
     * Decodes one directory level and recurses into its sub-directories.
     *
     * @param sourceDir directory to read
     * @param targetDir directory to write to
     * @return {@code false} when the source could not be listed or the target could not be created
     */
    private static boolean convertDirectory(File sourceDir, File targetDir) {
        File[] entries = sourceDir.listFiles();
        if (entries == null) {
            System.err.println("无法读取目录:" + sourceDir.getPath());
            return false;
        }
        // mkdirs() returns false when the directory already exists, hence the second check.
        if (!targetDir.mkdirs() && !targetDir.isDirectory()) {
            System.err.println("无法创建目录:" + targetDir.getPath());
            return false;
        }

        // Count exactly the entries that are converted below so the progress can reach the total.
        final long size = Arrays.stream(entries).filter(entry -> !entry.isDirectory()).count();
        System.out.println("总共" + size + "个文件");

        // Resolved before the parallel phase so the result does not depend on thread scheduling.
        final int fallbackKey = findFallbackKey(entries);
        final AtomicInteger done = new AtomicInteger();

        Arrays.stream(entries).parallel().forEach(entry -> {
            if (entry.isDirectory()) {
                convertDirectory(entry, new File(targetDir, entry.getName()));
                return;
            }
            try {
                int key = convertFile(entry, targetDir, fallbackKey);
                System.out.println(entry.getName() + "(大小:" + ((double) entry.length() / 1000)
                        + "kb,异或值:" + key + ")," + "进度:" + done.incrementAndGet() + "/" + size);
            } catch (IOException | RuntimeException e) {
                // Best effort: one unreadable file must not abort the rest of the batch.
                System.err.println("转换失败:" + entry.getPath());
                e.printStackTrace();
            }
        });
        return true;
    }

    /**
     * Finds the key applied to files whose own type cannot be recognised.
     *
     * @param entries directory listing to scan
     * @return the first non-zero key detected on a regular file, or 0 when none is found
     */
    private static int findFallbackKey(File[] entries) {
        for (File entry : entries) {
            if (!entry.isFile()) {
                continue;
            }
            Object[] detected = getXor(entry);
            if (detected != null && detected[1] != null && (int) detected[1] != 0) {
                return (int) detected[1];
            }
        }
        return 0;
    }

    /**
     * Decodes a single file into {@code targetDir}.
     *
     * @param source      file to decode
     * @param targetDir   existing directory receiving the decoded file
     * @param fallbackKey key to use when the file's own key cannot be detected
     * @return the key that was applied
     * @throws IOException when reading or writing fails, or when the output would overwrite the source
     */
    private static int convertFile(File source, File targetDir, int fallbackKey) throws IOException {
        Object[] detected = getXor(source);
        int key = detected[1] != null ? (int) detected[1] : fallbackKey;
        String outputName = baseName(source.getName()) + (detected[0] != null ? "." + detected[0] : "");
        File target = new File(targetDir, outputName);
        if (target.getCanonicalFile().equals(source.getCanonicalFile())) {
            // Opening the output would truncate the input before it has been read.
            throw new IOException("输出文件与源文件相同:" + source.getPath());
        }

        byte[] buffer = new byte[BUFFER_SIZE];
        try (InputStream reader = new FileInputStream(source);
             OutputStream writer = new FileOutputStream(target)) {
            int count;
            while ((count = reader.read(buffer)) != -1) {
                for (int i = 0; i < count; i++) {
                    buffer[i] ^= key;
                }
                writer.write(buffer, 0, count);
            }
        }
        return key;
    }

    /**
     * Strips the last extension from a file name.
     *
     * @param fileName plain file name without directories
     * @return the name up to (excluding) its last dot; names without a dot, or whose only dot
     *         is the first character, are returned unchanged
     */
    private static String baseName(String fileName) {
        int dot = fileName.lastIndexOf('.');
        return dot > 0 ? fileName.substring(0, dot) : fileName;
    }

    /**
     * Detects the real type and XOR key of a file from its leading bytes.
     *
     * @param file file to inspect
     * @return {@code null} when {@code file} is {@code null}; otherwise a two-element array
     *         {@code [extension (String), key (Integer)]} whose elements are both {@code null}
     *         when the file is too short, unreadable, or matches no known signature
     */
    private static Object[] getXor(File file) {
        if (file == null) {
            return null;
        }
        byte[] header = new byte[HEADER_LENGTH];
        int filled = 0;
        try (InputStream reader = new FileInputStream(file)) {
            int count;
            // A single read() may return fewer bytes than requested, so loop until full or EOF.
            while (filled < header.length
                    && (count = reader.read(header, filled, header.length - filled)) != -1) {
                filled += count;
            }
        } catch (IOException e) {
            System.err.println("无法读取文件头:" + file.getPath());
            e.printStackTrace();
            return new Object[2];
        }
        // Pass only the bytes really read, so a short file is not matched as a run of zero bytes.
        return getXor(Arrays.copyOf(header, filled));
    }

    /**
     * Matches leading file bytes against the signature table.
     *
     * @param bytes leading bytes of a file; only the first three are used
     * @return a two-element array {@code [extension (String), key (Integer)]}; both elements are
     *         {@code null} when fewer than three bytes are given or no signature matches
     */
    private static Object[] getXor(byte[] bytes) {
        Object[] xorType = new Object[2];
        if (bytes == null || bytes.length < HEADER_LENGTH) {
            return xorType;
        }
        int first = bytes[0] & 0xFF;
        int second = bytes[1] & 0xFF;
        int third = bytes[2] & 0xFF;
        for (Map.Entry<String, String> type : FILE_TYPE_MAP.entrySet()) {
            String signature = type.getKey();
            int key = first ^ Integer.parseInt(signature.substring(0, 2), 16);
            // A signature matches when the same key maps all three bytes onto it.
            if (key == (second ^ Integer.parseInt(signature.substring(2, 4), 16))
                    && key == (third ^ Integer.parseInt(signature.substring(4, 6), 16))) {
                xorType[0] = type.getValue();
                xorType[1] = key;
                break;
            }
        }
        return xorType;
    }

    /**
     * Adds one signature to the table; a signature that is already present keeps its first
     * extension.
     *
     * @param signature hex string of the leading file bytes (at least three bytes)
     * @param extension file extension without the dot
     */
    private static void register(String signature, String extension) {
        if (signature.length() < HEADER_LENGTH * 2) {
            throw new IllegalArgumentException("signature too short: " + signature);
        }
        FILE_TYPE_MAP.putIfAbsent(signature, extension);
    }

    /** Fills the signature table. Order matters: the first matching entry wins. */
    private static void getAllFileType() {
        register("ffd8ffe000104a464946", "jpg"); // JPEG
        register("89504e470d0a1a0a0000", "png"); // PNG
        register("47494638396126026f01", "gif"); // GIF
        register("49492a00227105008037", "tif"); // TIFF
        register("424d228c010000000000", "bmp"); // 16-colour bitmap
        register("424d8240090000000000", "bmp"); // 24-bit bitmap
        register("424d8e1b030000000000", "bmp"); // 256-colour bitmap
        register("41433130313500000000", "dwg"); // CAD
        register("3c21444f435459504520", "html"); // HTML
        register("3c21646f637479706520", "htm"); // HTM
        register("48544d4c207b0d0a0942", "css"); // CSS
        register("696b2e71623d696b2e71", "js"); // JavaScript
        register("7b5c727466315c616e73", "rtf"); // Rich Text Format
        register("38425053000100000000", "psd"); // Photoshop
        register("46726f6d3a203d3f6762", "eml"); // Email (Outlook Express 6)
        register("d0cf11e0a1b11ae10000", "doc"); // Word, Excel and MSI share this header
        register("d0cf11e0a1b11ae10000", "vsd"); // Visio drawing; same header as doc, so ignored
        register("5374616E64617264204A", "mdb"); // MS Access
        register("252150532D41646F6265", "ps"); // PostScript
        register("255044462d312e360d25", "pdf"); // Adobe Acrobat
        register("2e524d46000000120001", "rmvb"); // rmvb and rm share this header
        register("464c5601050000000900", "flv"); // flv and f4v share this header
        register("00000020667479706973", "mp4"); // MP4
        register("49443303000000000f76", "mp3"); // MP3
        register("000001ba210001000180", "mpg"); // MPEG
        register("3026b2758e66cf11a6d9", "wmv"); // wmv and asf share this header
        register("524946464694c9015741", "wav"); // Wave
        register("52494646d07d60074156", "avi"); // AVI; same first three bytes as wav
        register("4d546864000000060001", "mid"); // MIDI
        register("504b0304140000000800", "zip"); // ZIP
        register("526172211a0700cf9073", "rar"); // RAR
        register("235468697320636f6e66", "ini"); // INI
        register("504b03040a0000000000", "jar"); // JAR; same first three bytes as zip
        register("4d5a9000030000000400", "exe"); // Windows executable
        register("3c25402070616765206c", "jsp"); // JSP
        register("4d616e69666573742d56", "mf"); // Manifest
        register("3c3f786d6c2076657273", "xml"); // XML
        register("efbbbf2f2a0d0a53514c", "sql"); // SQL script
        register("7061636b616765207765", "java"); // Java source
        register("406563686f206f66660d", "bat"); // Batch script
        register("1f8b0800000000000000", "gz"); // gzip
        register("6c6f67346a2e726f6f74", "properties"); // Properties file
        register("cafebabe0000002e0041", "class"); // Java class file
        register("49545346030000006000", "chm"); // Compiled HTML help
        register("04000000010000001300", "mxp"); // mxp
        register("504b0304140006000800", "docx"); // docx; same first three bytes as zip
        register("d0cf11e0a1b11ae10000", "wps"); // WPS wps/et/dps; same header as doc, so ignored
        register("6431303a637265617465", "torrent"); // BitTorrent
        register("494d4b48010100000200", "264"); // .264 video
        register("6D6F6F76", "mov"); // QuickTime
        register("FF575043", "wpd"); // WordPerfect
        register("CFAD12FEC5FD746F", "dbx"); // Outlook Express
        register("2142444E", "pst"); // Outlook
        register("AC9EBD8F", "qdf"); // Quicken
        register("E3828596", "pwl"); // Windows password list
        register("2E7261FD", "ram"); // Real Audio
    }
}
Python版本 (单文件处理版)
import os
# Known file signatures: hex string of a file's leading bytes -> file extension.
# get_xor() compares only the first three bytes (six hex digits) of each key and
# stops at the first entry that matches, so the order of the entries matters.
FILE_TYPE_MAP = {
"ffd8ffe000104a464946": "jpg", # JPEG
"89504e470d0a1a0a0000": "png", # PNG
"47494638396126026f01": "gif", # GIF
"49492a00227105008037": "tif", # TIFF
"424d228c010000000000": "bmp", # 16-colour bitmap
"424d8240090000000000": "bmp", # 24-bit bitmap
"424d8e1b030000000000": "bmp", # 256-colour bitmap
"41433130313500000000": "dwg", # CAD
"3c21444f435459504520": "html", # HTML
"3c21646f637479706520": "htm", # HTM
"48544d4c207b0d0a0942": "css", # CSS
"696b2e71623d696b2e71": "js", # JavaScript
"7b5c727466315c616e73": "rtf", # Rich Text Format
"38425053000100000000": "psd", # Photoshop
"46726f6d3a203d3f6762": "eml", # Email (Outlook Express 6)
"d0cf11e0a1b11ae10000": "doc", # Word, Excel and MSI share this header
# "d0cf11e0a1b11ae10000": "vsd", # Visio drawing (disabled: same key as "doc" above)
# "d0cf11e0a1b11ae10000": "wps", # WPS wps/et/dps (disabled: same key as "doc" above)
"5374616e64617264204a": "mdb", # MS Access
"252150532d41646f6265": "ps", # PostScript
"255044462d312e360d25": "pdf", # Adobe Acrobat
"2e524d46000000120001": "rmvb", # rmvb and rm share this header
"464c5601050000000900": "flv", # flv and f4v share this header
"00000020667479706973": "mp4", # MP4
"49443303000000000f76": "mp3", # MP3
"000001ba210001000180": "mpg", # MPEG
"3026b2758e66cf11a6d9": "wmv", # wmv and asf share this header
"524946464694c9015741": "wav", # Wave
"52494646d07d60074156": "avi", # AVI (same first three bytes as wav)
"4d546864000000060001": "mid", # MIDI
"504b0304140000000800": "zip", # ZIP
"526172211a0700cf9073": "rar", # RAR
"235468697320636f6e66": "ini", # INI
"504b03040a0000000000": "jar", # JAR (same first three bytes as zip)
"4d5a9000030000000400": "exe", # Windows executable
"3c25402070616765206c": "jsp", # JSP
"4d616e69666573742d56": "mf", # Manifest
"3c3f786d6c2076657273": "xml", # XML
"efbbbf2f2a0d0a53514c": "sql", # SQL script
"7061636b616765207765": "java", # Java source
"406563686f206f66660d": "bat", # Batch script
"1f8b0800000000000000": "gz", # gzip
"6c6f67346a2e726f6f74": "properties", # Properties file
"cafebabe0000002e0041": "class", # Java class file
"49545346030000006000": "chm", # Compiled HTML help
"04000000010000001300": "mxp", # mxp
"504b0304140006000800": "docx", # docx (same first three bytes as zip)
"6431303a637265617465": "torrent", # BitTorrent
"494d4b48010100000200": "264", # .264 video
"6d6f6f76": "mov", # QuickTime
"ff575043": "wpd", # WordPerfect
"cfad12fec5fd746f": "dbx", # Outlook Express
"2142444e": "pst", # Outlook
"ac9ebd8f": "qdf", # Quicken
"e3828596": "pwl", # Windows password list
"2e7261fd": "ram", # Real Audio
}
def get_xor(bytes_data, type_map=None):
    """Detect the file type and single-byte XOR key from a file's leading bytes.

    A signature matches when XOR-ing each of the first three bytes with the
    corresponding signature byte yields the same value; that value is the key.

    Args:
        bytes_data: Leading bytes of the file (``bytes`` or any sequence of
            ints in 0..255). Only the first three are used.
        type_map: Optional mapping of hex signature string -> extension.
            Defaults to the module-level ``FILE_TYPE_MAP``. Entries are tried
            in iteration order and the first match wins.

    Returns:
        A two-element list ``[extension, key]``. Both elements are ``None``
        when fewer than three bytes are given or no signature matches.
    """
    xor_type = [None, None]
    # Fewer than three bytes (e.g. an empty file) cannot match any signature;
    # return early instead of raising IndexError.
    if bytes_data is None or len(bytes_data) < 3:
        return xor_type
    if type_map is None:
        type_map = FILE_TYPE_MAP

    first, second, third = bytes_data[0], bytes_data[1], bytes_data[2]
    for signature, extension in type_map.items():
        key = first ^ int(signature[0:2], 16)
        if key == (second ^ int(signature[2:4], 16)) and key == (third ^ int(signature[4:6], 16)):
            xor_type[0] = extension
            xor_type[1] = key
            break
    return xor_type
def convert_file(file_path, target_path):
    """Decode one XOR-obfuscated file into ``target_path``.

    The key and real file type are detected from the first three bytes via
    ``get_xor``. When detection fails the key is 0 (the content is copied
    unchanged) and the source file's own extension is kept.

    Args:
        file_path: Path of the file to decode.
        target_path: Directory receiving the decoded file; created if missing.

    Returns:
        The path of the written file, or ``None`` when ``file_path`` is not a
        regular file or the output would overwrite the source itself.
    """
    # Validate the input before creating anything on disk.
    if not os.path.isfile(file_path):
        print(f"{file_path} is not a valid file.")
        return None
    os.makedirs(target_path, exist_ok=True)

    with open(file_path, 'rb') as f:
        header = f.read(3)
    # Files shorter than three bytes cannot be matched against a signature.
    xori = get_xor(header) if len(header) >= 3 else [None, None]
    xor_value = xori[1] if xori[1] is not None else 0

    stem, original_ext = os.path.splitext(os.path.basename(file_path))
    file_type = xori[0] if xori[0] else original_ext[1:]
    # Avoid a trailing "." when neither a detected nor an original extension exists.
    output_file_name = f"{stem}.{file_type}" if file_type else stem
    output_file_path = os.path.join(target_path, output_file_name)

    # Opening the output for writing would truncate the input before it is read.
    if os.path.exists(output_file_path) and os.path.samefile(file_path, output_file_path):
        print(f"Refusing to overwrite the source file: {file_path}")
        return None

    # Byte -> byte lookup table; translate() applies the XOR to a whole chunk at once.
    table = bytes(value ^ xor_value for value in range(256))
    with open(file_path, 'rb') as reader, open(output_file_path, 'wb') as writer:
        while chunk := reader.read(1024 * 10):
            writer.write(chunk.translate(table))
    print(f"Converted {file_path} to {output_file_path} with XOR value: {xor_value}")
    return output_file_path
if __name__ == "__main__":
    import sys

    # Usage: python <script> [source_file [target_dir]]
    # The example paths below are used for whichever argument is omitted.
    file_path = sys.argv[1] if len(sys.argv) > 1 else r"C:\Users\Admin\Desktop\image\1822231586051853196.dat"
    target_path = sys.argv[2] if len(sys.argv) > 2 else r"C:\Users\Admin\Desktop\jm"
    convert_file(file_path, target_path)