From 59a0d2f09b034b5ee99879b0e9531899c37b8b32 Mon Sep 17 00:00:00 2001 From: Ben Gruver Date: Wed, 7 Jan 2015 17:14:44 -0800 Subject: [PATCH] Refactor ClassFileNameHandler This makes the logic quite a bit easier to follow, and fixes an issue with the previous implementatation, where it didn't correctly handle the case when were multiple long names that collided after being shortened Conflicts: brut.apktool.smali/util/src/main/java/ds/tree/DuplicateKeyException.java brut.apktool.smali/util/src/main/java/ds/tree/RadixTree.java brut.apktool.smali/util/src/main/java/ds/tree/RadixTreeImpl.java brut.apktool.smali/util/src/main/java/ds/tree/RadixTreeNode.java brut.apktool.smali/util/src/main/java/ds/tree/Visitor.java brut.apktool.smali/util/src/main/java/ds/tree/VisitorImpl.java --- .../org/jf/util/ClassFileNameHandler.java | 335 +++++++++--------- .../org/jf/util/ClassFileNameHandlerTest.java | 141 +++++++- 2 files changed, 306 insertions(+), 170 deletions(-) diff --git a/brut.apktool.smali/util/src/main/java/org/jf/util/ClassFileNameHandler.java b/brut.apktool.smali/util/src/main/java/org/jf/util/ClassFileNameHandler.java index 7ac77352..d67836d9 100644 --- a/brut.apktool.smali/util/src/main/java/org/jf/util/ClassFileNameHandler.java +++ b/brut.apktool.smali/util/src/main/java/org/jf/util/ClassFileNameHandler.java @@ -28,35 +28,62 @@ package org.jf.util; -import ds.tree.RadixTree; -import ds.tree.RadixTreeImpl; +import com.google.common.collect.ArrayListMultimap; +import com.google.common.collect.Multimap; import javax.annotation.Nonnull; +import javax.annotation.Nullable; import java.io.*; import java.nio.ByteBuffer; import java.nio.CharBuffer; import java.nio.IntBuffer; +import java.util.Collection; import java.util.regex.Pattern; /** - * This class checks for case-insensitive file systems, and generates file names based on a given class name, that are - * guaranteed to be unique. When "colliding" class names are found, it appends a numeric identifier to the end of the - * class name to distinguish it from another class with a name that differes only by case. i.e. a.smali and a_2.smali + * This class handles the complexities of translating a class name into a file name. i.e. dealing with case insensitive + * file systems, windows reserved filenames, class names with extremely long package/class elements, etc. + * + * The types of transformations this class does include: + * - append a '#123' style numeric suffix if 2 physical representations collide + * - replace some number of characters in the middle with a '#' character name if an individual path element is too long + * - append a '#' if an individual path element would otherwise be considered a reserved filename */ public class ClassFileNameHandler { - // we leave an extra 10 characters to allow for a numeric suffix to be added, if it's needed - private static final int MAX_FILENAME_LENGTH = 245; + private static final int MAX_FILENAME_LENGTH = 255; + // How many characters to reserve in the physical filename for numeric suffixes + // Dex files can currently only have 64k classes, so 5 digits plus 1 for an '#' should + // be sufficient to handle the case when every class has a conflicting name + private static final int NUMERIC_SUFFIX_RESERVE = 6; - private PackageNameEntry top; + private final int NO_VALUE = -1; + private final int CASE_INSENSITIVE = 0; + private final int CASE_SENSITIVE = 1; + private int forcedCaseSensitivity = NO_VALUE; + + private DirectoryEntry top; private String fileExtension; private boolean modifyWindowsReservedFilenames; public ClassFileNameHandler(File path, String fileExtension) { - this.top = new PackageNameEntry(path); + this.top = new DirectoryEntry(path); this.fileExtension = fileExtension; this.modifyWindowsReservedFilenames = testForWindowsReservedFileNames(path); } + // for testing + public ClassFileNameHandler(File path, String fileExtension, boolean caseSensitive, + boolean modifyWindowsReservedFilenames) { + this.top = new DirectoryEntry(path); + this.fileExtension = fileExtension; + this.forcedCaseSensitivity = caseSensitive?CASE_SENSITIVE:CASE_INSENSITIVE; + this.modifyWindowsReservedFilenames = modifyWindowsReservedFilenames; + } + + private int getMaxFilenameLength() { + return MAX_FILENAME_LENGTH - NUMERIC_SUFFIX_RESERVE; + } + public File getUniqueFilenameForClass(String className) { //class names should be passed in the normal dalvik style, with a leading L, a trailing ;, and using //'/' as a separator. @@ -71,7 +98,6 @@ public class ClassFileNameHandler { } } - String packageElement; String[] packageElements = new String[packageElementCount]; int elementIndex = 0; int elementStart = 1; @@ -83,18 +109,7 @@ public class ClassFileNameHandler { throw new RuntimeException("Not a valid dalvik class name"); } - packageElement = className.substring(elementStart, i); - - if (modifyWindowsReservedFilenames && isReservedFileName(packageElement)) { - packageElement += "#"; - } - - int utf8Length = utf8Length(packageElement); - if (utf8Length > MAX_FILENAME_LENGTH) { - packageElement = shortenPathComponent(packageElement, utf8Length - MAX_FILENAME_LENGTH); - } - - packageElements[elementIndex++] = packageElement; + packageElements[elementIndex++] = className.substring(elementStart, i); elementStart = ++i; } } @@ -107,19 +122,29 @@ public class ClassFileNameHandler { throw new RuntimeException("Not a valid dalvik class name"); } - packageElement = className.substring(elementStart, className.length()-1); - if (modifyWindowsReservedFilenames && isReservedFileName(packageElement)) { - packageElement += "#"; + packageElements[elementIndex] = className.substring(elementStart, className.length()-1); + + return addUniqueChild(top, packageElements, 0); + } + + @Nonnull + private File addUniqueChild(@Nonnull DirectoryEntry parent, @Nonnull String[] packageElements, + int packageElementIndex) { + if (packageElementIndex == packageElements.length - 1) { + FileEntry fileEntry = new FileEntry(parent, packageElements[packageElementIndex] + fileExtension); + parent.addChild(fileEntry); + + String physicalName = fileEntry.getPhysicalName(); + + // the physical name should be set when adding it as a child to the parent + assert physicalName != null; + + return new File(parent.file, physicalName); + } else { + DirectoryEntry directoryEntry = new DirectoryEntry(parent, packageElements[packageElementIndex]); + directoryEntry = (DirectoryEntry)parent.addChild(directoryEntry); + return addUniqueChild(directoryEntry, packageElements, packageElementIndex+1); } - - int utf8Length = utf8Length(packageElement) + utf8Length(fileExtension); - if (utf8Length > MAX_FILENAME_LENGTH) { - packageElement = shortenPathComponent(packageElement, utf8Length - MAX_FILENAME_LENGTH); - } - - packageElements[elementIndex] = packageElement; - - return top.addUniqueChild(packageElements, 0); } private static int utf8Length(String str) { @@ -167,7 +192,6 @@ public class ClassFileNameHandler { } int midPoint = codePoints.length/2; - int delta = 0; int firstEnd = midPoint; // exclusive int secondStart = midPoint+1; // inclusive @@ -228,166 +252,133 @@ public class ClassFileNameHandler { return false; } - private static Pattern reservedFileNameRegex = Pattern.compile("^CON|PRN|AUX|NUL|COM[1-9]|LPT[1-9]$", + private static Pattern reservedFileNameRegex = Pattern.compile("^(CON|PRN|AUX|NUL|COM[1-9]|LPT[1-9])(\\..*)?$", Pattern.CASE_INSENSITIVE); private static boolean isReservedFileName(String className) { return reservedFileNameRegex.matcher(className).matches(); } private abstract class FileSystemEntry { - public final File file; + @Nullable public final DirectoryEntry parent; + @Nonnull public final String logicalName; + @Nullable protected String physicalName = null; - public FileSystemEntry(File file) { - this.file = file; + private FileSystemEntry(@Nullable DirectoryEntry parent, @Nonnull String logicalName) { + this.parent = parent; + this.logicalName = logicalName; } - public abstract File addUniqueChild(String[] pathElements, int pathElementsIndex); + @Nonnull public String getNormalizedName(boolean preserveCase) { + String elementName = logicalName; + if (!preserveCase && parent != null && !parent.isCaseSensitive()) { + elementName = elementName.toLowerCase(); + } - public FileSystemEntry makeVirtual(File parent) { - return new VirtualGroupEntry(this, parent); + if (modifyWindowsReservedFilenames && isReservedFileName(elementName)) { + elementName = addSuffixBeforeExtension(elementName, "#"); + } + + int utf8Length = utf8Length(elementName); + if (utf8Length > getMaxFilenameLength()) { + elementName = shortenPathComponent(elementName, utf8Length - getMaxFilenameLength()); + } + return elementName; } + + @Nullable + public String getPhysicalName() { + return physicalName; + } + + public void setSuffix(int suffix) { + if (suffix < 0 || suffix > 99999) { + throw new IllegalArgumentException("suffix must be in [0, 100000)"); + } + + if (this.physicalName != null) { + throw new IllegalStateException("The suffix can only be set once"); + } + this.physicalName = makePhysicalName(suffix); + } + + protected abstract String makePhysicalName(int suffix); } - private class PackageNameEntry extends FileSystemEntry { - //this contains the FileSystemEntries for all of this package's children - //the associated keys are all lowercase - private RadixTree children = new RadixTreeImpl(); + private class DirectoryEntry extends FileSystemEntry { + @Nullable private File file = null; + private int caseSensitivity = forcedCaseSensitivity; - public PackageNameEntry(File parent, String name) { - super(new File(parent, name)); + // maps a normalized (but not suffixed) entry name to 1 or more FileSystemEntries. + // Each FileSystemEntry asociated with a normalized entry name must have a distinct + // physical name + private final Multimap children = ArrayListMultimap.create(); + + public DirectoryEntry(@Nonnull File path) { + super(null, path.getName()); + file = path; + physicalName = file.getName(); } - public PackageNameEntry(File path) { - super(path); + public DirectoryEntry(@Nullable DirectoryEntry parent, @Nonnull String logicalName) { + super(parent, logicalName); } - @Override - public synchronized File addUniqueChild(String[] pathElements, int pathElementsIndex) { - String elementName; - String elementNameLower; - - if (pathElementsIndex == pathElements.length - 1) { - elementName = pathElements[pathElementsIndex]; - elementName += fileExtension; - } else { - elementName = pathElements[pathElementsIndex]; - } - elementNameLower = elementName.toLowerCase(); - - FileSystemEntry existingEntry = children.find(elementNameLower); - if (existingEntry != null) { - FileSystemEntry virtualEntry = existingEntry; - //if there is already another entry with the same name but different case, we need to - //add a virtual group, and then add the existing entry and the new entry to that group - if (!(existingEntry instanceof VirtualGroupEntry)) { - if (existingEntry.file.getName().equals(elementName)) { - if (pathElementsIndex == pathElements.length - 1) { - return existingEntry.file; - } else { - return existingEntry.addUniqueChild(pathElements, pathElementsIndex + 1); - } - } else { - virtualEntry = existingEntry.makeVirtual(file); - children.replace(elementNameLower, virtualEntry); + public FileSystemEntry addChild(FileSystemEntry entry) { + String normalizedChildName = entry.getNormalizedName(false); + Collection entries = children.get(normalizedChildName); + if (entry instanceof DirectoryEntry) { + for (FileSystemEntry childEntry: entries) { + if (childEntry.logicalName.equals(entry.logicalName)) { + return childEntry; } } - - return virtualEntry.addUniqueChild(pathElements, pathElementsIndex); } - - if (pathElementsIndex == pathElements.length - 1) { - ClassNameEntry classNameEntry = new ClassNameEntry(file, elementName); - children.insert(elementNameLower, classNameEntry); - return classNameEntry.file; - } else { - PackageNameEntry packageNameEntry = new PackageNameEntry(file, elementName); - children.insert(elementNameLower, packageNameEntry); - return packageNameEntry.addUniqueChild(pathElements, pathElementsIndex + 1); - } - } - } - - /** - * A virtual group that groups together file system entries with the same name, differing only in case - */ - private class VirtualGroupEntry extends FileSystemEntry { - //this contains the FileSystemEntries for all of the files/directories in this group - //the key is the unmodified name of the entry, before it is modified to be made unique (if needed). - private RadixTree groupEntries = new RadixTreeImpl(); - - //whether the containing directory is case sensitive or not. - //-1 = unset - //0 = false; - //1 = true; - private int isCaseSensitive = -1; - - public VirtualGroupEntry(FileSystemEntry firstChild, File parent) { - super(parent); - - //use the name of the first child in the group as-is - groupEntries.insert(firstChild.file.getName(), firstChild); + entry.setSuffix(entries.size()); + entries.add(entry); + return entry; } @Override - public File addUniqueChild(String[] pathElements, int pathElementsIndex) { - String elementName = pathElements[pathElementsIndex]; - - if (pathElementsIndex == pathElements.length - 1) { - elementName = elementName + fileExtension; + protected String makePhysicalName(int suffix) { + if (suffix > 0) { + return getNormalizedName(true) + "." + Integer.toString(suffix); } + return getNormalizedName(true); + } - FileSystemEntry existingEntry = groupEntries.find(elementName); - if (existingEntry != null) { - if (pathElementsIndex == pathElements.length - 1) { - return existingEntry.file; - } else { - return existingEntry.addUniqueChild(pathElements, pathElementsIndex+1); - } - } - - if (pathElementsIndex == pathElements.length - 1) { - String fileName; - if (!isCaseSensitive()) { - fileName = pathElements[pathElementsIndex] + "." + (groupEntries.getSize()+1) + fileExtension; - } else { - fileName = elementName; - } - - ClassNameEntry classNameEntry = new ClassNameEntry(file, fileName); - groupEntries.insert(elementName, classNameEntry); - return classNameEntry.file; - } else { - String fileName; - if (!isCaseSensitive()) { - fileName = pathElements[pathElementsIndex] + "." + (groupEntries.getSize()+1); - } else { - fileName = elementName; - } - - PackageNameEntry packageNameEntry = new PackageNameEntry(file, fileName); - groupEntries.insert(elementName, packageNameEntry); - return packageNameEntry.addUniqueChild(pathElements, pathElementsIndex + 1); + @Override + public void setSuffix(int suffix) { + super.setSuffix(suffix); + String physicalName = getPhysicalName(); + if (parent != null && physicalName != null) { + file = new File(parent.file, physicalName); } } - private boolean isCaseSensitive() { - if (isCaseSensitive != -1) { - return isCaseSensitive == 1; + protected boolean isCaseSensitive() { + if (getPhysicalName() == null || file == null) { + throw new IllegalStateException("Must call setSuffix() first"); + } + + if (caseSensitivity != NO_VALUE) { + return caseSensitivity == CASE_SENSITIVE; } File path = file; - if (path.exists() && path.isFile()) { - path = path.getParentFile(); + if (!path.delete()) { + throw new ExceptionWithContext("Can't delete %s to make it into a directory", + path.getAbsolutePath()); + } } - if ((!file.exists() && !file.mkdirs())) { - return false; + if (!path.exists() && !path.mkdirs()) { + throw new ExceptionWithContext("Couldn't create directory %s", path.getAbsolutePath()); } try { boolean result = testCaseSensitivity(path); - isCaseSensitive = result?1:0; + caseSensitivity = result?CASE_SENSITIVE:CASE_INSENSITIVE; return result; } catch (IOException ex) { return false; @@ -447,22 +438,34 @@ public class ClassFileNameHandler { try { f2.delete(); } catch (Exception ex) {} } } + } + + private class FileEntry extends FileSystemEntry { + private FileEntry(@Nullable DirectoryEntry parent, @Nonnull String logicalName) { + super(parent, logicalName); + } @Override - public FileSystemEntry makeVirtual(File parent) { - return this; + protected String makePhysicalName(int suffix) { + if (suffix > 0) { + return addSuffixBeforeExtension(getNormalizedName(true), '.' + Integer.toString(suffix)); + } + return getNormalizedName(true); } } - private class ClassNameEntry extends FileSystemEntry { - public ClassNameEntry(File parent, String name) { - super(new File(parent, name)); - } + private static String addSuffixBeforeExtension(String pathElement, String suffix) { + int extensionStart = pathElement.lastIndexOf('.'); - @Override - public File addUniqueChild(String[] pathElements, int pathElementsIndex) { - assert false; - return file; + StringBuilder newName = new StringBuilder(pathElement.length() + suffix.length() + 1); + if (extensionStart < 0) { + newName.append(pathElement); + newName.append(suffix); + } else { + newName.append(pathElement.subSequence(0, extensionStart)); + newName.append(suffix); + newName.append(pathElement.subSequence(extensionStart, pathElement.length())); } + return newName.toString(); } } diff --git a/brut.apktool.smali/util/src/test/java/org/jf/util/ClassFileNameHandlerTest.java b/brut.apktool.smali/util/src/test/java/org/jf/util/ClassFileNameHandlerTest.java index e3dfd154..125fbd2f 100644 --- a/brut.apktool.smali/util/src/test/java/org/jf/util/ClassFileNameHandlerTest.java +++ b/brut.apktool.smali/util/src/test/java/org/jf/util/ClassFileNameHandlerTest.java @@ -31,9 +31,12 @@ package org.jf.util; +import com.google.common.base.Strings; +import com.google.common.io.Files; import junit.framework.Assert; import org.junit.Test; +import java.io.File; import java.nio.charset.Charset; public class ClassFileNameHandlerTest { @@ -91,6 +94,7 @@ public class ClassFileNameHandlerTest { Assert.assertEquals(98, result.length()); } + @Test public void test4ByteEncodings() { StringBuilder sb = new StringBuilder(); for (int i=0x10000; i<0x10000+100; i++) { @@ -101,12 +105,141 @@ public class ClassFileNameHandlerTest { String result = ClassFileNameHandler.shortenPathComponent(sb.toString(), 8); Assert.assertEquals(400, sb.toString().getBytes(UTF8).length); Assert.assertEquals(389, result.getBytes(UTF8).length); - Assert.assertEquals(98, result.length()); + Assert.assertEquals(195, result.length()); - // we remove 3 codepoints == 6 characters == 12 bytes, and then add back in the 1-byte '#' + // we remove 2 codepoints == 4 characters == 8 bytes, and then add back in the 1-byte '#' result = ClassFileNameHandler.shortenPathComponent(sb.toString(), 7); Assert.assertEquals(400, sb.toString().getBytes(UTF8).length); - Assert.assertEquals(3892, result.getBytes(UTF8).length); - Assert.assertEquals(98, result.length()); + Assert.assertEquals(393, result.getBytes(UTF8).length); + Assert.assertEquals(197, result.length()); + } + + @Test + public void testMultipleLongNames() { + String filenameFragment = Strings.repeat("a", 512); + + File tempDir = Files.createTempDir(); + ClassFileNameHandler handler = new ClassFileNameHandler(tempDir, ".smali"); + + // put the differentiating character in the middle, where it will get stripped out by the filename shortening + // logic + File file1 = handler.getUniqueFilenameForClass("La/a/" + filenameFragment + "1" + filenameFragment + ";"); + checkFilename(tempDir, file1, "a", "a", Strings.repeat("a", 124) + "#" + Strings.repeat("a", 118) + ".smali"); + + File file2 = handler.getUniqueFilenameForClass("La/a/" + filenameFragment + "2" + filenameFragment + ";"); + checkFilename(tempDir, file2, "a", "a", Strings.repeat("a", 124) + "#" + Strings.repeat("a", 118) + ".1.smali"); + + Assert.assertFalse(file1.getAbsolutePath().equals(file2.getAbsolutePath())); + } + + @Test + public void testBasicFunctionality() { + File tempDir = Files.createTempDir(); + ClassFileNameHandler handler = new ClassFileNameHandler(tempDir, ".smali"); + + File file = handler.getUniqueFilenameForClass("La/b/c/d;"); + checkFilename(tempDir, file, "a", "b", "c", "d.smali"); + + file = handler.getUniqueFilenameForClass("La/b/c/e;"); + checkFilename(tempDir, file, "a", "b", "c", "e.smali"); + + file = handler.getUniqueFilenameForClass("La/b/d/d;"); + checkFilename(tempDir, file, "a", "b", "d", "d.smali"); + + file = handler.getUniqueFilenameForClass("La/b;"); + checkFilename(tempDir, file, "a", "b.smali"); + + file = handler.getUniqueFilenameForClass("Lb;"); + checkFilename(tempDir, file, "b.smali"); + } + + @Test + public void testCaseInsensitiveFilesystem() { + File tempDir = Files.createTempDir(); + ClassFileNameHandler handler = new ClassFileNameHandler(tempDir, ".smali", false, false); + + File file = handler.getUniqueFilenameForClass("La/b/c;"); + checkFilename(tempDir, file, "a", "b", "c.smali"); + + file = handler.getUniqueFilenameForClass("La/b/C;"); + checkFilename(tempDir, file, "a", "b", "C.1.smali"); + + file = handler.getUniqueFilenameForClass("La/B/c;"); + checkFilename(tempDir, file, "a", "B.1", "c.smali"); + } + + @Test + public void testCaseSensitiveFilesystem() { + File tempDir = Files.createTempDir(); + ClassFileNameHandler handler = new ClassFileNameHandler(tempDir, ".smali", true, false); + + File file = handler.getUniqueFilenameForClass("La/b/c;"); + checkFilename(tempDir, file, "a", "b", "c.smali"); + + file = handler.getUniqueFilenameForClass("La/b/C;"); + checkFilename(tempDir, file, "a", "b", "C.smali"); + + file = handler.getUniqueFilenameForClass("La/B/c;"); + checkFilename(tempDir, file, "a", "B", "c.smali"); + } + + @Test + public void testWindowsReservedFilenames() { + File tempDir = Files.createTempDir(); + ClassFileNameHandler handler = new ClassFileNameHandler(tempDir, ".smali", false, true); + + File file = handler.getUniqueFilenameForClass("La/con/c;"); + checkFilename(tempDir, file, "a", "con#", "c.smali"); + + file = handler.getUniqueFilenameForClass("La/Con/c;"); + checkFilename(tempDir, file, "a", "Con#.1", "c.smali"); + + file = handler.getUniqueFilenameForClass("La/b/PRN;"); + checkFilename(tempDir, file, "a", "b", "PRN#.smali"); + + file = handler.getUniqueFilenameForClass("La/b/prN;"); + checkFilename(tempDir, file, "a", "b", "prN#.1.smali"); + + file = handler.getUniqueFilenameForClass("La/b/com0;"); + checkFilename(tempDir, file, "a", "b", "com0.smali"); + + for (String reservedName: new String[] {"con", "prn", "aux", "nul", "com1", "com9", "lpt1", "lpt9"}) { + file = handler.getUniqueFilenameForClass("L" + reservedName + ";"); + checkFilename(tempDir, file, reservedName +"#.smali"); + } + } + + @Test + public void testIgnoringWindowsReservedFilenames() { + File tempDir = Files.createTempDir(); + ClassFileNameHandler handler = new ClassFileNameHandler(tempDir, ".smali", true, false); + + File file = handler.getUniqueFilenameForClass("La/con/c;"); + checkFilename(tempDir, file, "a", "con", "c.smali"); + + file = handler.getUniqueFilenameForClass("La/Con/c;"); + checkFilename(tempDir, file, "a", "Con", "c.smali"); + + file = handler.getUniqueFilenameForClass("La/b/PRN;"); + checkFilename(tempDir, file, "a", "b", "PRN.smali"); + + file = handler.getUniqueFilenameForClass("La/b/prN;"); + checkFilename(tempDir, file, "a", "b", "prN.smali"); + + file = handler.getUniqueFilenameForClass("La/b/com0;"); + checkFilename(tempDir, file, "a", "b", "com0.smali"); + + for (String reservedName: new String[] {"con", "prn", "aux", "nul", "com1", "com9", "lpt1", "lpt9"}) { + file = handler.getUniqueFilenameForClass("L" + reservedName + ";"); + checkFilename(tempDir, file, reservedName +".smali"); + } + } + + private void checkFilename(File base, File file, String... elements) { + for (int i=elements.length-1; i>=0; i--) { + Assert.assertEquals(elements[i], file.getName()); + file = file.getParentFile(); + } + Assert.assertEquals(base.getAbsolutePath(), file.getAbsolutePath()); } }