src/main/java/com/android/tools/r8/naming/MethodNameMinifier.java - r8 - Git at Google

 // Copyright (c) 2017, the R8 project authors. Please see the AUTHORS file
 // for details. All rights reserved. Use of this source code is governed by a
 // BSD-style license that can be found in the LICENSE file.
 package com.android.tools.r8.naming;

 import com.android.tools.r8.graph.DexCallSite;
 import com.android.tools.r8.graph.DexClass;
 import com.android.tools.r8.graph.DexEncodedMethod;
 import com.android.tools.r8.graph.DexMethod;
 import com.android.tools.r8.graph.DexProto;
 import com.android.tools.r8.graph.DexString;
 import com.android.tools.r8.graph.DexType;
 import com.android.tools.r8.shaking.Enqueuer.AppInfoWithLiveness;
 import com.android.tools.r8.shaking.RootSetBuilder.RootSet;
 import com.android.tools.r8.utils.InternalOptions;
 import com.android.tools.r8.utils.MethodJavaSignatureEquivalence;
 import com.android.tools.r8.utils.MethodSignatureEquivalence;
 import com.android.tools.r8.utils.Timing;
 import com.google.common.base.Equivalence;
 import com.google.common.base.Equivalence.Wrapper;
 import com.google.common.collect.Sets;
 import java.util.ArrayList;
 import java.util.Collections;
 import java.util.HashMap;
 import java.util.HashSet;
 import java.util.IdentityHashMap;
 import java.util.List;
 import java.util.Map;
 import java.util.Map.Entry;
 import java.util.Set;
 import java.util.function.Function;

 /**
  * A pass to rename methods using common, short names.
  * <p>
  * To assign names, we model the scopes of methods names and overloading/shadowing based on the
  * subtyping tree of classes. Such a naming scope is encoded by {@link NamingState}. It keeps
  * track of its parent node, names that have been reserved (due to keep annotations or otherwise)
  * and what names have been used for renaming so far.
  * <p>
  * As in the Dalvik VM method dispatch takes argument and return types of methods into account, we
  * can further reuse names if the prototypes of two methods differ. For this, we store the above
  * state separately for each proto using a map from protos to {@link NamingState.InternalState}
  * objects. These internal state objects are also linked.
  * <p>
  * Name assignment happens in 4 stages. In the first stage, we record all names that are used by
  * library classes or are flagged using a keep rule as reserved. This step also allocates the
  * {@link NamingState} objects for library classes. We can fully allocate these objects as we
  * never perform naming for library classes. For non-library classes, we only allocate a state
  * for the highest non-library class, i.e., we allocate states for every direct subtype of a library
  * class. The states at the boundary between library and program classes are referred to as the
  * frontier states in the code.
  * <p>
  * When reserving names in program classes, we reserve them in the state of the corresponding
  * frontier class. This is to ensure that the names are not used for renaming in any supertype.
  * Thus, they will still be available in the subtype where they are reserved. Note that name
  * reservation only blocks names from being used for minification. We assume that the input program
  * is correctly named.
  * <p>
  * In stage 2, we reserve names that stem from interfaces. These are not propagated to
  * subinterfaces or implementing classes. Instead, stage 3 makes sure to query related states when
  * making naming decisions.
  * <p>
  * In stage 3, we compute minified names for all interface methods. We do this first to reduce
  * assignment conflicts. Interfaces do not build a tree-like inheritance structure we can exploit.
  * Thus, we have to infer the structure on the fly. For this, we compute a sets of reachable
  * interfaces. i.e., interfaces that are related via subtyping. Based on these sets, we then
  * find, for each method signature, the classes and interfaces this method signature is defined in.
  * For classes, as we still use frontier states at this point, we do not have to consider subtype
  * relations. For interfaces, we reserve the name in all reachable interfaces and thus ensure
  * availability.
  * <p>
  * Name assignment in this phase is a search over all impacted naming states. Using the naming state
  * of the interface this method first originated from, we propose names until we find a matching
  * one. We use the naming state of the interface to not impact name availability in naming states of
  * classes. Hence, skipping over names during interface naming does not impact their availability in
  * the next phase.
  * <p>
  * In the final stage, we assign names to methods by traversing the subtype tree, now allocating
  * separate naming states for each class starting from the frontier. In the first swoop, we allocate
  * all non-private methods, updating naming states accordingly. In a second swoop, we then allocate
  * private methods, as those may safely use names that are used by a public method further down in
  * the subtyping tree.
  * <p>
  * Finally, the computed renamings are returned as a map from {@link DexMethod} to
  * {@link DexString}. The MethodNameMinifier object should not be retained to ensure all
  * intermediate state is freed.
  * <p>
  * TODO(herhut): Currently, we do not minify members of annotation interfaces, as this would require
  * parsing and minification of the string arguments to annotations.
  */
 class MethodNameMinifier extends MemberNameMinifier<DexMethod, DexProto> {

   private final Set<DexCallSite> desugaredCallSites;

   private final Equivalence<DexMethod> equivalence;
   private final Map<DexCallSite, DexString> callSiteRenaming = new IdentityHashMap<>();

   MethodNameMinifier(
       AppInfoWithLiveness appInfo,
       RootSet rootSet,
       Set<DexCallSite> desugaredCallSites,
       InternalOptions options) {
     super(appInfo, rootSet, options);
     this.desugaredCallSites = desugaredCallSites;
     equivalence =
         overloadAggressively
             ? MethodSignatureEquivalence.get()
             : MethodJavaSignatureEquivalence.get();
   }

   @Override
   Function<DexProto, ?> getKeyTransform() {
     if (overloadAggressively) {
       // Use the full proto as key, hence reuse names based on full signature.
       return a -> a;
     } else {
       // Only use the parameters as key, hence do not reuse names on return type.
       return proto -> proto.parameters;
     }
   }

   static class MethodRenaming {
     final Map<DexMethod, DexString> renaming;
     final Map<DexCallSite, DexString> callSiteRenaming;

     private MethodRenaming(
         Map<DexMethod, DexString> renaming, Map<DexCallSite, DexString> callSiteRenaming) {
       this.renaming = renaming;
       this.callSiteRenaming = callSiteRenaming;
     }
   }

   MethodRenaming computeRenaming(Timing timing) {
     // Phase 1: Reserve all the names that need to be kept and allocate linked state in the
     //          library part.
     timing.begin("Phase 1");
     Map<DexType, DexType> frontierMap = new IdentityHashMap<>();
     reserveNamesInClasses(appInfo.dexItemFactory.objectType,
         appInfo.dexItemFactory.objectType,
         null, frontierMap);
     timing.end();
     // Phase 2: Reserve all the names that are required for interfaces.
     timing.begin("Phase 2");
     DexType.forAllInterfaces(
         appInfo.dexItemFactory, iface -> reserveNamesInInterfaces(iface, frontierMap));
     timing.end();
     // Phase 3: Assign names to interface methods. These are assigned by finding a name that is
     //          free in all naming states that may hold an implementation.
     timing.begin("Phase 3");
     assignNamesToInterfaceMethods(frontierMap, timing);
     timing.end();
     // Phase 4: Assign names top-down by traversing the subtype hierarchy.
     timing.begin("Phase 4");
     assignNamesToClassesMethods(appInfo.dexItemFactory.objectType, false);
     timing.end();
     // Phase 4: Do the same for private methods.
     timing.begin("Phase 5");
     assignNamesToClassesMethods(appInfo.dexItemFactory.objectType, true);
     timing.end();

     return new MethodRenaming(renaming, callSiteRenaming);
   }

   private void assignNamesToClassesMethods(DexType type, boolean doPrivates) {
     DexClass holder = appInfo.definitionFor(type);
     if (holder != null && !holder.isLibraryClass()) {
       Map<Wrapper<DexMethod>, DexString> renamingAtThisLevel = new HashMap<>();
       NamingState<DexProto, ?> state =
           computeStateIfAbsent(type, k -> getState(holder.superType).createChild());
       for (DexEncodedMethod method : holder.allMethodsSorted()) {
         assignNameToMethod(method, state, renamingAtThisLevel, doPrivates);
       }
       if (!doPrivates && !useUniqueMemberNames) {
         renamingAtThisLevel.forEach(
             (key, candidate) -> {
               DexMethod method = key.get();
               state.addRenaming(method.name, method.proto, candidate);
             });
       }
     }
     type.forAllExtendsSubtypes(subtype -> assignNamesToClassesMethods(subtype, doPrivates));
   }

   private void assignNameToMethod(
       DexEncodedMethod encodedMethod,
       NamingState<DexProto, ?> state,
       Map<Wrapper<DexMethod>, DexString> renamingAtThisLevel,
       boolean doPrivates) {
     if (encodedMethod.accessFlags.isPrivate() != doPrivates) {
       return;
     }
     DexMethod method = encodedMethod.method;
     if (!state.isReserved(method.name, method.proto)
         && !encodedMethod.accessFlags.isConstructor()) {
       DexString renamedName =
           renamingAtThisLevel.computeIfAbsent(
               equivalence.wrap(method),
               key -> state.assignNewNameFor(method.name, method.proto, useUniqueMemberNames));
       renaming.put(method, renamedName);
     }
   }

   private Set<NamingState<DexProto, ?>> getReachableStates(DexType type,
       Map<DexType, DexType> frontierMap) {
     Set<DexType> interfaces = Sets.newIdentityHashSet();
     interfaces.add(type);
     collectSuperInterfaces(type, interfaces);
     collectSubInterfaces(type, interfaces);
     Set<NamingState<DexProto, ?>> reachableStates = new HashSet<>();
     for (DexType iface : interfaces) {
       // Add the interface itself
       reachableStates.add(getState(iface));
       // And the frontiers that correspond to the classes that implement the interface.
       iface.forAllImplementsSubtypes(t -> {
         NamingState<DexProto, ?> state = getState(frontierMap.get(t));
         assert state != null;
         reachableStates.add(state);
       });
     }
     return reachableStates;
   }

   private void assignNamesToInterfaceMethods(Map<DexType, DexType> frontierMap, Timing timing) {
     // First compute a map from method signatures to a set of naming states for interfaces and
     // frontier states of classes that implement them. We add the frontier states so that we can
     // reserve the names for later method naming.
     timing.begin("Compute map");
     // A map from DexMethods to all the states linked to interfaces they appear in.
     Map<Wrapper<DexMethod>, Set<NamingState<DexProto, ?>>> globalStateMap = new HashMap<>();
     // A map from DexMethods to all the definitions seen. Needed as the Wrapper equalizes them all.
     Map<Wrapper<DexMethod>, Set<DexMethod>> sourceMethodsMap = new HashMap<>();
     // A map from DexMethods to the first interface state it was seen in. Used to pick good names.
     Map<Wrapper<DexMethod>, NamingState<DexProto, ?>> originStates = new HashMap<>();
     DexType.forAllInterfaces(appInfo.dexItemFactory, iface -> {
       assert iface.isInterface();
       DexClass clazz = appInfo.definitionFor(iface);
       if (clazz != null) {
         Set<NamingState<DexProto, ?>> collectedStates = getReachableStates(iface, frontierMap);
         for (DexEncodedMethod method : shuffleMethods(clazz.methods())) {
           addStatesToGlobalMapForMethod(
               method, collectedStates, globalStateMap, sourceMethodsMap, originStates, iface);
         }
       }
     });
     // Collect the live call sites for multi-interface lambda expression renaming. For code with
     // desugared lambdas this is a conservative estimate, as we don't track if the generated
     // lambda classes survive into the output. As multi-interface lambda expressions are rare
     // this is not a big deal.
     Set<DexCallSite> liveCallSites = Sets.union(desugaredCallSites, appInfo.callSites);
     // If the input program contains a multi-interface lambda expression that implements
     // interface methods with different protos, we need to make sure that
     // the implemented lambda methods are renamed to the same name.
     // To achieve this, we map each DexCallSite that corresponds to a lambda expression to one of
     // the DexMethods it implements, and we unify the DexMethods that need to be renamed together.
     Map<DexCallSite, DexMethod> callSites = new IdentityHashMap<>();
     // Union-find structure to keep track of methods that must be renamed together.
     // Note that if the input does not use multi-interface lambdas,
     // unificationParent will remain empty.
     Map<Wrapper<DexMethod>, Wrapper<DexMethod>> unificationParent = new HashMap<>();
     liveCallSites.forEach(
         callSite -> {
           Set<Wrapper<DexMethod>> callSiteMethods = new HashSet<>();
           // Don't report errors, as the set of call sites is a conservative estimate, and can
           // refer to interfaces which has been removed.
           Set<DexEncodedMethod> implementedMethods =
               appInfo.lookupLambdaImplementedMethods(callSite);
           if (implementedMethods.isEmpty()) {
             return;
           }
           callSites.put(callSite, implementedMethods.iterator().next().method);
           for (DexEncodedMethod method : implementedMethods) {
             DexType iface = method.method.holder;
             assert iface.isInterface();
             Set<NamingState<DexProto, ?>> collectedStates = getReachableStates(iface, frontierMap);
             addStatesToGlobalMapForMethod(
                 method, collectedStates, globalStateMap, sourceMethodsMap, originStates, iface);
             callSiteMethods.add(equivalence.wrap(method.method));
           }
           if (callSiteMethods.size() > 1) {
             // Implemented interfaces have different return types. Unify them.
             Wrapper<DexMethod> mainKey = callSiteMethods.iterator().next();
             mainKey = unificationParent.getOrDefault(mainKey, mainKey);
             for (Wrapper<DexMethod> key : callSiteMethods) {
               unificationParent.put(key, mainKey);
             }
           }
         });
     Map<Wrapper<DexMethod>, Set<Wrapper<DexMethod>>> unification = new HashMap<>();
     for (Wrapper<DexMethod> key : unificationParent.keySet()) {
       // Find root with path-compression.
       Wrapper<DexMethod> root = unificationParent.get(key);
       while (unificationParent.get(root) != root) {
         Wrapper<DexMethod> k = unificationParent.get(unificationParent.get(root));
         unificationParent.put(root, k);
         root = k;
       }
       unification.computeIfAbsent(root, k -> new HashSet<>()).add(key);
     }
     timing.end();
     // Go over every method and assign a name.
     timing.begin("Allocate names");
     // Sort the methods by the number of dependent states, so that we use short names for methods
     // references in many places.
     List<Wrapper<DexMethod>> methods = new ArrayList<>(globalStateMap.keySet());
     methods.sort((a, b) -> globalStateMap.get(b).size() - globalStateMap.get(a).size());
     for (Wrapper<DexMethod> key : methods) {
       if (!unificationParent.getOrDefault(key, key).equals(key)) {
         continue;
       }
       List<MethodNamingState> collectedStates = new ArrayList<>();
       Set<DexMethod> sourceMethods = Sets.newIdentityHashSet();
       for (Wrapper<DexMethod> k : unification.getOrDefault(key, Collections.singleton(key))) {
         DexMethod unifiedMethod = k.get();
         assert unifiedMethod != null;
         sourceMethods.addAll(sourceMethodsMap.get(k));
         for (NamingState<DexProto, ?> namingState : globalStateMap.get(k)) {
           collectedStates.add(
               new MethodNamingState(namingState, unifiedMethod.name, unifiedMethod.proto));
         }
       }
       DexMethod method = key.get();
       assert method != null;
       MethodNamingState originState =
           new MethodNamingState(originStates.get(key), method.name, method.proto);
       assignNameForInterfaceMethodInAllStates(collectedStates, sourceMethods, originState);
     }
     for (Entry<DexCallSite, DexMethod> entry : callSites.entrySet()) {
       DexMethod method = entry.getValue();
       DexString renamed = renaming.get(method);
       if (originStates.get(equivalence.wrap(method)).isReserved(method.name, method.proto)) {
         assert renamed == null;
         callSiteRenaming.put(entry.getKey(), method.name);
       } else {
         assert renamed != null;
         callSiteRenaming.put(entry.getKey(), renamed);
       }
     }
     timing.end();
   }

   private void collectSuperInterfaces(DexType iface, Set<DexType> interfaces) {
     DexClass clazz = appInfo.definitionFor(iface);
     // In cases where we lack the interface's definition, we can at least look at subtypes and
     // tie those up to get proper naming.
     if (clazz != null) {
       for (DexType type : clazz.interfaces.values) {
         if (interfaces.add(type)) {
           collectSuperInterfaces(type, interfaces);
         }
       }
     }
   }

   private void collectSubInterfaces(DexType iface, Set<DexType> interfaces) {
     iface.forAllExtendsSubtypes(subtype -> {
       assert subtype.isInterface();
       if (interfaces.add(subtype)) {
         collectSubInterfaces(subtype, interfaces);
       }
     });
   }

   private void addStatesToGlobalMapForMethod(
       DexEncodedMethod method,
       Set<NamingState<DexProto, ?>> collectedStates,
       Map<Wrapper<DexMethod>, Set<NamingState<DexProto, ?>>> globalStateMap,
       Map<Wrapper<DexMethod>, Set<DexMethod>> sourceMethodsMap,
       Map<Wrapper<DexMethod>, NamingState<DexProto, ?>> originStates,
       DexType originInterface) {
     Wrapper<DexMethod> key = equivalence.wrap(method.method);
     Set<NamingState<DexProto, ?>> stateSet =
         globalStateMap.computeIfAbsent(key, k -> new HashSet<>());
     stateSet.addAll(collectedStates);
     sourceMethodsMap.computeIfAbsent(key, k -> new HashSet<>()).add(method.method);
     originStates.putIfAbsent(key, getState(originInterface));
   }

   private void assignNameForInterfaceMethodInAllStates(
       List<MethodNamingState> collectedStates,
       Set<DexMethod> sourceMethods,
       MethodNamingState originState) {
     if (anyIsReserved(collectedStates)) {
       // This method's name is reserved in at least one naming state, so reserve it everywhere.
       for (MethodNamingState state : collectedStates) {
         state.reserveName();
       }
       return;
     }
     // We use the origin state to allocate a name here so that we can reuse names between different
     // unrelated interfaces. This saves some space. The alternative would be to use a global state
     // for allocating names, which would save the work to search here.
     DexString previousCandidate = null;
     DexString candidate;
     do {
       candidate = originState.assignNewNameFor(false);
       // If the state returns the same candidate for two consecutive trials, it should be this case:
       //   1) an interface method with the same signature (name, param) but different return type
       //   has been already renamed; and 2) -useuniqueclassmembernames is set.
       // The option forces the naming state to return the same renamed name for the same signature.
       // So, here we break the loop in an ad-hoc manner.
       if (candidate != null && candidate == previousCandidate) {
         assert useUniqueMemberNames;
         break;
       }
       for (MethodNamingState state : collectedStates) {
         if (!state.isAvailable(candidate)) {
           previousCandidate = candidate;
           candidate = null;
           break;
         }
       }
     } while (candidate == null);
     for (MethodNamingState state : collectedStates) {
       state.addRenaming(candidate);
     }
     // Rename all methods in interfaces that gave rise to this renaming.
     for (DexMethod sourceMethod : sourceMethods) {
       renaming.put(sourceMethod, candidate);
     }
   }

   private boolean anyIsReserved(List<MethodNamingState> collectedStates) {
     DexString name = collectedStates.get(0).getName();
     Map<DexProto, Boolean> globalStateCache = new HashMap<>();
     for (MethodNamingState state : collectedStates) {
       assert state.getName() == name;
       if (globalStateCache.computeIfAbsent(
               state.getProto(), proto -> globalState.isReserved(name, proto))
           && state.isReserved()) {
         return true;
       }
     }
     return false;
   }

   private void reserveNamesInClasses(DexType type, DexType libraryFrontier,
       NamingState<DexProto, ?> parent,
       Map<DexType, DexType> frontierMap) {
     assert !type.isInterface();
     DexClass holder = appInfo.definitionFor(type);
     NamingState<DexProto, ?> state = allocateNamingStateAndReserve(holder, type, libraryFrontier,
         parent, frontierMap);
     // If this is a library class (or effectively a library class as it is missing) move the
     // frontier forward.
     type.forAllExtendsSubtypes(subtype -> {
       assert !subtype.isInterface();
       reserveNamesInClasses(subtype,
           holder == null || holder.isLibraryClass() ? subtype : libraryFrontier,
           state, frontierMap);
     });
   }

   private void reserveNamesInInterfaces(DexType type, Map<DexType, DexType> frontierMap) {
     assert type.isInterface();
     frontierMap.put(type, type);
     DexClass holder = appInfo.definitionFor(type);
     allocateNamingStateAndReserve(holder, type, type, null, frontierMap);
   }

   private NamingState<DexProto, ?> allocateNamingStateAndReserve(DexClass holder, DexType type,
       DexType libraryFrontier,
       NamingState<DexProto, ?> parent,
       Map<DexType, DexType> frontierMap) {
     frontierMap.put(type, libraryFrontier);
     NamingState<DexProto, ?> state =
         computeStateIfAbsent(
             libraryFrontier,
             ignore -> parent == null
                 ? NamingState.createRoot(
                     appInfo.dexItemFactory, dictionary, getKeyTransform(), useUniqueMemberNames)
                 : parent.createChild());
     if (holder != null) {
       boolean keepAll = holder.isLibraryClass() || holder.accessFlags.isAnnotation();
       for (DexEncodedMethod method : shuffleMethods(holder.methods())) {
         reserveNamesForMethod(method, keepAll, state);
       }
     }
     return state;
   }

   private void reserveNamesForMethod(DexEncodedMethod method,
       boolean keepAll, NamingState<DexProto, ?> state) {
     if (keepAll || rootSet.noObfuscation.contains(method)) {
       state.reserveName(method.method.name, method.method.proto);
       globalState.reserveName(method.method.name, method.method.proto);
     }
   }

   /**
    * Capture a (name, proto)-pair for a {@link NamingState}. Each method methodState.METHOD(...)
    * simply defers to parent.METHOD(name, proto, ...). This allows R8 to assign the same name to
    * methods with different prototypes, which is needed for multi-interface lambdas.
    */
   private static class MethodNamingState {

     private final NamingState<DexProto, ?> parent;
     private final DexString name;
     private final DexProto proto;

     MethodNamingState(NamingState<DexProto, ?> parent, DexString name, DexProto proto) {
       assert parent != null;
       this.parent = parent;
       this.name = name;
       this.proto = proto;
     }

     DexString assignNewNameFor(boolean markAsUsed) {
       return parent.assignNewNameFor(name, proto, markAsUsed);
     }

     void reserveName() {
       parent.reserveName(name, proto);
     }

     boolean isReserved() {
       return parent.isReserved(name, proto);
     }

     boolean isAvailable(DexString candidate) {
       return parent.isAvailable(name, proto, candidate);
     }

     void addRenaming(DexString newName) {
       parent.addRenaming(name, proto, newName);
     }

     DexString getName() {
       return name;
     }

     DexProto getProto() {
       return proto;
     }
   }

   // Shuffles the given methods if assertions are enabled and deterministic debugging is disabled.
   // Used to ensure that the generated output is deterministic.
   private Iterable<DexEncodedMethod> shuffleMethods(Iterable<DexEncodedMethod> methods) {
     return options.testing.irOrdering.order(methods);
   }
 }