Home | History | Annotate | Download | only in src
      1 /*
      2  * Copyright (C) 2016 The Android Open Source Project
      3  *
      4  * Licensed under the Apache License, Version 2.0 (the "License");
      5  * you may not use this file except in compliance with the License.
      6  * You may obtain a copy of the License at
      7  *
      8  *      http://www.apache.org/licenses/LICENSE-2.0
      9  *
     10  * Unless required by applicable law or agreed to in writing, software
     11  * distributed under the License is distributed on an "AS IS" BASIS,
     12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
     13  * See the License for the specific language governing permissions and
     14  * limitations under the License.
     15  */
     16 
     17 #include "Preprocessor.h"
     18 
     19 #include <err.h>
     20 #include <fcntl.h>
     21 #include <fts.h>
     22 #include <libgen.h>
     23 #include <string.h>
     24 #include <sys/stat.h>
     25 #include <sys/types.h>
     26 #include <unistd.h>
     27 
     28 #include <deque>
     29 #include <fstream>
     30 #include <string>
     31 #include <unordered_map>
     32 
     33 #include <llvm/ADT/StringRef.h>
     34 #include <llvm/ADT/Twine.h>
     35 #include <llvm/Support/FileSystem.h>
     36 #include <llvm/Support/Path.h>
     37 
     38 #include "Arch.h"
     39 #include "DeclarationDatabase.h"
     40 #include "versioner.h"
     41 
     42 using namespace std::string_literals;
     43 
     44 static DeclarationAvailability calculateRequiredGuard(const Declaration& declaration) {
     45   // To avoid redundant macro guards, the availability calculated by this function is the set
     46   // difference of 'targets marked-available' from 'targets the declaration is visible in'.
     47   // For example, a declaration that is visible always and introduced in 9 would return introduced
     48   // in 9, but the same declaration, except only visible in 9+ would return an empty
     49   // DeclarationAvailability.
     50 
     51   // This currently only handles __INTRODUCED_IN.
     52   // TODO: Do the same for __REMOVED_IN.
     53   int global_min_api_visible = 0;
     54   ArchMap<int> arch_visibility;
     55 
     56   for (const auto& it : declaration.availability) {
     57     const CompilationType& type = it.first;
     58 
     59     if (global_min_api_visible == 0 || global_min_api_visible > type.api_level) {
     60       global_min_api_visible = type.api_level;
     61     }
     62 
     63     if (arch_visibility[type.arch] == 0 || arch_visibility[type.arch] > type.api_level) {
     64       arch_visibility[type.arch] = type.api_level;
     65     }
     66   }
     67 
     68   DeclarationAvailability decl_av;
     69   if (!declaration.calculateAvailability(&decl_av)) {
     70     fprintf(stderr, "versioner: failed to calculate availability while preprocessing:\n");
     71     declaration.dump("", stderr, 2);
     72     exit(1);
     73   }
     74 
     75   D("Calculating required guard for %s:\n", declaration.name.c_str());
     76   D("  Declaration availability: %s\n", to_string(decl_av).c_str());
     77 
     78   if (verbose) {
     79     std::string arch_visibility_str;
     80     for (Arch arch : supported_archs) {
     81       if (arch_visibility[arch] != 0) {
     82         arch_visibility_str += to_string(arch);
     83         arch_visibility_str += ": ";
     84         arch_visibility_str += std::to_string(arch_visibility[arch]);
     85         arch_visibility_str += ", ";
     86       }
     87     }
     88     if (!arch_visibility_str.empty()) {
     89       arch_visibility_str.resize(arch_visibility_str.size() - 2);
     90     }
     91     D("  Declaration visibility: global = %d, arch = %s\n", global_min_api_visible,
     92       arch_visibility_str.c_str());
     93   }
     94 
     95   DeclarationAvailability result = decl_av;
     96   if (result.global_availability.introduced <= global_min_api_visible) {
     97     result.global_availability.introduced = 0;
     98   }
     99 
    100   for (Arch arch : supported_archs) {
    101     if (result.arch_availability[arch].introduced <= arch_visibility[arch]) {
    102       result.arch_availability[arch].introduced = 0;
    103     }
    104   }
    105 
    106   D("  Calculated result: %s\n", to_string(result).c_str());
    107   D("\n");
    108 
    109   return result;
    110 }
    111 
    112 static std::deque<std::string> readFileLines(const std::string& path) {
    113   std::ifstream is(path.c_str());
    114   std::deque<std::string> result;
    115   std::string line;
    116 
    117   while (std::getline(is, line)) {
    118     result.push_back(std::move(line));
    119   }
    120 
    121   return result;
    122 }
    123 
    124 static void writeFileLines(const std::string& path, const std::deque<std::string>& lines) {
    125   if (!mkdirs(dirname(path))) {
    126     err(1, "failed to create directory '%s'", dirname(path).c_str());
    127   }
    128 
    129   std::ofstream os(path.c_str(), std::ios_base::out | std::ios_base::trunc);
    130 
    131   for (const std::string& line : lines) {
    132     os << line << "\n";
    133   }
    134 }
    135 
    136 using GuardMap = std::map<Location, DeclarationAvailability>;
    137 
    138 static std::string generateGuardCondition(const DeclarationAvailability& avail) {
    139   // Logically orred expressions that constitute the macro guard.
    140   std::vector<std::string> expressions;
    141   static const std::vector<std::pair<std::string, std::set<Arch>>> arch_sets = {
    142     { "", supported_archs },
    143     { "!defined(__LP64__)", { Arch::arm, Arch::mips, Arch::x86 } },
    144     { "defined(__LP64__)", { Arch::arm64, Arch::mips64, Arch::x86_64 } },
    145     { "defined(__mips__)", { Arch::mips, Arch::mips64 } },
    146   };
    147   std::map<Arch, std::string> individual_archs = {
    148     { Arch::arm, "defined(__arm__)" },
    149     { Arch::arm64, "defined(__aarch64__)" },
    150     { Arch::mips, "defined(__mips__) && !defined(__LP64__)" },
    151     { Arch::mips64, "defined(__mips__) && defined(__LP64__)" },
    152     { Arch::x86, "defined(__i386__)" },
    153     { Arch::x86_64, "defined(__x86_64__)" },
    154   };
    155 
    156   auto generate_guard = [](const std::string& arch_expr, int min_version) {
    157     if (min_version == 0) {
    158       return arch_expr;
    159     }
    160     return arch_expr + " && __ANDROID_API__ >= " + std::to_string(min_version);
    161   };
    162 
    163   D("Generating guard for availability: %s\n", to_string(avail).c_str());
    164   if (!avail.global_availability.empty()) {
    165     for (Arch arch : supported_archs) {
    166       if (!avail.arch_availability[arch].empty()) {
    167         errx(1, "attempted to generate guard with global and per-arch values: %s",
    168              to_string(avail).c_str());
    169       }
    170     }
    171 
    172     if (avail.global_availability.introduced == 0) {
    173       fprintf(stderr, "warning: attempted to generate guard with empty availability: %s\n",
    174               to_string(avail).c_str());
    175       return "";
    176     }
    177 
    178     if (avail.global_availability.introduced <= 9) {
    179       return "";
    180     }
    181 
    182     return "__ANDROID_API__ >= "s + std::to_string(avail.global_availability.introduced);
    183   }
    184 
    185   for (const auto& it : arch_sets) {
    186     const std::string& arch_expr = it.first;
    187     const std::set<Arch>& archs = it.second;
    188 
    189     D("  Checking arch set '%s'\n", arch_expr.c_str());
    190 
    191     int version = avail.arch_availability[*it.second.begin()].introduced;
    192 
    193     // Assume that the entire declaration is declared __INTRODUCED_IN_FUTURE if one arch is.
    194     bool future = avail.arch_availability[*it.second.begin()].future;
    195 
    196     if (future) {
    197       return "__ANDROID_API__ >= __ANDROID_API_FUTURE__";
    198     }
    199 
    200     // The maximum min_version of the set.
    201     int max_min_version = 0;
    202     for (Arch arch : archs) {
    203       if (arch_min_api[arch] > max_min_version) {
    204         max_min_version = arch_min_api[arch];
    205       }
    206 
    207       if (avail.arch_availability[arch].introduced != version) {
    208         D("    Skipping arch set, availability for %s doesn't match %s\n",
    209           to_string(*it.second.begin()).c_str(), to_string(arch).c_str());
    210         goto skip;
    211       }
    212     }
    213 
    214     // If all of the archs in the set have a min_api that satifies version, elide the check.
    215     if (max_min_version >= version) {
    216       version = 0;
    217     }
    218 
    219     expressions.emplace_back(generate_guard(arch_expr, version));
    220 
    221     D("    Generated expression '%s'\n", expressions.rbegin()->c_str());
    222 
    223     for (Arch arch : archs) {
    224       individual_archs.erase(arch);
    225     }
    226 
    227   skip:
    228     continue;
    229   }
    230 
    231   for (const auto& it : individual_archs) {
    232     const std::string& arch_expr = it.second;
    233     int introduced = avail.arch_availability[it.first].introduced;
    234     if (introduced == 0) {
    235       expressions.emplace_back(arch_expr);
    236     } else {
    237       expressions.emplace_back(generate_guard(arch_expr, introduced));
    238     }
    239   }
    240 
    241   if (expressions.size() == 0) {
    242     errx(1, "generated empty guard for availability %s", to_string(avail).c_str());
    243   } else if (expressions.size() == 1) {
    244     return expressions[0];
    245   }
    246 
    247   return "("s + Join(expressions, ") || (") + ")";
    248 }
    249 
    250 // Assumes that nothing crazy is happening (e.g. having the semicolon be in a macro)
    251 static FileLocation findNextSemicolon(const std::deque<std::string>& lines, FileLocation start) {
    252   unsigned current_line = start.line;
    253   unsigned current_column = start.column;
    254   while (current_line <= lines.size()) {
    255     size_t result = lines[current_line - 1].find_first_of(';', current_column - 1);
    256 
    257     if (result != std::string::npos) {
    258       FileLocation loc = {
    259         .line = current_line,
    260         .column = unsigned(result) + 1,
    261       };
    262 
    263       return loc;
    264     }
    265 
    266     ++current_line;
    267     current_column = 0;
    268   }
    269 
    270   errx(1, "failed to find semicolon starting from %u:%u", start.line, start.column);
    271 }
    272 
    273 // Merge adjacent blocks with identical guards.
    274 static void mergeGuards(std::deque<std::string>& file_lines, GuardMap& guard_map) {
    275   if (guard_map.size() < 2) {
    276     return;
    277   }
    278 
    279   auto current = guard_map.begin();
    280   auto next = current;
    281   ++next;
    282 
    283   while (next != guard_map.end()) {
    284     if (current->second != next->second) {
    285       ++current;
    286       ++next;
    287       continue;
    288     }
    289 
    290     // Scan from the end of current to the beginning of next.
    291     bool in_block_comment = false;
    292     bool valid = true;
    293 
    294     FileLocation current_location = current->first.end;
    295     FileLocation end_location = next->first.start;
    296 
    297     auto nextLine = [&current_location]() {
    298       ++current_location.line;
    299       current_location.column = 1;
    300     };
    301 
    302     auto nextCol = [&file_lines, &current_location, &nextLine]() {
    303       if (current_location.column == file_lines[current_location.line - 1].length()) {
    304         nextLine();
    305       } else {
    306         ++current_location.column;
    307       }
    308     };
    309 
    310     // The end location will point to the semicolon, which we don't want to read, so skip it.
    311     nextCol();
    312 
    313     while (current_location < end_location) {
    314       const std::string& line = file_lines[current_location.line - 1];
    315       size_t line_index = current_location.column - 1;
    316 
    317       if (in_block_comment) {
    318         size_t pos = line.find("*/", line_index);
    319         if (pos == std::string::npos) {
    320           D("Didn't find block comment terminator, skipping line\n");
    321           nextLine();
    322           continue;
    323         } else {
    324           D("Found block comment terminator\n");
    325           in_block_comment = false;
    326           current_location.column = pos + 2;
    327           nextCol();
    328           continue;
    329         }
    330       } else {
    331         size_t pos = line.find_first_not_of(" \t", line_index);
    332         if (pos == std::string::npos) {
    333           nextLine();
    334           continue;
    335         }
    336 
    337         current_location.column = pos + 1;
    338         if (line[pos] != '/') {
    339           valid = false;
    340           break;
    341         }
    342 
    343         nextCol();
    344         if (line.length() <= pos + 1) {
    345           // Trailing slash at the end of a line?
    346           D("Trailing slash at end of line\n");
    347           valid = false;
    348           break;
    349         }
    350 
    351         if (line[pos + 1] == '/') {
    352           // C++ style comment
    353           nextLine();
    354         } else if (line[pos + 1] == '*') {
    355           // Block comment
    356           nextCol();
    357           in_block_comment = true;
    358           D("In a block comment\n");
    359         } else {
    360           // Garbage?
    361           D("Unexpected output after /: %s\n", line.substr(pos).c_str());
    362           valid = false;
    363           break;
    364         }
    365       }
    366     }
    367 
    368     if (!valid) {
    369       D("Not merging blocks %s and %s\n", to_string(current->first).c_str(),
    370         to_string(next->first).c_str());
    371       ++current;
    372       ++next;
    373       continue;
    374     }
    375 
    376     D("Merging blocks %s and %s\n", to_string(current->first).c_str(),
    377       to_string(next->first).c_str());
    378 
    379     Location merged = current->first;
    380     merged.end = next->first.end;
    381 
    382     DeclarationAvailability avail = current->second;
    383 
    384     guard_map.erase(current);
    385     guard_map.erase(next);
    386     bool dummy;
    387     std::tie(current, dummy) = guard_map.insert(std::make_pair(merged, avail));
    388     next = current;
    389     ++next;
    390   }
    391 }
    392 
    393 static void rewriteFile(const std::string& output_path, std::deque<std::string>& file_lines,
    394                         const GuardMap& guard_map) {
    395   for (auto it = guard_map.rbegin(); it != guard_map.rend(); ++it) {
    396     const Location& loc = it->first;
    397     const DeclarationAvailability& avail = it->second;
    398 
    399     std::string condition = generateGuardCondition(avail);
    400     if (condition.empty()) {
    401       continue;
    402     }
    403 
    404     std::string prologue = "\n#if "s + condition + "\n";
    405     std::string epilogue = "\n#endif /* " + condition + " */\n";
    406 
    407     file_lines[loc.end.line - 1].insert(loc.end.column, epilogue);
    408     file_lines[loc.start.line - 1].insert(loc.start.column - 1, prologue);
    409   }
    410 
    411   if (verbose) {
    412     printf("Preprocessing %s...\n", output_path.c_str());
    413   }
    414   writeFileLines(output_path, file_lines);
    415 }
    416 
    417 bool preprocessHeaders(const std::string& dst_dir, const std::string& src_dir,
    418                        HeaderDatabase* database) {
    419   std::unordered_map<std::string, GuardMap> guards;
    420   std::unordered_map<std::string, std::deque<std::string>> file_lines;
    421 
    422   for (const auto& symbol_it : database->symbols) {
    423     const Symbol& symbol = symbol_it.second;
    424 
    425     for (const auto& decl_it : symbol.declarations) {
    426       const Location& location = decl_it.first;
    427       const Declaration& decl = decl_it.second;
    428 
    429       if (decl.no_guard) {
    430         // No guard required.
    431         continue;
    432       }
    433 
    434       DeclarationAvailability macro_guard = calculateRequiredGuard(decl);
    435       if (!macro_guard.empty()) {
    436         guards[location.filename][location] = macro_guard;
    437       }
    438     }
    439   }
    440 
    441   // Copy over the original headers before preprocessing.
    442   char* fts_paths[2] = { const_cast<char*>(src_dir.c_str()), nullptr };
    443   std::unique_ptr<FTS, decltype(&fts_close)> fts(fts_open(fts_paths, FTS_LOGICAL, nullptr),
    444                                                  fts_close);
    445   if (!fts) {
    446     err(1, "failed to open directory %s", src_dir.c_str());
    447   }
    448 
    449   while (FTSENT* ent = fts_read(fts.get())) {
    450     llvm::StringRef path = ent->fts_path;
    451     if (!path.startswith(src_dir)) {
    452       err(1, "path '%s' doesn't start with source dir '%s'", ent->fts_path, src_dir.c_str());
    453     }
    454 
    455     if (ent->fts_info != FTS_F) {
    456       continue;
    457     }
    458 
    459     std::string rel_path = path.substr(src_dir.length() + 1);
    460     std::string dst_path = dst_dir + "/" + rel_path;
    461     llvm::StringRef parent_path = llvm::sys::path::parent_path(dst_path);
    462     if (llvm::sys::fs::create_directories(parent_path)) {
    463       errx(1, "failed to ensure existence of directory '%s'", parent_path.str().c_str());
    464     }
    465     if (llvm::sys::fs::copy_file(path, dst_path)) {
    466       errx(1, "failed to copy '%s/%s' to '%s'", src_dir.c_str(), path.str().c_str(),
    467            dst_path.c_str());
    468     }
    469   }
    470 
    471   for (const auto& file_it : guards) {
    472     file_lines[file_it.first] = readFileLines(file_it.first);
    473   }
    474 
    475   for (auto& file_it : guards) {
    476     llvm::StringRef file_path = file_it.first;
    477     GuardMap& orig_guard_map = file_it.second;
    478 
    479     // The end positions given to us are the end of the declaration, which is some point before the
    480     // semicolon. Fix up the end positions by scanning for the next semicolon.
    481     GuardMap guard_map;
    482     for (const auto& it : orig_guard_map) {
    483       Location loc = it.first;
    484       loc.end = findNextSemicolon(file_lines[file_path], loc.end);
    485       guard_map[loc] = it.second;
    486     }
    487 
    488     // TODO: Make sure that the Locations don't overlap.
    489     // TODO: Merge adjacent non-identical guards.
    490     mergeGuards(file_lines[file_path], guard_map);
    491 
    492     if (!file_path.startswith(src_dir)) {
    493       errx(1, "input file %s is not in %s\n", file_path.str().c_str(), src_dir.c_str());
    494     }
    495 
    496     // rel_path has a leading slash.
    497     llvm::StringRef rel_path = file_path.substr(src_dir.size(), file_path.size() - src_dir.size());
    498     std::string output_path = (llvm::Twine(dst_dir) + rel_path).str();
    499 
    500     rewriteFile(output_path, file_lines[file_path], guard_map);
    501   }
    502 
    503   return true;
    504 }
    505