ArchiveWriter.cpp 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399
  1. //===- ArchiveWriter.cpp - ar File Format implementation --------*- C++ -*-===//
  2. //
  3. // The LLVM Compiler Infrastructure
  4. //
  5. // This file is distributed under the University of Illinois Open Source
  6. // License. See LICENSE.TXT for details.
  7. //
  8. //===----------------------------------------------------------------------===//
  9. //
  10. // This file defines the writeArchive function.
  11. //
  12. //===----------------------------------------------------------------------===//
  13. #include "llvm/Object/ArchiveWriter.h"
  14. #include "llvm/ADT/ArrayRef.h"
  15. #include "llvm/ADT/StringRef.h"
  16. #include "llvm/IR/LLVMContext.h"
  17. #include "llvm/Object/Archive.h"
  18. #include "llvm/Object/ObjectFile.h"
  19. #include "llvm/Object/SymbolicFile.h"
  20. #include "llvm/Support/EndianStream.h"
  21. #include "llvm/Support/Errc.h"
  22. #include "llvm/Support/ErrorHandling.h"
  23. #include "llvm/Support/Format.h"
  24. #include "llvm/Support/Path.h"
  25. #include "llvm/Support/ToolOutputFile.h"
  26. #include "llvm/Support/raw_ostream.h"
  27. #if !defined(_MSC_VER) && !defined(__MINGW32__)
  28. #include <unistd.h>
  29. #else
  30. #include <io.h>
  31. #endif
  32. using namespace llvm;
  33. NewArchiveIterator::NewArchiveIterator(object::Archive::child_iterator I,
  34. StringRef Name)
  35. : IsNewMember(false), Name(Name), OldI(I) {}
  36. NewArchiveIterator::NewArchiveIterator(StringRef NewFilename, StringRef Name)
  37. : IsNewMember(true), Name(Name), NewFilename(NewFilename) {}
  38. StringRef NewArchiveIterator::getName() const { return Name; }
  39. bool NewArchiveIterator::isNewMember() const { return IsNewMember; }
  40. object::Archive::child_iterator NewArchiveIterator::getOld() const {
  41. assert(!IsNewMember);
  42. return OldI;
  43. }
  44. StringRef NewArchiveIterator::getNew() const {
  45. assert(IsNewMember);
  46. return NewFilename;
  47. }
  48. llvm::ErrorOr<int>
  49. NewArchiveIterator::getFD(sys::fs::file_status &NewStatus) const {
  50. assert(IsNewMember);
  51. int NewFD;
  52. if (auto EC = sys::fs::openFileForRead(NewFilename, NewFD))
  53. return EC;
  54. assert(NewFD != -1);
  55. if (auto EC = sys::fs::status(NewFD, NewStatus))
  56. return EC;
  57. // Opening a directory doesn't make sense. Let it fail.
  58. // Linux cannot open directories with open(2), although
  59. // cygwin and *bsd can.
  60. if (NewStatus.type() == sys::fs::file_type::directory_file)
  61. return make_error_code(errc::is_a_directory);
  62. return NewFD;
  63. }
  64. template <typename T>
  65. static void printWithSpacePadding(raw_fd_ostream &OS, T Data, unsigned Size,
  66. bool MayTruncate = false) {
  67. uint64_t OldPos = OS.tell();
  68. OS << Data;
  69. unsigned SizeSoFar = OS.tell() - OldPos;
  70. if (Size > SizeSoFar) {
  71. OS.indent(Size - SizeSoFar);
  72. } else if (Size < SizeSoFar) {
  73. assert(MayTruncate && "Data doesn't fit in Size");
  74. // Some of the data this is used for (like UID) can be larger than the
  75. // space available in the archive format. Truncate in that case.
  76. OS.seek(OldPos + Size);
  77. }
  78. }
  79. static void print32(raw_ostream &Out, object::Archive::Kind Kind,
  80. uint32_t Val) {
  81. if (Kind == object::Archive::K_GNU)
  82. support::endian::Writer<support::big>(Out).write(Val);
  83. else
  84. support::endian::Writer<support::little>(Out).write(Val);
  85. }
  86. static void printRestOfMemberHeader(raw_fd_ostream &Out,
  87. const sys::TimeValue &ModTime, unsigned UID,
  88. unsigned GID, unsigned Perms,
  89. unsigned Size) {
  90. printWithSpacePadding(Out, ModTime.toEpochTime(), 12);
  91. printWithSpacePadding(Out, UID, 6, true);
  92. printWithSpacePadding(Out, GID, 6, true);
  93. printWithSpacePadding(Out, format("%o", Perms), 8);
  94. printWithSpacePadding(Out, Size, 10);
  95. Out << "`\n";
  96. }
  97. static void printGNUSmallMemberHeader(raw_fd_ostream &Out, StringRef Name,
  98. const sys::TimeValue &ModTime,
  99. unsigned UID, unsigned GID,
  100. unsigned Perms, unsigned Size) {
  101. printWithSpacePadding(Out, Twine(Name) + "/", 16);
  102. printRestOfMemberHeader(Out, ModTime, UID, GID, Perms, Size);
  103. }
  104. static void printBSDMemberHeader(raw_fd_ostream &Out, StringRef Name,
  105. const sys::TimeValue &ModTime, unsigned UID,
  106. unsigned GID, unsigned Perms, unsigned Size) {
  107. uint64_t PosAfterHeader = Out.tell() + 60 + Name.size();
  108. // Pad so that even 64 bit object files are aligned.
  109. unsigned Pad = OffsetToAlignment(PosAfterHeader, 8);
  110. unsigned NameWithPadding = Name.size() + Pad;
  111. printWithSpacePadding(Out, Twine("#1/") + Twine(NameWithPadding), 16);
  112. printRestOfMemberHeader(Out, ModTime, UID, GID, Perms,
  113. NameWithPadding + Size);
  114. Out << Name;
  115. assert(PosAfterHeader == Out.tell());
  116. while (Pad--)
  117. Out.write(uint8_t(0));
  118. }
  119. static void
  120. printMemberHeader(raw_fd_ostream &Out, object::Archive::Kind Kind,
  121. StringRef Name,
  122. std::vector<unsigned>::iterator &StringMapIndexIter,
  123. const sys::TimeValue &ModTime, unsigned UID, unsigned GID,
  124. unsigned Perms, unsigned Size) {
  125. if (Kind == object::Archive::K_BSD)
  126. return printBSDMemberHeader(Out, Name, ModTime, UID, GID, Perms, Size);
  127. if (Name.size() < 16)
  128. return printGNUSmallMemberHeader(Out, Name, ModTime, UID, GID, Perms, Size);
  129. Out << '/';
  130. printWithSpacePadding(Out, *StringMapIndexIter++, 15);
  131. printRestOfMemberHeader(Out, ModTime, UID, GID, Perms, Size);
  132. }
  133. static void writeStringTable(raw_fd_ostream &Out,
  134. ArrayRef<NewArchiveIterator> Members,
  135. std::vector<unsigned> &StringMapIndexes) {
  136. unsigned StartOffset = 0;
  137. for (ArrayRef<NewArchiveIterator>::iterator I = Members.begin(),
  138. E = Members.end();
  139. I != E; ++I) {
  140. StringRef Name = I->getName();
  141. if (Name.size() < 16)
  142. continue;
  143. if (StartOffset == 0) {
  144. printWithSpacePadding(Out, "//", 58);
  145. Out << "`\n";
  146. StartOffset = Out.tell();
  147. }
  148. StringMapIndexes.push_back(Out.tell() - StartOffset);
  149. Out << Name << "/\n";
  150. }
  151. if (StartOffset == 0)
  152. return;
  153. if (Out.tell() % 2)
  154. Out << '\n';
  155. int Pos = Out.tell();
  156. Out.seek(StartOffset - 12);
  157. printWithSpacePadding(Out, Pos - StartOffset, 10);
  158. Out.seek(Pos);
  159. }
  160. static sys::TimeValue now(bool Deterministic) {
  161. if (!Deterministic)
  162. return sys::TimeValue::now();
  163. sys::TimeValue TV;
  164. TV.fromEpochTime(0);
  165. return TV;
  166. }
  167. // Returns the offset of the first reference to a member offset.
  168. static ErrorOr<unsigned>
  169. writeSymbolTable(raw_fd_ostream &Out, object::Archive::Kind Kind,
  170. ArrayRef<NewArchiveIterator> Members,
  171. ArrayRef<MemoryBufferRef> Buffers,
  172. std::vector<unsigned> &MemberOffsetRefs, bool Deterministic) {
  173. unsigned HeaderStartOffset = 0;
  174. unsigned BodyStartOffset = 0;
  175. SmallString<128> NameBuf;
  176. raw_svector_ostream NameOS(NameBuf);
  177. LLVMContext Context;
  178. for (unsigned MemberNum = 0, N = Members.size(); MemberNum < N; ++MemberNum) {
  179. MemoryBufferRef MemberBuffer = Buffers[MemberNum];
  180. ErrorOr<std::unique_ptr<object::SymbolicFile>> ObjOrErr =
  181. object::SymbolicFile::createSymbolicFile(
  182. MemberBuffer, sys::fs::file_magic::unknown, &Context);
  183. if (!ObjOrErr)
  184. continue; // FIXME: check only for "not an object file" errors.
  185. object::SymbolicFile &Obj = *ObjOrErr.get();
  186. if (!HeaderStartOffset) {
  187. HeaderStartOffset = Out.tell();
  188. if (Kind == object::Archive::K_GNU)
  189. printGNUSmallMemberHeader(Out, "", now(Deterministic), 0, 0, 0, 0);
  190. else
  191. printBSDMemberHeader(Out, "__.SYMDEF", now(Deterministic), 0, 0, 0, 0);
  192. BodyStartOffset = Out.tell();
  193. print32(Out, Kind, 0); // number of entries or bytes
  194. }
  195. for (const object::BasicSymbolRef &S : Obj.symbols()) {
  196. uint32_t Symflags = S.getFlags();
  197. if (Symflags & object::SymbolRef::SF_FormatSpecific)
  198. continue;
  199. if (!(Symflags & object::SymbolRef::SF_Global))
  200. continue;
  201. if (Symflags & object::SymbolRef::SF_Undefined)
  202. continue;
  203. unsigned NameOffset = NameOS.tell();
  204. if (auto EC = S.printName(NameOS))
  205. return EC;
  206. NameOS << '\0';
  207. MemberOffsetRefs.push_back(MemberNum);
  208. if (Kind == object::Archive::K_BSD)
  209. print32(Out, Kind, NameOffset);
  210. print32(Out, Kind, 0); // member offset
  211. }
  212. }
  213. if (HeaderStartOffset == 0)
  214. return 0;
  215. StringRef StringTable = NameOS.str();
  216. if (Kind == object::Archive::K_BSD)
  217. print32(Out, Kind, StringTable.size()); // byte count of the string table
  218. Out << StringTable;
  219. // ld64 requires the next member header to start at an offset that is
  220. // 4 bytes aligned.
  221. unsigned Pad = OffsetToAlignment(Out.tell(), 4);
  222. while (Pad--)
  223. Out.write(uint8_t(0));
  224. // Patch up the size of the symbol table now that we know how big it is.
  225. unsigned Pos = Out.tell();
  226. const unsigned MemberHeaderSize = 60;
  227. Out.seek(HeaderStartOffset + 48); // offset of the size field.
  228. printWithSpacePadding(Out, Pos - MemberHeaderSize - HeaderStartOffset, 10);
  229. // Patch up the number of symbols.
  230. Out.seek(BodyStartOffset);
  231. unsigned NumSyms = MemberOffsetRefs.size();
  232. if (Kind == object::Archive::K_GNU)
  233. print32(Out, Kind, NumSyms);
  234. else
  235. print32(Out, Kind, NumSyms * 8);
  236. Out.seek(Pos);
  237. return BodyStartOffset + 4;
  238. }
  239. std::pair<StringRef, std::error_code> llvm::writeArchive(
  240. StringRef ArcName, std::vector<NewArchiveIterator> &NewMembers,
  241. bool WriteSymtab, object::Archive::Kind Kind, bool Deterministic) {
  242. SmallString<128> TmpArchive;
  243. int TmpArchiveFD;
  244. if (auto EC = sys::fs::createUniqueFile(ArcName + ".temp-archive-%%%%%%%.a",
  245. TmpArchiveFD, TmpArchive))
  246. return std::make_pair(ArcName, EC);
  247. tool_output_file Output(TmpArchive, TmpArchiveFD);
  248. raw_fd_ostream &Out = Output.os();
  249. Out << "!<arch>\n";
  250. std::vector<unsigned> MemberOffsetRefs;
  251. std::vector<std::unique_ptr<MemoryBuffer>> Buffers;
  252. std::vector<MemoryBufferRef> Members;
  253. std::vector<sys::fs::file_status> NewMemberStatus;
  254. for (unsigned I = 0, N = NewMembers.size(); I < N; ++I) {
  255. NewArchiveIterator &Member = NewMembers[I];
  256. MemoryBufferRef MemberRef;
  257. if (Member.isNewMember()) {
  258. StringRef Filename = Member.getNew();
  259. NewMemberStatus.resize(NewMemberStatus.size() + 1);
  260. sys::fs::file_status &Status = NewMemberStatus.back();
  261. ErrorOr<int> FD = Member.getFD(Status);
  262. if (auto EC = FD.getError())
  263. return std::make_pair(Filename, EC);
  264. ErrorOr<std::unique_ptr<MemoryBuffer>> MemberBufferOrErr =
  265. MemoryBuffer::getOpenFile(FD.get(), Filename, Status.getSize(),
  266. false);
  267. if (auto EC = MemberBufferOrErr.getError())
  268. return std::make_pair(Filename, EC);
  269. if (close(FD.get()) != 0)
  270. return std::make_pair(Filename,
  271. std::error_code(errno, std::generic_category()));
  272. Buffers.push_back(std::move(MemberBufferOrErr.get()));
  273. MemberRef = Buffers.back()->getMemBufferRef();
  274. } else {
  275. object::Archive::child_iterator OldMember = Member.getOld();
  276. ErrorOr<MemoryBufferRef> MemberBufferOrErr =
  277. OldMember->getMemoryBufferRef();
  278. if (auto EC = MemberBufferOrErr.getError())
  279. return std::make_pair("", EC);
  280. MemberRef = MemberBufferOrErr.get();
  281. }
  282. Members.push_back(MemberRef);
  283. }
  284. unsigned MemberReferenceOffset = 0;
  285. if (WriteSymtab) {
  286. ErrorOr<unsigned> MemberReferenceOffsetOrErr = writeSymbolTable(
  287. Out, Kind, NewMembers, Members, MemberOffsetRefs, Deterministic);
  288. if (auto EC = MemberReferenceOffsetOrErr.getError())
  289. return std::make_pair(ArcName, EC);
  290. MemberReferenceOffset = MemberReferenceOffsetOrErr.get();
  291. }
  292. std::vector<unsigned> StringMapIndexes;
  293. if (Kind != object::Archive::K_BSD)
  294. writeStringTable(Out, NewMembers, StringMapIndexes);
  295. unsigned MemberNum = 0;
  296. unsigned NewMemberNum = 0;
  297. std::vector<unsigned>::iterator StringMapIndexIter = StringMapIndexes.begin();
  298. std::vector<unsigned> MemberOffset;
  299. for (const NewArchiveIterator &I : NewMembers) {
  300. MemoryBufferRef File = Members[MemberNum++];
  301. unsigned Pos = Out.tell();
  302. MemberOffset.push_back(Pos);
  303. sys::TimeValue ModTime;
  304. unsigned UID;
  305. unsigned GID;
  306. unsigned Perms;
  307. if (Deterministic) {
  308. ModTime.fromEpochTime(0);
  309. UID = 0;
  310. GID = 0;
  311. Perms = 0644;
  312. } else if (I.isNewMember()) {
  313. const sys::fs::file_status &Status = NewMemberStatus[NewMemberNum];
  314. ModTime = Status.getLastModificationTime();
  315. UID = Status.getUser();
  316. GID = Status.getGroup();
  317. Perms = Status.permissions();
  318. } else {
  319. object::Archive::child_iterator OldMember = I.getOld();
  320. ModTime = OldMember->getLastModified();
  321. UID = OldMember->getUID();
  322. GID = OldMember->getGID();
  323. Perms = OldMember->getAccessMode();
  324. }
  325. if (I.isNewMember()) {
  326. StringRef FileName = I.getNew();
  327. const sys::fs::file_status &Status = NewMemberStatus[NewMemberNum++];
  328. printMemberHeader(Out, Kind, sys::path::filename(FileName),
  329. StringMapIndexIter, ModTime, UID, GID, Perms,
  330. Status.getSize());
  331. } else {
  332. object::Archive::child_iterator OldMember = I.getOld();
  333. printMemberHeader(Out, Kind, I.getName(), StringMapIndexIter, ModTime,
  334. UID, GID, Perms, OldMember->getSize());
  335. }
  336. Out << File.getBuffer();
  337. if (Out.tell() % 2)
  338. Out << '\n';
  339. }
  340. if (MemberReferenceOffset) {
  341. Out.seek(MemberReferenceOffset);
  342. for (unsigned MemberNum : MemberOffsetRefs) {
  343. if (Kind == object::Archive::K_BSD)
  344. Out.seek(Out.tell() + 4); // skip over the string offset
  345. print32(Out, Kind, MemberOffset[MemberNum]);
  346. }
  347. }
  348. Output.keep();
  349. Out.close();
  350. sys::fs::rename(TmpArchive, ArcName);
  351. return std::make_pair("", std::error_code());
  352. }