gllvm/extractor.go

311 lines
8.6 KiB
Go
Raw Normal View History

package main
import (
2017-06-29 21:38:04 +02:00
"debug/elf"
"debug/macho"
"io/ioutil"
"os"
"path"
"path/filepath"
2017-06-29 21:38:04 +02:00
"runtime"
"strings"
)
2017-06-30 02:46:30 +02:00
type extractionArgs struct {
2017-06-29 21:38:04 +02:00
InputFile string
InputType int
OutputFile string
LinkerName string
ArchiverName string
ArArgs []string
ObjectTypeInArchive int // Type of file that can be put into an archive
Extractor func(string) []string
IsVerbose bool
IsWriteManifest bool
IsBuildBitcodeArchive bool
}
func extract(args []string) {
2017-06-30 02:46:30 +02:00
ea := parseExtractionArgs(args)
switch ea.InputType {
2017-06-30 20:54:59 +02:00
case fileTypeELFEXECUTABLE,
fileTypeELFSHARED,
fileTypeELFOBJECT,
fileTypeMACHEXECUTABLE,
fileTypeMACHSHARED,
fileTypeMACHOBJECT:
handleExecutable(ea)
2017-06-30 20:54:59 +02:00
case fileTypeARCHIVE:
handleArchive(ea)
2017-06-29 21:38:04 +02:00
default:
2017-06-30 21:07:35 +02:00
logFatal("Incorrect input file type %v.", ea.InputType)
}
}
2017-06-30 02:46:30 +02:00
func parseExtractionArgs(args []string) extractionArgs {
2017-06-30 21:17:27 +02:00
origArgs := args
// Initializing args to defaults
2017-06-30 02:46:30 +02:00
ea := extractionArgs{
2017-06-29 21:38:04 +02:00
LinkerName: "llvm-link",
ArchiverName: "llvm-ar",
}
// Checking environment variables
if LLVMLINKName != "" {
//FIXME: this check can be eliminated because filepath.Join("", "baz") = "baz"
if LLVMToolChainBinDir != "" {
ea.LinkerName = filepath.Join(LLVMToolChainBinDir, LLVMLINKName)
} else {
ea.LinkerName = LLVMLINKName
}
}
if LLVMARName != "" {
//FIXME: this check can be eliminated because filepath.Join("", "baz") = "baz"
if LLVMToolChainBinDir != "" {
ea.ArchiverName = filepath.Join(LLVMToolChainBinDir, LLVMARName)
} else {
ea.ArchiverName = LLVMARName
}
}
// Parsing cli input. FIXME: "get-bc -mb libfoo.a" should work just like "get-bc -m -b libfoo.a"
for len(args) > 0 {
switch arg := args[0]; arg {
case "-b":
ea.IsBuildBitcodeArchive = true
args = args[1:]
case "-v":
ea.IsVerbose = true
args = args[1:]
case "-m":
ea.IsWriteManifest = true
args = args[1:]
case "-o":
if len(args) < 2 {
2017-06-30 21:17:27 +02:00
logFatal("There was an error parsing the arguments: %v.", origArgs)
}
ea.OutputFile = args[1]
args = args[2:]
default:
ea.InputFile = arg
args = args[1:]
}
}
// Sanity-check the parsed arguments
if len(ea.InputFile) == 0 {
2017-06-30 21:07:35 +02:00
logFatal("No input file was given.")
}
if _, err := os.Stat(ea.InputFile); os.IsNotExist(err) {
2017-06-30 21:07:35 +02:00
logFatal("The input file %s does not exist.", ea.InputFile)
}
realPath, err := filepath.EvalSymlinks(ea.InputFile)
if err != nil {
2017-06-30 21:07:35 +02:00
logFatal("There was an error getting the real path of %s.", ea.InputFile)
}
ea.InputFile = realPath
ea.InputType = getFileType(realPath)
// Set arguments according to runtime OS
switch platform := runtime.GOOS; platform {
case "freebsd", "linux":
ea.Extractor = extractSectionUnix
if ea.IsVerbose {
ea.ArArgs = append(ea.ArArgs, "xv")
} else {
ea.ArArgs = append(ea.ArArgs, "x")
}
2017-06-30 20:54:59 +02:00
ea.ObjectTypeInArchive = fileTypeELFOBJECT
case "darwin":
ea.Extractor = extractSectionDarwin
ea.ArArgs = append(ea.ArArgs, "-x")
if ea.IsVerbose {
ea.ArArgs = append(ea.ArArgs, "-v")
}
2017-06-30 20:54:59 +02:00
ea.ObjectTypeInArchive = fileTypeMACHOBJECT
default:
2017-06-30 21:07:35 +02:00
logFatal("Unsupported platform: %s.", platform)
}
// Create output filename if not given
if ea.OutputFile == "" {
2017-06-30 20:54:59 +02:00
if ea.InputType == fileTypeARCHIVE {
var ext string
if ea.IsBuildBitcodeArchive {
ext = ".a.bc"
} else {
ext = ".bca"
}
ea.OutputFile = strings.TrimSuffix(ea.InputFile, ".a") + ext
} else {
ea.OutputFile = ea.InputFile + ".bc"
}
}
return ea
}
2017-06-30 02:46:30 +02:00
func handleExecutable(ea extractionArgs) {
artifactPaths := ea.Extractor(ea.InputFile)
filesToLink := make([]string, len(artifactPaths))
for i, artPath := range artifactPaths {
filesToLink[i] = resolveBitcodePath(artPath)
}
extractTimeLinkFiles(ea, filesToLink)
// Write manifest
if ea.IsWriteManifest {
writeManifest(ea, filesToLink, artifactPaths)
}
2017-06-26 21:42:47 +02:00
}
2017-06-30 02:46:30 +02:00
func handleArchive(ea extractionArgs) {
// List bitcode files to link
var bcFiles []string
var artifactFiles []string
// Create tmp dir
tmpDirName, err := ioutil.TempDir("", "gllvm")
if err != nil {
2017-06-30 21:07:35 +02:00
logFatal("The temporary directory in which to extract object files could not be created.")
}
defer os.RemoveAll(tmpDirName)
// Extract objects to tmpDir
arArgs := ea.ArArgs
inputAbsPath, _ := filepath.Abs(ea.InputFile)
arArgs = append(arArgs, inputAbsPath)
success, err := execCmd("ar", arArgs, tmpDirName)
if !success {
logFatal("Failed to extract object files from %s to %s because: %v.\n", ea.InputFile, tmpDirName, err)
}
// Define object file handling closure
var walkHandlingFunc = func(path string, info os.FileInfo, err error) error {
if err == nil && !info.IsDir() {
2017-06-30 20:54:59 +02:00
fileType := getFileType(path)
if fileType == ea.ObjectTypeInArchive {
artifactPaths := ea.Extractor(path)
for _, artPath := range artifactPaths {
bcPath := resolveBitcodePath(artPath)
bcFiles = append(bcFiles, bcPath)
}
artifactFiles = append(artifactFiles, artifactPaths...)
}
}
return nil
}
// Handle object files
filepath.Walk(tmpDirName, walkHandlingFunc)
// Build archive
if ea.IsBuildBitcodeArchive {
extractTimeLinkFiles(ea, bcFiles)
} else {
archiveBcFiles(ea, bcFiles)
}
// Write manifest
if ea.IsWriteManifest {
writeManifest(ea, bcFiles, artifactFiles)
}
2017-06-26 21:42:47 +02:00
}
2017-06-30 02:46:30 +02:00
func archiveBcFiles(ea extractionArgs, bcFiles []string) {
// We do not want full paths in the archive, so we need to chdir into each
// bitcode's folder. Handle this by calling llvm-ar once for all bitcode
// files in the same directory
dirToBcMap := make(map[string][]string)
for _, bcFile := range bcFiles {
dirName, baseName := path.Split(bcFile)
dirToBcMap[dirName] = append(dirToBcMap[dirName], baseName)
}
// Call llvm-ar from each directory
absOutputFile, _ := filepath.Abs(ea.OutputFile)
for dir, bcFilesInDir := range dirToBcMap {
var args []string
args = append(args, "rs", absOutputFile)
args = append(args, bcFilesInDir...)
2017-06-30 21:17:27 +02:00
success, err := execCmd(ea.ArchiverName, args, dir)
if !success {
logFatal("There was an error creating the bitcode archive: %v.\n", err)
}
}
2017-06-30 21:07:35 +02:00
logInfo("Built bitcode archive: %s.", ea.OutputFile)
}
2017-06-30 02:46:30 +02:00
func extractTimeLinkFiles(ea extractionArgs, filesToLink []string) {
var linkArgs []string
if ea.IsVerbose {
linkArgs = append(linkArgs, "-v")
}
linkArgs = append(linkArgs, "-o", ea.OutputFile)
linkArgs = append(linkArgs, filesToLink...)
success, err := execCmd(ea.LinkerName, linkArgs, "")
if !success {
2017-06-30 21:07:35 +02:00
logFatal("There was an error linking input files into %s because %v.\n", ea.OutputFile, err)
}
2017-06-30 21:07:35 +02:00
logInfo("Bitcode file extracted to: %s.", ea.OutputFile)
}
2017-06-28 19:05:19 +02:00
func extractSectionDarwin(inputFile string) (contents []string) {
machoFile, err := macho.Open(inputFile)
if err != nil {
2017-06-30 21:07:35 +02:00
logFatal("Mach-O file %s could not be read.", inputFile)
}
2017-06-30 20:54:59 +02:00
section := machoFile.Section(DarwinSectionName)
sectionContents, errContents := section.Data()
if errContents != nil {
2017-06-30 21:07:35 +02:00
logFatal("Error reading the %s section of Mach-O file %s.", DarwinSectionName, inputFile)
}
contents = strings.Split(strings.TrimSuffix(string(sectionContents), "\n"), "\n")
return
}
2017-06-28 19:05:19 +02:00
func extractSectionUnix(inputFile string) (contents []string) {
elfFile, err := elf.Open(inputFile)
if err != nil {
2017-06-30 21:07:35 +02:00
logFatal("ELF file %s could not be read.", inputFile)
}
2017-06-30 20:54:59 +02:00
section := elfFile.Section(ELFSectionName)
sectionContents, errContents := section.Data()
if errContents != nil {
2017-06-30 21:07:35 +02:00
logFatal("Error reading the %s section of ELF file %s.", ELFSectionName, inputFile)
}
contents = strings.Split(strings.TrimSuffix(string(sectionContents), "\n"), "\n")
return
}
2017-06-26 21:42:47 +02:00
// Return the actual path to the bitcode file, or an empty string if it does not exist
func resolveBitcodePath(bcPath string) string {
if _, err := os.Stat(bcPath); os.IsNotExist(err) {
// If the bitcode file does not exist, try to find it in the store
if BitcodeStorePath != "" {
// Compute absolute path hash
absBcPath, _ := filepath.Abs(bcPath)
storeBcPath := path.Join(BitcodeStorePath, getHashedPath(absBcPath))
if _, err := os.Stat(storeBcPath); os.IsNotExist(err) {
return ""
}
2017-06-29 23:19:12 +02:00
return storeBcPath
}
2017-06-29 23:25:55 +02:00
return ""
2017-06-29 23:44:39 +02:00
}
2017-06-29 23:25:55 +02:00
return bcPath
2017-06-26 21:42:47 +02:00
}
2017-06-30 02:46:30 +02:00
func writeManifest(ea extractionArgs, bcFiles []string, artifactFiles []string) {
section1 := "Physical location of extracted files:\n" + strings.Join(bcFiles, "\n") + "\n\n"
section2 := "Build-time location of extracted files:\n" + strings.Join(artifactFiles, "\n")
contents := []byte(section1 + section2)
manifestFilename := ea.OutputFile + ".llvm.manifest"
if err := ioutil.WriteFile(manifestFilename, contents, 0644); err != nil {
2017-06-30 21:07:35 +02:00
logFatal("There was an error while writing the manifest file: ", err)
}
2017-06-30 21:07:35 +02:00
logInfo("Manifest file written to %s.", manifestFilename)
2017-06-26 21:42:47 +02:00
}