// Copyright (c) 2017, Google Inc. // // Permission to use, copy, modify, and/or distribute this software for any // purpose with or without fee is hereby granted, provided that the above // copyright notice and this permission notice appear in all copies. // // THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES // WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF // MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY // SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES // WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION // OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN // CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. */ // delocate performs several transformations of textual assembly code. See // FIPS.md in this directory for an overview. package main import ( "bufio" "bytes" "flag" "fmt" "os" "path/filepath" "sort" "strconv" "strings" "unicode/utf8" ) func main() { // The .a file, if given, is expected to be an archive of textual // assembly sources. That's odd, but CMake really wants to create // archive files so it's the only way that we can make it work. arInput := flag.String("a", "", "Path to a .a file containing assembly sources") outFile := flag.String("o", "", "Path to output assembly") asmFiles := flag.String("as", "", "Comma separated list of assembly inputs") flag.Parse() var lines []string var err error if len(*arInput) > 0 { if lines, err = arLines(lines, *arInput); err != nil { panic(err) } } asPaths := strings.Split(*asmFiles, ",") for i, path := range asPaths { if len(path) == 0 { continue } if lines, err = asLines(lines, path, i); err != nil { panic(err) } } symbols := definedSymbols(lines) lines = transform(lines, symbols) out, err := os.OpenFile(*outFile, os.O_CREATE|os.O_TRUNC|os.O_WRONLY, 0644) if err != nil { panic(err) } defer out.Close() for _, line := range lines { out.WriteString(line) out.WriteString("\n") } } func removeComment(line string) string { if i := strings.Index(line, "#"); i != -1 { return line[:i] } return line } // isSymbolDef returns detects whether line contains a (non-local) symbol // definition. If so, it returns the symbol and true. Otherwise it returns "" // and false. func isSymbolDef(line string) (string, bool) { line = strings.TrimSpace(removeComment(line)) if len(line) > 0 && line[len(line)-1] == ':' && line[0] != '.' { symbol := line[:len(line)-1] if validSymbolName(symbol) { return symbol, true } } return "", false } // definedSymbols finds all (non-local) symbols from lines and returns a map // from symbol name to whether or not that symbol is global. func definedSymbols(lines []string) map[string]bool { globalSymbols := make(map[string]struct{}) symbols := make(map[string]bool) for _, line := range lines { if len(line) == 0 { continue } if symbol, ok := isSymbolDef(line); ok { _, isGlobal := globalSymbols[symbol] symbols[symbol] = isGlobal } parts := strings.Fields(strings.TrimSpace(line)) if parts[0] == ".globl" { globalSymbols[parts[1]] = struct{}{} } } return symbols } func referencesIA32CapDirectly(line string) bool { const symbol = "OPENSSL_ia32cap_P" i := strings.Index(line, symbol) if i < 0 { return false } i += len(symbol) return i == len(line) || line[i] == '+' || line[i] == '(' || line[i] == '@' } // threadLocalOffsetFunc describes a function that fetches the offset to symbol // in the thread-local space and writes it to the given target register. type threadLocalOffsetFunc struct { target string symbol string } type lineSource struct { lines []string lineNo int } func (ls *lineSource) Next() (string, bool) { if ls.lineNo == len(ls.lines) { return "", false } ret := ls.lines[ls.lineNo] ls.lineNo++ return ret, true } func (ls *lineSource) Unread() { ls.lineNo-- } // transform performs a number of transformations on the given assembly code. // See FIPS.md in the current directory for an overview. func transform(lines []string, symbols map[string]bool) (ret []string) { ret = append(ret, ".text", "BORINGSSL_bcm_text_start:") // redirectors maps from out-call symbol name to the name of a // redirector function for that symbol. redirectors := make(map[string]string) // ia32capAddrNeeded is true iff OPENSSL_ia32cap_addr has been // referenced and thus needs to be emitted outside the module. ia32capAddrNeeded := false // bssAccessorsNeeded maps the names of BSS variables for which // accessor functions need to be emitted outside of the module, to the // BSS symbols they point to. For example, “EVP_sha256_once” could map // to “.LEVP_sha256_once_local_target” or “EVP_sha256_once” (if .comm // was used). bssAccessorsNeeded := make(map[string]string) // threadLocalOffsets records the accessor functions needed for getting // offsets in the thread-local storage. threadLocalOffsets := make(map[string]threadLocalOffsetFunc) source := &lineSource{lines: lines} for { line, ok := source.Next() if !ok { break } // References to OPENSSL_ia32cap_P via the GOT result from C // code. The OPENSSL_ia32cap_addr symbol, generated by this // script, is just like a GOT entry, but at a known offset. line = strings.Replace(line, "OPENSSL_ia32cap_P@GOTPCREL(%rip)", "OPENSSL_ia32cap_addr(%rip)", -1) if referencesIA32CapDirectly(line) { panic("reference to OPENSSL_ia32cap_P needs to be changed to indirect via OPENSSL_ia32cap_addr") } if strings.Contains(line, "OPENSSL_ia32cap_addr(%rip)") { ia32capAddrNeeded = true } line = strings.Replace(line, "@PLT", "", -1) parts := strings.Fields(strings.TrimSpace(line)) if len(parts) == 0 { ret = append(ret, line) continue } switch parts[0] { case "call", "callq", "jmp", "jne", "jb", "jz", "jnz", "ja": target := parts[1] // indirect via register or local label if strings.HasPrefix(target, "*") || strings.HasPrefix(target, ".L") { ret = append(ret, line) continue } if strings.HasSuffix(target, "_bss_get") { // reference to a synthesised function. Don't // indirect it. ret = append(ret, line) continue } if isGlobal, ok := symbols[target]; ok { newTarget := target if isGlobal { newTarget = localTargetName(target) } ret = append(ret, fmt.Sprintf("\t%s %s", parts[0], newTarget)) continue } redirectorName := "bcm_redirector_" + target ret = append(ret, fmt.Sprintf("\t%s %s", parts[0], redirectorName)) redirectors[redirectorName] = target continue case "leaq", "movq", "cmpq": if parts[0] == "movq" && strings.Contains(line, "@GOTTPOFF(%rip)") { // GOTTPOFF are offsets into the thread-local // storage that are stored in the GOT. We have // to move these relocations out of the module, // but do not know whether rax is live at this // point. Thus a normal function call might // clobber a register and so we synthesize // different functions for writing to each // target register. // // (BoringSSL itself does not use __thread // variables, but ASAN and MSAN may add these // references for their bookkeeping.) targetRegister := parts[2][1:] symbol := strings.SplitN(parts[1], "@", 2)[0] functionName := fmt.Sprintf("BORINGSSL_bcm_tpoff_to_%s_for_%s", targetRegister, symbol) threadLocalOffsets[functionName] = threadLocalOffsetFunc{target: targetRegister, symbol: symbol} ret = append(ret, "\tcallq "+functionName+"\n") continue } target := strings.SplitN(parts[1], ",", 2)[0] if strings.HasSuffix(target, "(%rip)") { target = target[:len(target)-6] if isGlobal := symbols[target]; isGlobal { line = strings.Replace(line, target, localTargetName(target), 1) } if strings.Contains(line, "@GOTPCREL") && parts[0] == "movq" { line = strings.Replace(line, "@GOTPCREL", "", -1) target = strings.Replace(target, "@GOTPCREL", "", -1) if isGlobal := symbols[target]; isGlobal { line = strings.Replace(line, target, localTargetName(target), 1) } // Nobody actually wants to read the // code of a function. This is a load // from the GOT which, now that we're // referencing the symbol directly, // needs to be transformed into an LEA. line = strings.Replace(line, "movq", "leaq", 1) } } ret = append(ret, line) continue case ".comm": p := strings.Split(parts[1], ",") name := p[0] bssAccessorsNeeded[name] = name ret = append(ret, line) case ".section": p := strings.Split(parts[1], ",") section := strings.Trim(p[0], "\"") if section == ".data.rel.ro" { // In a normal build, this is an indication of // a problem but any references from the module // to this section will result in a relocation // and thus will break the integrity check. // However, ASAN can generate these sections // and so we cannot forbid them. ret = append(ret, line) continue } sectionType, ok := sectionType(section) if !ok { panic(fmt.Sprintf("unknown section %q on line %d", section, source.lineNo)) } switch sectionType { case ".rodata", ".text": // Move .rodata to .text so it may be accessed // without a relocation. GCC with // -fmerge-constants will place strings into // separate sections, so we move all sections // named like .rodata. Also move .text.startup // so the self-test function is also in the // module. ret = append(ret, ".text # "+section) case ".data": panic(fmt.Sprintf("bad section %q on line %d", parts[1], source.lineNo)) case ".init_array", ".fini_array", ".ctors", ".dtors": // init_array/ctors/dtors contains function // pointers to constructor/destructor // functions. These contain relocations, but // they're in a different section anyway. ret = append(ret, line) case ".debug", ".note": ret = append(ret, line) case ".bss": ret = append(ret, line) var accessors map[string]string accessors, ret = handleBSSSection(ret, source) for accessor, name := range accessors { bssAccessorsNeeded[accessor] = name } default: panic(fmt.Sprintf("unknown section %q on line %d", section, source.lineNo)) } default: if symbol, ok := isSymbolDef(line); ok { if isGlobal := symbols[symbol]; isGlobal { ret = append(ret, localTargetName(symbol)+":") } } ret = append(ret, line) } } ret = append(ret, ".text") ret = append(ret, "BORINGSSL_bcm_text_end:") // Emit redirector functions. Each is a single JMP instruction. var redirectorNames []string for name := range redirectors { redirectorNames = append(redirectorNames, name) } sort.Strings(redirectorNames) for _, name := range redirectorNames { ret = append(ret, ".type "+name+", @function") ret = append(ret, name+":") ret = append(ret, "\tjmp "+redirectors[name]+"@PLT") } var accessorNames []string for accessor := range bssAccessorsNeeded { accessorNames = append(accessorNames, accessor) } sort.Strings(accessorNames) // Emit BSS accessor functions. Each is a single LEA followed by RET. for _, name := range accessorNames { funcName := accessorName(name) ret = append(ret, ".type "+funcName+", @function") ret = append(ret, funcName+":") ret = append(ret, "\tleaq "+bssAccessorsNeeded[name]+"(%rip), %rax") ret = append(ret, "\tret") } // Emit an indirect reference to OPENSSL_ia32cap_P. if ia32capAddrNeeded { ret = append(ret, ".extern OPENSSL_ia32cap_P") ret = append(ret, ".type OPENSSL_ia32cap_addr,@object") ret = append(ret, ".size OPENSSL_ia32cap_addr,8") ret = append(ret, "OPENSSL_ia32cap_addr:") ret = append(ret, "\t.quad OPENSSL_ia32cap_P") } // Emit accessors for thread-local offsets. var threadAccessorNames []string for name := range threadLocalOffsets { threadAccessorNames = append(threadAccessorNames, name) } sort.Strings(threadAccessorNames) for _, name := range threadAccessorNames { f := threadLocalOffsets[name] ret = append(ret, ".type "+name+",@function") ret = append(ret, name+":") ret = append(ret, "\tmovq "+f.symbol+"@GOTTPOFF(%rip), %"+f.target) ret = append(ret, "\tret") } // Emit an array for storing the module hash. ret = append(ret, ".type BORINGSSL_bcm_text_hash,@object") ret = append(ret, ".size OPENSSL_ia32cap_addr,32") ret = append(ret, "BORINGSSL_bcm_text_hash:") for _, b := range uninitHashValue { ret = append(ret, ".byte 0x"+strconv.FormatUint(uint64(b), 16)) } return ret } // handleBSSSection reads lines from source until the next section and adds a // local symbol for each BSS symbol found. func handleBSSSection(lines []string, source *lineSource) (map[string]string, []string) { accessors := make(map[string]string) for { line, ok := source.Next() if !ok { return accessors, lines } parts := strings.Fields(strings.TrimSpace(line)) if len(parts) == 0 { lines = append(lines, line) continue } if strings.HasSuffix(parts[0], ":") { symbol := parts[0][:len(parts[0])-1] localSymbol := ".L" + symbol + "_local_target" lines = append(lines, line) lines = append(lines, localSymbol + ":") accessors[symbol] = localSymbol continue } switch parts[0] { case ".text", ".section": source.Unread() return accessors, lines default: lines = append(lines, line) } } } // accessorName returns the name of the accessor function for a BSS symbol // named name. func accessorName(name string) string { return name + "_bss_get" } // localTargetName returns the name of the local target label for a global // symbol named name. func localTargetName(name string) string { return ".L" + name + "_local_target" } // sectionType returns the type of a section. I.e. a section called “.text.foo” // is a “.text” section. func sectionType(section string) (string, bool) { if len(section) == 0 || section[0] != '.' { return "", false } i := strings.Index(section[1:], ".") if i != -1 { section = section[:i+1] } if strings.HasPrefix(section, ".debug_") { return ".debug", true } return section, true } // asLines appends the contents of path to lines. Local symbols are renamed // using uniqueId to avoid collisions. func asLines(lines []string, path string, uniqueId int) ([]string, error) { basename := symbolRuneOrUnderscore(filepath.Base(path)) asFile, err := os.Open(path) if err != nil { return nil, err } defer asFile.Close() // localSymbols maps from the symbol name used in the input, to a // unique symbol name. localSymbols := make(map[string]string) scanner := bufio.NewScanner(asFile) var contents []string if len(lines) == 0 { // If this is the first assembly file, don't rewrite symbols. // Only all-but-one file needs to be rewritten and so time can // be saved by putting the (large) bcm.s first. for scanner.Scan() { lines = append(lines, scanner.Text()) } if err := scanner.Err(); err != nil { return nil, err } return lines, nil } for scanner.Scan() { line := scanner.Text() trimmed := strings.TrimSpace(line) if strings.HasPrefix(trimmed, ".L") && strings.HasSuffix(trimmed, ":") { symbol := trimmed[:len(trimmed)-1] mappedSymbol := fmt.Sprintf(".L%s_%d_%s", basename, uniqueId, symbol[2:]) localSymbols[symbol] = mappedSymbol contents = append(contents, mappedSymbol+":") continue } contents = append(contents, line) } if err := scanner.Err(); err != nil { return nil, err } for _, line := range contents { for symbol, mappedSymbol := range localSymbols { i := 0 for match := strings.Index(line, symbol); match >= 0; match = strings.Index(line[i:], symbol) { i += match before := ' ' if i > 0 { before, _ = utf8.DecodeLastRuneInString(line[:i]) } after, _ := utf8.DecodeRuneInString(line[i+len(symbol):]) if !symbolRune(before) && !symbolRune(after) { line = strings.Replace(line, symbol, mappedSymbol, 1) i += len(mappedSymbol) } else { i += len(symbol) } } } lines = append(lines, line) } return lines, nil } func arLines(lines []string, arPath string) ([]string, error) { arFile, err := os.Open(arPath) if err != nil { return nil, err } defer arFile.Close() ar, err := ParseAR(arFile) if err != nil { return nil, err } if len(ar) != 1 { return nil, fmt.Errorf("expected one file in archive, but found %d", len(ar)) } for _, contents := range ar { scanner := bufio.NewScanner(bytes.NewBuffer(contents)) for scanner.Scan() { lines = append(lines, scanner.Text()) } if err := scanner.Err(); err != nil { return nil, err } } return lines, nil } // validSymbolName returns true if s is a valid (non-local) name for a symbol. func validSymbolName(s string) bool { if len(s) == 0 { return false } r, n := utf8.DecodeRuneInString(s) // symbols don't start with a digit. if r == utf8.RuneError || !symbolRune(r) || ('0' <= s[0] && s[0] <= '9') { return false } return strings.IndexFunc(s[n:], func(r rune) bool { return !symbolRune(r) }) == -1 } // symbolRune returns true if r is valid in a symbol name. func symbolRune(r rune) bool { return (r >= 'a' && r <= 'z') || (r >= 'A' && r <= 'Z') || (r >= '0' && r <= '9') || r == '$' || r == '_' } // symbolRuneOrUnderscore maps s where runes valid in a symbol name map to // themselves and all other runs map to underscore. func symbolRuneOrUnderscore(s string) string { runes := make([]rune, 0, len(s)) for _, r := range s { if symbolRune(r) { runes = append(runes, r) } else { runes = append(runes, '_') } } return string(runes) }