Auto merge of #31460 - alexcrichton:supafast-rustc, r=brson
Looking at some profiles of rustc recently, these seemed like two pretty easy wins we could get in terms of performance on the table.
This commit is contained in:
commit
a888333ea6
12
mk/rt.mk
12
mk/rt.mk
@ -148,7 +148,15 @@ ifeq ($$(CFG_WINDOWSY_$(1)),1)
|
|||||||
else ifeq ($(OSTYPE_$(1)), apple-ios)
|
else ifeq ($(OSTYPE_$(1)), apple-ios)
|
||||||
JEMALLOC_ARGS_$(1) := --disable-tls
|
JEMALLOC_ARGS_$(1) := --disable-tls
|
||||||
else ifeq ($(findstring android, $(OSTYPE_$(1))), android)
|
else ifeq ($(findstring android, $(OSTYPE_$(1))), android)
|
||||||
JEMALLOC_ARGS_$(1) := --disable-tls
|
# We force android to have prefixed symbols because apparently replacement of
|
||||||
|
# the libc allocator doesn't quite work. When this was tested (unprefixed
|
||||||
|
# symbols), it was found that the `realpath` function in libc would allocate
|
||||||
|
# with libc malloc (not jemalloc malloc), and then the standard library would
|
||||||
|
# free with jemalloc free, causing a segfault.
|
||||||
|
#
|
||||||
|
# If the test suite passes, however, without symbol prefixes then we should be
|
||||||
|
# good to go!
|
||||||
|
JEMALLOC_ARGS_$(1) := --disable-tls --with-jemalloc-prefix=je_
|
||||||
endif
|
endif
|
||||||
|
|
||||||
ifdef CFG_ENABLE_DEBUG_JEMALLOC
|
ifdef CFG_ENABLE_DEBUG_JEMALLOC
|
||||||
@ -186,7 +194,7 @@ JEMALLOC_LOCAL_$(1) := $$(JEMALLOC_BUILD_DIR_$(1))/lib/$$(JEMALLOC_REAL_NAME_$(1
|
|||||||
$$(JEMALLOC_LOCAL_$(1)): $$(JEMALLOC_DEPS) $$(MKFILE_DEPS)
|
$$(JEMALLOC_LOCAL_$(1)): $$(JEMALLOC_DEPS) $$(MKFILE_DEPS)
|
||||||
@$$(call E, make: jemalloc)
|
@$$(call E, make: jemalloc)
|
||||||
cd "$$(JEMALLOC_BUILD_DIR_$(1))"; "$(S)src/jemalloc/configure" \
|
cd "$$(JEMALLOC_BUILD_DIR_$(1))"; "$(S)src/jemalloc/configure" \
|
||||||
$$(JEMALLOC_ARGS_$(1)) --with-jemalloc-prefix=je_ $(CFG_JEMALLOC_FLAGS) \
|
$$(JEMALLOC_ARGS_$(1)) $(CFG_JEMALLOC_FLAGS) \
|
||||||
--build=$$(CFG_GNU_TRIPLE_$(CFG_BUILD)) --host=$$(CFG_GNU_TRIPLE_$(1)) \
|
--build=$$(CFG_GNU_TRIPLE_$(CFG_BUILD)) --host=$$(CFG_GNU_TRIPLE_$(1)) \
|
||||||
CC="$$(CC_$(1)) $$(CFG_JEMALLOC_CFLAGS_$(1))" \
|
CC="$$(CC_$(1)) $$(CFG_JEMALLOC_CFLAGS_$(1))" \
|
||||||
AR="$$(AR_$(1))" \
|
AR="$$(AR_$(1))" \
|
||||||
|
@ -50,7 +50,7 @@ fn main() {
|
|||||||
.env("AR", &ar)
|
.env("AR", &ar)
|
||||||
.env("RANLIB", format!("{} s", ar.display()));
|
.env("RANLIB", format!("{} s", ar.display()));
|
||||||
|
|
||||||
if target.contains("windows-gnu") {
|
if target.contains("windows") {
|
||||||
// A bit of history here, this used to be --enable-lazy-lock added in
|
// A bit of history here, this used to be --enable-lazy-lock added in
|
||||||
// #14006 which was filed with jemalloc in jemalloc/jemalloc#83 which
|
// #14006 which was filed with jemalloc in jemalloc/jemalloc#83 which
|
||||||
// was also reported to MinGW:
|
// was also reported to MinGW:
|
||||||
@ -72,7 +72,19 @@ fn main() {
|
|||||||
// locking, but requires passing an option due to a historical
|
// locking, but requires passing an option due to a historical
|
||||||
// default with jemalloc.
|
// default with jemalloc.
|
||||||
cmd.arg("--disable-lazy-lock");
|
cmd.arg("--disable-lazy-lock");
|
||||||
} else if target.contains("ios") || target.contains("android") {
|
} else if target.contains("ios") {
|
||||||
|
cmd.arg("--disable-tls");
|
||||||
|
} else if target.contains("android") {
|
||||||
|
// We force android to have prefixed symbols because apparently
|
||||||
|
// replacement of the libc allocator doesn't quite work. When this was
|
||||||
|
// tested (unprefixed symbols), it was found that the `realpath`
|
||||||
|
// function in libc would allocate with libc malloc (not jemalloc
|
||||||
|
// malloc), and then the standard library would free with jemalloc free,
|
||||||
|
// causing a segfault.
|
||||||
|
//
|
||||||
|
// If the test suite passes, however, without symbol prefixes then we
|
||||||
|
// should be good to go!
|
||||||
|
cmd.arg("--with-jemalloc-prefix=je_");
|
||||||
cmd.arg("--disable-tls");
|
cmd.arg("--disable-tls");
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -82,7 +94,6 @@ fn main() {
|
|||||||
|
|
||||||
// Turn off broken quarantine (see jemalloc/jemalloc#161)
|
// Turn off broken quarantine (see jemalloc/jemalloc#161)
|
||||||
cmd.arg("--disable-fill");
|
cmd.arg("--disable-fill");
|
||||||
cmd.arg("--with-jemalloc-prefix=je_");
|
|
||||||
cmd.arg(format!("--host={}", build_helper::gnu_target(&target)));
|
cmd.arg(format!("--host={}", build_helper::gnu_target(&target)));
|
||||||
cmd.arg(format!("--build={}", build_helper::gnu_target(&host)));
|
cmd.arg(format!("--build={}", build_helper::gnu_target(&host)));
|
||||||
|
|
||||||
|
@ -41,12 +41,25 @@ use libc::{c_int, c_void, size_t};
|
|||||||
#[cfg(not(cargobuild))]
|
#[cfg(not(cargobuild))]
|
||||||
extern {}
|
extern {}
|
||||||
|
|
||||||
|
// Note that the symbols here are prefixed by default on OSX (we don't
|
||||||
|
// explicitly request it), and on Android we explicitly request it as
|
||||||
|
// unprefixing cause segfaults (mismatches in allocators).
|
||||||
extern {
|
extern {
|
||||||
fn je_mallocx(size: size_t, flags: c_int) -> *mut c_void;
|
#[cfg_attr(any(target_os = "macos", target_os = "android"),
|
||||||
fn je_rallocx(ptr: *mut c_void, size: size_t, flags: c_int) -> *mut c_void;
|
link_name = "je_mallocx")]
|
||||||
fn je_xallocx(ptr: *mut c_void, size: size_t, extra: size_t, flags: c_int) -> size_t;
|
fn mallocx(size: size_t, flags: c_int) -> *mut c_void;
|
||||||
fn je_sdallocx(ptr: *mut c_void, size: size_t, flags: c_int);
|
#[cfg_attr(any(target_os = "macos", target_os = "android"),
|
||||||
fn je_nallocx(size: size_t, flags: c_int) -> size_t;
|
link_name = "je_rallocx")]
|
||||||
|
fn rallocx(ptr: *mut c_void, size: size_t, flags: c_int) -> *mut c_void;
|
||||||
|
#[cfg_attr(any(target_os = "macos", target_os = "android"),
|
||||||
|
link_name = "je_xallocx")]
|
||||||
|
fn xallocx(ptr: *mut c_void, size: size_t, extra: size_t, flags: c_int) -> size_t;
|
||||||
|
#[cfg_attr(any(target_os = "macos", target_os = "android"),
|
||||||
|
link_name = "je_sdallocx")]
|
||||||
|
fn sdallocx(ptr: *mut c_void, size: size_t, flags: c_int);
|
||||||
|
#[cfg_attr(any(target_os = "macos", target_os = "android"),
|
||||||
|
link_name = "je_nallocx")]
|
||||||
|
fn nallocx(size: size_t, flags: c_int) -> size_t;
|
||||||
}
|
}
|
||||||
|
|
||||||
// The minimum alignment guaranteed by the architecture. This value is used to
|
// The minimum alignment guaranteed by the architecture. This value is used to
|
||||||
@ -78,7 +91,7 @@ fn align_to_flags(align: usize) -> c_int {
|
|||||||
#[no_mangle]
|
#[no_mangle]
|
||||||
pub extern "C" fn __rust_allocate(size: usize, align: usize) -> *mut u8 {
|
pub extern "C" fn __rust_allocate(size: usize, align: usize) -> *mut u8 {
|
||||||
let flags = align_to_flags(align);
|
let flags = align_to_flags(align);
|
||||||
unsafe { je_mallocx(size as size_t, flags) as *mut u8 }
|
unsafe { mallocx(size as size_t, flags) as *mut u8 }
|
||||||
}
|
}
|
||||||
|
|
||||||
#[no_mangle]
|
#[no_mangle]
|
||||||
@ -88,7 +101,7 @@ pub extern "C" fn __rust_reallocate(ptr: *mut u8,
|
|||||||
align: usize)
|
align: usize)
|
||||||
-> *mut u8 {
|
-> *mut u8 {
|
||||||
let flags = align_to_flags(align);
|
let flags = align_to_flags(align);
|
||||||
unsafe { je_rallocx(ptr as *mut c_void, size as size_t, flags) as *mut u8 }
|
unsafe { rallocx(ptr as *mut c_void, size as size_t, flags) as *mut u8 }
|
||||||
}
|
}
|
||||||
|
|
||||||
#[no_mangle]
|
#[no_mangle]
|
||||||
@ -98,19 +111,19 @@ pub extern "C" fn __rust_reallocate_inplace(ptr: *mut u8,
|
|||||||
align: usize)
|
align: usize)
|
||||||
-> usize {
|
-> usize {
|
||||||
let flags = align_to_flags(align);
|
let flags = align_to_flags(align);
|
||||||
unsafe { je_xallocx(ptr as *mut c_void, size as size_t, 0, flags) as usize }
|
unsafe { xallocx(ptr as *mut c_void, size as size_t, 0, flags) as usize }
|
||||||
}
|
}
|
||||||
|
|
||||||
#[no_mangle]
|
#[no_mangle]
|
||||||
pub extern "C" fn __rust_deallocate(ptr: *mut u8, old_size: usize, align: usize) {
|
pub extern "C" fn __rust_deallocate(ptr: *mut u8, old_size: usize, align: usize) {
|
||||||
let flags = align_to_flags(align);
|
let flags = align_to_flags(align);
|
||||||
unsafe { je_sdallocx(ptr as *mut c_void, old_size as size_t, flags) }
|
unsafe { sdallocx(ptr as *mut c_void, old_size as size_t, flags) }
|
||||||
}
|
}
|
||||||
|
|
||||||
#[no_mangle]
|
#[no_mangle]
|
||||||
pub extern "C" fn __rust_usable_size(size: usize, align: usize) -> usize {
|
pub extern "C" fn __rust_usable_size(size: usize, align: usize) -> usize {
|
||||||
let flags = align_to_flags(align);
|
let flags = align_to_flags(align);
|
||||||
unsafe { je_nallocx(size as size_t, flags) as usize }
|
unsafe { nallocx(size as size_t, flags) as usize }
|
||||||
}
|
}
|
||||||
|
|
||||||
// These symbols are used by jemalloc on android but the really old android
|
// These symbols are used by jemalloc on android but the really old android
|
||||||
|
@ -35,10 +35,12 @@ pub fn FnvHashSet<V: Hash + Eq>() -> FnvHashSet<V> {
|
|||||||
pub struct FnvHasher(u64);
|
pub struct FnvHasher(u64);
|
||||||
|
|
||||||
impl Default for FnvHasher {
|
impl Default for FnvHasher {
|
||||||
|
#[inline]
|
||||||
fn default() -> FnvHasher { FnvHasher(0xcbf29ce484222325) }
|
fn default() -> FnvHasher { FnvHasher(0xcbf29ce484222325) }
|
||||||
}
|
}
|
||||||
|
|
||||||
impl Hasher for FnvHasher {
|
impl Hasher for FnvHasher {
|
||||||
|
#[inline]
|
||||||
fn write(&mut self, bytes: &[u8]) {
|
fn write(&mut self, bytes: &[u8]) {
|
||||||
let FnvHasher(mut hash) = *self;
|
let FnvHasher(mut hash) = *self;
|
||||||
for byte in bytes {
|
for byte in bytes {
|
||||||
@ -47,5 +49,7 @@ impl Hasher for FnvHasher {
|
|||||||
}
|
}
|
||||||
*self = FnvHasher(hash);
|
*self = FnvHasher(hash);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#[inline]
|
||||||
fn finish(&self) -> u64 { self.0 }
|
fn finish(&self) -> u64 { self.0 }
|
||||||
}
|
}
|
||||||
|
@ -1253,7 +1253,11 @@ fn add_upstream_rust_crates(cmd: &mut Linker, sess: &Session,
|
|||||||
|
|
||||||
if any_objects {
|
if any_objects {
|
||||||
archive.build();
|
archive.build();
|
||||||
|
if dylib {
|
||||||
cmd.link_whole_rlib(&fix_windows_verbatim_for_gcc(&dst));
|
cmd.link_whole_rlib(&fix_windows_verbatim_for_gcc(&dst));
|
||||||
|
} else {
|
||||||
|
cmd.link_rlib(&fix_windows_verbatim_for_gcc(&dst));
|
||||||
|
}
|
||||||
}
|
}
|
||||||
});
|
});
|
||||||
}
|
}
|
||||||
|
18
src/test/run-make/lto-no-link-whole-rlib/Makefile
Normal file
18
src/test/run-make/lto-no-link-whole-rlib/Makefile
Normal file
@ -0,0 +1,18 @@
|
|||||||
|
# Copyright 2016 The Rust Project Developers. See the COPYRIGHT
|
||||||
|
# file at the top-level directory of this distribution and at
|
||||||
|
# http://rust-lang.org/COPYRIGHT.
|
||||||
|
#
|
||||||
|
# Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
|
||||||
|
# http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
|
||||||
|
# <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
|
||||||
|
# option. This file may not be copied, modified, or distributed
|
||||||
|
# except according to those terms.
|
||||||
|
|
||||||
|
-include ../tools.mk
|
||||||
|
|
||||||
|
all: $(call NATIVE_STATICLIB,foo) $(call NATIVE_STATICLIB,bar)
|
||||||
|
$(RUSTC) lib1.rs
|
||||||
|
$(RUSTC) lib2.rs
|
||||||
|
$(RUSTC) main.rs -Clto
|
||||||
|
$(call RUN,main)
|
||||||
|
|
13
src/test/run-make/lto-no-link-whole-rlib/bar.c
Normal file
13
src/test/run-make/lto-no-link-whole-rlib/bar.c
Normal file
@ -0,0 +1,13 @@
|
|||||||
|
// Copyright 2016 The Rust Project Developers. See the COPYRIGHT
|
||||||
|
// file at the top-level directory of this distribution and at
|
||||||
|
// http://rust-lang.org/COPYRIGHT.
|
||||||
|
//
|
||||||
|
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
|
||||||
|
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
|
||||||
|
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
|
||||||
|
// option. This file may not be copied, modified, or distributed
|
||||||
|
// except according to those terms.
|
||||||
|
|
||||||
|
int foo() {
|
||||||
|
return 2;
|
||||||
|
}
|
13
src/test/run-make/lto-no-link-whole-rlib/foo.c
Normal file
13
src/test/run-make/lto-no-link-whole-rlib/foo.c
Normal file
@ -0,0 +1,13 @@
|
|||||||
|
// Copyright 2016 The Rust Project Developers. See the COPYRIGHT
|
||||||
|
// file at the top-level directory of this distribution and at
|
||||||
|
// http://rust-lang.org/COPYRIGHT.
|
||||||
|
//
|
||||||
|
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
|
||||||
|
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
|
||||||
|
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
|
||||||
|
// option. This file may not be copied, modified, or distributed
|
||||||
|
// except according to those terms.
|
||||||
|
|
||||||
|
int foo() {
|
||||||
|
return 1;
|
||||||
|
}
|
20
src/test/run-make/lto-no-link-whole-rlib/lib1.rs
Normal file
20
src/test/run-make/lto-no-link-whole-rlib/lib1.rs
Normal file
@ -0,0 +1,20 @@
|
|||||||
|
// Copyright 2016 The Rust Project Developers. See the COPYRIGHT
|
||||||
|
// file at the top-level directory of this distribution and at
|
||||||
|
// http://rust-lang.org/COPYRIGHT.
|
||||||
|
//
|
||||||
|
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
|
||||||
|
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
|
||||||
|
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
|
||||||
|
// option. This file may not be copied, modified, or distributed
|
||||||
|
// except according to those terms.
|
||||||
|
|
||||||
|
#![crate_type = "rlib"]
|
||||||
|
|
||||||
|
#[link(name = "foo", kind = "static")]
|
||||||
|
extern {
|
||||||
|
fn foo() -> i32;
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn foo1() -> i32 {
|
||||||
|
unsafe { foo() }
|
||||||
|
}
|
23
src/test/run-make/lto-no-link-whole-rlib/lib2.rs
Normal file
23
src/test/run-make/lto-no-link-whole-rlib/lib2.rs
Normal file
@ -0,0 +1,23 @@
|
|||||||
|
// Copyright 2016 The Rust Project Developers. See the COPYRIGHT
|
||||||
|
// file at the top-level directory of this distribution and at
|
||||||
|
// http://rust-lang.org/COPYRIGHT.
|
||||||
|
//
|
||||||
|
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
|
||||||
|
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
|
||||||
|
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
|
||||||
|
// option. This file may not be copied, modified, or distributed
|
||||||
|
// except according to those terms.
|
||||||
|
|
||||||
|
#![crate_type = "rlib"]
|
||||||
|
|
||||||
|
extern crate lib1;
|
||||||
|
|
||||||
|
#[link(name = "bar", kind = "static")]
|
||||||
|
extern {
|
||||||
|
fn foo() -> i32;
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn foo2() -> i32 {
|
||||||
|
unsafe { foo() }
|
||||||
|
}
|
||||||
|
|
17
src/test/run-make/lto-no-link-whole-rlib/main.rs
Normal file
17
src/test/run-make/lto-no-link-whole-rlib/main.rs
Normal file
@ -0,0 +1,17 @@
|
|||||||
|
// Copyright 2016 The Rust Project Developers. See the COPYRIGHT
|
||||||
|
// file at the top-level directory of this distribution and at
|
||||||
|
// http://rust-lang.org/COPYRIGHT.
|
||||||
|
//
|
||||||
|
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
|
||||||
|
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
|
||||||
|
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
|
||||||
|
// option. This file may not be copied, modified, or distributed
|
||||||
|
// except according to those terms.
|
||||||
|
|
||||||
|
extern crate lib1;
|
||||||
|
extern crate lib2;
|
||||||
|
|
||||||
|
fn main() {
|
||||||
|
assert_eq!(lib1::foo1(), 2);
|
||||||
|
assert_eq!(lib2::foo2(), 2);
|
||||||
|
}
|
Loading…
Reference in New Issue
Block a user