auto merge of #14075 : Rufflewind/rust/patch-3, r=alexcrichton

- Use Unicode-aware versions of `CreateProcess` (Fixes #13815) and `Get/FreeEnvironmentStrings`.
    - Includes a helper function `os::win32::as_mut_utf16_p`, which does the same thing as `os::win32::as_utf16_p` except the pointer is mutable.
    - Fixed `make_command_line` to handle Unicode correctly.
- Tests for the above.
This commit is contained in:
bors 2014-05-13 16:01:48 -07:00
commit cb115ac2d4
4 changed files with 153 additions and 32 deletions

View File

@ -208,7 +208,7 @@ pub use funcs::bsd43::{shutdown};
#[cfg(windows)] pub use consts::os::extra::{TRUE, FALSE, INFINITE}; #[cfg(windows)] pub use consts::os::extra::{TRUE, FALSE, INFINITE};
#[cfg(windows)] pub use consts::os::extra::{PROCESS_TERMINATE, PROCESS_QUERY_INFORMATION}; #[cfg(windows)] pub use consts::os::extra::{PROCESS_TERMINATE, PROCESS_QUERY_INFORMATION};
#[cfg(windows)] pub use consts::os::extra::{STILL_ACTIVE, DETACHED_PROCESS}; #[cfg(windows)] pub use consts::os::extra::{STILL_ACTIVE, DETACHED_PROCESS};
#[cfg(windows)] pub use consts::os::extra::{CREATE_NEW_PROCESS_GROUP}; #[cfg(windows)] pub use consts::os::extra::{CREATE_NEW_PROCESS_GROUP, CREATE_UNICODE_ENVIRONMENT};
#[cfg(windows)] pub use consts::os::extra::{FILE_BEGIN, FILE_END, FILE_CURRENT}; #[cfg(windows)] pub use consts::os::extra::{FILE_BEGIN, FILE_END, FILE_CURRENT};
#[cfg(windows)] pub use consts::os::extra::{FILE_GENERIC_READ, FILE_GENERIC_WRITE}; #[cfg(windows)] pub use consts::os::extra::{FILE_GENERIC_READ, FILE_GENERIC_WRITE};
#[cfg(windows)] pub use consts::os::extra::{FILE_SHARE_READ, FILE_SHARE_WRITE, FILE_SHARE_DELETE}; #[cfg(windows)] pub use consts::os::extra::{FILE_SHARE_READ, FILE_SHARE_WRITE, FILE_SHARE_DELETE};
@ -1937,6 +1937,7 @@ pub mod consts {
pub static DETACHED_PROCESS: DWORD = 0x00000008; pub static DETACHED_PROCESS: DWORD = 0x00000008;
pub static CREATE_NEW_PROCESS_GROUP: DWORD = 0x00000200; pub static CREATE_NEW_PROCESS_GROUP: DWORD = 0x00000200;
pub static CREATE_UNICODE_ENVIRONMENT: DWORD = 0x00000400;
pub static PIPE_ACCESS_DUPLEX: DWORD = 0x00000003; pub static PIPE_ACCESS_DUPLEX: DWORD = 0x00000003;
pub static PIPE_ACCESS_INBOUND: DWORD = 0x00000001; pub static PIPE_ACCESS_INBOUND: DWORD = 0x00000001;
@ -4193,8 +4194,8 @@ pub mod funcs {
pub mod kernel32 { pub mod kernel32 {
use types::os::arch::c95::{c_uint}; use types::os::arch::c95::{c_uint};
use types::os::arch::extra::{BOOL, DWORD, SIZE_T, HMODULE, use types::os::arch::extra::{BOOL, DWORD, SIZE_T, HMODULE,
LPCWSTR, LPWSTR, LPCSTR, LPSTR, LPCWSTR, LPWSTR,
LPCH, LPDWORD, LPVOID, LPWCH, LPDWORD, LPVOID,
LPCVOID, LPOVERLAPPED, LPCVOID, LPOVERLAPPED,
LPSECURITY_ATTRIBUTES, LPSECURITY_ATTRIBUTES,
LPSTARTUPINFO, LPSTARTUPINFO,
@ -4211,8 +4212,8 @@ pub mod funcs {
-> DWORD; -> DWORD;
pub fn SetEnvironmentVariableW(n: LPCWSTR, v: LPCWSTR) pub fn SetEnvironmentVariableW(n: LPCWSTR, v: LPCWSTR)
-> BOOL; -> BOOL;
pub fn GetEnvironmentStringsA() -> LPCH; pub fn GetEnvironmentStringsW() -> LPWCH;
pub fn FreeEnvironmentStringsA(env_ptr: LPCH) -> BOOL; pub fn FreeEnvironmentStringsW(env_ptr: LPWCH) -> BOOL;
pub fn GetModuleFileNameW(hModule: HMODULE, pub fn GetModuleFileNameW(hModule: HMODULE,
lpFilename: LPWSTR, lpFilename: LPWSTR,
nSize: DWORD) nSize: DWORD)
@ -4251,8 +4252,8 @@ pub mod funcs {
dwProcessId: DWORD) dwProcessId: DWORD)
-> HANDLE; -> HANDLE;
pub fn GetCurrentProcess() -> HANDLE; pub fn GetCurrentProcess() -> HANDLE;
pub fn CreateProcessA(lpApplicationName: LPCSTR, pub fn CreateProcessW(lpApplicationName: LPCWSTR,
lpCommandLine: LPSTR, lpCommandLine: LPWSTR,
lpProcessAttributes: lpProcessAttributes:
LPSECURITY_ATTRIBUTES, LPSECURITY_ATTRIBUTES,
lpThreadAttributes: lpThreadAttributes:
@ -4260,7 +4261,7 @@ pub mod funcs {
bInheritHandles: BOOL, bInheritHandles: BOOL,
dwCreationFlags: DWORD, dwCreationFlags: DWORD,
lpEnvironment: LPVOID, lpEnvironment: LPVOID,
lpCurrentDirectory: LPCSTR, lpCurrentDirectory: LPCWSTR,
lpStartupInfo: LPSTARTUPINFO, lpStartupInfo: LPSTARTUPINFO,
lpProcessInformation: lpProcessInformation:
LPPROCESS_INFORMATION) LPPROCESS_INFORMATION)

View File

@ -258,7 +258,7 @@ fn spawn_process_os(config: p::ProcessConfig,
GetCurrentProcess, GetCurrentProcess,
DuplicateHandle, DuplicateHandle,
CloseHandle, CloseHandle,
CreateProcessA CreateProcessW
}; };
use libc::funcs::extra::msvcrt::get_osfhandle; use libc::funcs::extra::msvcrt::get_osfhandle;
@ -318,15 +318,15 @@ fn spawn_process_os(config: p::ProcessConfig,
let mut create_err = None; let mut create_err = None;
// stolen from the libuv code. // stolen from the libuv code.
let mut flags = 0; let mut flags = libc::CREATE_UNICODE_ENVIRONMENT;
if config.detach { if config.detach {
flags |= libc::DETACHED_PROCESS | libc::CREATE_NEW_PROCESS_GROUP; flags |= libc::DETACHED_PROCESS | libc::CREATE_NEW_PROCESS_GROUP;
} }
with_envp(env, |envp| { with_envp(env, |envp| {
with_dirp(dir, |dirp| { with_dirp(dir, |dirp| {
cmd.with_c_str(|cmdp| { os::win32::as_mut_utf16_p(cmd, |cmdp| {
let created = CreateProcessA(ptr::null(), mem::transmute(cmdp), let created = CreateProcessW(ptr::null(), cmdp,
ptr::mut_null(), ptr::mut_null(), TRUE, ptr::mut_null(), ptr::mut_null(), TRUE,
flags, envp, dirp, &mut si, flags, envp, dirp, &mut si,
&mut pi); &mut pi);
@ -409,16 +409,17 @@ fn make_command_line(prog: &str, args: &[~str]) -> ~str {
if quote { if quote {
cmd.push_char('"'); cmd.push_char('"');
} }
for i in range(0u, arg.len()) { let argvec: Vec<char> = arg.chars().collect();
append_char_at(cmd, arg, i); for i in range(0u, argvec.len()) {
append_char_at(cmd, &argvec, i);
} }
if quote { if quote {
cmd.push_char('"'); cmd.push_char('"');
} }
} }
fn append_char_at(cmd: &mut StrBuf, arg: &str, i: uint) { fn append_char_at(cmd: &mut StrBuf, arg: &Vec<char>, i: uint) {
match arg[i] as char { match *arg.get(i) {
'"' => { '"' => {
// Escape quotes. // Escape quotes.
cmd.push_str("\\\""); cmd.push_str("\\\"");
@ -438,11 +439,11 @@ fn make_command_line(prog: &str, args: &[~str]) -> ~str {
} }
} }
fn backslash_run_ends_in_quote(s: &str, mut i: uint) -> bool { fn backslash_run_ends_in_quote(s: &Vec<char>, mut i: uint) -> bool {
while i < s.len() && s[i] as char == '\\' { while i < s.len() && *s.get(i) == '\\' {
i += 1; i += 1;
} }
return i < s.len() && s[i] as char == '"'; return i < s.len() && *s.get(i) == '"';
} }
} }
@ -691,7 +692,7 @@ fn with_envp<T>(env: Option<~[(~str, ~str)]>, cb: |*mut c_void| -> T) -> T {
for pair in env.iter() { for pair in env.iter() {
let kv = format!("{}={}", *pair.ref0(), *pair.ref1()); let kv = format!("{}={}", *pair.ref0(), *pair.ref1());
blk.push_all(kv.as_bytes()); blk.push_all(kv.to_utf16().as_slice());
blk.push(0); blk.push(0);
} }
@ -704,9 +705,12 @@ fn with_envp<T>(env: Option<~[(~str, ~str)]>, cb: |*mut c_void| -> T) -> T {
} }
#[cfg(windows)] #[cfg(windows)]
fn with_dirp<T>(d: Option<&Path>, cb: |*libc::c_char| -> T) -> T { fn with_dirp<T>(d: Option<&Path>, cb: |*u16| -> T) -> T {
match d { match d {
Some(dir) => dir.with_c_str(|buf| cb(buf)), Some(dir) => match dir.as_str() {
Some(dir_str) => os::win32::as_utf16_p(dir_str, cb),
None => cb(ptr::null())
},
None => cb(ptr::null()) None => cb(ptr::null())
} }
} }
@ -860,5 +864,9 @@ mod tests {
make_command_line("echo", ["a b c".to_owned()]), make_command_line("echo", ["a b c".to_owned()]),
"echo \"a b c\"".to_owned() "echo \"a b c\"".to_owned()
); );
assert_eq!(
make_command_line("\u03c0\u042f\u97f3\u00e6\u221e", []),
"\u03c0\u042f\u97f3\u00e6\u221e".to_owned()
);
} }
} }

View File

@ -31,7 +31,7 @@
use clone::Clone; use clone::Clone;
use container::Container; use container::Container;
use libc; use libc;
use libc::{c_char, c_void, c_int}; use libc::{c_void, c_int};
use option::{Some, None, Option}; use option::{Some, None, Option};
use os; use os;
use ops::Drop; use ops::Drop;
@ -49,6 +49,8 @@ use vec::Vec;
#[cfg(unix)] #[cfg(unix)]
use c_str::ToCStr; use c_str::ToCStr;
#[cfg(unix)]
use libc::c_char;
#[cfg(windows)] #[cfg(windows)]
use str::OwnedStr; use str::OwnedStr;
@ -141,10 +143,14 @@ pub mod win32 {
} }
pub fn as_utf16_p<T>(s: &str, f: |*u16| -> T) -> T { pub fn as_utf16_p<T>(s: &str, f: |*u16| -> T) -> T {
as_mut_utf16_p(s, |t| { f(t as *u16) })
}
pub fn as_mut_utf16_p<T>(s: &str, f: |*mut u16| -> T) -> T {
let mut t = s.to_utf16(); let mut t = s.to_utf16();
// Null terminate before passing on. // Null terminate before passing on.
t.push(0u16); t.push(0u16);
f(t.as_ptr()) f(t.as_mut_ptr())
} }
} }
@ -182,22 +188,42 @@ pub fn env_as_bytes() -> Vec<(~[u8],~[u8])> {
unsafe { unsafe {
#[cfg(windows)] #[cfg(windows)]
unsafe fn get_env_pairs() -> Vec<~[u8]> { unsafe fn get_env_pairs() -> Vec<~[u8]> {
use c_str; use slice::raw;
use libc::funcs::extra::kernel32::{ use libc::funcs::extra::kernel32::{
GetEnvironmentStringsA, GetEnvironmentStringsW,
FreeEnvironmentStringsA FreeEnvironmentStringsW
}; };
let ch = GetEnvironmentStringsA(); let ch = GetEnvironmentStringsW();
if ch as uint == 0 { if ch as uint == 0 {
fail!("os::env() failure getting env string from OS: {}", fail!("os::env() failure getting env string from OS: {}",
os::last_os_error()); os::last_os_error());
} }
// Here, we lossily decode the string as UTF16.
//
// The docs suggest that the result should be in Unicode, but
// Windows doesn't guarantee it's actually UTF16 -- it doesn't
// validate the environment string passed to CreateProcess nor
// SetEnvironmentVariable. Yet, it's unlikely that returning a
// raw u16 buffer would be of practical use since the result would
// be inherently platform-dependent and introduce additional
// complexity to this code.
//
// Using the non-Unicode version of GetEnvironmentStrings is even
// worse since the result is in an OEM code page. Characters that
// can't be encoded in the code page would be turned into question
// marks.
let mut result = Vec::new(); let mut result = Vec::new();
c_str::from_c_multistring(ch as *c_char, None, |cstr| { let mut i = 0;
result.push(cstr.as_bytes_no_nul().to_owned()); while *ch.offset(i) != 0 {
}); let p = &*ch.offset(i);
FreeEnvironmentStringsA(ch); let len = ptr::position(p, |c| *c == 0);
raw::buf_as_slice(p, len, |s| {
result.push(str::from_utf16_lossy(s).into_bytes());
});
i += len as int + 1;
}
FreeEnvironmentStringsW(ch);
result result
} }
#[cfg(unix)] #[cfg(unix)]

View File

@ -0,0 +1,86 @@
// Copyright 2014 The Rust Project Developers. See the COPYRIGHT
// file at the top-level directory of this distribution and at
// http://rust-lang.org/COPYRIGHT.
//
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
// option. This file may not be copied, modified, or distributed
// except according to those terms.
// no-prefer-dynamic
// The test copies itself into a subdirectory with a non-ASCII name and then
// runs it as a child process within the subdirectory. The parent process
// also adds an environment variable and an argument, both containing
// non-ASCII characters. The child process ensures all the strings are
// intact.
extern crate native;
use std::io;
use std::io::fs;
use std::io::process::Process;
use std::io::process::ProcessConfig;
use std::os;
use std::path::Path;
fn main() {
let my_args = os::args();
let my_cwd = os::getcwd();
let my_env = os::env();
let my_path = Path::new(os::self_exe_name().unwrap());
let my_dir = my_path.dir_path();
let my_ext = my_path.extension_str().unwrap_or("");
// some non-ASCII characters
let blah = "\u03c0\u042f\u97f3\u00e6\u221e";
let child_name = "child";
let child_dir = "process-spawn-with-unicode-params-" + blah;
// parameters sent to child / expected to be received from parent
let arg = blah;
let cwd = my_dir.join(Path::new(child_dir.clone()));
let env = ("RUST_TEST_PROC_SPAWN_UNICODE".to_owned(), blah.to_owned());
// am I the parent or the child?
if my_args.len() == 1 { // parent
let child_filestem = Path::new(child_name);
let child_filename = child_filestem.with_extension(my_ext);
let child_path = cwd.join(child_filename.clone());
// make a separate directory for the child
drop(fs::mkdir(&cwd, io::UserRWX).is_ok());
assert!(fs::copy(&my_path, &child_path).is_ok());
// run child
let p = Process::configure(ProcessConfig {
program: child_path.as_str().unwrap(),
args: [arg.to_owned()],
cwd: Some(&cwd),
env: Some(my_env.append_one(env).as_slice()),
.. ProcessConfig::new()
}).unwrap().wait_with_output();
// display the output
assert!(io::stdout().write(p.output.as_slice()).is_ok());
assert!(io::stderr().write(p.error.as_slice()).is_ok());
// make sure the child succeeded
assert!(p.status.success());
} else { // child
// check working directory (don't try to compare with `cwd` here!)
assert!(my_cwd.ends_with_path(&Path::new(child_dir)));
// check arguments
assert_eq!(my_args.get(1).as_slice(), arg);
// check environment variable
assert!(my_env.contains(&env));
};
}