2012-02-28 10:51:25 -05:00
|
|
|
#include "ruby/ruby.h"
|
2012-08-23 23:44:56 -04:00
|
|
|
#include "ruby/encoding.h"
|
* include/ruby/ruby.h: constify RBasic::klass and add
RBASIC_CLASS(obj) macro which returns a class of `obj'.
This change is a part of RGENGC branch [ruby-trunk - Feature #8339].
* object.c: add new function rb_obj_reveal().
This function reveals an internal (hidden) object that was hidden by rb_obj_hide().
Note that the class must not be changed between hiding and revealing.
Only permitted example is:
klass = RBASIC_CLASS(obj);
rb_obj_hide(obj);
....
rb_obj_reveal(obj, klass);
TODO: API design. rb_obj_reveal() should be replaced with others.
TODO: modifying constified variables through a cast may be harmful for
the compiler's analysis and optimization.
Any idea how to prohibit assigning to RBasic::klass directly?
If rename RBasic::klass and force to use RBASIC_CLASS(obj),
then all codes such as `RBASIC(obj)->klass' will be
compilation error. Is it acceptable? (We have similar
experience at Ruby 1.9,
for example "RARRAY(ary)->ptr" to "RARRAY_PTR(ary)".
* internal.h: add some macros.
* RBASIC_CLEAR_CLASS(obj) clear RBasic::klass to make it internal
object.
* RBASIC_SET_CLASS(obj, cls) set RBasic::klass.
* RBASIC_SET_CLASS_RAW(obj, cls) same as RBASIC_SET_CLASS
without write barrier (planned).
* RCLASS_SET_SUPER(a, b) set super class of a.
* array.c, class.c, compile.c, encoding.c, enum.c, error.c, eval.c,
file.c, gc.c, hash.c, io.c, iseq.c, marshal.c, object.c,
parse.y, proc.c, process.c, random.c, ruby.c, sprintf.c,
string.c, thread.c, transcode.c, vm.c, vm_eval.c, win32/file.c:
Use above macros and functions to access RBasic::klass.
* ext/coverage/coverage.c, ext/readline/readline.c,
ext/socket/ancdata.c, ext/socket/init.c,
* ext/zlib/zlib.c: ditto.
git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@40691 b2dd03c8-39d4-4d8f-98ff-823fe69b080e
2013-05-13 06:49:11 -04:00
|
|
|
#include "internal.h"
|
2012-02-28 10:51:25 -05:00
|
|
|
#include <winbase.h>
|
2012-08-23 23:44:56 -04:00
|
|
|
#include <wchar.h>
|
|
|
|
#include <shlwapi.h>
|
2012-02-28 10:51:25 -05:00
|
|
|
|
2012-04-18 01:50:45 -04:00
|
|
|
#ifndef INVALID_FILE_ATTRIBUTES
|
|
|
|
# define INVALID_FILE_ATTRIBUTES ((DWORD)-1)
|
|
|
|
#endif
|
|
|
|
|
2012-08-23 23:44:56 -04:00
|
|
|
/* cache 'encoding name' => 'code page' into a hash */
|
2013-10-19 06:59:06 -04:00
|
|
|
static struct code_page_table {
|
|
|
|
USHORT *table;
|
|
|
|
unsigned int count;
|
|
|
|
} rb_code_page;
|
2012-08-23 23:44:56 -04:00
|
|
|
|
|
|
|
#define IS_DIR_SEPARATOR_P(c) (c == L'\\' || c == L'/')
|
|
|
|
#define IS_DIR_UNC_P(c) (IS_DIR_SEPARATOR_P(c[0]) && IS_DIR_SEPARATOR_P(c[1]))
|
|
|
|
|
|
|
|
/* MultiByteToWideChar() doesn't work with code page 51932 */
|
|
|
|
#define INVALID_CODE_PAGE 51932
|
|
|
|
#define PATH_BUFFER_SIZE MAX_PATH * 2
|
|
|
|
|
|
|
|
#define insecure_obj_p(obj, level) ((level) >= 4 || ((level) > 0 && OBJ_TAINTED(obj)))
|
|
|
|
|
2014-08-09 06:10:11 -04:00
|
|
|
/* defined in win32/win32.c */
|
|
|
|
#define system_code_page rb_w32_filecp
|
|
|
|
#define mbstr_to_wstr rb_w32_mbstr_to_wstr
|
|
|
|
#define wstr_to_mbstr rb_w32_wstr_to_mbstr
|
|
|
|
UINT rb_w32_filecp(void);
|
|
|
|
WCHAR *rb_w32_mbstr_to_wstr(UINT, const char *, int, long *);
|
|
|
|
char *rb_w32_wstr_to_mbstr(UINT, const WCHAR *, int, long *);
|
|
|
|
|
2012-08-23 23:44:56 -04:00
|
|
|
/*
 * Replace, in place, every occurrence of the character `find` in the
 * NUL-terminated wide string `s` with the character `replace`.
 */
static inline void
replace_wchar(wchar_t *s, int find, int replace)
{
    wchar_t *cursor;

    for (cursor = s; *cursor != 0; cursor++) {
        if (*cursor == find) {
            *cursor = replace;
        }
    }
}
|
|
|
|
|
|
|
|
/*
  Return the user's home directory built from environment variables.

  The first of the following that is set is used:
    1. HOME
    2. HOMEDRIVE followed by HOMEPATH
    3. USERPROFILE
  If HOMEDRIVE is set but HOMEPATH is not, no further variable is tried and
  NULL is returned.

  Backslashes in the result are replaced with forward slashes.

  The returned buffer is allocated with xmalloc() and must be released by the
  caller with xfree().  NULL is returned when no usable variable is set, or
  when a value grew between the size query and the fetch so that it no longer
  fits the buffer.

  TODO: Special Folders - Profile and Personal
*/
static wchar_t *
home_dir(void)
{
    wchar_t *buffer = NULL;
    size_t buffer_len = 0, len = 0;
    size_t home_env = 0;

    /*
      GetEnvironmentVariableW when used with NULL will return the required
      buffer size and its terminating character.
      http://msdn.microsoft.com/en-us/library/windows/desktop/ms683188(v=vs.85).aspx
    */
    if ((len = GetEnvironmentVariableW(L"HOME", NULL, 0)) != 0) {
        buffer_len = len;
        home_env = 1;
    }
    else if ((len = GetEnvironmentVariableW(L"HOMEDRIVE", NULL, 0)) != 0) {
        buffer_len = len;
        if ((len = GetEnvironmentVariableW(L"HOMEPATH", NULL, 0)) != 0) {
            buffer_len += len;
            home_env = 2;
        }
        else {
            buffer_len = 0;
        }
    }
    else if ((len = GetEnvironmentVariableW(L"USERPROFILE", NULL, 0)) != 0) {
        buffer_len = len;
        home_env = 3;
    }

    if (!home_env)
        return NULL;

    /* allocate buffer */
    buffer = (wchar_t *)xmalloc(buffer_len * sizeof(wchar_t));

    /* keep the buffer a valid (empty) string even if the variable has been
       removed since its size was queried and nothing gets copied */
    buffer[0] = L'\0';

    /* after the switch, `len` is the total number of characters the fetch
       reported for the whole buffer */
    switch (home_env) {
      case 1:
        /* HOME */
        len = GetEnvironmentVariableW(L"HOME", buffer, buffer_len);
        break;
      case 2:
        /* HOMEDRIVE + HOMEPATH */
        len = GetEnvironmentVariableW(L"HOMEDRIVE", buffer, buffer_len);
        if (len < buffer_len) {
            size_t drive_len = len;
            size_t path_len = GetEnvironmentVariableW(L"HOMEPATH", buffer + drive_len,
                                                      buffer_len - drive_len);
            len = drive_len + path_len;
        }
        break;
      case 3:
        /* USERPROFILE */
        len = GetEnvironmentVariableW(L"USERPROFILE", buffer, buffer_len);
        break;
      default:
        break;
    }

    /* a reported length that does not leave room for the terminator means the
       value did not fit; the buffer contents cannot be trusted in that case */
    if (len >= buffer_len) {
        xfree(buffer);
        return NULL;
    }

    /* sanitize backslashes with forwardslashes */
    replace_wchar(buffer, L'\\', L'/');

    return buffer;
}
|
|
|
|
|
|
|
|
/*
 * Strip a trailing, case-insensitively matched ':$DATA' from `wfullpath`.
 *
 * `size` is the length of the path in characters.  When the suffix is
 * preceded by another ':' (i.e. the path ends in '::$DATA') that colon is
 * removed too.  Otherwise the suffix is only removed when the last path
 * component contains a further ':' (paths like '/aa:a:$DATA').
 * The string is truncated in place and the new length is returned; `size`
 * is returned unchanged when nothing is removed.
 */
static inline size_t
remove_invalid_alternative_data(wchar_t *wfullpath, size_t size)
{
    static const wchar_t suffix[] = L":$DATA";
    enum { suffix_len = (sizeof(suffix) / sizeof(wchar_t)) - 1 };
    wchar_t *scan;

    /* too short to carry the suffix plus anything in front of it */
    if (size <= suffix_len)
        return size;
    if (_wcsnicmp(wfullpath + size - suffix_len, suffix, suffix_len) != 0)
        return size;

    /* alias of stream */
    /* get rid of a bug of x64 VC++ */
    if (wfullpath[size - (suffix_len + 1)] == ':') {
        /* remove trailing '::$DATA' */
        size -= suffix_len + 1;
        wfullpath[size] = L'\0';
        return size;
    }

    /* walk the last component backwards looking for a stream separator */
    for (scan = wfullpath + size - (suffix_len + 1);
         !IS_DIR_SEPARATOR_P(*scan) && scan != wfullpath;
         scan--) {
        if (*scan == L':') {
            /* remove trailing ':$DATA' of paths like '/aa:a:$DATA' */
            size -= suffix_len;
            wfullpath[size] = L'\0';
            break;
        }
    }
    return size;
}
|
|
|
|
|
2013-10-07 03:20:59 -04:00
|
|
|
void rb_enc_foreach_name(int (*func)(st_data_t name, st_data_t idx, st_data_t arg), st_data_t arg);
|
|
|
|
|
|
|
|
static int
|
|
|
|
code_page_i(st_data_t name, st_data_t idx, st_data_t arg)
|
|
|
|
{
|
|
|
|
const char *n = (const char *)name;
|
|
|
|
if (strncmp("CP", n, 2) == 0) {
|
|
|
|
int code_page = atoi(n + 2);
|
|
|
|
if (code_page != 0) {
|
2013-10-19 06:59:06 -04:00
|
|
|
struct code_page_table *cp = (struct code_page_table *)arg;
|
|
|
|
unsigned int count = cp->count;
|
|
|
|
USHORT *table = cp->table;
|
|
|
|
if (count <= idx) {
|
|
|
|
unsigned int i = count;
|
|
|
|
cp->count = count = ((idx + 4) & ~31 | 28);
|
|
|
|
cp->table = table = realloc(table, count * sizeof(*table));
|
|
|
|
while (i < count) table[i++] = INVALID_CODE_PAGE;
|
|
|
|
}
|
|
|
|
table[idx] = (USHORT)code_page;
|
2013-10-07 03:20:59 -04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
return ST_CONTINUE;
|
|
|
|
}
|
|
|
|
|
2012-08-23 23:44:56 -04:00
|
|
|
/*
|
|
|
|
Return code page number of the encoding.
|
|
|
|
Cache code page into a hash for performance since finding the code page in
|
|
|
|
Encoding#names is slow.
|
|
|
|
*/
|
|
|
|
static UINT
|
|
|
|
code_page(rb_encoding *enc)
|
|
|
|
{
|
2013-10-07 02:50:18 -04:00
|
|
|
int enc_idx;
|
2012-08-23 23:44:56 -04:00
|
|
|
|
|
|
|
if (!enc)
|
|
|
|
return system_code_page();
|
|
|
|
|
2013-10-07 02:50:18 -04:00
|
|
|
enc_idx = rb_enc_to_index(enc);
|
|
|
|
|
2013-10-07 02:09:01 -04:00
|
|
|
/* map US-ASCII and ASCII-8bit as code page 1252 (us-ascii) */
|
2013-10-07 02:50:18 -04:00
|
|
|
if (enc_idx == rb_usascii_encindex() || enc_idx == rb_ascii8bit_encindex()) {
|
2013-10-07 02:09:01 -04:00
|
|
|
return 1252;
|
|
|
|
}
|
2014-08-09 07:50:13 -04:00
|
|
|
if (enc_idx == rb_utf8_encindex()) {
|
|
|
|
return CP_UTF8;
|
|
|
|
}
|
2013-10-07 02:09:01 -04:00
|
|
|
|
2013-10-19 06:59:06 -04:00
|
|
|
if (0 <= enc_idx && (unsigned int)enc_idx < rb_code_page.count)
|
|
|
|
return rb_code_page.table[enc_idx];
|
2012-08-23 23:44:56 -04:00
|
|
|
|
2013-10-07 03:20:59 -04:00
|
|
|
return INVALID_CODE_PAGE;
|
2012-08-23 23:44:56 -04:00
|
|
|
}
|
|
|
|
|
2013-07-26 04:49:31 -04:00
|
|
|
#define fix_string_encoding(str, encoding) rb_str_conv_enc((str), (encoding), rb_utf8_encoding())
|
2012-08-23 23:44:56 -04:00
|
|
|
|
|
|
|
/*
|
|
|
|
Replace the last part of the path to long name.
|
|
|
|
We try to avoid to call FindFirstFileW() since it takes long time.
|
|
|
|
*/
|
|
|
|
static inline size_t
|
2012-09-05 01:29:41 -04:00
|
|
|
replace_to_long_name(wchar_t **wfullpath, size_t size, int heap)
|
|
|
|
{
|
2012-08-23 23:44:56 -04:00
|
|
|
WIN32_FIND_DATAW find_data;
|
|
|
|
HANDLE find_handle;
|
|
|
|
|
|
|
|
/*
|
|
|
|
Skip long name conversion if the path is already long name.
|
|
|
|
Short name is 8.3 format.
|
|
|
|
http://en.wikipedia.org/wiki/8.3_filename
|
|
|
|
This check can be skipped for directory components that have file
|
|
|
|
extensions longer than 3 characters, or total lengths longer than
|
|
|
|
12 characters.
|
|
|
|
http://msdn.microsoft.com/en-us/library/windows/desktop/aa364980(v=vs.85).aspx
|
|
|
|
*/
|
|
|
|
size_t const max_short_name_size = 8 + 1 + 3;
|
|
|
|
size_t const max_extension_size = 3;
|
|
|
|
size_t path_len = 1, extension_len = 0;
|
|
|
|
wchar_t *pos = *wfullpath;
|
|
|
|
|
|
|
|
if (size == 3 && pos[1] == L':' && pos[2] == L'\\' && pos[3] == L'\0') {
|
|
|
|
/* root path doesn't need short name expansion */
|
|
|
|
return size;
|
|
|
|
}
|
|
|
|
|
2012-11-17 07:46:17 -05:00
|
|
|
/* skip long name conversion if path contains wildcard characters */
|
2012-11-17 12:53:21 -05:00
|
|
|
if (wcspbrk(pos, L"*?")) {
|
2012-11-16 17:43:22 -05:00
|
|
|
return size;
|
|
|
|
}
|
|
|
|
|
2012-08-23 23:44:56 -04:00
|
|
|
pos = *wfullpath + size - 1;
|
|
|
|
while (!IS_DIR_SEPARATOR_P(*pos) && pos != *wfullpath) {
|
|
|
|
if (!extension_len && *pos == L'.') {
|
|
|
|
extension_len = path_len - 1;
|
|
|
|
}
|
|
|
|
if (path_len > max_short_name_size || extension_len > max_extension_size) {
|
|
|
|
return size;
|
|
|
|
}
|
|
|
|
path_len++;
|
|
|
|
pos--;
|
|
|
|
}
|
|
|
|
|
|
|
|
find_handle = FindFirstFileW(*wfullpath, &find_data);
|
|
|
|
if (find_handle != INVALID_HANDLE_VALUE) {
|
|
|
|
size_t trail_pos = wcslen(*wfullpath);
|
|
|
|
size_t file_len = wcslen(find_data.cFileName);
|
|
|
|
|
|
|
|
FindClose(find_handle);
|
|
|
|
while (trail_pos > 0) {
|
|
|
|
if (IS_DIR_SEPARATOR_P((*wfullpath)[trail_pos]))
|
|
|
|
break;
|
|
|
|
trail_pos--;
|
|
|
|
}
|
|
|
|
size = trail_pos + 1 + file_len;
|
|
|
|
if ((size + 1) > sizeof(*wfullpath) / sizeof((*wfullpath)[0])) {
|
|
|
|
wchar_t *buf = (wchar_t *)xmalloc((size + 1) * sizeof(wchar_t));
|
|
|
|
wcsncpy(buf, *wfullpath, trail_pos + 1);
|
|
|
|
if (heap)
|
|
|
|
xfree(*wfullpath);
|
|
|
|
*wfullpath = buf;
|
|
|
|
}
|
|
|
|
wcsncpy(*wfullpath + trail_pos + 1, find_data.cFileName, file_len + 1);
|
|
|
|
}
|
|
|
|
return size;
|
|
|
|
}
|
|
|
|
|
2014-08-09 07:50:13 -04:00
|
|
|
/*
 * Return how many characters at the start of `wuser` come before the first
 * directory separator, looking at no more than `len` characters.
 */
static inline size_t
user_length_in_path(const wchar_t *wuser, size_t len)
{
    size_t n = 0;

    while (n < len && !IS_DIR_SEPARATOR_P(wuser[n])) {
        n++;
    }
    return n;
}
|
2013-03-13 23:56:09 -04:00
|
|
|
|
2014-08-09 07:50:13 -04:00
|
|
|
static VALUE
|
|
|
|
append_wstr(VALUE dst, const wchar_t *ws, size_t len, UINT cp, UINT path_cp, rb_encoding *path_encoding)
|
|
|
|
{
|
|
|
|
long olen, nlen = (long)len;
|
|
|
|
|
|
|
|
if (cp == path_cp) {
|
|
|
|
nlen = WideCharToMultiByte(cp, 0, ws, len, NULL, 0, NULL, NULL);
|
|
|
|
olen = RSTRING_LEN(dst);
|
|
|
|
rb_str_modify_expand(dst, nlen);
|
|
|
|
WideCharToMultiByte(cp, 0, ws, len, RSTRING_PTR(dst) + olen, nlen, NULL, NULL);
|
|
|
|
rb_enc_associate(dst, path_encoding);
|
2014-09-29 09:54:50 -04:00
|
|
|
rb_str_set_len(dst, olen + nlen);
|
2013-03-13 23:56:09 -04:00
|
|
|
}
|
|
|
|
else {
|
2014-08-09 07:50:13 -04:00
|
|
|
const int replaceflags = ECONV_UNDEF_REPLACE|ECONV_INVALID_REPLACE;
|
|
|
|
char *utf8str = wstr_to_mbstr(CP_UTF8, ws, (int)len, &nlen);
|
|
|
|
rb_econv_t *ec = rb_econv_open("UTF-8", rb_enc_name(path_encoding), replaceflags);
|
|
|
|
dst = rb_econv_append(ec, utf8str, nlen, dst, replaceflags);
|
|
|
|
rb_econv_close(ec);
|
|
|
|
free(utf8str);
|
|
|
|
}
|
|
|
|
return dst;
|
2013-03-13 23:56:09 -04:00
|
|
|
}
|
|
|
|
|
2012-08-23 23:44:56 -04:00
|
|
|
VALUE
|
|
|
|
rb_file_expand_path_internal(VALUE fname, VALUE dname, int abs_mode, int long_name, VALUE result)
|
|
|
|
{
|
2014-08-09 06:10:11 -04:00
|
|
|
size_t size = 0, whome_len = 0;
|
2012-08-23 23:44:56 -04:00
|
|
|
size_t buffer_len = 0;
|
2014-08-09 06:10:11 -04:00
|
|
|
long wpath_len = 0, wdir_len = 0;
|
2012-08-23 23:44:56 -04:00
|
|
|
char *fullpath = NULL;
|
2013-03-10 10:39:09 -04:00
|
|
|
wchar_t *wfullpath = NULL, *wpath = NULL, *wpath_pos = NULL;
|
|
|
|
wchar_t *wdir = NULL, *wdir_pos = NULL;
|
2012-08-23 23:44:56 -04:00
|
|
|
wchar_t *whome = NULL, *buffer = NULL, *buffer_pos = NULL;
|
|
|
|
UINT path_cp, cp;
|
|
|
|
VALUE path = fname, dir = dname;
|
|
|
|
wchar_t wfullpath_buffer[PATH_BUFFER_SIZE];
|
|
|
|
wchar_t path_drive = L'\0', dir_drive = L'\0';
|
|
|
|
int ignore_dir = 0;
|
|
|
|
rb_encoding *path_encoding;
|
|
|
|
int tainted = 0;
|
|
|
|
|
|
|
|
/* tainted if path is tainted */
|
|
|
|
tainted = OBJ_TAINTED(path);
|
|
|
|
|
|
|
|
/* get path encoding */
|
|
|
|
if (NIL_P(dir)) {
|
|
|
|
path_encoding = rb_enc_get(path);
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
path_encoding = rb_enc_check(path, dir);
|
|
|
|
}
|
|
|
|
|
|
|
|
cp = path_cp = code_page(path_encoding);
|
|
|
|
|
|
|
|
/* workaround invalid codepage */
|
|
|
|
if (path_cp == INVALID_CODE_PAGE) {
|
|
|
|
cp = CP_UTF8;
|
|
|
|
if (!NIL_P(path)) {
|
|
|
|
path = fix_string_encoding(path, path_encoding);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* convert char * to wchar_t */
|
2013-07-26 00:00:28 -04:00
|
|
|
if (!NIL_P(path)) {
|
2014-08-09 06:10:11 -04:00
|
|
|
wpath = mbstr_to_wstr(cp, RSTRING_PTR(path), (int)RSTRING_LEN(path), &wpath_len);
|
2013-07-26 00:00:28 -04:00
|
|
|
wpath_pos = wpath;
|
|
|
|
}
|
2012-08-23 23:44:56 -04:00
|
|
|
|
|
|
|
/* determine if we need the user's home directory */
|
|
|
|
/* expand '~' only if NOT rb_file_absolute_path() where `abs_mode` is 1 */
|
2012-09-05 01:29:44 -04:00
|
|
|
if (abs_mode == 0 && wpath_len > 0 && wpath_pos[0] == L'~' &&
|
|
|
|
(wpath_len == 1 || IS_DIR_SEPARATOR_P(wpath_pos[1]))) {
|
2012-08-23 23:44:56 -04:00
|
|
|
/* tainted if expanding '~' */
|
|
|
|
tainted = 1;
|
|
|
|
|
|
|
|
whome = home_dir();
|
|
|
|
if (whome == NULL) {
|
|
|
|
xfree(wpath);
|
|
|
|
rb_raise(rb_eArgError, "couldn't find HOME environment -- expanding `~'");
|
|
|
|
}
|
|
|
|
whome_len = wcslen(whome);
|
|
|
|
|
|
|
|
if (PathIsRelativeW(whome) && !(whome_len >= 2 && IS_DIR_UNC_P(whome))) {
|
|
|
|
xfree(wpath);
|
2013-10-17 01:21:38 -04:00
|
|
|
xfree(whome);
|
2012-08-23 23:44:56 -04:00
|
|
|
rb_raise(rb_eArgError, "non-absolute home");
|
|
|
|
}
|
|
|
|
|
2013-10-19 06:59:06 -04:00
|
|
|
if (path_cp == INVALID_CODE_PAGE || rb_enc_str_asciionly_p(path)) {
|
|
|
|
/* use filesystem encoding if expanding home dir */
|
|
|
|
path_encoding = rb_filesystem_encoding();
|
|
|
|
cp = path_cp = system_code_page();
|
|
|
|
}
|
2012-08-23 23:44:56 -04:00
|
|
|
|
2013-05-18 23:10:21 -04:00
|
|
|
/* ignores dir since we are expanding home */
|
2012-08-23 23:44:56 -04:00
|
|
|
ignore_dir = 1;
|
|
|
|
|
|
|
|
/* exclude ~ from the result */
|
|
|
|
wpath_pos++;
|
|
|
|
wpath_len--;
|
|
|
|
|
|
|
|
/* exclude separator if present */
|
|
|
|
if (wpath_len && IS_DIR_SEPARATOR_P(wpath_pos[0])) {
|
|
|
|
wpath_pos++;
|
|
|
|
wpath_len--;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else if (wpath_len >= 2 && wpath_pos[1] == L':') {
|
|
|
|
if (wpath_len >= 3 && IS_DIR_SEPARATOR_P(wpath_pos[2])) {
|
|
|
|
/* ignore dir since path contains a drive letter and a root slash */
|
|
|
|
ignore_dir = 1;
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
/* determine if we ignore dir or not later */
|
|
|
|
path_drive = wpath_pos[0];
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else if (abs_mode == 0 && wpath_len >= 2 && wpath_pos[0] == L'~') {
|
2014-08-09 07:50:13 -04:00
|
|
|
result = rb_str_new_cstr("can't find user ");
|
2014-09-29 09:54:50 -04:00
|
|
|
result = append_wstr(result, wpath_pos + 1, user_length_in_path(wpath_pos + 1, wpath_len - 1),
|
2014-08-09 07:50:13 -04:00
|
|
|
cp, path_cp, path_encoding);
|
2012-08-23 23:44:56 -04:00
|
|
|
|
2013-03-13 23:56:09 -04:00
|
|
|
if (wpath)
|
|
|
|
xfree(wpath);
|
2012-08-23 23:44:56 -04:00
|
|
|
|
2014-08-09 07:50:13 -04:00
|
|
|
rb_exc_raise(rb_exc_new_str(rb_eArgError, result));
|
2012-08-23 23:44:56 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
/* convert dir */
|
|
|
|
if (!ignore_dir && !NIL_P(dir)) {
|
|
|
|
/* fix string encoding */
|
|
|
|
if (path_cp == INVALID_CODE_PAGE) {
|
|
|
|
dir = fix_string_encoding(dir, path_encoding);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* convert char * to wchar_t */
|
2013-07-26 00:00:28 -04:00
|
|
|
if (!NIL_P(dir)) {
|
2014-08-09 06:10:11 -04:00
|
|
|
wdir = mbstr_to_wstr(cp, RSTRING_PTR(dir), (int)RSTRING_LEN(dir), &wdir_len);
|
2013-07-26 00:00:28 -04:00
|
|
|
wdir_pos = wdir;
|
|
|
|
}
|
2012-08-23 23:44:56 -04:00
|
|
|
|
2013-03-10 10:39:09 -04:00
|
|
|
if (abs_mode == 0 && wdir_len > 0 && wdir_pos[0] == L'~' &&
|
|
|
|
(wdir_len == 1 || IS_DIR_SEPARATOR_P(wdir_pos[1]))) {
|
|
|
|
/* tainted if expanding '~' */
|
|
|
|
tainted = 1;
|
|
|
|
|
|
|
|
whome = home_dir();
|
|
|
|
if (whome == NULL) {
|
2014-08-09 06:10:11 -04:00
|
|
|
free(wpath);
|
|
|
|
free(wdir);
|
2013-03-10 10:39:09 -04:00
|
|
|
rb_raise(rb_eArgError, "couldn't find HOME environment -- expanding `~'");
|
|
|
|
}
|
|
|
|
whome_len = wcslen(whome);
|
|
|
|
|
|
|
|
if (PathIsRelativeW(whome) && !(whome_len >= 2 && IS_DIR_UNC_P(whome))) {
|
2014-08-09 06:10:11 -04:00
|
|
|
free(wpath);
|
|
|
|
free(wdir);
|
2013-10-17 01:21:38 -04:00
|
|
|
xfree(whome);
|
2013-03-10 10:39:09 -04:00
|
|
|
rb_raise(rb_eArgError, "non-absolute home");
|
|
|
|
}
|
|
|
|
|
|
|
|
/* exclude ~ from the result */
|
|
|
|
wdir_pos++;
|
|
|
|
wdir_len--;
|
|
|
|
|
|
|
|
/* exclude separator if present */
|
|
|
|
if (wdir_len && IS_DIR_SEPARATOR_P(wdir_pos[0])) {
|
|
|
|
wdir_pos++;
|
|
|
|
wdir_len--;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else if (wdir_len >= 2 && wdir[1] == L':') {
|
2012-08-23 23:44:56 -04:00
|
|
|
dir_drive = wdir[0];
|
|
|
|
if (wpath_len && IS_DIR_SEPARATOR_P(wpath_pos[0])) {
|
|
|
|
wdir_len = 2;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else if (wdir_len >= 2 && IS_DIR_UNC_P(wdir)) {
|
|
|
|
/* UNC path */
|
|
|
|
if (wpath_len && IS_DIR_SEPARATOR_P(wpath_pos[0])) {
|
|
|
|
/* cut the UNC path tail to '//host/share' */
|
2014-08-09 06:10:11 -04:00
|
|
|
long separators = 0;
|
|
|
|
long pos = 2;
|
2012-08-23 23:44:56 -04:00
|
|
|
while (pos < wdir_len && separators < 2) {
|
|
|
|
if (IS_DIR_SEPARATOR_P(wdir[pos])) {
|
|
|
|
separators++;
|
|
|
|
}
|
|
|
|
pos++;
|
|
|
|
}
|
|
|
|
if (separators == 2)
|
|
|
|
wdir_len = pos - 1;
|
|
|
|
}
|
|
|
|
}
|
2013-03-13 23:56:09 -04:00
|
|
|
else if (abs_mode == 0 && wdir_len >= 2 && wdir_pos[0] == L'~') {
|
2014-08-09 07:50:13 -04:00
|
|
|
result = rb_str_new_cstr("can't find user ");
|
2014-09-29 09:54:50 -04:00
|
|
|
result = append_wstr(result, wdir_pos + 1, user_length_in_path(wdir_pos + 1, wdir_len - 1),
|
2014-08-09 07:50:13 -04:00
|
|
|
cp, path_cp, path_encoding);
|
2013-03-13 23:56:09 -04:00
|
|
|
if (wpath)
|
2014-08-09 06:10:11 -04:00
|
|
|
free(wpath);
|
2013-03-13 23:56:09 -04:00
|
|
|
|
|
|
|
if (wdir)
|
2014-08-09 06:10:11 -04:00
|
|
|
free(wdir);
|
2013-03-13 23:56:09 -04:00
|
|
|
|
2014-08-09 07:50:13 -04:00
|
|
|
rb_exc_raise(rb_exc_new_str(rb_eArgError, result));
|
2013-03-13 23:56:09 -04:00
|
|
|
}
|
2012-08-23 23:44:56 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
/* determine if we ignore dir or not */
|
|
|
|
if (!ignore_dir && path_drive && dir_drive) {
|
|
|
|
if (towupper(path_drive) == towupper(dir_drive)) {
|
|
|
|
/* exclude path drive letter to use dir */
|
|
|
|
wpath_pos += 2;
|
|
|
|
wpath_len -= 2;
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
/* ignore dir since path drive is different from dir drive */
|
|
|
|
ignore_dir = 1;
|
|
|
|
wdir_len = 0;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!ignore_dir && wpath_len >= 2 && IS_DIR_UNC_P(wpath)) {
|
|
|
|
/* ignore dir since path has UNC root */
|
|
|
|
ignore_dir = 1;
|
|
|
|
wdir_len = 0;
|
|
|
|
}
|
|
|
|
else if (!ignore_dir && wpath_len >= 1 && IS_DIR_SEPARATOR_P(wpath[0]) &&
|
2012-09-05 01:29:41 -04:00
|
|
|
!dir_drive && !(wdir_len >= 2 && IS_DIR_UNC_P(wdir))) {
|
2012-08-23 23:44:56 -04:00
|
|
|
/* ignore dir since path has root slash and dir doesn't have drive or UNC root */
|
|
|
|
ignore_dir = 1;
|
|
|
|
wdir_len = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
buffer_len = wpath_len + 1 + wdir_len + 1 + whome_len + 1;
|
|
|
|
|
|
|
|
buffer = buffer_pos = (wchar_t *)xmalloc((buffer_len + 1) * sizeof(wchar_t));
|
|
|
|
|
|
|
|
/* add home */
|
|
|
|
if (whome_len) {
|
|
|
|
wcsncpy(buffer_pos, whome, whome_len);
|
|
|
|
buffer_pos += whome_len;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Add separator if required */
|
|
|
|
if (whome_len && wcsrchr(L"\\/:", buffer_pos[-1]) == NULL) {
|
|
|
|
buffer_pos[0] = L'\\';
|
|
|
|
buffer_pos++;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (wdir_len) {
|
|
|
|
/* tainted if dir is used and dir is tainted */
|
|
|
|
if (!tainted && OBJ_TAINTED(dir))
|
|
|
|
tainted = 1;
|
|
|
|
|
2013-03-10 10:39:09 -04:00
|
|
|
wcsncpy(buffer_pos, wdir_pos, wdir_len);
|
2012-08-23 23:44:56 -04:00
|
|
|
buffer_pos += wdir_len;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* add separator if required */
|
|
|
|
if (wdir_len && wcsrchr(L"\\/:", buffer_pos[-1]) == NULL) {
|
|
|
|
buffer_pos[0] = L'\\';
|
|
|
|
buffer_pos++;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* now deal with path */
|
|
|
|
if (wpath_len) {
|
|
|
|
wcsncpy(buffer_pos, wpath_pos, wpath_len);
|
|
|
|
buffer_pos += wpath_len;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* GetFullPathNameW requires at least "." to determine current directory */
|
|
|
|
if (wpath_len == 0) {
|
|
|
|
buffer_pos[0] = L'.';
|
|
|
|
buffer_pos++;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Ensure buffer is NULL terminated */
|
|
|
|
buffer_pos[0] = L'\0';
|
|
|
|
|
|
|
|
/* tainted if path is relative */
|
|
|
|
if (!tainted && PathIsRelativeW(buffer) && !(buffer_len >= 2 && IS_DIR_UNC_P(buffer)))
|
|
|
|
tainted = 1;
|
|
|
|
|
|
|
|
/* FIXME: Make this more robust */
|
|
|
|
/* Determine require buffer size */
|
|
|
|
size = GetFullPathNameW(buffer, PATH_BUFFER_SIZE, wfullpath_buffer, NULL);
|
|
|
|
if (size > PATH_BUFFER_SIZE) {
|
|
|
|
/* allocate more memory than alloted originally by PATH_BUFFER_SIZE */
|
|
|
|
wfullpath = (wchar_t *)xmalloc(size * sizeof(wchar_t));
|
|
|
|
size = GetFullPathNameW(buffer, size, wfullpath, NULL);
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
wfullpath = wfullpath_buffer;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Remove any trailing slashes */
|
|
|
|
if (IS_DIR_SEPARATOR_P(wfullpath[size - 1]) &&
|
|
|
|
wfullpath[size - 2] != L':' &&
|
|
|
|
!(size == 2 && IS_DIR_UNC_P(wfullpath))) {
|
|
|
|
size -= 1;
|
|
|
|
wfullpath[size] = L'\0';
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Remove any trailing dot */
|
|
|
|
if (wfullpath[size - 1] == L'.') {
|
|
|
|
size -= 1;
|
|
|
|
wfullpath[size] = L'\0';
|
|
|
|
}
|
|
|
|
|
|
|
|
/* removes trailing invalid ':$DATA' */
|
|
|
|
size = remove_invalid_alternative_data(wfullpath, size);
|
|
|
|
|
|
|
|
/* Replace the trailing path to long name */
|
|
|
|
if (long_name)
|
|
|
|
size = replace_to_long_name(&wfullpath, size, (wfullpath != wfullpath_buffer));
|
|
|
|
|
|
|
|
/* sanitize backslashes with forwardslashes */
|
|
|
|
replace_wchar(wfullpath, L'\\', L'/');
|
|
|
|
|
|
|
|
/* convert to VALUE and set the path encoding */
|
2014-08-09 07:50:13 -04:00
|
|
|
rb_str_set_len(result, 0);
|
|
|
|
result = append_wstr(result, wfullpath, size, cp, path_cp, path_encoding);
|
2012-08-23 23:44:56 -04:00
|
|
|
|
|
|
|
/* makes the result object tainted if expanding tainted strings or returning modified path */
|
|
|
|
if (tainted)
|
|
|
|
OBJ_TAINT(result);
|
|
|
|
|
|
|
|
/* TODO: better cleanup */
|
|
|
|
if (buffer)
|
|
|
|
xfree(buffer);
|
|
|
|
|
|
|
|
if (wpath)
|
2014-08-09 06:10:11 -04:00
|
|
|
free(wpath);
|
2012-08-23 23:44:56 -04:00
|
|
|
|
|
|
|
if (wdir)
|
2014-08-09 06:10:11 -04:00
|
|
|
free(wdir);
|
2012-08-23 23:44:56 -04:00
|
|
|
|
|
|
|
if (whome)
|
|
|
|
xfree(whome);
|
|
|
|
|
|
|
|
if (wfullpath && wfullpath != wfullpath_buffer)
|
|
|
|
xfree(wfullpath);
|
|
|
|
|
|
|
|
if (fullpath)
|
|
|
|
xfree(fullpath);
|
|
|
|
|
2014-08-09 07:50:13 -04:00
|
|
|
rb_enc_associate(result, path_encoding);
|
2012-08-23 23:44:56 -04:00
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
2012-02-28 10:51:25 -05:00
|
|
|
int
|
|
|
|
rb_file_load_ok(const char *path)
|
|
|
|
{
|
2013-07-26 00:04:23 -04:00
|
|
|
DWORD attr;
|
2012-02-28 23:07:08 -05:00
|
|
|
int ret = 1;
|
2014-08-09 06:10:11 -04:00
|
|
|
long len;
|
2013-07-26 00:04:23 -04:00
|
|
|
wchar_t* wpath;
|
|
|
|
|
2014-08-09 06:10:11 -04:00
|
|
|
wpath = mbstr_to_wstr(CP_UTF8, path, -1, &len);
|
|
|
|
if (!wpath) return 0;
|
2013-07-26 00:04:23 -04:00
|
|
|
|
|
|
|
attr = GetFileAttributesW(wpath);
|
2012-02-28 23:07:08 -05:00
|
|
|
if (attr == INVALID_FILE_ATTRIBUTES ||
|
2013-07-26 00:04:23 -04:00
|
|
|
(attr & FILE_ATTRIBUTE_DIRECTORY)) {
|
2012-02-28 10:51:25 -05:00
|
|
|
ret = 0;
|
2012-02-28 23:07:08 -05:00
|
|
|
}
|
|
|
|
else {
|
2013-07-26 00:04:23 -04:00
|
|
|
HANDLE h = CreateFileW(wpath, GENERIC_READ,
|
|
|
|
FILE_SHARE_READ | FILE_SHARE_WRITE,
|
|
|
|
NULL, OPEN_EXISTING, FILE_ATTRIBUTE_NORMAL, NULL);
|
2012-02-28 10:51:25 -05:00
|
|
|
if (h != INVALID_HANDLE_VALUE) {
|
2012-02-28 23:07:08 -05:00
|
|
|
CloseHandle(h);
|
2012-02-28 10:51:25 -05:00
|
|
|
}
|
|
|
|
else {
|
2012-02-28 23:07:08 -05:00
|
|
|
ret = 0;
|
2012-02-28 10:51:25 -05:00
|
|
|
}
|
2012-02-28 23:07:08 -05:00
|
|
|
}
|
2014-08-09 06:10:11 -04:00
|
|
|
free(wpath);
|
2012-02-28 23:07:08 -05:00
|
|
|
return ret;
|
2012-02-28 10:51:25 -05:00
|
|
|
}
|
2012-08-23 23:44:56 -04:00
|
|
|
|
|
|
|
void
|
2013-10-19 06:55:39 -04:00
|
|
|
Init_w32_codepage(void)
|
2012-08-23 23:44:56 -04:00
|
|
|
{
|
2013-10-19 06:59:06 -04:00
|
|
|
if (rb_code_page.count) return;
|
|
|
|
rb_enc_foreach_name(code_page_i, (st_data_t)&rb_code_page);
|
2012-08-23 23:44:56 -04:00
|
|
|
}
|