Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in / Register
Toggle navigation
P
protobuf
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Packages
Packages
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
submodule
protobuf
Commits
1b5b3b28
Unverified
Commit
1b5b3b28
authored
Dec 07, 2017
by
Jisi Liu
Committed by
GitHub
Dec 07, 2017
Browse files
Options
Browse Files
Download
Plain Diff
Merge pull request #4013 from laszlocsomor/io_win32
io_win32: support non-ASCII paths
parents
b140cb31
a3a1c93f
Expand all
Show whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
127 additions
and
59 deletions
+127
-59
io_win32.cc
src/google/protobuf/stubs/io_win32.cc
+108
-57
io_win32.h
src/google/protobuf/stubs/io_win32.h
+19
-2
io_win32_unittest.cc
src/google/protobuf/stubs/io_win32_unittest.cc
+0
-0
No files found.
src/google/protobuf/stubs/io_win32.cc
View file @
1b5b3b28
...
...
@@ -30,10 +30,11 @@
// Author: laszlocsomor@google.com (Laszlo Csomor)
//
// Implementation for long-path-aware open/mkdir/etc. on Windows.
// Implementation for long-path-aware open/mkdir/access/etc. on Windows, as well
// as for the supporting utility functions.
//
// These functions convert the input path to an absolute Windows path
// with "\\?\" prefix
if necessary, then pass that to _wopen/_wmkdir
/etc.
// with "\\?\" prefix
, then pass that to _wopen/_wmkdir/_waccess
/etc.
// (declared in <io.h>) respectively. This allows working with files/directories
// whose paths are longer than MAX_PATH (260 chars).
//
...
...
@@ -59,7 +60,6 @@
#include <google/protobuf/stubs/io_win32.h>
#include <google/protobuf/stubs/scoped_ptr.h>
#include <cassert>
#include <memory>
#include <sstream>
#include <string>
...
...
@@ -89,6 +89,11 @@ struct CharTraits<wchar_t> {
static
bool
is_alpha
(
wchar_t
ch
)
{
return
iswalpha
(
ch
);
}
};
template
<
typename
char_type
>
bool
null_or_empty
(
const
char_type
*
s
)
{
return
s
==
nullptr
||
*
s
==
0
;
}
// Returns true if the path starts with a drive letter, e.g. "c:".
// Note that this won't check for the "\" after the drive letter, so this also
// returns true for "c:foo" (which is "c:\${PWD}\foo").
...
...
@@ -121,16 +126,7 @@ bool is_drive_relative(const char_type* path) {
return
has_drive_letter
(
path
)
&&
(
path
[
2
]
==
0
||
!
is_separator
(
path
[
2
]));
}
template
<
typename
char_type
>
void
replace_directory_separators
(
char_type
*
p
)
{
for
(;
*
p
;
++
p
)
{
if
(
*
p
==
'/'
)
{
*
p
=
'\\'
;
}
}
}
string
join_paths
(
const
string
&
path1
,
const
string
&
path2
)
{
wstring
join_paths
(
const
wstring
&
path1
,
const
wstring
&
path2
)
{
if
(
path1
.
empty
()
||
is_path_absolute
(
path2
.
c_str
())
||
has_longpath_prefix
(
path2
.
c_str
()))
{
return
path2
;
...
...
@@ -144,23 +140,23 @@ string join_paths(const string& path1, const string& path2) {
:
(
path1
+
path2
);
}
else
{
return
is_separator
(
path2
[
0
])
?
(
path1
+
path2
)
:
(
path1
+
'\\'
+
path2
);
:
(
path1
+
L
'\\'
+
path2
);
}
}
string
normalize
(
string
path
)
{
wstring
normalize
(
w
string
path
)
{
if
(
has_longpath_prefix
(
path
.
c_str
()))
{
path
=
path
.
substr
(
4
);
}
static
const
string
dot
(
"."
);
static
const
string
dotdot
(
".."
);
static
const
wstring
dot
(
L
"."
);
static
const
wstring
dotdot
(
L
".."
);
std
::
vector
<
string
>
segments
;
std
::
vector
<
w
string
>
segments
;
int
segment_start
=
-
1
;
// Find the path segments in `path` (separated by "/").
for
(
int
i
=
0
;;
++
i
)
{
if
(
!
is_separator
(
path
[
i
])
&&
path
[
i
]
!=
'\0'
)
{
if
(
!
is_separator
(
path
[
i
])
&&
path
[
i
]
!=
L
'\0'
)
{
// The current character does not end a segment, so start one unless it's
// already started.
if
(
segment_start
<
0
)
{
...
...
@@ -169,7 +165,7 @@ string normalize(string path) {
}
else
if
(
segment_start
>=
0
&&
i
>
segment_start
)
{
// The current character is "/" or "\0", so this ends a segment.
// Add that to `segments` if there's anything to add; handle "." and "..".
string
segment
(
path
,
segment_start
,
i
-
segment_start
);
w
string
segment
(
path
,
segment_start
,
i
-
segment_start
);
segment_start
=
-
1
;
if
(
segment
==
dotdot
)
{
if
(
!
segments
.
empty
()
&&
...
...
@@ -180,7 +176,7 @@ string normalize(string path) {
segments
.
push_back
(
segment
);
}
}
if
(
path
[
i
]
==
'\0'
)
{
if
(
path
[
i
]
==
L
'\0'
)
{
break
;
}
}
...
...
@@ -189,64 +185,62 @@ string normalize(string path) {
// form of it, e.g. "c:\..").
if
(
segments
.
size
()
==
1
&&
segments
[
0
].
size
()
==
2
&&
has_drive_letter
(
segments
[
0
].
c_str
()))
{
return
segments
[
0
]
+
'\\'
;
return
segments
[
0
]
+
L
'\\'
;
}
// Join all segments.
bool
first
=
true
;
std
::
o
stringstream
result
;
std
::
w
stringstream
result
;
for
(
int
i
=
0
;
i
<
segments
.
size
();
++
i
)
{
if
(
!
first
)
{
result
<<
'\\'
;
result
<<
L
'\\'
;
}
first
=
false
;
result
<<
segments
[
i
];
}
// Preserve trailing separator if the input contained it.
if
(
!
path
.
empty
()
&&
is_separator
(
path
[
path
.
size
()
-
1
]))
{
result
<<
'\\'
;
result
<<
L
'\\'
;
}
return
result
.
str
();
}
WCHAR
*
as_wstring
(
const
string
&
s
)
{
int
len
=
::
MultiByteToWideChar
(
CP_UTF8
,
0
,
s
.
c_str
(),
s
.
size
(),
NULL
,
0
);
WCHAR
*
result
=
new
WCHAR
[
len
+
1
];
::
MultiByteToWideChar
(
CP_UTF8
,
0
,
s
.
c_str
(),
s
.
size
(),
result
,
len
+
1
);
result
[
len
]
=
0
;
return
result
;
}
void
as_wchar_path
(
const
string
&
path
,
wstring
*
wchar_path
)
{
scoped_array
<
WCHAR
>
wbuf
(
as_wstring
(
path
));
replace_directory_separators
(
wbuf
.
get
());
wchar_path
->
assign
(
wbuf
.
get
());
}
bool
as_windows_path
(
const
string
&
path
,
wstring
*
result
)
{
if
(
path
.
empty
())
{
bool
as_windows_path
(
const
char
*
path
,
wstring
*
result
)
{
if
(
null_or_empty
(
path
))
{
result
->
clear
();
return
true
;
}
if
(
is_separator
(
path
[
0
])
||
is_drive_relative
(
path
.
c_str
()))
{
wstring
wpath
;
if
(
!
strings
::
utf8_to_wcs
(
path
,
&
wpath
))
{
return
false
;
}
if
(
has_longpath_prefix
(
wpath
.
c_str
()))
{
*
result
=
wpath
;
return
true
;
}
if
(
is_separator
(
path
[
0
])
||
is_drive_relative
(
path
))
{
return
false
;
}
string
mutable_path
=
path
;
if
(
!
is_path_absolute
(
mutable_path
.
c_str
())
&&
!
has_longpath_prefix
(
mutable_path
.
c_str
()))
{
char
cwd
[
MAX_PATH
];
::
GetCurrentDirectoryA
(
MAX_PATH
,
cwd
);
mutable_path
=
join_paths
(
cwd
,
mutable_path
);
if
(
!
is_path_absolute
(
wpath
.
c_str
()))
{
int
size
=
::
GetCurrentDirectoryW
(
0
,
NULL
);
if
(
size
==
0
&&
GetLastError
()
!=
ERROR_INSUFFICIENT_BUFFER
)
{
return
false
;
}
scoped_array
<
WCHAR
>
wcwd
(
new
WCHAR
[
size
]);
::
GetCurrentDirectoryW
(
size
,
wcwd
.
get
());
wpath
=
join_paths
(
wcwd
.
get
(),
wpath
);
}
as_wchar_path
(
normalize
(
mutable_path
),
result
);
if
(
!
has_longpath_prefix
(
result
->
c_str
()))
{
wpath
=
normalize
(
wpath
);
if
(
!
has_longpath_prefix
(
wpath
.
c_str
()))
{
// Add the "\\?\" prefix unconditionally. This way we prevent the Win32 API
// from processing the path and "helpfully" removing trailing dots from the
// path, for example.
// See https://github.com/bazelbuild/bazel/issues/2935
*
result
=
wstring
(
L"
\\\\
?
\\
"
)
+
*
result
;
wpath
=
wstring
(
L"
\\\\
?
\\
"
)
+
wpath
;
}
*
result
=
wpath
;
return
true
;
}
...
...
@@ -319,13 +313,21 @@ int stat(const char* path, struct _stat* buffer) {
FILE
*
fopen
(
const
char
*
path
,
const
char
*
mode
)
{
#ifdef SUPPORT_LONGPATHS
if
(
null_or_empty
(
path
))
{
errno
=
EINVAL
;
return
NULL
;
}
wstring
wpath
;
if
(
!
as_windows_path
(
path
,
&
wpath
))
{
errno
=
ENOENT
;
return
NULL
;
}
scoped_array
<
WCHAR
>
wmode
(
as_wstring
(
mode
));
return
::
_wfopen
(
wpath
.
c_str
(),
wmode
.
get
());
wstring
wmode
;
if
(
!
strings
::
utf8_to_wcs
(
mode
,
&
wmode
))
{
errno
=
EINVAL
;
return
NULL
;
}
return
::
_wfopen
(
wpath
.
c_str
(),
wmode
.
c_str
());
#else
return
::
fopen
(
path
,
mode
);
#endif
...
...
@@ -347,16 +349,65 @@ int write(int fd, const void* buffer, size_t size) {
return
::
_write
(
fd
,
buffer
,
size
);
}
wstring
testonly_
path_to_winpath
(
const
string
&
path
)
{
wstring
testonly_
utf8_to_winpath
(
const
char
*
path
)
{
wstring
wpath
;
as_windows_path
(
path
,
&
wpath
);
return
wpath
;
return
as_windows_path
(
path
,
&
wpath
)
?
wpath
:
wstring
();
}
namespace
strings
{
bool
wcs_to_mbs
(
const
WCHAR
*
s
,
string
*
out
,
bool
outUtf8
)
{
if
(
null_or_empty
(
s
))
{
out
->
clear
();
return
true
;
}
BOOL
usedDefaultChar
=
FALSE
;
SetLastError
(
0
);
int
size
=
WideCharToMultiByte
(
outUtf8
?
CP_UTF8
:
CP_ACP
,
0
,
s
,
-
1
,
NULL
,
0
,
NULL
,
outUtf8
?
NULL
:
&
usedDefaultChar
);
if
((
size
==
0
&&
GetLastError
()
!=
ERROR_INSUFFICIENT_BUFFER
)
||
usedDefaultChar
)
{
return
false
;
}
scoped_array
<
CHAR
>
astr
(
new
CHAR
[
size
]);
WideCharToMultiByte
(
outUtf8
?
CP_UTF8
:
CP_ACP
,
0
,
s
,
-
1
,
astr
.
get
(),
size
,
NULL
,
NULL
);
out
->
assign
(
astr
.
get
());
return
true
;
}
bool
mbs_to_wcs
(
const
char
*
s
,
wstring
*
out
,
bool
inUtf8
)
{
if
(
null_or_empty
(
s
))
{
out
->
clear
();
return
true
;
}
SetLastError
(
0
);
int
size
=
MultiByteToWideChar
(
inUtf8
?
CP_UTF8
:
CP_ACP
,
0
,
s
,
-
1
,
NULL
,
0
);
if
(
size
==
0
&&
GetLastError
()
!=
ERROR_INSUFFICIENT_BUFFER
)
{
return
false
;
}
scoped_array
<
WCHAR
>
wstr
(
new
WCHAR
[
size
]);
MultiByteToWideChar
(
inUtf8
?
CP_UTF8
:
CP_ACP
,
0
,
s
,
-
1
,
wstr
.
get
(),
size
+
1
);
out
->
assign
(
wstr
.
get
());
return
true
;
}
bool
utf8_to_wcs
(
const
char
*
input
,
wstring
*
out
)
{
return
mbs_to_wcs
(
input
,
out
,
true
);
}
bool
wcs_to_utf8
(
const
wchar_t
*
input
,
string
*
out
)
{
return
wcs_to_mbs
(
input
,
out
,
true
);
}
}
// namespace strings
}
// namespace win32
}
// namespace internal
}
// namespace protobuf
}
// namespace google
#endif // defined(_WIN32)
src/google/protobuf/stubs/io_win32.h
View file @
1b5b3b28
...
...
@@ -69,8 +69,25 @@ LIBPROTOBUF_EXPORT int read(int fd, void* buffer, size_t size);
LIBPROTOBUF_EXPORT
int
setmode
(
int
fd
,
int
mode
);
LIBPROTOBUF_EXPORT
int
stat
(
const
char
*
path
,
struct
_stat
*
buffer
);
LIBPROTOBUF_EXPORT
int
write
(
int
fd
,
const
void
*
buffer
,
size_t
size
);
LIBPROTOBUF_EXPORT
std
::
wstring
testonly_path_to_winpath
(
const
std
::
string
&
path
);
LIBPROTOBUF_EXPORT
std
::
wstring
testonly_utf8_to_winpath
(
const
char
*
path
);
namespace
strings
{
// Convert from UTF-16 to Active-Code-Page-encoded or to UTF-8-encoded text.
LIBPROTOBUF_EXPORT
bool
wcs_to_mbs
(
const
wchar_t
*
s
,
std
::
string
*
out
,
bool
outUtf8
);
// Convert from Active-Code-Page-encoded or UTF-8-encoded text to UTF-16.
LIBPROTOBUF_EXPORT
bool
mbs_to_wcs
(
const
char
*
s
,
std
::
wstring
*
out
,
bool
inUtf8
);
// Convert from UTF-8-encoded text to UTF-16.
LIBPROTOBUF_EXPORT
bool
utf8_to_wcs
(
const
char
*
input
,
std
::
wstring
*
out
);
// Convert from UTF-16-encoded text to UTF-8.
LIBPROTOBUF_EXPORT
bool
wcs_to_utf8
(
const
wchar_t
*
input
,
std
::
string
*
out
);
}
// namespace strings
}
// namespace win32
}
// namespace internal
...
...
src/google/protobuf/stubs/io_win32_unittest.cc
View file @
1b5b3b28
This diff is collapsed.
Click to expand it.
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment