Skip to content

Commit

Permalink
python#3705: Command-line arguments were not correctly decoded when the terminal does not use UTF8.
Browse files Browse the repository at this point in the history

Now the code propagates the unicode string as far as possible, and avoids
the conversion to char* which implicitly uses UTF-8.

Reviewed by Benjamin.
  • Loading branch information
amauryfa committed Nov 11, 2008
1 parent d3013ff commit 9a5499b
Show file tree
Hide file tree
Showing 4 changed files with 35 additions and 25 deletions.
6 changes: 6 additions & 0 deletions Lib/test/test_cmd_line.py
Original file line number Diff line number Diff line change
Expand Up @@ -135,6 +135,12 @@ def test_run_code(self):
self.exit_code('-c', 'pass'),
0)

# Test handling of non-ascii data
command = "assert(ord('\xe9') == 0xe9)"
self.assertEqual(
self.exit_code('-c', command),
0)


def test_main():
test.support.run_unittest(CmdLineTest)
Expand Down
3 changes: 3 additions & 0 deletions Misc/NEWS
Original file line number Diff line number Diff line change
Expand Up @@ -13,6 +13,9 @@ What's New in Python 3.0 release candiate 3?
Core and Builtins
-----------------

- Issue #3705: Command-line arguments were not correctly decoded when the
terminal does not use UTF8.

Library
-------

Expand Down
40 changes: 19 additions & 21 deletions Modules/main.c
Original file line number Diff line number Diff line change
Expand Up @@ -287,7 +287,7 @@ Py_Main(int argc, wchar_t **argv)
{
int c;
int sts;
char *command = NULL;
wchar_t *command = NULL;
wchar_t *filename = NULL;
wchar_t *module = NULL;
FILE *fp = stdin;
Expand All @@ -299,7 +299,6 @@ Py_Main(int argc, wchar_t **argv)
int version = 0;
int saw_unbuffered_flag = 0;
PyCompilerFlags cf;
char *oldloc;

cf.cf_flags = 0;

Expand All @@ -310,30 +309,19 @@ Py_Main(int argc, wchar_t **argv)

while ((c = _PyOS_GetOpt(argc, argv, PROGRAM_OPTS)) != EOF) {
if (c == 'c') {
size_t r1, r2;
oldloc = setlocale(LC_ALL, NULL);
setlocale(LC_ALL, "");
r1 = wcslen(_PyOS_optarg);
r2 = wcstombs(NULL, _PyOS_optarg, r1);
if (r2 == (size_t) -1)
Py_FatalError(
"cannot convert character encoding of -c argument");
if (r2 > r1)
r1 = r2;
r1 += 2;
size_t len;
/* -c is the last option; following arguments
that look like options are left for the
command to interpret. */
command = (char *)malloc(r1);

len = wcslen(_PyOS_optarg) + 1 + 1;
command = (wchar_t *)malloc(sizeof(wchar_t) * len);
if (command == NULL)
Py_FatalError(
"not enough memory to copy -c argument");
r2 = wcstombs(command, _PyOS_optarg, r1);
if (r2 > r1-1)
Py_FatalError(
"not enough memory to copy -c argument");
strcat(command, "\n");
setlocale(LC_ALL, oldloc);
wcscpy(command, _PyOS_optarg);
command[len - 2] = '\n';
command[len - 1] = 0;
break;
}

Expand Down Expand Up @@ -543,8 +531,18 @@ Py_Main(int argc, wchar_t **argv)
}

if (command) {
sts = PyRun_SimpleStringFlags(command, &cf) != 0;
PyObject *commandObj = PyUnicode_FromWideChar(
command, wcslen(command));
free(command);
if (commandObj != NULL) {
sts = PyRun_SimpleStringFlags(
_PyUnicode_AsString(commandObj), &cf) != 0;
}
else {
PyErr_Print();
sts = 1;
}
Py_DECREF(commandObj);
} else if (module) {
sts = RunModule(module, 1);
}
Expand Down
11 changes: 7 additions & 4 deletions Python/import.c
Original file line number Diff line number Diff line change
Expand Up @@ -2793,6 +2793,7 @@ call_find_module(char *name, PyObject *path)
{
extern int fclose(FILE *);
PyObject *fob, *ret;
PyObject *pathobj;
struct filedescr *fdp;
char pathname[MAXPATHLEN+1];
FILE *fp = NULL;
Expand Down Expand Up @@ -2836,9 +2837,9 @@ call_find_module(char *name, PyObject *path)
fob = Py_None;
Py_INCREF(fob);
}
ret = Py_BuildValue("Os(ssi)",
fob, pathname, fdp->suffix, fdp->mode, fdp->type);
Py_DECREF(fob);
pathobj = PyUnicode_DecodeFSDefault(pathname);
ret = Py_BuildValue("NN(ssi)",
fob, pathobj, fdp->suffix, fdp->mode, fdp->type);
PyMem_FREE(found_encoding);

return ret;
Expand All @@ -2849,7 +2850,9 @@ imp_find_module(PyObject *self, PyObject *args)
{
char *name;
PyObject *path = NULL;
if (!PyArg_ParseTuple(args, "s|O:find_module", &name, &path))
if (!PyArg_ParseTuple(args, "es|O:find_module",
Py_FileSystemDefaultEncoding, &name,
&path))
return NULL;
return call_find_module(name, path);
}
Expand Down

0 comments on commit 9a5499b

Please sign in to comment.