getpathp.c 30 KB
Newer Older
1 2

/* Return the initial module search path. */
3
/* Used by DOS, Windows 3.1, Windows 95/98, Windows NT. */
4

5 6
/* ----------------------------------------------------------------
   PATH RULES FOR WINDOWS:
7 8
   This describes how sys.path is formed on Windows.  It describes the
   functionality, not the implementation (ie, the order in which these
9 10 11
   are actually fetched is different). The presence of a python._pth or
   pythonXY._pth file alongside the program overrides these rules - see
   below.
12 13 14 15

   * Python always adds an empty entry at the start, which corresponds
     to the current directory.

16
   * If the PYTHONPATH env. var. exists, its entries are added next.
17 18 19 20 21 22 23 24 25 26 27

   * We look in the registry for "application paths" - that is, sub-keys
     under the main PythonPath registry key.  These are added next (the
     order of sub-key processing is undefined).
     HKEY_CURRENT_USER is searched and added first.
     HKEY_LOCAL_MACHINE is searched and added next.
     (Note that all known installers only use HKLM, so HKCU is typically
     empty)

   * We attempt to locate the "Python Home" - if the PYTHONHOME env var
     is set, we believe it.  Otherwise, we use the path of our host .EXE's
Martin Panter's avatar
Martin Panter committed
28
     to try and locate one of our "landmarks" and deduce our home.
29
     - If we DO have a Python Home: The relevant sub-directories (Lib,
30
       DLLs, etc) are based on the Python Home
31
     - If we DO NOT have a Python Home, the core Python Path is
32
       loaded from the registry.  This is the main PythonPath key,
33 34 35 36
       and both HKLM and HKCU are combined to form the path)

   * Iff - we can not locate the Python Home, have not had a PYTHONPATH
     specified, and can't locate any Registry entries (ie, we have _nothing_
37
     we can assume is a good path), a default path with relative entries is
38
     used (eg. .\Lib;.\DLLs, etc)
39 40


41 42 43 44 45 46 47 48 49 50 51 52 53 54 55
   If a '._pth' file exists adjacent to the executable with the same base name
   (e.g. python._pth adjacent to python.exe) or adjacent to the shared library
   (e.g. python36._pth adjacent to python36.dll), it is used in preference to
   the above process. The shared library file takes precedence over the
   executable. The path file must contain a list of paths to add to sys.path,
   one per line. Each path is relative to the directory containing the file.
   Blank lines and comments beginning with '#' are permitted.

   In the presence of this ._pth file, no other paths are added to the search
   path, the registry finder is not enabled, site.py is not imported and
   isolated mode is enabled. The site package can be enabled by including a
   line reading "import site"; no other imports are recognized. Any invalid
   entry (other than directories that do not exist) will result in immediate
   termination of the program.

56

57 58 59 60 61 62
  The end result of all this is:
  * When running python.exe, or any other .exe in the main Python directory
    (either an installed version, or directly from the PCbuild directory),
    the core path is deduced, and the core paths in the registry are
    ignored.  Other "application paths" in the registry are always read.

63
  * When Python is hosted in another exe (different directory, embedded via
64
    COM, etc), the Python Home will not be deduced, so the core path from
65
    the registry is used.  Other "application paths" in the registry are
66 67 68 69 70 71
    always read.

  * If Python can't find its home and there is no registry (eg, frozen
    exe, some very strange installation setup) you get a path with
    some default, but relative, paths.

Kristján Valur Jónsson's avatar
Kristján Valur Jónsson committed
72
  * An embedding application can use Py_SetPath() to override all of
73 74
    these automatic path computations.

75 76 77
  * An install of Python can fully specify the contents of sys.path using
    either a 'EXENAME._pth' or 'DLLNAME._pth' file, optionally including
    "import site" to enable the site module.
Kristján Valur Jónsson's avatar
Kristján Valur Jónsson committed
78

79 80 81
   ---------------------------------------------------------------- */


82 83
#include "Python.h"
#include "osdefs.h"
84
#include <wchar.h>
85

86 87
#ifndef MS_WINDOWS
#error getpathp.c should only be built on Windows
88 89
#endif

90 91 92
#include <windows.h>
#include <Shlwapi.h>

93
#ifdef HAVE_SYS_TYPES_H
94
#include <sys/types.h>
95 96 97
#endif /* HAVE_SYS_TYPES_H */

#ifdef HAVE_SYS_STAT_H
98
#include <sys/stat.h>
99 100
#endif /* HAVE_SYS_STAT_H */

101 102 103 104 105 106
#include <string.h>

/* Search in some common locations for the associated Python libraries.
 *
 * Py_GetPath() tries to return a sensible Python module search path.
 *
107 108 109
 * The approach is an adaptation for Windows of the strategy used in
 * ../Modules/getpath.c; it uses the Windows Registry as one of its
 * information sources.
Kristján Valur Jónsson's avatar
Kristján Valur Jónsson committed
110 111 112
 *
 * Py_SetPath() can be used to override this mechanism.  Call Py_SetPath
 * with a semicolon separated path prior to calling Py_Initialize.
113 114 115
 */

#ifndef LANDMARK
116
#define LANDMARK L"lib\\os.py"
117 118
#endif

119 120 121 122
static wchar_t prefix[MAXPATHLEN+1];
static wchar_t progpath[MAXPATHLEN+1];
static wchar_t dllpath[MAXPATHLEN+1];
static wchar_t *module_search_path = NULL;
123

124

125
static int
126
is_sep(wchar_t ch)      /* determine if "ch" is a separator character */
127 128
{
#ifdef ALTSEP
129
    return ch == SEP || ch == ALTSEP;
130
#else
131
    return ch == SEP;
132 133 134
#endif
}

135 136 137
/* assumes 'dir' null terminated in bounds.  Never writes
   beyond existing terminator.
*/
138
static void
139
reduce(wchar_t *dir)
140
{
141 142 143 144
    size_t i = wcsnlen_s(dir, MAXPATHLEN+1);
    if (i >= MAXPATHLEN+1)
        Py_FatalError("buffer overflow in getpathp.c's reduce()");

145 146 147
    while (i > 0 && !is_sep(dir[i]))
        --i;
    dir[i] = '\0';
148
}
149

150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176
static int
change_ext(wchar_t *dest, const wchar_t *src, const wchar_t *ext)
{
    size_t src_len = wcsnlen_s(src, MAXPATHLEN+1);
    size_t i = src_len;
    if (i >= MAXPATHLEN+1)
        Py_FatalError("buffer overflow in getpathp.c's reduce()");

    while (i > 0 && src[i] != '.' && !is_sep(src[i]))
        --i;

    if (i == 0) {
        dest[0] = '\0';
        return -1;
    }

    if (is_sep(src[i]))
        i = src_len;

    if (wcsncpy_s(dest, MAXPATHLEN+1, src, i) ||
        wcscat_s(dest, MAXPATHLEN+1, ext)) {
        dest[0] = '\0';
        return -1;
    }

    return 0;
}
177 178

static int
179
exists(wchar_t *filename)
180
{
181
    return GetFileAttributesW(filename) != 0xFFFFFFFF;
182 183
}

184
/* Assumes 'filename' MAXPATHLEN+1 bytes long -
185 186
   may extend 'filename' by one character.
*/
187
static int
188
ismodule(wchar_t *filename, int update_filename) /* Is module -- check for .pyc too */
189
{
190
    size_t n;
191

192 193 194 195
    if (exists(filename))
        return 1;

    /* Check for the compiled version of prefix. */
196 197 198
    n = wcsnlen_s(filename, MAXPATHLEN+1);
    if (n < MAXPATHLEN) {
        int exist = 0;
199
        filename[n] = L'c';
200 201 202 203 204
        filename[n + 1] = L'\0';
        exist = exists(filename);
        if (!update_filename)
            filename[n] = L'\0';
        return exist;
205 206
    }
    return 0;
207 208
}

209 210 211 212 213 214 215 216 217
/* Add a path component, by appending stuff to buffer.
   buffer must have at least MAXPATHLEN + 1 bytes allocated, and contain a
   NUL-terminated string with no more than MAXPATHLEN characters (not counting
   the trailing NUL).  It's a fatal error if it contains a string longer than
   that (callers must be careful!).  If these requirements are met, it's
   guaranteed that buffer will still be a NUL-terminated string with no more
   than MAXPATHLEN characters at exit.  If stuff is too long, only as much of
   stuff as fits will be appended.
*/
218 219 220 221 222

static int _PathCchCombineEx_Initialized = 0;
typedef HRESULT(__stdcall *PPathCchCombineEx)(PWSTR pszPathOut, size_t cchPathOut, PCWSTR pszPathIn, PCWSTR pszMore, unsigned long dwFlags);
static PPathCchCombineEx _PathCchCombineEx;

223
static void
224
join(wchar_t *buffer, const wchar_t *stuff)
225
{
226 227 228 229 230 231 232
    if (_PathCchCombineEx_Initialized == 0) {
        HMODULE pathapi = LoadLibraryW(L"api-ms-win-core-path-l1-1-0.dll");
        if (pathapi)
            _PathCchCombineEx = (PPathCchCombineEx)GetProcAddress(pathapi, "PathCchCombineEx");
        else
            _PathCchCombineEx = NULL;
        _PathCchCombineEx_Initialized = 1;
233 234
    }

235 236 237 238
    if (_PathCchCombineEx) {
        if (FAILED(_PathCchCombineEx(buffer, MAXPATHLEN+1, buffer, stuff, 0)))
            Py_FatalError("buffer overflow in getpathp.c's join()");
    } else {
239
        if (!PathCombineW(buffer, buffer, stuff))
240
            Py_FatalError("buffer overflow in getpathp.c's join()");
241
    }
242 243
}

244 245 246 247
/* gotlandmark only called by search_for_prefix, which ensures
   'prefix' is null terminated in bounds.  join() ensures
   'landmark' can not overflow prefix if too long.
*/
248
static int
249
gotlandmark(const wchar_t *landmark)
250
{
251
    int ok;
252
    Py_ssize_t n = wcsnlen_s(prefix, MAXPATHLEN);
253 254

    join(prefix, landmark);
255
    ok = ismodule(prefix, FALSE);
256 257
    prefix[n] = '\0';
    return ok;
258 259
}

260
/* assumes argv0_path is MAXPATHLEN+1 bytes long, already \0 term'd.
261
   assumption provided by only caller, calculate_path() */
262
static int
263
search_for_prefix(wchar_t *argv0_path, const wchar_t *landmark)
264
{
265
    /* Search from argv0_path, until landmark is found */
266
    wcscpy_s(prefix, MAXPATHLEN + 1, argv0_path);
267 268 269 270 271 272
    do {
        if (gotlandmark(landmark))
            return 1;
        reduce(prefix);
    } while (prefix[0]);
    return 0;
273 274
}

275
#ifdef Py_ENABLE_SHARED
276

277 278
/* a string loaded from the DLL at startup.*/
extern const char *PyWin_DLLVersionString;
279

280 281 282 283

/* Load a PYTHONPATH value from the registry.
   Load from either HKEY_LOCAL_MACHINE or HKEY_CURRENT_USER.

284 285 286
   Works in both Unicode and 8bit environments.  Only uses the
   Ex family of functions so it also works with Windows CE.

287
   Returns NULL, or a pointer that should be freed.
288 289 290 291

   XXX - this code is pretty strange, as it used to also
   work on Win16, where the buffer sizes werent available
   in advance.  It could be simplied now Win16/Win32s is dead!
292 293
*/

294
static wchar_t *
295
getpythonregpath(HKEY keyBase, int skipcore)
296
{
297 298 299 300 301 302 303 304
    HKEY newKey = 0;
    DWORD dataSize = 0;
    DWORD numKeys = 0;
    LONG rc;
    wchar_t *retval = NULL;
    WCHAR *dataBuf = NULL;
    static const WCHAR keyPrefix[] = L"Software\\Python\\PythonCore\\";
    static const WCHAR keySuffix[] = L"\\PythonPath";
305
    size_t versionLen, keyBufLen;
306 307 308 309 310 311 312 313
    DWORD index;
    WCHAR *keyBuf = NULL;
    WCHAR *keyBufPtr;
    WCHAR **ppPaths = NULL;

    /* Tried to use sysget("winver") but here is too early :-( */
    versionLen = strlen(PyWin_DLLVersionString);
    /* Space for all the chars, plus one \0 */
314 315 316 317
    keyBufLen = sizeof(keyPrefix) +
                sizeof(WCHAR)*(versionLen-1) +
                sizeof(keySuffix);
    keyBuf = keyBufPtr = PyMem_RawMalloc(keyBufLen);
318 319
    if (keyBuf==NULL) goto done;

320
    memcpy_s(keyBufPtr, keyBufLen, keyPrefix, sizeof(keyPrefix)-sizeof(WCHAR));
321
    keyBufPtr += Py_ARRAY_LENGTH(keyPrefix) - 1;
322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340
    mbstowcs(keyBufPtr, PyWin_DLLVersionString, versionLen);
    keyBufPtr += versionLen;
    /* NULL comes with this one! */
    memcpy(keyBufPtr, keySuffix, sizeof(keySuffix));
    /* Open the root Python key */
    rc=RegOpenKeyExW(keyBase,
                    keyBuf, /* subkey */
            0, /* reserved */
            KEY_READ,
            &newKey);
    if (rc!=ERROR_SUCCESS) goto done;
    /* Find out how big our core buffer is, and how many subkeys we have */
    rc = RegQueryInfoKey(newKey, NULL, NULL, NULL, &numKeys, NULL, NULL,
                    NULL, NULL, &dataSize, NULL, NULL);
    if (rc!=ERROR_SUCCESS) goto done;
    if (skipcore) dataSize = 0; /* Only count core ones if we want them! */
    /* Allocate a temp array of char buffers, so we only need to loop
       reading the registry once
    */
341
    ppPaths = PyMem_RawMalloc( sizeof(WCHAR *) * numKeys );
342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362
    if (ppPaths==NULL) goto done;
    memset(ppPaths, 0, sizeof(WCHAR *) * numKeys);
    /* Loop over all subkeys, allocating a temp sub-buffer. */
    for(index=0;index<numKeys;index++) {
        WCHAR keyBuf[MAX_PATH+1];
        HKEY subKey = 0;
        DWORD reqdSize = MAX_PATH+1;
        /* Get the sub-key name */
        DWORD rc = RegEnumKeyExW(newKey, index, keyBuf, &reqdSize,
                                 NULL, NULL, NULL, NULL );
        if (rc!=ERROR_SUCCESS) goto done;
        /* Open the sub-key */
        rc=RegOpenKeyExW(newKey,
                                        keyBuf, /* subkey */
                        0, /* reserved */
                        KEY_READ,
                        &subKey);
        if (rc!=ERROR_SUCCESS) goto done;
        /* Find the value of the buffer size, malloc, then read it */
        RegQueryValueExW(subKey, NULL, 0, NULL, NULL, &reqdSize);
        if (reqdSize) {
363
            ppPaths[index] = PyMem_RawMalloc(reqdSize);
364 365 366 367 368 369 370 371 372 373 374 375 376 377
            if (ppPaths[index]) {
                RegQueryValueExW(subKey, NULL, 0, NULL,
                                (LPBYTE)ppPaths[index],
                                &reqdSize);
                dataSize += reqdSize + 1; /* 1 for the ";" */
            }
        }
        RegCloseKey(subKey);
    }

    /* return null if no path to return */
    if (dataSize == 0) goto done;

    /* original datasize from RegQueryInfo doesn't include the \0 */
378
    dataBuf = PyMem_RawMalloc((dataSize+1) * sizeof(WCHAR));
379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407
    if (dataBuf) {
        WCHAR *szCur = dataBuf;
        /* Copy our collected strings */
        for (index=0;index<numKeys;index++) {
            if (index > 0) {
                *(szCur++) = L';';
                dataSize--;
            }
            if (ppPaths[index]) {
                Py_ssize_t len = wcslen(ppPaths[index]);
                wcsncpy(szCur, ppPaths[index], len);
                szCur += len;
                assert(dataSize > (DWORD)len);
                dataSize -= (DWORD)len;
            }
        }
        if (skipcore)
            *szCur = '\0';
        else {
            /* If we have no values, we dont need a ';' */
            if (numKeys) {
                *(szCur++) = L';';
                dataSize--;
            }
            /* Now append the core path entries -
               this will include the NULL
            */
            rc = RegQueryValueExW(newKey, NULL, 0, NULL,
                                  (LPBYTE)szCur, &dataSize);
408 409 410 411
            if (rc != ERROR_SUCCESS) {
                PyMem_RawFree(dataBuf);
                goto done;
            }
412 413 414 415
        }
        /* And set the result - caller must free */
        retval = dataBuf;
    }
416
done:
417 418
    /* Loop freeing my temp buffers */
    if (ppPaths) {
419 420 421
        for(index=0; index<numKeys; index++)
            PyMem_RawFree(ppPaths[index]);
        PyMem_RawFree(ppPaths);
422 423 424
    }
    if (newKey)
        RegCloseKey(newKey);
425
    PyMem_RawFree(keyBuf);
426
    return retval;
427
}
428
#endif /* Py_ENABLE_SHARED */
429

430
static void
431
get_progpath(void)
432
{
433 434 435
    extern wchar_t *Py_GetProgramName(void);
    wchar_t *path = _wgetenv(L"PATH");
    wchar_t *prog = Py_GetProgramName();
436

437
#ifdef Py_ENABLE_SHARED
438 439 440 441 442
    extern HANDLE PyWin_DLLhModule;
    /* static init of progpath ensures final char remains \0 */
    if (PyWin_DLLhModule)
        if (!GetModuleFileNameW(PyWin_DLLhModule, dllpath, MAXPATHLEN))
            dllpath[0] = 0;
443
#else
444
    dllpath[0] = 0;
445
#endif
446 447 448 449 450 451 452 453 454 455
    if (GetModuleFileNameW(NULL, progpath, MAXPATHLEN))
        return;
    if (prog == NULL || *prog == '\0')
        prog = L"python";

    /* If there is no slash in the argv0 path, then we have to
     * assume python is on the user's $PATH, since there's no
     * other way to find a directory to start the search from.  If
     * $PATH isn't exported, you lose.
     */
456
#ifdef ALTSEP
457
    if (wcschr(prog, SEP) || wcschr(prog, ALTSEP))
458
#else
459
    if (wcschr(prog, SEP))
460
#endif
461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489
        wcsncpy(progpath, prog, MAXPATHLEN);
    else if (path) {
        while (1) {
            wchar_t *delim = wcschr(path, DELIM);

            if (delim) {
                size_t len = delim - path;
                /* ensure we can't overwrite buffer */
                len = min(MAXPATHLEN,len);
                wcsncpy(progpath, path, len);
                *(progpath + len) = '\0';
            }
            else
                wcsncpy(progpath, path, MAXPATHLEN);

            /* join() is safe for MAXPATHLEN+1 size buffer */
            join(progpath, prog);
            if (exists(progpath))
                break;

            if (!delim) {
                progpath[0] = '\0';
                break;
            }
            path = delim + 1;
        }
    }
    else
        progpath[0] = '\0';
490 491
}

492 493 494 495 496 497 498 499 500 501 502
static int
find_env_config_value(FILE * env_file, const wchar_t * key, wchar_t * value)
{
    int result = 0; /* meaning not found */
    char buffer[MAXPATHLEN*2+1];  /* allow extra for key, '=', etc. */

    fseek(env_file, 0, SEEK_SET);
    while (!feof(env_file)) {
        char * p = fgets(buffer, MAXPATHLEN*2, env_file);
        wchar_t tmpbuffer[MAXPATHLEN*2+1];
        PyObject * decoded;
503
        size_t n;
504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520

        if (p == NULL)
            break;
        n = strlen(p);
        if (p[n - 1] != '\n') {
            /* line has overflowed - bail */
            break;
        }
        if (p[0] == '#')    /* Comment - skip */
            continue;
        decoded = PyUnicode_DecodeUTF8(buffer, n, "surrogateescape");
        if (decoded != NULL) {
            Py_ssize_t k;
            k = PyUnicode_AsWideChar(decoded,
                                     tmpbuffer, MAXPATHLEN * 2);
            Py_DECREF(decoded);
            if (k >= 0) {
521 522
                wchar_t * context = NULL;
                wchar_t * tok = wcstok_s(tmpbuffer, L" \t\r\n", &context);
523
                if ((tok != NULL) && !wcscmp(tok, key)) {
524
                    tok = wcstok_s(NULL, L" \t", &context);
525
                    if ((tok != NULL) && !wcscmp(tok, L"=")) {
526
                        tok = wcstok_s(NULL, L"\r\n", &context);
527 528 529 530 531 532 533 534 535 536 537 538 539
                        if (tok != NULL) {
                            wcsncpy(value, tok, MAXPATHLEN);
                            result = 1;
                            break;
                        }
                    }
                }
            }
        }
    }
    return result;
}

540
static int
541
read_pth_file(const wchar_t *path, wchar_t *prefix, int *isolated, int *nosite)
542 543 544 545 546
{
    FILE *sp_file = _Py_wfopen(path, L"r");
    if (sp_file == NULL)
        return -1;

547 548 549 550 551
    wcscpy_s(prefix, MAXPATHLEN+1, path);
    reduce(prefix);
    *isolated = 1;
    *nosite = 1;

552 553 554 555 556 557 558 559 560 561 562
    size_t bufsiz = MAXPATHLEN;
    size_t prefixlen = wcslen(prefix);

    wchar_t *buf = (wchar_t*)PyMem_RawMalloc(bufsiz * sizeof(wchar_t));
    buf[0] = '\0';

    while (!feof(sp_file)) {
        char line[MAXPATHLEN + 1];
        char *p = fgets(line, MAXPATHLEN + 1, sp_file);
        if (!p)
            break;
563
        if (*p == '\0' || *p == '\r' || *p == '\n' || *p == '#')
564 565 566 567 568 569 570
            continue;
        while (*++p) {
            if (*p == '\r' || *p == '\n') {
                *p = '\0';
                break;
            }
        }
571

572 573 574 575 576 577
        if (strcmp(line, "import site") == 0) {
            *nosite = 0;
            continue;
        } else if (strncmp(line, "import ", 7) == 0) {
            Py_FatalError("only 'import site' is supported in ._pth file");
        }
578

579
        DWORD wn = MultiByteToWideChar(CP_UTF8, 0, line, -1, NULL, 0);
580
        wchar_t *wline = (wchar_t*)PyMem_RawMalloc((wn + 1) * sizeof(wchar_t));
581
        wn = MultiByteToWideChar(CP_UTF8, 0, line, -1, wline, wn + 1);
582 583
        wline[wn] = '\0';

584 585
        size_t usedsiz = wcslen(buf);
        while (usedsiz + wn + prefixlen + 4 > bufsiz) {
586 587 588 589 590 591 592 593
            bufsiz += MAXPATHLEN;
            buf = (wchar_t*)PyMem_RawRealloc(buf, (bufsiz + 1) * sizeof(wchar_t));
            if (!buf) {
                PyMem_RawFree(wline);
                goto error;
            }
        }

594
        if (usedsiz) {
595
            wcscat_s(buf, bufsiz, L";");
596 597
            usedsiz += 1;
        }
598

599 600 601 602 603 604 605 606 607 608
        errno_t result;
        _Py_BEGIN_SUPPRESS_IPH
        result = wcscat_s(buf, bufsiz, prefix);
        _Py_END_SUPPRESS_IPH
        if (result == EINVAL) {
            Py_FatalError("invalid argument during ._pth processing");
        } else if (result == ERANGE) {
            Py_FatalError("buffer overflow during ._pth processing");
        }
        wchar_t *b = &buf[usedsiz];
609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625
        join(b, wline);

        PyMem_RawFree(wline);
    }

    module_search_path = buf;

    fclose(sp_file);
    return 0;

error:
    PyMem_RawFree(buf);
    fclose(sp_file);
    return -1;
}


626
static void
627
calculate_path(void)
628
{
629 630 631 632 633
    wchar_t argv0_path[MAXPATHLEN+1];
    wchar_t *buf;
    size_t bufsz;
    wchar_t *pythonhome = Py_GetPythonHome();
    wchar_t *envpath = NULL;
634

635 636 637 638 639 640 641 642
    int skiphome, skipdefault;
    wchar_t *machinepath = NULL;
    wchar_t *userpath = NULL;
    wchar_t zip_path[MAXPATHLEN+1];

    if (!Py_IgnoreEnvironmentFlag) {
        envpath = _wgetenv(L"PYTHONPATH");
    }
643

644 645
    get_progpath();
    /* progpath guaranteed \0 terminated in MAXPATH+1 bytes. */
646
    wcscpy_s(argv0_path, MAXPATHLEN+1, progpath);
647
    reduce(argv0_path);
648

649 650 651 652
    /* Search for a sys.path file */
    {
        wchar_t spbuffer[MAXPATHLEN+1];

653 654 655 656 657 658
        if ((dllpath[0] && !change_ext(spbuffer, dllpath, L"._pth") && exists(spbuffer)) ||
            (progpath[0] && !change_ext(spbuffer, progpath, L"._pth") && exists(spbuffer))) {

            if (!read_pth_file(spbuffer, prefix, &Py_IsolatedFlag, &Py_NoSiteFlag)) {
                return;
            }
659 660 661
        }
    }

662 663 664 665 666 667
    /* Search for an environment configuration file, first in the
       executable's directory and then in the parent directory.
       If found, open it for use when searching for prefixes.
    */

    {
668
        wchar_t envbuffer[MAXPATHLEN+1];
669
        wchar_t tmpbuffer[MAXPATHLEN+1];
670
        const wchar_t *env_cfg = L"pyvenv.cfg";
671 672
        FILE * env_file = NULL;

673 674 675
        wcscpy_s(envbuffer, MAXPATHLEN+1, argv0_path);
        join(envbuffer, env_cfg);
        env_file = _Py_wfopen(envbuffer, L"r");
676 677
        if (env_file == NULL) {
            errno = 0;
678 679 680 681
            reduce(envbuffer);
            reduce(envbuffer);
            join(envbuffer, env_cfg);
            env_file = _Py_wfopen(envbuffer, L"r");
682 683 684 685 686 687 688
            if (env_file == NULL) {
                errno = 0;
            }
        }
        if (env_file != NULL) {
            /* Look for a 'home' variable and set argv0_path to it, if found */
            if (find_env_config_value(env_file, L"home", tmpbuffer)) {
689
                wcscpy_s(argv0_path, MAXPATHLEN+1, tmpbuffer);
690 691 692 693 694 695
            }
            fclose(env_file);
            env_file = NULL;
        }
    }

696
    /* Calculate zip archive path from DLL or exe path */
697
    change_ext(zip_path, dllpath[0] ? dllpath : progpath, L".zip");
698

699
    if (pythonhome == NULL || *pythonhome == '\0') {
700 701 702 703 704
        if (zip_path[0] && exists(zip_path)) {
            wcscpy_s(prefix, MAXPATHLEN+1, zip_path);
            reduce(prefix);
            pythonhome = prefix;
        } else if (search_for_prefix(argv0_path, LANDMARK))
705 706 707 708 709
            pythonhome = prefix;
        else
            pythonhome = NULL;
    }
    else
710
        wcscpy_s(prefix, MAXPATHLEN+1, pythonhome);
711

712 713
    if (envpath && *envpath == '\0')
        envpath = NULL;
714

715

716
    skiphome = pythonhome==NULL ? 0 : 1;
717
#ifdef Py_ENABLE_SHARED
718 719
    machinepath = getpythonregpath(HKEY_LOCAL_MACHINE, skiphome);
    userpath = getpythonregpath(HKEY_CURRENT_USER, skiphome);
720
#endif
721 722 723 724
    /* We only use the default relative PYTHONPATH if we havent
       anything better to use! */
    skipdefault = envpath!=NULL || pythonhome!=NULL || \
                  machinepath!=NULL || userpath!=NULL;
725

726 727 728 729 730 731 732 733 734 735 736 737 738 739 740 741 742 743 744 745 746
    /* We need to construct a path from the following parts.
       (1) the PYTHONPATH environment variable, if set;
       (2) for Win32, the zip archive file path;
       (3) for Win32, the machinepath and userpath, if set;
       (4) the PYTHONPATH config macro, with the leading "."
           of each component replaced with pythonhome, if set;
       (5) the directory containing the executable (argv0_path).
       The length calculation calculates #4 first.
       Extra rules:
       - If PYTHONHOME is set (in any way) item (3) is ignored.
       - If registry values are used, (4) and (5) are ignored.
    */

    /* Calculate size of return buffer */
    if (pythonhome != NULL) {
        wchar_t *p;
        bufsz = 1;
        for (p = PYTHONPATH; *p; p++) {
            if (*p == DELIM)
                bufsz++; /* number of DELIM plus one */
        }
747
        bufsz *= wcslen(pythonhome);
748 749 750
    }
    else
        bufsz = 0;
751 752
    bufsz += wcslen(PYTHONPATH) + 1;
    bufsz += wcslen(argv0_path) + 1;
753
    if (userpath)
754
        bufsz += wcslen(userpath) + 1;
755
    if (machinepath)
756 757
        bufsz += wcslen(machinepath) + 1;
    bufsz += wcslen(zip_path) + 1;
758
    if (envpath != NULL)
759
        bufsz += wcslen(envpath) + 1;
760

761
    module_search_path = buf = PyMem_RawMalloc(bufsz*sizeof(wchar_t));
762 763 764 765 766 767 768 769 770 771 772
    if (buf == NULL) {
        /* We can't exit, so print a warning and limp along */
        fprintf(stderr, "Can't malloc dynamic PYTHONPATH.\n");
        if (envpath) {
            fprintf(stderr, "Using environment $PYTHONPATH.\n");
            module_search_path = envpath;
        }
        else {
            fprintf(stderr, "Using default static path.\n");
            module_search_path = PYTHONPATH;
        }
773 774
        PyMem_RawFree(machinepath);
        PyMem_RawFree(userpath);
775 776 777 778
        return;
    }

    if (envpath) {
779 780
        if (wcscpy_s(buf, bufsz - (buf - module_search_path), envpath))
            Py_FatalError("buffer overflow in getpathp.c's calculate_path()");
781 782 783 784
        buf = wcschr(buf, L'\0');
        *buf++ = DELIM;
    }
    if (zip_path[0]) {
785 786
        if (wcscpy_s(buf, bufsz - (buf - module_search_path), zip_path))
            Py_FatalError("buffer overflow in getpathp.c's calculate_path()");
787 788 789 790
        buf = wcschr(buf, L'\0');
        *buf++ = DELIM;
    }
    if (userpath) {
791 792
        if (wcscpy_s(buf, bufsz - (buf - module_search_path), userpath))
            Py_FatalError("buffer overflow in getpathp.c's calculate_path()");
793 794
        buf = wcschr(buf, L'\0');
        *buf++ = DELIM;
795
        PyMem_RawFree(userpath);
796 797
    }
    if (machinepath) {
798 799
        if (wcscpy_s(buf, bufsz - (buf - module_search_path), machinepath))
            Py_FatalError("buffer overflow in getpathp.c's calculate_path()");
800 801
        buf = wcschr(buf, L'\0');
        *buf++ = DELIM;
802
        PyMem_RawFree(machinepath);
803 804 805
    }
    if (pythonhome == NULL) {
        if (!skipdefault) {
806 807
            if (wcscpy_s(buf, bufsz - (buf - module_search_path), PYTHONPATH))
                Py_FatalError("buffer overflow in getpathp.c's calculate_path()");
808
            buf = wcschr(buf, L'\0');
809
            *buf++ = DELIM;
810
        }
811
    } else {
812 813 814 815 816 817 818 819 820 821
        wchar_t *p = PYTHONPATH;
        wchar_t *q;
        size_t n;
        for (;;) {
            q = wcschr(p, DELIM);
            if (q == NULL)
                n = wcslen(p);
            else
                n = q-p;
            if (p[0] == '.' && is_sep(p[1])) {
822 823
                if (wcscpy_s(buf, bufsz - (buf - module_search_path), pythonhome))
                    Py_FatalError("buffer overflow in getpathp.c's calculate_path()");
824 825 826 827 828 829
                buf = wcschr(buf, L'\0');
                p++;
                n--;
            }
            wcsncpy(buf, p, n);
            buf += n;
830
            *buf++ = DELIM;
831 832 833 834 835 836 837 838
            if (q == NULL)
                break;
            p = q+1;
        }
    }
    if (argv0_path) {
        wcscpy(buf, argv0_path);
        buf = wcschr(buf, L'\0');
839
        *buf++ = DELIM;
840
    }
841
    *(buf - 1) = L'\0';
842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863 864 865 866 867 868 869 870 871 872 873 874 875
    /* Now to pull one last hack/trick.  If sys.prefix is
       empty, then try and find it somewhere on the paths
       we calculated.  We scan backwards, as our general policy
       is that Python core directories are at the *end* of
       sys.path.  We assume that our "lib" directory is
       on the path, and that our 'prefix' directory is
       the parent of that.
    */
    if (*prefix==L'\0') {
        wchar_t lookBuf[MAXPATHLEN+1];
        wchar_t *look = buf - 1; /* 'buf' is at the end of the buffer */
        while (1) {
            Py_ssize_t nchars;
            wchar_t *lookEnd = look;
            /* 'look' will end up one character before the
               start of the path in question - even if this
               is one character before the start of the buffer
            */
            while (look >= module_search_path && *look != DELIM)
                look--;
            nchars = lookEnd-look;
            wcsncpy(lookBuf, look+1, nchars);
            lookBuf[nchars] = L'\0';
            /* Up one level to the parent */
            reduce(lookBuf);
            if (search_for_prefix(lookBuf, LANDMARK)) {
                break;
            }
            /* If we are out of paths to search - give up */
            if (look < module_search_path)
                break;
            look--;
        }
    }
876 877 878 879 880
}


/* External interface */

Kristján Valur Jónsson's avatar
Kristján Valur Jónsson committed
881 882 883 884
void
Py_SetPath(const wchar_t *path)
{
    if (module_search_path != NULL) {
885
        PyMem_RawFree(module_search_path);
Kristján Valur Jónsson's avatar
Kristján Valur Jónsson committed
886 887 888 889 890 891 892
        module_search_path = NULL;
    }
    if (path != NULL) {
        extern wchar_t *Py_GetProgramName(void);
        wchar_t *prog = Py_GetProgramName();
        wcsncpy(progpath, prog, MAXPATHLEN);
        prefix[0] = L'\0';
893
        module_search_path = PyMem_RawMalloc((wcslen(path) + 1) * sizeof(wchar_t));
Kristján Valur Jónsson's avatar
Kristján Valur Jónsson committed
894 895
        if (module_search_path != NULL)
            wcscpy(module_search_path, path);
896
    }
Kristján Valur Jónsson's avatar
Kristján Valur Jónsson committed
897 898
}

899
wchar_t *
900
Py_GetPath(void)
901
{
902 903 904
    if (!module_search_path)
        calculate_path();
    return module_search_path;
905 906
}

907
wchar_t *
908
Py_GetPrefix(void)
909
{
910 911 912
    if (!module_search_path)
        calculate_path();
    return prefix;
913 914
}

915
wchar_t *
916
Py_GetExecPrefix(void)
917
{
918
    return Py_GetPrefix();
919 920
}

921
wchar_t *
922
Py_GetProgramFullPath(void)
923
{
924 925 926
    if (!module_search_path)
        calculate_path();
    return progpath;
927
}
928

929 930
/* Load python3.dll before loading any extension module that might refer
   to it. That way, we can be sure that always the python3.dll corresponding
931 932 933 934 935 936 937 938 939 940 941 942 943 944 945 946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962
   to this python DLL is loaded, not a python3.dll that might be on the path
   by chance.
   Return whether the DLL was found.
*/
static int python3_checked = 0;
static HANDLE hPython3;
int
_Py_CheckPython3()
{
    wchar_t py3path[MAXPATHLEN+1];
    wchar_t *s;
    if (python3_checked)
        return hPython3 != NULL;
    python3_checked = 1;

    /* If there is a python3.dll next to the python3y.dll,
       assume this is a build tree; use that DLL */
    wcscpy(py3path, dllpath);
    s = wcsrchr(py3path, L'\\');
    if (!s)
        s = py3path;
    wcscpy(s, L"\\python3.dll");
    hPython3 = LoadLibraryExW(py3path, NULL, LOAD_WITH_ALTERED_SEARCH_PATH);
    if (hPython3 != NULL)
        return 1;

    /* Check sys.prefix\DLLs\python3.dll */
    wcscpy(py3path, Py_GetPrefix());
    wcscat(py3path, L"\\DLLs\\python3.dll");
    hPython3 = LoadLibraryExW(py3path, NULL, LOAD_WITH_ALTERED_SEARCH_PATH);
    return hPython3 != NULL;
}