@@ -313,7 +313,7 @@ def _host_toolchain_impl(rctx):
313313 rctx .file ("BUILD.bazel" , _HOST_TOOLCHAIN_BUILD_CONTENT )
314314
315315 os_name = repo_utils .get_platforms_os_name (rctx )
316- host_platform = _get_host_platform (
316+ host_platform = _get_host_impl_repo_suffix (
317317 rctx = rctx ,
318318 logger = repo_utils .logger (rctx ),
319319 python_version = rctx .attr .python_version ,
@@ -386,7 +386,27 @@ Creates a repository with a shorter name meant to be used in the repository_ctx,
386386which needs to have `symlinks` for the interpreter. This is separate from the
387387toolchain_aliases repo because referencing the `python` interpreter target from
388388this repo causes an eager fetch of the toolchain for the host platform.
389- """ ,
389+
390+ This repo has three different ways in which it is called:
391+
392+ 1. Workspace. The `platforms` attribute is set, which are keys into the
393+ PLATFORMS global. It assumes `name` + <matching platform name> is a
394+ valid repo name which it can use as the backing repo.
395+
396+ 2. Bzlmod, created alongside when python_register_toolchains is called
397+ and expected to use one of the repos created as part of that
398+ python_register_toolchains call.
399+ Because the bzlmod extension decides the platform mapping, it is given
400+ the `platforms`, `os_names`, and `archs` attributes to figure out which
401+ to use.
402+
403+ 3. Bzlmod, created when the initial python_register_toolchains didn't
404+ have a host-compatible runtime, so a different host-compatible
405+ implementation was used.
406+ This is like the normal bzlmod creation, except the python_versions
407+ and suffixes may vary between choices, so the `impl_repo_suffixes` and
408+ `python_versions` attributes are specified.
409+ """ ,
390410 attrs = {
391411 "archs" : attr .string_dict (
392412 doc = """
@@ -398,8 +418,43 @@ If set, overrides the platform metadata. Keyed by index in `platforms`
398418If set, overrides the platform metadata. Keyed by index in `platforms`
399419""" ,
400420 ),
401- "platforms" : attr .string_list (mandatory = True ),
402- "python_version" : attr .string (mandatory = True ),
421+ "platforms" : attr .string_list (
422+ mandatory = True ,
423+ doc = """
424+ Platform names and backing repo-suffix.
425+
426+ NOTE: The order of this list matters. The first platform that is compatible
427+ with the host will be selected; this can be customized by using the
428+ `RULES_PYTHON_REPO_TOOLCHAIN_*` env vars.
429+
430+ When os_names isn't set, they act as keys into the PLATFORMS
431+ dict to determine if a platform is compatible with the host. When
432+ os_names is set, then it is a (mostly) arbitrary platform name string
433+ (and platform metadata comes from the os_names/archs args).
434+
435+ The string is used as a suffix to create the name of the repo that
436+ should be pointed to. i.e. `name` + <selected platform string> should
437+ result in a valid repo (e.g. created by python_register_toolchains()).
438+ Under bzlmod, this also means the same extension must create the
439+ repo named `name+suffix` and the host_toolchain repo.
440+ """ ,
441+ ),
442+ "python_version" : attr .string (
443+ mandatory = True ,
444+ doc = "Full python version, Major.Minor.Micro" ,
445+ ),
446+ "python_versions" : attr .string_dict (
447+ doc = """
448+ If set, the Python version for the corresponding selected platform.
449+ Keyed by index in `platforms`. Values are of the form Major.Minor.Patch.
450+ """ ,
451+ ),
452+ "impl_repo_suffixes" : attr .string_dict (
453+ doc = """
454+ If set, the suffix to append to `name` to identify the backing repo that is used.
455+ Keyed by index in `platforms`.
456+ """ ,
457+ ),
403458 "_rule_name" : attr .string (default = "host_toolchain" ),
404459 "_rules_python_workspace" : attr .label (default = Label ("//:WORKSPACE" )),
405460 },
@@ -438,8 +493,8 @@ multi_toolchain_aliases = repository_rule(
438493def sanitize_platform_name (platform ):
439494 return platform .replace ("-" , "_" )
440495
441- def sorted_host_platforms ( platform_map ):
442- """Sort the keys in the platform map to give correct precedence.
def sorted_host_platform_names(platform_names):
    """Sort platform names to give correct precedence.

    The order of platform names matters for the host toolchain selection:
    when multiple runtimes are compatible with the host, the earliest one
    is taken. Sorting explicitly here avoids relying on the order in which
    entries happen to be written in a dict, which autoformatters like to
    clobber and whose only documentation is an innocuous-looking formatter
    disable directive.

    Precedence, from highest to lowest:
      1. Names that end in neither "-" + FREETHREADED nor "-" + MUSL.
      2. Names ending in "-" + FREETHREADED.
      3. Names ending in "-" + MUSL.
    Names with equal precedence are ordered lexicographically.

    Args:
        platform_names: a list of platform names

    Returns:
        list[str] the same values, but in the desired order.
    """

    def platform_keyer(name):
        # Ascending sort: lower is higher precedence
        pref = 0
        if name.endswith("-" + FREETHREADED):
            pref = 1
        elif name.endswith("-" + MUSL):
            pref = 2

        # The name itself is the tie-breaker within a precedence level.
        return (pref, name)

    # Sort the names that were passed in; `platform_map` is not defined in
    # this function, so it must not be referenced here.
    return sorted(platform_names, key = platform_keyer)
530+
531+ def sorted_host_platforms (platform_map ):
532+ """Sort the keys in the platform map to give correct precedence.
533+
534+ See sorted_host_platform_names for explanation.
535+
458536 Args:
459537 platform_map: a mapping of platforms and their metadata.
460538
@@ -472,13 +550,12 @@ def sorted_host_platforms(platform_map):
472550 pref = 2
473551 return (pref , name )
474552
475- sorted_platform_keys = sorted (platform_map .keys (), key = platform_keyer )
476553 return {
477554 key : platform_map [key ]
478- for key in sorted_platform_keys
555+ for key in sorted_host_platform_names ( platform_map . keys ())
479556 }
480557
481- def _get_host_platform (* , rctx , logger , python_version , os_name , cpu_name , platforms ):
558+ def _get_host_impl_repo_suffix (* , rctx , logger , python_version , os_name , cpu_name , platforms ):
482559 """Gets the backing repo suffix for the host platform.
483560
484561 Args:
@@ -498,6 +575,8 @@ def _get_host_platform(*, rctx, logger, python_version, os_name, cpu_name, platf
498575 platform_map [platform_name ] = struct (
499576 os_name = rctx .attr .os_names [key ],
500577 arch = rctx .attr .archs [key ],
578+ python_version = rctx .attr .python_versions .get (key ),
579+ impl_repo_suffix = rctx .attr .impl_repo_suffixes .get (key ),
501580 )
502581 else :
503582 platform_map = sorted_host_platforms (PLATFORMS )
@@ -507,11 +586,13 @@ def _get_host_platform(*, rctx, logger, python_version, os_name, cpu_name, platf
507586 meta = platform_map [platform ]
508587
509588 if meta .os_name == os_name and meta .arch == cpu_name :
510- candidates .append (platform )
589+ candidates .append (( platform , meta ) )
511590
512591 if len (candidates ) == 1 :
513- return candidates [0 ]
592+ platform_name , meta = candidates [0 ]
593+ return getattr (meta , "impl_repo_suffix" , platform_name )
514594
595+ # todo: have this handle multiple python versions
515596 if candidates :
516597 env_var = "RULES_PYTHON_REPO_TOOLCHAIN_{}_{}_{}" .format (
517598 python_version .replace ("." , "_" ),
@@ -525,12 +606,21 @@ def _get_host_platform(*, rctx, logger, python_version, os_name, cpu_name, platf
525606 candidates ,
526607 ))
527608 elif preference not in candidates :
609+ # TODO: need to map names like 3_13_0_linux_x86_64 back to
610+ # the input values.
611+ # It is unclear whether this currently works:
612+ # the return value is appended to this repo's name.
613+ # This repo's name is e.g. python_3_13, so
614+ # the net result would be e.g.
615+ # python_3_13_3_13_0_linux_x86_64
616+ # which isn't a valid repo name.
528617 return logger .fail ("Please choose a preferred interpreter out of the following platforms: {}" .format (candidates ))
529618 else :
530619 candidates = [preference ]
531620
532621 if candidates :
533- return candidates [0 ]
622+ platform_name , meta = candidates [0 ]
623+ return getattr (meta , "impl_repo_suffix" , platform_name )
534624
535625 return logger .fail ("Could not find a compatible 'host' python for '{os_name}', '{cpu_name}' from the loaded platforms: {platforms}" .format (
536626 os_name = os_name ,
0 commit comments