@@ -5,99 +5,108 @@ import com.eed3si9n.expecty.Expecty.expect
 class HadoopTests extends munit.FunSuite {
   protected lazy val extraOptions: Seq[String] = TestUtil.extraOptions
 
-  test("simple map-reduce") {
-    TestUtil.retryOnCi() {
-      val inputs = TestInputs(
-        os.rel / "WordCount.java" ->
-          """//> using dep org.apache.hadoop:hadoop-client-api:3.3.3
-            |
-            |// from https://hadoop.apache.org/docs/r3.3.3/hadoop-mapreduce-client/hadoop-mapreduce-client-core/MapReduceTutorial.html
-            |
-            |package foo;
-            |
-            |import java.io.IOException;
-            |import java.util.StringTokenizer;
-            |
-            |import org.apache.hadoop.conf.Configuration;
-            |import org.apache.hadoop.fs.Path;
-            |import org.apache.hadoop.io.IntWritable;
-            |import org.apache.hadoop.io.Text;
-            |import org.apache.hadoop.mapreduce.Job;
-            |import org.apache.hadoop.mapreduce.Mapper;
-            |import org.apache.hadoop.mapreduce.Reducer;
-            |import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
-            |import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
-            |
-            |public class WordCount {
-            |
-            |  public static class TokenizerMapper
-            |       extends Mapper<Object, Text, Text, IntWritable>{
-            |
-            |    private final static IntWritable one = new IntWritable(1);
-            |    private Text word = new Text();
-            |
-            |    public void map(Object key, Text value, Context context
-            |                    ) throws IOException, InterruptedException {
-            |      StringTokenizer itr = new StringTokenizer(value.toString());
-            |      while (itr.hasMoreTokens()) {
-            |        word.set(itr.nextToken());
-            |        context.write(word, one);
-            |      }
-            |    }
-            |  }
-            |
-            |  public static class IntSumReducer
-            |       extends Reducer<Text,IntWritable,Text,IntWritable> {
-            |    private IntWritable result = new IntWritable();
-            |
-            |    public void reduce(Text key, Iterable<IntWritable> values,
-            |                       Context context
-            |                       ) throws IOException, InterruptedException {
-            |      int sum = 0;
-            |      for (IntWritable val : values) {
-            |        sum += val.get();
-            |      }
-            |      result.set(sum);
-            |      context.write(key, result);
-            |    }
-            |  }
-            |
-            |  public static void main(String[] args) throws Exception {
-            |    Configuration conf = new Configuration();
-            |    Job job = Job.getInstance(conf, "word count");
-            |    job.setJarByClass(WordCount.class);
-            |    job.setMapperClass(TokenizerMapper.class);
-            |    job.setCombinerClass(IntSumReducer.class);
-            |    job.setReducerClass(IntSumReducer.class);
-            |    job.setOutputKeyClass(Text.class);
-            |    job.setOutputValueClass(IntWritable.class);
-            |    FileInputFormat.addInputPath(job, new Path(args[0]));
-            |    FileOutputFormat.setOutputPath(job, new Path(args[1]));
-            |    System.exit(job.waitForCompletion(true) ? 0 : 1);
-            |  }
-            |}
-            |""".stripMargin
-      )
-      inputs.fromRoot { root =>
-        val res = os.proc(
-          TestUtil.cli,
-          "--power",
-          "run",
-          TestUtil.extraOptions,
-          ".",
-          "--hadoop",
-          "--command",
-          "--scratch-dir",
-          "tmp",
-          "--",
-          "foo"
+  for {
+    withTestScope <- Seq(true, false)
+    scopeDescription = if (withTestScope) "test scope" else "main scope"
+    inputPath =
+      if (withTestScope) os.rel / "test" / "WordCount.java" else os.rel / "main" / "WordCount.java"
+    directiveKey = if (withTestScope) "test.dep" else "dep"
+    scopeOptions = if (withTestScope) Seq("--test") else Nil
+  }
+    test(s"simple map-reduce ($scopeDescription)") {
+      TestUtil.retryOnCi() {
+        val inputs = TestInputs(
+          inputPath ->
+            s"""//> using $directiveKey org.apache.hadoop:hadoop-client-api:3.3.3
+               |
+               |// from https://hadoop.apache.org/docs/r3.3.3/hadoop-mapreduce-client/hadoop-mapreduce-client-core/MapReduceTutorial.html
+               |
+               |package foo;
+               |
+               |import java.io.IOException;
+               |import java.util.StringTokenizer;
+               |
+               |import org.apache.hadoop.conf.Configuration;
+               |import org.apache.hadoop.fs.Path;
+               |import org.apache.hadoop.io.IntWritable;
+               |import org.apache.hadoop.io.Text;
+               |import org.apache.hadoop.mapreduce.Job;
+               |import org.apache.hadoop.mapreduce.Mapper;
+               |import org.apache.hadoop.mapreduce.Reducer;
+               |import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
+               |import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
+               |
+               |public class WordCount {
+               |
+               |  public static class TokenizerMapper
+               |       extends Mapper<Object, Text, Text, IntWritable>{
+               |
+               |    private final static IntWritable one = new IntWritable(1);
+               |    private Text word = new Text();
+               |
+               |    public void map(Object key, Text value, Context context
+               |                    ) throws IOException, InterruptedException {
+               |      StringTokenizer itr = new StringTokenizer(value.toString());
+               |      while (itr.hasMoreTokens()) {
+               |        word.set(itr.nextToken());
+               |        context.write(word, one);
+               |      }
+               |    }
+               |  }
+               |
+               |  public static class IntSumReducer
+               |       extends Reducer<Text,IntWritable,Text,IntWritable> {
+               |    private IntWritable result = new IntWritable();
+               |
+               |    public void reduce(Text key, Iterable<IntWritable> values,
+               |                       Context context
+               |                       ) throws IOException, InterruptedException {
+               |      int sum = 0;
+               |      for (IntWritable val : values) {
+               |        sum += val.get();
+               |      }
+               |      result.set(sum);
+               |      context.write(key, result);
+               |    }
+               |  }
+               |
+               |  public static void main(String[] args) throws Exception {
+               |    Configuration conf = new Configuration();
+               |    Job job = Job.getInstance(conf, "word count");
+               |    job.setJarByClass(WordCount.class);
+               |    job.setMapperClass(TokenizerMapper.class);
+               |    job.setCombinerClass(IntSumReducer.class);
+               |    job.setReducerClass(IntSumReducer.class);
+               |    job.setOutputKeyClass(Text.class);
+               |    job.setOutputValueClass(IntWritable.class);
+               |    FileInputFormat.addInputPath(job, new Path(args[0]));
+               |    FileOutputFormat.setOutputPath(job, new Path(args[1]));
+               |    System.exit(job.waitForCompletion(true) ? 0 : 1);
+               |  }
+               |}
+               |""".stripMargin
         )
-          .call(cwd = root)
-        val command = res.out.lines()
-        pprint.err.log(command)
-        expect(command.take(2) == Seq("hadoop", "jar"))
-        expect(command.takeRight(2) == Seq("foo.WordCount", "foo"))
+        inputs.fromRoot { root =>
+          val res = os.proc(
+            TestUtil.cli,
+            "--power",
+            "run",
+            TestUtil.extraOptions,
+            ".",
+            "--hadoop",
+            "--command",
+            "--scratch-dir",
+            "tmp",
+            scopeOptions,
+            "--",
+            "foo"
+          )
+            .call(cwd = root)
+          val command = res.out.lines()
+          pprint.err.log(command)
+          expect(command.take(2) == Seq("hadoop", "jar"))
+          expect(command.takeRight(2) == Seq("foo.WordCount", "foo"))
+        }
       }
     }
-  }
 }
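
Note: the replacement relies on munit's eager test registration. The `for` comprehension has no `yield`, so its body runs once per parameter combination, and each run calls `test(...)`, registering one independently named test. A minimal standalone sketch of the same pattern (suite and test names here are illustrative, not taken from this commit):

```scala
// Sketch: registering one munit test per parameter value.
// `test(...)` registers a test eagerly at suite-construction time, so a
// plain for-comprehension (no yield) over the parameters is enough.
class ScopedExampleTests extends munit.FunSuite {
  for {
    withTestScope <- Seq(true, false)
    scopeDescription = if (withTestScope) "test scope" else "main scope"
  }
    test(s"example ($scopeDescription)") {
      // Each registered test captures its own parameter values.
      assert(scopeDescription.nonEmpty)
    }
}
```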
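As the assertions suggest, the test never launches Hadoop itself: with `--command`, Scala CLI prints the launch command it would run instead of executing it, and the test only checks that the printed command starts with `hadoop jar` and ends with `foo.WordCount foo`. The `directiveKey` value switches the dependency directive between the two scopes; roughly, the generated source starts with one of (illustrative, both directives appear in the diff above):

```scala
//> using dep org.apache.hadoop:hadoop-client-api:3.3.3      // main scope
//> using test.dep org.apache.hadoop:hadoop-client-api:3.3.3 // test scope
```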