fix

ford-at-aws · ford-at-aws · commit d2a6e3a42971 · 2024-09-23T14:28:44.000-04:00
diff --git a/ruby/example_code/glue/glue_wrapper.rb b/ruby/example_code/glue/glue_wrapper.rb
@@ -7,10 +7,8 @@
 # snippet-start:[ruby.example_code.glue.GlueWrapper.full]
 # snippet-start:[ruby.example_code.glue.GlueWrapper.decl]
 
-# The `GlueWrapper` class serves as a wrapper around the AWS Glue API,
-# providing a simplified interface for common operations.
-# It encapsulates the functionality of the AWS SDK for Glue and provides methods for interacting with Glue crawlers,
-# databases, tables, jobs, and S3 resources.
+# The `GlueWrapper` class serves as a wrapper around the AWS Glue API, providing a simplified interface for common operations.
+# It encapsulates the functionality of the AWS SDK for Glue and provides methods for interacting with Glue crawlers, databases, tables, jobs, and S3 resources.
 # The class initializes with a Glue client and a logger, allowing it to make API calls and log any errors or informational messages.
 class GlueWrapper
   def initialize(glue_client, logger)
@@ -76,7 +74,170 @@ def start_crawler(name)
   end
   # snippet-end:[ruby.example_code.glue.StartCrawler]
 
-  # Additional methods omitted for brevity...
+  # snippet-start:[ruby.example_code.glue.DeleteCrawler]
+  # Deletes a crawler with the specified name.
+  #
+  # @param name [String] The name of the crawler to delete.
+  # @return [void]
+  def delete_crawler(name)
+    @glue_client.delete_crawler(name: name)
+  rescue Aws::Glue::Errors::ServiceError => e
+    @logger.error("Glue could not delete crawler #{name}: \n#{e.message}")
+    raise
+  end
+  # snippet-end:[ruby.example_code.glue.DeleteCrawler]
+
+  # snippet-start:[ruby.example_code.glue.GetDatabase]
+  # Retrieves information about a specific database.
+  #
+  # @param name [String] The name of the database to retrieve information about.
+  # @return [Aws::Glue::Types::Database] The database object taken from the response.
+  # @raise [Aws::Glue::Errors::ServiceError] Logged and re-raised when the request fails.
+  #   This method never returns nil for a missing database; the error propagates instead.
+  def get_database(name)
+    response = @glue_client.get_database(name: name)
+    response.database
+  rescue Aws::Glue::Errors::ServiceError => e
+    # Rescue ServiceError, the same class delete_crawler rescues, so service failures are logged.
+    @logger.error("Glue could not get database #{name}: \n#{e.message}")
+    raise
+  end
+  # snippet-end:[ruby.example_code.glue.GetDatabase]
+
+  # snippet-start:[ruby.example_code.glue.GetTables]
+  # Retrieves the tables in the specified database.
+  #
+  # Only the `table_list` of a single `get_tables` response is returned.
+  # NOTE(review): further result pages, if the service returns any, are not fetched here;
+  # confirm callers do not need them.
+  #
+  # @param db_name [String] The name of the database to retrieve tables from.
+  # @return [Array<Aws::Glue::Types::Table>]
+  # @raise [Aws::Glue::Errors::ServiceError] Logged and re-raised when the request fails.
+  def get_tables(db_name)
+    response = @glue_client.get_tables(database_name: db_name)
+    response.table_list
+  rescue Aws::Glue::Errors::ServiceError => e
+    # Rescue ServiceError, the same class delete_crawler rescues, so service failures are logged.
+    @logger.error("Glue could not get tables #{db_name}: \n#{e.message}")
+    raise
+  end
+  # snippet-end:[ruby.example_code.glue.GetTables]
+
+  # snippet-start:[ruby.example_code.glue.CreateJob]
+  # Creates a new job with the specified configuration.
+  #
+  # The job command is fixed to the 'glueetl' command with Python version '3',
+  # and the job is created with Glue version '3.0'.
+  #
+  # @param name [String] The name of the job.
+  # @param description [String] The description of the job.
+  # @param role_arn [String] The ARN of the IAM role to be used by the job.
+  # @param script_location [String] The location of the ETL script for the job.
+  # @return [void]
+  # @raise [Aws::Glue::Errors::ServiceError] Logged and re-raised when the request fails.
+  def create_job(name, description, role_arn, script_location)
+    @glue_client.create_job(
+      name: name,
+      description: description,
+      role: role_arn,
+      command: {
+        name: 'glueetl',
+        script_location: script_location,
+        python_version: '3'
+      },
+      glue_version: '3.0'
+    )
+  rescue Aws::Glue::Errors::ServiceError => e
+    # Rescue ServiceError, the same class delete_crawler rescues, so service failures are logged.
+    @logger.error("Glue could not create job #{name}: \n#{e.message}")
+    raise
+  end
+  # snippet-end:[ruby.example_code.glue.CreateJob]
+
+  # snippet-start:[ruby.example_code.glue.StartJobRun]
+  # Starts a job run for the specified job.
+  #
+  # The inputs are passed to the job as the arguments `--input_database`,
+  # `--input_table` and `--output_bucket_url` (the bucket name wrapped as `s3://<bucket>/`).
+  #
+  # @param name [String] The name of the job to start the run for.
+  # @param input_database [String] The name of the input database for the job.
+  # @param input_table [String] The name of the input table for the job.
+  # @param output_bucket_name [String] The name of the output S3 bucket for the job.
+  # @return [String] The ID of the started job run.
+  # @raise [Aws::Glue::Errors::ServiceError] Logged and re-raised when the request fails.
+  def start_job_run(name, input_database, input_table, output_bucket_name)
+    response = @glue_client.start_job_run(
+      job_name: name,
+      arguments: {
+        '--input_database': input_database,
+        '--input_table': input_table,
+        '--output_bucket_url': "s3://#{output_bucket_name}/"
+      }
+    )
+    response.job_run_id
+  rescue Aws::Glue::Errors::ServiceError => e
+    # Rescue ServiceError, the same class delete_crawler rescues, so service failures are logged.
+    @logger.error("Glue could not start job run #{name}: \n#{e.message}")
+    raise
+  end
+  # snippet-end:[ruby.example_code.glue.StartJobRun]
+
+  # snippet-start:[ruby.example_code.glue.ListJobs]
+  # Retrieves a list of jobs in AWS Glue.
+  #
+  # The raw `list_jobs` response is returned unchanged.
+  #
+  # @return [Aws::Glue::Types::ListJobsResponse]
+  # @raise [Aws::Glue::Errors::ServiceError] Logged and re-raised when the request fails.
+  def list_jobs
+    @glue_client.list_jobs
+  rescue Aws::Glue::Errors::ServiceError => e
+    # Rescue ServiceError, the same class delete_crawler rescues, so service failures are logged.
+    @logger.error("Glue could not list jobs: \n#{e.message}")
+    raise
+  end
+  # snippet-end:[ruby.example_code.glue.ListJobs]
+
+  # snippet-start:[ruby.example_code.glue.GetJobRuns]
+  # Retrieves the job runs for the specified job.
+  #
+  # Only the `job_runs` of a single `get_job_runs` response is returned.
+  # NOTE(review): further result pages, if the service returns any, are not fetched here;
+  # confirm callers do not need them.
+  #
+  # @param job_name [String] The name of the job to retrieve job runs for.
+  # @return [Array<Aws::Glue::Types::JobRun>]
+  # @raise [Aws::Glue::Errors::ServiceError] Logged and re-raised when the request fails.
+  def get_job_runs(job_name)
+    response = @glue_client.get_job_runs(job_name: job_name)
+    response.job_runs
+  rescue Aws::Glue::Errors::ServiceError => e
+    # Rescue ServiceError, the same class delete_crawler rescues, so service failures are logged.
+    @logger.error("Glue could not get job runs: \n#{e.message}")
+    # Re-raise so a failure is never returned as the logger's result in place of the Array.
+    raise
+  end
+  # snippet-end:[ruby.example_code.glue.GetJobRuns]
+
+  # snippet-start:[ruby.example_code.glue.GetJobRun]
+  # Retrieves data for a specific job run.
+  #
+  # @param job_name [String] The name of the job run to retrieve data for.
+  # @return [Glue::Types::GetJobRunResponse]
+  def get_job_run(job_name, run_id)
+    @glue_client.get_job_run(job_name: job_name, run_id: run_id)
+  rescue Aws::Glue::Errors::GlueException => e
+    @logger.error("Glue could not get job runs: \n#{e.message}")
+  end
+  # snippet-end:[ruby.example_code.glue.GetJobRun]
+
+  # snippet-start:[ruby.example_code.glue.DeleteJob]
+  # Deletes a job with the specified name.
+  #
+  # @param job_name [String] The name of the job to delete.
+  # @return [void]
+  def delete_job(job_name)
+    @glue_client.delete_job(job_name: job_name)
+  rescue Aws::Glue::Errors::ServiceError => e
+    @logger.error("Glue could not delete job: \n#{e.message}")
+  end
+  # snippet-end:[ruby.example_code.glue.DeleteJob]
+
+  # snippet-start:[ruby.example_code.glue.DeleteTable]
+  # Deletes a table with the specified name.
+  #
+  # @param database_name [String] The name of the catalog database in which the table resides.
+  # @param table_name [String] The name of the table to be deleted.
+  # @return [void]
+  def delete_table(database_name, table_name)
+    @glue_client.delete_table(database_name: database_name, name: table_name)
+  rescue Aws::Glue::Errors::ServiceError => e
+    @logger.error("Glue could not delete job: \n#{e.message}")
+  end
+  # snippet-end:[ruby.example_code.glue.DeleteTable]
+
+  # snippet-start:[ruby.example_code.glue.DeleteDatabase]
+  # Removes a specified database from a Data Catalog.
+  #
+  # @param database_name [String] The name of the database to delete.
+  # @return [void]
+  def delete_database(database_name)
+    @glue_client.delete_database(name: database_name)
+  rescue Aws::Glue::Errors::ServiceError => e
+    @logger.error("Glue could not delete database: \n#{e.message}")
+  end
+  # snippet-end:[ruby.example_code.glue.DeleteDatabase]
 
   # Uploads a job script file to an S3 bucket.
   #